├── .gitignore
├── ReadMe.md
├── cmd.example
├── color_flow
    ├── .gitignore
    ├── Makefile
    ├── README.txt
    ├── color_flow
    ├── color_flow.cpp
    ├── colorcode.cpp
    ├── colorcode.h
    ├── colortest
    ├── colortest.cpp
    ├── flowIO.cpp
    ├── flowIO.h
    └── imageLib
    │   ├── Convert.cpp
    │   ├── Convert.h
    │   ├── Convolve.cpp
    │   ├── Convolve.h
    │   ├── Copyright.h
    │   ├── Error.h
    │   ├── Image.cpp
    │   ├── Image.h
    │   ├── ImageIO.cpp
    │   ├── ImageIO.h
    │   ├── ImageIOpng.cpp
    │   ├── Makefile
    │   ├── README.txt
    │   ├── RefCntMem.cpp
    │   ├── RefCntMem.h
    │   └── imageLib.h
├── deep_flow2
    ├── .gitignore
    ├── COPYING
    ├── Makefile
    ├── Makefile.ddk
    ├── Makefile.zhujin.s
    ├── README
    ├── deepflow2
    ├── deepflow2-static
    ├── deepflow2.c
    ├── deepflow2.i
    ├── deepflow2.m
    ├── deepflow2.py
    ├── deepflow2_matlab.cpp
    ├── deepflow2_wrap.c
    ├── image.c
    ├── image.h
    ├── io.c
    ├── io.h
    ├── opticalflow.c
    ├── opticalflow.h
    ├── opticalflow_aux.c
    ├── opticalflow_aux.h
    ├── solver.c
    └── solver.h
├── deep_matching
    ├── .gitignore
    ├── Makefile
    ├── Makefile.bak
    ├── README.txt
    ├── caffe
    ├── caffe.zip
    ├── deep_matching_gpu.py
    ├── extra_layers.cpp
    ├── extra_layers.cu
    ├── extra_layers.hpp
    ├── flow_utils.py
    ├── gpudm.py
    ├── gpudm.swig
    ├── gpudm_wrap.cxx
    ├── helper.py
    ├── my_im2col.cpp
    ├── my_im2col.cu
    ├── my_im2col.hpp
    ├── net.py
    ├── numpy_image.h
    └── numpy_image.swg
└── optical_flow
    ├── bbc_pose.sh
    ├── flic_movies.sh
    ├── flow_pipeline.py
    ├── one_pic.sh
    ├── origin_pipeline.py
    └── origin_pipeline.sh


/.gitignore:
--------------------------------------------------------------------------------
 1 | ## General
 2 | 
 3 | # Compiled Object files
 4 | *.slo
 5 | *.lo
 6 | *.o
 7 | *.cuo
 8 | 
 9 | # Compiled Dynamic libraries
10 | *.so
11 | *.dylib
12 | 
13 | # Compiled Static libraries
14 | *.lai
15 | *.la
16 | *.a
17 | 
18 | # Compiled protocol buffers
19 | *.pb.h
20 | *.pb.cc
21 | *_pb2.py
22 | 
23 | # Compiled python
24 | *.pyc
25 | 
26 | # Compiled MATLAB
27 | *.mex*
28 | 
29 | # IPython notebook checkpoints
30 | .ipynb_checkpoints
31 | 
32 | # Editor temporaries
33 | *.swp
34 | *~
35 | 
36 | # Sublime Text settings
37 | *.sublime-workspace
38 | *.sublime-project
39 | 
40 | # Eclipse Project settings
41 | *.*project
42 | .settings
43 | 
44 | # QtCreator files
45 | *.user
46 | 
47 | # PyCharm files
48 | .idea
49 | 
50 | # OSX dir files
51 | .DS_Store
52 | 
53 | ## Caffe
54 | 
55 | # User's build configuration
56 | Makefile.config
57 | 
58 | # Data and models are either
59 | # 1. reference, and not casually committed
60 | # 2. custom, and live on their own unless they're deliberately contributed
61 | data/*
62 | models/*
63 | *.caffemodel
64 | *.caffemodel.h5
65 | *.solverstate
66 | *.solverstate.h5
67 | *.binaryproto
68 | *leveldb
69 | *lmdb
70 | 
71 | # build, distribute, and bins (+ python proto bindings)
72 | build
73 | .build_debug/*
74 | .build_release/*
75 | distribute/*
76 | *.testbin
77 | *.bin
78 | python/caffe/proto/
79 | cmake_build
80 | .cmake_build
81 | 
82 | # Generated documentation
83 | docs/_site
84 | docs/gathered
85 | _site
86 | doxygen
87 | docs/dev
88 | 
89 | # LevelDB files
90 | *.sst
91 | *.ldb
92 | LOCK
93 | LOG*
94 | CURRENT
95 | MANIFEST-*
96 | 
97 | # images
98 | images/


--------------------------------------------------------------------------------
/ReadMe.md:
--------------------------------------------------------------------------------
 1 | ### Declaration ####
 2 | This code is used for computing optical flow between two images.
 3 | 
 4 | This code is intended only for scientific or personal use.
 5 | Please contact `DeepFlow`, `DeepMatching` and `ColorFlow` for commercial use.
 6 | 
 7 | DeepFlow:
 8 | 	http://lear.inrialpes.fr/src/deepflow/
 9 | 
10 | DeepMatching:
11 | 	http://lear.inrialpes.fr/src/deepmatching/
12 | 
13 | ColorFlow: 
14 | 	http://vision.middlebury.edu/flow/data/
15 | 
16 | ### Pipeline ###
17 | ```
18 | 0: prepare the image pairs
19 | 1: compute matches using `DeepMatching`
20 | 2: compute the optical flow (a `.flo` file) using `DeepFlow`
21 | 3: color-code the flow into an image using `ColorFlow`
22 | ```
23 | 
24 | 
25 | ### Installation ###
26 | ```
27 | 1 download the code and put it into some directory
28 | 
29 | 2 compile `deep_matching`, `deep_flow2`, and `color_flow`
30 | 	please refer to the `README` of each of them for more details.
31 | ```
32 | **The program was only tested under a 64-bit Linux distribution (Ubuntu 14.04).**
33 | 
34 | ### Example ###
35 | 	cd optical_flow && sh flow_pipeline.sh
36 | 
37 | or see `cmd.example` for more examples
38 | 
39 | 
40 | 


--------------------------------------------------------------------------------
/cmd.example:
--------------------------------------------------------------------------------
 1 | # demo 0
 2 | cd /path/to/web_gpudm_1
 3 | python deep_matching_gpu.py demo1.jpg demo2.jpg -GPU -v --downscale 1 --ngh_rad 256 --use_sparse |cat 
 4 | python deep_matching_gpu.py demo1.jpg demo2.jpg -GPU -v --downscale 1 --ngh_rad 256 --use_sparse -out demo1.txt 
 5 | 
 6 | # demo 1
 7 | cd /path/to/DeepFlow_release2.0
 8 | 
 9 | no match:
10 | 	./deepflow2 demo1.jpg demo2.jpg demo.flo
11 | 
12 | with match:
13 | 	python ../deep_matching/deep_matching_gpu.py demo1.jpg demo2.jpg -GPU -v --downscale 1 --ngh_rad 256 --use_sparse |cat | ./deepflow2 demo1.jpg demo2.jpg demo.flo
14 | 	python ../deep_matching/deep_matching_gpu.py demo1.jpg demo2.jpg -GPU -v --downscale 1 --ngh_rad 256 --use_sparse |cat | \
15 | 			./deepflow2 demo1.jpg demo2.jpg demo.flo -match
16 | 


--------------------------------------------------------------------------------
/color_flow/.gitignore:
--------------------------------------------------------------------------------
  1 | ## General
  2 | 
  3 | # Compiled Object files
  4 | *.slo
  5 | *.lo
  6 | *.o
  7 | *.cuo
  8 | 
  9 | # Compiled Dynamic libraries
 10 | *.so
 11 | *.dylib
 12 | 
 13 | # Compiled Static libraries
 14 | *.lai
 15 | *.la
 16 | *.a
 17 | 
 18 | # Compiled protocol buffers
 19 | *.pb.h
 20 | *.pb.cc
 21 | *_pb2.py
 22 | 
 23 | # Compiled python
 24 | *.pyc
 25 | 
 26 | # Compiled MATLAB
 27 | *.mex*
 28 | 
 29 | # IPython notebook checkpoints
 30 | .ipynb_checkpoints
 31 | 
 32 | # Editor temporaries
 33 | *.swp
 34 | *~
 35 | 
 36 | # Sublime Text settings
 37 | *.sublime-workspace
 38 | *.sublime-project
 39 | 
 40 | # Eclipse Project settings
 41 | *.*project
 42 | .settings
 43 | 
 44 | # QtCreator files
 45 | *.user
 46 | 
 47 | # PyCharm files
 48 | .idea
 49 | 
 50 | # OSX dir files
 51 | .DS_Store
 52 | 
 53 | ## Caffe
 54 | 
 55 | # User's build configuration
 56 | Makefile.config
 57 | 
 58 | # Data and models are either
 59 | # 1. reference, and not casually committed
 60 | # 2. custom, and live on their own unless they're deliberately contributed
 61 | data/*
 62 | models/*
 63 | *.caffemodel
 64 | *.caffemodel.h5
 65 | *.solverstate
 66 | *.solverstate.h5
 67 | *.binaryproto
 68 | *leveldb
 69 | *lmdb
 70 | 
 71 | # build, distribute, and bins (+ python proto bindings)
 72 | build
 73 | .build_debug/*
 74 | .build_release/*
 75 | distribute/*
 76 | *.testbin
 77 | *.bin
 78 | python/caffe/proto/
 79 | cmake_build
 80 | .cmake_build
 81 | 
 82 | # Generated documentation
 83 | docs/_site
 84 | docs/gathered
 85 | _site
 86 | doxygen
 87 | docs/dev
 88 | 
 89 | # LevelDB files
 90 | *.sst
 91 | *.ldb
 92 | LOCK
 93 | LOG*
 94 | CURRENT
 95 | MANIFEST-*
 96 | 
 97 | # images
 98 | *.jpg
 99 | *.png
100 | *.flo
101 | 


--------------------------------------------------------------------------------
/color_flow/Makefile:
--------------------------------------------------------------------------------
 1 | # Makefile for flow evaluation code
 2 | # Build imageLib first (cd imageLib; make): the binaries link against -lImg from there.
 3 | SRC = flowIO.cpp colorcode.cpp colortest.cpp color_flow.cpp
 4 | BIN = colortest color_flow
 5 | 
 6 | IMGLIB = imageLib
 7 | 
 8 | CC = g++
 9 | WARN = -W -Wall
10 | OPT ?= -O3
11 | CPPFLAGS = $(OPT) $(WARN) -I$(IMGLIB)
12 | LDLIBS = -L$(IMGLIB) -lImg -lpng -lz
13 | EXE = $(SRC:.cpp=.exe)
14 | .PHONY: all clean allclean  # these name actions, not files
15 | all: $(BIN)
16 | 
17 | colortest: colortest.cpp colorcode.cpp
18 | color_flow: color_flow.cpp flowIO.cpp colorcode.cpp
19 | 
20 | clean: 
21 | 	rm -f core *.stackdump
22 | 
23 | allclean: clean
24 | 	rm -f $(BIN) $(EXE)
25 | 


--------------------------------------------------------------------------------
/color_flow/README.txt:
--------------------------------------------------------------------------------
 1 | Some utilities for reading, writing, and color-coding .flo images
 2 | 
 3 | Daniel Scharstein, 7/2/07
 4 | updated 2/9/08 to fix bug in color_flow.cpp
 5 | updated 6/9/09 to make robust to NaN or constant 0 flow (thanks Jan Bouecke)
 6 | 
 7 | See flowIO.cpp for sample code for reading and writing .flo files.
 8 | Here's an excerpt from this file describing the flow file format:
 9 | 
10 | // ".flo" file format used for optical flow evaluation
11 | //
12 | // Stores 2-band float image for horizontal (u) and vertical (v) flow components.
13 | // Floats are stored in little-endian order.
14 | // A flow value is considered "unknown" if either |u| or |v| is greater than 1e9.
15 | //
16 | //  bytes  contents
17 | //
18 | //  0-3     tag: "PIEH" in ASCII, which in little endian happens to be the float 202021.25
19 | //          (just a sanity check that floats are represented correctly)
20 | //  4-7     width as an integer
21 | //  8-11    height as an integer
22 | //  12-end  data (width*height*2*4 bytes total)
23 | //          the float values for u and v, interleaved, in row order, i.e.,
24 | //          u[row0,col0], v[row0,col0], u[row0,col1], v[row0,col1], ...
25 | //
26 | 
27 | 
28 | Once you have a .flo file, you can create a color coding of it using
29 | color_flow
30 | 
31 | Use colortest to visualize the encoding
32 | 
33 | 
34 | To compile
35 | 
36 | cd imageLib
37 | make
38 | cd ..
39 | make
40 | ./colortest 10 colors.png
41 | 
42 | /// optical flow
43 | ./color_flow mude.flo mude.png
44 | 
45 | 


--------------------------------------------------------------------------------
/color_flow/color_flow:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zimenglan-sysu-512/deep-flow/fd127e9a2ccd2e5b73dcef39a3438ee77b2476a4/color_flow/color_flow


--------------------------------------------------------------------------------
/color_flow/color_flow.cpp:
--------------------------------------------------------------------------------
  1 | // color_flow.cpp 
  2 | // color-code motion field
  3 | // normalizes based on specified value, or on maximum motion present otherwise
  4 | 
  5 | // DS 2/9/08 fixed bug in MotionToColor concerning reallocation of colim (thanks Yunpeng!)
  6 | 
  7 | static const char *usage = "\n  usage: %s [-quiet] in.flo out.png [maxmotion]\n";
  8 | 
  9 | #include <stdio.h>
 10 | #include <math.h>
 11 | #include "imageLib.h"
 12 | #include "flowIO.h"
 13 | #include "colorcode.h"
 14 | 
 15 | int verbose = 1;
 16 | 
 17 | void MotionToColor(CFloatImage motim, CByteImage &colim, float maxmotion)
 18 | {
 19 |     // Color-code the flow in bands 0 (u) and 1 (v) of motim into colim, which
 20 |     // is reallocated to 3 bands.  Vectors are scaled by 1/maxmotion when
 21 |     // maxmotion > 0, else by 1 / (largest magnitude among the known vectors).
 22 |     CShape shape = motim.Shape();
 23 |     const int w = shape.width, h = shape.height;
 24 |     colim.ReAllocate(CShape(w, h, 3));
 25 | 
 26 |     // pass 1: component ranges and largest magnitude over the known vectors
 27 |     float uLo = 999, uHi = -999, vLo = 999, vHi = -999;
 28 |     float radHi = -1;
 29 |     for (int row = 0; row < h; row++) {
 30 |         for (int col = 0; col < w; col++) {
 31 |             const float u = motim.Pixel(col, row, 0);
 32 |             const float v = motim.Pixel(col, row, 1);
 33 |             if (unknown_flow(u, v))
 34 |                 continue;
 35 |             uHi = __max(uHi, u);
 36 |             vHi = __max(vHi, v);
 37 |             uLo = __min(uLo, u);
 38 |             vLo = __min(vLo, v);
 39 |             const float mag = sqrt(u * u + v * v);
 40 |             radHi = __max(radHi, mag);
 41 |         }
 42 |     }
 43 | 
 44 |     printf("max motion: %.4f  motion range: u = %.3f .. %.3f;  v = %.3f .. %.3f\n",
 45 |            radHi, uLo, uHi, vLo, vHi);
 46 | 
 47 |     // the command-line value, when given, overrides the measured maximum
 48 |     float norm = maxmotion > 0 ? maxmotion : radHi;
 49 |     if (norm == 0) // flow == 0 everywhere
 50 |         norm = 1;
 51 |     if (verbose)
 52 |         fprintf(stderr, "normalizing by %g\n", norm);
 53 | 
 54 |     // pass 2: unknown vectors become black, the rest get computeColor's code
 55 |     for (int row = 0; row < h; row++) {
 56 |         for (int col = 0; col < w; col++) {
 57 |             const float u = motim.Pixel(col, row, 0);
 58 |             const float v = motim.Pixel(col, row, 1);
 59 |             uchar *dst = &colim.Pixel(col, row, 0);
 60 |             if (unknown_flow(u, v))
 61 |                 dst[0] = dst[1] = dst[2] = 0;
 62 |             else
 63 |                 computeColor(u / norm, v / norm, dst);
 64 |         }
 65 |     }
 66 | }
 67 | 
 68 | int main(int argc, char *argv[])
 69 | {
 70 |     // usage: color_flow [-quiet] in.flo out.png [maxmotion]; returns 0, or -1 on CError
 71 |     try {
 72 | 	int argn = 1;
 73 | 	if (argc > 1 && argv[1][0]=='-' && argv[1][1]=='q') { // any option starting "-q"
 74 | 	    verbose = 0;
 75 | 	    argn++;
 76 | 	}
 77 | 	if (argn >= argc-3 && argn <= argc-2) { // two or three arguments must remain
 78 | 	    char *flowname = argv[argn++];
 79 | 	    char *outname = argv[argn++];
 80 | 	    float maxmotion = argn < argc ? atof(argv[argn++]) : -1; // -1: none given
 81 | 	    CFloatImage im;
 82 | 	    ReadFlowFile(im, flowname);
 83 | 	    CByteImage outim;
 84 | 	    CShape sh = im.Shape();
 85 | 	    sh.nBands = 3;
 86 | 	    outim.ReAllocate(sh);
 87 | 	    outim.ClearPixels();
 88 | 	    MotionToColor(im, outim, maxmotion);
 89 | 	    WriteImageVerb(outim, outname, verbose);
 90 | 	} else
 91 | 	    throw CError(usage, argv[0]);
 92 |     }
 93 |     catch (CError &err) {
 94 | 	fputs(err.message, stderr); // not a format string: it may contain '%' from a file name
 95 | 	fprintf(stderr, "\n");
 96 | 	return -1;
 97 |     }
 98 |     return 0;
 99 | }
100 | 


--------------------------------------------------------------------------------
/color_flow/colorcode.cpp:
--------------------------------------------------------------------------------
 1 | // colorcode.cpp
 2 | //
 3 | // Color encoding of flow vectors
 4 | // adapted from the color circle idea described at
 5 | //   http://members.shaw.ca/quadibloc/other/colint.htm
 6 | //
 7 | // Daniel Scharstein, 4/2007
 8 | // added tick marks and out-of-range coding 6/05/07
 9 | 
10 | #include <stdlib.h>
11 | #include <math.h>
12 | typedef unsigned char uchar;
13 | 
14 | int ncols = 0;
15 | #define MAXCOLS 60
16 | int colorwheel[MAXCOLS][3];
17 | 
18 | 
19 | void setcols(int r, int g, int b, int k)
20 | {
21 |     // store the triple (r, g, b) in color wheel entry k
22 |     int *slot = colorwheel[k];
23 |     slot[0] = r;  slot[1] = g;  slot[2] = b;
24 | }
25 | 
26 | void makecolorwheel()
27 | {
28 |     // Fill colorwheel[] with the hue circle red -> yellow -> green -> cyan ->
29 |     // blue -> magenta -> (red) and set ncols to the number of entries.
30 |     // Segment lengths are chosen by perceptual similarity (e.g. one can
31 |     // distinguish more shades between red and yellow than between yellow
32 |     // and green).
33 | 
34 |     const int RY = 15, YG = 6;
35 |     const int GC = 4,  CB = 11;
36 |     const int BM = 13, MR = 6;
37 |     ncols = RY + YG + GC + CB + BM + MR;
38 |     if (ncols > MAXCOLS)
39 |         exit(1);
40 | 
41 |     // each segment ramps one channel linearly (integer math) while the
42 |     // other two stay pinned at 0 or 255
43 |     int slot = 0;
44 |     for (int i = 0; i < RY; i++, slot++) setcols(255,          255*i/RY,     0,            slot);
45 |     for (int i = 0; i < YG; i++, slot++) setcols(255-255*i/YG, 255,          0,            slot);
46 |     for (int i = 0; i < GC; i++, slot++) setcols(0,            255,          255*i/GC,     slot);
47 |     for (int i = 0; i < CB; i++, slot++) setcols(0,            255-255*i/CB, 255,          slot);
48 |     for (int i = 0; i < BM; i++, slot++) setcols(255*i/BM,     0,            255,          slot);
49 |     for (int i = 0; i < MR; i++, slot++) setcols(255,          0,            255-255*i/MR, slot);
50 | }
51 | 
52 | void computeColor(float fx, float fy, uchar *pix)
53 | {
54 |     // Write the color code of flow (fx, fy) to pix[0..2]: direction picks the hue,
55 |     // magnitude the saturation; wheel channels r, g, b land in pix[2], pix[1], pix[0].
56 |     if (ncols == 0) // wheel not built yet
57 |         makecolorwheel();
58 |     const float mag = sqrt(fx * fx + fy * fy);
59 |     const float angle = atan2(-fy, -fx) / M_PI;
60 |     const float pos = (angle + 1.0) / 2.0 * (ncols-1); // fractional wheel index
61 |     const int lo = (int)pos;
62 |     const int hi = (lo + 1) % ncols;
63 |     const float frac = pos - lo;
64 |     //frac = 0; // (drop the const and) uncomment to see original color wheel
65 |     for (int ch = 0; ch < 3; ch++) {
66 |         const float c0 = colorwheel[lo][ch] / 255.0;
67 |         const float c1 = colorwheel[hi][ch] / 255.0;
68 |         float shade = (1 - frac) * c0 + frac * c1; // blend the two neighbouring entries
69 |         if (mag <= 1)
70 |             shade = 1 - mag * (1 - shade); // increase saturation with radius
71 |         else
72 |             shade *= .75; // out of range
73 |         pix[2 - ch] = (int)(255.0 * shade);
74 |     }
75 | }
75 | 


--------------------------------------------------------------------------------
/color_flow/colorcode.h:
--------------------------------------------------------------------------------
1 | void computeColor(float fx, float fy, uchar *pix);
2 | 


--------------------------------------------------------------------------------
/color_flow/colortest:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zimenglan-sysu-512/deep-flow/fd127e9a2ccd2e5b73dcef39a3438ee77b2476a4/color_flow/colortest


--------------------------------------------------------------------------------
/color_flow/colortest.cpp:
--------------------------------------------------------------------------------
 1 | // colortest.cpp
 2 | 
 3 | // create a test image showing the color encoding
 4 | 
 5 | static char usage[] = "usage: %s range outimage [size]\n";
 6 | 
 7 | # include <stdio.h>
 8 | # include <math.h>
 9 | #include "imageLib.h"
10 | #include "colorcode.h"
11 | 
12 | int main(int argc, char **argv)
13 | {
14 |     // usage: colortest range outimage [size] -- writes a size x size chart of the
15 |     // color coding for flow within +/- 1.04*range; exits 1 on bad input or CError
16 |     int verbose = 1;
17 |     if (argc < 3) {
18 | 	fprintf(stderr, usage, argv[0]);
19 | 	exit(1);
20 |     }
21 |     int optind = 1;
22 |     float truerange = atof(argv[optind++]);
23 |     char *outname = argv[optind++];
24 |     int size = optind < argc ? atoi(argv[optind++]) : 151;
25 |     // range 0 divides by zero below; the ticks at s2 +/- 1 need at least 3 pixels
26 |     if (truerange == 0 || size < 3) {
27 | 	fprintf(stderr, usage, argv[0]);
28 | 	exit(1);
29 |     }
30 |     float range = 1.04 * truerange; // make picture a bit bigger to show out-of-range coding
31 |     try {
32 | 	CShape sh(size, size, 3);
33 | 	CByteImage out(sh);
34 | 	out.ClearPixels(); // axis pixels are never written below (color_flow.cpp clears likewise)
35 | 	int s2 = size/2;
36 | 	for (int y = 0; y < size; y++) {
37 | 	    for (int x = 0; x < size; x++) {
38 | 		if (x == s2 || y == s2) // leave the coordinate axes untouched
39 | 		    continue;
40 | 		float fx = (float)x / (float)s2 * range - range;
41 | 		float fy = (float)y / (float)s2 * range - range;
42 | 		computeColor(fx/truerange, fy/truerange, &out.Pixel(x, y, 0));
43 | 	    }
44 | 	}
45 | 	int ir = (int)truerange, ticksize = size < 120 ? 1 : 2;
46 | 	for (int k = -ir; k <= ir; k++) { // one tick on each axis per integer flow value
47 | 	    int ik = (int)(k / range * s2) + s2;
48 | 	    for (int t = -ticksize; t <= ticksize; t++) {
49 | 		uchar *pix = &out.Pixel(ik, s2 + t, 0); pix[0] = pix[1] = pix[2] = 0;
50 | 		pix = &out.Pixel(s2 + t, ik, 0); pix[0] = pix[1] = pix[2] = 0;
51 | 	    }
52 | 	}
53 | 	WriteImageVerb(out, outname, verbose);
54 |     }
55 |     catch (CError &err) {
56 | 	fputs(err.message, stderr); // not a format string: it may contain '%' from a file name
57 | 	fprintf(stderr, "\n");
58 | 	exit(1);
59 |     }
60 |     return 0;
61 | }
62 | 


--------------------------------------------------------------------------------
/color_flow/flowIO.cpp:
--------------------------------------------------------------------------------
  1 | // flowIO.cpp
  2 | //
  3 | // read and write our simple .flo flow file format
  4 | 
  5 | // ".flo" file format used for optical flow evaluation
  6 | //
  7 | // Stores 2-band float image for horizontal (u) and vertical (v) flow components.
  8 | // Floats are stored in little-endian order.
  9 | // A flow value is considered "unknown" if either |u| or |v| is greater than 1e9.
 10 | //
 11 | //  bytes  contents
 12 | //
 13 | //  0-3     tag: "PIEH" in ASCII, which in little endian happens to be the float 202021.25
 14 | //          (just a sanity check that floats are represented correctly)
 15 | //  4-7     width as an integer
 16 | //  8-11    height as an integer
 17 | //  12-end  data (width*height*2*4 bytes total)
 18 | //          the float values for u and v, interleaved, in row order, i.e.,
 19 | //          u[row0,col0], v[row0,col0], u[row0,col1], v[row0,col1], ...
 20 | //
 21 | 
 22 | 
 23 | // first four bytes, should be the same in little endian
 24 | #define TAG_FLOAT 202021.25  // check for this when READING the file
 25 | #define TAG_STRING "PIEH"    // use this when WRITING the file
 26 | 
 27 | 
 28 | #include <stdio.h>
 29 | #include <stdlib.h>
 30 | #include <math.h>
 31 | #include "imageLib.h"
 32 | #include "flowIO.h"
 33 | 
 34 | // a flow vector is unknown when a component is NaN or larger in magnitude than UNKNOWN_FLOW_THRESH
 35 | bool unknown_flow(float u, float v) {
 36 |     if (isnan(u) || isnan(v)) return true;
 37 |     return fabs(u) > UNKNOWN_FLOW_THRESH || fabs(v) > UNKNOWN_FLOW_THRESH;
 38 | }
 39 | 
 40 | // overload for a vector stored as f[0] = u, f[1] = v
 41 | bool unknown_flow(float *f) {
 42 |     return unknown_flow(*f, *(f + 1));
 43 | }
 44 | 
 45 | // Read the flow file `filename` into img, which is reallocated to
 46 | // width x height x 2 floats.  Throws CError when the name is NULL or does
 47 | // not end in ".flo", the file cannot be opened, or its contents are malformed.
 48 | void ReadFlowFile(CFloatImage& img, const char* filename)
 49 | {
 50 |     if (filename == NULL)
 51 | 	throw CError("ReadFlowFile: empty filename");
 52 | 
 53 |     // strrchr returns NULL for a name without any '.'; never hand that to strcmp
 54 |     const char *dot = strrchr(filename, '.');
 55 |     if (dot == NULL || strcmp(dot, ".flo") != 0)
 56 | 	throw CError("ReadFlowFile (%s): extension .flo expected", filename);
 57 | 
 58 |     FILE *stream = fopen(filename, "rb");
 59 |     if (stream == 0)
 60 |         throw CError("ReadFlowFile: could not open %s", filename);
 61 | 
 62 |     try { // every failure below must close the stream before propagating
 63 | 	int width, height;
 64 | 	float tag;
 65 | 	if ((int)fread(&tag,    sizeof(float), 1, stream) != 1 ||
 66 | 	    (int)fread(&width,  sizeof(int),   1, stream) != 1 ||
 67 | 	    (int)fread(&height, sizeof(int),   1, stream) != 1)
 68 | 	    throw CError("ReadFlowFile: problem reading file %s", filename);
 69 | 	if (tag != TAG_FLOAT) // simple test for correct endian-ness
 70 | 	    throw CError("ReadFlowFile(%s): wrong tag (possibly due to big-endian machine?)", filename);
 71 | 	// sanity check that the integers were read correctly (99999 should do the trick...)
 72 | 	if (width < 1 || width > 99999)
 73 | 	    throw CError("ReadFlowFile(%s): illegal width %d", filename, width);
 74 | 	if (height < 1 || height > 99999)
 75 | 	    throw CError("ReadFlowFile(%s): illegal height %d", filename, height);
 76 | 
 77 | 	int nBands = 2;
 78 | 	img.ReAllocate(CShape(width, height, nBands));
 79 | 	int n = nBands * width; // floats per row: u and v interleaved
 80 | 	for (int y = 0; y < height; y++) {
 81 | 	    float* ptr = &img.Pixel(0, y, 0);
 82 | 	    if ((int)fread(ptr, sizeof(float), n, stream) != n)
 83 | 		throw CError("ReadFlowFile(%s): file is too short", filename);
 84 | 	}
 85 | 	if (fgetc(stream) != EOF)
 86 | 	    throw CError("ReadFlowFile(%s): file is too long", filename);
 87 |     }
 88 |     catch (...) {
 89 | 	fclose(stream);
 90 | 	throw;
 91 |     }
 92 |     fclose(stream);
 93 | }
 94 | 
 95 | // Write the 2-band float image img to the flow file `filename`.  Throws CError when the name is
 96 | // NULL or lacks ".flo", img is not 2-band, or the file cannot be opened or fully written.
 97 | void WriteFlowFile(CFloatImage img, const char* filename)
 98 | {
 99 |     if (filename == NULL)
100 | 	throw CError("WriteFlowFile: empty filename");
101 |     const char *dot = strrchr(filename, '.');
102 |     if (dot == NULL)
103 | 	throw CError("WriteFlowFile: extension required in filename '%s'", filename);
104 |     if (strcmp(dot, ".flo") != 0)
105 | 	throw CError("WriteFlowFile: filename '%s' should have extension '.flo'", filename);
106 | 
107 |     CShape sh = img.Shape();
108 |     int width = sh.width, height = sh.height, nBands = sh.nBands;
109 |     if (nBands != 2)
110 | 	throw CError("WriteFlowFile(%s): image must have 2 bands", filename);
111 | 
112 |     FILE *stream = fopen(filename, "wb");
113 |     if (stream == 0)
114 |         throw CError("WriteFlowFile: could not open %s", filename);
115 | 
116 |     try { // close the stream before any write error propagates
117 | 	// header: the 4 tag bytes, then width and height
118 | 	if (fwrite(TAG_STRING, 1, 4, stream) != 4 ||
119 | 	    (int)fwrite(&width,  sizeof(int),   1, stream) != 1 ||
120 | 	    (int)fwrite(&height, sizeof(int),   1, stream) != 1)
121 | 	    throw CError("WriteFlowFile(%s): problem writing header", filename);
122 | 	int n = nBands * width; // floats per row
123 | 	for (int y = 0; y < height; y++)
124 | 	    if ((int)fwrite(&img.Pixel(0, y, 0), sizeof(float), n, stream) != n)
125 | 		throw CError("WriteFlowFile(%s): problem writing data", filename);
126 |     }
127 |     catch (...) {
128 | 	fclose(stream);
129 | 	throw;
130 |     }
131 |     if (fclose(stream) != 0) // buffered data is flushed here and can still fail
132 | 	throw CError("WriteFlowFile(%s): problem writing data", filename);
133 | }
134 | 
135 | 
136 | /*
137 | int main() {
138 | 
139 |     try {
140 | 	CShape sh(5, 1, 2);
141 | 	CFloatImage img(sh);
142 | 	img.ClearPixels();
143 | 	img.Pixel(0, 0, 0) = -5.0f;
144 | 	char *filename = "test.flo";
145 | 
146 | 	WriteFlowFile(img, filename);
147 | 	ReadFlowFile(img, filename);
148 |     }
149 |     catch (CError &err) {
150 | 	fprintf(stderr, err.message);
151 | 	fprintf(stderr, "\n");
152 | 	exit(1);
153 |     }
154 | 
155 |     return 0;
156 | }
157 | */
158 | 


--------------------------------------------------------------------------------
/color_flow/flowIO.h:
--------------------------------------------------------------------------------
 1 | // flowIO.h
 2 | 
 3 | // the "official" threshold - if the absolute value of either 
 4 | // flow component is greater, it's considered unknown
 5 | #define UNKNOWN_FLOW_THRESH 1e9
 6 | 
 7 | // value to use to represent unknown flow
 8 | #define UNKNOWN_FLOW 1e10
 9 | 
10 | // return whether flow vector is unknown
11 | bool unknown_flow(float u, float v);
12 | bool unknown_flow(float *f);
13 | 
14 | // read a flow file into 2-band image
15 | void ReadFlowFile(CFloatImage& img, const char* filename);
16 | 
17 | // write a 2-band image into flow file 
18 | void WriteFlowFile(CFloatImage img, const char* filename);
19 | 
20 | 
21 | 


--------------------------------------------------------------------------------
/color_flow/imageLib/Convert.cpp:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zimenglan-sysu-512/deep-flow/fd127e9a2ccd2e5b73dcef39a3438ee77b2476a4/color_flow/imageLib/Convert.cpp


--------------------------------------------------------------------------------
/color_flow/imageLib/Convert.h:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zimenglan-sysu-512/deep-flow/fd127e9a2ccd2e5b73dcef39a3438ee77b2476a4/color_flow/imageLib/Convert.h


--------------------------------------------------------------------------------
/color_flow/imageLib/Convolve.cpp:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zimenglan-sysu-512/deep-flow/fd127e9a2ccd2e5b73dcef39a3438ee77b2476a4/color_flow/imageLib/Convolve.cpp


--------------------------------------------------------------------------------
/color_flow/imageLib/Convolve.h:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zimenglan-sysu-512/deep-flow/fd127e9a2ccd2e5b73dcef39a3438ee77b2476a4/color_flow/imageLib/Convolve.h


--------------------------------------------------------------------------------
/color_flow/imageLib/Copyright.h:
--------------------------------------------------------------------------------
 1 | /*
 2 | 
 3 | StereoMatcher 1.0
 4 | 
 5 | This Microsoft Research Source Code License Agreement ("MSR-SCLA") is
 6 | a legal agreement between you and Microsoft Corporation
 7 | (``Microsoft'' or ``we'') for the above pre-release Software. 
 8 | 
 9 | By installing, copying, compiling or otherwise using the Software found at
10 |  http://research.microsoft.com/downloads/,
11 | you agree to be bound by the terms of this MSR-SCLA. If you do not agree,
12 | do not install, copy, compile or use the Software. The Software is protected
13 | by copyright and other intellectual property laws and is licensed, not sold.
14 |     
15 | You may do anything you want with the Software for non-commercial research or
16 | teaching purposes, free of charge. In return, we simply ask that you agree to
17 | the following:
18 | 
19 | * To leave in place all copyright notices and licensing information that you
20 | might find in the Software.
21 | 
22 | * That you will not use the Software in a live operating environment where it
23 | may be relied upon to perform in the same manner as a commercially released
24 | product, or with data that has not been sufficiently backed up.
25 | 
26 | * To make freely available to others the source code of any modifications or
27 | additions you make to the Software source code, and any related documentation,
28 | solely and exclusively under the same terms as this License.
29 | 
30 | * That Microsoft is granted back, without limitations, the rights to reproduce,
31 | install, use, modify, distribute and transfer your source modifications or
32 | additions in source and/or object code formats. 
33 | 
34 | * That any feedback about the Software provided by you to us is voluntarily
35 | given, and Microsoft shall be free to use the feedback as it sees fit without
36 | obligation or restriction of any kind, even if the feedback is designated by
37 | you as confidential.
38 | 
39 | * NO WARRANTIES WHATSOEVER:  That the Software comes ``AS IS'', with all 
40 | faults and with no warranties, conditions or representations. None. 
41 | Not even the implied warranty of merchantability, warranty of fitness for
42 | a particular purpose, or any warranty against interference with your
43 | enjoyment of the Software or against infringement.  The entire risk as to
44 | satisfactory quality, performance, accuracy, and effort is with you.
45 | There is no warranty that this Software will fulfill any of your particular
46 | purposes or needs.
47 | 
48 | * That we have no duty of reasonable care or lack of negligence and that we
49 | are not obligated to (and will not) provide technical support or updates for
50 | the Software. 
51 | 
52 | * That we will not be liable for any damages, including those known as direct,
53 | indirect, special, consequential, or incidental damages related to the Software
54 | or this MSR-SCLA, nor any damages for negligence, to the maximum extent the
55 | law permits.
56 | 
57 | * That if you sue or threaten to sue anyone over patents that you think may
58 | apply to the Software or if you breach this MSR-SCLA in any way, your license
59 | to the Software ends automatically. 
60 | 
61 | * That this MSR-SCLA shall be construed and controlled by the laws of the
62 | State of Washington, USA, without regard to conflicts of law. 
63 | 
64 | 
65 | Copyright (c) Microsoft Corporation. All rights reserved
66 | 
67 | */
68 | 


--------------------------------------------------------------------------------
/color_flow/imageLib/Error.h:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zimenglan-sysu-512/deep-flow/fd127e9a2ccd2e5b73dcef39a3438ee77b2476a4/color_flow/imageLib/Error.h


--------------------------------------------------------------------------------
/color_flow/imageLib/Image.cpp:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zimenglan-sysu-512/deep-flow/fd127e9a2ccd2e5b73dcef39a3438ee77b2476a4/color_flow/imageLib/Image.cpp


--------------------------------------------------------------------------------
/color_flow/imageLib/Image.h:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zimenglan-sysu-512/deep-flow/fd127e9a2ccd2e5b73dcef39a3438ee77b2476a4/color_flow/imageLib/Image.h


--------------------------------------------------------------------------------
/color_flow/imageLib/ImageIO.cpp:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zimenglan-sysu-512/deep-flow/fd127e9a2ccd2e5b73dcef39a3438ee77b2476a4/color_flow/imageLib/ImageIO.cpp


--------------------------------------------------------------------------------
/color_flow/imageLib/ImageIO.h:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zimenglan-sysu-512/deep-flow/fd127e9a2ccd2e5b73dcef39a3438ee77b2476a4/color_flow/imageLib/ImageIO.h


--------------------------------------------------------------------------------
/color_flow/imageLib/ImageIOpng.cpp:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zimenglan-sysu-512/deep-flow/fd127e9a2ccd2e5b73dcef39a3438ee77b2476a4/color_flow/imageLib/ImageIOpng.cpp


--------------------------------------------------------------------------------
/color_flow/imageLib/Makefile:
--------------------------------------------------------------------------------
 1 | SRC = Convert.cpp Convolve.cpp Image.cpp ImageIO.cpp ImageIOpng.cpp RefCntMem.cpp
 2 | 
 3 | CC = g++
 4 | WARN = -W -Wall
 5 | OPT ?= -O3
 6 | CPPFLAGS = $(OPT) $(WARN)
 7 | 
 8 | OBJ = $(SRC:.cpp=.o)
 9 | 
10 | all: libImg.a
11 | 
12 | libImg.a: $(OBJ)
13 | 	rm -f libImg.a
14 | 	ar ruc libImg.a $(OBJ)
15 | 	ranlib libImg.a
16 | 
17 | clean: 
18 | 	rm -f $(OBJ) core *.stackdump *.bak
19 | 
20 | allclean: clean
21 | 	rm -f libImg.a
22 | 
23 | depend:
24 | 	@makedepend -Y -- $(CPPFLAGS) -- $(SRC) 2>> /dev/null
25 | 
26 | # DO NOT DELETE THIS LINE -- make depend depends on it.
27 | 
28 | Convert.o: Image.h RefCntMem.h Error.h Convert.h
29 | Convolve.o: Image.h RefCntMem.h Error.h Convert.h Convolve.h
30 | Image.o: Image.h RefCntMem.h Error.h
31 | ImageIO.o: Image.h RefCntMem.h Error.h ImageIO.h
32 | ImageIOpng.o: Image.h RefCntMem.h Error.h
33 | RefCntMem.o: RefCntMem.h
34 | 


--------------------------------------------------------------------------------
/color_flow/imageLib/README.txt:
--------------------------------------------------------------------------------
 1 | imageLib is a small C++ library for 2D multi-band images.  See Image.h
 2 | for more detail.  Reading and writing of images is supported in png
 3 | and pgm/ppm formats, as well as a subset of Targa.  See ImageIO.h for
 4 | more detail.
 5 | 
 6 | This code is derived from a subset of the StereoMatcher code by Rick
 7 | Szeliski and Daniel Scharstein, which is available at
 8 | http://research.microsoft.com/downloads/.
 9 | 
10 | This code is distributed under the same Source Code License Agreement
11 | as the original version.  Please see the file Copyright.h
12 | 
13 | Last change: 8/30/2012 - to get to compile under gcc 4 without warnings, and some minor fixes
14 | 


--------------------------------------------------------------------------------
/color_flow/imageLib/RefCntMem.cpp:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zimenglan-sysu-512/deep-flow/fd127e9a2ccd2e5b73dcef39a3438ee77b2476a4/color_flow/imageLib/RefCntMem.cpp


--------------------------------------------------------------------------------
/color_flow/imageLib/RefCntMem.h:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zimenglan-sysu-512/deep-flow/fd127e9a2ccd2e5b73dcef39a3438ee77b2476a4/color_flow/imageLib/RefCntMem.h


--------------------------------------------------------------------------------
/color_flow/imageLib/imageLib.h:
--------------------------------------------------------------------------------
1 | // imageLib.h
2 | 
3 | // common includes
4 | 
5 | #include "Error.h"
6 | #include "Image.h"
7 | #include "ImageIO.h"
8 | #include "Convert.h"
9 | 


--------------------------------------------------------------------------------
/deep_flow2/.gitignore:
--------------------------------------------------------------------------------
  1 | ## General
  2 | 
  3 | # Compiled Object files
  4 | *.slo
  5 | *.lo
  6 | *.o
  7 | *.cuo
  8 | 
  9 | # Compiled Dynamic libraries
 10 | *.so
 11 | *.dylib
 12 | 
 13 | # Compiled Static libraries
 14 | *.lai
 15 | *.la
 16 | *.a
 17 | 
 18 | # Compiled protocol buffers
 19 | *.pb.h
 20 | *.pb.cc
 21 | *_pb2.py
 22 | 
 23 | # Compiled python
 24 | *.pyc
 25 | 
 26 | # Compiled MATLAB
 27 | *.mex*
 28 | 
 29 | # IPython notebook checkpoints
 30 | .ipynb_checkpoints
 31 | 
 32 | # Editor temporaries
 33 | *.swp
 34 | *~
 35 | 
 36 | # Sublime Text settings
 37 | *.sublime-workspace
 38 | *.sublime-project
 39 | 
 40 | # Eclipse Project settings
 41 | *.*project
 42 | .settings
 43 | 
 44 | # QtCreator files
 45 | *.user
 46 | 
 47 | # PyCharm files
 48 | .idea
 49 | 
 50 | # OSX dir files
 51 | .DS_Store
 52 | 
 53 | ## Caffe
 54 | 
 55 | # User's build configuration
 56 | Makefile.config
 57 | 
 58 | # Data and models are either
 59 | # 1. reference, and not casually committed
 60 | # 2. custom, and live on their own unless they're deliberately contributed
 61 | data/*
 62 | models/*
 63 | *.caffemodel
 64 | *.caffemodel.h5
 65 | *.solverstate
 66 | *.solverstate.h5
 67 | *.binaryproto
 68 | *leveldb
 69 | *lmdb
 70 | 
 71 | # build, distribute, and bins (+ python proto bindings)
 72 | build
 73 | .build_debug/*
 74 | .build_release/*
 75 | distribute/*
 76 | *.testbin
 77 | *.bin
 78 | python/caffe/proto/
 79 | cmake_build
 80 | .cmake_build
 81 | 
 82 | # Generated documentation
 83 | docs/_site
 84 | docs/gathered
 85 | _site
 86 | doxygen
 87 | docs/dev
 88 | 
 89 | # LevelDB files
 90 | *.sst
 91 | *.ldb
 92 | LOCK
 93 | LOG*
 94 | CURRENT
 95 | MANIFEST-*
 96 | 
 97 | # images
 98 | *.jpg
 99 | *.png
100 | *.flo
101 | 


--------------------------------------------------------------------------------
/deep_flow2/Makefile:
--------------------------------------------------------------------------------
 1 | CC=gcc
 2 | 
 3 | CFLAGS=-Wall -g -O3 -msse4 -fPIC
 4 | LDFLAGS=-g -Wall -O3 -msse4 -fPIC
 5 | LIBFLAGS=-lm -ljpeg -lpng -L/usr/lib/x86_64-linux-gnu
 6 | LIBAFLAGS=-static /usr/lib/x86_64-linux-gnu/libjpeg.a /usr/lib/x86_64-linux-gnu/libpng.a /usr/lib/x86_64-linux-gnu/libz.a /usr/lib/x86_64-linux-gnu/libm.a
 7 | CPYTHONFLAGS=-I/usr/include/python2.7
 8 | 
 9 | SOURCES := $(shell find . -name '*.c' ! -name 'deepflow2_wrap.c')
10 | OBJ := $(SOURCES:%.c=%.o) 
11 | HEADERS := $(shell find . -name '*.h')
12 | 
13 | all: deepflow2
14 | 
15 | deepflow2: $(OBJ)
16 | 	$(CC) $(LDFLAGS) $^ $(LIBFLAGS) -o $@
17 | 
18 | deepflow2-static: $(OBJ)
19 | 	$(CC) -o $@ $^ $(LIBAFLAGS)
20 | 
21 | %.o: %.c
22 | 	$(CC) -o $@ $(CFLAGS) -c $+
23 | 
24 | python: all
25 | 	swig -python $(CPYTHONFLAGS) deepflow2.i
26 | 	gcc $(CFLAGS) -c deepflow2_wrap.c $(CPYTHONFLAGS)
27 | 	gcc -shared $(LDFLAGS) deepflow2_wrap.o $(OBJ) -o _deepflow2.so $(LIBFLAGS) 
28 | 
29 | 
30 | clean:
31 | 	rm -f *.o deepflow2 _deepflow2.so deepflow2.pyc deepflow2.mex???
32 | 


--------------------------------------------------------------------------------
/deep_flow2/Makefile.ddk:
--------------------------------------------------------------------------------
 1 | CC=gcc
 2 | 
 3 | CFLAGS=-Wall -g -O3 -msse4 -fPIC
 4 | LDFLAGS=-g -Wall -O3 -msse4 -fPIC
 5 | LIBFLAGS=-lm -ljpeg -lpng
 6 | LIBAFLAGS=-static /usr/lib/x86_64-linux-gnu/libjpeg.a /usr/lib/x86_64-linux-gnu/libpng.a /usr/lib/x86_64-linux-gnu/libz.a /usr/lib/x86_64-linux-gnu/libm.a
 7 | CPYTHONFLAGS=-I/usr/include/python2.7
 8 | 
 9 | SOURCES := $(shell find . -name '*.c' ! -name 'deepflow2_wrap.c')
10 | OBJ := $(SOURCES:%.c=%.o) 
11 | HEADERS := $(shell find . -name '*.h')
12 | 
13 | all: deepflow2
14 | # Link libraries AFTER the objects (same order as Makefile / Makefile.zhujin.s): linkers using --as-needed drop -l flags that precede the objects needing them.
15 | deepflow2: $(OBJ)
16 | 	$(CC) $(LDFLAGS) $^ $(LIBFLAGS) -o $@
17 | 
18 | deepflow2-static: $(OBJ)
19 | 	$(CC) -o $@ $^ $(LIBAFLAGS)
20 | 
21 | %.o: %.c
22 | 	$(CC) -o $@ $(CFLAGS) -c $+ 
23 | 
24 | python: all
25 | 	swig -python $(CPYTHONFLAGS) deepflow2.i
26 | 	gcc $(CFLAGS) -c deepflow2_wrap.c $(CPYTHONFLAGS)
27 | 	gcc -shared $(LDFLAGS) deepflow2_wrap.o $(OBJ) -o _deepflow2.so $(LIBFLAGS) 
28 | 
29 | 
30 | clean:
31 | 	rm -f *.o deepflow2 _deepflow2.so deepflow2.pyc deepflow2.mex???
32 | 


--------------------------------------------------------------------------------
/deep_flow2/Makefile.zhujin.s:
--------------------------------------------------------------------------------
 1 | CC=gcc
 2 | 
 3 | CFLAGS=-Wall -g -O3 -msse4 -fPIC
 4 | LDFLAGS=-g -Wall -O3 -msse4 -fPIC
 5 | LIBFLAGS=-lm -ljpeg -lpng -L/usr/lib/x86_64-linux-gnu
 6 | LIBAFLAGS=-static /usr/lib/x86_64-linux-gnu/libjpeg.a /usr/lib/x86_64-linux-gnu/libpng.a /usr/lib/x86_64-linux-gnu/libz.a /usr/lib/x86_64-linux-gnu/libm.a
 7 | CPYTHONFLAGS=-I/usr/include/python2.7
 8 | 
 9 | SOURCES := $(shell find . -name '*.c' ! -name 'deepflow2_wrap.c')
10 | OBJ := $(SOURCES:%.c=%.o) 
11 | HEADERS := $(shell find . -name '*.h')
12 | 
13 | all: deepflow2
14 | 
15 | deepflow2: $(OBJ)
16 | 	$(CC) $(LDFLAGS) $^ $(LIBFLAGS) -o $@
17 | 
18 | deepflow2-static: $(OBJ)
19 | 	$(CC) -o $@ $^ $(LIBAFLAGS)
20 | 
21 | %.o: %.c
22 | 	$(CC) -o $@ $(CFLAGS) -c $+
23 | 
24 | python: all
25 | 	swig -python $(CPYTHONFLAGS) deepflow2.i
26 | 	gcc $(CFLAGS) -c deepflow2_wrap.c $(CPYTHONFLAGS)
27 | 	gcc -shared $(LDFLAGS) deepflow2_wrap.o $(OBJ) -o _deepflow2.so $(LIBFLAGS) 
28 | 
29 | 
30 | clean:
31 | 	rm -f *.o deepflow2 _deepflow2.so deepflow2.pyc deepflow2.mex???
32 | 


--------------------------------------------------------------------------------
/deep_flow2/README:
--------------------------------------------------------------------------------
  1 | DeepFlow, v2.0
  2 | 
  3 | Our code is intended only for scientific or personal use.
  4 | Please contact us for commercial use.
  5 | 
  6 | DeepFlow2 is an improvement of DeepFlow that takes benefit of SSE instructions to speed up the computation and that incorporates a non-local weight for the smoothness term.
  7 | 
  8 | ### Compiling ###
  9 | 
 10 | Simply type 'make' and the code must compile.
 11 | The program was only tested under a 64-bit Linux distribution.
 12 | A static version is also provided in case compilation fails.
 13 | We do not give any support for other OS or compilation issues.
 14 | 
 15 | Dependencies:	(my own on ubuntu 14.04)
 16 | 	LIBAFLAGS=-static /usr/lib/x86_64-linux-gnu/libjpeg.a /usr/lib/x86_64-linux-gnu/libpng.a /usr/lib/x86_64-linux-gnu/libz.a /usr/lib/x86_64-linux-gnu/libm.a
 17 | 
 18 | ### Using DeepFlow2 ###
 19 | 
 20 | The general command to use DeepFlow2 is:
 21 | ./deepflow2 <im1> <im2> <filename.flo> [options]
 22 | 
 23 | 	e.g:
 24 | 		./deepflow2 sintel1.png sintel2.png sintel.flo
 25 | 		./deepflow2 mude1.jpg mude2.jpg mude.flo
 26 | 
 27 | For a list of the available options, you can type: 
 28 | 		./deepflow2 -h
 29 | >>>
 30 | 	-h, --help                                               print this message
 31 | 	-a, -alpha              <float>(12.0)                    weight of smoothness terms
 32 | 	-b, -beta               <float>(300.0)                   weight of descriptor matching
 33 | 	-g, -gamma              <float>(3.0)                     weight of gradient constancy assumption
 34 | 	-d, -delta              <float>(2.0)                     weight of color constancy assumption
 35 | 	-s, -sigma              <float>(0.8)                     standard deviation of Gaussian presmoothing kernel
 36 | 	-e, -eta                <float>(0.95)                    ratio factor for coarse-to-fine scheme
 37 | 	-minsize                <interger>(25)                   size of the coarsest level
 38 | 	-inner                  <integer>(5)                     number of inner fixed point iterations
 39 | 	-iter                   <integer>(25)                    number of iterations for the solver
 40 | 	-soromega               <float>(1.6)                     omega parameter of the sor method
 41 | 	-bk                     <float>(0.0)                     use decreasing beta i.e. beta(k) = beta*( k / kmax )^betak, if 0, a last iteration is done with beta=0
 42 | 
 43 | 	-match                                                   '-match filename' reads matches from a file and '-match' from stdin. Each line is the match with the first four numbers being x1 y1 x2 y2.
 44 | 
 45 | 	-sintel                                                  set the parameters to the one used in the arXiv paper for MPI-Sintel dataset
 46 | 	-middlebury                                              set the parameters to the one used in the arXiv paper for middlebury dataset
 47 | 	-kitti                                                   set the parameters to the one used in the arXiv paper for KITTI dataset
 48 | 
 49 | The -match option lets you supply input matches, either from an input file or from stdin.
 50 | In particular, results from the paper use the results from DeepMatching.
 51 | 
 52 | ### Example including DeepMatching ###
 53 | 
 54 | To compute DeepFlow2 including the DeepMatching, you need to download the Deep Matching code on the dedicated webpage: http://lear.inrialpes.fr/src/deepmatching/.
 55 | The matches output by DeepMatching can directly be piped to DeepFlow2 like in the following example:
 56 | 
 57 | <deepmatching_path>/deepmatching sintel1.png sintel2.png | ./deepflow2 sintel1.png sintel2.png sintel.flo -match -sintel
 58 | (for small size images, you can add the option "-downscale 0" when extracting deepmatching for a better accuracy)
 59 | 
 60 | It creates a .flo file in a standard format. 
 61 | For instance, code for reading and displaying such format is available with the Middlebury dataset.
 62 | 
 63 | ### Warning: without matching ###
 64 | 
 65 | If you don't use any input match (i.e. you don't specify any -match argument), the method will be limited to a standard variational method without matching integration and thus will lose accuracy, especially for large displacements. This is the case in the opencv implementation.
 66 | 
 67 | ### Bugs and extensions ###
 68 | 
 69 | If you find bugs, etc., please feel free to contact me.
 70 | Contact details are available on my webpage.
 71 | http://lear.inrialpes.fr/people/pweinzae
 72 | 
 73 | ### History ###
 74 | 
 75 | December 2013  v1.0.0
 76 | March 2014     v1.0.1: memory leak fix + support for png images
 77 | March 2014     FastDeepFlow_v1.0.1: faster (~2x) version using SSE instructions. Results are slightly different due to floating point approximations.
 78 | September 2015 v2.0: incorporation of a local smoothness weight and of the computation of matches' weights
 79 | 
 80 | ### Matlab wrapper ###
 81 | 
 82 | To compile the wrapper, first compile the code using make, then open matlab and compile the mex-file:
 83 | >> mex deepflow2_matlab.cpp image.o io.o opticalflow.o opticalflow_aux.o solver.o -ljpeg -lpng -lm -output deepflow2
 84 | The wrapper has been tested on Matlab14b under Linux-64 bit. We do not provide any support for compilation issues.
 85 | 
 86 | Usage with DeepMatching (assuming that DeepMatching has been added to the path with the matlab wrapper compiled; note that matlab must be opened with atlas preloaded for DeepMatching computation: LD_PRELOAD=/usr/lib64/atlas/libtatlas.so.3 matlab):
 87 | >> im1 = single(imread('sintel1.png'));
 88 | >> im2 = single(imread('sintel2.png'));
 89 | >> matches = deepmatching(im1, im2);
 90 | >> flow = deepflow2(im1, im2, matches, '-sintel');
 91 | Calling deepflow2() will show the list of available options.
 92 | 
 93 | ### Python wrapper ###
 94 | 
 95 | The python wrapper requires numpy (and swig if you modify the code and recompile it). To compile it, 
 96 | type 'make python'. The wrapper has been tested under Linux-64 bit only. We do not provide any support for compilation issues.
 97 | 	make sure you have installed swig -> "sudo apt-get install swig"
 98 | 
 99 | Usage with DeepMatching (assuming that DeepMatching has been added to the pythonpath with the python wrapper compiled):
100 | >> from deepmatching import deepmatching
101 | >> from deepflow2 import deepflow2
102 | >> import numpy
103 | >> from PIL import Image
104 | >> im1 = numpy.array(Image.open('sintel1.png'))
105 | >> im2 = numpy.array(Image.open('sintel2.png'))
106 | >> matches = deepmatching(im1, im2)
107 | >> flow = deepflow2(im1, im2, matches, '-sintel')
108 | Calling deepflow2() will show the list of available options.
109 | 
110 | ### LICENCE CONDITIONS ###
111 | 
112 | Copyright (C) 2013 Philippe Weinzaepfel
113 | 
114 | This program is free software: you can redistribute it and/or modify
115 | it under the terms of the GNU General Public License as published by
116 | the Free Software Foundation, either version 3 of the License, or
117 | (at your option) any later version.
118 | 
119 | This program is distributed in the hope that it will be useful,
120 | but WITHOUT ANY WARRANTY; without even the implied warranty of
121 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
122 | GNU General Public License for more details.
123 | 
124 | You should have received a copy of the GNU General Public License
125 | along with this program.  If not, see <http://www.gnu.org/licenses/>.
126 | 


--------------------------------------------------------------------------------
/deep_flow2/deepflow2:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zimenglan-sysu-512/deep-flow/fd127e9a2ccd2e5b73dcef39a3438ee77b2476a4/deep_flow2/deepflow2


--------------------------------------------------------------------------------
/deep_flow2/deepflow2-static:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zimenglan-sysu-512/deep-flow/fd127e9a2ccd2e5b73dcef39a3438ee77b2476a4/deep_flow2/deepflow2-static


--------------------------------------------------------------------------------
/deep_flow2/deepflow2.c:
--------------------------------------------------------------------------------
 1 | /*
 2 | Copyright (C) 2013 Philippe Weinzaepfel
 3 | 
 4 | This program is free software: you can redistribute it and/or modify
 5 | it under the terms of the GNU General Public License as published by
 6 | the Free Software Foundation, either version 3 of the License, or
 7 | (at your option) any later version.
 8 | 
 9 | This program is distributed in the hope that it will be useful,
10 | but WITHOUT ANY WARRANTY; without even the implied warranty of
11 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
12 | GNU General Public License for more details.
13 | 
14 | You should have received a copy of the GNU General Public License
15 | along with this program.  If not, see <http://www.gnu.org/licenses/>.
16 | */
17 | #include <stdio.h>
18 | #include <stdlib.h>
19 | #include <string.h>
20 | 
21 | #include "image.h"
22 | #include "opticalflow.h"
23 | #include "io.h"
24 | 
25 | int main(int argc, char ** argv){
26 |     // Command-line entry point: deepflow2 <im1> <im2> <filename.flo> [options]
27 |     // check the argument count, then load the two input images
28 |     if(argc < 4){
29 |         fprintf(stderr,"Wrong command, require at least 3 arguments.\n\n");
30 |         usage(EXE_OPTIONS);
31 |         exit(1);
32 |     }
33 |     color_image_t *im1 = color_image_load(argv[1]), *im2 = color_image_load(argv[2]);
34 |     if(im1->width != im2->width || im1->height != im2->height){
35 |         fprintf(stderr,"Image dimensions does not match\n");
36 |         exit(1);
37 |     }
38 |   
39 |     // allocate the parameter struct and fill it with the default values
40 |     optical_flow_params_t* params = (optical_flow_params_t*) malloc(sizeof(optical_flow_params_t));
41 |     if(!params){
42 |         fprintf(stderr,"error deepflow2(): not enough memory\n");
43 |         exit(1);
44 |     }
45 |     optical_flow_params_default(params);
46 | 
47 |     // parse everything after the three mandatory arguments; the returned array holds three match images
48 |     image_t **matches = parse_options(params, argc-4, &argv[4], EXE_OPTIONS, im1->width, im1->height);
49 | 	image_t *match_x = matches[0], *match_y = matches[1], *match_z = matches[2];
50 |     free(matches); // only the array itself is freed here; the three images are released below
51 |     
52 |     image_t *wx = image_new(im1->width,im1->height), *wy = image_new(im1->width,im1->height); // images handed to optical_flow() and then written to argv[3]
53 |     optical_flow(wx, wy, im1, im2, params, match_x, match_y, match_z);
54 |     writeFlowFile(argv[3], wx, wy);
55 |     image_delete(wx);
56 |     image_delete(wy);
57 |     image_delete(match_x); image_delete(match_y); image_delete(match_z);
58 |     color_image_delete(im1); color_image_delete(im2);
59 |     free(params);
60 | 
61 |     return 0;
62 | }
63 | 


--------------------------------------------------------------------------------
/deep_flow2/deepflow2.i:
--------------------------------------------------------------------------------
  1 | /*
  2 | Copyright (C) 2013 Philippe Weinzaepfel
  3 | 
  4 | This program is free software: you can redistribute it and/or modify
  5 | it under the terms of the GNU General Public License as published by
  6 | the Free Software Foundation, either version 3 of the License, or
  7 | (at your option) any later version.
  8 | 
  9 | This program is distributed in the hope that it will be useful,
 10 | but WITHOUT ANY WARRANTY; without even the implied warranty of
 11 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 12 | GNU General Public License for more details.
 13 | 
 14 | You should have received a copy of the GNU General Public License
 15 | along with this program.  If not, see <http://www.gnu.org/licenses/>.
 16 | */
 17 | 
 18 | /*
 19 | Python wrapper
 20 | */
 21 | 
 22 | %module(docstring="Module to compute DeepFlow") deepflow2
 23 | 
 24 | %{
 25 |     #define SWIG_FILE_WITH_INIT
 26 | 
 27 |     #include <numpy/arrayobject.h>
 28 | 
 29 |     /* Checks that `a` is a non-NULL, C-contiguous NumPy array whose type id equals expected_npy; on any failure it prints a message to stderr and makes the ENCLOSING function return NULL. */
 30 |     #define CHECK_NUMPY_ARRAY(a, expected_npy)                                 \
 31 |       if(!a) {                                                              \
 32 |         fprintf(stderr,"error in %s(): NULL input\n",__PRETTY_FUNCTION__);             \
 33 |         return NULL;                                                        \
 34 |       }                                                                     \
 35 |       if(!PyArray_Check(a)) {                                               \
 36 |         fprintf(stderr,"error in %s(): input not numpy array\n",__PRETTY_FUNCTION__);  \
 37 |         return NULL;                                                        \
 38 |       }                                                                     \
 39 |       if(!PyArray_ISCONTIGUOUS(a)) {                                        \
 40 |         fprintf(stderr,"error in %s(): array is not C-contiguous\n",__PRETTY_FUNCTION__);  \
 41 |         return NULL;                                                        \
 42 |       }                                                                     \
 43 |       if(PyArray_TYPE(a)!=expected_npy) {                                   \
 44 |         fprintf(stderr,"error in %s(): input has bad type (type id %d != " #expected_npy " %d)\n",__PRETTY_FUNCTION__, \
 45 |                 PyArray_TYPE(a),expected_npy);                              \
 46 |         return NULL;                                                        \
 47 |       }
 48 | 
 49 | %}
 50 | 
 51 | %init %{
 52 |     import_array();
 53 | %}
 54 | 
 55 | 
 56 | %{
 57 |     #include "image.h"
 58 | %}
 59 | 
 60 | %typemap(in) 
 61 |   (image_t* img) 
 62 |   (image_t image) {
 63 |   /* Input typemap: view a 2-D float32 NumPy array (height x width) as an image_t without copying its data; Python None maps to a NULL pointer. */
 64 |   PyObject* a = $input;
 65 |   if(a==Py_None) {
 66 |     $1 = NULL;
 67 |   } else {
 68 |     CHECK_NUMPY_ARRAY(a, NPY_FLOAT)
 69 |     image.data = (float*) PyArray_DATA(a);
 70 |     /* Read the dimensions through the NumPy C API: fetching the "shape" attribute returned a new reference that was never released (one leaked tuple per call). */
 71 |     assert(PyArray_NDIM((PyArrayObject*)a)==2);
 72 |     image.height = (int) PyArray_DIM((PyArrayObject*)a,0);
 73 |     image.width = (int) PyArray_DIM((PyArrayObject*)a,1);
 74 |     assert( image.width%4==0); /* rows must already be padded to a multiple of 4 floats */
 75 |     image.stride = image.width;
 76 |     $1=&image;
 77 |   }
 78 | }
 79 | %apply (image_t* img) {(image_t* )};
 80 | 
 81 | %typemap(in) 
 82 |   (color_image_t* cimg) 
 83 |   (color_image_t cimage) {
 84 |   /* Input typemap: view a 3 x height x width float32 NumPy array as a color_image_t without copying; the three planes are consecutive in memory. None maps to NULL. */
 85 |   PyObject* a = $input;
 86 |   if(a==Py_None) {
 87 |     $1 = NULL;
 88 |   } else {
 89 |     CHECK_NUMPY_ARRAY(a, NPY_FLOAT)
 90 |     cimage.c1 = (float*) PyArray_DATA(a);
 91 |     /* Read the dimensions through the NumPy C API: fetching the "shape" attribute returned a new reference that was never released (one leaked tuple per call). */
 92 |     assert(PyArray_NDIM((PyArrayObject*)a)==3);
 93 |     assert( PyArray_DIM((PyArrayObject*)a,0) == 3);
 94 |     cimage.height =  (int) PyArray_DIM((PyArrayObject*)a,1);
 95 |     cimage.width =  (int) PyArray_DIM((PyArrayObject*)a,2);
 96 |     assert( cimage.width%4==0); /* rows must already be padded to a multiple of 4 floats */
 97 |     cimage.stride = cimage.width;
 98 |     cimage.c2 = cimage.c1 + cimage.stride*cimage.height; /* second plane starts right after the first */
 99 |     cimage.c3 = cimage.c2 + cimage.stride*cimage.height; /* third plane starts right after the second */
100 |     $1=&cimage;
101 |   }
102 | }
103 | %apply (color_image_t* cimg) {(color_image_t* )};
104 | 
105 | void deepflow2_numpy( int w, image_t* wx, image_t* wy, color_image_t* im1, color_image_t* im2, image_t* match, char *options);
106 | 
107 | void usage_python();
108 | 
109 | %{
110 |     #include "io.h"
111 |     #include "image.h"
112 |     #include "opticalflow.h"
113 |     #include <string.h>
114 |     /* Called by the Python wrapper: turns the optional match list into dense match images, parses the option string, runs optical_flow() and copies the resulting flow into wx / wy. */
115 |     void deepflow2_numpy( int w, image_t* wx, image_t* wy, color_image_t* im1, color_image_t* im2, image_t* match, char *options){
116 |         // the typemaps set width to the padded row length; restore the true image width w
117 |         wx->width = w;
118 |         wy->width = w;
119 |         im1->width = w;
120 |         im2->width = w;
121 |         int h = im1->height;
122 |         
123 |         // read the matches: one row per match, starting with x1 y1 x2 y2
124 |         image_t *match_x = NULL, *match_y = NULL, *match_z = NULL;
125 |         if( match != NULL){
126 |             match_x = image_new(w, h);
127 |             match_y = image_new(w, h);
128 |             match_z = image_new(w, h);
129 |             image_erase(match_x); image_erase(match_y); image_erase(match_z);
130 |             int i;
131 |             for( i = 0 ; i<match->height ; i++){
132 |                 float x1 = match->data[i*match->stride+0], y1 = match->data[i*match->stride+1], x2 = match->data[i*match->stride+2], y2 = match->data[i*match->stride+3];
133 |                 if( x1<0 || y1<0 || x2<0 || y2<0 || x1>=w || y1>=h || x2>=w || y2>=h){
134 |                     fprintf(stderr, "Warning: match out of bound: %f %f -> %f %f\n", x1, y1, x2, y2);
135 |                     x1 = MINMAX(x1, w);
136 |                     x2 = MINMAX(x2, w);
137 |                     y1 = MINMAX(y1, h);
138 |                     y2 = MINMAX(y2, h);
139 |                 }
140 |                 int pos = (int) (y1*match_x->stride+x1);
141 |                 match_x->data[ pos ] = x2-x1; // displacement stored at the source pixel
142 |                 match_y->data[ pos ] = y2-y1;
143 |                 match_z->data[ pos ] = 1.0f;  // marks that a match exists at this pixel
144 |             }
145 |         }
146 |         
147 |         // set params to default
148 |         optical_flow_params_t* params = (optical_flow_params_t*) malloc(sizeof(optical_flow_params_t));
149 |         if(!params){
150 |             fprintf(stderr,"error deepflow2(): not enough memory\n");
151 |             exit(1);
152 |         }
153 |         optical_flow_params_default(params);
154 | 
155 |         // read options: split the string on spaces (strtok modifies `options` in place)
156 |         if( options!=NULL ){
157 |             int argc=0;
158 |             char* argv[256];
159 |             argv[argc]=strtok(options," ");
160 |             while(argv[argc]!=NULL && argc<255) // bounded: the last valid slot is argv[255]
161 |             { argv[++argc]=strtok(NULL," "); }
162 |             if(argv[argc]!=NULL) // more tokens than argv[] can hold
163 |                 fprintf(stderr, "Warning: too many options, ignoring the extra ones\n");
164 |             parse_options(params, argc, argv, PYTHON_OPTIONS, w, h); // NOTE(review): return value is ignored here (main() frees it) - confirm it is NULL/unused in PYTHON_OPTIONS mode
165 |         }
166 | 
167 |         // launch flow
168 |         image_t *flowx = image_new(w, h), *flowy = image_new(w,h); // optical_flow changes the pointer to the data
169 |         optical_flow(flowx, flowy, im1, im2, params, match_x, match_y, match_z);
170 |         memcpy( wx->data, flowx->data, sizeof(float)*flowx->stride*h);
171 |         memcpy( wy->data, flowy->data, sizeof(float)*flowx->stride*h);
172 | 
173 |         free(params);
174 |         image_delete(flowx);
175 |         image_delete(flowy);
176 |         if(match!=NULL){
177 |             image_delete(match_x);
178 |             image_delete(match_y);
179 |             image_delete(match_z);
180 |         }
181 |     }
182 |     /* Wrapper exposed to Python: forwards to usage() in PYTHON_OPTIONS mode (the Python deepflow2() calls it when an image is missing, to show the available options). */
183 |     void usage_python(){
184 |         usage(PYTHON_OPTIONS);
185 |     }
186 | 
187 | %}
188 | 
189 | 
190 | %pythoncode %{  
191 |     from numpy import float32, concatenate, empty, rollaxis, ascontiguousarray, pad
192 |     def deepflow2( im1=None, im2=None, match=None, options=""):
193 |         """
194 |         flow = deepflow2.deepflow2(image1, image2, match=None, options='')
195 |         Compute the flow between two images, eventually using given matches.
196 |         Images must be HxWx3 numpy arrays (convert to float32).
197 |         Match is an optional numpy array argument (None by default, ie no input match), where each row starts by x1 y1 x2 y2.
198 |         Options is an optional string argument ('' by default), to set the options. Type deepflow2() to see the list of available options.
199 |         The function returns the optical flow as a HxWx2 numpy array."""
200 |         #convert images
201 |         if None in (im1,im2):
202 |             usage_python()
203 |             return
204 |         assert im1.shape == im2.shape, "images must have the same shape"
205 |         if im1.dtype != float32:
206 |             im1 = im1.astype(float32)
207 |         if im2.dtype != float32:
208 |             im2 = im2.astype(float32)
209 |         h, w, nchannels = im1.shape
210 |         assert nchannels==3, "images must have 3 channels"
211 |         stride = 4*((w+3)//4)
212 |         im1 = pad( rollaxis(im1,2), ((0,0),(0,0),(0, stride-w)), 'constant')
213 |         im2 = pad( rollaxis(im2,2), ((0,0),(0,0),(0, stride-w)), 'constant')
214 |         # allocate flow
215 |         flowx = empty((h,stride), dtype=float32)
216 |         flowy = empty((h,stride), dtype=float32)
217 |         # compute flow
218 |         if match is not None:
219 |             assert match.shape[1]>=4
220 |             match = ascontiguousarray(match[:,:4], dtype=float32)
221 |         deepflow2_numpy( w, flowx, flowy, im1, im2, match, options)
222 |         return concatenate ( (flowx[:,:w,None], flowy[:,:w,None]), axis=2)
223 | %} 
224 | 
225 | 
226 | 
227 | 
228 | 
229 | 
230 | 
231 | 


--------------------------------------------------------------------------------
/deep_flow2/deepflow2.m:
--------------------------------------------------------------------------------
 1 | % "flow = deepflow2(image1, image2, match, options)
 2 | %
 3 | % "Compute the flow between two images, optionally using given matches.
 4 | %
 5 | % "Images are HxWx3 single matrices.
 6 | % "Match is an optional argument ([] by default), where each row starts by x1 y1 x2 y2.
 7 | % "Options is an optional string argument ('' by default), to set the options. Type deepflow2() to see the list of available options.
 8 | %
 9 | % "The function returns the optical flow as a HxWx2 single matrix.
10 | 


--------------------------------------------------------------------------------
/deep_flow2/deepflow2.py:
--------------------------------------------------------------------------------
  1 | # This file was automatically generated by SWIG (http://www.swig.org).
  2 | # Version 2.0.11
  3 | #
  4 | # Do not make changes to this file unless you know what you are doing--modify
  5 | # the SWIG interface file instead.
  6 | 
  7 | 
  8 | 
  9 | 
 10 | """
 11 | Module to compute DeepFlow
 12 | """
 13 | 
 14 | 
 15 | from sys import version_info
 16 | if version_info >= (2,6,0):  # on Python 2.6+ look for the compiled extension next to this file first
 17 |     def swig_import_helper():
 18 |         from os.path import dirname
 19 |         import imp
 20 |         fp = None
 21 |         try:
 22 |             fp, pathname, description = imp.find_module('_deepflow2', [dirname(__file__)])  # search only this file's directory
 23 |         except ImportError:
 24 |             import _deepflow2  # not found next to this file: fall back to a plain import
 25 |             return _deepflow2
 26 |         if fp is not None:  # NOTE(review): when fp is None the helper falls through and returns None
 27 |             try:
 28 |                 _mod = imp.load_module('_deepflow2', fp, pathname, description)
 29 |             finally:
 30 |                 fp.close()  # the handle returned by find_module is closed whether or not loading succeeded
 31 |             return _mod
 32 |     _deepflow2 = swig_import_helper()
 33 |     del swig_import_helper  # one-shot helper, removed from the module namespace
 34 | else:
 35 |     import _deepflow2
 36 | del version_info
 37 | try:
 38 |     _swig_property = property
 39 | except NameError:
 40 |     pass # Python < 2.2 doesn't have 'property'.
 41 | def _swig_setattr_nondynamic(self,class_type,name,value,static=1):  # SWIG-generated attribute setter
 42 |     if (name == "thisown"): return self.this.own(value)  # the ownership flag is forwarded to the wrapped object
 43 |     if (name == "this"):
 44 |         if type(value).__name__ == 'SwigPyObject':
 45 |             self.__dict__[name] = value  # store the SwigPyObject handle directly on the instance
 46 |             return
 47 |     method = class_type.__swig_setmethods__.get(name,None)  # setter registered by the class for this name, if any
 48 |     if method: return method(self,value)
 49 |     if (not static):
 50 |         self.__dict__[name] = value  # non-static mode: unknown names become plain instance attributes
 51 |     else:
 52 |         raise AttributeError("You cannot add attributes to %s" % self)  # static mode: unknown names are rejected
 53 | 
 54 | def _swig_setattr(self,class_type,name,value):  # same as _swig_setattr_nondynamic with static=0
 55 |     return _swig_setattr_nondynamic(self,class_type,name,value,0)
 56 | 
 57 | def _swig_getattr(self,class_type,name):  # SWIG-generated attribute getter
 58 |     if (name == "thisown"): return self.this.own()  # query the ownership flag of the wrapped object
 59 |     method = class_type.__swig_getmethods__.get(name,None)  # getter registered by the class for this name, if any
 60 |     if method: return method(self)
 61 |     raise AttributeError(name)  # no getter registered under this name
 62 | 
 63 | def _swig_repr(self):  # repr helper producing "<module.Class; proxy of ... >"
 64 |     try: strthis = "proxy of " + self.this.__repr__()
 65 |     except: strthis = ""  # any failure while reading self.this yields an empty description
 66 |     return "<%s.%s; %s >" % (self.__class__.__module__, self.__class__.__name__, strthis,)
 67 | 
 68 | try:
 69 |     _object = object  # alias used as base class when new-style classes are available
 70 |     _newclass = 1
 71 | except AttributeError:
 72 |     class _object : pass  # fallback base class
 73 |     _newclass = 0
 74 | 
 75 | 
 76 | 
 77 | def deepflow2_numpy(*args):  # forwards every argument unchanged to the compiled extension
 78 |   return _deepflow2.deepflow2_numpy(*args)
 79 | deepflow2_numpy = _deepflow2.deepflow2_numpy  # rebinds the name straight to the extension function, replacing the def above
 80 | 
 81 | def usage_python():  # forwards to the extension's usage_python (deepflow2() calls it when an image is missing)
 82 |   return _deepflow2.usage_python()
 83 | usage_python = _deepflow2.usage_python  # rebinds the name straight to the extension function, replacing the def above
 84 | from numpy import float32, concatenate, empty, rollaxis, ascontiguousarray, pad
 85 | def deepflow2( im1=None, im2=None, match=None, options=""):
 86 |     """
 87 |     flow = deepflow2.deepflow2(image1, image2, match=None, options='')
 88 |     Compute the flow between two images, eventually using given matches.
 89 |     Images must be HxWx3 numpy arrays (convert to float32).
 90 |     Match is an optional numpy array argument (None by default, ie no input match), where each row starts by x1 y1 x2 y2.
 91 |     Options is an optional string argument ('' by default), to set the options. Type deepflow2() to see the list of available options.
 92 |     The function returns the optical flow as a HxWx2 numpy array."""
 93 |     #convert images
 94 |     if None in (im1,im2):
 95 |         usage_python()
 96 |         return
 97 |     assert im1.shape == im2.shape, "images must have the same shape"
 98 |     if im1.dtype != float32:
 99 |         im1 = im1.astype(float32)
100 |     if im2.dtype != float32:
101 |         im2 = im2.astype(float32)
102 |     h, w, nchannels = im1.shape
103 |     assert nchannels==3, "images must have 3 channels"
104 |     stride = 4*((w+3)//4)
105 |     im1 = pad( rollaxis(im1,2), ((0,0),(0,0),(0, stride-w)), 'constant')
106 |     im2 = pad( rollaxis(im2,2), ((0,0),(0,0),(0, stride-w)), 'constant')
107 |     # allocate flow
108 |     flowx = empty((h,stride), dtype=float32)
109 |     flowy = empty((h,stride), dtype=float32)
110 |     # compute flow
111 |     if match is not None:
112 |         assert match.shape[1]>=4
113 |         match = ascontiguousarray(match[:,:4], dtype=float32)
114 |     deepflow2_numpy( w, flowx, flowy, im1, im2, match, options)
115 |     return concatenate ( (flowx[:,:w,None], flowy[:,:w,None]), axis=2)
116 | 
117 | # This file is compatible with both classic and new-style classes.
118 | 
119 | 
120 | 


--------------------------------------------------------------------------------
/deep_flow2/deepflow2_matlab.cpp:
--------------------------------------------------------------------------------
  1 | /*
  2 | Copyright (C) 2013 Philippe Weinzaepfel
  3 | 
  4 | This program is free software: you can redistribute it and/or modify
  5 | it under the terms of the GNU General Public License as published by
  6 | the Free Software Foundation, either version 3 of the License, or
  7 | (at your option) any later version.
  8 | 
  9 | This program is distributed in the hope that it will be useful,
 10 | but WITHOUT ANY WARRANTY; without even the implied warranty of
 11 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 12 | GNU General Public License for more details.
 13 | 
 14 | You should have received a copy of the GNU General Public License
 15 | along with this program.  If not, see <http://www.gnu.org/licenses/>.
 16 | */
 17 | 
 18 | /*
 19 | MATLAB Wrapper
 20 | */
 21 | #include <mex.h>
 22 | #include <assert.h>
 23 | #include <math.h>
 24 | #include <string.h>
 25 | 
 26 | #include <stdint.h>
 27 | 
 28 | #define printf mexPrintf
 29 | 
 30 | extern "C" {
 31 |     #include "image.h"
 32 |     #include "opticalflow.h"
 33 |     #include "io.h"
 34 | }
 35 | 
 36 | color_image_t *input3darray_to_color_image(const mxArray *p){   // copy a column-major HxWx3 single array into a newly allocated color_image_t
 37 |     const mwSize *dims = mxGetDimensions(p);   // mxGetDimensions() returns mwSize*, which is not int* when large array dimensions are enabled
 38 |     const int h = (int) dims[0], w = (int) dims[1];
 39 |     assert( dims[2]==3 );   // mexFunction checks the channel count before calling; this is only a debug guard
 40 |     const float *in = (const float*) mxGetData(p);
 41 |     color_image_t *out = color_image_new(w, h);
 42 |     const int s = out->stride;
 43 |     for(int c=0 ; c<3 ; c++){
 44 |         const float *inptr = in + c*w*h;   // input plane c: w*h floats, column-major
 45 |         float *outptr = out->c1 + c*s*h;   // output plane c: s*h floats, row-major with padded rows
 46 |         for( int j=0 ; j<h ; j++){
 47 |             for( int i=0 ; i<w ; i++){
 48 |                 outptr[j*s+i] = inptr[i*h+j];   // transpose: (row j, col i) is stored at i*h+j in the input
 49 |             }
 50 |         }
 51 |     }
 52 |     return out;   // returned to the caller, which releases it with color_image_delete() (see mexFunction)
 53 | }
 54 | 
 55 | void input2darray_to_matches( image_t *match_x, image_t *match_y, image_t *match_z, const mxArray *p){   // write each match row (x1 y1 x2 y2) into the three match images at pixel (x1,y1)
 56 |     const int nmatch = (int) mxGetM(p);   // one match per row of the input matrix
 57 |     const int w = match_x->width, h = match_x->height, s = match_x->stride;
 58 |     const float *data = (const float*) mxGetData(p);   // column-major: column k starts at data[k*nmatch]
 59 |     image_erase(match_x); image_erase(match_y); image_erase(match_z);   // pixels without a match stay at 0
 60 |     for( int i=0 ; i<nmatch ; i++){
 61 |         float x1 = data[0*nmatch+i], y1 = data[1*nmatch+i], x2 = data[2*nmatch+i], y2 = data[3*nmatch+i];
 62 |         if( x1<0 || y1<0 || x2<0 || y2<0 || x1>=w || y1>=h || x2>=w || y2>=h){
 63 |             fprintf(stderr, "Warning: match out of bound: %f %f -> %f %f\n", x1, y1, x2, y2);
 64 |             x1 = MINMAX(x1,w);   // clamp every coordinate into the image
 65 |             x2 = MINMAX(x2,w);
 66 |             y1 = MINMAX(y1,h);
 67 |             y2 = MINMAX(y2,h);
 68 |         }
 69 |         const int pos = ((int) y1)*s + (int) x1;   // truncate each coordinate on its own: (int)(y1*s+x1) shifts the column when y1 has a fractional part
 70 |         match_x->data[ pos ] = x2-x1;   // displacement along x
 71 |         match_y->data[ pos ] = y2-y1;   // displacement along y
 72 |         match_z->data[ pos ] = 1.0f;    // marks the pixel as carrying a match
 73 |     }
 74 | }
 75 | 
 76 | 
 77 | 
 78 | void flow_to_output3darray(image_t *wx, image_t *wy, mxArray *p){   // transpose the two row-major flow planes into the column-major output array
 79 |     const int rows = wx->height, cols = wx->width, pitch = wx->stride;   // wx's geometry is used for both planes
 80 |     float *out_u = (float*) mxGetData(p), *out_v = out_u + cols*rows;   // out_v is the second output plane, cols*rows floats after the first
 81 |     for( int r=0 ; r<rows ; r++) {
 82 |         const float *u_row = wx->data + r*pitch, *v_row = wy->data + r*pitch;
 83 |         for( int c=0 ; c<cols ; c++) {
 84 |             out_u[c*rows+r] = u_row[c]; out_v[c*rows+r] = v_row[c];
 85 |         }
 86 |     }
 87 | }
 88 | 
 89 | void mexFunction( int nl, mxArray *pl[], int nr, const mxArray *pr[] ) {   // MEX gateway: flow = deepflow2(image1, image2, match, options)
 90 |     
 91 |     if( nr==0 ){   // called without input: only print the usage
 92 |         usage(MATLAB_OPTIONS);
 93 |         return;
 94 |     }
 95 |     if ( nl > 1){   // nl is 0 when the caller does not assign the result, which is still a valid call
 96 |         usage(MATLAB_OPTIONS);
 97 |         mexErrMsgTxt("error: returns one output");
 98 |         return;
 99 |     }
100 |     if( nr < 2 || nr > 4){
101 |         usage(MATLAB_OPTIONS);
102 |         mexErrMsgTxt("error: takes two to four inputs");
103 |         return;
104 |     }
105 |     
106 |     // The code is originally written for C-order arrays.
107 |     // We thus transpose all arrays in this mex-function which is not efficient...
108 |     
109 |     const mwSize *pDims;   // mxGetDimensions() returns mwSize*, which is not int* when large array dimensions are enabled
110 |     if( mxGetNumberOfDimensions(pr[0]) != 3 ) mexErrMsgTxt("input images must have 3 dimensions");
111 |     if( !mxIsClass(pr[0], "single") ) mexErrMsgTxt("input images must be single");
112 |     pDims = mxGetDimensions(pr[0]);
113 |     if( pDims[2]!=3 ) mexErrMsgTxt("input images must have 3 channels");
114 |     const int h = (int) pDims[0], w = (int) pDims[1];
115 |     color_image_t *im1 = input3darray_to_color_image( pr[0] );
116 |    
117 |     if( mxGetNumberOfDimensions(pr[1]) != 3 ) mexErrMsgTxt("input images must have 3 dimensions");
118 |     if( !mxIsClass(pr[1], "single") ) mexErrMsgTxt("input images must be single");
119 |     pDims = mxGetDimensions(pr[1]);
120 |     if( (int) pDims[0]!=h || (int) pDims[1]!=w || pDims[2]!=3) mexErrMsgTxt( "input images must have the same size" );
121 |     color_image_t *im2 = input3darray_to_color_image( pr[1] );
122 | 
123 |     image_t *match_x = NULL, *match_y = NULL, *match_z = NULL;   // stay NULL when no match is given
124 |     if( nr>2 && !mxIsEmpty(pr[2]) ){
125 |         if( mxGetNumberOfDimensions(pr[2]) != 2 ) mexErrMsgTxt("input matches must be a 2d-matrix");
126 |         if( !mxIsClass(pr[2], "single")) mexErrMsgTxt("input matches must be single");  
127 |         pDims = mxGetDimensions(pr[2]);   // dimensions of the match matrix itself (pr[1] is the second image)
128 |         if( pDims[1]<4) mexErrMsgTxt( "input matches must have at least 4 columns: x1 y1 x2 y2" );
129 |         match_x = image_new(w, h); match_y = image_new(w, h); match_z = image_new(w, h); 
130 |         input2darray_to_matches( match_x, match_y, match_z, pr[2]);
131 |     }
132 |         
133 |     // set params to default
134 |     optical_flow_params_t* params = (optical_flow_params_t*) malloc(sizeof(optical_flow_params_t));
135 |     if(!params){
136 |         // exit() would terminate the whole MATLAB session; raise a MATLAB error instead
137 |         mexErrMsgTxt("error deepflow2(): not enough memory");
138 |     }
139 |     optical_flow_params_default(params);
140 | 
141 |     // read options
142 |     if( nr > 3 ){
143 |         char *options = mxArrayToString(pr[3]);
144 |         if( !options )  mexErrMsgTxt("Fourth parameter must be a string");
145 |         int argc=0;
146 |         char* argv[256];
147 |         argv[argc]=strtok(options," ");   // split the option string on spaces, in place
148 |         while(argv[argc]!=NULL && argc<255)   // stop after 255 tokens so that argv[] is never written out of bounds
149 |         {
150 |             argv[++argc]=strtok(NULL," ");
151 |         }
152 |         parse_options(params, argc, argv, MATLAB_OPTIONS, w, h);
153 |     }
154 |     
155 |     
156 |     image_t *wx = image_new(im1->width,im1->height), *wy = image_new(im1->width,im1->height);
157 |     optical_flow(wx, wy, im1, im2, params, match_x, match_y, match_z);
158 |     
159 |     const mwSize dims[3] = {(mwSize) h, (mwSize) w, 2};   // mxCreateNumericArray() takes the dimensions as mwSize
160 |     pl[0] = mxCreateNumericArray(3, dims, mxSINGLE_CLASS, mxREAL);
161 |     flow_to_output3darray(wx, wy, pl[0]);
162 |     
163 |     image_delete(wx);
164 |     image_delete(wy);
165 |     if( match_x ){ image_delete(match_x); image_delete(match_y); image_delete(match_z); }   // the three images are allocated together, only when matches were given
166 |     color_image_delete(im1); color_image_delete(im2);
167 |     free(params);
168 | 
169 | }
170 | 


--------------------------------------------------------------------------------
/deep_flow2/image.h:
--------------------------------------------------------------------------------
  1 | /*
  2 | Copyright (C) 2013 Philippe Weinzaepfel
  3 | 
  4 | This program is free software: you can redistribute it and/or modify
  5 | it under the terms of the GNU General Public License as published by
  6 | the Free Software Foundation, either version 3 of the License, or
  7 | (at your option) any later version.
  8 | 
  9 | This program is distributed in the hope that it will be useful,
 10 | but WITHOUT ANY WARRANTY; without even the implied warranty of
 11 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 12 | GNU General Public License for more details.
 13 | 
 14 | You should have received a copy of the GNU General Public License
 15 | along with this program.  If not, see <http://www.gnu.org/licenses/>.
 16 | */
 17 | #ifndef __IMAGE_H_
 18 | #define __IMAGE_H_
 19 | 
 20 | #include <stdio.h>
 21 | 
 22 | #define MIN(a, b) ((a) < (b) ? (a) : (b))   /* smaller of a and b; the selected argument is evaluated twice */
 23 | #define MAX(a, b) ((a) > (b) ? (a) : (b))   /* larger of a and b; the selected argument is evaluated twice */
 24 | #define MINMAX(a,b) MIN( MAX(a,0) , b-1 )   /* clamp a to [0, b-1]; NOTE(review): b is not parenthesised, so pass a plain identifier or literal */
 25 | 
 26 | /********** STRUCTURES *********/
 27 | 
 28 | /* structure for 1-channel image; pixel (x,y) is addressed as data[y*stride+x] */
 29 | typedef struct image_s
 30 | {
 31 |   int width;		/* Width of the image */
 32 |   int height;		/* Height of the image */
 33 |   int stride;		/* Width of the memory (width + padding such that it is a multiple of 4) */
 34 |   float *data;		/* Image data, aligned */
 35 | } image_t;
 36 | 
 37 | /* structure for 3-channels image stored with one layer per color; the layers are consecutive in memory (the MATLAB wrapper addresses layer c at c1 + c*stride*height). */
 38 | typedef struct color_image_s
 39 | {
 40 |     int width;			/* Width of the image */
 41 |     int height;			/* Height of the image */
 42 |     int stride;         /* Width of the memory (width + padding such that it is a multiple of 4) */
 43 |     float *c1;			/* Color 1, aligned */
 44 |     float *c2;			/* Color 2, consecutive to c1*/
 45 |     float *c3;			/* Color 3, consecutive to c2 */
 46 | } color_image_t;
 47 | 
 48 | /* structure for color image pyramid */
 49 | typedef struct color_image_pyramid_s 
 50 | {
 51 |   float scale_factor;          /* difference of scale between two levels */
 52 |   int min_size;                /* minimum size for width or height at the coarsest level */
 53 |   int size;                    /* number of levels in the pyramid */
 54 |   color_image_t **images;      /* list of images with images[0] the original one, images[size-1] the coarsest one (optical_flow starts at size-1 and works down to 0) */
 55 | } color_image_pyramid_t;
 56 | 
 57 | /* structure for convolutions; built by convolution_new() and released by convolution_delete() */
 58 | typedef struct convolution_s
 59 | {
 60 |     int order;			/* Order of the convolution (optical_flow passes order 2 with 3 half coefficients and order 1 with 2) */
 61 |     float *coeffs;		/* Coefficients */
 62 |     float *coeffs_accu;	/* Accumulated coefficients */
 63 | } convolution_t;
 64 | 
 65 | /********** Create/Delete **********/
 66 | 
 67 | /* allocate a new image of size width x height */
 68 | image_t *image_new(const int width, const int height);
 69 | 
 70 | /* allocate a new image and copy the content from src */
 71 | image_t *image_cpy(const image_t *src);
 72 | 
 73 | /* set all pixels values to zeros */
 74 | void image_erase(image_t *image);
 75 | 
 76 | /* free memory of an image */
 77 | void image_delete(image_t *image);
 78 | 
 79 | /* multiply an image by a scalar */
 80 | void image_mul_scalar(image_t *image, const float scalar);
 81 | 
 82 | /* allocate a new color image of size width x height */
 83 | color_image_t *color_image_new(const int width, const int height);
 84 | 
 85 | /* allocate a new color image and copy the content from src */
 86 | color_image_t *color_image_cpy(const color_image_t *src);
 87 | 
 88 | /* set all pixels values to zeros */
 89 | void color_image_erase(color_image_t *image);
 90 | 
 91 | /* free memory of a color image */
 92 | void color_image_delete(color_image_t *image);
 93 | 
 94 | /* reallocate the memory of an image to fit the new width height */
 95 | void resize_if_needed_newsize(image_t *im, const int w, const int h);
 96 | 
 97 | /************ Resizing *********/
 98 | 
 99 | /* resize an image with bilinear interpolation */
100 | image_t *image_resize_bilinear(const image_t *src, const float scale);
101 | 
102 | /* resize an image with bilinear interpolation to fit the new width and height; reallocation is done if necessary */
103 | void image_resize_bilinear_newsize(image_t *dst, const image_t *src, const int new_width, const int new_height);
104 | 
105 | /* resize a color image  with bilinear interpolation */
106 | color_image_t *color_image_resize_bilinear(const color_image_t *src, const float scale);
107 | 
108 | /************ Convolution ******/
109 | 
110 | /* return half coefficient of a gaussian filter */
111 | float *gaussian_filter(const float sigma, int *fSize);
112 | 
113 | /* create a convolution structure with a given order, half_coeffs, symmetric or anti-symmetric according to even parameter */
114 | convolution_t *convolution_new(int order, const float *half_coeffs, const int even);
115 | 
116 | /* perform an horizontal convolution of an image */
117 | void convolve_horiz(image_t *dest, const image_t *src, const convolution_t *conv);
118 | 
119 | /* perform a vertical convolution of an image */
120 | void convolve_vert(image_t *dest, const image_t *src, const convolution_t *conv);
121 | 
122 | /* free memory of a convolution structure */
123 | void convolution_delete(convolution_t *conv);
124 | 
125 | /* perform horizontal and/or vertical convolution to a color image */
126 | void color_image_convolve_hv(color_image_t *dst, const color_image_t *src, const convolution_t *horiz_conv, const convolution_t *vert_conv);
127 | 
128 | /************ Pyramid **********/
129 | 
130 | /* create a pyramid of color images using a given scale factor, stopping when one dimension reaches min_size, and applying a gaussian smoothing of standard deviation spyr (no smoothing if 0) */
131 | color_image_pyramid_t *color_image_pyramid_create(const color_image_t *src, const float scale_factor, const int min_size, const float spyr);
132 | 
133 | /* delete the structure of a pyramid of color images */
134 | void color_image_pyramid_delete(color_image_pyramid_t *pyr);
135 | 
136 | #endif
137 | 


--------------------------------------------------------------------------------
/deep_flow2/io.h:
--------------------------------------------------------------------------------
 1 | /*
 2 | Copyright (C) 2013 Philippe Weinzaepfel
 3 | 
 4 | This program is free software: you can redistribute it and/or modify
 5 | it under the terms of the GNU General Public License as published by
 6 | the Free Software Foundation, either version 3 of the License, or
 7 | (at your option) any later version.
 8 | 
 9 | This program is distributed in the hope that it will be useful,
10 | but WITHOUT ANY WARRANTY; without even the implied warranty of
11 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
12 | GNU General Public License for more details.
13 | 
14 | You should have received a copy of the GNU General Public License
15 | along with this program.  If not, see <http://www.gnu.org/licenses/>.
16 | */
17 | #ifndef __IO_H__
18 | #define __IO_H__
19 | 
20 | #include <stdlib.h>
21 | 
22 | #include "image.h"
23 | #include "opticalflow.h"
24 | 
25 | /* read a flow file and returns a pointer with two images containing the flow along x and y axis */
26 | image_t** readFlowFile(const char* filename);
27 | 
28 | /* write a flow to a file */
29 | void writeFlowFile(const char* filename, const image_t *flowx, const image_t *flowy);
30 | 
31 | /* load a color image from a file in jpg, png or ppm*/
32 | color_image_t *color_image_load(const char *fname);
33 | 
34 | 
35 | #define EXE_OPTIONS 0
36 | #define MATLAB_OPTIONS 1
37 | #define PYTHON_OPTIONS 2
38 | /* print usage */
39 | void usage(const int language);
40 | 
41 | /* parse options and possibly return the matches given as argument */
42 | image_t** parse_options(optical_flow_params_t* params, int argc, char **argv, const int language, const int width, const int height);
43 | 
44 | #endif
45 | 


--------------------------------------------------------------------------------
/deep_flow2/opticalflow.c:
--------------------------------------------------------------------------------
  1 | /*
  2 | Copyright (C) 2013 Philippe Weinzaepfel
  3 | 
  4 | This program is free software: you can redistribute it and/or modify
  5 | it under the terms of the GNU General Public License as published by
  6 | the Free Software Foundation, either version 3 of the License, or
  7 | (at your option) any later version.
  8 | 
  9 | This program is distributed in the hope that it will be useful,
 10 | but WITHOUT ANY WARRANTY; without even the implied warranty of
 11 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 12 | GNU General Public License for more details.
 13 | 
 14 | You should have received a copy of the GNU General Public License
 15 | along with this program.  If not, see <http://www.gnu.org/licenses/>.
 16 | */
 17 | #include <stdlib.h>
 18 | #include <math.h>
 19 | #include <string.h>
 20 | #include <malloc.h>
 21 | 
 22 | #include "opticalflow.h"
 23 | #include "opticalflow_aux.h"
 24 | #include "solver.h"
 25 | #include "image.h"
 26 | 
 27 | #include <xmmintrin.h>
 28 | typedef __v4sf v4sf;
 29 | 
 30 | convolution_t *deriv, *deriv_flow;   /* derivative filters; created at the start of optical_flow() and deleted before it returns */
 31 | float half_alpha, half_delta_over3, half_beta, half_gamma_over3;   /* pre-scaled weights computed from params in optical_flow() */
 32 | 
 33 | /* perform flow computation at one level of the pyramid: wx and wy hold the current flow on entry and are overwritten with the refined flow; all temporaries are allocated and freed here */
 34 | void compute_one_level(image_t *wx, image_t *wy, color_image_t *im1, color_image_t *im2, image_t *desc_flow_x, image_t *desc_flow_y, image_t *desc_weight, const optical_flow_params_t *params){ 
 35 |     const int width = wx->width, height = wx->height, stride=wx->stride; // every temporary below is allocated with wx's size
 36 |     int i_inner_iteration;
 37 |   
 38 |     image_t *du = image_new(width,height), *dv = image_new(width,height), // the flow increment
 39 |         *mask = image_new(width,height), // mask containing 0 if a point goes outside image boundary, 1 otherwise
 40 |         *smooth_horiz = image_new(width,height), *smooth_vert = image_new(width,height), // horiz: (i,j) contains the diffusivity coeff from (i,j) to (i+1,j) 
 41 |         *uu = image_new(width,height), *vv = image_new(width,height), // flow plus flow increment
 42 |         *a11 = image_new(width,height), *a12 = image_new(width,height), *a22 = image_new(width,height), // system matrix A of Ax=b for each pixel
 43 |         *b1 = image_new(width,height), *b2 = image_new(width,height), // system matrix b of Ax=b for each pixel
 44 |         *smooth_weight = compute_smoothness_weight(im1, 5.0f, deriv); // local weights for smoothness
 45 |         
 46 |     color_image_t *w_im2 = color_image_new(width,height), // warped second image
 47 |         *Ix = color_image_new(width,height), *Iy = color_image_new(width,height), *Iz = color_image_new(width,height), // first order derivatives
 48 |         *Ixx = color_image_new(width,height), *Ixy = color_image_new(width,height), *Iyy = color_image_new(width,height), *Ixz = color_image_new(width,height), *Iyz = color_image_new(width,height); // second order derivatives
 49 |   
 50 |     // warp second image
 51 |     image_warp(w_im2, mask, im2, wx, wy);
 52 |     // compute derivatives
 53 |     get_derivatives(im1, w_im2, deriv, Ix, Iy, Iz, Ixx, Ixy, Iyy, Ixz, Iyz);
 54 |     // erase du and dv
 55 |     image_erase(du);
 56 |     image_erase(dv);
 57 |     // initialize uu and vv
 58 |     memcpy(uu->data,wx->data,wx->stride*wx->height*sizeof(float)); // uu/vv start as a copy of the incoming flow
 59 |     memcpy(vv->data,wy->data,wy->stride*wy->height*sizeof(float));
 60 |     // inner fixed point iterations
 61 |     for(i_inner_iteration = 0 ; i_inner_iteration < params->n_inner_iteration ; i_inner_iteration++){
 62 |         //  compute robust function and system
 63 |         compute_smoothness(smooth_horiz, smooth_vert, uu, vv, smooth_weight, deriv_flow, half_alpha );
 64 |         compute_data_and_match(a11, a12, a22, b1, b2, mask, wx, wy, du, dv, uu, vv, Ix, Iy, Iz, Ixx, Ixy, Iyy, Ixz, Iyz, desc_weight, desc_flow_x, desc_flow_y, half_delta_over3, half_beta, half_gamma_over3);
 65 |         sub_laplacian(b1, wx, smooth_horiz, smooth_vert);
 66 |         sub_laplacian(b2, wy, smooth_horiz, smooth_vert);
 67 |         // solve system
 68 |         sor_coupled(du, dv, a11, a12, a22, b1, b2, smooth_horiz, smooth_vert, params->n_solver_iteration, params->sor_omega);
 69 |         // update flow plus flow increment
 70 |         int i;
 71 |         v4sf *uup = (v4sf*) uu->data, *vvp = (v4sf*) vv->data, *wxp = (v4sf*) wx->data, *wyp = (v4sf*) wy->data, *dup = (v4sf*) du->data, *dvp = (v4sf*) dv->data;
 72 |         for( i=0 ; i<height*stride/4 ; i++){ // four floats per step over the whole padded buffer
 73 |             (*uup) = (*wxp) + (*dup);
 74 |             (*vvp) = (*wyp) + (*dvp);
 75 |             uup+=1; vvp+=1; wxp+=1; wyp+=1;dup+=1;dvp+=1;
 76 | 	   }
 77 |     }
 78 |     // add flow increment to current flow
 79 |     memcpy(wx->data,uu->data,uu->stride*uu->height*sizeof(float)); // wx/wy are only overwritten once all inner iterations are done
 80 |     memcpy(wy->data,vv->data,vv->stride*vv->height*sizeof(float)); 
 81 |     // free memory
 82 |     image_delete(du); image_delete(dv);
 83 |     image_delete(mask);
 84 |     image_delete(smooth_horiz); image_delete(smooth_vert);
 85 |     image_delete(uu); image_delete(vv);
 86 |     image_delete(a11); image_delete(a12); image_delete(a22);
 87 |     image_delete(b1); image_delete(b2);
 88 |     image_delete(smooth_weight);
 89 |     color_image_delete(w_im2); 
 90 |     color_image_delete(Ix); color_image_delete(Iy); color_image_delete(Iz);
 91 |     color_image_delete(Ixx); color_image_delete(Ixy); color_image_delete(Iyy); color_image_delete(Ixz); color_image_delete(Iyz);
 92 | }
 93 | 
 94 | /* set flow parameters to default */
 95 | void optical_flow_params_default(optical_flow_params_t *params){
 96 |     if(!params){
 97 |         fprintf(stderr,"Error optical_flow_params_default: argument is null\n");
 98 |         exit(1);
 99 |     }
100 |     params->alpha = 1.0f;
101 |     params->beta = 20.0f;
102 |     params->gamma = 0.7f;
103 |     params->delta = 0.1f;
104 |     params->sigma = 0.6f;
105 |     params->bk = 0.5f;
106 |     params->eta = 0.95f;
107 |     params->min_size = 25;
108 |     params->n_inner_iteration = 5;  
109 |     params->n_solver_iteration = 25;
110 |     params->sor_omega = 1.60f;
111 | }
112 | 
113 | /* set flow parameters to sintel one */
114 | void optical_flow_params_sintel(optical_flow_params_t *params){
115 |     if(!params){
116 |         fprintf(stderr,"Error optical_flow_params_sintel: argument is null\n");
117 |         exit(1);
118 |     }
119 |     params->alpha = 1.0f;
120 |     params->beta = 32.0f;
121 |     params->gamma = 0.56f;
122 |     params->delta = 0.0f;
123 |     params->sigma = 0.45f;
124 |     params->bk = 0.45f;
125 |     params->eta = 0.95f;
126 |     params->min_size = 25;
127 |     params->n_inner_iteration = 5;  
128 |     params->n_solver_iteration = 25;
129 |     params->sor_omega = 1.60f;
130 | }
131 | 
132 | /* set flow parameters to middlebury one */
133 | void optical_flow_params_middlebury(optical_flow_params_t *params){
134 |     if(!params){
135 |         fprintf(stderr,"Error optical_flow_params_middlebury: argument is null\n");
136 |         exit(1);
137 |     }
138 |     params->alpha = 1.0f;
139 |     params->beta = 11.5f;
140 |     params->gamma = 1.09f;
141 |     params->delta = 0.04f;
142 |     params->sigma = 0.65f;
143 |     params->bk = 0.45f;
144 |     params->eta = 0.95f;
145 |     params->min_size = 25;
146 |     params->n_inner_iteration = 5;  
147 |     params->n_solver_iteration = 25;
148 |     params->sor_omega = 1.60f;
149 | }
150 | 
151 | /* set flow parameters to kitti one */
152 | void optical_flow_params_kitti(optical_flow_params_t *params){
153 |     if(!params){
154 |         fprintf(stderr,"Error optical_flow_params_kitti: argument is null\n");
155 |         exit(1);
156 |     }
157 |     params->alpha = 1.0f;
158 |     params->beta = 0.6f;
159 |     params->gamma = 1.09f;
160 |     params->delta = 0.40f;
161 |     params->sigma = 0.60f;
162 |     params->bk = 0.0f;
163 |     params->eta = 0.95f;
164 |     params->min_size = 25;
165 |     params->n_inner_iteration = 5;  
166 |     params->n_solver_iteration = 25;
167 |     params->sor_omega = 1.60f;
168 | }
169 | 
170 | /* Compute the optical flow between im1 and im2 and store it as two 1-channel images in wx for flow along x-axis and wy for flow along y-axis. match_x, match_y and match_z optionally contain the input matches (NULL for no match). params may be NULL to use the defaults; when no match is given, params->beta is set to 0 in the caller's structure. */
171 | void optical_flow(image_t *wx, image_t *wy, const color_image_t *im1, const color_image_t *im2, optical_flow_params_t *params, const image_t *match_x, const image_t *match_y, image_t *match_z){
172 |     optical_flow_params_t *own_params = NULL; // non-NULL only when the parameters are allocated here, so that they can be freed before returning
173 |     // Check parameters
174 |     if(!params){
175 |         params = own_params = (optical_flow_params_t*) malloc(sizeof(optical_flow_params_t));
176 |         if(!params){
177 |           fprintf(stderr,"error optical_flow(): not enough memory\n");
178 |           exit(1);
179 |         }
180 |         optical_flow_params_default(params);
181 |     }
182 | 
183 |     // initialize global variables
184 |     half_alpha = 0.5f*params->alpha;
185 |     half_gamma_over3 = params->gamma*0.5f/3.0f;
186 |     half_delta_over3 = params->delta*0.5f/3.0f;
187 |     half_beta = params->beta*0.5f;
188 |     float deriv_filter[3] = {0.0f, -8.0f/12.0f, 1.0f/12.0f};
189 |     deriv = convolution_new(2, deriv_filter, 0);
190 |     float deriv_filter_flow[2] = {0.0f, -0.5f};
191 |     deriv_flow = convolution_new(1, deriv_filter_flow, 0);
192 |     
193 |     // presmooth images
194 |     int width = im1->width, height = im1->height, filter_size;
195 |     color_image_t *smooth_im1 = color_image_new(width, height), *smooth_im2 = color_image_new(width, height);
196 |     float *presmooth_filter = gaussian_filter(params->sigma, &filter_size);
197 |     convolution_t *presmoothing = convolution_new(filter_size, presmooth_filter, 1);
198 |     color_image_convolve_hv(smooth_im1, im1, presmoothing, presmoothing);
199 |     color_image_convolve_hv(smooth_im2, im2, presmoothing, presmoothing); 
200 |     convolution_delete(presmoothing);
201 |     free(presmooth_filter);
202 | 
203 |     // check descriptors
204 |     image_t *desc_flow_x, *desc_flow_y, *desc_weight, *desc_flow_x_original=NULL, *desc_flow_y_original=NULL, *desc_weight_original=NULL;
205 |     desc_flow_x = image_new(0,0);
206 |     desc_flow_y = image_new(0,0);
207 |     desc_weight = image_new(0,0);
208 |     if(params->beta){
209 |         if(match_x == NULL){
210 |             printf("No descriptor input, weight of descriptor term set to 0\n");    
211 |             params->beta = 0.0f;
212 |             half_beta = 0.0f;
213 |         }else{
214 |             compute_desc_weight(im1, im2, match_x, match_y, match_z, deriv_flow, deriv);
215 |             desc_flow_x_original = image_cpy(match_x); // full-resolution copies, resampled for every pyramid level below
216 |             desc_flow_y_original = image_cpy(match_y);
217 |             desc_weight_original = image_cpy(match_z);
218 |         }
219 |     }  
220 | 
221 |     // building pyramid
222 |     color_image_pyramid_t *pyr1 = color_image_pyramid_create(smooth_im1, 1.0f/params->eta, params->min_size, 0.0f),
223 |                         *pyr2 = color_image_pyramid_create(smooth_im2, 1.0f/params->eta, params->min_size, 0.0f);
224 | 
225 |     // loop over levels, from the last pyramid image (k = size-1) down to the original one (k = 0)
226 |     int k;
227 |     for(k=pyr1->size-1; k>=0 ; k--){
228 |         if(params->bk>0.0f && pyr1->size>1) half_beta = 0.5f*params->beta * pow(((float)k)/((float)pyr1->size-1),params->bk); // a one-level pyramid would give 0/0 here: half_beta then keeps its initial value
229 |         if(k == pyr1->size-1){ 
230 |             // first level	  
231 |             // allocate wx and wy
232 |             resize_if_needed_newsize(wx, pyr1->images[k]->width, pyr1->images[k]->height);
233 |             resize_if_needed_newsize(wy, pyr1->images[k]->width, pyr1->images[k]->height);
234 |             image_erase(wx); image_erase(wy);
235 |         }else{ 
236 |             // resize flow to the new pyramid level size and multiply it by 1/eta
237 |             image_t *tmp = image_new(pyr1->images[k]->width, pyr1->images[k]->height);
238 |             image_resize_bilinear_newsize(tmp, wx, pyr1->images[k]->width, pyr1->images[k]->height);
239 |             resize_if_needed_newsize(wx, pyr1->images[k]->width, pyr1->images[k]->height);
240 |             memcpy(wx->data, tmp->data, tmp->stride*tmp->height*sizeof(float)); 
241 |             image_mul_scalar(wx, 1.0f/params->eta);
242 |             image_resize_bilinear_newsize(tmp, wy, pyr1->images[k]->width, pyr1->images[k]->height);
243 |             resize_if_needed_newsize(wy, pyr1->images[k]->width, pyr1->images[k]->height);
244 |             memcpy(wy->data, tmp->data, tmp->stride*tmp->height*sizeof(float));
245 |             image_mul_scalar(wy, 1.0f/params->eta);     
246 |             image_delete(tmp);
247 |         }
248 | 
249 |         // resize descriptors
250 |         if(params->beta){
251 |             resize_if_needed_newsize(desc_flow_x, pyr1->images[k]->width, pyr1->images[k]->height);
252 |             resize_if_needed_newsize(desc_flow_y, pyr1->images[k]->width, pyr1->images[k]->height);
253 |             resize_if_needed_newsize(desc_weight, pyr1->images[k]->width, pyr1->images[k]->height);
254 |             descflow_resize(desc_flow_x,desc_flow_y,desc_weight,desc_flow_x_original,desc_flow_y_original,desc_weight_original);
255 |         }
256 |      
257 |         compute_one_level(wx, wy, pyr1->images[k], pyr2->images[k], desc_flow_x, desc_flow_y, desc_weight, params);
258 |       
259 |     }
260 |     
261 |     color_image_pyramid_delete(pyr1); color_image_pyramid_delete(pyr2);
262 |     
263 |     // do a last iteration without descriptor if bk==0
264 |     if(params->beta>0.0f && params->bk==0.0f){
265 |         half_beta = 0.0f;
266 |         compute_one_level(wx, wy, smooth_im1, smooth_im2, desc_flow_x, desc_flow_y, desc_weight, params);
267 |         half_beta = 0.5f*params->beta;
268 |     }
269 | 
270 |     // free memory
271 |     color_image_delete(smooth_im1);
272 |     color_image_delete(smooth_im2);
273 |     image_delete(desc_flow_x); image_delete(desc_flow_y); image_delete(desc_weight);
274 |     convolution_delete(deriv); convolution_delete(deriv_flow);
275 |     if(params->beta){image_delete(desc_flow_x_original); image_delete(desc_flow_y_original); image_delete(desc_weight_original);}
276 |     free(own_params); // free(NULL) is a no-op when the caller supplied the parameters
277 | }
278 | 


--------------------------------------------------------------------------------
/deep_flow2/opticalflow.h:
--------------------------------------------------------------------------------
 1 | /*
 2 | Copyright (C) 2013 Philippe Weinzaepfel
 3 | 
 4 | This program is free software: you can redistribute it and/or modify
 5 | it under the terms of the GNU General Public License as published by
 6 | the Free Software Foundation, either version 3 of the License, or
 7 | (at your option) any later version.
 8 | 
 9 | This program is distributed in the hope that it will be useful,
10 | but WITHOUT ANY WARRANTY; without even the implied warranty of
11 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
12 | GNU General Public License for more details.
13 | 
14 | You should have received a copy of the GNU General Public License
15 | along with this program.  If not, see <http://www.gnu.org/licenses/>.
16 | */
17 | #ifndef __OPTICALFLOW_H__
18 | #define __OPTICALFLOW_H__
19 | 
20 | #include <stdio.h>
21 | #include <stdlib.h>
22 | 
23 | #include "image.h"
24 | 
25 | typedef struct optical_flow_params_s { // tuning parameters read by optical_flow()
26 |   float alpha;             // smoothness weight
27 |   float beta;              // matching weight; optical_flow() skips the descriptor resizing when it is 0
28 |   float gamma;             // gradient constancy assumption weight
29 |   float delta;             // color constancy assumption weight
30 |   float sigma;             // presmoothing of the images
31 |   float bk;                // downweight exponent of the matching weight: when bk>0, level k uses 0.5*beta*(k/(n_levels-1))^bk; when bk==0 (and beta>0) a last pass is run with the matching weight set to 0
32 |   float eta;               // downscale factor: the pyramids are created with 1/eta and the flow is multiplied by 1/eta from one level to the next
33 |   int min_size;            // minimum size of the first level (passed to color_image_pyramid_create)
34 |   int n_inner_iteration;   // number of inner fixed point iterations
35 |   int n_solver_iteration;  // number of solver iterations
36 |   float sor_omega;         // omega parameter of the SOR method
37 | } optical_flow_params_t;
38 | 
39 | /* set flow parameters to their default values */
40 | void optical_flow_params_default(optical_flow_params_t *params);
41 | 
42 | /* set flow parameters to the Sintel settings */
43 | void optical_flow_params_sintel(optical_flow_params_t *params);
44 | 
45 | /* set flow parameters to the Middlebury settings */
46 | void optical_flow_params_middlebury(optical_flow_params_t *params);
47 | 
48 | /* set flow parameters to the KITTI settings */
49 | void optical_flow_params_kitti(optical_flow_params_t *params);
50 | 
51 | /* Compute the optical flow between im1 and im2 and store it as two 1-channel images: wx for the flow along the x-axis and wy for the flow along the y-axis. match_x, match_y and match_z optionally contain the input matches (NULL for no match) at any scale. params is not const: the implementation can reset params->beta to 0. match_z is not const: it is handed to compute_desc_weight() as the weight image. */
52 | void optical_flow(image_t *wx, image_t *wy, const color_image_t *im1, const color_image_t *im2, optical_flow_params_t *params, const image_t *match_x, const image_t *match_y, image_t *match_z);
53 | 
54 | #endif
55 | 


--------------------------------------------------------------------------------
/deep_flow2/opticalflow_aux.h:
--------------------------------------------------------------------------------
 1 | /*
 2 | Copyright (C) 2013 Philippe Weinzaepfel
 3 | 
 4 | This program is free software: you can redistribute it and/or modify
 5 | it under the terms of the GNU General Public License as published by
 6 | the Free Software Foundation, either version 3 of the License, or
 7 | (at your option) any later version.
 8 | 
 9 | This program is distributed in the hope that it will be useful,
10 | but WITHOUT ANY WARRANTY; without even the implied warranty of
11 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
12 | GNU General Public License for more details.
13 | 
14 | You should have received a copy of the GNU General Public License
15 | along with this program.  If not, see <http://www.gnu.org/licenses/>.
16 | */
17 | #ifndef __OPTICALFLOW_AUX_
18 | #define __OPTICALFLOW_AUX_
19 | 
20 | #include <stdlib.h>
21 | 
22 | #include "image.h"
23 | 
24 | /* warp a color image according to a flow. src is the input image; wx and wy are the input flow. dst is the warped image, and mask contains 0 or 1 depending on whether the pixel falls outside or inside the image boundaries */
25 | void image_warp(color_image_t *dst, image_t *mask, const color_image_t *src, const image_t *wx, const image_t *wy);
26 | 
27 | /* compute the first- and second-order spatio-temporal derivatives of a color image pair (im1, im2) using the deriv filter; the non-const arguments dx ... dyt are the outputs (presumably each named after the derivative it holds -- confirm in the implementation) */
28 | void get_derivatives(const color_image_t *im1, const color_image_t *im2, const convolution_t *deriv, color_image_t *dx, color_image_t *dy, color_image_t *dt, color_image_t *dxx, color_image_t *dxy, color_image_t *dyy, color_image_t *dxt, color_image_t *dyt);
29 | 
30 | /* compute the smoothness weight from the norm of the image gradient, as exp(-coef*grad(luminance)); returns an image_t* (NOTE(review): ownership of the returned image is not visible from this header -- confirm who must free it) */
31 | image_t* compute_smoothness_weight(color_image_t *im, float coef, const convolution_t *deriv);
32 | 
33 | /* compute the smoothness term; dst_horiz and dst_vert are the only non-const arguments and receive the result */
34 | void compute_smoothness(image_t *dst_horiz, image_t *dst_vert, const image_t *uu, const image_t *vv, const image_t *smooth_weight, const convolution_t *deriv_flow, const float quarter_alpha);
35 | 
36 | /* subtract the laplacian (smoothness term) from the right-hand term */
37 | void sub_laplacian(image_t *dst, const image_t *src, const image_t *weight_horiz, const image_t *weight_vert);
38 | 
39 | /* compute the data term and the matching term
40 |    a11, a12 and a22 represent the 2x2 diagonal matrix; b1 and b2 represent the right-hand side
41 |    the other (color) images are inputs */
42 | void compute_data_and_match(image_t *a11, image_t *a12, image_t *a22, image_t *b1, image_t *b2, image_t *mask, image_t *wx, image_t *wy, image_t *du, image_t *dv, image_t *uu, image_t *vv, color_image_t *Ix, color_image_t *Iy, color_image_t *Iz, color_image_t *Ixx, color_image_t *Ixy, color_image_t *Iyy, color_image_t *Ixz, color_image_t *Iyz, image_t *desc_weight, image_t *desc_flow_x, image_t *desc_flow_y, const float half_delta_over3, const float half_beta, const float half_gamma_over3);
43 | 
44 | /* compute a score for the matches based on the autocorrelation matrix and the similarity in color/gradient; desc_w is the only non-const argument. NOTE(review): optical_flow() calls this with (deriv_flow, deriv) as the last two arguments, so its deriv_flow lands in deriv_autocor -- confirm that this order is intended */
45 | void compute_desc_weight(const color_image_t* im1, const color_image_t* im2, const image_t* desc_x, const image_t *desc_y, image_t *desc_w, const convolution_t* deriv_autocor, const convolution_t *deriv_flow);
46 | 
47 | /* resize the descriptors to the new size using a weighted mean; no size argument is taken, and optical_flow() resizes the dst_* images to the target size before calling this */
48 | void descflow_resize(image_t *dst_flow_x, image_t *dst_flow_y, image_t *dst_weight, const image_t *src_flow_x, const image_t *src_flow_y, const image_t *src_weight);
49 | 
50 | /* resize the descriptors to the new size using a nearest-neighbor method, keeping in the end the descriptor with the higher weight */
51 | void descflow_resize_nn(image_t *dst_flow_x, image_t *dst_flow_y, image_t *dst_weight, const image_t *src_flow_x, const image_t *src_flow_y, const image_t *src_weight);
52 | 
53 | 
54 | 
55 | #endif
56 | 


--------------------------------------------------------------------------------
/deep_flow2/solver.h:
--------------------------------------------------------------------------------
 1 | /*
 2 | Copyright (C) 2013 Philippe Weinzaepfel
 3 | 
 4 | This program is free software: you can redistribute it and/or modify
 5 | it under the terms of the GNU General Public License as published by
 6 | the Free Software Foundation, either version 3 of the License, or
 7 | (at your option) any later version.
 8 | 
 9 | This program is distributed in the hope that it will be useful,
10 | but WITHOUT ANY WARRANTY; without even the implied warranty of
11 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
12 | GNU General Public License for more details.
13 | 
14 | You should have received a copy of the GNU General Public License
15 | along with this program.  If not, see <http://www.gnu.org/licenses/>.
16 | */
17 | #include <stdio.h>
18 | #include <stdlib.h>
19 | 
20 | #include "image.h"
21 | 
22 | // Perform `iterations` iterations of the sor_coupled algorithm, with parameter `omega`, for a system of the form described in opticalflow.c. NOTE(review): unlike opticalflow.h and opticalflow_aux.h, this header has no include guard.
23 | void sor_coupled(image_t *du, image_t *dv, image_t *a11, image_t *a12, image_t *a22, const image_t *b1, const image_t *b2, const image_t *dpsis_horiz, const image_t *dpsis_vert, const int iterations, const float omega);
24 | 


--------------------------------------------------------------------------------
/deep_matching/.gitignore:
--------------------------------------------------------------------------------
  1 | ## General
  2 | 
  3 | # Compiled Object files
  4 | *.slo
  5 | *.lo
  6 | *.o
  7 | *.cuo
  8 | 
  9 | # Compiled Dynamic libraries
 10 | *.so
 11 | *.dylib
 12 | 
 13 | # Compiled Static libraries
 14 | *.lai
 15 | *.la
 16 | *.a
 17 | 
 18 | # Compiled protocol buffers
 19 | *.pb.h
 20 | *.pb.cc
 21 | *_pb2.py
 22 | 
 23 | # Compiled python
 24 | *.pyc
 25 | 
 26 | # Compiled MATLAB
 27 | *.mex*
 28 | 
 29 | # IPython notebook checkpoints
 30 | .ipynb_checkpoints
 31 | 
 32 | # Editor temporaries
 33 | *.swp
 34 | *~
 35 | 
 36 | # Sublime Text settings
 37 | *.sublime-workspace
 38 | *.sublime-project
 39 | 
 40 | # Eclipse Project settings
 41 | *.*project
 42 | .settings
 43 | 
 44 | # QtCreator files
 45 | *.user
 46 | 
 47 | # PyCharm files
 48 | .idea
 49 | 
 50 | # OSX dir files
 51 | .DS_Store
 52 | 
 53 | ## Caffe
 54 | 
 55 | # User's build configuration
 56 | Makefile.config
 57 | 
 58 | # Data and models are either
 59 | # 1. reference, and not casually committed
 60 | # 2. custom, and live on their own unless they're deliberately contributed
 61 | data/*
 62 | models/*
 63 | *.caffemodel
 64 | *.caffemodel.h5
 65 | *.solverstate
 66 | *.solverstate.h5
 67 | *.binaryproto
 68 | *leveldb
 69 | *lmdb
 70 | 
 71 | # build, distribute, and bins (+ python proto bindings)
 72 | build
 73 | .build_debug/*
 74 | .build_release/*
 75 | distribute/*
 76 | *.testbin
 77 | *.bin
 78 | python/caffe/proto/
 79 | cmake_build
 80 | .cmake_build
 81 | 
 82 | # Generated documentation
 83 | docs/_site
 84 | docs/gathered
 85 | _site
 86 | doxygen
 87 | docs/dev
 88 | 
 89 | # LevelDB files
 90 | *.sst
 91 | *.ldb
 92 | LOCK
 93 | LOG*
 94 | CURRENT
 95 | MANIFEST-*
 96 | 
 97 | # images
 98 | *.jpg
 99 | *.png
100 | *.flo
101 | 


--------------------------------------------------------------------------------
/deep_matching/Makefile:
--------------------------------------------------------------------------------
 1 | # Paths to the caffe checkout, to its built libraries (libcaffe.so) and to its generated sources
 2 | CAFFEDIR=caffe
 3 | CAFFELIB=$(CAFFEDIR)/build/lib
 4 | CAFFE_BUIL_SRC=$(CAFFEDIR)/.build_release/src
 5 | 
 6 | # Path to google tools (protobuf, glog); commented-out alternative: GOOGLETOOLS=/usr
 7 | GOOGLETOOLS=/home/ddk/softwares/caffe/zhouxia.env
 8 | # Path to CUDA
 9 | CUDA=/usr/local/cuda
10 | # Path to MKL (or BLAS)
11 | MKL=/home/ddk/softwares/caffe/mkl.install/intel/mkl
12 | # Header search paths (the caffe include directory is listed twice; the duplicate is harmless)
13 | INCLUDES=-I/usr/include/python2.7 \
14 | -I$(CAFFEDIR)/include \
15 | -I$(CUDA)/include \
16 | -I$(GOOGLETOOLS)/include \
17 | -I$(MKL)/include \
18 | -I$(CAFFEDIR)/include \
19 | -I$(CAFFE_BUIL_SRC)
20 | 
21 | # GPU architectures passed to nvcc (set here; the line "include gpudm/Makefile.config" is disabled)
22 | CUDA_ARCH := \
23 |     -gencode arch=compute_35,code=sm_35 \
24 |     -gencode arch=compute_50,code=sm_50
25 | # Both lists hold every .hpp found under this directory; the rules map EXTRA_LAYERS to .o and .cuo objects
26 | HEADERS := $(shell find . -name '*.hpp')
27 | EXTRA_LAYERS := $(shell find . -name '*.hpp')
28 | # Flags given to both g++ and nvcc
29 | OPTFLAGS=-g -O2
30 | 
31 | all:  _gpudm.so
32 | # Link the Python extension, then check it by importing gpudm with the library paths set
33 | _gpudm.so: gpudm_wrap.o $(EXTRA_LAYERS:.hpp=.o) $(EXTRA_LAYERS:.hpp=.cuo)
34 | 	g++ $(OPTFLAGS) -fPIC $(INCLUDES) -L$(CAFFELIB) $^ -shared -o $@ -lcaffe -L$(CUDA)/lib64 -lcusparse
35 | 	CAFFEDIR=$(CAFFEDIR); GOOGLETOOLS=$(GOOGLETOOLS); CUDA=$(CUDA); MKL=$(MKL); LD_LIBRARY_PATH="$(CAFFELIB):$(CUDA)/lib64:$(MKL)/lib/intel64:/usr/lib64/openmpi/lib/:$(GOOGLETOOLS)/lib:$(LD_LIBRARY_PATH)" python -c "import gpudm"
36 | # Compile each .cu file (with its .hpp) into a position-independent .cuo object
37 | %.cuo: %.cu %.hpp 
38 | 	$(CUDA)/bin/nvcc $(CUDA_ARCH) -Xcompiler -fPIC $(INCLUDES) $(OPTFLAGS) -c $< -o $@
39 | # Regenerate the SWIG wrapper whenever the interface file or any header changes
40 | gpudm_wrap.cxx: gpudm.swig $(HEADERS)
41 | 	swig -python -c++ $(INCLUDES) gpudm.swig
42 | 
43 | gpudm_wrap.o: gpudm_wrap.cxx 
44 | 	g++ $(OPTFLAGS) -c gpudm_wrap.cxx -fPIC $(INCLUDES) -o gpudm_wrap.o
45 | # Compile each .cpp file (with its .hpp) into a position-independent .o object
46 | %.o: %.cpp %.hpp 
47 | 	g++ $(OPTFLAGS) -c $< -fPIC $(INCLUDES) -L$(CAFFEDIR) -o $@
48 | # Remove build products; the SWIG-generated gpudm.py and gpudm_wrap.cxx are kept
49 | clean:
50 | 	rm -f *.pyc *~ _gpudm.so gpudm_wrap.o $(EXTRA_LAYERS:.hpp=.o) $(EXTRA_LAYERS:.hpp=.cuo)
51 | # Same as clean, and also remove the SWIG-generated files
52 | cleanswig: clean
53 | 	rm -f gpudm.py gpudm_wrap.cxx gpudm_wrap.o
54 | 
55 | 
56 | 
57 | 
58 | 
59 | 
60 | 
61 | 
62 | 
63 | 
64 | 
65 | 
66 | 
67 | 
68 | 
69 | 
70 | 
71 | 
72 | 
73 | 
74 | 
75 | 
76 | 
77 | 
78 | 
79 | 


--------------------------------------------------------------------------------
/deep_matching/Makefile.bak:
--------------------------------------------------------------------------------
 1 | # Paths to the caffe checkout, to its built libraries (libcaffe.so) and to its generated sources
 2 | CAFFEDIR=caffe
 3 | CAFFELIB=$(CAFFEDIR)/build/lib
 4 | CAFFE_BUIL_SRC=$(CAFFEDIR)/.build_release/src
 5 | 
 6 | # Path to google tools (protobuf, glog)
 7 | GOOGLETOOLS=google_tools
 8 | 
 9 | # Path to CUDA
10 | CUDA=/scratch/hydrus/cuda-6.5
11 | 
12 | # Path to MKL (or BLAS)
13 | MKL=/home/clear/lear/intel/mkl
14 | # Header search paths (the caffe include directory is listed twice; the duplicate is harmless)
15 | INCLUDES=-I/usr/include/python2.7 \
16 | -I$(CAFFEDIR)/include \
17 | -I$(CUDA)/include \
18 | -I$(GOOGLETOOLS)/include/ \
19 | -I$(MKL)/include \
20 | -I$(CAFFEDIR)/include \
21 | -I$(CAFFE_BUIL_SRC)
22 | 
23 | # GPU architectures passed to nvcc (set here; the line "include gpudm/Makefile.config" is disabled)
24 | CUDA_ARCH := \
25 |     -gencode arch=compute_35,code=sm_35 \
26 |     -gencode arch=compute_50,code=sm_50
27 | # Both lists hold every .hpp found under this directory; the rules map EXTRA_LAYERS to .o and .cuo objects
28 | HEADERS := $(shell find . -name '*.hpp')
29 | EXTRA_LAYERS := $(shell find . -name '*.hpp')
30 | # Flags given to both g++ and nvcc
31 | OPTFLAGS=-g -O2
32 | 
33 | all:  _gpudm.so
34 | # Link the Python extension, then check it by importing gpudm with the library paths set
35 | _gpudm.so: gpudm_wrap.o $(EXTRA_LAYERS:.hpp=.o) $(EXTRA_LAYERS:.hpp=.cuo)
36 | 	g++ $(OPTFLAGS) -fPIC $(INCLUDES) -L$(CAFFELIB) $^ -shared -o $@ -lcaffe -L$(CUDA)/lib64 -lcusparse
37 | 	CAFFEDIR=$(CAFFEDIR); GOOGLETOOLS=$(GOOGLETOOLS); CUDA=$(CUDA); MKL=$(MKL); LD_LIBRARY_PATH="$(CAFFELIB):$(CUDA)/lib64:$(MKL)/lib/intel64:/usr/lib64/openmpi/lib/:$(GOOGLETOOLS)/lib:$(LD_LIBRARY_PATH)" python -c "import gpudm"
38 | # Compile each .cu file (with its .hpp) into a position-independent .cuo object
39 | %.cuo: %.cu %.hpp 
40 | 	$(CUDA)/bin/nvcc $(CUDA_ARCH) -Xcompiler -fPIC $(INCLUDES) $(OPTFLAGS) -c $< -o $@
41 | # Regenerate the SWIG wrapper whenever the interface file or any header changes
42 | gpudm_wrap.cxx: gpudm.swig $(HEADERS)
43 | 	swig -python -c++ $(INCLUDES) gpudm.swig
44 | 
45 | gpudm_wrap.o: gpudm_wrap.cxx 
46 | 	g++ $(OPTFLAGS) -c gpudm_wrap.cxx -fPIC $(INCLUDES) -o gpudm_wrap.o
47 | # Compile each .cpp file (with its .hpp) into a position-independent .o object
48 | %.o: %.cpp %.hpp 
49 | 	g++ $(OPTFLAGS) -c $< -fPIC $(INCLUDES) -L$(CAFFEDIR) -o $@
50 | # Remove build products; the SWIG-generated gpudm.py and gpudm_wrap.cxx are kept
51 | clean:
52 | 	rm -f *.pyc *~ _gpudm.so gpudm_wrap.o $(EXTRA_LAYERS:.hpp=.o) $(EXTRA_LAYERS:.hpp=.cuo)
53 | # Same as clean, and also remove the SWIG-generated files
54 | cleanswig: clean
55 | 	rm -f gpudm.py gpudm_wrap.cxx gpudm_wrap.o
56 | 
57 | 
58 | 
59 | 
60 | 
61 | 
62 | 
63 | 
64 | 
65 | 
66 | 
67 | 
68 | 
69 | 
70 | 
71 | 
72 | 
73 | 
74 | 
75 | 
76 | 
77 | 
78 | 
79 | 
80 | 
81 | 


--------------------------------------------------------------------------------
/deep_matching/README.txt:
--------------------------------------------------------------------------------
  1 | Implementation of the Deep Matching algorithm on GPU. 
  2 | See paper "DeepMatching: Hierarchical Deformable Dense Matching", 
  3 | at http://lear.inrialpes.fr/src/deepmatching/ by Jerome Revaud, 
  4 | Philippe Weinzaepfel, Zaid Harchaoui and Cordelia Schmid.
  5 | Main code by Jerome Revaud, INRIA. The code is only for scientific 
  6 | or personal use. Please contact me/INRIA for commercial use.
  7 | Email: jerome.revaud@inria.fr
  8 | 
  9 | Copyright (C) 2015 Jerome Revaud
 10 | 
 11 | Version 1.0
 12 | 
 13 | License:
 14 | 
 15 | This program is free software: you can redistribute it and/or modify
 16 | it under the terms of the GNU General Public License as published by
 17 | the Free Software Foundation, either version 3 of the License, or
 18 | (at your option) any later version.
 19 | 
 20 | This program is distributed in the hope that it will be useful,
 21 | but WITHOUT ANY WARRANTY; without even the implied warranty of
 22 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 23 | GNU General Public License for more details.
 24 | 
 25 | You should have received a copy of the GNU General Public License
 26 | along with this program.  If not, see <http://www.gnu.org/licenses/>
 27 | 
 28 | 
 29 | Installation:
 30 | 
 31 | 1) Install 'caffe'
 32 |   a) extract `caffe.zip` to get `caffe` directory
 33 |   b) move `caffe` somewhere else, e.g. `mv caffe/ ../`
 34 |   c) cd `/path/to/caffe` and check the `Makefile` and `Makefile.config` to make sure that the environment settings are right.
 35 |   d) make -j8
 36 |     I use the `Makefile` and `Makefile.config` of `faster-rcnn` instead of the original ones because of my environment
 37 |     (
 38 |       note that
 39 |       the `Makefile` and `Makefile.config` inside caffe.zip have already been replaced with the `faster-rcnn` ones
 40 |     )
 41 | 
 42 | 2) Add a softlink named 'caffe' in the current directory that points 
 43 |    toward the caffe directory (just to make things simpler):
 44 |    ln -s /path/to/caffe caffe, e.g. `ln -s ../caffe caffe`
 45 | 
 46 | 3) Edit Makefile
 47 |    Set the different paths for caffe and other dependencies
 48 |    set `GOOGLETOOLS`, `CUDA`, `MKL` path, 
 49 | 
 50 | 4) Compile
 51 |    make all
 52 |    
 53 |    (IMPORTANT NOTE: 
 54 |     if you compile the SWIG file, it is normal that you see lots of errors. 
 55 |     However, as long as it generates 'gpudm_wrap.cxx', you can just relaunch 
 56 |     'make' and the rest of the compilation should go smoothly. )
 57 | 
 58 | 5) Test
 59 |   Set your environment variables:
 60 |     LD_LIBRARY_PATH should point to your libcaffe directory, to mkl, etc. 
 61 |     (basically to all the paths you edited in the Makefile)
 62 |     >>>
 63 |       vim ~/.bashrc
 64 |       add "export LD_LIBRARY_PATH=/home/ddk/dongdk/deep-matching/deep_matching/caffe/.build_release/lib:/usr/local/cuda-7.0/lib64/:$LD_LIBRARY_PATH" and save
 65 |       source ~/.bashrc
 66 | 
 67 |   
 68 |   Try executing the following command:
 69 |   >>> python deep_matching_gpu.py liberty1.png liberty2.png -v -viz corres
 70 |     or 
 71 |   >>> python deep_matching_gpu.py liberty1.png liberty2.png -GPU 0 -v -viz corres
 72 |   >>> python deep_matching_gpu.py liberty1.png liberty2.png -GPU 0 -v -viz flow
 73 |   >>> python deep_matching_gpu.py climb1.png climb2.png -GPU 0 -v -viz following
 74 | 
 75 |     If `libcaffe.so`, `libcusparse.so.7.0`, ... are reported missing, all you need to do is add their directories to your environment variables
 76 |       e.g.
 77 |         `libcaffe.so` is located in `caffe/.build_release/lib`
 78 |         `libcusparse.so.7.0` is located in `/usr/local/cuda-7.0/lib64` (use `locate libcusparse.so.7.0` command to find where it is)
 79 |       and then set their paths in `~/.bashrc` file and `source ~/.bashrc`
 80 |         e.g.
 81 |           `export LD_LIBRARY_PATH=/home/ddk/dongdk/deep-matching/web_gpudm_1.0/caffe/.build_release/lib:/usr/local/cuda-7.0/lib64/:$LD_LIBRARY_PATH`
 82 |   
 83 |   You should see a rainbow visualization of correspondences. 
 84 |   When you continue (type 'c'+enter), you should get the following output: 
 85 |     36 36 36 26 3.77558 13
 86 |     36 44 36 34 3.65536 24
 87 |     [...]
 88 |     28 4 22 6 3.59854 94
 89 |     28 20 28 10 3.75238 90
 90 |     28 28 28 18 3.77126 83
 91 | 
 92 | 
 93 | Example usages and explanations:
 94 |   
 95 |   To get detailed information on parameters:
 96 |     python deep_matching_gpu.py -h
 97 |     python deep_matching_gpu.py --help
 98 |   >>>
 99 |     usage: deep_matching_gpu.py [-h] [-GPU [{-1,0,1,2,3,4}]] [-ds D] [-sp]
100 |                                 [-ngh RAD] [-pow G] [--crop W H] [-out OUTPUT]
101 |                                 [-v]
102 |                                 [-viz {net,mem,pxl_desc,patch_corr,rmap,corres,flow}]
103 |                                 img1 img2
104 | 
105 |     positional arguments:
106 |       img1                  Path to the first image
107 |       img2                  Path to the second image
108 | 
109 |     optional arguments:
110 |       -h, --help            show this help message and exit
111 |       -GPU [{-1,0,1,2,3,4}]
112 |                             GPU device number (default=0), or -1 for CPU (default)
113 |       -ds D, --downscale D  Prior downscale of input images by 2^D
114 |       -sp, --use_sparse     Use CUSPARSE for ligther convolutions (GPU only)
115 |       -ngh RAD, --ngh_rad RAD
116 |                             Restrict matching to local neighborhood of RAD pixels
117 |       -pow G, --powerlaw G  Non-linear power-law rectification (default = 1.4)
118 |       --crop W H            [Pre-processing] crop the images to a given shape
119 |       -out OUTPUT, --output OUTPUT
120 |                             Output the matching to a text file
121 |       -v, --verbose         Increase verbosity
122 |       -viz {net,mem,pxl_desc,patch_corr,rmap,corres,flow}
123 |                             Vizualisation options  
124 | 
125 |   
126 |   Typical command to match Sintel images:
127 |     # Requires 4.8 GB of memory on your GPU
128 |     >>> python deep_matching_gpu.py .../SINTEL/training/final/temple_3/frame_0041.png \
129 |                                 .../SINTEL/training/final/temple_3/frame_0042.png \
130 |                    -GPU -v --downscale 1 --ngh_rad 256 --use_sparse -viz mem -viz flow 
131 | 
132 |     >>> python deep_matching_gpu.py climb1.png climb2.png -GPU -v --downscale 1 --ngh_rad 256 --use_sparse -viz mem -viz flow
133 | 
134 |     >>> python deep_matching_gpu.py mude1.jpg mude2.jpg -GPU -v --downscale 1 --ngh_rad 256 --use_sparse -viz mem -viz flow 
135 | 
136 |     >>> python deep_matching_gpu.py mude1.jpg mude2.jpg -GPU -v --downscale 1 --ngh_rad 256 --use_sparse -out mude1.txt 
137 | 
138 |         
139 |     # Note: if you don't use CUsparse, (no --use_sparse), it requires 5.3 GB.
140 |   
141 |   Useful visualization options: 
142 |     #   e.g. use "-viz rmap" to examine response_maps
143 |     #   (Then click on the top image to select a patch)
144 |     python deep_matching_gpu.py liberty1.png liberty2.png -v --downscale 0 -viz net -viz mem -viz rmap 
145 | 
146 | 
147 | For details about the options, please refer to the help, the papers or the code.
148 | 
149 | 
150 | Important tip:
151 |   If the program stops with an error in memset/memcpy, then it means that your GPU 
152 |   doesn't have enough memory. In this case, you should consider:
153 |     * decreasing the neighborhood radius with "--ngh_rad"  
154 |     * incrementing the "--downscale" parameter (i.e. to downscale images before matching). 
155 |     * You can also investigate the memory usage with '-viz mem', but keep in mind that
156 |       it under-estimates the actual memory usage.
157 |     * if your image pair is very large, please use `-ds` / `--downscale`; otherwise you will see 
158 |         `F0316 10:10:52.342209 24363 blob.cpp:33] Check failed: shape[i] <= 2147483647 / count_ (513 vs. 242) blob size exceeds INT_MAX*** Check failure stack trace: ***`
159 |       and, for now, this is not fixed.
160 | 
161 | 
162 | 
163 | Versions of the different modules:
164 |   * python 2.7
165 |   * fedora 21
166 |   * gcc/g++ 4.9.2
167 |   * swig 3.0.7 
168 |   * cuda 6.5
169 |   * caffe version is from November 12th (included in zip)
170 |   * protobuf 2.5.0
171 |   * glog 0.3.3
172 | 
173 | 
174 | 
175 | 
176 | 
177 | 
178 | 
179 | 
180 | 
181 | 
182 | 
183 | 
184 | 
185 | 
186 | 
187 | 
188 | 
189 | 
190 | 
191 | 
192 | 
193 | 
194 | 
195 | 
196 | 
197 | 
198 | 
199 | 
200 | 


--------------------------------------------------------------------------------
/deep_matching/caffe:
--------------------------------------------------------------------------------
1 | ../caffe


--------------------------------------------------------------------------------
/deep_matching/caffe.zip:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zimenglan-sysu-512/deep-flow/fd127e9a2ccd2e5b73dcef39a3438ee77b2476a4/deep_matching/caffe.zip


--------------------------------------------------------------------------------
/deep_matching/extra_layers.hpp:
--------------------------------------------------------------------------------
  1 | /*
  2 | Copyright (C) 2015 Jerome Revaud
  3 | 
  4 | This program is free software: you can redistribute it and/or modify
  5 | it under the terms of the GNU General Public License as published by
  6 | the Free Software Foundation, either version 3 of the License, or
  7 | (at your option) any later version.
  8 | 
  9 | This program is distributed in the hope that it will be useful,
 10 | but WITHOUT ANY WARRANTY; without even the implied warranty of
 11 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 12 | GNU General Public License for more details.
 13 | 
 14 | You should have received a copy of the GNU General Public License
 15 | along with this program.  If not, see <http://www.gnu.org/licenses/>
 16 | */
 17 | #ifndef __EXTA_LAYERS_H__
 18 | #define __EXTA_LAYERS_H__
 19 | 
 20 | #include "caffe/layer.hpp"
 21 | #include "caffe/vision_layers.hpp"
 22 | #include "caffe/proto/caffe.pb.h"
 23 | #include <stdio.h>
 24 | 
 25 | #include "cusparse.h"
 26 | #define CUSPARSE_CHECK(condition) CHECK_EQ((condition), CUSPARSE_STATUS_SUCCESS)
 27 | 
 28 | #define recast reinterpret_cast
 29 | 
 30 | namespace caffe {
 31 | 
 32 |   ////////////////////////////////////////////////////////////
 33 |   //        CONVOLUTION WITH CSR-SPARSE WEIGHTS            //
 34 |   //////////////////////////////////////////////////////////
 35 | 
 36 |   class CusparseHandle { // keeps one cuSPARSE handle inside a static instance; the handle is created on first request
 37 |    public:
 38 |     static cusparseHandle_t cusparse_handle() { // returns the shared handle, calling cusparseCreate() the first time
 39 |       if( instance_.cusparse_handle_ == NULL ) { // not yet initialized
 40 |         CUSPARSE_CHECK(cusparseCreate(&instance_.cusparse_handle_));
 41 |       }
 42 |       return instance_.cusparse_handle_; 
 43 |     }
 44 |     
 45 |    private:
 46 |     static CusparseHandle instance_; // declaration only; the definition is not in this header
 47 |     cusparseHandle_t cusparse_handle_; // NULL until cusparse_handle() is first called
 48 |     
 49 |     CusparseHandle() : // private: the static instance_ is the only object
 50 |       cusparse_handle_(NULL) {}
 51 |     ~CusparseHandle() { // destroys the handle only if one was created
 52 |       if (cusparse_handle_)
 53 |         CUSPARSE_CHECK(cusparseDestroy(cusparse_handle_));
 54 |     }
 55 |   };
 56 | 
 57 |   /* Convolution layer but with sparse filters.
 58 |      This layer computes:   Out = Filters x im2col( In )
 59 |      Only Forward_gpu has a real implementation; Forward_cpu and both Backward_* are NOT_IMPLEMENTED.
 60 |      In and Out are dense matrices (NCHW fully-packed).
 61 |      Filters are given as a CSR matrix instead of as a dense matrix.
 62 |   */
 63 |   template <typename Dtype>
 64 |   class CSR_SparseConvolutionLayer : public Layer<Dtype> {
 65 |    public:
 66 |     explicit CSR_SparseConvolutionLayer(const LayerParameter& param )
 67 |         : Layer<Dtype>(param) {}
 68 |     
 69 |     virtual void LayerSetUp(const vector<Blob<Dtype>*>& bottom, const vector<Blob<Dtype>*>& top);
 70 |     virtual void Reshape(const vector<Blob<Dtype>*>& bottom, const vector<Blob<Dtype>*>& top);
 71 |     
 72 |     // Blob<float> is cast to Blob<int>; data is optional and defaults to NULL
 73 |     void SetSparsityPattern( const int nnz, 
 74 |         const Blob<float>* row_ptr, const Blob<float>* col_ind, const Blob<float>* data = NULL );
 75 |     
 76 |    protected:
 77 |     virtual void Forward_cpu(const vector<Blob<Dtype>*>& bottom, const vector<Blob<Dtype>*>& top)
 78 |       {NOT_IMPLEMENTED;}
 79 |     virtual void Forward_gpu(const vector<Blob<Dtype>*>& bottom, const vector<Blob<Dtype>*>& top);
 80 |     virtual void Backward_cpu(const vector<Blob<Dtype>*>& top, const vector<bool>& propagate_down, const vector<Blob<Dtype>*>& bottom)
 81 |       {NOT_IMPLEMENTED;}
 82 |     virtual void Backward_gpu(const vector<Blob<Dtype>*>& top, const vector<bool>& propagate_down, const vector<Blob<Dtype>*>& bottom)
 83 |       {NOT_IMPLEMENTED;}
 84 |     
 85 |     int KSIZE_, STRIDE_, PAD_, NUM_OUTPUT_; // not set by the constructor; presumably filled in LayerSetUp -- confirm
 86 |     int NUM_, CHANNELS_, HEIGHT_, WIDTH_;
 87 |     bool biasterm_;
 88 |     int M_, N_, K_; // matrix multiplication sizes
 89 |     Blob<Dtype> col_buffer_;
 90 |     
 91 |     int nnz_; // number of non-zero elements
 92 |     shared_ptr<SyncedMemory> weight_rowptr_, weight_colind_; // presumably the CSR row-pointer and column-index arrays -- confirm against SetSparsityPattern
 93 |     
 94 |     void load_csr_gpu( const int** weight_rowptr, const int** weight_colind, 
 95 |                        const Dtype** weight_data, Dtype** weight_diff );
 96 |     
 97 |     bool do_im2col_;
 98 |     shared_ptr<SyncedMemory> bias_multiplier_, transpose_res_;
 99 |   };
100 | 
101 | 
102 |   ////////////////////////////////////////////////////////////
103 |   //               BORDER RECTIFICATION                    //
104 |   //////////////////////////////////////////////////////////
105 |   
106 |   template <typename Dtype>
107 |   class BorderRectifyLayer : public Layer<Dtype> { // forward-only layer: both Backward_* are NOT_IMPLEMENTED
108 |    public:
109 |     explicit BorderRectifyLayer(const LayerParameter& param, int ksize) // ksize is stored in the const member KSIZE_
110 |         : Layer<Dtype>(param), KSIZE_(ksize) {}
111 |     
112 |     virtual void LayerSetUp(const vector<Blob<Dtype>*>& bottom, const vector<Blob<Dtype>*>& top);
113 |     virtual void Reshape(const vector<Blob<Dtype>*>& bottom, const vector<Blob<Dtype>*>& top);
114 |     
115 |    protected:
116 |     virtual void Forward_cpu(const vector<Blob<Dtype>*>& bottom, const vector<Blob<Dtype>*>& top);
117 |     virtual void Forward_gpu(const vector<Blob<Dtype>*>& bottom, const vector<Blob<Dtype>*>& top);
118 |     virtual void Backward_cpu(const vector<Blob<Dtype>*>& top, const vector<bool>& propagate_down, const vector<Blob<Dtype>*>& bottom)
119 |       {NOT_IMPLEMENTED;}
120 |     virtual void Backward_gpu(const vector<Blob<Dtype>*>& top, const vector<bool>& propagate_down, const vector<Blob<Dtype>*>& bottom)
121 |       {NOT_IMPLEMENTED;}
122 |     
123 |     const int KSIZE_; // fixed at construction from the ksize argument
124 |   };
125 | 
126 | 
127 |   ////////////////////////////////////////////////////////////
128 |   //                   RECTIFIED SIGMOID                   //
129 |   //////////////////////////////////////////////////////////
130 | 
131 |   template <typename Dtype>
132 |   class RectifiedSigmoidLayer : public NeuronLayer<Dtype> { // forward-only layer: both Backward_* are NOT_IMPLEMENTED
133 |    public:
134 |     explicit RectifiedSigmoidLayer(const LayerParameter& param) // no state beyond what NeuronLayer takes from param
135 |         : NeuronLayer<Dtype>(param) {}
136 |     
137 |    protected:
138 |     virtual void Forward_cpu(const vector<Blob<Dtype>*>& bottom, const vector<Blob<Dtype>*>& top);
139 |     virtual void Forward_gpu(const vector<Blob<Dtype>*>& bottom, const vector<Blob<Dtype>*>& top);
140 |     virtual void Backward_cpu(const vector<Blob<Dtype>*>& top, const vector<bool>& propagate_down, const vector<Blob<Dtype>*>& bottom)
141 |       {NOT_IMPLEMENTED;}
142 |     virtual void Backward_gpu(const vector<Blob<Dtype>*>& top, const vector<bool>& propagate_down, const vector<Blob<Dtype>*>& bottom)
143 |       {NOT_IMPLEMENTED;}
144 |   };
145 | 
146 | 
147 |   ////////////////////////////////////////////////////////////
148 |   //                PIXEL NORMALIZATION                    //
149 |   //////////////////////////////////////////////////////////
150 | 
  // Forward-only NeuronLayer parameterised by a single scalar (alpha_).
  // Both backward passes are stubbed with NOT_IMPLEMENTED; the forward passes
  // are defined outside this header.
  // NOTE(review): presumably normalises each pixel's descriptor using alpha_
  // -- the exact formula must be checked in the implementation file.
  template <typename Dtype>
  class PixelNormLayer : public NeuronLayer<Dtype> {
   public:
    // param is forwarded unchanged to NeuronLayer<Dtype>; norm is stored in alpha_.
    explicit PixelNormLayer(const LayerParameter& param, Dtype norm)
        : NeuronLayer<Dtype>(param), alpha_(norm) {}
    
   protected:
    virtual void Forward_cpu(const vector<Blob<Dtype>*>& bottom, const vector<Blob<Dtype>*>& top);
    virtual void Forward_gpu(const vector<Blob<Dtype>*>& bottom, const vector<Blob<Dtype>*>& top);
    // No gradient is provided for this layer (inference only).
    virtual void Backward_cpu(const vector<Blob<Dtype>*>& top, const vector<bool>& propagate_down, const vector<Blob<Dtype>*>& bottom)
      {NOT_IMPLEMENTED;}
    virtual void Backward_gpu(const vector<Blob<Dtype>*>& top, const vector<bool>& propagate_down, const vector<Blob<Dtype>*>& bottom)
      {NOT_IMPLEMENTED;}
    
    // Value of the constructor's norm argument; fixed for the layer's lifetime.
    const Dtype alpha_;
  };
167 | 
168 | 
169 |   ////////////////////////////////////////////////////////////
170 |   //                  PATCH CONVOLUTION                    //
171 |   //////////////////////////////////////////////////////////
172 | 
  // Forward-only layer (both backward passes are stubbed with NOT_IMPLEMENTED).
  // Only the declaration is visible here; per the member comments below it
  // turns a first image into patches and correlates them with a second image.
  template <typename Dtype>
  class PatchConvolutionLayer : public Layer<Dtype> {
   public:
    // ksize, pad, ngh_rad and normalize_borders are stored in the members of
    // the same name; STRIDE_ is always 1.
    // NOTE(review): the initializer list order differs from the declaration
    // order (normalize_borders_ is declared first). Members are initialised in
    // declaration order; this is harmless here because the initialisers are
    // independent, but compilers may warn (-Wreorder).
    // The remaining int members (num_, channels_, ..., CROP_) are not
    // initialised by this constructor.
    explicit PatchConvolutionLayer(const LayerParameter& param, int ksize, int pad, int ngh_rad, char normalize_borders)
        : Layer<Dtype>(param), KSIZE_(ksize), PAD_(pad), STRIDE_(1), ngh_rad_(ngh_rad), normalize_borders_(normalize_borders) {}
    
    virtual void LayerSetUp(const vector<Blob<Dtype>*>& bottom, const vector<Blob<Dtype>*>& top);
    virtual void Reshape(const vector<Blob<Dtype>*>& bottom, const vector<Blob<Dtype>*>& top);
    
   protected:
    virtual void Forward_cpu(const vector<Blob<Dtype>*>& bottom, const vector<Blob<Dtype>*>& top);
    virtual void Forward_gpu(const vector<Blob<Dtype>*>& bottom, const vector<Blob<Dtype>*>& top);
    // No gradient is provided for this layer (inference only).
    virtual void Backward_cpu(const vector<Blob<Dtype>*>& top, const vector<bool>& propagate_down, const vector<Blob<Dtype>*>& bottom)
      {NOT_IMPLEMENTED;}
    virtual void Backward_gpu(const vector<Blob<Dtype>*>& top, const vector<bool>& propagate_down, const vector<Blob<Dtype>*>& bottom)
      {NOT_IMPLEMENTED;}
    
    const char normalize_borders_;  // if 'd': general case (dynamic) border normalization
                                    // if 's': static border normalization => faster 
                                    //         (DeepMatching-like with normalized pixel descriptors)
    // NOTE(review): presumably the dimensions of the bottom blob, filled in by
    // LayerSetUp/Reshape -- confirm in the implementation file.
    int num_, channels_, height_, width_;
    int channels_out_;
    const int KSIZE_, STRIDE_;  
    int PAD_; // if PAD_ is negative, then it is applied to the first image (subsampling center patches only)
    int K_;
    const int ngh_rad_; // 0 if no offsets, else 2*nghrad+1
    int virtual_pad_; // PAD_ + virtual_pad_ = theoretical_pad
    int CROP_; // crop of the first image in case of negative padding
    
    Blob<Dtype> patches_;     // first image transformed into consecutive patches
    Blob<Dtype> col_buffer_;  // temporary matrix for convolve-ready second image (4x4 bigger)
    Blob<Dtype> ones_col_;
    Blob<Dtype> masks_;
    Blob<Dtype> dense_buf_;   // buffer to transfer results from dense GEMM to sparse nghrad
  };
208 | 
209 | 
210 |   ////////////////////////////////////////////////////////////
211 |   //                DeepMatching ArgMax layer              //
212 |   //////////////////////////////////////////////////////////
213 | 
  // Forward-only layer (both backward passes are stubbed with NOT_IMPLEMENTED).
  // LayerSetUp, Reshape and the forward passes are defined outside this header.
  // NOTE(review): presumably extracts the best-scoring correspondence per
  // position from DeepMatching score maps -- confirm in the implementation.
  template <typename Dtype>
  class DeepMatchingArgMaxLayer : public Layer<Dtype> {
   public:
    // Each constructor argument is stored unchanged in the const member of the
    // same name (with a trailing underscore); param goes to Layer<Dtype>.
    explicit DeepMatchingArgMaxLayer(const LayerParameter& param, 
                   const int img_height, const int img_width, const int step, const int ngh_rad)
        : Layer<Dtype>(param), img_height_(img_height), img_width_(img_width), step_(step),
          ngh_rad_(ngh_rad) {}
    
    virtual void LayerSetUp(const vector<Blob<Dtype>*>& bottom, const vector<Blob<Dtype>*>& top);
    virtual void Reshape(const vector<Blob<Dtype>*>& bottom, const vector<Blob<Dtype>*>& top);
    
   protected:
    virtual void Forward_cpu(const vector<Blob<Dtype>*>& bottom, const vector<Blob<Dtype>*>& top);
    virtual void Forward_gpu(const vector<Blob<Dtype>*>& bottom, const vector<Blob<Dtype>*>& top);
    // No gradient is provided for this layer (inference only).
    virtual void Backward_cpu(const vector<Blob<Dtype>*>& top, const vector<bool>& propagate_down, const vector<Blob<Dtype>*>& bottom)
      {NOT_IMPLEMENTED;}
    virtual void Backward_gpu(const vector<Blob<Dtype>*>& top, const vector<bool>& propagate_down, const vector<Blob<Dtype>*>& bottom)
      {NOT_IMPLEMENTED;}
    
    // Construction-time configuration; never modified afterwards.
    const int img_height_, img_width_, step_, ngh_rad_;
  };
235 | 
236 | 
237 | 
238 | };
239 | 
240 | 
241 | 
242 | #endif
243 | 
244 | 
245 | 
246 | 
247 | 
248 | 
249 | 
250 | 
251 | 
252 | 
253 | 
254 | 
255 | 
256 | 
257 | 
258 | 
259 | 
260 | 
261 | 
262 | 
263 | 
264 | 
265 | 
266 | 
267 | 
268 | 
269 | 


--------------------------------------------------------------------------------
/deep_matching/flow_utils.py:
--------------------------------------------------------------------------------
  1 | """
Contains utility functions for flows: read/write, conversion to color, and display of the color coding.
The functions are similar to the Middlebury functions (which were written in Matlab by Deqing Sun).
  4 | Author: Philippe Weinzaepfel
  5 | Version: 1.0
  6 | Date: 19 November 2012
  7 | """
  8 | 
  9 | import numpy as np
 10 | """import matplotlib.pylab as plt"""
 11 | import struct
 12 | from PIL import Image
 13 | 
# for read/write 
# (none of these read/write constants is referenced in the visible functions below)
TAG_FLOAT = 202021.25 # tag to check the sanity of the file
TAG_STRING = 'PIEH'   # string containing the tag
MIN_WIDTH = 1
MAX_WIDTH = 99999
MIN_HEIGHT = 1
MAX_HEIGHT = 99999

# for colors
# Number of colorwheel entries in each hue segment; _computeColor fills the
# wheel in this order (R->Y, Y->G, G->C, C->B, B->M, M->R) and uses their sum
# as the total number of wheel colors.
RY = 15
YG = 6
GC = 4
CB = 11
BM = 13
MR = 6

# for flow
# flowToColor treats a pixel as "unknown" when the absolute value of one of its
# flow components exceeds this threshold.
UNKNOWN_THRESH = 1e9
 32 | 
 33 | def flowToColor(flow, maxflow=None, maxmaxflow=None, saturate=False):
 34 |     """
 35 |     flow_utils.flowToColor(flow): return a color code flow field, normalized based on the maximum l2-norm of the flow
 36 |     flow_utils.flowToColor(flow,maxflow): return a color code flow field, normalized by maxflow
 37 | 
 38 |     ---- PARAMETERS ----
 39 |         flow: flow to display of shape (height x width x 2)
 40 |         maxflow (default:None): if given, normalize the flow by its value, otherwise by the flow norm
 41 |         maxmaxflow (default:None): if given, normalize the flow by the max of its value and the flow norm
 42 | 
 43 |     ---- OUTPUT ----
 44 |         an np.array of shape (height x width x 3) of type uint8 containing a color code of the flow
 45 |     """
 46 |     h,w,n = flow.shape
 47 |     # check size of flow
 48 |     if not n == 2:
 49 |         raise Exception("flow_utils.flowToColor(flow): flow must have 2 bands")
 50 |     # compute max flow if needed
 51 |     if maxflow is None:
 52 |         maxflow = flowMaxNorm(flow)
 53 |     if maxmaxflow is not None:
 54 |         maxflow = min(maxmaxflow, maxflow)
 55 |     # fix unknown flow
 56 |     unknown_idx = np.max(np.abs(flow),2)>UNKNOWN_THRESH
 57 |     flow[unknown_idx] = 0.0
 58 |     # normalize flow
 59 |     eps = np.spacing(1) # minimum positive float value to avoid division by 0
 60 |     # compute the flow
 61 |     img = _computeColor(flow/(maxflow+eps), saturate=saturate)
 62 |     # put black pixels in unknown location
 63 |     img[ np.tile( unknown_idx[:,:,np.newaxis],[1,1,3]) ] = 0.0 
 64 |     return img
 65 | 
 66 | def flowMaxNorm(flow):
 67 |     """
 68 |     flow_utils.flowMaxNorm(flow): return the maximum of the l2-norm of the given flow
 69 | 
 70 |     ---- PARAMETERS ----
 71 |         flow: the flow
 72 |         
 73 |     ---- OUTPUT ----
 74 |         a float containing the maximum of the l2-norm of the flow
 75 |     """
 76 |     return np.max( np.sqrt( np.sum( np.square( flow ) , 2) ) )
 77 | 
 78 | 
 79 | def _computeColor(flow, saturate=True):
 80 |     """
 81 |     flow_utils._computeColor(flow): compute color codes for the flow field flow
 82 |     
 83 |     ---- PARAMETERS ----
 84 |         flow: np.array of dimension (height x width x 2) containing the flow to display
 85 | 
 86 |     ---- OUTPUTS ----
 87 |         an np.array of dimension (height x width x 3) containing the color conversion of the flow
 88 |     """
 89 |     # set nan to 0
 90 |     nanidx = np.isnan(flow[:,:,0])
 91 |     flow[nanidx] = 0.0
 92 |     
 93 |     # colorwheel
 94 |     ncols = RY + YG + GC + CB + BM + MR
 95 |     nchans = 3
 96 |     colorwheel = np.zeros((ncols,nchans),'uint8')
 97 |     col = 0;
 98 |     #RY
 99 |     colorwheel[:RY,0] = 255
100 |     colorwheel[:RY,1] = [(255*i) // RY for i in range(RY)]
101 |     col += RY
102 |     # YG    
103 |     colorwheel[col:col+YG,0] = [255 - (255*i) // YG for i in range(YG)]
104 |     colorwheel[col:col+YG,1] = 255
105 |     col += YG
106 |     # GC
107 |     colorwheel[col:col+GC,1] = 255
108 |     colorwheel[col:col+GC,2] = [(255*i) // GC for i in range(GC)]
109 |     col += GC
110 |     # CB
111 |     colorwheel[col:col+CB,1] = [255 - (255*i) // CB for i in range(CB)]
112 |     colorwheel[col:col+CB,2] = 255
113 |     col += CB
114 |     # BM
115 |     colorwheel[col:col+BM,0] = [(255*i) // BM for i in range(BM)]
116 |     colorwheel[col:col+BM,2] = 255
117 |     col += BM
118 |     # MR
119 |     colorwheel[col:col+MR,0] = 255
120 |     colorwheel[col:col+MR,2] = [255 - (255*i) // MR for i in range(MR)]
121 | 
122 |     # compute utility variables
123 |     rad = np.sqrt( np.sum( np.square(flow) , 2) ) # magnitude
124 |     a = np.arctan2( -flow[:,:,1] , -flow[:,:,0]) / np.pi # angle
125 |     fk = (a+1)/2 * (ncols-1) # map [-1,1] to [0,ncols-1]
126 |     k0 = np.floor(fk).astype('int')
127 |     k1 = k0+1
128 |     k1[k1==ncols] = 0
129 |     f = fk-k0
130 | 
131 |     if not saturate:
132 |         rad = np.minimum(rad,1)
133 | 
134 |     # compute the image
135 |     img = np.zeros( (flow.shape[0],flow.shape[1],nchans), 'uint8' )
136 |     for i in range(nchans):
137 |         tmp = colorwheel[:,i].astype('float')
138 |         col0 = tmp[k0]/255
139 |         col1 = tmp[k1]/255
140 |         col = (1-f)*col0 + f*col1
141 |         idx = (rad <= 1)
142 |         col[idx] = 1-rad[idx]*(1-col[idx]) # increase saturation with radius
143 |         col[~idx] *= 0.75 # out of range
144 |         img[:,:,i] = (255*col*(1-nanidx.astype('float'))).astype('uint8')
145 | 
146 |     return img
147 | 
148 | 
149 | 
150 | 
151 | 
152 | 


--------------------------------------------------------------------------------
/deep_matching/gpudm.swig:
--------------------------------------------------------------------------------
  1 | // -*- c++ -*-
  2 | /*
  3 | Copyright (C) 2015 Jerome Revaud
  4 | 
  5 | This program is free software: you can redistribute it and/or modify
  6 | it under the terms of the GNU General Public License as published by
  7 | the Free Software Foundation, either version 3 of the License, or
  8 | (at your option) any later version.
  9 | 
 10 | This program is distributed in the hope that it will be useful,
 11 | but WITHOUT ANY WARRANTY; without even the implied warranty of
 12 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 13 | GNU General Public License for more details.
 14 | 
 15 | You should have received a copy of the GNU General Public License
 16 | along with this program.  If not, see <http://www.gnu.org/licenses/>
 17 | */
 18 | 
 19 | %module gpudm;
 20 | 
 21 | %{
 22 | 
 23 | #include "caffe/caffe.hpp"
 24 | #include "extra_layers.hpp"
 25 | 
 26 | using namespace caffe; 
 27 | using namespace std; 
 28 | 
 29 | %}
 30 | 
 31 | %include "std_string.i"
 32 | %include "std_pair.i"
 33 | %include "std_set.i"
 34 | %include "std_map.i"
 35 | %include "std_vector.i"
 36 | %include "boost_shared_ptr.i"
 37 | 
 38 | 
 39 | %shared_ptr(caffe::Blob< float >); 
 40 | %shared_ptr(caffe::Layer< float >); 
 41 | %shared_ptr(caffe::NeuronLayer<float>);
 42 | %shared_ptr(caffe::ReLULayer< float >); 
 43 | %shared_ptr(caffe::PowerLayer< float >); 
 44 | %shared_ptr(caffe::RectifiedSigmoidLayer< float >); 
 45 | %shared_ptr(caffe::ReshapeLayer< float >); 
 46 | %shared_ptr(caffe::PixelNormLayer< float >);
 47 | %shared_ptr(caffe::BaseConvolutionLayer< float >); 
 48 | %shared_ptr(caffe::ConvolutionLayer< float >); 
 49 | %shared_ptr(caffe::PatchConvolutionLayer<float>);
 50 | %shared_ptr(caffe::CSR_SparseConvolutionLayer<float>);
 51 | %shared_ptr(caffe::BorderRectifyLayer< float >);
 52 | %shared_ptr(caffe::PoolingLayer<float>); 
 53 | %shared_ptr(caffe::InnerProductLayer<float>); 
 54 | %shared_ptr(caffe::DeepMatchingArgMaxLayer<float>); 
 55 | 
 56 | 
 57 | %include "caffe/caffe.hpp"
 58 | %include "caffe/common.hpp"
 59 | %include "caffe/blob.hpp"
 60 | %include "caffe/filler.hpp"
 61 | %include "caffe/layer.hpp"
 62 | 
 63 | using namespace std;
 64 | using namespace boost;
 65 | %template(BlobVector) vector< shared_ptr< caffe::Blob< float > > >; 
 66 | %template(BlobPtrVector) vector< caffe::Blob< float >* >; 
 67 | %template(LayerVector) vector< shared_ptr< caffe::Layer< float > > >; 
 68 | %template(FloatVector) vector< float >; 
 69 | 
 70 | %include "caffe/net.hpp"
 71 | %include "caffe/common_layers.hpp"
 72 | %include "caffe/neuron_layers.hpp"
 73 | %include "caffe/vision_layers.hpp"
 74 | %include "caffe/util/math_functions.hpp"
 75 | %include "extra_layers.hpp"
 76 | 
 77 | #define GOOGLE_PROTOBUF_VERSION 2005000
 78 | #define GOOGLE_PROTOBUF_MIN_PROTOC_VERSION 2005000
 79 | 
// Minimal stand-in declarations for a few google::protobuf names.
// NOTE(review): presumably these exist only so that SWIG can parse
// caffe/proto/caffe.pb.h (included right after) without the real protobuf
// headers -- confirm. Message has a private constructor, so it cannot be
// constructed from outside the class.
namespace google {
  namespace protobuf {
    class Message {
    private: 
      Message();
      int x;
    };
    typedef unsigned int uint32;
    typedef int int32;
    typedef long long int64;
  }
}
 92 | 
 93 | %include "caffe/proto/caffe.pb.h"
 94 | 
 95 | 
 96 | %template(NetFloat) caffe::Net<float>; 
 97 | %template(BlobFloat) caffe::Blob<float>; 
 98 | %template(LayerFloat) caffe::Layer<float>;
 99 | %template(NeuronLayerFloat) caffe::NeuronLayer<float>;
100 | %template(ReLULayerFloat) caffe::ReLULayer<float>;
101 | %template(PowerLayerFloat) caffe::PowerLayer<float>;
102 | %template(ReshapeLayerFloat) caffe::ReshapeLayer< float >; 
103 | %template(RectifiedSigmoidLayerFloat) caffe::RectifiedSigmoidLayer<float>;
104 | %template(PixelNormLayerFloat) caffe::PixelNormLayer< float >;
105 | %template(BaseConvolutionLayerFloat) caffe::BaseConvolutionLayer< float >; 
106 | %template(ConvolutionLayerFloat) caffe::ConvolutionLayer< float >; 
107 | %template(PatchConvolutionLayerFloat) caffe::PatchConvolutionLayer<float>;
108 | %template(CSR_SparseConvolutionLayerFloat) caffe::CSR_SparseConvolutionLayer<float>;
109 | %template(BorderRectifyLayerFloat) caffe::BorderRectifyLayer< float >;
110 | %template(PoolingLayerFloat) caffe::PoolingLayer<float>; 
111 | %template(DeepMatchingArgMaxLayerFloat) caffe::DeepMatchingArgMaxLayer<float>; 
112 | 
// function releases GIL while doing slow action
// NOTE(review): a SWIG %exception handler applies to the declarations that
// FOLLOW it, and the bare "%exception;" below clears it again with nothing
// wrapped in between. As written, this handler therefore appears to affect no
// function at all -- confirm whether the GIL release was disabled on purpose.
%exception {
  Py_BEGIN_ALLOW_THREADS
  $action
  Py_END_ALLOW_THREADS
}

%exception;
121 | 
122 | 
123 | %{
124 | #define SWIG_FILE_WITH_INIT
125 | #define NPY_NO_DEPRECATED_API NPY_1_7_API_VERSION
126 | #include <numpy/arrayobject.h>
127 | 
128 | PyObject * floats_to_numpy_ref(float *src, long size) {
129 |   npy_intp shp = size; 
130 |   return PyArray_SimpleNewFromData(1, &shp, NPY_FLOAT32, src);
131 | }
132 | 
133 | %}
134 | 
135 | PyObject * floats_to_numpy_ref(float *src, long size);
136 | 
137 | %init %{
138 | /* needed, else crash at runtime */
139 |     import_array();
140 | %}
141 | 
142 | 
143 | %pythoncode %{
144 | 
145 | import numpy
146 | 
def BlobFloat_get_shape(self): 
  """Return the blob dimensions as the tuple (num, channels, height, width)."""
  n = self.num()
  c = self.channels()
  h = self.height()
  w = self.width()
  return (n, c, h, w)
149 | 
def BlobFloat_to_numpy_ref(self): 
  """Return the blob's cpu_data() as a numpy array shaped like get_shape().

  The buffer is wrapped by floats_to_numpy_ref, not copied.
  """
  return floats_to_numpy_ref(self.cpu_data(), self.count()).reshape(self.get_shape())
153 | 
def BlobFloat_diff_to_numpy_ref(self): 
  """Return the blob's cpu_diff() as a numpy array shaped like get_shape().

  The buffer is wrapped by floats_to_numpy_ref, not copied.
  """
  return floats_to_numpy_ref(self.cpu_diff(), self.count()).reshape(self.get_shape())
157 | 
def BlobFloat_mutable_to_numpy_ref(self): 
  """Return the blob's mutable_cpu_data() as a numpy array shaped like get_shape().

  The buffer is wrapped by floats_to_numpy_ref, not copied.
  """
  return floats_to_numpy_ref(self.mutable_cpu_data(), self.count()).reshape(self.get_shape())
161 | 
def BlobFloat_mutable_diff_to_numpy_ref(self): 
  """Return the blob's mutable_cpu_diff() as a numpy array shaped like get_shape().

  The buffer is wrapped by floats_to_numpy_ref, not copied.
  """
  return floats_to_numpy_ref(self.mutable_cpu_diff(), self.count()).reshape(self.get_shape())
165 | 
# Attach the helper functions defined above as methods of the BlobFloat
# class, so they can be called as blob.get_shape(), blob.to_numpy_ref(), ...
BlobFloat.get_shape = BlobFloat_get_shape
BlobFloat.to_numpy_ref = BlobFloat_to_numpy_ref
BlobFloat.diff_to_numpy_ref = BlobFloat_diff_to_numpy_ref
BlobFloat.mutable_to_numpy_ref = BlobFloat_mutable_to_numpy_ref
BlobFloat.mutable_diff_to_numpy_ref = BlobFloat_mutable_diff_to_numpy_ref
171 | 
172 | %}
173 | 
174 | 
175 | /*-------- DeepMatching functions ------------*/
176 | %{
177 | 
178 | #include "numpy_image.h"
179 | #include <algorithm>
180 | using std::min;
181 | using std::max;
/* Square of x. */
static inline float pow2(float x) {
  const float squared = x*x;
  return squared;
}
183 | #define nullptr 0
184 | 
185 | static inline int retrieve_children( const int x, const int y, const int_cube* child_grid ) {
186 |   const int size0_div2 = child_grid->pixels[0];
187 |   const int step0 = child_grid->tx==1 && child_grid->ty==1 ? 1 : 
188 |                                         max( child_grid->pixels[2]-child_grid->pixels[0], 
189 |                                              child_grid->pixels[1+2*child_grid->tx]-child_grid->pixels[1] );
190 |   int i = (x-size0_div2)/step0;
191 |   int j = (y-size0_div2)/step0;
192 |   assert( x==(i*step0+size0_div2) || !"error: child_grid does not match current grid" );
193 |   assert( y==(j*step0+size0_div2) || !"error: child_grid does not match current grid" );
194 |   if( i<0 || i>=child_grid->tx )  return -1;
195 |   if( j<0 || j>=child_grid->ty )  return -1;
196 |   return i+j*child_grid->tx;
197 | }
198 | 
/* Fill gaps[0..nc-1] with the offsets, relative to the center of a parent
   patch of size parent_psize, at which its children are looked up along one
   axis. Only nc==2 (2 entries written) and nc==3 (3 entries written) are
   supported; any other value trips an assert. */
static inline void prepare_gaps( const int parent_psize, const int nc, int gaps[3] ) {
  const int half = parent_psize/2;
  const int quarter = half/2;
  switch(nc) {
    case 2:   // 4 children per parent patch
      gaps[0] = quarter - half;
      gaps[1] = quarter;
      break;
    case 3:   // 9 children per parent patch
      gaps[0] = quarter - half;
      gaps[1] = 0;
      gaps[2] = quarter;
      break;
    default:
      assert(0);
  }
}
210 | 
/* Prepare a grid of cell positions in the first image for a given scale. Big cells inherit the cell at the previous scale.
    size = size of cells at current scale
    offset, step = grid generator: (offset + i*step, offset + j*step)
    child_grid = grid of the previous layer (or None if first layer)
    child_norms = image containing the norms of the patch at the previous level
    grid = result center positions of cells in current scale
    children = index of cells in previous scale used to construct big cells
    norms = norms of the cells of this level

    Outputs are written in place:
      grid     receives one (x,y) pair per cell, row after row;
      children receives, for each cell, nc*nc child indices (-1 when the child
               position lies outside child_grid), with nc = sqrt(children->tz);
      norms    (if non-null) receives, for each cell, the sum of child_norms
               over its existing children.
    When child_grid is null only grid is written; children and norms are not touched.
*/
void _prepare_big_cells( int size, int offset, int step, 
                         int_cube* child_grid, float_image* child_norms,
                         int_cube* grid, int_cube* children, float_image* norms ) {
  assert(grid->tz==2);
  const int ntx = grid->tx; // should be == 1+(tx-size)/step so that patches do not pass the border
  const int nty = grid->ty; // should be == 1+(ty-size)/step so that patches do not pass the border
  
  /* grid[i,j] = ( offset + i*step, offset + j*step )
    
    connection between two scales:
    x cell position in lower scale == x position of children in upper scale
    child_offset + child_i*child_step = offset + i*step + U*size/4
                                                     with U = (2*u/(nc-1)-1) \in {-1,0,1}
  */
  
  int i,j,u,v;
  int* r = grid->pixels;  // write cursor over grid: advances by 2 ints per cell
  
  if( !child_grid ) {
    // this is the first scale: 
    // we just return a grid of step size*(1-overlap/2) in [0, tx[ x [0, ty[
    
    for(j=0; j<nty; j++)
      for(i=0; i<ntx; i++) {
        *r++ = offset + i*step;
        *r++ = offset + j*step;
      }
  } else {
    assert(child_grid->tz==2);
    assert( (child_norms!=NULL) == (norms!=NULL) || !"both must be null or non-null at the same time" );
    if(norms) ASSERT_SAME_SIZE( child_grid, child_norms );
    assert( children );
    // children->tz is expected to be a perfect square (checked just below)
    const int nc = sqrt(children->tz); // number of children per row or col
    assert( children->tz==pow2(nc) );
    ASSERT_SAME_SIZE( grid, children );
    if(norms) ASSERT_SAME_SIZE( grid, norms );
    // this is at least second scale
    // we return a grid of step size*(1-overlap/2) in [0, tx[ x [0, ty[
    
    // only the first nc entries of gaps are written by prepare_gaps and read below
    int gaps[3];
    prepare_gaps( size, nc, gaps ); // usually, returns [-q,q] for nc==2 with q=size/4
    
    int* c = children->pixels;  // write cursor over children: nc*nc ints per cell
    float *n = norms ? norms->pixels : nullptr;  // write cursor over norms: 1 float per cell
    if(n) memset(n,0,ntx*nty*sizeof(float));
    for(j=0; j<nty; j++)
      for(i=0; i<ntx; i++) {
        int x = offset + i*step;
        int y = offset + j*step;
        *r++ = x;
        *r++ = y;
        
        // accumulate norms from 2x2 or 3x3 neighbors        
        for(v=0; v<nc; v++)
          for(u=0; u<nc; u++,c++) {
            // we want to index the children at position:
            // ( center_x + gaps[u], center_y + gaps[v] )
            *c = retrieve_children( x+gaps[u], y+gaps[v], child_grid );
            // children outside child_grid (index -1) contribute nothing
            if(n && *c>=0) *n += child_norms->pixels[*c];
          }
        if(n) n++;
      }
  }
}
284 | 
285 | #define NEWA(type,n) (type*)malloc(sizeof(type)*(n))
286 | 
287 | static float** get_list_corres( const float_cube* map, int* nb ) {
288 |   const int tz = map->tz;
289 |   float* m = map->pixels;
290 |   const long npix = map->tx*map->ty;
291 |   float** res = NEWA(float*,npix);
292 |   
293 |   int i,n=0;
294 |   for(i=0; i<npix; i++,m+=tz)
295 |     if(m[4]) { // if score non-null
296 |       res[n++] = m; // remember pointer
297 |     }
298 |   
299 |   *nb = n;
300 |   return res;
301 | }
302 | 
/* qsort comparator for arrays of float*: orders the pointed-to entries by a
   raw byte comparison of their first 4 floats. */
static inline int cmp_corres( const void* a, const void* b) {
  const float* lhs = *(float* const*)a;
  const float* rhs = *(float* const*)b;
  return memcmp(lhs, rhs, 4*sizeof(float));
}
306 | 
/* Intersect 2 mappings: erase all correspondences that are not reciprocal 
   map0, map1: maps holding 6 floats per pixel (asserted); entries whose 5th
               float is zero are ignored (see get_list_corres).
   corres:     output buffer; every entry kept is copied there as 6 consecutive
               floats. It must be large enough for all kept entries: this
               function performs no bounds check on it.
   Returns the number of entries written to corres.
*/
int _intersect_corres( const float_cube* map0, const float_cube* map1, float_image* corres ) {
  const int tz = 6;
  assert( map0->tz==tz && map1->tz==tz );
  
  // build the list of triplets
  // (each list holds pointers into the corresponding map; the allocations are
  //  not checked for failure)
  int n0,n1;
  float** const corres0 = get_list_corres(map0,&n0);
  float** const corres1 = get_list_corres(map1,&n1);
  
  // arg-sort the lists
  // NOTE(review): cmp_corres orders entries on their first 4 floats only,
  // whereas the merge below compares 5 floats. Entries sharing the first 4
  // floats but differing in the 5th are therefore not guaranteed to be visited
  // in a consistent order -- confirm this cannot happen or is acceptable.
  qsort( corres0, n0, sizeof(float*), cmp_corres );
  qsort( corres1, n1, sizeof(float*), cmp_corres );
  
  // remove all correspondences from map0/map1 that is not shared
  // (classic merge of two sorted lists: advance the side holding the smaller key)
  float** c0 = corres0;
  float** c1 = corres1;
  float** const c0max = corres0 + n0;
  float** const c1max = corres1 + n1;
  float* res = corres->pixels;
  float* r = res;  // write cursor in the output buffer
  while(c0<c0max && c1<c1max) {
    int d = memcmp(*c0,*c1,5*sizeof(float));
    if(d<0) { // corres0 < corres1
      c0++;
    } else 
    if(d>0) { // corres0 > corres1
      c1++;
    } else { // corres0 == corres1
      // skip the entry if it is byte-identical to the one written just before
      if( r==res || memcmp( r-tz, *c0, tz*sizeof(float) ) ) { // if not already copied
        memcpy( r, *c0, tz*sizeof(float) );
        r += tz;
      }
      c0++;
      c1++;
    }
  }
  
  free(corres0);
  free(corres1);
  return (r-res)/tz;
}
350 | 
351 | %}
352 | 
353 | %include <numpy_image.swg>
354 | 
355 | void _prepare_big_cells( int size, int offset, int step, 
356 |                          int_cube* child_grid, float_image* child_norms,
357 |                          int_cube* grid, int_cube* children, float_image* norms );
358 | 
359 | int _intersect_corres( const float_cube* map0, const float_cube* map1, float_image* corres );
360 | 
361 | 
362 | %pythoncode %{
363 | 
def prepare_big_cells( imshape, cell_size, overlap, child_overlap, child_grid, child_norms, dense_step=0, offset=None ):
  """Allocate the output arrays for one scale and fill them with _prepare_big_cells.

  imshape:       image shape; imshape[0] is used for the grid height, imshape[1] for its width
  cell_size:     size of the cells at this scale
  overlap:       0 or 1 (asserted); the grid step is cell_size//(overlap+1) unless dense_step is set
  child_overlap: each cell has (2+child_overlap)**2 children
  child_grid:    grid of the previous scale, or None for the first scale
  child_norms:   norms of the previous scale, or None
  dense_step:    if non-zero, used as the grid step (and the default offset becomes 0)
  offset:        position of the first cell; defaults to cell_size//2 (0 if dense_step is set)

  Returns (step, grid, children) when child_norms is None, else (step, grid, children, norms).
  children is None when child_grid is None.
  """
  # floor division keeps every size an integer under both Python 2 and Python 3
  if offset is None:  offset = cell_size//2 if not dense_step else 0
  step = cell_size//(overlap+1) if not dense_step else dense_step
  grid_size = lambda imsize: 1+max(0,imsize-2*offset)//step
  gtx = grid_size(imshape[1])
  gty = grid_size(imshape[0])
  grid = numpy.empty((gty,gtx,2),numpy.int32)
  norms = numpy.zeros((gty,gtx),numpy.float32) if child_norms is not None else None
  
  assert overlap in {0,1}
  nc = (2+child_overlap)**2  # number of children per cell
  # identity test: '!=' on a numpy array is an elementwise comparison
  children = numpy.empty((gty,gtx,nc),numpy.int32) if child_grid is not None else None
  
  _prepare_big_cells( cell_size, offset, step, child_grid, child_norms, grid, children, norms )
  
  if norms is None:
    return step, grid, children
  else:
    return step, grid, children, norms
383 | 
def intersect_corres( c0, c1 ):
  """Return the correspondences kept by _intersect_corres for maps c0 and c1.

  The result is an (n,6) float32 array, with n the count returned by
  _intersect_corres.
  """
  # upper bound on the number of results; floor division keeps it an integer
  # under both Python 2 and Python 3
  n = min(c0.size, c1.size) // 6
  res = numpy.empty((n,6), numpy.float32)
  n = _intersect_corres( c0, c1, res )
  return res[:n]
389 | 
390 | 
391 | %}
392 | 
393 | 
394 | 
395 | 
396 | 
397 | 
398 | 
399 | 
400 | 
401 | 
402 | 
403 | 
404 | 
405 | 
406 | 
407 | 
408 | 
409 | 
410 | 
411 | 
412 | 


--------------------------------------------------------------------------------
/deep_matching/helper.py:
--------------------------------------------------------------------------------
  1 | """
  2 | Copyright (C) 2015 Jerome Revaud
  3 | 
  4 | This program is free software: you can redistribute it and/or modify
  5 | it under the terms of the GNU General Public License as published by
  6 | the Free Software Foundation, either version 3 of the License, or
  7 | (at your option) any later version.
  8 | 
  9 | This program is distributed in the hope that it will be useful,
 10 | but WITHOUT ANY WARRANTY; without even the implied warranty of
 11 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 12 | GNU General Public License for more details.
 13 | 
 14 | You should have received a copy of the GNU General Public License
 15 | along with this program.  If not, see <http://www.gnu.org/licenses/>
 16 | """
 17 | import os, sys, pdb, cPickle
 18 | from collections import namedtuple
 19 | from PIL import Image
 20 | from numpy import *
 21 | try:
 22 |   from matplotlib.pyplot import *
 23 |   ion()
 24 | except:
 25 |   pass
 26 | 
 27 | ########################################################
 28 | # visualization
 29 | 
 30 | def noticks():
 31 |   xticks([])
 32 |   yticks([])
 33 | 
 34 | def plot_rect(l,t,r,b,ls='-',rescale=True,**kwargs):
 35 |     (L,R), (B,T) = xlim(), ylim()
 36 |     plot([l,r,r,l,l],[t,t,b,b,t],ls,scalex=0,scaley=0,**kwargs)
 37 |     if rescale:
 38 |       xlim((min(L,l),max(R,r)))
 39 |       ylim((max(B,b),min(T,t)))
 40 | 
 41 | def plot_square(cx,cy,rad,ls='-',**kwargs):
 42 |     plot_rect(cx-rad,cy-rad,cx+rad,cy+rad,ls,**kwargs)
 43 | 
 44 | 
 45 | def get_assign(assign, n_maps):
 46 |   return arange(n_maps) if assign==None else assign 
 47 | 
 48 | 
 49 | def show_conv( levels, rot45=None, nshow=0, img0=None, img1=None, **kwargs ):
 50 |     level = levels[-1]
 51 |     grid = level.grid.reshape(-1,2)
 52 |     if rot45: grid = apply_rot45(rot45,grid)
 53 |     rad = level.psize/2
 54 |     assign = get_assign(level.assign,len(level.res_map))
 55 |     
 56 |     ax1 = subplot(311)
 57 |     ax1.numplot = 1
 58 |     imshow(img0, interpolation='nearest')
 59 |     ax2 = subplot(312)
 60 |     ax2.numplot = 2
 61 |     imshow(img1, interpolation='nearest')
 62 |     ax3 = subplot(313)
 63 |     ax3.numplot = 3
 64 |     fig = get_current_fig_manager().canvas.figure
 65 |     
 66 |     def redraw():
 67 |       # we redraw only the concerned axes
 68 |       renderer = fig.canvas.get_renderer()
 69 |       ax1.draw(renderer)  
 70 |       ax2.draw(renderer)
 71 |       ax3.draw(renderer)
 72 |       fig.canvas.blit(ax1.bbox)
 73 |       fig.canvas.blit(ax2.bbox)
 74 |       fig.canvas.blit(ax3.bbox)
 75 |     
 76 |     global cur  # ugly but wo cares
 77 |     cur = None
 78 |     def motion_notify_callback(event):
 79 |       global cur
 80 |       if not event.inaxes:  return
 81 |       x,y = event.xdata, event.ydata
 82 |       if x and y: # we are somewhere on a plot
 83 |         if cur is not None and event.inaxes.numplot in (2,3):
 84 |           ax2.lines = ax2.lines[:1]
 85 |           ax3.lines = []
 86 |           offx,offy = (0,0) if level.offsets is None else level.offsets.reshape(-1,2)[cur]
 87 |           if event.inaxes.numplot==2:
 88 |             f = level.f
 89 |             x,y = int(0.5 + x/f), int(0.5 + y/f)
 90 |           else:
 91 |             f = 1
 92 |             x,y = int(0.5 + (offx+x)/f), int(0.5 + (offy+y)/f)
 93 |           fig.add_subplot(312)
 94 |           xl,yl=xlim(),ylim()
 95 |           ax2.plot(x*level.f,y*level.f,'+',c=(0,1,0),ms=10,scalex=0,scaley=0)
 96 |           plot_square(x*level.f-0.5,y*level.f-0.5,rad,color='b')
 97 |           xlim(xl);ylim(yl)
 98 |           ax3.plot(x-offx,y-offy,'+k',ms=20,scalex=0,scaley=0)
 99 |           redraw()
100 |     
101 |     def mouse_click_callback(event):
102 |       global cur
103 |       if not event.inaxes:  return
104 |       x,y = event.xdata, event.ydata
105 |       if x and y: # we are somewhere on a plot
106 |         if event.inaxes.numplot==1:
107 |           cur = sum((grid - [x,y])**2,1).argmin()   # find nearest point
108 |           x,y = grid[cur]
109 |           ax1.lines = []
110 |           ax2.lines = []
111 |           ax3.lines = []
112 |           fig.add_subplot(311)
113 |           xl,yl=xlim(),ylim()
114 |           plot(x,y,'+',color=(0,1,0),ms=10,mew=1)
115 |           plot_square(x-0.5,y-0.5,rad,color='b')
116 |           xlim(xl);ylim(yl)
117 |           ax3.images = []
118 |           ax3.imshow(level.res_map[assign[cur]], vmin=0, vmax=1.1, interpolation='nearest')
119 |           if level.offsets is not None:
120 |             ox, oy = level.offsets.reshape(-1,2)[cur]
121 |             sx, sy = level.res_map.shape[1:]
122 |             subplot(312)
123 |             plot_rect(level.f*ox,level.f*oy,level.f*(ox+sx),level.f*(oy+sy),'-',c=(0,1,0),rescale=False)
124 |           redraw()
125 |         elif cur is not None and event.inaxes.numplot>1:
126 |           offx,offy = (0,0) if level.offsets is None else level.offsets.reshape(-1,2)[cur]
127 |           offx,offy = (0,0) if level.offsets is None else level.offsets.reshape(-1,2)[cur]
128 |           if event.inaxes.numplot==2:
129 |             f = level.f
130 |             x,y = int(0.5 + x/f), int(0.5 + y/f)
131 |             score = level.res_map[cur,y-offy,x-offx]
132 |           else:
133 |             x,y = int(0.5 + x), int(0.5 + y)
134 |             score = level.res_map[cur,y,x]
135 |           print 'res_map[%d, %d, %d] = %g' % (cur, y, x, score)
136 |     
137 |     class FakeEvent:
138 |       def __init__(self, x,y,ax):
139 |         self.xdata=x; self.ydata=y; self.inaxes=ax
140 |     mouse_click_callback(FakeEvent(1,1,ax1))
141 |     
142 |     subplots_adjust(left=0, bottom=0, right=1, top=1, wspace=0.02, hspace=0.02)
143 |     cid_move = fig.canvas.mpl_connect('motion_notify_event',motion_notify_callback)
144 |     cid_clic = fig.canvas.mpl_connect('button_press_event',mouse_click_callback)
145 |     print "Click on the top image to select a patch..."
146 |     pdb.set_trace()
147 |     fig.canvas.mpl_disconnect(cid_move)
148 |     fig.canvas.mpl_disconnect(cid_clic)
149 | 
150 | 
def get_imatches(matches, shape, psize=8):
    """Rasterise match indices into an image-sized lookup map.

    matches : integer array whose column 0 is x and column 1 is y.
    shape   : (height, width) of the map to build.
    psize   : side of the square painted around each match.

    Returns an int32 array of `shape` holding, for every pixel covered by a
    match's psize x psize square, the row index of that match, and -1
    elsewhere.  Squares are clipped to the image, so pixels falling outside
    are folded onto the border.
    """
    # Floor division keeps `half` an integer whatever the division semantics
    # in effect (plain `/` yields a float under true division, which range()
    # rejects).
    half = psize // 2
    imatches = -ones(shape, dtype=int32)
    nums = arange(len(matches))
    offsets = range(-half, half + (psize % 2))
    for j in offsets:
      for i in offsets:
        imatches[ clip(matches[:,1]+i,0,shape[0]-1),
                  clip(matches[:,0]+j,0,shape[1]-1)] = nums
    return imatches
160 | 
161 | 
162 | def show_flow( lm, maxima, corr, img0=None, img1=None, mode='flow', full_corres=None, psize=None, **viz ):
163 |     assert img0!=None
164 |     assert img1!=None
165 |     if type(corr)==tuple: corr = corr[0]
166 |     assert corr.size, 'error: empty correspondences'
167 |     if corr.ndim==3:
168 |       corr = corr[corr[:,:,4]>0]
169 |     set_max = set(corr[:,5])
170 |     colors = {m:i for i,m in enumerate(set_max)}
171 |     colors = {m:cm.jet(i/float(len(colors))) for m,i in colors.items()}
172 |     for key in viz:
173 |       if key.startswith('mode_') and viz[key] is True:
174 |         mode = key[5:]
175 |     
176 |     def motion_notify_callback(event):
177 |       if not event.inaxes:  return
178 |       x,y = event.xdata, event.ydata
179 |       if x and y: # we are somewhere on a plot
180 |         ax1.lines = []
181 |         ax2.lines = []
182 |         if event.inaxes.numplot==0:
183 |           if mode=='score_path':
184 |             ax3.lines = []
185 |             col = fc0[int(y/step),int(x/step)]
186 |             x0, y0, x1, y1 = col[:4]
187 |             ax3.plot( col[6:], '+-', color='k' )
188 |           elif mode in ('comatches','argmax'):
189 |             n = sum((corr[:,0:2] - [x,y])**2,1).argmin()   # find nearest point
190 |             x0,y0,x1,y1,_,m = corr[n,0:6]
191 |             # print leading correspondences
192 |             ax1.plot(x0,y0,'o',ms=10,mew=2,color='blue',scalex=False,scaley=False)
193 |             ax2.plot(x1,y1,'o',ms=10,mew=2,color='red',scalex=False,scaley=False)
194 |             # find co-matches
195 |             corres0 = retrieve_one_maxima_corres( lm, maxima[m], **viz['params'] )
196 |             corres0 = set(map(tuple,corres0[:,0:4]))
197 |             if mode == 'comatches':
198 |               real0 = set(map(tuple,corr[:,0:4]))
199 |               intersect = corres0 & real0
200 |             else:
201 |               intersect = corres0 # no filtering
202 |             x0,y0,x1,y1 = zip(*list(intersect))
203 |             
204 |           else:
205 |             n = sum((corr[:,0:2] - [x,y])**2,1).argmin()   # find nearest point
206 |             x0,y0,x1,y1,score,m = corr[n,0:6]
207 |             print "\rmatch #%d (%d,%d) --> (%d,%d) (len=%.1f), score=%.3f from maxima %d" % (n,
208 |               x0,y0,x1,y1,sqrt((x0-x1)**2+(y0-y1)**2),score,m),;sys.stdout.flush()
209 |           
210 |           ax1.plot(x0,y0,'+',ms=10,mew=2,color='blue',scalex=False,scaley=False)
211 |           ax2.plot(x1,y1,'+',ms=10,mew=2,color='red',scalex=False,scaley=False)
212 |         
213 |         elif event.inaxes.numplot==1:
214 |           if mode=='score_path':
215 |             ax3.lines = []
216 |             col = fc1[int(y/step),int(x/step)]
217 |             x0, y0, x1, y1 = col[:4]
218 |             ax3.plot( col[6:], '+-', color='k' )
219 |           else:
220 |             n = sum((corr[:,2:4] - [x,y])**2,1).argmin()  # find nearest point
221 |             x0,y0,x1,y1,score,m = corr[n,0:6]
222 |             print "\rmatch #%d (%d,%d) --> (%d,%d) (len=%.1f), score=%.3f from maxima %d" % (n,
223 |               x0,y0,x1,y1,sqrt((x0-x1)**2+(y0-y1)**2),score,m),;sys.stdout.flush()
224 |           ax1.plot(x0,y0,'+',ms=10,mew=2,color='red',scalex=False,scaley=False)
225 |           ax2.plot(x1,y1,'+',ms=10,mew=2,color='blue',scalex=False,scaley=False)
226 |         # we redraw only the concerned axes
227 |         renderer = fig.canvas.get_renderer()
228 |         ax1.draw(renderer)  
229 |         ax2.draw(renderer)
230 |         fig.canvas.blit(ax1.bbox)
231 |         fig.canvas.blit(ax2.bbox)
232 |         if mode=='score_path':
233 |           ax3.set_ylim((0,1))
234 |           ax3.draw(renderer)
235 |           fig.canvas.blit(ax3.bbox)
236 |     
237 |     wider_than_high = (img0.shape[0]+img1.shape[0]<img0.shape[1]+img1.shape[1])
238 |     if mode in ('corres', 'rainbow'):
239 |       if wider_than_high:
240 |         layouts = (311, 312, 325, 326)
241 |       else:
242 |         layouts = (221, 222, 223, 224)
243 |     else:
244 |       if wider_than_high:
245 |         layouts = (311, 312, 313)
246 |       else:
247 |         layouts = (221, 222, 212)
248 |     
249 |     clf()
250 |     ax1 = subplot(layouts[0])
251 |     ax1.numplot = 0
252 |     imshow(img0,interpolation='nearest')
253 |     noticks()
254 |     ax2 = subplot(layouts[1])
255 |     ax2.numplot = 1
256 |     imshow(img1,interpolation='nearest')
257 |     noticks()
258 |     
259 |     if mode in 'flow score score_path comatches argmax':
260 |       ax3 = subplot(layouts[2])
261 |       if mode == 'score_path':
262 |         assert full_corres!=None
263 |         ax3.numplot = -1
264 |         # retrieve score's path
265 |         step = full_corres.step
266 |         fc0 = full_corres.corres0
267 |         fc1 = full_corres.corres1
268 |         m = fc0[:,:,6:].mean(axis=0).mean(axis=0)
269 |         # find periodicity
270 |         fc_period = min([p for p in (1,4,6) if all(m[p-1::p]<=1)])
271 |         fc0 = fc0[:,:,range(6)+range(6+fc_period-1,fc0.shape[-1],fc_period)]
272 |         fc1 = fc1[:,:,range(6)+range(6+fc_period-1,fc1.shape[-1],fc_period)]
273 |         plot( m[fc_period-1::fc_period], '+-', color='k' )
274 |         ylim((0,1))
275 |         
276 |       else:
277 |         ax3.numplot = 0
278 |         from flow_utils import flowToColor
279 |         matches = int32(corr)
280 |         imatch = get_imatches(matches,img0.shape[:2],lm and lm[0].psize or psize or 1)
281 |         if mode in 'flow comatches argmax':
282 |           corr_flow = (matches[:,2:4]-matches[:,0:2])[imatch]
283 |           corr_color = flowToColor(corr_flow, maxflow=50)
284 |         if mode == 'score':
285 |           corr_color = corr[:,4][imatch]
286 |         corr_color[imatch<0] = 0
287 |         imshow(corr_color,interpolation='nearest')
288 |     
289 |     elif mode == 'rainbow':
290 |       # make beautiful colors
291 |       center = corr[:,[1,0]].mean(axis=0) # array(img0.shape[:2])/2 #
292 |       corr[:,5] = arctan2(*(corr[:,[1,0]] - center).T)
293 |       corr[:,5] = int32(64*corr[:,5]/pi) % 128
294 |       
295 |       set_max = set(corr[:,5])
296 |       colors = {m:i for i,m in enumerate(set_max)}
297 |       colors = {m:cm.hsv(i/float(len(colors))) for m,i in colors.items()}
298 |       
299 |       ax3 = subplot(layouts[2])
300 |       ax3.numplot = 0
301 |       imshow(img0/2+64,interpolation='nearest')
302 |       for m in set_max:
303 |         plot(corr[corr[:,5]==m,0],corr[corr[:,5]==m,1],'+',ms=10,mew=2,color=colors[m],scalex=0,scaley=0)
304 |       noticks()
305 |       
306 |       ax4 = subplot(layouts[3])
307 |       ax4.numplot = 1
308 |       imshow(img1/2+64,interpolation='nearest')
309 |       for m in set_max:
310 |         plot(corr[corr[:,5]==m,2],corr[corr[:,5]==m,3],'+',ms=10,mew=2,color=colors[m],scalex=0,scaley=0)
311 |       noticks()
312 |     
313 |     else:
314 |       ax3 = subplot(layouts[2])
315 |       ax3.numplot = None
316 |       imshow(img0/4+192,interpolation='nearest')
317 |       #plot(corr[:,0],corr[:,1],'+',ms=10,mew=2)
318 |       for m in set_max:
319 |         plot(corr[corr[:,5]==m,0],corr[corr[:,5]==m,1],'+',ms=10,mew=2,color=colors[m],scalex=0,scaley=0)
320 |       noticks()
321 |       
322 |       ax4 = subplot(layouts[3])
323 |       ax4.numplot = None
324 |       imshow(img1/4+192,interpolation='nearest')
325 |       for m in set_max:
326 |         plot(corr[corr[:,5]==m,2],corr[corr[:,5]==m,3],'+',ms=10,mew=2,color=colors[m],scalex=0,scaley=0)
327 |       noticks()
328 |     
329 |     subplots_adjust(left=0.03, bottom=0.03, right=1, top=1, wspace=0.02, hspace=0.02)
330 |     
331 |     fig = get_current_fig_manager().canvas.figure
332 |     cid_move = fig.canvas.mpl_connect('motion_notify_event',motion_notify_callback)
333 |     print "Move your mouse on the top images..."
334 |     pdb.set_trace()
335 |     fig.canvas.draw()
336 |     fig.canvas.mpl_disconnect(cid_move)
337 | 
338 | 
def viz_mem(net):
    """Plot and print an estimate of the memory held by a network's blobs.

    `net` must expose `activation_blobs` (a sequence of (name, blob) pairs,
    blob possibly None) and `layers` (a sequence of (name, layer) pairs whose
    layers provide `blobs()`).  Blobs are identified by the address returned
    by `cpu_data()`, so that an activation blob sharing its data with an
    earlier one is reported as "duplicated" instead of being counted twice.
    Sizes assume 4 bytes per element.  The function ends in pdb.set_trace()
    so the plot stays on screen.
    """
    pos = arange(len(net.activation_blobs))
    width = 0.9/2
    from collections import OrderedDict
    blob_sizes = OrderedDict()
    hash_blob = lambda b: b.cpu_data().__long__()
    blob_size = lambda b: int(b.count())*4 # sizeof(float) (diff is never used)
    
    # activation blobs: real size the first time an address is seen,
    # "fake" size for every later blob sharing that address
    ab_sizes, ab_fakes = [], []
    for n,b in net.activation_blobs:
      if b is None: 
        ab_sizes.append(0)
        ab_fakes.append(0)
        continue
      h = hash_blob(b)
      size = blob_size(b)
      if h not in blob_sizes:
        blob_sizes[h] = size
        ab_sizes.append(size)
        ab_fakes.append(0)
      else:
        ab_sizes.append(0)
        ab_fakes.append(size)
    
    # layer blobs; the leading 0 lines the lists up with the input blob,
    # which has no producing layer
    w_sizes, w_fakes = [0],[0]
    for n,l in net.layers:
      total = fake = 0
      for i in range(len(l.blobs())):
        b = l.blobs()[i]
        h = hash_blob(b)
        size = blob_size(b)
        total += size
        # NOTE(review): new addresses are never registered here, so only
        # layer blobs aliasing an activation blob are flagged -- confirm
        # whether an `else:` registering the blob was intended.
        if h in blob_sizes:
          fake += size
          blob_sizes[h] = size
      w_sizes.append(total)
      w_fakes.append(fake)
    
    try:
      barh(pos, ab_sizes, width, color='r', label="Activation blobs")
      barh(pos, ab_fakes, width, color='pink', label="Duplicated (inplace) activation blobs")
      barh(pos-0.5, w_sizes, width, color='b', label="Layer's blobs")
      barh(pos-0.5, w_fakes, width, color=(0.5,0.5,1), label="Duplicated (inplace) layer's blobs")
      
      yticks(pos+0.5+width/2, ['[%d] %s'%(i,n) for i,(n,l) in enumerate(net.layers)])
      legend(loc='upper right')
    except Exception:
      # The plot is best-effort, but KeyboardInterrupt/SystemExit must still
      # propagate, hence no bare `except:`.
      print("error with matplotlib display")
    
    total = sum(ab_sizes) + sum(w_sizes)
    print("/!\\ WARNING: this estimation is optimistic")
    print("              (it doesn't count layer's hidden blobs)")
    print('total size = %dB (%.3f GB)' % (total, total/1.e9))
    pdb.set_trace()
393 | 
394 | 
395 | ########################################################
396 | # Main 
397 | 
def get_patch_size( base_psize=4, downsize2=False, truedownsize2=False, **kwargs):
    """Return the patch size: `base_psize` doubled once for each of the
    `downsize2` / `truedownsize2` flags that is set.  Extra keyword
    arguments are accepted and ignored."""
    doublings = downsize2 + truedownsize2
    scale = 2**doublings
    return base_psize*scale
401 | 
# One level of the matching pyramid, as an immutable record.
PyrLevel = namedtuple('PyrLevel', [
    'f', 'psize', 'grid', 'norms', 'assign',
    'res_map', 'trueshape', 'offsets', 'children',
])
404 | 
405 | 
406 | ########################################################
407 | # argument parsing / parameters 
408 | 
409 | 
def preprocess_images(img0, img1, args):
  """Crop both images to their top-left `args.crop` = (W, H) window.

  When `args.crop` is empty or None the images are returned untouched.
  """
  if not args.crop:
    return img0, img1
  
  W,H = args.crop
  cropped0 = img0[:H,:W]
  cropped1 = img1[:H,:W]
  return cropped0, cropped1
417 | 
418 | 
def output_file( corres, outfile, form_type=True):
  """Write correspondences to `outfile`, one per line.

  corres    : iterable of 6-item rows (x1, y1, x2, y2, score, index).
  outfile   : object with a write() method; it is neither flushed nor
              closed here, that is left to the caller.
  form_type : True writes "x1 y1 x2 y2 score index", False writes only
              "x1 y1 x2 y2".
  """
  # The former `from signal import signal, SIGPIPE, SIG_DFL` was never used
  # and made the function fail on platforms that do not define SIGPIPE.
  if form_type:
    for x1, y1, x2, y2, score, index in corres:
      outfile.write("%d %d %d %d %g %d\n" % (x1, y1, x2, y2, score, index))
  else:
    for x1, y1, x2, y2, score, index in corres:
      outfile.write("%d %d %d %d\n" % (x1, y1, x2, y2))
429 | 
430 | 
431 | 
432 | 
433 | 
434 | 
435 | 
436 | 
437 | 
438 | 
439 | 
440 | 
441 | 
442 | 
443 | 
444 | 
445 | 
446 | 


--------------------------------------------------------------------------------
/deep_matching/my_im2col.cpp:
--------------------------------------------------------------------------------
  1 | // Copyright 2013 Yangqing Jia
  2 | 
  3 | 
  4 | namespace caffe {
  5 | 
  6 | template <typename Dtype>
  7 | void my_im2col_cpu(const Dtype* data_im, const int channels,
  8 |     const int height, const int width, const int ksize, const int pad, 
  9 |     const int stride, Dtype* data_col) {
 10 |   int height_col = (height + 2 * pad - ksize) / stride + 1;
 11 |   int width_col = (width + 2 * pad - ksize) / stride + 1;
 12 |   int channels_col = channels * ksize * ksize;
 13 |   for (int c = 0; c < channels_col; ++c) {
 14 |     int w_offset = c % ksize;
 15 |     int h_offset = (c / ksize) % ksize;
 16 |     int c_im = c / ksize / ksize;
 17 |     for (int h = 0; h < height_col; ++h) {
 18 |       for (int w = 0; w < width_col; ++w) {
 19 |         int h_pad = h * stride - pad + h_offset;
 20 |         int w_pad = w * stride - pad + w_offset;
 21 |         if (h_pad >= 0 && h_pad < height && w_pad >= 0 && w_pad < width)
 22 |           data_col[(c * height_col + h) * width_col + w] =
 23 |             data_im[(c_im * height + h_pad) * width + w_pad];
 24 |         else
 25 |           data_col[(c * height_col + h) * width_col + w] = 0;
 26 |       }
 27 |     }
 28 |   }
 29 | }
 30 | 
 31 | template <typename Dtype>
 32 | void my_im2col_cpu_T(const Dtype* data_im, const int channels,
 33 |     const int height, const int width, const int ksize, const int pad, 
 34 |     const int stride, Dtype* data_col) {
 35 |   int height_col = (height + 2 * pad - ksize) / stride + 1;
 36 |   int width_col = (width + 2 * pad - ksize) / stride + 1;
 37 |   int channels_col = channels * ksize * ksize;
 38 |   for (int c = 0; c < channels_col; ++c) {
 39 |     int w_offset = c % ksize;
 40 |     int h_offset = (c / ksize) % ksize;
 41 |     int c_im = c / ksize / ksize;
 42 |     for (int h = 0; h < height_col; ++h) {
 43 |       for (int w = 0; w < width_col; ++w) {
 44 |         int h_pad = h * stride - pad + h_offset;
 45 |         int w_pad = w * stride - pad + w_offset;
 46 |         if (h_pad >= 0 && h_pad < height && w_pad >= 0 && w_pad < width)
 47 |           data_col[c + channels_col * (w + width_col * h)] =
 48 |             data_im[(c_im * height + h_pad) * width + w_pad];
 49 |         else
 50 |           data_col[c + channels_col * (w + width_col * h)] = 0;
 51 |       }
 52 |     }
 53 |   }
 54 | }
 55 | 
 56 | 
 57 | // Explicit instantiation
 58 | template void my_im2col_cpu<float>(const float* data_im, const int channels,
 59 |     const int height, const int width, const int ksize, const int pad,
 60 |     const int stride, float* data_col);
 61 | template void my_im2col_cpu<double>(const double* data_im, const int channels,
 62 |     const int height, const int width, const int ksize, const int pad,
 63 |     const int stride, double* data_col);
 64 | template void my_im2col_cpu_T<float>(const float* data_im, const int channels,
 65 |     const int height, const int width, const int ksize, const int pad,
 66 |     const int stride, float* data_col);
 67 | template void my_im2col_cpu_T<double>(const double* data_im, const int channels,
 68 |     const int height, const int width, const int ksize, const int pad,
 69 |     const int stride, double* data_col);
 70 | 
 71 | 
 72 | }  // namespace caffe
 73 | 
 74 | 
 75 | 
 76 | 
 77 | 
 78 | 
 79 | 
 80 | 
 81 | 
 82 | 
 83 | 
 84 | 
 85 | 
 86 | 
 87 | 
 88 | 
 89 | 
 90 | 
 91 | 
 92 | 
 93 | 
 94 | 
 95 | 
 96 | 
 97 | 
 98 | 
 99 | 
100 | 
101 | 
102 | 
103 | 
104 | 
105 | 
106 | 
107 | 


--------------------------------------------------------------------------------
/deep_matching/my_im2col.cu:
--------------------------------------------------------------------------------
  1 | // Copyright 2013 Yangqing Jia
  2 | 
  3 | //#include <algorithm>
  4 | //#include <cmath>
  5 | //#include <cstdlib>
  6 | //#include <cstring>
  7 | 
  8 | #include "caffe/common.hpp"
  9 | #include "my_im2col.hpp"
 10 | 
 11 | namespace caffe {
 12 | 
 13 | template <typename Dtype>
 14 | __global__ void my_im2col_gpu_kernel(const int n, const Dtype* data_im,
 15 |     const int height, const int width, const int ksize, const int pad,
 16 |     const int stride, const int height_col, const int width_col,
 17 |     Dtype* data_col) {
 18 |   CUDA_KERNEL_LOOP(_index, n) {
 19 |     int index = _index;
 20 |     int w_out = index % width_col;
 21 |     index /= width_col;
 22 |     int h_out = index % height_col;
 23 |     int channel_in = index / height_col;
 24 |     int channel_out = channel_in * ksize * ksize;
 25 |     int h_in = h_out * stride - pad;
 26 |     int w_in = w_out * stride - pad;
 27 |     data_col += (channel_out * height_col + h_out) * width_col + w_out;
 28 |     data_im += (channel_in * height + h_in) * width + w_in;
 29 |     for (int i = 0; i < ksize; ++i) {
 30 |       for (int j = 0; j < ksize; ++j) {
 31 |         int h = h_in + i;
 32 |         int w = w_in + j;
 33 |         *data_col = (h >= 0 && w >= 0 && w < width && h < height) ?
 34 |             data_im[i * width + j] : 0;
 35 |         data_col += height_col * width_col;
 36 |       }
 37 |     }
 38 |   }
 39 | }
 40 | 
 41 | template <typename Dtype>
 42 | void my_im2col_gpu(const Dtype* data_im, const int channels,
 43 |     const int height, const int width, const int ksize, const int pad,
 44 |     const int stride, Dtype* data_col) {
 45 |   // We are going to launch channels * height_col * width_col kernels, each
 46 |   // kernel responsible for copying a single-channel grid.
 47 |   int height_col = (height + 2 * pad - ksize) / stride + 1;
 48 |   int width_col = (width + 2 * pad - ksize) / stride + 1;
 49 |   int num_kernels = channels * height_col * width_col;
 50 |   // NOLINT_NEXT_LINE(whitespace/operators)
 51 |   my_im2col_gpu_kernel<Dtype><<<CAFFE_GET_BLOCKS(num_kernels),
 52 |                              CAFFE_CUDA_NUM_THREADS>>>(
 53 |       num_kernels, data_im, height, width, ksize, pad, stride, height_col,
 54 |       width_col, data_col);
 55 |   CUDA_POST_KERNEL_CHECK;
 56 | }
 57 | 
 58 | 
 59 | // Explicit instantiation
 60 | template void my_im2col_gpu<float>(const float* data_im, const int channels,
 61 |     const int height, const int width, const int ksize, const int pad,
 62 |     const int stride, float* data_col);
 63 | template void my_im2col_gpu<double>(const double* data_im, const int channels,
 64 |     const int height, const int width, const int ksize, const int pad,
 65 |     const int stride, double* data_col);
 66 | 
 67 | 
 68 | template <typename Dtype>
 69 | __global__ void my_im2col_gpu_kernel_T(const int n, const Dtype* data_im,
 70 |     const int channels, const int height, const int width, const int ksize, const int pad,
 71 |     const int stride, const int height_col, const int width_col,
 72 |     Dtype* data_col) {
 73 |   CUDA_KERNEL_LOOP(_index, n) {
 74 |     int index = _index;
 75 |     int w_out = index % width_col;
 76 |     index /= width_col;
 77 |     int h_out = index % height_col;
 78 |     int channel_in = index / height_col;
 79 |     int channel_out = channel_in * ksize * ksize;
 80 |     int channels_col = channels * ksize * ksize;
 81 |     int h_in = h_out * stride - pad;
 82 |     int w_in = w_out * stride - pad;
 83 |     data_col += channel_out + channels_col * (w_out + width_col * h_out);
 84 |     data_im += (channel_in * height + h_in) * width + w_in;
 85 |     for (int i = 0; i < ksize; ++i) {
 86 |       for (int j = 0; j < ksize; ++j) {
 87 |         int h = h_in + i;
 88 |         int w = w_in + j;
 89 |         *data_col = (h >= 0 && w >= 0 && w < width && h < height) ?
 90 |             data_im[i * width + j] : 0;
 91 |         data_col++;
 92 |       }
 93 |     }
 94 |   }
 95 | }
 96 | 
 97 | template <typename Dtype>
 98 | void my_im2col_gpu_T(const Dtype* data_im, const int channels,
 99 |     const int height, const int width, const int ksize, const int pad,
100 |     const int stride, Dtype* data_col) {
101 |   // We are going to launch channels * height_col * width_col kernels, each
102 |   // kernel responsible for copying a single-channel grid.
103 |   int height_col = (height + 2 * pad - ksize) / stride + 1;
104 |   int width_col = (width + 2 * pad - ksize) / stride + 1;
105 |   int num_kernels = channels * height_col * width_col;
106 |   // NOLINT_NEXT_LINE(whitespace/operators)
107 |   my_im2col_gpu_kernel_T<Dtype><<<CAFFE_GET_BLOCKS(num_kernels),
108 |                              CAFFE_CUDA_NUM_THREADS>>>(
109 |       num_kernels, data_im, channels, height, width, ksize, pad, stride, height_col,
110 |       width_col, data_col);
111 |   CUDA_POST_KERNEL_CHECK;
112 | }
113 | 
114 | 
115 | // Explicit instantiation
116 | template void my_im2col_gpu_T<float>(const float* data_im, const int channels,
117 |     const int height, const int width, const int ksize, const int pad,
118 |     const int stride, float* data_col);
119 | template void my_im2col_gpu_T<double>(const double* data_im, const int channels,
120 |     const int height, const int width, const int ksize, const int pad,
121 |     const int stride, double* data_col);
122 | 
123 | }  // namespace caffe
124 | 


--------------------------------------------------------------------------------
/deep_matching/my_im2col.hpp:
--------------------------------------------------------------------------------
 1 | #ifndef __MY_COL2IM_H__
 2 | #define __MY_COL2IM_H__
 3 | 
 4 | /* just some wrappers to map to the "old" versions of im2col functions in caffe
 5 | */
 6 | 
 7 | namespace caffe {
 8 | 
 9 | template <typename Dtype>
10 | void my_im2col_cpu(const Dtype* data_im, const int channels,
11 |     const int height, const int width, const int ksize, const int pad, 
12 |     const int stride, Dtype* data_col);
13 | 
14 | // Transposed version (output = channels, num, height, width)
15 | template <typename Dtype>
16 | void my_im2col_cpu_T(const Dtype* data_im, const int channels,
17 |     const int height, const int width, const int ksize, const int pad, 
18 |     const int stride, Dtype* data_col);
19 | 
20 | 
21 | template <typename Dtype>
22 | void my_im2col_gpu(const Dtype* data_im, const int channels,
23 |     const int height, const int width, const int ksize, const int pad, 
24 |     const int stride, Dtype* data_col);
25 | 
26 | // Transposed version (output = channels, num, height, width)
27 | template <typename Dtype>
28 | void my_im2col_gpu_T(const Dtype* data_im, const int channels,
29 |     const int height, const int width, const int ksize, const int pad, 
30 |     const int stride, Dtype* data_col);
31 | 
32 | }  // namespace caffe
33 | 
34 | #endif
35 | 
36 | 
37 | 
38 | 
39 | 
40 | 
41 | 
42 | 
43 | 
44 | 
45 | 
46 | 
47 | 
48 | 
49 | 
50 | 
51 | 
52 | 
53 | 
54 | 
55 | 
56 | 
57 | 
58 | 


--------------------------------------------------------------------------------
/deep_matching/net.py:
--------------------------------------------------------------------------------
  1 | """
  2 | Copyright (C) 2015 Jerome Revaud
  3 | 
  4 | This program is free software: you can redistribute it and/or modify
  5 | it under the terms of the GNU General Public License as published by
  6 | the Free Software Foundation, either version 3 of the License, or
  7 | (at your option) any later version.
  8 | 
  9 | This program is distributed in the hope that it will be useful,
 10 | but WITHOUT ANY WARRANTY; without even the implied warranty of
 11 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 12 | GNU General Public License for more details.
 13 | 
 14 | You should have received a copy of the GNU General Public License
 15 | along with this program.  If not, see <http://www.gnu.org/licenses/>
 16 | """
 17 | import pdb
 18 | import numpy as np
 19 | import gpudm
 20 | 
 21 | ###########################################
 22 | # basic functions for blob <-> numpy transfer
 23 | 
 24 | def set_GPU(GPU=0):
 25 |   ''' if GPU == -1 => use CPU
 26 |       otherwise GPU device number
 27 |   '''
 28 |   if GPU>=0:
 29 |     gpudm.Caffe_set_mode(gpudm.Caffe.GPU)
 30 |     gpudm.Caffe.SetDevice(GPU)
 31 |   else:
 32 |     gpudm.Caffe_set_mode(gpudm.Caffe.CPU)
 33 | 
 34 | 
 35 | def blob_shape(blob):
 36 |   return (blob.num(), blob.channels(), blob.height(), blob.width())
 37 | 
 38 | def set_blob_to(blob, a):
 39 |   assert a.shape == blob_shape(blob), pdb.set_trace()
 40 |   assert a.flags.c_contiguous
 41 |   b = gpudm.floats_to_numpy_ref(blob.mutable_cpu_data(), a.size)
 42 |   b.ravel()[:] = a.ravel()[:]
 43 | 
 44 | 
 45 | 
 46 | ###########################################
 47 | # Deep Network
 48 | 
 49 | class Net (object):
 50 |   """ a neural net. Simplification of the Net in C++ version """
 51 |   
 52 |   def __init__(self, input_blob):
 53 |     if type(input_blob) == tuple:
 54 |       # just a size
 55 |       size = input_blob
 56 |       input_blob = gpudm.BlobFloat()
 57 |       input_blob.Reshape(size[0], size[1], size[2], size[3])
 58 |     self.input_blob = input_blob
 59 |     self.activation_blobs = [("data", input_blob)]
 60 |     self.layers = []
 61 | 
 62 |   @staticmethod
 63 |   def new_BlobPtrVector(*v):
 64 |     bv = gpudm.BlobPtrVector()
 65 |     for x in v:
 66 |       if x != None:
 67 |         bv.push_back(x)
 68 |     return bv
 69 | 
 70 |   @staticmethod
 71 |   def set_filler_params(dest, src):
 72 |     for k, v in src.items():
 73 |       getattr(dest, "set_" + k)(v)
 74 | 
 75 | 
 76 |   ####################################################3
 77 |   # Training and testing 
 78 | 
 79 |   def forward(self, start=0, end=0):
 80 |     end = end or len(self.layers)
 81 |     for i, (layer_name, layer) in enumerate(self.layers[start:end],start):
 82 |       bottom = self.activation_blobs[i][1]
 83 |       top = self.activation_blobs[i + 1][1]
 84 |       if top != None: 
 85 |         layer.Forward(self.new_BlobPtrVector(bottom),
 86 |                       self.new_BlobPtrVector(top))
 87 |       else:
 88 |         # last layer for train
 89 |         layer.Forward(self.new_BlobPtrVector(bottom, self.labels_blob),
 90 |                       self.new_BlobPtrVector())
 91 | 
 92 |   def test(self, input_data = None):
 93 |     if input_data != None:
 94 |       self.input_blob.mutable_to_numpy_ref()[:] = input_data
 95 |     self.forward()
 96 |     res = self.activation_blobs[-1][1]
 97 |     return res.to_numpy_ref()
 98 | 
 99 | 
100 |   ####################################################3
101 |   # I/O     
102 | 
103 |   def set_parameters(self, params, verbose=0, create_blobs=False):
104 |     for layer_name, layer in self.layers:
105 |       if layer_name in params:
106 |         layer_blobs = layer.blobs()
107 |         if create_blobs and len(layer_blobs)==0:  
108 |           for i, npdata in enumerate(params[layer_name]):
109 |             assert npdata.ndim == 4, 'error: paramter is not a blob'
110 |             blob = gpudm.BlobFloat(*npdata.shape)
111 |             blob.mutable_to_numpy_ref()[:] = npdata
112 |             layer_blobs.push_back(blob)
113 |         elif len(layer_blobs) > 0: 
114 |           assert len(params[layer_name]) == len(layer_blobs), "expected %d blobs for layer %s, received %d" % (len(layer_blobs), layer_name, len(params[layer_name]))
115 |           for i, npdata in enumerate(params[layer_name]):
116 |             #print 'Setting param #%d in layer %s' % (i, layer_name)
117 |             if type(npdata) == np.ndarray:
118 |               blob = layer_blobs[i].mutable_to_numpy_ref()
119 |               assert blob.shape == npdata.shape, "Error: parameters shapes differ: blob=%s vs weights=%s" %(
120 |                       str(blob.shape), str(npdata.shape))
121 |               blob[:] = npdata
122 |             else:
123 |               set_blob_to(layer_blobs[i], npdata)
124 |       elif verbose:
125 |         print "Layer %s not found in parameters"%(layer_name)
126 | 
127 |   def get_parameters(self, diff=False):
128 |     params = {}
129 |     for layer_name, layer in self.layers:
130 |       layer_params = params[layer_name] = []
131 |       if diff:  diff_params = params[layer_name+'_diff'] = []
132 |       for blob in layer.blobs(): 
133 |         layer_params.append(blob.to_numpy_ref().copy())
134 |         if diff:  diff_params.append(blob.diff_to_numpy_ref().copy())
135 |     return params
136 | 
137 |   def describe(self):
138 |     print "input:", self.input_blob.get_shape()
139 |     for i, (layer_name, layer) in enumerate(self.layers):
140 |       print "layer", layer_name, layer.__class__
141 |       print "  parameters:"
142 |       for j, blob in enumerate(layer.blobs()):
143 |         print "    ", blob.get_shape()
144 |       bottom_name, bottom = self.activation_blobs[i]
145 |       top_name, top = self.activation_blobs[i + 1]
146 |       print "  in:", bottom_name, bottom.get_shape()
147 |       print "  out:", top_name, top.get_shape()
148 | 
149 | 
150 |   ####################################################3
151 |   # Build layers
152 | 
153 |   def check_name(self, name):
154 |     used = set(zip(*([(None,None)]+self.layers))[0])
155 |     assert name not in used, 'error: layer name already used: '+name
156 | 
157 |   def get_layer(self, name, ret_index=False, list=False, layers=None, re=False):
158 |     rname = name if re else name.replace('*','.*')
159 |     import re
160 |     res = []
161 |     for i,(n,l) in enumerate(layers or self.layers):
162 |       if re.match(rname,n):
163 |         r = i if ret_index else l
164 |         if list:
165 |           res.append(r)
166 |         else:
167 |           return r
168 |     assert list or res, "error: no layer matching '%s' found"%name
169 |     return res
170 | 
171 |   def get_activation(self, name, **kwargs):
172 |     return self.get_layer(name, layers=self.activation_blobs, **kwargs)
173 | 
174 |   def add_layer(self, name, layer_class, args, inplace=False): 
175 |     self.check_name(name)
176 |     # single output
177 |     if inplace:
178 |       top_blob = self.activation_blobs[-1][1]
179 |       if hasattr(top_blob,'ShareData'):
180 |         blob = gpudm.BlobFloat(*blob_shape(top_blob))
181 |         blob.ShareData(top_blob)
182 |         blob.ShareDiff(top_blob)
183 |         top_blob = blob
184 |     else:
185 |       top_blob = gpudm.BlobFloat()
186 |     if type(args) is not tuple: args = (args,)
187 |     
188 |     layer = layer_class(*args)
189 |     self.layers.append((name, layer))
190 |     
191 |     layer.SetUp(self.new_BlobPtrVector(self.activation_blobs[-1][1]), self.new_BlobPtrVector(top_blob))
192 |     
193 |     self.activation_blobs.append((name, top_blob))    
194 | 
195 |   def add_convolution(self, name,                      
196 |                       kernelsize,
197 |                       num_output,
198 |                       stride = 1, 
199 |                       group = 1,
200 |                       pad = 0,
201 |                       biasterm = True,
202 |                       weight_filler = {},
203 |                       bias_filler = {}, 
204 |                       weights=None):
205 |     cp = gpudm.ConvolutionParameter()
206 |     cp.set_kernel_h(kernelsize)
207 |     cp.set_kernel_w(kernelsize)
208 |     cp.set_num_output(num_output)
209 |     assert stride>0, 'error: stride is 0 for '+name
210 |     cp.set_stride_h(stride )
211 |     cp.set_stride_w(stride )
212 |     cp.set_group(group)
213 |     cp.set_pad_h(pad)
214 |     cp.set_pad_w(pad)
215 |     cp.set_bias_term(biasterm)
216 |     self.set_filler_params(cp.mutable_weight_filler(), weight_filler)
217 |     self.set_filler_params(cp.mutable_bias_filler(), bias_filler)
218 |     lp = gpudm.LayerParameter()
219 |     lp.set_allocated_convolution_param(cp)
220 |     cp.this.disown()  # otherwise it will be freed 2 times
221 |     
222 |     self.add_layer(name, gpudm.ConvolutionLayerFloat, lp)
223 |     if weights: self.set_parameters({name:weights}, verbose=0)
224 | 
225 |   def add_border_rectification(self, name, 
226 |                           kernelsize, 
227 |                           weights,
228 |                           inplace = True ):
229 |     args = (gpudm.LayerParameter(), kernelsize)
230 |     self.add_layer(name, gpudm.BorderRectifyLayerFloat, args, inplace=inplace)
231 |     self.set_parameters({name:weights}, verbose=0) # computed based on a convolution mask
232 | 
233 |   def add_relu(self, name, inplace = True ):
234 |     lp = gpudm.LayerParameter()
235 |     self.add_layer(name, gpudm.ReLULayerFloat, lp, inplace=inplace)
236 | 
237 |   def add_rectified_sigmoid(self, name):
238 |     lp = gpudm.LayerParameter()
239 |     self.add_layer(name, gpudm.RectifiedSigmoidLayerFloat, lp)
240 | 
241 |   def add_pixel_norm(self, name, norm=1.0, inplace=True):
242 |     lp = gpudm.LayerParameter()
243 |     self.add_layer(name, gpudm.PixelNormLayerFloat, (lp, norm), inplace=inplace)
244 | 
245 |   def add_reshape_layer(self, name, dims, inplace=True):
246 |     shape = gpudm.BlobShape()
247 |     for d in dims:
248 |       shape.add_dim(d)
249 |     rp = gpudm.ReshapeParameter()
250 |     rp.set_allocated_shape(shape)
251 |     shape.this.disown()  # otherwise it will be freed 2 times
252 |     lp = gpudm.LayerParameter()
253 |     lp.set_allocated_reshape_param(rp)
254 |     rp.this.disown()  # otherwise it will be freed 2 times
255 |     self.add_layer(name, gpudm.ReshapeLayerFloat, lp, inplace=inplace)
256 | 
257 |   def add_patch_correlation(self, name, kernelsize = 1, 
258 |                                   pad = None,
259 |                                   nghrad = -1,
260 |                                   normalize_borders = 'dynamic' ):
261 |     if nghrad>=0 and pad is None: pad = nghrad  # smart default
262 |     lp = gpudm.LayerParameter()
263 |     norm_modes = {'dynamic':'d', 'd':'d', 'static':'s', 's':'s', 'none':0}
264 |     self.add_layer(name, gpudm.PatchConvolutionLayerFloat, 
265 |                     (lp, kernelsize, pad, nghrad, norm_modes[normalize_borders]) )
266 | 
267 |   def add_power_law(self, name, power, scale=1, shift=0, inplace=False):
268 |     pp = gpudm.PowerParameter()
269 |     pp.set_power(power)
270 |     pp.set_scale(scale)
271 |     pp.set_shift(shift)
272 |     lp = gpudm.LayerParameter()
273 |     lp.set_allocated_power_param(pp)
274 |     pp.this.disown()  # otherwise it will be freed 2 times
275 |     self.add_layer(name, gpudm.PowerLayerFloat, lp, inplace=inplace)
276 | 
  # Pooling methods: class-level aliases of the gpudm PoolingParameter
  # constants.  MAX is the default value of `add_pooling`'s `pool` argument.
  MAX = gpudm.PoolingParameter_PoolMethod_MAX
  AVE = gpudm.PoolingParameter_PoolMethod_AVE
  STOCHASTIC = gpudm.PoolingParameter_PoolMethod_STOCHASTIC
281 |   
282 |   def add_pooling(self, name,
283 |                   kernelsize,
284 |                   stride = 1,
285 |                   pool = MAX,
286 |                   pad = 0):
287 |     if kernelsize=='full': 
288 |       last_blob = blob_shape(self.activation_blobs[-1][1])
289 |       assert last_blob[2] == last_blob[3]
290 |       kernelsize = last_blob[-1]
291 |     pp = gpudm.PoolingParameter()
292 |     pp.set_kernel_h(kernelsize)
293 |     pp.set_kernel_w(kernelsize)
294 |     pp.set_stride_h(stride)
295 |     pp.set_stride_w(stride)
296 |     pp.set_pad_h(pad)
297 |     pp.set_pad_w(pad)
298 |     pp.set_pool(pool)
299 |     lp = gpudm.LayerParameter()
300 |     lp.set_allocated_pooling_param(pp)
301 |     pp.this.disown()  # otherwise it will be freed 2 times
302 |     self.add_layer(name, gpudm.PoolingLayerFloat, lp)
303 | 
304 |   def add_sparse_convolution(self, name, sp_pattern, 
305 |                                   use_sp_data = True,
306 |                                   kernelsize = 1, 
307 |                                   stride = 1, 
308 |                                   pad = 0,
309 |                                   biasterm = False,
310 |                                   weight_filler = {},
311 |                                   bias_filler = {}, 
312 |                                   blobs_lr=[1.0,2.0],
313 |                                   weight_decays=[1.0,1.0],
314 |                                   weights = None ):
315 |     from scipy import sparse
316 |     assert sparse.isspmatrix(sp_pattern)
317 |     num_output = sp_pattern.shape[0]  # sparsity pattern is given in input
318 |     
319 |     cp = gpudm.ConvolutionParameter()
320 |     cp.set_kernel_h(kernelsize)
321 |     cp.set_kernel_w(kernelsize)
322 |     cp.set_num_output(num_output)
323 |     assert stride>0, 'error: stride is 0 for '+name
324 |     cp.set_stride_h(stride)
325 |     cp.set_stride_w(stride)
326 |     cp.set_pad_h(pad)
327 |     cp.set_pad_w(pad)
328 |     cp.set_bias_term(biasterm)
329 |     self.set_filler_params(cp.mutable_weight_filler(), weight_filler)
330 |     self.set_filler_params(cp.mutable_bias_filler(), bias_filler)
331 |     lp = gpudm.LayerParameter()
332 |     lp.set_allocated_convolution_param(cp)
333 |     cp.this.disown()  # otherwise it will be freed 2 times
334 |     
335 |     def arrToBlob(arr): # dirty function but simpler for now
336 |         bb = gpudm.BlobFloat(1,1,1,arr.size)
337 |         bb.mutable_to_numpy_ref().view(arr.dtype)[:] = arr.ravel()
338 |         return bb
339 |     
340 |     if sparse.isspmatrix_csr(sp_pattern):
341 |       sparsity_args = (sp_pattern.nnz, 
342 |                        arrToBlob(sp_pattern.indptr), arrToBlob(sp_pattern.indices), 
343 |                        arrToBlob(sp_pattern.data) if use_sp_data else None)
344 |       self.add_layer(name, gpudm.CSR_SparseConvolutionLayerFloat, lp)
345 |     elif sparse.isspmatrix_bsr(sp_pattern):
346 |       br,bc = sp_pattern.blocksize
347 |       assert br == bc, "error: not implemented for non-square blocks"
348 |       sparsity_args = (sp_pattern.nnz/(br*bc), br,
349 |                        arrToBlob(sp_pattern.indptr), arrToBlob(sp_pattern.indices), 
350 |                        arrToBlob(sp_pattern.data) if use_sp_data else None)
351 |       self.add_layer(name, gpudm.BSR_SparseConvolutionLayerFloat, lp)
352 |     else:
353 |       assert False, "This sparse matrix type is not implemented"
354 |     
355 |     # define sparsity pattern now
356 |     self.layers[-1][1].SetSparsityPattern( *sparsity_args )
357 |     
358 |     self.layers[-1][1].blobs_lr = blobs_lr
359 |     self.layers[-1][1].weight_decays = weight_decays
360 |     if weights: self.set_parameters({name:weights}, verbose=0)
361 | 
362 |   def add_dm_argmax(self, name, shape, nlevels, nghrad, tag='pow%d', step=4):
363 |     lp = gpudm.LayerParameter()
364 |     self.add_layer(name, gpudm.DeepMatchingArgMaxLayerFloat, 
365 |                     (lp, shape[0], shape[1], step, nghrad) )
366 |     
367 |     # append activation blobs of previous layers
368 |     blobs = self.layers[-1][1].blobs()
369 |     for layer_name,activation_blob in self.activation_blobs:
370 |       if layer_name ==  tag%len(blobs):
371 |         blobs.push_back(activation_blob)
372 |     assert blobs.size() == nlevels
373 | 
374 | 
375 | 
376 | 
377 | 
378 | 
379 | 
380 | 
381 | 
382 | 
383 | 
384 | 
385 | 
386 | 
387 | 
388 | 
389 | 


--------------------------------------------------------------------------------
/deep_matching/numpy_image.h:
--------------------------------------------------------------------------------
  1 | /*
  2 | Copyright (C) 2015 Jerome Revaud
  3 | 
  4 | This program is free software: you can redistribute it and/or modify
  5 | it under the terms of the GNU General Public License as published by
  6 | the Free Software Foundation, either version 3 of the License, or
  7 | (at your option) any later version.
  8 | 
  9 | This program is distributed in the hope that it will be useful,
 10 | but WITHOUT ANY WARRANTY; without even the implied warranty of
 11 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 12 | GNU General Public License for more details.
 13 | 
 14 | You should have received a copy of the GNU General Public License
 15 | along with this program.  If not, see <http://www.gnu.org/licenses/>
 16 | */
 17 | #ifndef ___numpy_image___
 18 | #define ___numpy_image___
 19 | 
 20 | /************************
 21 | * 1D Array
 22 | */
 23 | 
 24 | #define DEFINE_ARRAY(type)  \
 25 |     typedef struct {  \
 26 |       type* pixels; \
 27 |       int tx; \
 28 |     } type##_array;
 29 | 
 30 | DEFINE_ARRAY(int)
 31 | DEFINE_ARRAY(float)
 32 | 
 33 | #define ASSERT_ARRAY_ZEROS(arr) {int size=arr->tx; assert((arr->pixels[0]==0 && arr->pixels[size/2]==0 && arr->pixels[size-1]==0) || !"error: matrix " #arr "is supposed to be zeros");}
 34 | #define ARRAY_SIZE(array)   (array->tx)
 35 | #define ASSERT_SAME_ARRAY_SIZE(arr1,arr2) assert( (arr1)->tx == (arr2)->tx )
 36 | 
 37 | /************************
 38 | * 2D Image
 39 | */
 40 | 
 41 | #define DEFINE_IMG(type)    \
 42 |     typedef struct { \
 43 |       type* pixels;\
 44 |       int tx,ty;\
 45 |     } type##_image;
 46 | 
 47 | DEFINE_IMG(int)
 48 | DEFINE_IMG(float)
 49 | 
 50 | #define ASSERT_SAME_SIZE  ASSERT_SAME_IMG_SIZE
 51 | #define ASSERT_IMG_SIZE  ASSERT_SAME_IMG_SIZE
 52 | #define ASSERT_SAME_IMG_SIZE(im1,im2)  if(im1 && im2)  assert(im1->tx==im2->tx && im1->ty==im2->ty);
 53 | 
 54 | #define ASSERT_IMAGE_ZEROS
 55 | #define ASSERT_IMG_ZEROS(img) {int size=img->tx*img->ty; assert((img->pixels[0]==0 && img->pixels[size/2]==0 && img->pixels[size-1]==0) || !"error: matrix " #img "is supposed to be zeros");}
 56 | #define IMG_SIZE(cube) ((cube)->tx*(cube)->ty)
 57 | 
 58 | 
 59 | /************************
 60 | * 3D Image = Cube (Z coordinates are contiguous)
 61 | */
 62 | 
 63 | #define DEFINE_CUBE(type) \
 64 |     typedef struct {  \
 65 |       type* pixels;  \
 66 |       int tx,ty,tz;  \
 67 |     } type##_cube;
 68 | 
 69 | DEFINE_CUBE(int)
 70 | DEFINE_CUBE(float)
 71 | 
 72 | #define ASSERT_SAME_CUBE_SIZE(im1, im2)   \
 73 |   if((im1) && (im2))  assert((im1)->tx==(im2)->tx && (im1)->ty==(im2)->ty && (im1)->tz==(im2)->tz);
 74 | 
 75 | #define ASSERT_CUBE_ZEROS(img) {int size=img->tx*img->ty*img->tz; assert((img->pixels[0]==0 && img->pixels[size/2]==0 && img->pixels[size-1]==0) || !"error: matrix " #img "is supposed to be zeros");}
 76 | #define CUBE_SIZE(cube) ((cube)->tx*(cube)->ty*(cube)->tz)
 77 | 
 78 | #endif
 79 | 
 80 | 
 81 | 
 82 | 
 83 | 
 84 | 
 85 | 
 86 | 
 87 | 
 88 | 
 89 | 
 90 | 
 91 | 
 92 | 
 93 | 
 94 | 
 95 | 
 96 | 
 97 | 
 98 | 
 99 | 
100 | 
101 | 
102 | 
103 | 
104 | 
105 | 
106 | 
107 | 
108 | 
109 | 
110 | 
111 | 
112 | 
113 | 


--------------------------------------------------------------------------------
/deep_matching/numpy_image.swg:
--------------------------------------------------------------------------------
  1 | // -*- c++ -*- 
  2 | /*
  3 | Copyright (C) 2015 Jerome Revaud
  4 | 
  5 | This program is free software: you can redistribute it and/or modify
  6 | it under the terms of the GNU General Public License as published by
  7 | the Free Software Foundation, either version 3 of the License, or
  8 | (at your option) any later version.
  9 | 
 10 | This program is distributed in the hope that it will be useful,
 11 | but WITHOUT ANY WARRANTY; without even the implied warranty of
 12 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 13 | GNU General Public License for more details.
 14 | 
 15 | You should have received a copy of the GNU General Public License
 16 | along with this program.  If not, see <http://www.gnu.org/licenses/>
 17 | */
 18 | 
 19 | %{
 20 | #include "numpy_image.h"
 21 | %}
 22 | 
 23 | 
 24 | %{
 25 | #define SWIG_FILE_WITH_INIT
 26 | 
 27 | #include <numpy/arrayobject.h>
 28 | 
 29 | #define CHECK_NUMPY_ARRAY(expected_npy)                                 \
 30 |   if(!a) {                                                              \
 31 |     fprintf(stderr,"error in %s(): NULL input\n",__PRETTY_FUNCTION__);             \
 32 |     return NULL;                                                        \
 33 |   }                                                                     \
 34 |   if(!PyArray_Check(a)) {                                               \
 35 |     fprintf(stderr,"error in %s(): input not numpy array\n",__PRETTY_FUNCTION__);  \
 36 |     return NULL;                                                        \
 37 |   }                                                                     \
 38 |   if(!PyArray_ISCONTIGUOUS((PyArrayObject*)a)) {                                        \
 39 |     fprintf(stderr,"error in %s(): array is not C-contiguous\n",__PRETTY_FUNCTION__);  \
 40 |     return NULL;                                                        \
 41 |   }                                                                     \
 42 |   if(PyArray_TYPE((PyArrayObject*)a)!=expected_npy) {                                   \
 43 |     fprintf(stderr,"error in %s(): input has bad type (type id %d != " #expected_npy " %d)\n",__PRETTY_FUNCTION__, \
 44 |             PyArray_TYPE((PyArrayObject*)a),expected_npy);                              \
 45 |     return NULL;                                                        \
 46 |   }
 47 | 
 48 | // append to current function result as a tuple
 49 | PyObject* APPEND_TUPLE(PyObject* o, PyObject* result) {
 50 |   PyObject *o2, *o3;
 51 |   
 52 |   if ((!result) || (result == Py_None)) {
 53 |       result = o;
 54 |   } else {
 55 |       if (!PyTuple_Check(result)) {
 56 |           o2 = result;
 57 |           result = PyTuple_New(1);
 58 |           PyTuple_SetItem(result,0,o2); // SetItem steals a ref
 59 |       }
 60 |       o3 = PyTuple_New(1);
 61 |       PyTuple_SetItem(o3,0,o); // SetItem steals a ref
 62 |       o2 = result;
 63 |       result = PySequence_Concat(o2,o3);
 64 |       Py_CLEAR(o2);
 65 |       Py_CLEAR(o3);
 66 |   }
 67 |   
 68 |   return result;
 69 | }
 70 | 
 71 | %}
 72 | 
%init %{
/* Code in this section is placed in the module initialisation function.
   import_array() has to run there before any of the PyArray_* calls made by
   the typemaps in this file: needed, else crash at runtime */
    import_array();
%}
 77 | 
 78 | 
 79 | /* ~~~~ 1D arrays ~~~~~~~~~~~~~~~ */
 80 | 
 81 | %define TYPEMAP_ARRAY_1D(type,NPY_TYPE)
 82 | %typemap(in) 
 83 |   (type ## _array* arr) 
 84 |   (type ## _array array) {
 85 |   
 86 |   PyObject* a = $input;
 87 |   if(a==Py_None)
 88 |     $1 = NULL;
 89 |   else {
 90 |     CHECK_NUMPY_ARRAY(NPY_TYPE)
 91 |     array.pixels = (type*) PyArray_DATA((PyArrayObject*)a);
 92 |     
 93 |     a = PyObject_GetAttrString($input,"shape");
 94 |     assert(PyTuple_Size(a)==1);
 95 |     array.tx = PyInt_AsLong(PyTuple_GetItem(a,0));
 96 |     Py_CLEAR(a);
 97 |     
 98 |     $1=&array;
 99 |   }
100 | }
101 | 
102 | %apply (type##_array* arr) {(type##_array* )};
103 | %enddef
104 | 
105 | TYPEMAP_ARRAY_1D(int,NPY_INT)
106 | TYPEMAP_ARRAY_1D(float,NPY_FLOAT)
107 | 
108 | 
109 | /* ~~~~ 2D images ~~~~~~~~~~~~~~~ */
110 | 
/* Input typemap for pointers to the 2D image structs of numpy_image.h.
   Py_None maps to a NULL pointer.  Any other argument must pass
   CHECK_NUMPY_ARRAY and be 2-dimensional; axis 0 becomes `ty`, axis 1
   becomes `tx`, and the struct points straight at the numpy buffer (no
   copy).  A wrong number of dimensions raises ValueError instead of
   tripping an assert(). */
%define TYPEMAP_IMAGE(type,NPY_TYPE)
%typemap(in) 
  (type ## _image* img) 
  (type ## _image image) {
  
  PyObject* a = $input;
  if(a==Py_None)
    $1 = NULL;
  else {
    CHECK_NUMPY_ARRAY(NPY_TYPE)
    if(PyArray_NDIM((PyArrayObject*)a)!=2) {
      PyErr_SetString(PyExc_ValueError,"expected a 2-dimensional numpy array");
      return NULL;
    }
    image.pixels = (type*) PyArray_DATA((PyArrayObject*)a);
    image.ty = (int) PyArray_DIM((PyArrayObject*)a,0);
    image.tx = (int) PyArray_DIM((PyArrayObject*)a,1);
    
    $1=&image;
  }
}

// special case where we want to output an image

%apply (type##_image* img) {(type##_image* )};
%enddef

TYPEMAP_IMAGE(int, NPY_INT)
TYPEMAP_IMAGE(float, NPY_FLOAT)
140 | 
141 | 
142 | /* ~~~~ Cubes = 3D images ~~~~~~~~~~~~~~~ */
143 | 
/* Input typemap for pointers to the 3D cube structs of numpy_image.h.
   Py_None maps to a NULL pointer.  Any other argument must pass
   CHECK_NUMPY_ARRAY and be 3-dimensional; axis 0 becomes `ty`, axis 1
   becomes `tx`, axis 2 becomes `tz`, and the struct points straight at the
   numpy buffer (no copy).  A wrong number of dimensions raises ValueError
   instead of tripping an assert(). */
%define TYPEMAP_CUBE_3D(type,NPY_TYPE)
%typemap(in) 
  (type ## _cube* cube) 
  (type ## _cube cube) {
  
  PyObject* a = $input;
  if(a==Py_None)
    $1 = NULL;
  else {
    CHECK_NUMPY_ARRAY(NPY_TYPE)
    if(PyArray_NDIM((PyArrayObject*)a)!=3) {
      PyErr_SetString(PyExc_ValueError,"expected a 3-dimensional numpy array");
      return NULL;
    }
    cube.pixels = (type*) PyArray_DATA((PyArrayObject*)a);
    cube.ty = (int) PyArray_DIM((PyArrayObject*)a,0);
    cube.tx = (int) PyArray_DIM((PyArrayObject*)a,1);
    cube.tz = (int) PyArray_DIM((PyArrayObject*)a,2);
    
    $1=&cube;
  }
}

// special case where we want to output something

%apply (type##_cube* cube) {(type##_cube* )};
%enddef

TYPEMAP_CUBE_3D(int, NPY_INT)
TYPEMAP_CUBE_3D(float, NPY_FLOAT)
174 | 
175 | 
176 | 
177 | 
178 | 
179 | 
180 | 
181 | 
182 | 
183 | 
184 | 
185 | 
186 | 
187 | 
188 | 
189 | 
190 | 
191 | 
192 | 
193 | 
194 | 
195 | 


--------------------------------------------------------------------------------
/optical_flow/bbc_pose.sh:
--------------------------------------------------------------------------------
 1 | #!/bin/sh
 2 | 
 3 | root_dire="/home/ddk/dongdk/dataset/bbc_pose/"
 4 | 
 5 | # im_first_path="${root_dire}labels/flo.labels/train_ims1_21w.label"
 6 | # im_second_path="${root_dire}labels/flo.labels/train_ims2_21w.label"
 7 | # bbox_file="${root_dire}labels/flo.labels/pbbox_train_plus_21w.label"
 8 | 
 9 | # im_first_path="${root_dire}labels/flo.labels/val_ims1.label"
10 | # im_second_path="${root_dire}labels/flo.labels/val_ims2.label"
11 | # bbox_file="${root_dire}labels/flo.labels/pbbox_val_plus.label"
12 | 
13 | im_first_path="${root_dire}labels/flo.labels/test_ims1.label"
14 | im_second_path="${root_dire}labels/flo.labels/test_ims2.label"
15 | bbox_file="${root_dire}labels/flo.labels/pbbox_test.label"
16 | 
17 | out_dire="${root_dire}crop.data.flo/"
18 | mkdir -p $out_dire
19 | 
20 | origin_ims_dire="${root_dire}data/"
21 | 
22 | 
23 | cmd_choice=1 # 0: normal, 1: from bbox, other: NotImplemented
24 | 
25 | frame_n=-2
26 | 
27 | dm_file="/home/ddk/dongdk/deep-matching/deep_matching/deep_matching_gpu.py"
28 | 
29 | df_file="/home/ddk/dongdk/deep-matching/deep_flow2/deepflow2"
30 | 
31 | cf_file="/home/ddk/dongdk/deep-matching/color_flow/color_flow"
32 | 
33 | rm_flo=1  # 0: not remove (default), !=0: remove
34 | 
35 | rm_mth=1  # 0: not remove (default), !=0: remove
36 | 
37 | rm_ims=1  # 0: not remove (default), !=0: remove
38 | 
39 | run_dm=0  # 0: run deep-matching, !=0: not run
40 | 
41 | is_disp=1 # 0: print nothing, !=0: display info
42 | 
43 | im_disp=0 # 0: not show, !=0: show im
44 | 
45 | sleep_time=1
46 | 
47 | # dm: "--ngh_rad 256(192,) --use_sparse"
48 | python flow_pipeline.py \
49 | 		--run_dm $run_dm \
50 | 		--rm_flo $rm_flo \
51 | 		--rm_mth $rm_mth \
52 | 		--rm_ims $rm_ims \
53 | 		--is_disp $is_disp \
54 | 		--im_disp $im_disp \
55 | 		--dm_file $dm_file \
56 | 		--df_file $df_file \
57 | 		--cf_file $cf_file \
58 | 		--frame_n $frame_n \
59 | 		--out_dire $out_dire \
60 | 		--cmd_choice $cmd_choice \
61 | 		--im_first_path $im_first_path \
62 | 		--cf_options "" \
63 | 		--df_options "-sintel " \
64 | 		--dm_options "-form_type 1 -GPU -v --downscale 1 --ngh_rad 256 " \
65 | 		--sleep_time $sleep_time \
66 | 		--bbox_file $bbox_file \
67 | 		--origin_ims_dire $origin_ims_dire \
68 | 		--im_second_path $im_second_path \
69 | 


--------------------------------------------------------------------------------
/optical_flow/flic_movies.sh:
--------------------------------------------------------------------------------
 1 | #!/bin/sh
 2 | 
 3 | root_dire="/home/ddk/dongdk/dataset/Kinect2/"
 4 | 
 5 | sub_dire="up.crop.color"
 6 | 
 7 | im_first_path="${root_dire}${sub_dire}/"
 8 | # im_first_path=" ${root_dire}${sub_dire}/00019218.png"
 9 | # im_second_path="${root_dire}${sub_dire}/00019220.png"
10 | 
11 | out_dire="${root_dire}optical.flow/${sub_dire}/"
12 | mkdir -p $out_dire
13 | 
14 | origin_ims_dire="${root_dire}up.color/"
15 | 
16 | bbox_file="${root_dire}labels/up.color2.pbbox.log"
17 | 
18 | cmd_choice=1 # 0: normal, 1: from bbox, other: NotImplemented
19 | 
20 | frame_n=-2
21 | 
22 | dm_file="/home/ddk/dongdk/deep-matching/deep_matching/deep_matching_gpu.py"
23 | 
24 | df_file="/home/ddk/dongdk/deep-matching/deep_flow2/deepflow2"
25 | 
26 | cf_file="/home/ddk/dongdk/deep-matching/color_flow/color_flow"
27 | 
28 | rm_flo=1  # 0: not remove (default), !=0: remove
29 | 
30 | rm_mth=1  # 0: not remove (default), !=0: remove
31 | 
32 | rm_ims=1  # 0: not remove (default), !=0: remove
33 | 
34 | run_dm=0  # 0: run deep-matching, !=0: not run
35 | 
36 | is_disp=1 # 0: print nothing, !=0: display info
37 | 
38 | im_disp=0 # 0: not show, !=0: show im
39 | 
40 | sleep_time=3
41 | 
42 | # dm: "--ngh_rad 256(192,) --use_sparse"
43 | python flow_pipeline.py \
44 | 		--run_dm $run_dm \
45 | 		--rm_flo $rm_flo \
46 | 		--rm_mth $rm_mth \
47 | 		--rm_ims $rm_ims \
48 | 		--is_disp $is_disp \
49 | 		--im_disp $im_disp \
50 | 		--dm_file $dm_file \
51 | 		--df_file $df_file \
52 | 		--cf_file $cf_file \
53 | 		--frame_n $frame_n \
54 | 		--out_dire $out_dire \
55 | 		--cmd_choice $cmd_choice \
56 | 		--im_first_path $im_first_path \
57 | 		--cf_options "" \
58 | 		--df_options "-sintel " \
59 | 		--dm_options "-form_type 1 -GPU -v --downscale 1 --ngh_rad 256 " \
60 | 		--sleep_time $sleep_time \
61 | 		--bbox_file $bbox_file \
62 | 		--origin_ims_dire $origin_ims_dire \
63 | 		# --im_second_path $im_second_path \
64 | 


--------------------------------------------------------------------------------
/optical_flow/one_pic.sh:
--------------------------------------------------------------------------------
 1 | #!/bin/sh
 2 | 
 3 | # im_first_path="/home/ddk/cv.life/Nutstore/graduate.project/demo.images/bp1.jpg"
 4 | # im_second_path="/home/ddk/cv.life/Nutstore/graduate.project/demo.images/bp2.jpg"
 5 | 
 6 | im_first_path="/home/ddk/dongdk/faster-rcnn/output/person.torso/demo/mude.images1/mude.16.02.20000039.jpg"
 7 | im_second_path="/home/ddk/dongdk/faster-rcnn/output/person.torso/demo/mude.images1/mude.16.02.20000425.jpg"
 8 | 
 9 | out_dire="/home/ddk/cv.life/Nutstore/graduate.project/demo.images/"
10 | mkdir -p $out_dire
11 | 
12 | cmd_choice=0 # 0: normal, 1: from bbox, other: NotImplemented
13 | 
14 | dm_file="/home/ddk/dongdk/deep-matching/deep_matching/deep_matching_gpu.py"
15 | 
16 | df_file="/home/ddk/dongdk/deep-matching/deep_flow2/deepflow2"
17 | 
18 | cf_file="/home/ddk/dongdk/deep-matching/color_flow/color_flow"
19 | 
20 | rm_flo=1  # 0: not remove (default), !=0: remove
21 | 
22 | rm_mth=1  # 0: not remove (default), !=0: remove
23 | 
24 | rm_ims=1  # 0: not remove (default), !=0: remove
25 | 
26 | run_dm=0  # 0: run deep-matching, !=0: not run
27 | 
28 | is_disp=1 # 0: print nothing, !=0: display info
29 | 
30 | im_disp=0 # 0: not show, !=0: show im
31 | 
32 | sleep_time=1
33 | 
34 | # dm: "--ngh_rad 256(192,) --use_sparse"
35 | python flow_pipeline.py \
36 | 		--run_dm $run_dm \
37 | 		--rm_flo $rm_flo \
38 | 		--rm_mth $rm_mth \
39 | 		--rm_ims $rm_ims \
40 | 		--is_disp $is_disp \
41 | 		--im_disp $im_disp \
42 | 		--dm_file $dm_file \
43 | 		--df_file $df_file \
44 | 		--cf_file $cf_file \
45 | 		--out_dire $out_dire \
46 | 		--cmd_choice $cmd_choice \
47 | 		--im_first_path $im_first_path \
48 | 		--im_second_path $im_second_path \
49 | 		--cf_options "" \
50 | 		--df_options "-sintel " \
51 | 		--dm_options "-form_type 1 -GPU -v --downscale 1 --ngh_rad 256 " \
52 | 		--sleep_time $sleep_time \
53 | 


--------------------------------------------------------------------------------
/optical_flow/origin_pipeline.py:
--------------------------------------------------------------------------------
  1 | #!/usr/bin/env python
  2 | 
  3 | # --------------------------------------------------------
  4 | # images search using k-nearest neighbors for dedupe project
  5 | # Written by Dengke Dong, 02.28.2016
  6 | # --------------------------------------------------------
  7 | 
  8 | """Compute the optical flow of a video for each image."""
  9 | 
 10 | import os
 11 | import cv2
 12 | import sys
 13 | import time
 14 | import pprint
 15 | import argparse
 16 | from math import *
 17 | 
 18 | def _parse_args():
 19 |   """
 20 |   Parse input arguments
 21 |   """
 22 |   parser = argparse.ArgumentParser(description='Compute the optical flow of a video for each image.')
 23 | 
 24 |   parser.add_argument('--im_first_path',    dest='im_first_path',  
 25 |   										help='images directory', required=True, type=str)
 26 |   parser.add_argument('--im_second_path',   dest='im_second_path', 
 27 |   										help='images directory', default=None, type=str)
 28 |   parser.add_argument('--out_dire',   dest='out_dire',	 
 29 |   										help='optical flow directory', type=str)
 30 |   parser.add_argument('--dm_file',    dest='dm_file',    
 31 |   										help="execued file of deep matching code", type=str)
 32 |   parser.add_argument('--df_file',    dest='df_file',    
 33 |   									  help="execued file of deep flow2 code",    type=str)
 34 |   parser.add_argument('--cf_file',    dest='cf_file',    
 35 |   										help="execued file of color flow code",    type=str)
 36 |   parser.add_argument('--run_dm',     dest='run_dm',     
 37 |   										help='whether to run deep matching or not', 
 38 |   										default=0, type=int)
 39 |   parser.add_argument('--dm_options', dest='dm_options', 
 40 |   										help='params options of deep matching', 
 41 |   										default=None, type=str)
 42 |   parser.add_argument('--df_options', dest='df_options', 
 43 |   										help='params options of deep flow2',    
 44 |   										default=None, type=str)
 45 |   parser.add_argument('--cf_options', dest='cf_options', 
 46 |   										help='params options of color flow',    
 47 |   										default=None, type=str)
 48 |   parser.add_argument('--frame_n',    dest='frame_n', 	 
 49 |   										help='second frame',  default=-2, type=int)
 50 |   parser.add_argument('--rm_flo',     dest='rm_flo',     
 51 |   										help='remove flo files, if need',   
 52 |   										default=0, type=int)
 53 |   parser.add_argument('--rm_mth',     dest='rm_mth',     
 54 |   										help='remove match files, if need', 
 55 |   										default=0, type=int)
 56 |   parser.add_argument('--is_disp',    dest='is_disp',    
 57 |   										help='show info',  default=0, type=int)
 58 |   parser.add_argument('--im_disp',    dest='im_disp',    
 59 |   										help='show ims',   default=0, type=int)
 60 |   parser.add_argument('--sleep_time', dest='sleep_time', 
 61 |   										help='sleep time', default=3, type=int)
 62 | 
 63 |   if len(sys.argv) == 1:
 64 |     parser.print_help()
 65 |     sys.exit(1)
 66 | 
 67 |   args = parser.parse_args()
 68 |   print('Called with args:')
 69 |   print(args)
 70 |   print "\n\n"
 71 | 
 72 |   return args
 73 | 
 74 | def _im_paths(im_path, is_disp=False):
 75 | 	im_path = im_path.strip()
 76 | 	if os.path.isfile(im_path):
 77 | 	  if im_path.endswith(".jpg") or im_path.endswith(".png") \
 78 | 	      or im_path.endswith(".jpeg"): # # just an image (with other image extension?)
 79 | 	    im_paths = [im_path]
 80 | 	  else: # read from label file: contain im_path [label ...]
 81 | 	    im_paths, _ = _get_test_data(im_path)
 82 | 	elif os.path.isdir(im_path):  # read from image directory
 83 | 	  im_names = os.listdir(im_path)
 84 | 	  assert len(im_names) >= 1
 85 | 	  im_names.sort() # sort it for some convinience
 86 | 	  im_paths = [im_path + im_name.strip() for im_name in im_names]
 87 | 	else:
 88 | 	  raise IOError(('{:s} not exist').format(im_path))
 89 | 
 90 | 	im_n = len(im_paths)
 91 | 	assert im_n >= 1, "invalid input of `im_path`: " % (im_path,)
 92 | 
 93 | 	if is_disp:
 94 | 		print "\n\n"
 95 | 		print "---- Images ----"
 96 | 		print "im_path:", im_path, "\n"
 97 | 		for  im_path in im_paths:
 98 | 			print im_path
 99 | 		print "\n\n"
100 | 
101 | 	return im_paths
102 | 
103 | def _im_pairs_v1(im_paths, frame_n, is_disp=False):
104 | 	im_pairs = []
105 | 	im_n 		 = len(im_paths)
106 | 
107 | 	assert frame_n != 0
108 | 	assert im_n    >= 1 + abs(frame_n)
109 | 
110 | 	if frame_n < 0:
111 | 		for idx in xrange(abs(frame_n)):
112 | 			if idx + abs(frame_n) >= im_n:
113 | 				continue
114 | 			im_pairs.append((im_paths[idx], im_paths[idx + abs(frame_n)]))
115 | 		for idx in xrange(abs(frame_n), im_n):
116 | 			im_pairs.append((im_paths[idx], im_paths[idx + frame_n]))
117 | 	else:
118 | 		for idx in xrange(0, im_n - frame_n):
119 | 			if idx + frame_n >= im_n:
120 | 				continue
121 | 			im_pairs.append((im_paths[idx], im_paths[idx + frame_n]))
122 | 
123 | 		for idx in xrange(im_n - frame_n, im_n):
124 | 			im_pairs.append((im_paths[idx], im_paths[idx - frame_n]))
125 | 	assert len(im_pairs) >= 1
126 | 
127 | 	if is_disp:
128 | 		print "\n\n---- Pairs ----\n"
129 | 		for im_pair in im_pairs:
130 | 			print im_pair
131 | 		print "\n\n"
132 | 
133 | 	return im_pairs
134 | 
135 | def _im_pairs_v2(im_first_paths, im_second_paths, is_disp=False):
136 | 	assert len(im_first_paths) >= 1
137 | 	assert len(im_first_paths) == len(im_second_paths)
138 | 
139 | 	im_pairs = []
140 | 	im_n     = len(im_first_paths)
141 | 
142 | 	for idx in xrange(im_n):
143 | 		im_first_path  = im_first_paths[idx]
144 | 		im_second_path = im_second_paths[idx]
145 | 		im_pairs.append((im_first_path, im_second_path))
146 | 
147 | 	if is_disp:
148 | 		print "\n\n---- Pairs ----\n"
149 | 		for im_pair in im_pairs:
150 | 			print im_pair
151 | 		print "\n\n"
152 | 
153 | 	return im_pairs
154 | 
155 | def _executed_files(args):
156 | 	dm_file = args.dm_file.strip()
157 | 	if not os.path.exists(dm_file) or not os.path.isfile(dm_file):
158 | 		raise IOError(('{:s} not exist').format(dm_file))
159 | 
160 | 	df_file = args.df_file.strip()
161 | 	if not os.path.exists(df_file) or not os.path.isfile(df_file):
162 | 		raise IOError(('{:s} not exist').format(df_file))
163 | 
164 | 	cf_file = args.cf_file.strip()
165 | 	if not os.path.exists(cf_file) or not os.path.isfile(cf_file):
166 | 		raise IOError(('{:s} not exist').format(cf_file))
167 | 
168 | 	return dm_file, df_file, cf_file
169 | 
170 | def _executed_options(args):
171 | 	dm_options = ""
172 | 	if args.dm_options is not None:
173 | 		dm_options = args.dm_options.strip()
174 | 
175 | 	df_options = ""
176 | 	if args.df_options is not None:
177 | 		df_options = args.df_options.strip()
178 | 
179 | 	cf_options = ""
180 | 	if args.cf_options is not None:
181 | 		cf_options = args.cf_options.strip()
182 | 
183 | 	return dm_options, df_options, cf_options
184 | 
185 | def _executed_cmds(args, im_pairs, out_dire, dm_file, dm_options, df_file, df_options, cf_file, cf_options):
186 | 	''''''
187 | 	t_time     = time.time()
188 | 	im_n       = len(im_pairs)
189 | 	mth_paths  = []
190 | 	flo_paths  = []
191 | 	
192 | 	im_disp		 = True if args.im_disp != 0 else False
193 | 	run_dm		 = True if args.run_dm  == 0 else False
194 | 	rm_flo		 = True if args.rm_flo  != 0 else False
195 | 	rm_mth		 = True if args.rm_mth  != 0 else False
196 | 	print "run_dm:", run_dm, "im_disp:", im_disp, \
197 | 				"rm_flo:", rm_flo, "rm_mth:",  rm_mth
198 | 
199 | 	for im_i in xrange(im_n):
200 | 		s_time   = time.time()
201 | 
202 | 		im_pair  = im_pairs[im_i]
203 | 		
204 | 		im_path1 = im_pair[0]
205 | 		im_name  = os.path.basename(im_path1)
206 | 		
207 | 		im_name2 = os.path.splitext(im_name)[0]
208 | 		im_path2 = im_pair[1]
209 | 
210 | 		print "main im_path:", im_path1
211 | 		print "auxi im_path:", im_path2
212 | 		
213 | 		mth_path = out_dire + im_name2 + "_match.txt"
214 | 		mth_paths.append(mth_path)
215 | 
216 | 		of_path  = out_dire + im_name2 + ".png"
217 | 		
218 | 		flo_path = out_dire + im_name2 + ".flo"
219 | 		flo_paths.append(flo_path)
220 | 
221 | 		# ##############################################################
222 | 
223 | 		dm_cmd   = "python %s %s %s %s -out %s" % (dm_file, im_path1, \
224 | 										im_path2, dm_options, mth_path)
225 | 
226 | 		if run_dm:
227 | 			df_cmd   = "%s %s %s %s %s -match %s" % (df_file, im_path1, \
228 | 										im_path2, flo_path, df_options, mth_path)
229 | 		else:
230 | 			df_cmd   = "%s %s %s %s %s" % (df_file, im_path1, im_path2, \
231 | 										flo_path, df_options)
232 | 
233 | 		cf_cmd   = "%s %s %s" % (cf_file, flo_path, of_path)
234 | 
235 | 		# ##############################################################
236 | 
237 | 		# optical flow images
238 | 		if not os.path.exists(of_path) or not os.path.isfile(of_path):
239 | 			# flo files and match file
240 | 			if run_dm:
241 | 				if not os.path.exists(flo_path) or not os.path.isfile(flo_path) or \
242 | 				   not os.path.exists(mth_path) or not os.path.isfile(mth_path):
243 | 					print "\nrun deep-matching\n"
244 | 					cmd = dm_cmd
245 | 					os.system(cmd)
246 | 				
247 | 			cmd = df_cmd
248 | 			os.system(cmd)
249 | 
250 | 			if os.path.exists(flo_path) and os.path.isfile(flo_path):
251 | 				cmd = cf_cmd
252 | 				os.system(cmd)
253 | 			else:	
254 | 				raise IOError(('{:s} not exist').format(flo_path))
255 | 		else:
256 | 			pass
257 | 
258 | 		# remove flo file
259 | 		if rm_flo and os.path.exists(flo_path) and os.path.isfile(flo_path):
260 | 			os.remove(flo_path)
261 | 
262 | 		# remove match file
263 | 		if rm_mth and os.path.exists(mth_path) and os.path.isfile(mth_path):
264 | 			os.remove(mth_path) 
265 | 
266 | 		if im_disp:
267 | 			im1 = cv2.imread(im_path1)
268 | 			im2 = cv2.imread(im_path2)
269 | 			im3 = cv2.imread(of_path)
270 | 			cv2.imshow(im_name2, im1)
271 | 			cv2.waitKey(0)
272 | 			cv2.destroyAllWindows()
273 | 			cv2.imshow(im_name2, im2)
274 | 			cv2.waitKey(0)
275 | 			cv2.destroyAllWindows()
276 | 			cv2.imshow(im_name2, im3)
277 | 			cv2.waitKey(0)
278 | 			cv2.destroyAllWindows()
279 | 		
280 | 		print "\n---- Takes %s seconds for %s-th image: %s----\n" % (time.time() - s_time, im_i, im_path1)
281 | 
282 | 	# if rm_flo:
283 | 	# 	for flo_path in flo_paths:
284 | 	# 		if os.path.exists(flo_path) and os.path.isfile(flo_path):
285 | 	# 		  os.remove(flo_path)
286 | 
287 | 	# if rm_mth:
288 | 	# 	for mth_path in mth_paths:
289 | 	# 		if os.path.exists(mth_path) and os.path.isfile(mth_path):
290 | 	# 		  os.remove(mth_path) 
291 | 
292 | 	t_time = time.time() - t_time
293 | 	print "\n---- Takes %s seconds for %s images -- (average time: %s)----\n" % (t_time, im_n, t_time / im_n)
294 | 	print "\nDone\n"
295 | 
def flow_pipeline():
	'''Command-line driver: parse arguments, build image pairs, run the commands.

	The first image list is loaded from args.im_first_path. When
	args.im_second_path is not given, pairs are built from that single list
	by _im_pairs_v1 with args.frame_n; otherwise a second list is loaded
	from args.im_second_path and paired index by index by _im_pairs_v2.
	The checked executables and option strings are then passed to
	_executed_cmds together with the pairs and the output directory.
	'''
	args       = _parse_args()

	n_frames   = args.frame_n
	first_src  = args.im_first_path.strip()
	out_dire   = args.out_dire.strip()
	verbose    = args.is_disp != 0

	first_set  = _im_paths(first_src, verbose)

	second_src = args.im_second_path
	if second_src is not None:
		print("\nPair from directory or files or image\n")
		# pause after the message (presumably so it can be read)
		time.sleep(args.sleep_time)
		second_set = _im_paths(second_src.strip(), verbose)
		im_pairs   = _im_pairs_v2(first_set, second_set, verbose)
	else:
		print("\nPair from sequence\n")
		time.sleep(args.sleep_time)
		im_pairs   = _im_pairs_v1(first_set, n_frames, verbose)

	dm_file, df_file, cf_file = _executed_files(args)
	dm_options, df_options, cf_options = _executed_options(args)

	time.sleep(args.sleep_time)

	_executed_cmds(args, im_pairs, out_dire,
				   dm_file, dm_options,
				   df_file, df_options,
				   cf_file, cf_options)
328 | 
329 | 
# Run the pipeline only when this file is executed as a script.
if __name__ == "__main__":
	flow_pipeline()
333 | 


--------------------------------------------------------------------------------
/optical_flow/origin_pipeline.sh:
--------------------------------------------------------------------------------
 1 | #!/bin/sh
 2 | 
 3 | # im dire
 4 | # root_dire="/home/ddk/dongdk/dataset/video.pose/FLIC.Motion-Ims-Src/"
 5 | # im_first_path="${root_dire}itself/"
 6 | # im_second_path="${root_dire}positive.2/"
 7 | # out_dire="${root_dire}optical.flow/flic.pos.2/"
 8 | 
 9 | 
10 | root_dire="/home/ddk/download/pt.pose/tianshui/"
11 | # root_dire="/home/ddk/download/pt.pose/huanglili/"
12 | im_first_path="${root_dire}images/"
13 | out_dire="${root_dire}flo.viz/"
14 | 
15 | mkdir -p $out_dire
16 | 
17 | frame_n=-3
18 | 
19 | dm_file="/home/ddk/dongdk/deep-matching/deep_matching/deep_matching_gpu.py"
20 | 
21 | df_file="/home/ddk/dongdk/deep-matching/deep_flow2/deepflow2"
22 | 
23 | cf_file="/home/ddk/dongdk/deep-matching/color_flow/color_flow"
24 | 
25 | rm_flo=1  # 0: not remove (default), !=0: remove
26 | 
27 | rm_mth=1  # 0: not remove (default), !=0: remove
28 | 
29 | run_dm=0  # 0: run deep-matching, !=0: not run
30 | 
31 | is_disp=1 # 0: print nothing, !=0: display info
32 | 
33 | im_disp=0 # 0: not show, !=0: show im
34 | 
35 | sleep_time=4
36 | 
37 | # dm: "--ngh_rad 256(192,) --use_sparse"
38 | python flow_pipeline.py \
39 | 		--run_dm $run_dm \
40 | 		--rm_flo $rm_flo \
41 | 		--rm_mth $rm_mth \
42 | 		--is_disp $is_disp \
43 | 		--im_disp $im_disp \
44 | 		--dm_file $dm_file \
45 | 		--df_file $df_file \
46 | 		--cf_file $cf_file \
47 | 		--frame_n $frame_n \
48 | 		--out_dire $out_dire \
49 | 		--im_first_path $im_first_path \
50 | 		--cf_options "" \
51 | 		--df_options "-sintel " \
52 | 		--dm_options "-form_type 1 -GPU -v --downscale 1 --ngh_rad 256 " \
53 | 		--sleep_time $sleep_time \
54 | 		# --im_second_path $im_second_path \
55 | 


--------------------------------------------------------------------------------