forked from tikroeger/OF_DIS
-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathpatch.cpp
407 lines (337 loc) · 13 KB
/
patch.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
#include <iostream>
#include <string>
#include <vector>
#include <thread>
#include <Eigen/Core>
#include <Eigen/LU>
#include <Eigen/Dense>
#include <stdio.h>
#include "patch.h"
using std::cout;
using std::endl;
using std::vector;
namespace OFC
{
typedef __v4sf v4sf;
PatClass::PatClass(
const camparam* cpt_in,
const camparam* cpo_in,
const optparam* op_in,
const int patchid_in)
:
cpt(cpt_in),
cpo(cpo_in),
op(op_in),
patchid(patchid_in)
{
pc = new patchstate;
CreateStatusStruct(pc);
tmp.resize(op->novals,1);
dxx_tmp.resize(op->novals,1);
dyy_tmp.resize(op->novals,1);
}
void PatClass::CreateStatusStruct(patchstate * psin)
{
// get reference / template patch
psin->pdiff.resize(op->novals,1);
psin->pweight.resize(op->novals,1);
}
PatClass::~PatClass()
{
delete pc;
}
void PatClass::InitializePatch(Eigen::Map<const Eigen::MatrixXf> * im_ao_in, Eigen::Map<const Eigen::MatrixXf> * im_ao_dx_in, Eigen::Map<const Eigen::MatrixXf> * im_ao_dy_in, const Eigen::Vector2f pt_ref_in)
{
im_ao = im_ao_in;
im_ao_dx = im_ao_dx_in;
im_ao_dy = im_ao_dy_in;
pt_ref = pt_ref_in;
ResetPatch();
getPatchStaticNNGrad(im_ao->data(), im_ao_dx->data(), im_ao_dy->data(), &pt_ref, &tmp, &dxx_tmp, &dyy_tmp);
ComputeHessian();
}
void PatClass::ComputeHessian()
{
#if (SELECTMODE==1)
pc->Hes(0,0) = (dxx_tmp.array() * dxx_tmp.array()).sum();
pc->Hes(0,1) = (dxx_tmp.array() * dyy_tmp.array()).sum();
pc->Hes(1,1) = (dyy_tmp.array() * dyy_tmp.array()).sum();
pc->Hes(1,0) = pc->Hes(0,1);
if (pc->Hes.determinant()==0)
{
pc->Hes(0,0)+=1e-10;
pc->Hes(1,1)+=1e-10;
}
#else
pc->Hes(0,0) = (dxx_tmp.array() * dxx_tmp.array()).sum();
if (pc->Hes.sum()==0)
pc->Hes(0,0)+=1e-10;
#endif
}
void PatClass::SetTargetImage(Eigen::Map<const Eigen::MatrixXf> * im_bo_in, Eigen::Map<const Eigen::MatrixXf> * im_bo_dx_in, Eigen::Map<const Eigen::MatrixXf> * im_bo_dy_in)
{
im_bo = im_bo_in;
im_bo_dx = im_bo_dx_in;
im_bo_dy = im_bo_dy_in;
ResetPatch();
}
void PatClass::ResetPatch()
{
pc->hasconverged=0;
pc->hasoptstarted=0;
pc->pt_st = pt_ref;
pc->pt_iter = pt_ref;
pc->p_in.setZero();
pc->p_iter.setZero();
pc->delta_p.setZero();
pc->delta_p_sqnorm = 1e-10;
pc->delta_p_sqnorm_init = 1e-10;
pc->mares = 1e20;
pc->mares_old = 1e20;
pc->cnt=0;
pc->invalid = false;
}
#if (SELECTMODE==1)
void PatClass::OptimizeStart(const Eigen::Vector2f p_in_arg)
#else
void PatClass::OptimizeStart(const Eigen::Matrix<float, 1, 1> p_in_arg)
#endif
{
pc->p_in = p_in_arg;
pc->p_iter = p_in_arg;
// convert from input parameters to 2D query location(s) for patches
paramtopt();
// save starting location, only needed for outlier check
pc->pt_st = pc->pt_iter;
//Check if initial position is already invalid
if (pc->pt_iter[0] < cpt->tmp_lb || pc->pt_iter[1] < cpt->tmp_lb || // check if patch left valid image region
pc->pt_iter[0] > cpt->tmp_ubw || pc->pt_iter[1] > cpt->tmp_ubh)
{
pc->hasconverged=1;
pc->pdiff = tmp;
pc->hasoptstarted=1;
}
else
{
pc->cnt=0; // reset iteration counter
pc->delta_p_sqnorm = 1e-10;
pc->delta_p_sqnorm_init = 1e-10; // set to arbitrary low value, s.t. that loop condition is definitely true on first iteration
pc->mares = 1e5; // mean absolute residual
pc->mares_old = 1e20; // for rate of change, keep mares from last iteration in here. Set high so that loop condition is definitely true on first iteration
pc->hasconverged=0;
OptimizeComputeErrImg();
pc->hasoptstarted=1;
pc->invalid = false;
}
}
#if (SELECTMODE==1)
void PatClass::OptimizeIter(const Eigen::Vector2f p_in_arg, const bool untilconv)
#else
void PatClass::OptimizeIter(const Eigen::Matrix<float, 1, 1> p_in_arg, const bool untilconv)
#endif
{
if (!pc->hasoptstarted)
{
ResetPatch();
OptimizeStart(p_in_arg);
}
int oldcnt=pc->cnt;
// optimize patch until convergence, or do only one iteration if DIS visualization is used
while ( ! (pc->hasconverged || (untilconv == false && (pc->cnt > oldcnt))) )
{
pc->cnt++;
// Projection onto sd_images
#if (SELECTMODE==1)
pc->delta_p[0] = (dxx_tmp.array() * pc->pdiff.array()).sum();
pc->delta_p[1] = (dyy_tmp.array() * pc->pdiff.array()).sum();
#else
pc->delta_p[0] = (dxx_tmp.array() * pc->pdiff.array()).sum();
#endif
pc->delta_p = pc->Hes.llt().solve(pc->delta_p); // solve linear system
pc->p_iter -= pc->delta_p; // update flow vector
#if (SELECTMODE==2) // if stereo depth
if (cpt->camlr==0)
pc->p_iter[0] = std::min(pc->p_iter[0],0.0f); // disparity in t can only be negative (in right image)
else
pc->p_iter[0] = std::max(pc->p_iter[0],0.0f); // ... positive (in left image)
#endif
// compute patch locations based on new parameter vector
paramtopt();
// check if patch(es) moved too far from starting location, if yes, stop iteration and reset to starting location
if ((pc->pt_st - pc->pt_iter).norm() > op->outlierthresh // check if query patch moved more than >padval from starting location -> most likely outlier
||
pc->pt_iter[0] < cpt->tmp_lb || pc->pt_iter[1] < cpt->tmp_lb || // check patch left valid image region
pc->pt_iter[0] > cpt->tmp_ubw || pc->pt_iter[1] > cpt->tmp_ubh)
{
pc->p_iter = pc->p_in; // reset
paramtopt();
pc->hasconverged=1;
pc->hasoptstarted=1;
}
OptimizeComputeErrImg();
}
}
inline void PatClass::paramtopt()
{
#if (SELECTMODE==1)
pc->pt_iter = pt_ref + pc->p_iter; // for optical flow the point displacement and the parameter vector are equivalent
#else
pc->pt_iter[0] = pt_ref[0] + pc->p_iter[0];
#endif
}
void PatClass::LossComputeErrorImage(Eigen::Matrix<float, Eigen::Dynamic, 1>* patdest, Eigen::Matrix<float, Eigen::Dynamic, 1>* wdest, const Eigen::Matrix<float, Eigen::Dynamic, 1>* patin, const Eigen::Matrix<float, Eigen::Dynamic, 1>* tmpin)
{
v4sf * pd = (v4sf*) patdest->data(),
* pa = (v4sf*) patin->data(),
* te = (v4sf*) tmpin->data(),
* pw = (v4sf*) wdest->data();
if (op->costfct==0) // L2 cost function
{
for (int i=op->novals/4; i--; ++pd, ++pa, ++te, ++pw)
{
(*pd) = (*pa)-(*te); // difference image
(*pw) = __builtin_ia32_andnps(op->negzero, (*pd) );
}
}
else if (op->costfct==1) // L1 cost function
{
for (int i=op->novals/4; i--; ++pd, ++pa, ++te, ++pw)
{
(*pd) = (*pa)-(*te); // difference image
(*pd) = __builtin_ia32_orps( __builtin_ia32_andps(op->negzero, (*pd) ) , __builtin_ia32_sqrtps (__builtin_ia32_andnps(op->negzero, (*pd) )) ); // sign(pdiff) * sqrt(abs(pdiff))
(*pw) = __builtin_ia32_andnps(op->negzero, (*pd) );
}
}
else if (op->costfct==2) // Pseudo Huber cost function
{
for (int i=op->novals/4; i--; ++pd, ++pa, ++te, ++pw)
{
(*pd) = (*pa)-(*te); // difference image
(*pd) = __builtin_ia32_orps(__builtin_ia32_andps(op->negzero, (*pd) ),
__builtin_ia32_sqrtps (
__builtin_ia32_mulps( // PSEUDO HUBER NORM
__builtin_ia32_sqrtps (op->ones + __builtin_ia32_divps(__builtin_ia32_mulps((*pd),(*pd)) , op->normoutlier_tmpbsq)) - op->ones, // PSEUDO HUBER NORM
op->normoutlier_tmp2bsq) // PSEUDO HUBER NORM
)
); // sign(pdiff) * sqrt( 2*b^2*( sqrt(1+abs(pdiff)^2/b^2)+1) )) // <- looks like this without SSE instruction
(*pw) = __builtin_ia32_andnps(op->negzero, (*pd) );
}
}
}
void PatClass::OptimizeComputeErrImg()
{
getPatchStaticBil(im_bo->data(), &(pc->pt_iter), &(pc->pdiff));
// Get photometric patch error
LossComputeErrorImage(&pc->pdiff, &pc->pweight, &pc->pdiff, &tmp);
// Compute step norm
pc->delta_p_sqnorm = pc->delta_p.squaredNorm();
if (pc->cnt==1)
pc->delta_p_sqnorm_init = pc->delta_p_sqnorm;
// Check early termination criterions
pc->mares_old = pc->mares;
pc->mares = pc->pweight.lpNorm<1>() / (op->novals);
if ( ! ((pc->cnt < op->max_iter) & (pc->mares > op->res_thresh) &
((pc->cnt < op->min_iter) | (pc->delta_p_sqnorm / pc->delta_p_sqnorm_init >= op->dp_thresh)) &
((pc->cnt < op->min_iter) | (pc->mares / pc->mares_old <= op->dr_thresh))) )
pc->hasconverged=1;
}
// Extract patch on integer position, and gradients, No Bilinear interpolation
void PatClass::getPatchStaticNNGrad(const float* img, const float* img_dx, const float* img_dy,
const Eigen::Vector2f* mid_in,
Eigen::Matrix<float, Eigen::Dynamic, 1>* tmp_in_e,
Eigen::Matrix<float, Eigen::Dynamic, 1>* tmp_dx_in_e,
Eigen::Matrix<float, Eigen::Dynamic, 1>* tmp_dy_in_e)
{
float *tmp_in = tmp_in_e->data();
float *tmp_dx_in = tmp_dx_in_e->data();
float *tmp_dy_in = tmp_dy_in_e->data();
Eigen::Vector2i pos;
Eigen::Vector2i pos_it;
pos[0] = round((*mid_in)[0]) + cpt->imgpadding;
pos[1] = round((*mid_in)[1]) + cpt->imgpadding;
int posxx = 0;
int lb = -op->p_samp_s/2;
int ub = op->p_samp_s/2-1;
for (int j=lb; j <= ub; ++j)
{
for (int i=lb; i <= ub; ++i, ++posxx)
{
pos_it[0] = pos[0]+i;
pos_it[1] = pos[1]+j;
int idx = pos_it[0] + pos_it[1] * cpt->tmp_w;
#if (SELECTCHANNEL==1 | SELECTCHANNEL==2) // Single channel
tmp_in[posxx] = img[idx];
tmp_dx_in[posxx] = img_dx[idx];
tmp_dy_in[posxx] = img_dy[idx];
#else // 3 RGB channels
idx *= 3;
tmp_in[posxx] = img[idx]; tmp_dx_in[posxx] = img_dx[idx]; tmp_dy_in[posxx] = img_dy[idx]; ++posxx; ++idx;
tmp_in[posxx] = img[idx]; tmp_dx_in[posxx] = img_dx[idx]; tmp_dy_in[posxx] = img_dy[idx]; ++posxx; ++idx;
tmp_in[posxx] = img[idx]; tmp_dx_in[posxx] = img_dx[idx]; tmp_dy_in[posxx] = img_dy[idx];
#endif
}
}
// PATCH NORMALIZATION
if (op->patnorm>0) // Subtract Mean
tmp_in_e->array() -= (tmp_in_e->sum() / op->novals);
}
// Extract patch on float position with bilinear interpolation, no gradients.
void PatClass::getPatchStaticBil(const float* img, const Eigen::Vector2f* mid_in, Eigen::Matrix<float, Eigen::Dynamic, 1>* tmp_in_e)
{
float *tmp_in = tmp_in_e->data();
Eigen::Vector2f resid;
Eigen::Vector4f we; // bilinear weight vector
Eigen::Vector4i pos;
Eigen::Vector2i pos_it;
// Compute the bilinear weight vector, for patch without orientation/scale change -> weight vector is constant for all pixels
pos[0] = ceil((*mid_in)[0]+.00001f); // ensure rounding up to natural numbers
pos[1] = ceil((*mid_in)[1]+.00001f);
pos[2] = floor((*mid_in)[0]);
pos[3] = floor((*mid_in)[1]);
resid[0] = (*mid_in)[0] - (float)pos[2];
resid[1] = (*mid_in)[1] - (float)pos[3];
we[0] = resid[0]*resid[1];
we[1] = (1-resid[0])*resid[1];
we[2] = resid[0]*(1-resid[1]);
we[3] = (1-resid[0])*(1-resid[1]);
pos[0] += cpt->imgpadding;
pos[1] += cpt->imgpadding;
float * tmp_it = tmp_in;
const float * img_a, * img_b, * img_c, * img_d, *img_e;
#if (SELECTCHANNEL==1 | SELECTCHANNEL==2) // 1 channel image
img_e = img + pos[0]-op->p_samp_s/2;
#else // 3-channel RGB image
img_e = img + (pos[0]-op->p_samp_s/2)*3;
#endif
int lb = -op->p_samp_s/2;
int ub = op->p_samp_s/2-1;
for (pos_it[1]=pos[1]+lb; pos_it[1] <= pos[1]+ub; ++pos_it[1])
{
#if (SELECTCHANNEL==1 | SELECTCHANNEL==2) // 1 channel image
img_a = img_e + pos_it[1] * cpt->tmp_w;
img_c = img_e + (pos_it[1]-1) * cpt->tmp_w;
img_b = img_a-1;
img_d = img_c-1;
#else // 3-channel RGB image
img_a = img_e + pos_it[1] * cpt->tmp_w * 3;
img_c = img_e + (pos_it[1]-1) * cpt->tmp_w * 3;
img_b = img_a-3;
img_d = img_c-3;
#endif
for (pos_it[0]=pos[0]+lb; pos_it[0] <= pos[0]+ub; ++pos_it[0],
++tmp_it,++img_a,++img_b,++img_c,++img_d)
{
#if (SELECTCHANNEL==1 | SELECTCHANNEL==2) // Single channel
(*tmp_it) = we[0] * (*img_a) + we[1] * (*img_b) + we[2] * (*img_c) + we[3] * (*img_d);
#else // 3-channel RGB image
(*tmp_it) = we[0] * (*img_a) + we[1] * (*img_b) + we[2] * (*img_c) + we[3] * (*img_d); ++tmp_it; ++img_a; ++img_b; ++img_c; ++img_d;
(*tmp_it) = we[0] * (*img_a) + we[1] * (*img_b) + we[2] * (*img_c) + we[3] * (*img_d); ++tmp_it; ++img_a; ++img_b; ++img_c; ++img_d;
(*tmp_it) = we[0] * (*img_a) + we[1] * (*img_b) + we[2] * (*img_c) + we[3] * (*img_d);
#endif
}
}
// PATCH NORMALIZATION
if (op->patnorm>0) // Subtract Mean
tmp_in_e->array() -= (tmp_in_e->sum() / op->novals);
}
}