dlut_libvo: matcher.h Source File

Go to the documentation of this file.
00001 /*
00002 Copyright 2012. All rights reserved.
00003 Institute of Measurement and Control Systems
00004 Karlsruhe Institute of Technology, Germany
00005 
00006 This file is part of libviso2.
00007 Authors: Andreas Geiger
00008 
00009 libviso2 is free software; you can redistribute it and/or modify it under the
00010 terms of the GNU General Public License as published by the Free Software
00011 Foundation; either version 2 of the License, or any later version.
00012 
00013 libviso2 is distributed in the hope that it will be useful, but WITHOUT ANY
00014 WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A
00015 PARTICULAR PURPOSE. See the GNU General Public License for more details.
00016 
00017 You should have received a copy of the GNU General Public License along with
00018 libviso2; if not, write to the Free Software Foundation, Inc., 51 Franklin
00019 Street, Fifth Floor, Boston, MA 02110-1301, USA
00020 */
00021 
00022 #ifndef __MATCHER_H__
00023 #define __MATCHER_H__
00024 
00025 #include <stdio.h>
00026 #include <stdlib.h>
00027 #include <string.h>
00028 #include <iostream>
00029 #include <math.h>
00030 #include <emmintrin.h>
00031 #include <algorithm>
00032 #include <vector>
00033 
00034 #include "matrix.h"
00035 using namespace std;
00036 class Matcher {
00037 
00038 public:
00039 
00040   // parameter settings
00041   struct parameters {
00042 
00043     int32_t nms_n;                  // non-max-suppression: min. distance between maxima (in pixels)
00044     int32_t nms_tau;                // non-max-suppression: interest point peakiness threshold
00045     int32_t match_binsize;          // matching bin width/height (affects efficiency only)
00046     int32_t match_radius;           // matching radius (du/dv in pixels)
00047     int32_t match_disp_tolerance;   // dv tolerance for stereo matches (in pixels)
00048     int32_t outlier_disp_tolerance; // outlier removal: disparity tolerance (in pixels)
00049     int32_t outlier_flow_tolerance; // outlier removal: flow tolerance (in pixels)
00050     int32_t multi_stage;            // 0=disabled,1=multistage matching (denser and faster)
00051     int32_t half_resolution;        // 0=disabled,1=match at half resolution, refine at full resolution
00052     int32_t refinement;             // refinement (0=none,1=pixel,2=subpixel)
00053     double  f,cu,cv,base;           // calibration (only for match prediction)
00054 
00055     // default settings
00056     parameters () {
00057       nms_n                  = 4;
00058       nms_tau                = 50;
00059       match_binsize          = 50;
00060       match_radius           = 200;
00061       match_disp_tolerance   = 2;
00062       outlier_disp_tolerance = 5;
00063       outlier_flow_tolerance = 5;
00064       multi_stage            = 1;
00065       half_resolution        = 1;
00066       refinement             = 2;
00067     }
00068   };
00069 
00070   // constructor (with default parameters)
00071   Matcher(parameters param);
00072 
00073   // deconstructor
00074   ~Matcher();
00075 
00076   // intrinsics
00077   void setIntrinsics(double f,double cu,double cv,double base) {
00078     param.f = f;
00079     param.cu = cu;
00080     param.cv = cv;
00081     param.base = base;
00082   }
00083 
00084   // structure for storing matches
00085   struct p_match {
00086     float   u1p,v1p; // u,v-coordinates in previous left  image
00087     int32_t i1p;     // feature index (for tracking)
00088     float   u2p,v2p; // u,v-coordinates in previous right image
00089     int32_t i2p;     // feature index (for tracking)
00090     float   u1c,v1c; // u,v-coordinates in current  left  image
00091     int32_t i1c;     // feature index (for tracking)
00092     float   u2c,v2c; // u,v-coordinates in current  right image
00093     int32_t i2c;     // feature index (for tracking)
00094     p_match(){}
00095     p_match(float u1p,float v1p,int32_t i1p,float u2p,float v2p,int32_t i2p,
00096             float u1c,float v1c,int32_t i1c,float u2c,float v2c,int32_t i2c):
00097             u1p(u1p),v1p(v1p),i1p(i1p),u2p(u2p),v2p(v2p),i2p(i2p),
00098             u1c(u1c),v1c(v1c),i1c(i1c),u2c(u2c),v2c(v2c),i2c(i2c) {}
00099     bool operator < (const p_match &m) const
00100     {
00101         double d = max(u1p-u2p,0.00001f);
00102         double z = 582.508667*0.070103/d;
00103         double d_m = max(m.u1p-m.u2p,0.00001f);
00104         double z_m = 582.508667*0.070103/d_m;
00105         return z<z_m;
00106     }
00107   };
00108 
00109   // computes features from left/right images and pushes them back to a ringbuffer,
00110   // which interally stores the features of the current and previous image pair
00111   // use this function for stereo or quad matching
00112   // input: I1,I2 .......... pointers to left and right image (row-aligned), range [0..255]
00113   //        dims[0,1] ...... image width and height (both images must be rectified and of same size)
00114   //        dims[2] ........ bytes per line (often equals width)
00115   //        replace ........ if this flag is set, the current image is overwritten with
00116   //                         the input images, otherwise the current image is first copied
00117   //                         to the previous image (ring buffer functionality, descriptors need
00118   //                         to be computed only once)
00119   void pushBack (uint8_t *I1,uint8_t* I2,int32_t* dims,const bool replace);
00120 
00121   // computes features from a single image and pushes it back to a ringbuffer,
00122   // which interally stores the features of the current and previous image pair
00123   // use this function for flow computation
00124   // parameter description see above
00125   void pushBack (uint8_t *I1,int32_t* dims,const bool replace) { pushBack(I1,0,dims,replace); }
00126 
00127   // match features currently stored in ring buffer (current and previous frame)
00128   // input: method ... 0 = flow, 1 = stereo, 2 = quad matching
00129   //        Tr_delta: uses motion from previous frame to better search for
00130   //                  matches, if specified
00131   void matchFeatures(int32_t method, Matrix *Tr_delta = 0);
00132 
00133   // feature bucketing: keeps only max_features per bucket, where the domain
00134   // is split into buckets of size (bucket_width,bucket_height)
00135   void bucketFeatures(int32_t max_features,float bucket_width,float bucket_height);
00136 
00137   // return vector with matched feature points and indices
00138   std::vector<Matcher::p_match> getMatches() { return p_matched_2; }
00139         void setMatches(std::vector<Matcher::p_match> p_matched) { p_matched_2 = p_matched; }
00140   // given a vector of inliers computes gain factor between the current and
00141   // the previous frame. this function is useful if you want to reconstruct 3d
00142   // and you want to cancel the change of (unknown) camera gain.
00143   float getGain (std::vector<int32_t> inliers);
00144 
00145 private:
00146 
00147   // structure for storing interest points
00148   struct maximum {
00149     int32_t u;   // u-coordinate
00150     int32_t v;   // v-coordinate
00151     int32_t val; // value
00152     int32_t c;   // class
00153     int32_t d1,d2,d3,d4,d5,d6,d7,d8; // descriptor
00154     maximum() {}
00155     maximum(int32_t u,int32_t v,int32_t val,int32_t c):u(u),v(v),val(val),c(c) {}
00156   };
00157 
00158   // u/v ranges for matching stage 0-3
00159   struct range {
00160     float u_min[4];
00161     float u_max[4];
00162     float v_min[4];
00163     float v_max[4];
00164   };
00165 
00166   struct delta {
00167     float val[8];
00168     delta () {}
00169     delta (float v) {
00170       for (int32_t i=0; i<8; i++)
00171         val[i] = v;
00172     }
00173   };
00174 
00175   // computes the address offset for coordinates u,v of an image of given width
00176   inline int32_t getAddressOffsetImage (const int32_t& u,const int32_t& v,const int32_t& width) {
00177     return v*width+u;
00178   }
00179 
00180   // Alexander Neubeck and Luc Van Gool: Efficient Non-Maximum Suppression, ICPR'06, algorithm 4
00181   void nonMaximumSuppression (int16_t* I_f1,int16_t* I_f2,const int32_t* dims,std::vector<Matcher::maximum> &maxima,int32_t nms_n);
00182 
00183   // descriptor functions
00184   inline uint8_t saturate(int16_t in);
00185   void filterImageAll (uint8_t* I,uint8_t* I_du,uint8_t* I_dv,int16_t* I_f1,int16_t* I_f2,const int* dims);
00186   void filterImageSobel (uint8_t* I,uint8_t* I_du,uint8_t* I_dv,const int* dims);
00187   inline void computeDescriptor (const uint8_t* I_du,const uint8_t* I_dv,const int32_t &bpl,const int32_t &u,const int32_t &v,uint8_t *desc_addr);
00188   inline void computeSmallDescriptor (const uint8_t* I_du,const uint8_t* I_dv,const int32_t &bpl,const int32_t &u,const int32_t &v,uint8_t *desc_addr);
00189   void computeDescriptors (uint8_t* I_du,uint8_t* I_dv,const int32_t bpl,std::vector<Matcher::maximum> &maxima);
00190 
00191   void getHalfResolutionDimensions(const int32_t *dims,int32_t *dims_half);
00192   uint8_t* createHalfResolutionImage(uint8_t *I,const int32_t* dims);
00193 
00194   // compute sparse set of features from image
00195   // inputs:  I ........ image
00196   //          dims ..... image dimensions [width,height]
00197   //          n ........ non-max neighborhood
00198   //          tau ...... non-max threshold
00199   // outputs: max ...... vector with maxima [u,v,value,class,descriptor (128 bits)]
00200   //          I_du ..... gradient in horizontal direction
00201   //          I_dv ..... gradient in vertical direction
00202   // WARNING: max,I_du,I_dv has to be freed by yourself!
00203   void computeFeatures (uint8_t *I,const int32_t* dims,int32_t* &max1,int32_t &num1,int32_t* &max2,int32_t &num2,uint8_t* &I_du,uint8_t* &I_dv,uint8_t* &I_du_full,uint8_t* &I_dv_full);
00204 
00205   // matching functions
00206   void computePriorStatistics (std::vector<Matcher::p_match> &p_matched,int32_t method);
00207   void createIndexVector (int32_t* m,int32_t n,std::vector<int32_t> *k,const int32_t &u_bin_num,const int32_t &v_bin_num);
00208   inline void findMatch (int32_t* m1,const int32_t &i1,int32_t* m2,const int32_t &step_size,
00209                          std::vector<int32_t> *k2,const int32_t &u_bin_num,const int32_t &v_bin_num,const int32_t &stat_bin,
00210                          int32_t& min_ind,int32_t stage,bool flow,bool use_prior,double u_=-1,double v_=-1);
00211   void matching (int32_t *m1p,int32_t *m2p,int32_t *m1c,int32_t *m2c,
00212                  int32_t n1p,int32_t n2p,int32_t n1c,int32_t n2c,
00213                  std::vector<Matcher::p_match> &p_matched,int32_t method,bool use_prior,Matrix *Tr_delta = 0);
00214 
00215   // outlier removal
00216   void removeOutliers (std::vector<Matcher::p_match> &p_matched,int32_t method);
00217 
00218   // parabolic fitting
00219   bool parabolicFitting(const uint8_t* I1_du,const uint8_t* I1_dv,const int32_t* dims1,
00220                         const uint8_t* I2_du,const uint8_t* I2_dv,const int32_t* dims2,
00221                         const float &u1,const float &v1,
00222                         float       &u2,float       &v2,
00223                         Matrix At,Matrix AtA,
00224                         uint8_t* desc_buffer);
00225   void relocateMinimum(const uint8_t* I1_du,const uint8_t* I1_dv,const int32_t* dims1,
00226                        const uint8_t* I2_du,const uint8_t* I2_dv,const int32_t* dims2,
00227                        const float &u1,const float &v1,
00228                        float       &u2,float       &v2,
00229                        uint8_t* desc_buffer);
00230   void refinement (std::vector<Matcher::p_match> &p_matched,int32_t method);
00231 
00232   // mean for gain computation
00233   inline float mean(const uint8_t* I,const int32_t &bpl,const int32_t &u_min,const int32_t &u_max,const int32_t &v_min,const int32_t &v_max);
00234 
00235   // parameters
00236   parameters param;
00237   int32_t    margin;
00238 
00239   int32_t *m1p1,*m2p1,*m1c1,*m2c1;
00240   int32_t *m1p2,*m2p2,*m1c2,*m2c2;
00241   int32_t n1p1,n2p1,n1c1,n2c1;
00242   int32_t n1p2,n2p2,n1c2,n2c2;
00243   uint8_t *I1p,*I2p,*I1c,*I2c;
00244   uint8_t *I1p_du,*I2p_du,*I1c_du,*I2c_du;
00245   uint8_t *I1p_dv,*I2p_dv,*I1c_dv,*I2c_dv;
00246   uint8_t *I1p_du_full,*I2p_du_full,*I1c_du_full,*I2c_du_full; // only needed for
00247   uint8_t *I1p_dv_full,*I2p_dv_full,*I1c_dv_full,*I2c_dv_full; // half-res matching
00248   int32_t dims_p[3],dims_c[3];
00249 
00250   std::vector<Matcher::p_match> p_matched_1;
00251   std::vector<Matcher::p_match> p_matched_2;
00252   std::vector<Matcher::range>   ranges;
00253 };
00254 
00255 #endif
00256