#ifndef JSK_PERCEPTION_POINT_POSE_EXTRACTOR_H_
#define JSK_PERCEPTION_POINT_POSE_EXTRACTOR_H_

#include <jsk_topic_tools/diagnostic_nodelet.h>

#if ( CV_MAJOR_VERSION >= 4)
#include <opencv2/opencv.hpp>
#include <opencv2/highgui/highgui_c.h>
#include <opencv2/calib3d/calib3d_c.h>
#else
#include <opencv/highgui.h>
#include <opencv/cv.hpp>
#endif

#include <posedetection_msgs/Feature0DDetect.h>
#include <posedetection_msgs/ImageFeature0D.h>
#include <posedetection_msgs/ObjectDetection.h>
#include <posedetection_msgs/Object6DPose.h>
#include <geometry_msgs/PoseStamped.h>
#include <geometry_msgs/Pose.h>
#include <geometry_msgs/Quaternion.h>

#include <boost/shared_ptr.hpp>
#include <boost/foreach.hpp>
#include <boost/filesystem.hpp>

#include <dynamic_reconfigure/server.h>
#include <jsk_perception/point_pose_extractorConfig.h>
#include <jsk_perception/SetTemplate.h>

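// features2keypoint(): unpack a posedetection_msgs::Feature0D message into
// OpenCV keypoints and a CV_32FC1 descriptor matrix (one row per keypoint,
// descriptor_dim columns).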
void features2keypoint (posedetection_msgs::Feature0D features,
                        std::vector<cv::KeyPoint>& keypoints,
                        cv::Mat& descriptors){
  keypoints.resize(features.scales.size());
  descriptors.create(features.scales.size(), features.descriptor_dim, CV_32FC1);
  std::vector<cv::KeyPoint>::iterator keypoint_it = keypoints.begin();
  for ( int i = 0; keypoint_it != keypoints.end(); ++keypoint_it, ++i ) {
    *keypoint_it = cv::KeyPoint(cv::Point2f(features.positions[i*2+0],
                                            features.positions[i*2+1]),
                                features.descriptor_dim,      // size
                                features.orientations[i],     // angle
                                0,                            // response
                                features.scales[i]);          // octave
    for (int j = 0; j < features.descriptor_dim; j++){
      descriptors.at<float>(i,j) =
        features.descriptors[i*features.descriptor_dim+j];
    }
  }
}
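// Per-template matcher: constructed with the target frame, the template's
// pixel and metric dimensions, an affine warp matrix, the reprojection and
// descriptor-distance-ratio thresholds, and the name of its debug window.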
 
                    std::string matching_frame,
                    int original_width_size,
                    int original_height_size,
                    double template_width,
                    double template_height,
                    // ...
                    cv::Mat affine_matrix,
                    double reprojection_threshold,
                    double distanceratio_threshold,
                    std::string window_name,
                    // ...
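  // Template registration: the template image is sent to the Feature0DDetect
  // service to obtain its keypoints and descriptors, and the returned feature
  // positions are mapped back through the inverse warp M_inv.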
 
    posedetection_msgs::Feature0DDetect srv;
    // ...
      ROS_ERROR ("template picture is empty.");
    // ...
    cv_img.encoding = std::string("bgr8");
    // ...
      ROS_INFO_STREAM("got features with " << srv.response.features.scales.size()
                      << " descriptors");
    // ...
        cv::Mat pt_mat(cv::Size(1,1), CV_32FC2, &pt);
        // ...
        cv::perspectiveTransform (pt_src_mat, pt_mat, M_inv);
    // ...
      ROS_ERROR("Failed to call service Feature0DDetect");
 
    // Lazily grown, memoized table of log-factorials: slog_table[i] = log(i!);
    // the enclosing helper returns log(n!).
    static std::vector<double> slog_table;
    int osize = slog_table.size();
    // ...
      slog_table.resize(n+1);
      // ...
        slog_table[1] = log(1.0);
      // ...
      for (int i = osize; i <= n; i++){
        slog_table[i] = slog_table[i-1] + log(i);
      }
    // ...
    return slog_table[n];
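  // min_inlier(n, m, p_badsupp, p_badxform): smallest number of inliers, out of
  // n matches for a model fitted to m of them, at which the probability that
  // the support was produced by a bad transform falls below p_badxform;
  // p_badsupp is the per-match probability of spuriously supporting a bad
  // transform (cf. Lowe-style RANSAC termination).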
 
  int min_inlier( int n, int m, double p_badsupp, double p_badxform )
  {
    // ...
    double lp_badsupp = log( p_badsupp );
    double lp_badsupp1 = log( 1.0 - p_badsupp );
    for( j = m+1; j <= n; j++ ){
      // ...
      for( i = j; i <= n; i++ ){
        pi = (i-m) * lp_badsupp + (n-i+m) * lp_badsupp1 +
             // ...
      }
      // ...
      if( sum < p_badxform )
        break;
    }
    // ...
 
  // ...
                    std::vector<cv::KeyPoint> sourceimg_keypoints,
                    // ...
                    double err_thr, cv::Mat &stack_img,
                    cv::flann::Index* ft, posedetection_msgs::Object6DPose* o6p){
    // ...
      ROS_ERROR ("Template image was not set.");
    // ...
    stack_img = cv::Mat(stack_size, CV_8UC3);
    stack_img = cv::Scalar(0);
    // ...
    cv::Mat stack_img_src(stack_img, cv::Rect(0, _template_img.rows,
                                              src_img.cols, src_img.rows));
    cv::add(stack_img_src, src_img, stack_img_src);
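    // Match descriptors through the FLANN index ft: each accepted index pair
    // (queryIdxs/trainIdxs) links a template keypoint to a source-image
    // keypoint, and the matched coordinates are collected into pt1/pt2.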
 
    std::vector<cv::Point2f> pt1, pt2;
    std::vector<int> queryIdxs, trainIdxs;
    // ...
        queryIdxs.push_back(j);
        trainIdxs.push_back(m_indices.at<int>(j,0));
    // ...
    if ( queryIdxs.size() == 0 ) {
      // ...
    }
    // ...
    std::vector<uchar> mask((int)pt2.size());
    // ...
    if ( pt1.size() > 4 ) {
      // ...
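    // Draw every correspondence on the stacked debug image: each template point
    // (pt_orig) is connected to its matched source point in the lower half
    // (offset by the template height), green for homography inliers and magenta
    // for outliers; the mask entries are then summed into inlier_sum.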
 
    for (int j = 0; j < (int)pt1.size(); j++){
      cv::Point2f pt, pt_orig;
      cv::Mat pt_mat(cv::Size(1,1), CV_32FC2, &pt);
      cv::Mat pt_src_mat(cv::Size(1,1), CV_32FC2, &pt1.at(j));
      // ...
      pt_orig = pt_mat.at<cv::Point2f>(0,0);
      // ...
        cv::line(stack_img, pt_orig, pt2.at(j)+cv::Point2f(0, _template_img.rows),
                 CV_RGB(0,255,0), 1, 8, 0);
      // ...
        cv::line(stack_img, pt_orig, pt2.at(j)+cv::Point2f(0, _template_img.rows),
                 CV_RGB(255,0,255), 1, 8, 0);
    }
    // ...
    for (int k = 0; k < (int)mask.size(); k++){
      inlier_sum += (int)mask.at(k);
    }
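    // Overlay the match statistics ("inlier: <count> / <matches>") in the
    // top-right corner of the debug image, followed by a second line of text.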
 
    double text_scale = 1.5;
    // ...
      int fontFace = 0, thickness = 0, baseLine;
      // ...
      text = "inlier: " + boost::lexical_cast<std::string>((int)inlier_sum)
           + " / " + boost::lexical_cast<std::string>((int)pt2.size());
      text_size = cv::getTextSize(text, fontFace, text_scale, thickness, &baseLine);
      x = stack_img.size().width - text_size.width;
      y = text_size.height + thickness + 10;
      cv::putText (stack_img, text, cv::Point(x, y),
                   fontFace, text_scale, CV_RGB(0, 255, 0),
                   thickness, 8, false);
      // ...
      text_size = cv::getTextSize(text, fontFace, text_scale, thickness, &baseLine);
      x = stack_img.size().width - text_size.width;
      y += text_size.height + thickness + 10;
      cv::putText (stack_img, text, cv::Point(x, y),
                   fontFace, text_scale, CV_RGB(0, 255, 0),
                   thickness, 8, false);
    // ...
                 8, CV_RGB(255,0,0), -1);
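    // Accept the hypothesis only if the homography is non-degenerate and the
    // inlier count reaches the probabilistic minimum computed by min_inlier().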
 
    ROS_INFO("    inlier_sum:%d   min_inlier:%d", inlier_sum,
             min_inlier((int)pt2.size(), 4, 0.10, 0.01));
    if ((cv::countNonZero( H ) == 0) ||
        (inlier_sum < min_inlier((int)pt2.size(), 4, 0.10, 0.01))){
      ROS_INFO("    inlier_sum < min_inlier; return from estimate_od");
      // ...
    }
    // ...
    sprintf(chr, "%d", (int)pt2.size());
    // ...
    sprintf(chr, "%d", inlier_sum);
    _type = _type + "_" + std::string(chr);
 
    // Push the four template corners through the homography, then recover the
    // template pose in the camera frame: the 3D corner coordinates and their
    // transformed 2D image positions are passed to cv::solvePnP, and the
    // resulting translation initialises checktf.
    cv::Point2f corners2d[4] = {cv::Point2f(0,0),
                                // ...
                                };
    cv::Mat corners2d_mat (cv::Size(4, 1), CV_32FC2, corners2d);
    cv::Point3f corners3d[4] = {cv::Point3f(0,0,0),
                                // ...
                                };
    cv::Mat corners3d_mat (cv::Size(4, 1), CV_32FC3, corners3d);

    cv::Mat corners2d_mat_trans;
    cv::perspectiveTransform (corners2d_mat, corners2d_mat_trans, H);

    double fR3[3], fT3[3];
    cv::Mat rvec(3, 1, CV_64FC1, fR3);
    cv::Mat tvec(3, 1, CV_64FC1, fT3);
    cv::Mat zero_distortion_mat = cv::Mat::zeros(4, 1, CV_64FC1);
    // ...
    cv::solvePnP (corners3d_mat, corners2d_mat_trans,
                  // ... (camera matrix, zero_distortion_mat, rvec, tvec)
                  );
    // ...
    checktf.setOrigin( tf::Vector3(fT3[0], fT3[1], fT3[2]) );
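    // solvePnP returns the rotation as a Rodrigues (axis-angle) vector:
    // rx, ry, rz give the axis direction and cv::norm(rvec) the rotation angle.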
 
    double rx = fR3[0], ry = fR3[1], rz = fR3[2];
    // ...
    double angle = cv::norm(rvec);
    // ...
    ROS_INFO( "      tx: (%0.2lf,%0.2lf,%0.2lf) rx: (%0.2lf,%0.2lf,%0.2lf)",
              // ...
    o6p->pose.position.x = resulttf.getOrigin().getX();
    o6p->pose.position.y = resulttf.getOrigin().getY();
    o6p->pose.position.z = resulttf.getOrigin().getZ();
    o6p->pose.orientation.w = resulttf.getRotation().w();
    o6p->pose.orientation.x = resulttf.getRotation().x();
    o6p->pose.orientation.y = resulttf.getRotation().y();
    o6p->pose.orientation.z = resulttf.getRotation().z();
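    // Validate the pose by transforming the eight corners of a shallow box
    // (3 cm deep) around the template with checktf and projecting them back
    // into the image (projected_top).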
 
    std::vector<cv::Point2f> projected_top;
    // ...
      tf::Vector3 coords[8] = {tf::Vector3(0,0,0),
                               // ...
                               tf::Vector3(0, 0, -0.03),
                               // ...
                               };
      // ...
      projected_top = std::vector<cv::Point2f>(8);
      // ...
      for (int i = 0; i < 8; i++) {
        coords[i] = checktf * coords[i];
        cv::Point3f pt(coords[i].getX(), coords[i].getY(), coords[i].getZ());
        // ...
      }
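      // Sanity-check the size of the matched quadrilateral in the image:
      // regions narrower than 30 px or larger than twice the image are rejected.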
 
      float max_x, max_y, min_x, min_y;
      max_x = max_y = -1e9;
      // ...
      for (int j = 0; j < 4; j++){
        cv::Point2f pt = corners2d_mat_trans.at<cv::Point2f>(0,j);
        max_x = std::max(max_x, pt.x), max_y = std::max(max_y, pt.y);
        min_x = std::min(min_x, pt.x), min_y = std::min(min_y, pt.y);
      }
      if((max_x - min_x) < 30 || (max_y - min_y) < 30 ||
         src_img.rows < (max_x - min_x)/2 || src_img.cols < (max_y - min_y)/2){
        ROS_INFO("        matched region is too small (<30 px) or too large (more than twice the image); width:%f height:%f; return from estimate_od",
                 max_x - min_x, max_y - min_y);
        // ...
 
    // Reprojection-error test: compare the homography-transformed corners with
    // the corners re-projected from the solvePnP pose; err_sum is checked
    // against err_thr and also determines the reported reliability.
    bool err_success = true;
    for (int j = 0; j < 4; j++){
      double err = sqrt(pow((corners2d_mat_trans.at<cv::Point2f>(0,j).x - projected_top.at(j).x), 2) +
                        pow((corners2d_mat_trans.at<cv::Point2f>(0,j).y - projected_top.at(j).y), 2));
      err_sum += err;
    }
    if (err_sum > err_thr){
      ROS_INFO("          err_sum:%f > err_thr:%f; return from estimate_od", err_sum, err_thr);
      // ...
    } else {
      o6p->reliability = 1.0 - (err_sum / err_thr);
    }
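    // Draw the detected template boundary (red) on the source half of the debug
    // image, and the projected 3D box (blue) when all eight corners are available.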
 
    for (int j = 0; j < corners2d_mat_trans.cols; j++){
      cv::Point2f p1(corners2d_mat_trans.at<cv::Point2f>(0,j).x,
                     corners2d_mat_trans.at<cv::Point2f>(0,j).y + _template_img.rows);
      cv::Point2f p2(corners2d_mat_trans.at<cv::Point2f>(0,(j+1)%corners2d_mat_trans.cols).x,
                     corners2d_mat_trans.at<cv::Point2f>(0,(j+1)%corners2d_mat_trans.cols).y + _template_img.rows);
      cv::line (stack_img, p1, p2, CV_RGB(255, 0, 0),
                // ...
    }
    // ...
    if(projected_top.size() == 8) {
      // ...
      std::vector<cv::Point2f> ps(cnt);
      for(int i = 0; i < cnt; i++)
        ps[i] = cv::Point2f(projected_top[i].x,
                            projected_top[i].y + _template_img.rows);
      // ...
      int draw_width = ( err_success ? 3 : 1);
      for(int i = 0; i < 4; i++) {
        cv::line (stack_img, ps[i],   ps[(i+1)%4],   CV_RGB(0, 0, 255), draw_width, CV_AA, 0);
        cv::line (stack_img, ps[i+4], ps[(i+1)%4+4], CV_RGB(0, 0, 255), draw_width, CV_AA, 0);
        cv::line (stack_img, ps[i],   ps[i+4],       CV_RGB(0, 0, 255), draw_width, CV_AA, 0);
      }
    }
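      // Draw the estimated object frame: 5 cm axes along x (red), y (green) and
      // z (blue), transformed by resulttf and projected onto the debug image.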
 
      tf::Vector3 coords[4] = { tf::Vector3(0,0,0),
                                tf::Vector3(0.05,0,0),
                                tf::Vector3(0,0.05,0),
                                tf::Vector3(0,0,0.05)};
      std::vector<cv::Point2f> ps(4);
      // ...
      for(int i = 0; i < 4; i++) {
        coords[i] = resulttf * coords[i];
        cv::Point3f pt(coords[i].getX(), coords[i].getY(), coords[i].getZ());
        // ...
      }
      cv::line (stack_img, ps[0], ps[1], CV_RGB(255, 0, 0), 3, CV_AA, 0);
      cv::line (stack_img, ps[0], ps[2], CV_RGB(0, 255, 0), 3, CV_AA, 0);
      cv::line (stack_img, ps[0], ps[3], CV_RGB(0, 0, 255), 3, CV_AA, 0);
 
      text = "error: " + boost::lexical_cast<std::string>(err_sum);
      x = stack_img.size().width - 16*17*text_scale;
      // ...
      cv::putText (stack_img, text, cv::Point(x, y),
                   0, text_scale, CV_RGB(0, 255, 0),
                   // ...
      ROS_INFO("      %s < %f (threshold)", text.c_str(), err_thr );
 
    // Extractor nodelet interface (excerpt): the dynamic_reconfigure Config
    // typedef, helpers that generate warped template views, the SetTemplate
    // service callback, the ImageFeature0D subscriber callback, and the static
    // mouse callback used to pick template corners interactively.
    typedef jsk_perception::point_pose_extractorConfig Config;
    // ...
    virtual cv::Mat make_homography(cv::Mat src, cv::Mat rvec, cv::Mat tvec,
                                    double template_width, double template_height,
                                    cv::Size &size);
    // ...
                                    std::vector<cv::Mat> &Mvec,
                                    double template_width, double template_height,
                                    double th_step, double phi_step);
    // ...
                                  double template_width, double template_height,
                                  double theta_step, double phi_step);
    // ...
                                 jsk_perception::SetTemplate::Response &res);
    virtual void imagefeature_cb (const posedetection_msgs::ImageFeature0DConstPtr& msg);
    // ...
    static void cvmousecb (int event, int x, int y, int flags, void* param){
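      // A left-button release records the clicked point as a correspondence for
      // building a new template from the live image (handled in the case below).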
 
      case CV_EVENT_LBUTTONUP: {
        // ...
        ROS_INFO("add correspondence (%d, %d)", (int)pt.x, (int)pt.y);
        // ...
      }
      case CV_EVENT_RBUTTONUP: {
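  // Build a new template from four user-picked corners: the picked quadrilateral
  // is rectified with a homography into a (width/scale) x (height/scale) image,
  // optionally saved next to the given filename, and registered as an additional
  // matching template shown in its own "sampleN" window.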
 
    cv::Mat tmp_template, tmp_warp_template;
    std::vector<cv::Point2f> pt1, pt2;
    // ...
    std::cout << "input template's [width]" << std::endl;
    // ...
    std::cout << "input template's [height]" << std::endl;
    // ...
    std::cout << "input template's [filename]" << std::endl;
    // ...
    for (int i = 0; i < 4; i++){
      // ...
    }
    // ...
    cv::Rect rect = cv::boundingRect(cv::Mat(pt1));
    // ...
    int iwidth = width / scale, iheight = height / scale;
    pt2.push_back(cv::Point2d(0, 0));
    pt2.push_back(cv::Point2d(iwidth, 0));
    pt2.push_back(cv::Point2d(iwidth, iheight));
    pt2.push_back(cv::Point2d(0,      iheight));
    H = cv::findHomography(cv::Mat(pt1), cv::Mat(pt2));
    // ...
                      cv::Point2f((rect.tl().x + rect.br().x)/2.0, (rect.tl().y + rect.br().y)/2.0),
    // ...
    cv::warpPerspective(mt->_previous_stack_img, tmp_warp_template, H, cv::Size(iwidth, iheight));
    // ...
      boost::filesystem::path fname(filename);
      std::stringstream ss;
      ss << (fname.parent_path() / fname.stem()).c_str() << "_wrap" << fname.extension().c_str();
      cv::imwrite(ss.str(), tmp_warp_template);
    } catch (const cv::Exception& e) {
      std::cerr << e.what() << std::endl;
    }
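    // Re-express the picked corners relative to their bounding rectangle, then
    // register the rectified image as a new template with an identity affine
    // matrix and a fresh debug window.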
 
    // ...
    for (int i = 0; i < (int)pt1.size(); i++){
      pt2.push_back(cv::Point2d((int)pt1.at(i).x - rect.x,
                                (int)pt1.at(i).y - rect.y));
    }
    // ...
    cv::Mat M = (cv::Mat_<double>(3,3) << 1,0,0, 0,1,0, 0,0,1);
    std::string window_name = "sample" + boost::lexical_cast<std::string>((int)ppe->_templates.size());
    // ...
                             tmp_warp_template.size().width, tmp_warp_template.size().height,
    // ...
                             cv::getWindowProperty(mt->_window_name, CV_WND_PROP_AUTOSIZE));
    // ...
                    cv::getWindowProperty(mt->_window_name, CV_WND_PROP_AUTOSIZE));