doxygen/visp-3.2.0/testGenericTrackerDepth_8cpp_source.html

 /****************************************************************************
  *
  * ViSP, open source Visual Servoing Platform software.
  * Copyright (C) 2005 - 2019 by Inria. All rights reserved.
  *
  * This software is free software; you can redistribute it and/or modify
  * it under the terms of the GNU General Public License as published by
  * the Free Software Foundation; either version 2 of the License, or
  * (at your option) any later version.
  * See the file LICENSE.txt at the root directory of this source
  * distribution for additional information about the GNU GPL.
  *
  * For using ViSP with software that can not be combined with the GNU
  * GPL, please contact Inria about acquiring a ViSP Professional
  * Edition License.
  *
  * See http://visp.inria.fr for more information.
  *
  * This software was developed at:
  * Inria Rennes - Bretagne Atlantique
  * Campus Universitaire de Beaulieu
  * 35042 Rennes Cedex
  * France
  *
  * If you have questions regarding the use of this file, please contact
  * Inria at visp@inria.fr
  *
  * This file is provided AS IS with NO WARRANTY OF ANY KIND, INCLUDING THE
  * WARRANTY OF DESIGN, MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.
  *
  * Description:
  * Regression test for depth MBT.
  *
  *****************************************************************************/

 #include <cstdlib>
 #include <iostream>
 #include <visp3/core/vpConfig.h>

 #if defined(VISP_HAVE_MODULE_MBT)

 #include <visp3/core/vpIoTools.h>
 #include <visp3/io/vpParseArgv.h>
 #include <visp3/io/vpImageIo.h>
 #include <visp3/gui/vpDisplayX.h>
 #include <visp3/gui/vpDisplayGDI.h>
 #include <visp3/gui/vpDisplayOpenCV.h>
 #include <visp3/gui/vpDisplayD3D.h>
 #include <visp3/gui/vpDisplayGTK.h>
 #include <visp3/mbt/vpMbGenericTracker.h>

 #define GETOPTARGS "i:dcle:mh"

 namespace
 {
   void usage(const char *name, const char *badparam)
   {
     fprintf(stdout, "\n\
     Regression test for vpGenericTracker and depth.\n\
     \n\
     SYNOPSIS\n\
       %s [-i <test image path>] [-c] [-d] [-h] [-l] \n\
      [-e <last frame index>] [-m]\n", name);

     fprintf(stdout, "\n\
     OPTIONS:                                               \n\
       -i <input image path>                                \n\
          Set image input path.\n\
          These images come from ViSP-images-x.y.z.tar.gz available \n\
          on the ViSP website.\n\
          Setting the VISP_INPUT_IMAGE_PATH environment\n\
          variable produces the same behavior than using\n\
          this option.\n\
     \n\
       -d \n\
          Turn off the display.\n\
     \n\
       -c\n\
          Disable the mouse click. Useful to automate the \n\
          execution of this program without human intervention.\n\
     \n\
       -l\n\
          Use the scanline for visibility tests.\n\
     \n\
       -e <last frame index>\n\
          Specify the index of the last frame. Once reached, the tracking is stopped.\n\
     \n\
       -m \n\
          Set a tracking mask.\n\
     \n\
       -h \n\
          Print the help.\n\n");

     if (badparam)
       fprintf(stdout, "\nERROR: Bad parameter [%s]\n", badparam);
   }

   bool getOptions(int argc, const char **argv, std::string &ipath, bool &click_allowed, bool &display,
                   bool &useScanline, int &lastFrame, bool &use_mask)
   {
     const char *optarg_;
     int c;
     while ((c = vpParseArgv::parse(argc, argv, GETOPTARGS, &optarg_)) > 1) {

       switch (c) {
       case 'i':
         ipath = optarg_;
         break;
       case 'c':
         click_allowed = false;
         break;
       case 'd':
         display = false;
         break;
       case 'l':
         useScanline = true;
         break;
       case 'e':
         lastFrame = atoi(optarg_);
         break;
       case 'm':
         use_mask = true;
         break;
       case 'h':
         usage(argv[0], NULL);
         return false;
         break;

       default:
         usage(argv[0], optarg_);
         return false;
         break;
       }
     }

     if ((c == 1) || (c == -1)) {
       // standalone param or error
       usage(argv[0], NULL);
       std::cerr << "ERROR: " << std::endl;
       std::cerr << "  Bad argument " << optarg_ << std::endl << std::endl;
       return false;
     }

     return true;
   }

   bool read_data(const std::string &input_directory, const int cpt, const vpCameraParameters &cam_depth,
                  vpImage<unsigned char> &I, vpImage<uint16_t> &I_depth,
                  std::vector<vpColVector> &pointcloud, vpHomogeneousMatrix &cMo)
   {
     char buffer[256];
     sprintf(buffer, std::string(input_directory + "/Images/Image_%04d.pgm").c_str(), cpt);
     std::string image_filename = buffer;

     sprintf(buffer, std::string(input_directory + "/Depth/Depth_%04d.bin").c_str(), cpt);
     std::string depth_filename = buffer;

     sprintf(buffer, std::string(input_directory + "/CameraPose/Camera_%03d.txt").c_str(), cpt);
     std::string pose_filename = buffer;

     if (!vpIoTools::checkFilename(image_filename) || !vpIoTools::checkFilename(depth_filename)
         || !vpIoTools::checkFilename(pose_filename))
       return false;

     vpImageIo::read(I, image_filename);

     unsigned int depth_width = 0, depth_height = 0;
     std::ifstream file_depth(depth_filename.c_str(), std::ios::in | std::ios::binary);
     if (!file_depth.is_open())
       return false;

     vpIoTools::readBinaryValueLE(file_depth, depth_height);
     vpIoTools::readBinaryValueLE(file_depth, depth_width);
     I_depth.resize(depth_height, depth_width);
     pointcloud.resize(depth_height*depth_width);

     const float depth_scale = 0.000030518f;
     for (unsigned int i = 0; i < I_depth.getHeight(); i++) {
       for (unsigned int j = 0; j < I_depth.getWidth(); j++) {
         vpIoTools::readBinaryValueLE(file_depth, I_depth[i][j]);
         double x = 0.0, y = 0.0, Z = I_depth[i][j] * depth_scale;
         vpPixelMeterConversion::convertPoint(cam_depth, j, i, x, y);
         vpColVector pt3d(4, 1.0);
         pt3d[0] = x*Z;
         pt3d[1] = y*Z;
         pt3d[2] = Z;
         pointcloud[i*I_depth.getWidth()+j] = pt3d;
       }
     }

     std::ifstream file_pose(pose_filename.c_str());
     if (!file_pose.is_open()) {
       return false;
     }

     for (unsigned int i = 0; i < 4; i++) {
       for (unsigned int j = 0; j < 4; j++) {
         file_pose >> cMo[i][j];
       }
     }

     return true;
   }
 }

 int main(int argc, const char *argv[])
 {
   try {
     std::string env_ipath;
     std::string opt_ipath = "";
     bool opt_click_allowed = true;
     bool opt_display = true;
     bool useScanline = false;
 #if defined(__mips__) || defined(__mips) || defined(mips) || defined(__MIPS__)
     // To avoid Debian test timeout
     int opt_lastFrame = 5;
 #else
     int opt_lastFrame = -1;
 #endif
     bool use_mask = false;

     // Get the visp-images-data package path or VISP_INPUT_IMAGE_PATH
     // environment variable value
     env_ipath = vpIoTools::getViSPImagesDataPath();

     // Read the command line options
     if (!getOptions(argc, argv, opt_ipath, opt_click_allowed, opt_display,
                     useScanline, opt_lastFrame, use_mask)) {
       return EXIT_FAILURE;
     }

     std::cout << "useScanline: " << useScanline << std::endl;
     std::cout << "use_mask: " << use_mask << std::endl;

     // Test if an input path is set
     if (opt_ipath.empty() && env_ipath.empty()) {
       usage(argv[0], NULL);
       std::cerr << std::endl << "ERROR:" << std::endl;
       std::cerr << "  Use -i <visp image path> option or set VISP_INPUT_IMAGE_PATH " << std::endl
                 << "  environment variable to specify the location of the " << std::endl
                 << "  image path where test images are located." << std::endl
                 << std::endl;

       return EXIT_FAILURE;
     }

     std::string input_directory = vpIoTools::createFilePath(!opt_ipath.empty() ? opt_ipath : env_ipath, "mbt-depth/Castle-simu");
     if (!vpIoTools::checkDirectory(input_directory)) {
       std::cerr << "ViSP-images does not contain the folder: " << input_directory << "!" << std::endl;
       return EXIT_SUCCESS;
     }

     // Initialise a  display
 #if defined VISP_HAVE_X11
     vpDisplayX display1, display2;
 #elif defined VISP_HAVE_GDI
     vpDisplayGDI display1, display2;
 #elif defined VISP_HAVE_OPENCV
     vpDisplayOpenCV display1, display2;
 #elif defined VISP_HAVE_D3D9
     vpDisplayD3D display1, display2;
 #elif defined VISP_HAVE_GTK
     vpDisplayGTK display1, display2;
 #else
     opt_display = false;
 #endif

     std::vector<int> tracker_type;
     tracker_type.push_back(vpMbGenericTracker::DEPTH_DENSE_TRACKER);
     vpMbGenericTracker tracker(tracker_type);
 #if defined(VISP_HAVE_XML2)
     tracker.loadConfigFile(input_directory + "/Config/chateau_depth.xml");
 #else
     {
       vpCameraParameters cam_depth;
       cam_depth.initPersProjWithoutDistortion(700.0, 700.0, 320.0, 240.0);
       tracker.setCameraParameters(cam_depth);
     }
     // Depth
     tracker.setDepthNormalFeatureEstimationMethod(vpMbtFaceDepthNormal::ROBUST_FEATURE_ESTIMATION);
     tracker.setDepthNormalPclPlaneEstimationMethod(2);
     tracker.setDepthNormalPclPlaneEstimationRansacMaxIter(200);
     tracker.setDepthNormalPclPlaneEstimationRansacThreshold(0.001);
     tracker.setDepthNormalSamplingStep(2, 2);

     tracker.setDepthDenseSamplingStep(4, 4);

 #if defined(VISP_HAVE_MODULE_KLT) && (defined(VISP_HAVE_OPENCV) && (VISP_HAVE_OPENCV_VERSION >= 0x020100))
     tracker.setKltMaskBorder(5);
 #endif

     tracker.setAngleAppear(vpMath::rad(85.0));
     tracker.setAngleDisappear(vpMath::rad(89.0));
     tracker.setNearClippingDistance(0.01);
     tracker.setFarClippingDistance(2.0);
     tracker.setClipping(tracker.getClipping() | vpMbtPolygon::FOV_CLIPPING);
 #endif
     tracker.loadModel(input_directory + "/Models/chateau.cao");
     vpHomogeneousMatrix T;
     T[0][0] = -1;
     T[0][3] = -0.2;
     T[1][1] = 0;
     T[1][2] = 1;
     T[1][3] = 0.12;
     T[2][1] = 1;
     T[2][2] = 0;
     T[2][3] = -0.15;
     tracker.loadModel(input_directory + "/Models/cube.cao", false, T);
     vpCameraParameters cam_depth;
     tracker.getCameraParameters(cam_depth);
     tracker.setDisplayFeatures(true);
     tracker.setScanLineVisibilityTest(useScanline);

     vpImage<unsigned char> I;
     vpImage<uint16_t> I_depth_raw;
     vpImage<vpRGBa> I_depth;
     vpHomogeneousMatrix cMo_truth;
     std::vector<vpColVector> pointcloud;
     int cpt_frame = 1;
     if (!read_data(input_directory, cpt_frame, cam_depth, I, I_depth_raw, pointcloud, cMo_truth)) {
       std::cerr << "Cannot read first frame!" << std::endl;
       return EXIT_FAILURE;
     }

     vpImage<bool> mask(I.getHeight(), I.getWidth());
     const double roi_step = 7.0;
     const double roi_step2 = 6.0;
     if (use_mask) {
       mask = false;
       for (unsigned int i = (unsigned int) (I.getRows()/roi_step); i < (unsigned int) (I.getRows()*roi_step2/roi_step); i++) {
         for (unsigned int j = (unsigned int) (I.getCols()/roi_step); j < (unsigned int) (I.getCols()*roi_step2/roi_step); j++) {
           mask[i][j] = true;
         }
       }
       tracker.setMask(mask);
     }

     vpImageConvert::createDepthHistogram(I_depth_raw, I_depth);
     if (opt_display) {
 #ifdef VISP_HAVE_DISPLAY
       display1.init(I, 0, 0, "Image");
       display2.init(I_depth, I.getWidth(), 0, "Depth");
 #endif
     }

     vpHomogeneousMatrix depth_M_color;
     depth_M_color[0][3] = -0.05;
     tracker.initFromPose(I, depth_M_color*cMo_truth);

     bool click = false, quit = false;
     std::vector<double> vec_err_t, vec_err_tu;
     std::vector<double> time_vec;
     while (read_data(input_directory, cpt_frame, cam_depth, I, I_depth_raw, pointcloud, cMo_truth) && !quit
            && (opt_lastFrame > 0 ? (int)cpt_frame <= opt_lastFrame : true)) {
       vpImageConvert::createDepthHistogram(I_depth_raw, I_depth);

       if (opt_display) {
         vpDisplay::display(I);
         vpDisplay::display(I_depth);
       }

       double t = vpTime::measureTimeMs();
       std::map<std::string, const vpImage<unsigned char> *> mapOfImages;
       std::map<std::string, const std::vector<vpColVector> *> mapOfPointclouds;
       mapOfPointclouds["Camera"] = &pointcloud;
       std::map<std::string, unsigned int> mapOfWidths, mapOfHeights;
       mapOfWidths["Camera"] = I_depth.getWidth();
       mapOfHeights["Camera"] = I_depth.getHeight();

       tracker.track(mapOfImages, mapOfPointclouds, mapOfWidths, mapOfHeights);
       vpHomogeneousMatrix cMo = tracker.getPose();
       t = vpTime::measureTimeMs() - t;
       time_vec.push_back(t);

       if (opt_display) {
         tracker.display(I_depth, cMo, cam_depth, vpColor::red, 3);
         vpDisplay::displayFrame(I_depth, cMo, cam_depth, 0.05, vpColor::none, 3);

         std::stringstream ss;
         ss << "Frame: " << cpt_frame;
         vpDisplay::displayText(I_depth, 20, 20, ss.str(), vpColor::red);
         ss.str("");
         ss << "Nb features: " << tracker.getError().getRows();
         vpDisplay::displayText(I_depth, 40, 20, ss.str(), vpColor::red);
       }

       vpPoseVector pose_est(cMo);
       vpPoseVector pose_truth(depth_M_color*cMo_truth);
       vpColVector t_est(3), t_truth(3);
       vpColVector tu_est(3), tu_truth(3);
       for (int i = 0; i < 3; i++) {
         t_est[i] = pose_est[i];
         t_truth[i] = pose_truth[i];
         tu_est[i] = pose_est[i+3];
         tu_truth[i] = pose_truth[i+3];
       }

       vpColVector t_err = t_truth-t_est, tu_err = tu_truth-tu_est;
       double t_err2 = sqrt(t_err.sumSquare()), tu_err2 = vpMath::deg(sqrt(tu_err.sumSquare()));
       vec_err_t.push_back( t_err2 );
       vec_err_tu.push_back( tu_err2 );
       const double t_thresh = useScanline ? 0.003 : 0.002;
       const double tu_thresh = useScanline ? 0.5 : 0.4;
       if ( !use_mask && (t_err2 > t_thresh || tu_err2 > tu_thresh) ) { //no accuracy test with mask
         std::cerr << "Pose estimated exceeds the threshold (t_thresh = 0.003, tu_thresh = 0.5)!" << std::endl;
         std::cout << "t_err: " << sqrt(t_err.sumSquare()) << " ; tu_err: " << vpMath::deg(sqrt(tu_err.sumSquare())) << std::endl;
         return EXIT_FAILURE;
       }

       if (opt_display) {
         if (use_mask) {
           vpRect roi(vpImagePoint(I.getRows()/roi_step, I.getCols()/roi_step),
                      vpImagePoint(I.getRows()*roi_step2/roi_step, I.getCols()*roi_step2/roi_step));
           vpDisplay::displayRectangle(I_depth, roi, vpColor::yellow);
         }

         vpDisplay::flush(I);
         vpDisplay::flush(I_depth);
       }

       if (opt_display && opt_click_allowed) {
         vpMouseButton::vpMouseButtonType button;
         if (vpDisplay::getClick(I, button, click)) {
           switch (button) {
             case vpMouseButton::button1:
               quit = !click;
               break;

             case vpMouseButton::button3:
               click = !click;
               break;

             default:
               break;
           }
         }
       }

       cpt_frame++;
     }

     if (!time_vec.empty())
       std::cout << "Computation time, Mean: " << vpMath::getMean(time_vec) << " ms ; Median: " << vpMath::getMedian(time_vec)
                 << " ms ; Std: " << vpMath::getStdev(time_vec) << " ms" << std::endl;

     if (!vec_err_t.empty())
       std::cout << "Max translation error: " << *std::max_element(vec_err_t.begin(), vec_err_t.end()) << std::endl;

     if (!vec_err_tu.empty())
       std::cout << "Max thetau error: " << *std::max_element(vec_err_tu.begin(), vec_err_tu.end()) << std::endl;

 #if defined(VISP_HAVE_XML2)
     // Cleanup memory allocated by xml library used to parse the xml config
     // file in vpMbGenericTracker::loadConfigFile()
     vpXmlParser::cleanup();
 #endif

     return EXIT_SUCCESS;
   } catch (const vpException &e) {
     std::cout << "Catch an exception: " << e << std::endl;
     return EXIT_FAILURE;
   }
 }
 #else
 int main() {
   std::cout << "Enable MBT module (VISP_HAVE_MODULE_MBT) to launch this test." << std::endl;
   return 0;
 }
 #endif
vpImage::getCols
unsigned int getCols() const
Definition: vpImage.h:169

vpDisplay::getClick
static bool getClick(const vpImage< unsigned char > &I, bool blocking=true)
Definition: vpDisplay_uchar.cpp:702

vpMath::getStdev
static double getStdev(const std::vector< double > &v, const bool useBesselCorrection=false)
Definition: vpMath.cpp:252

vpIoTools::checkDirectory
static bool checkDirectory(const char *dirname)
Definition: vpIoTools.cpp:467

vpIoTools::getViSPImagesDataPath
static std::string getViSPImagesDataPath()
Definition: vpIoTools.cpp:1316

vpImage::getWidth
unsigned int getWidth() const
Definition: vpImage.h:239

vpHomogeneousMatrix
Implementation of an homogeneous matrix and operations on such kind of matrices.
Definition: vpHomogeneousMatrix.h:92

vpIoTools::readBinaryValueLE
static void readBinaryValueLE(std::ifstream &file, int16_t &short_value)
Definition: vpIoTools.cpp:1864

vpMath::getMedian
static double getMedian(const std::vector< double > &v)
Definition: vpMath.cpp:222

vpDisplayGDI
Display for windows using GDI (available on any windows 32 platform).
Definition: vpDisplayGDI.h:129

vpMouseButton::button3
Definition: vpMouseButton.h:55

vpDisplay::displayText
static void displayText(const vpImage< unsigned char > &I, const vpImagePoint &ip, const std::string &s, const vpColor &color)
Definition: vpDisplay_uchar.cpp:601

vpDisplayX
Use the X11 console to display images on unix-like OS. Thus to enable this class X11 should be instal...
Definition: vpDisplayX.h:151

vpColor::none
static const vpColor none
Definition: vpColor.h:192

vpException
error that can be emited by ViSP classes.
Definition: vpException.h:71

vpPixelMeterConversion::convertPoint
static void convertPoint(const vpCameraParameters &cam, const double &u, const double &v, double &x, double &y)
Definition: vpPixelMeterConversion.h:103

vpMbGenericTracker
Real-time 6D object pose tracking using its CAD model.
Definition: vpMbGenericTracker.h:80

vpDisplay::flush
static void flush(const vpImage< unsigned char > &I)
Definition: vpDisplay_uchar.cpp:653

vpTime::measureTimeMs
VISP_EXPORT double measureTimeMs()
Definition: vpTime.cpp:88

vpParseArgv::parse
static bool parse(int *argcPtr, const char **argv, vpArgvInfo *argTable, int flags)
Definition: vpParseArgv.cpp:69

vpColor::red
static const vpColor red
Definition: vpColor.h:180

vpMouseButton::vpMouseButtonType
vpMouseButtonType
Definition: vpMouseButton.h:52

vpCameraParameters::initPersProjWithoutDistortion
void initPersProjWithoutDistortion(const double px, const double py, const double u0, const double v0)
Definition: vpCameraParameters.cpp:183

vpIoTools::checkFilename
static bool checkFilename(const char *filename)
Definition: vpIoTools.cpp:675

vpMath::getMean
static double getMean(const std::vector< double > &v)
Definition: vpMath.cpp:202

vpDisplayD3D
Display for windows using Direct3D 3rd party. Thus to enable this class Direct3D should be installed...
Definition: vpDisplayD3D.h:107

vpImage::getRows
unsigned int getRows() const
Definition: vpImage.h:211

vpIoTools::createFilePath
static std::string createFilePath(const std::string &parent, const std::string &child)
Definition: vpIoTools.cpp:1541

vpDisplay::display
static void display(const vpImage< unsigned char > &I)
Definition: vpDisplay_uchar.cpp:677

vpDisplayOpenCV
The vpDisplayOpenCV allows to display image using the OpenCV library. Thus to enable this class OpenC...
Definition: vpDisplayOpenCV.h:142

vpCameraParameters
Generic class defining intrinsic camera parameters.
Definition: vpCameraParameters.h:233

vpDisplayGTK
The vpDisplayGTK allows to display image using the GTK 3rd party library. Thus to enable this class G...
Definition: vpDisplayGTK.h:138

vpImage::resize
void resize(const unsigned int h, const unsigned int w)
resize the image : Image initialization
Definition: vpImage.h:866

vpDisplay::displayRectangle
static void displayRectangle(const vpImage< unsigned char > &I, const vpImagePoint &topLeft, unsigned int width, unsigned int height, const vpColor &color, bool fill=false, unsigned int thickness=1)
Definition: vpDisplay_uchar.cpp:485

vpMath::rad
static double rad(double deg)
Definition: vpMath.h:102

vpDisplayGTK::init
void init(vpImage< unsigned char > &I, int winx=-1, int winy=-1, const std::string &title="")
Definition: vpDisplayGTK.cpp:258

vpMbtFaceDepthNormal::ROBUST_FEATURE_ESTIMATION
Definition: vpMbtFaceDepthNormal.h:62

vpColVector::sumSquare
double sumSquare() const
Definition: vpColVector.cpp:1437

vpMouseButton::button1
Definition: vpMouseButton.h:53

vpXmlParser::cleanup
static void cleanup()
Definition: vpXmlParser.h:310

vpMath::deg
static double deg(double rad)
Definition: vpMath.h:95

vpImageIo::read
static void read(vpImage< unsigned char > &I, const std::string &filename)
Definition: vpImageIo.cpp:207

vpMbGenericTracker::DEPTH_DENSE_TRACKER
Definition: vpMbGenericTracker.h:89

vpColVector
Implementation of column vector and the associated operations.
Definition: vpColVector.h:72

vpDisplay::displayFrame
static void displayFrame(const vpImage< unsigned char > &I, const vpHomogeneousMatrix &cMo, const vpCameraParameters &cam, double size, const vpColor &color=vpColor::none, unsigned int thickness=1, const vpImagePoint &offset=vpImagePoint(0, 0))
Definition: vpDisplay_uchar.cpp:378

vpPoseVector
Implementation of a pose vector and operations on poses.
Definition: vpPoseVector.h:92

vpImage::getHeight
unsigned int getHeight() const
Definition: vpImage.h:178

vpRect
Defines a rectangle in the plane.
Definition: vpRect.h:78

vpImagePoint
Class that defines a 2D point in an image. This class is useful for image processing and stores only ...
Definition: vpImagePoint.h:88

vpColor::yellow
static const vpColor yellow
Definition: vpColor.h:188

vpImage< unsigned char >

vpImageConvert::createDepthHistogram
static void createDepthHistogram(const vpImage< uint16_t > &src_depth, vpImage< vpRGBa > &dest_rgba)
Definition: vpImageConvert.cpp:201

vpPolygon3D::FOV_CLIPPING
Definition: vpPolygon3D.h:70