Visual Servoing Platform, version 3.6.1 (under development, snapshot of 2024-11-15)
Source listing of perfGenericTracker.cpp
1 /*
2  * ViSP, open source Visual Servoing Platform software.
3  * Copyright (C) 2005 - 2024 by Inria. All rights reserved.
4  *
5  * This software is free software; you can redistribute it and/or modify
6  * it under the terms of the GNU General Public License as published by
7  * the Free Software Foundation; either version 2 of the License, or
8  * (at your option) any later version.
9  * See the file LICENSE.txt at the root directory of this source
10  * distribution for additional information about the GNU GPL.
11  *
12  * For using ViSP with software that can not be combined with the GNU
13  * GPL, please contact Inria about acquiring a ViSP Professional
14  * Edition License.
15  *
16  * See https://visp.inria.fr for more information.
17  *
18  * This software was developed at:
19  * Inria Rennes - Bretagne Atlantique
20  * Campus Universitaire de Beaulieu
21  * 35042 Rennes Cedex
22  * France
23  *
24  * If you have questions regarding the use of this file, please contact
25  * Inria at visp@inria.fr
26  *
27  * This file is provided AS IS with NO WARRANTY OF ANY KIND, INCLUDING THE
28  * WARRANTY OF DESIGN, MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.
29  *
30  * Description:
31  * Benchmark generic tracker.
32  */
33 
37 #include <visp3/core/vpConfig.h>
38 
39 #if defined(VISP_HAVE_CATCH2)
40 
41 #include <catch_amalgamated.hpp>
42 
43 #include <visp3/core/vpIoTools.h>
44 #include <visp3/io/vpImageIo.h>
45 #include <visp3/mbt/vpMbGenericTracker.h>
46 
47 // #define DEBUG_DISPLAY // uncomment to check that the tracking is correct
48 #ifdef DEBUG_DISPLAY
49 #include <visp3/gui/vpDisplayX.h>
50 #endif
51 
52 #ifdef ENABLE_VISP_NAMESPACE
53 using namespace VISP_NAMESPACE_NAME;
54 #endif
55 
56 namespace
57 {
58 bool runBenchmark = false;
59 
60 template <typename Type>
61 bool read_data(const std::string &input_directory, int cpt, const vpCameraParameters &cam_depth, vpImage<Type> &I,
62  vpImage<uint16_t> &I_depth, std::vector<vpColVector> &pointcloud, vpHomogeneousMatrix &cMo)
63 {
64  static_assert(std::is_same<Type, unsigned char>::value || std::is_same<Type, vpRGBa>::value,
65  "Template function supports only unsigned char and vpRGBa images!");
66 #if VISP_HAVE_DATASET_VERSION >= 0x030600
67  std::string ext("png");
68 #else
69  std::string ext("pgm");
70 #endif
71  char buffer[FILENAME_MAX];
72  snprintf(buffer, FILENAME_MAX, std::string(input_directory + "/Images/Image_%04d." + ext).c_str(), cpt);
73  std::string image_filename = buffer;
74 
75  snprintf(buffer, FILENAME_MAX, std::string(input_directory + "/Depth/Depth_%04d.bin").c_str(), cpt);
76  std::string depth_filename = buffer;
77 
78  snprintf(buffer, FILENAME_MAX, std::string(input_directory + "/CameraPose/Camera_%03d.txt").c_str(), cpt);
79  std::string pose_filename = buffer;
80 
81  if (!vpIoTools::checkFilename(image_filename) || !vpIoTools::checkFilename(depth_filename) ||
82  !vpIoTools::checkFilename(pose_filename))
83  return false;
84 
85  vpImageIo::read(I, image_filename);
86 
87  unsigned int depth_width = 0, depth_height = 0;
88  std::ifstream file_depth(depth_filename.c_str(), std::ios::in | std::ios::binary);
89  if (!file_depth.is_open())
90  return false;
91 
92  vpIoTools::readBinaryValueLE(file_depth, depth_height);
93  vpIoTools::readBinaryValueLE(file_depth, depth_width);
94  I_depth.resize(depth_height, depth_width);
95  pointcloud.resize(depth_height * depth_width);
96 
97  const float depth_scale = 0.000030518f;
98  for (unsigned int i = 0; i < I_depth.getHeight(); i++) {
99  for (unsigned int j = 0; j < I_depth.getWidth(); j++) {
100  vpIoTools::readBinaryValueLE(file_depth, I_depth[i][j]);
101  double x = 0.0, y = 0.0, Z = I_depth[i][j] * depth_scale;
102  vpPixelMeterConversion::convertPoint(cam_depth, j, i, x, y);
103  vpColVector pt3d(4, 1.0);
104  pt3d[0] = x * Z;
105  pt3d[1] = y * Z;
106  pt3d[2] = Z;
107  pointcloud[i * I_depth.getWidth() + j] = pt3d;
108  }
109  }
110 
111  std::ifstream file_pose(pose_filename.c_str());
112  if (!file_pose.is_open()) {
113  return false;
114  }
115 
116  for (unsigned int i = 0; i < 4; i++) {
117  for (unsigned int j = 0; j < 4; j++) {
118  file_pose >> cMo[i][j];
119  }
120  }
121 
122  return true;
123 }
124 } // anonymous namespace
125 
// Benchmark of several vpMbGenericTracker configurations (edge / KLT /
// depth-dense, monocular and stereo) over an image + depth + ground-truth
// pose sequence that is fully pre-loaded in memory so disk I/O is excluded
// from the timings. The whole test is a no-op unless --benchmark was passed
// on the command line (see main()).
//
// NOTE(review): this listing was recovered from an extraction that dropped
// several original lines (the embedded numbering jumps, e.g. 134->136,
// 197->199). Each gap is flagged inline below; confirm the missing
// statements against the upstream file before relying on this copy.
126 TEST_CASE("Benchmark generic tracker", "[benchmark]")
127 {
128  if (runBenchmark) {
// Reference tracker: edge features on Camera1, dense depth on Camera2.
129  std::vector<int> tracker_type(2);
130  tracker_type[0] = vpMbGenericTracker::EDGE_TRACKER;
131  tracker_type[1] = vpMbGenericTracker::DEPTH_DENSE_TRACKER;
132  vpMbGenericTracker tracker(tracker_type);
133 
134  const std::string input_directory =
// NOTE(review): the initializer (original line 135) is missing from this
// listing -- presumably a dataset path built from
// vpIoTools::getViSPImagesDataPath(); confirm against the upstream file.
136 
137  const bool verbose = false;
// Camera intrinsics and feature settings come from the XML configuration
// files when pugixml is available; otherwise they are set by hand below.
138 #if defined(VISP_HAVE_PUGIXML)
139  const std::string configFileCam1 = input_directory + std::string("/Config/chateau.xml");
140  const std::string configFileCam2 = input_directory + std::string("/Config/chateau_depth.xml");
141  REQUIRE(vpIoTools::checkFilename(configFileCam1));
142  REQUIRE(vpIoTools::checkFilename(configFileCam2));
143  tracker.loadConfigFile(configFileCam1, configFileCam2, verbose);
144 #else
145  {
146  vpCameraParameters cam_color, cam_depth;
147  cam_color.initPersProjWithoutDistortion(700.0, 700.0, 320.0, 240.0);
148  cam_depth.initPersProjWithoutDistortion(700.0, 700.0, 320.0, 240.0);
149  tracker.setCameraParameters(cam_color, cam_depth);
150  }
151 
152  // Edge
153  vpMe me;
154  me.setMaskSize(5);
155  me.setMaskNumber(180);
156  me.setRange(8);
// NOTE(review): original line 157 is missing -- presumably
// me.setLikelihoodThresholdType(...) given the symbol appears in this
// file's cross-references; confirm upstream.
158  me.setThreshold(5);
159  me.setMu1(0.5);
160  me.setMu2(0.5);
161  me.setSampleStep(5);
162  tracker.setMovingEdge(me);
163 
164  // Klt
165 #if defined(VISP_HAVE_MODULE_KLT) && defined(VISP_HAVE_OPENCV) && defined(HAVE_OPENCV_IMGPROC) && defined(HAVE_OPENCV_VIDEO)
166  vpKltOpencv klt;
167  tracker.setKltMaskBorder(5);
168  klt.setMaxFeatures(10000);
169  klt.setWindowSize(5);
170  klt.setQuality(0.01);
171  klt.setMinDistance(5);
172  klt.setHarrisFreeParameter(0.02);
173  klt.setBlockSize(3);
174  klt.setPyramidLevels(3);
175 
176  tracker.setKltOpencv(klt);
177 #endif
178 
179  // Depth
180  tracker.setDepthNormalFeatureEstimationMethod(vpMbtFaceDepthNormal::ROBUST_FEATURE_ESTIMATION);
181  tracker.setDepthNormalPclPlaneEstimationMethod(2);
182  tracker.setDepthNormalPclPlaneEstimationRansacMaxIter(200);
183  tracker.setDepthNormalPclPlaneEstimationRansacThreshold(0.001);
184  tracker.setDepthNormalSamplingStep(2, 2);
185 
186  tracker.setDepthDenseSamplingStep(4, 4);
187 
188  tracker.setAngleAppear(vpMath::rad(85.0));
189  tracker.setAngleDisappear(vpMath::rad(89.0));
190  tracker.setNearClippingDistance(0.01);
191  tracker.setFarClippingDistance(2.0);
192  tracker.setClipping(tracker.getClipping() | vpMbtPolygon::FOV_CLIPPING);
193 #endif
194 
// Same CAD model is loaded for both cameras of the stereo tracker.
195  REQUIRE(vpIoTools::checkFilename(input_directory + "/Models/chateau.cao"));
196  tracker.loadModel(input_directory + "/Models/chateau.cao", input_directory + "/Models/chateau.cao", verbose);
197 
// NOTE(review): the declaration of T (original line 198, presumably
// vpHomogeneousMatrix T;) is missing from this listing. The assignments
// below place the cube model relative to the chateau model.
199  T[0][0] = -1;
200  T[0][3] = -0.2;
201  T[1][1] = 0;
202  T[1][2] = 1;
203  T[1][3] = 0.12;
204  T[2][1] = 1;
205  T[2][2] = 0;
206  T[2][3] = -0.15;
207  tracker.loadModel(input_directory + "/Models/cube.cao", verbose, T);
// NOTE(review): original lines 208-209 are missing -- presumably a blank
// line plus the declarations of I and cMo that are used below; confirm
// upstream.
210  vpImage<uint16_t> I_depth_raw;
211  vpHomogeneousMatrix cMo_truth;
212  std::vector<vpColVector> pointcloud;
213 
214  vpCameraParameters cam_color, cam_depth;
215  tracker.getCameraParameters(cam_color, cam_depth);
216 
// Fixed extrinsic transformation between the color and depth cameras
// (5 cm baseline along x).
217  vpHomogeneousMatrix depth_M_color;
218  depth_M_color[0][3] = -0.05;
219  tracker.setCameraTransformationMatrix("Camera2", depth_M_color);
220 
221  // load all the data in memory to not take into account I/O from disk
222  std::vector<vpImage<unsigned char> > images;
223  std::vector<vpImage<uint16_t> > depth_raws;
224  std::vector<std::vector<vpColVector> > pointclouds;
225  std::vector<vpHomogeneousMatrix> cMo_truth_all;
226  // forward
227  for (int i = 1; i <= 40; i++) {
228  if (read_data(input_directory, i, cam_depth, I, I_depth_raw, pointcloud, cMo_truth)) {
229  images.push_back(I);
230  depth_raws.push_back(I_depth_raw);
231  pointclouds.push_back(pointcloud);
232  cMo_truth_all.push_back(cMo_truth);
233  }
234  }
235  // backward
236  for (int i = 40; i >= 1; i--) {
237  if (read_data(input_directory, i, cam_depth, I, I_depth_raw, pointcloud, cMo_truth)) {
238  images.push_back(I);
239  depth_raws.push_back(I_depth_raw);
240  pointclouds.push_back(pointcloud);
241  cMo_truth_all.push_back(cMo_truth);
242  }
243  }
244 
245  // Stereo MBT
246  {
// One entry per benchmarked tracker configuration; entries must stay in
// sync with benchmarkNames and monoculars below.
247  std::vector<std::map<std::string, int> > mapOfTrackerTypes;
248  mapOfTrackerTypes.push_back(
// NOTE(review): the initializer lists for the first two configurations
// (original lines 249 and 251) are missing from this listing; per
// benchmarkNames below these are the Edge-only and Edge + depth-dense
// setups. Confirm upstream.
250  mapOfTrackerTypes.push_back(
252 #if defined(VISP_HAVE_OPENCV) && defined(HAVE_OPENCV_IMGPROC) && defined(HAVE_OPENCV_VIDEO)
253  mapOfTrackerTypes.push_back(
254  { {"Camera1", vpMbGenericTracker::KLT_TRACKER}, {"Camera2", vpMbGenericTracker::DEPTH_DENSE_TRACKER} });
// NOTE(review): the "Camera2" halves of the next two initializers
// (original lines 256 and 258) are missing from this listing.
255  mapOfTrackerTypes.push_back({ {"Camera1", vpMbGenericTracker::EDGE_TRACKER | vpMbGenericTracker::KLT_TRACKER},
257  mapOfTrackerTypes.push_back({ {"Camera1", vpMbGenericTracker::EDGE_TRACKER | vpMbGenericTracker::KLT_TRACKER},
259 #endif
260 
// Human-readable label for each configuration, indexed like
// mapOfTrackerTypes.
261  std::vector<std::string> benchmarkNames = {
262  "Edge MBT",
263  "Edge + Depth dense MBT",
264 #if defined(VISP_HAVE_OPENCV)
265  "KLT MBT",
266  "KLT + depth dense MBT",
267  "Edge + KLT + depth dense MBT"
268 #endif
269  };
270 
// true for configurations that use only the color camera; used below to
// zero out the depth-map dimensions passed to track().
271  std::vector<bool> monoculars = {
272  true,
273  false,
274 #if defined(VISP_HAVE_OPENCV)
275  true,
276  false,
277  false
278 #endif
279  };
280 
281  for (size_t idx = 0; idx < mapOfTrackerTypes.size(); idx++) {
// Reconfigure the shared tracker from scratch for each benchmark entry.
282  tracker.resetTracker();
283  tracker.setTrackerType(mapOfTrackerTypes[idx]);
284 
285  const bool verbose = false;
286 #if defined(VISP_HAVE_PUGIXML)
287  tracker.loadConfigFile(configFileCam1, configFileCam2, verbose);
288 #else
289  {
290  vpCameraParameters cam_color, cam_depth;
291  cam_color.initPersProjWithoutDistortion(700.0, 700.0, 320.0, 240.0);
292  cam_depth.initPersProjWithoutDistortion(700.0, 700.0, 320.0, 240.0);
293  tracker.setCameraParameters(cam_color, cam_depth);
294  }
295 
296  // Edge
297  vpMe me;
298  me.setMaskSize(5);
299  me.setMaskNumber(180);
300  me.setRange(8);
// NOTE(review): original line 301 is missing (same gap as line 157 above).
302  me.setThreshold(5);
303  me.setMu1(0.5);
304  me.setMu2(0.5);
305  me.setSampleStep(5);
306  tracker.setMovingEdge(me);
307 
308  // Klt
309 #if defined(VISP_HAVE_MODULE_KLT) && defined(VISP_HAVE_OPENCV) && defined(HAVE_OPENCV_IMGPROC) && defined(HAVE_OPENCV_VIDEO)
310  vpKltOpencv klt;
311  tracker.setKltMaskBorder(5);
312  klt.setMaxFeatures(10000);
313  klt.setWindowSize(5);
314  klt.setQuality(0.01);
315  klt.setMinDistance(5);
316  klt.setHarrisFreeParameter(0.02);
317  klt.setBlockSize(3);
318  klt.setPyramidLevels(3);
319 
320  tracker.setKltOpencv(klt);
321 #endif
322 
323  // Depth
324  tracker.setDepthNormalFeatureEstimationMethod(vpMbtFaceDepthNormal::ROBUST_FEATURE_ESTIMATION);
325  tracker.setDepthNormalPclPlaneEstimationMethod(2);
326  tracker.setDepthNormalPclPlaneEstimationRansacMaxIter(200);
327  tracker.setDepthNormalPclPlaneEstimationRansacThreshold(0.001);
328  tracker.setDepthNormalSamplingStep(2, 2);
329 
330  tracker.setDepthDenseSamplingStep(4, 4);
331 
332  tracker.setAngleAppear(vpMath::rad(85.0));
333  tracker.setAngleDisappear(vpMath::rad(89.0));
334  tracker.setNearClippingDistance(0.01);
335  tracker.setFarClippingDistance(2.0);
336  tracker.setClipping(tracker.getClipping() | vpMbtPolygon::FOV_CLIPPING);
337 #endif
338  tracker.loadModel(input_directory + "/Models/chateau.cao", input_directory + "/Models/chateau.cao", verbose);
339  tracker.loadModel(input_directory + "/Models/cube.cao", verbose, T);
340  tracker.initFromPose(images.front(), cMo_truth_all.front());
341 
// For monocular configurations the depth dimensions are 0, which tells
// track() that no depth data is supplied for Camera2.
342  std::map<std::string, unsigned int> mapOfWidths, mapOfHeights;
343  mapOfWidths["Camera2"] = monoculars[idx] ? 0 : I_depth_raw.getWidth();
344  mapOfHeights["Camera2"] = monoculars[idx] ? 0 : I_depth_raw.getHeight();
345 
// NOTE(review): original line 346 is missing from this listing.
// In the normal build the block below is the body of a Catch2 BENCHMARK
// lambda (it ends with "return cMo;" so the result is not optimized
// away); with DEBUG_DISPLAY defined it is a plain scope with windows
// showing the tracking.
347 #ifndef DEBUG_DISPLAY
348  BENCHMARK(benchmarkNames[idx].c_str())
349 #else
350  vpImage<unsigned char> I_depth;
351  vpImageConvert::createDepthHistogram(I_depth_raw, I_depth);
352 
353  vpDisplayX d_color(I, 0, 0, "Color image");
354  vpDisplayX d_depth(I_depth, I.getWidth(), 0, "Depth image");
355  tracker.setDisplayFeatures(true);
356 #endif
357  {
358  tracker.initFromPose(images.front(), cMo_truth_all.front());
359 
360  for (size_t i = 0; i < images.size(); i++) {
361  const vpImage<unsigned char> &I_current = images[i];
362  const std::vector<vpColVector> &pointcloud_current = pointclouds[i];
363 
364 #ifdef DEBUG_DISPLAY
365  vpImageConvert::createDepthHistogram(depth_raws[i], I_depth);
366  I = I_current;
// NOTE(review): original line 367 (presumably vpDisplay::display(I);)
// is missing from this listing.
368  vpDisplay::display(I_depth);
369 #endif
370 
371  std::map<std::string, const vpImage<unsigned char> *> mapOfImages;
372  mapOfImages["Camera1"] = &I_current;
373 
374  std::map<std::string, const std::vector<vpColVector> *> mapOfPointclouds;
375  mapOfPointclouds["Camera2"] = &pointcloud_current;
376 
377  tracker.track(mapOfImages, mapOfPointclouds, mapOfWidths, mapOfHeights);
378  cMo = tracker.getPose();
379 
380 #ifdef DEBUG_DISPLAY
381  tracker.display(I, I_depth, cMo, depth_M_color * cMo, cam_color, cam_depth, vpColor::red, 3);
382  vpDisplay::displayFrame(I, cMo, cam_color, 0.05, vpColor::none, 3);
383  vpDisplay::displayFrame(I_depth, depth_M_color * cMo, cam_depth, 0.05, vpColor::none, 3);
384  vpDisplay::displayText(I, 20, 20, benchmarkNames[idx], vpColor::red);
// NOTE(review): original line 385 (the vpDisplay::displayText( call
// head) is missing; line 386 below is its argument list.
386  I, 40, 20, std::string("Nb features: " + std::to_string(tracker.getError().getRows())), vpColor::red);
387 
388  vpDisplay::flush(I);
389  vpDisplay::flush(I_depth);
390  vpTime::wait(33);
391 #endif
392  }
393 
394 #ifndef DEBUG_DISPLAY
395  return cMo;
396  };
397 #else
398  }
399 #endif
400 
// Sanity check on the benchmarked result: the final estimated pose must
// stay close to the last ground-truth pose of the sequence.
401  vpPoseVector pose_est(cMo);
402  vpPoseVector pose_truth(cMo_truth);
403  vpColVector t_err(3), tu_err(3);
404  for (unsigned int i = 0; i < 3; i++) {
405  t_err[i] = pose_est[i] - pose_truth[i];
406  tu_err[i] = pose_est[i + 3] - pose_truth[i + 3];
407  }
408 
// Tolerances: 6 mm translation error, 0.03 rad rotation (theta-u) error.
409  const double max_translation_error = 0.006;
410  const double max_rotation_error = 0.03;
411  CHECK(sqrt(t_err.sumSquare()) < max_translation_error);
412  CHECK(sqrt(tu_err.sumSquare()) < max_rotation_error);
413  }
414  }
415 } // if (runBenchmark)
416 }
417 
418 int main(int argc, char *argv[])
419 {
420  Catch::Session session;
421 
422  auto cli = session.cli() // Get Catch's composite command line parser
423  | Catch::Clara::Opt(runBenchmark) // bind variable to a new option, with a hint string
424  ["--benchmark"] // the option names it will respond to
425  ("run benchmark comparing naive code with ViSP implementation"); // description string for the help output
426 
427  // Now pass the new composite back to Catch so it uses that
428  session.cli(cli);
429  session.applyCommandLine(argc, argv);
430  int numFailed = session.run();
431  return numFailed;
432 }
433 
434 #else
435 #include <iostream>
436 
// Catch2 is not available in this build configuration: there is nothing to
// run, so report success.
int main() { return EXIT_SUCCESS; }
438 #endif
Generic class defining intrinsic camera parameters.
void initPersProjWithoutDistortion(double px, double py, double u0, double v0)
Implementation of column vector and the associated operations.
Definition: vpColVector.h:191
static const vpColor red
Definition: vpColor.h:217
static const vpColor none
Definition: vpColor.h:229
static void display(const vpImage< unsigned char > &I)
static void displayFrame(const vpImage< unsigned char > &I, const vpHomogeneousMatrix &cMo, const vpCameraParameters &cam, double size, const vpColor &color=vpColor::none, unsigned int thickness=1, const vpImagePoint &offset=vpImagePoint(0, 0), const std::string &frameName="", const vpColor &textColor=vpColor::black, const vpImagePoint &textOffset=vpImagePoint(15, 15))
static void flush(const vpImage< unsigned char > &I)
static void displayText(const vpImage< unsigned char > &I, const vpImagePoint &ip, const std::string &s, const vpColor &color)
Implementation of an homogeneous matrix and operations on such kind of matrices.
static void createDepthHistogram(const vpImage< uint16_t > &src_depth, vpImage< vpRGBa > &dest_rgba)
static void read(vpImage< unsigned char > &I, const std::string &filename, int backend=IO_DEFAULT_BACKEND)
Definition: vpImageIo.cpp:147
Definition of the vpImage class member functions.
Definition: vpImage.h:131
unsigned int getWidth() const
Definition: vpImage.h:242
void resize(unsigned int h, unsigned int w)
resize the image : Image initialization
Definition: vpImage.h:542
unsigned int getHeight() const
Definition: vpImage.h:181
static std::string getViSPImagesDataPath()
Definition: vpIoTools.cpp:1053
static bool checkFilename(const std::string &filename)
Definition: vpIoTools.cpp:786
static void readBinaryValueLE(std::ifstream &file, int16_t &short_value)
static std::string createFilePath(const std::string &parent, const std::string &child)
Definition: vpIoTools.cpp:1427
Wrapper for the KLT (Kanade-Lucas-Tomasi) feature tracker implemented in OpenCV. Thus to enable this ...
Definition: vpKltOpencv.h:74
void setBlockSize(int blockSize)
Definition: vpKltOpencv.h:267
void setQuality(double qualityLevel)
Definition: vpKltOpencv.h:356
void setHarrisFreeParameter(double harris_k)
Definition: vpKltOpencv.h:275
void setMaxFeatures(int maxCount)
Definition: vpKltOpencv.h:315
void setMinDistance(double minDistance)
Definition: vpKltOpencv.h:324
void setWindowSize(int winSize)
Definition: vpKltOpencv.h:377
void setPyramidLevels(int pyrMaxLevel)
Definition: vpKltOpencv.h:343
static double rad(double deg)
Definition: vpMath.h:129
Real-time 6D object pose tracking using its CAD model.
@ ROBUST_FEATURE_ESTIMATION
Robust scheme to estimate the normal of the plane.
Definition: vpMe.h:134
void setMu1(const double &mu_1)
Definition: vpMe.h:385
void setRange(const unsigned int &range)
Definition: vpMe.h:415
void setLikelihoodThresholdType(const vpLikelihoodThresholdType likelihood_threshold_type)
Definition: vpMe.h:505
void setMaskNumber(const unsigned int &mask_number)
Definition: vpMe.cpp:552
void setThreshold(const double &threshold)
Definition: vpMe.h:466
void setSampleStep(const double &sample_step)
Definition: vpMe.h:422
void setMaskSize(const unsigned int &mask_size)
Definition: vpMe.cpp:560
void setMu2(const double &mu_2)
Definition: vpMe.h:392
@ NORMALIZED_THRESHOLD
Definition: vpMe.h:145
static void convertPoint(const vpCameraParameters &cam, const double &u, const double &v, double &x, double &y)
Implementation of a pose vector and operations on poses.
Definition: vpPoseVector.h:203
VISP_EXPORT int wait(double t0, double t)