doxygen/visp-daily/perfGenericTracker_8cpp-example.html

/*

 * ViSP, open source Visual Servoing Platform software.

 * Copyright (C) 2005 - 2024 by Inria. All rights reserved.

 *

 * This software is free software; you can redistribute it and/or modify

 * it under the terms of the GNU General Public License as published by

 * the Free Software Foundation; either version 2 of the License, or

 * (at your option) any later version.

 * See the file LICENSE.txt at the root directory of this source

 * distribution for additional information about the GNU GPL.

 *

 * For using ViSP with software that can not be combined with the GNU

 * GPL, please contact Inria about acquiring a ViSP Professional

 * Edition License.

 *

 * See https://visp.inria.fr for more information.

 *

 * This software was developed at:

 * Inria Rennes - Bretagne Atlantique

 * Campus Universitaire de Beaulieu

 * 35042 Rennes Cedex

 * France

 *

 * If you have questions regarding the use of this file, please contact

 * Inria at visp@inria.fr

 *

 * This file is provided AS IS with NO WARRANTY OF ANY KIND, INCLUDING THE

 * WARRANTY OF DESIGN, MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.

 *

 * Description:

 * Benchmark generic tracker.

 */


#include <visp3/core/vpConfig.h>


#if defined(VISP_HAVE_CATCH2)


#include <catch_amalgamated.hpp>


#include <visp3/core/vpIoTools.h>

#include <visp3/io/vpImageIo.h>

#include <visp3/mbt/vpMbGenericTracker.h>


// #define DEBUG_DISPLAY // uncomment to check that the tracking is correct

#ifdef DEBUG_DISPLAY

#include <visp3/gui/vpDisplayX.h>

#endif


#ifdef ENABLE_VISP_NAMESPACE

using namespace VISP_NAMESPACE_NAME;

#endif


namespace
{
// Bound to the "--benchmark" command line option in main(); the test case body is skipped while it is false.
bool runBenchmark = false;

/*!
 * Load one frame of the dataset: the color/gray image, the raw depth map, the point cloud computed from the
 * depth map, and the pose stored next to them.
 *
 * \param input_directory : Dataset root; files are looked up in its Images/, Depth/ and CameraPose/ sub-folders.
 * \param cpt : Frame index used to build the three file names.
 * \param cam_depth : Intrinsics used to convert depth pixels into normalized coordinates.
 * \param I : [out] Image read from Images/Image_<cpt>.<ext>.
 * \param I_depth : [out] Raw 16-bit depth map read from Depth/Depth_<cpt>.bin.
 * \param pointcloud : [out] One homogeneous 3D point (x*Z, y*Z, Z, 1) per depth pixel, stored row by row.
 * \param cMo : [out] 4x4 matrix read from CameraPose/Camera_<cpt>.txt.
 * \return true when the frame was loaded, false when a file is missing, cannot be opened, or the depth file
 * is shorter than its header announces.
 */
template <typename Type>
bool read_data(const std::string &input_directory, int cpt, const vpCameraParameters &cam_depth, vpImage<Type> &I,
               vpImage<uint16_t> &I_depth, std::vector<vpColVector> &pointcloud, vpHomogeneousMatrix &cMo)
{
  static_assert(std::is_same<Type, unsigned char>::value || std::is_same<Type, vpRGBa>::value,
                "Template function supports only unsigned char and vpRGBa images!");
#if VISP_HAVE_DATASET_VERSION >= 0x030600
  const std::string ext("png");
#else
  const std::string ext("pgm");
#endif

  // The directory is passed as a "%s" argument instead of being spliced into the format string, so that a
  // '%' character in the dataset path cannot be interpreted as a conversion specifier.
  char buffer[FILENAME_MAX];
  snprintf(buffer, FILENAME_MAX, "%s/Images/Image_%04d.%s", input_directory.c_str(), cpt, ext.c_str());
  const std::string image_filename = buffer;

  snprintf(buffer, FILENAME_MAX, "%s/Depth/Depth_%04d.bin", input_directory.c_str(), cpt);
  const std::string depth_filename = buffer;

  // Pose files use a 3-digit index whereas images and depth maps use 4 digits.
  snprintf(buffer, FILENAME_MAX, "%s/CameraPose/Camera_%03d.txt", input_directory.c_str(), cpt);
  const std::string pose_filename = buffer;

  if (!vpIoTools::checkFilename(image_filename) || !vpIoTools::checkFilename(depth_filename) ||
      !vpIoTools::checkFilename(pose_filename)) {
    return false;
  }

  vpImageIo::read(I, image_filename);

  std::ifstream file_depth(depth_filename.c_str(), std::ios::in | std::ios::binary);
  if (!file_depth.is_open()) {
    return false;
  }

  // Binary layout: height, width, then height*width 16-bit depth values (little endian).
  unsigned int depth_width = 0, depth_height = 0;
  vpIoTools::readBinaryValueLE(file_depth, depth_height);
  vpIoTools::readBinaryValueLE(file_depth, depth_width);
  if (!file_depth) {
    // Header could not be read: do not size the outputs from undefined dimensions.
    return false;
  }
  I_depth.resize(depth_height, depth_width);
  pointcloud.resize(depth_height * depth_width);

  // Factor applied to the raw 16-bit value to obtain Z (numerically close to 1/32768).
  const float depth_scale = 0.000030518f;
  for (unsigned int i = 0; i < I_depth.getHeight(); i++) {
    for (unsigned int j = 0; j < I_depth.getWidth(); j++) {
      vpIoTools::readBinaryValueLE(file_depth, I_depth[i][j]);
      double x = 0.0, y = 0.0, Z = I_depth[i][j] * depth_scale;
      vpPixelMeterConversion::convertPoint(cam_depth, j, i, x, y);
      vpColVector pt3d(4, 1.0);
      pt3d[0] = x * Z;
      pt3d[1] = y * Z;
      pt3d[2] = Z;
      pointcloud[i * I_depth.getWidth() + j] = pt3d;
    }
  }
  if (!file_depth) {
    // The file ended before height*width values were read: the point cloud would be partly garbage.
    return false;
  }

  std::ifstream file_pose(pose_filename.c_str());
  if (!file_pose.is_open()) {
    return false;
  }

  for (unsigned int i = 0; i < 4; i++) {
    for (unsigned int j = 0; j < 4; j++) {
      file_pose >> cMo[i][j];
    }
  }

  return true;
}
} // anonymous namespace


// Benchmark of vpMbGenericTracker on the "mbt-depth/Castle-simu" dataset.
// The sequence (frames 1..40 followed by 40..1) is loaded in memory once, then each tracker configuration
// listed in mapOfTrackerTypes is tracked over the whole sequence and its final pose is compared with the
// pose read for the last loaded frame.
// Nothing is executed unless runBenchmark is true.
TEST_CASE("Benchmark generic tracker", "[benchmark]")

{

  if (runBenchmark) {

    // Two-camera tracker: the first camera uses edges, the second one dense depth.
    std::vector<int> tracker_type(2);

    tracker_type[0] = vpMbGenericTracker::EDGE_TRACKER;

    tracker_type[1] = vpMbGenericTracker::DEPTH_DENSE_TRACKER;

    vpMbGenericTracker tracker(tracker_type);


    const std::string input_directory =

      vpIoTools::createFilePath(vpIoTools::getViSPImagesDataPath(), "mbt-depth/Castle-simu");


    const bool verbose = false;

#if defined(VISP_HAVE_PUGIXML)

    // Settings come from the two XML files shipped with the dataset.
    const std::string configFileCam1 = input_directory + std::string("/Config/chateau.xml");

    const std::string configFileCam2 = input_directory + std::string("/Config/chateau_depth.xml");

    REQUIRE(vpIoTools::checkFilename(configFileCam1));

    REQUIRE(vpIoTools::checkFilename(configFileCam2));

    tracker.loadConfigFile(configFileCam1, configFileCam2, verbose);

#else

    // Without pugixml the XML files cannot be parsed: the settings are hard-coded instead.
    {

      vpCameraParameters cam_color, cam_depth;

      cam_color.initPersProjWithoutDistortion(700.0, 700.0, 320.0, 240.0);

      cam_depth.initPersProjWithoutDistortion(700.0, 700.0, 320.0, 240.0);

      tracker.setCameraParameters(cam_color, cam_depth);

    }


    // Edge

    vpMe me;

    me.setMaskSize(5);

    me.setMaskNumber(180);

    me.setRange(8);

    me.setLikelihoodThresholdType(vpMe::NORMALIZED_THRESHOLD);

    me.setThreshold(5);

    me.setMu1(0.5);

    me.setMu2(0.5);

    me.setSampleStep(5);

    tracker.setMovingEdge(me);


    // Klt

#if defined(VISP_HAVE_MODULE_KLT) && defined(VISP_HAVE_OPENCV) && defined(HAVE_OPENCV_IMGPROC) && defined(HAVE_OPENCV_VIDEO)

    vpKltOpencv klt;

    tracker.setKltMaskBorder(5);

    klt.setMaxFeatures(10000);

    klt.setWindowSize(5);

    klt.setQuality(0.01);

    klt.setMinDistance(5);

    klt.setHarrisFreeParameter(0.02);

    klt.setBlockSize(3);

    klt.setPyramidLevels(3);


    tracker.setKltOpencv(klt);

#endif


    // Depth

    tracker.setDepthNormalFeatureEstimationMethod(vpMbtFaceDepthNormal::ROBUST_FEATURE_ESTIMATION);

    tracker.setDepthNormalPclPlaneEstimationMethod(2);

    tracker.setDepthNormalPclPlaneEstimationRansacMaxIter(200);

    tracker.setDepthNormalPclPlaneEstimationRansacThreshold(0.001);

    tracker.setDepthNormalSamplingStep(2, 2);


    tracker.setDepthDenseSamplingStep(4, 4);


    tracker.setAngleAppear(vpMath::rad(85.0));

    tracker.setAngleDisappear(vpMath::rad(89.0));

    tracker.setNearClippingDistance(0.01);

    tracker.setFarClippingDistance(2.0);

    tracker.setClipping(tracker.getClipping() | vpMbtPolygon::FOV_CLIPPING);

#endif


    // The same CAD model file is given for both cameras.
    REQUIRE(vpIoTools::checkFilename(input_directory + "/Models/chateau.cao"));

    tracker.loadModel(input_directory + "/Models/chateau.cao", input_directory + "/Models/chateau.cao", verbose);


    // Transformation passed along with cube.cao when that second model is loaded.
    // Only the entries assigned below are overwritten; the others keep the values set by the default
    // constructor (presumably identity -- confirm in vpHomogeneousMatrix).
    vpHomogeneousMatrix T;

    T[0][0] = -1;

    T[0][3] = -0.2;

    T[1][1] = 0;

    T[1][2] = 1;

    T[1][3] = 0.12;

    T[2][1] = 1;

    T[2][2] = 0;

    T[2][3] = -0.15;

    tracker.loadModel(input_directory + "/Models/cube.cao", verbose, T);


    // Scratch objects filled by read_data() for each frame before being copied in the vectors below.
    vpImage<unsigned char> I;

    vpImage<uint16_t> I_depth_raw;

    vpHomogeneousMatrix cMo_truth;

    std::vector<vpColVector> pointcloud;


    vpCameraParameters cam_color, cam_depth;

    tracker.getCameraParameters(cam_color, cam_depth);


    // Transformation registered for "Camera2"; only its [0][3] entry is changed from the default value.
    vpHomogeneousMatrix depth_M_color;

    depth_M_color[0][3] = -0.05;

    tracker.setCameraTransformationMatrix("Camera2", depth_M_color);


    // load all the data in memory to not take into account I/O from disk

    std::vector<vpImage<unsigned char> > images;

    std::vector<vpImage<uint16_t> > depth_raws;

    std::vector<std::vector<vpColVector> > pointclouds;

    std::vector<vpHomogeneousMatrix> cMo_truth_all;

    // forward
    // Frames for which read_data() returns false are silently skipped.

    for (int i = 1; i <= 40; i++) {

      if (read_data(input_directory, i, cam_depth, I, I_depth_raw, pointcloud, cMo_truth)) {

        images.push_back(I);

        depth_raws.push_back(I_depth_raw);

        pointclouds.push_back(pointcloud);

        cMo_truth_all.push_back(cMo_truth);

      }

    }

    // backward
    // After this loop cMo_truth holds the pose of the last frame read (frame 1 when it is available);
    // it is the ground truth used by the checks at the end of each benchmark.

    for (int i = 40; i >= 1; i--) {

      if (read_data(input_directory, i, cam_depth, I, I_depth_raw, pointcloud, cMo_truth)) {

        images.push_back(I);

        depth_raws.push_back(I_depth_raw);

        pointclouds.push_back(pointcloud);

        cMo_truth_all.push_back(cMo_truth);

      }

    }

    // NOTE(review): images.front() / cMo_truth_all.front() are used below without checking that at least
    // one frame was loaded.


    // Stereo MBT

    {

      // mapOfTrackerTypes, benchmarkNames and monoculars are parallel arrays indexed by idx in the loop below.
      // NOTE(review): the entries added here are guarded by VISP_HAVE_OPENCV && HAVE_OPENCV_IMGPROC &&
      // HAVE_OPENCV_VIDEO whereas the matching names/flags are guarded by VISP_HAVE_OPENCV only; the loop
      // iterates over mapOfTrackerTypes, so extra names are simply unused.
      std::vector<std::map<std::string, int> > mapOfTrackerTypes;

      mapOfTrackerTypes.push_back(

          { {"Camera1", vpMbGenericTracker::EDGE_TRACKER}, {"Camera2", vpMbGenericTracker::DEPTH_DENSE_TRACKER} });

      mapOfTrackerTypes.push_back(

          { {"Camera1", vpMbGenericTracker::EDGE_TRACKER}, {"Camera2", vpMbGenericTracker::DEPTH_DENSE_TRACKER} });

#if defined(VISP_HAVE_OPENCV) && defined(HAVE_OPENCV_IMGPROC) && defined(HAVE_OPENCV_VIDEO)

      mapOfTrackerTypes.push_back(

          { {"Camera1", vpMbGenericTracker::KLT_TRACKER}, {"Camera2", vpMbGenericTracker::DEPTH_DENSE_TRACKER} });

      mapOfTrackerTypes.push_back({ {"Camera1", vpMbGenericTracker::EDGE_TRACKER | vpMbGenericTracker::KLT_TRACKER},

                                   {"Camera2", vpMbGenericTracker::DEPTH_DENSE_TRACKER} });

      mapOfTrackerTypes.push_back({ {"Camera1", vpMbGenericTracker::EDGE_TRACKER | vpMbGenericTracker::KLT_TRACKER},

                                   {"Camera2", vpMbGenericTracker::DEPTH_DENSE_TRACKER} });

#endif


      // NOTE(review): the 4th name ("KLT + depth dense MBT") is paired with an EDGE | KLT tracker type
      // above -- confirm which of the two is intended.
      std::vector<std::string> benchmarkNames = {

        "Edge MBT",

        "Edge + Depth dense MBT",

#if defined(VISP_HAVE_OPENCV)

        "KLT MBT",

        "KLT + depth dense MBT",

        "Edge + KLT + depth dense MBT"

#endif

      };


      // When the flag is true, the Camera2 width and height given to track() are set to 0
      // (presumably so that the depth data is ignored -- confirm in vpMbGenericTracker::track).
      std::vector<bool> monoculars = {

        true,

        false,

#if defined(VISP_HAVE_OPENCV)

        true,

        false,

        false

#endif

      };


      for (size_t idx = 0; idx < mapOfTrackerTypes.size(); idx++) {

        // Start from a clean tracker: the settings and models are loaded again after the reset.
        tracker.resetTracker();

        tracker.setTrackerType(mapOfTrackerTypes[idx]);


        // Shadows the outer `verbose` declared at the top of the test case (same value).
        const bool verbose = false;

#if defined(VISP_HAVE_PUGIXML)

        tracker.loadConfigFile(configFileCam1, configFileCam2, verbose);

#else

        // Same hard-coded settings as the ones applied before the loop.
        {

          vpCameraParameters cam_color, cam_depth;

          cam_color.initPersProjWithoutDistortion(700.0, 700.0, 320.0, 240.0);

          cam_depth.initPersProjWithoutDistortion(700.0, 700.0, 320.0, 240.0);

          tracker.setCameraParameters(cam_color, cam_depth);

        }


        // Edge

        vpMe me;

        me.setMaskSize(5);

        me.setMaskNumber(180);

        me.setRange(8);

        me.setLikelihoodThresholdType(vpMe::NORMALIZED_THRESHOLD);

        me.setThreshold(5);

        me.setMu1(0.5);

        me.setMu2(0.5);

        me.setSampleStep(5);

        tracker.setMovingEdge(me);


        // Klt

#if defined(VISP_HAVE_MODULE_KLT) && defined(VISP_HAVE_OPENCV) && defined(HAVE_OPENCV_IMGPROC) && defined(HAVE_OPENCV_VIDEO)

        vpKltOpencv klt;

        tracker.setKltMaskBorder(5);

        klt.setMaxFeatures(10000);

        klt.setWindowSize(5);

        klt.setQuality(0.01);

        klt.setMinDistance(5);

        klt.setHarrisFreeParameter(0.02);

        klt.setBlockSize(3);

        klt.setPyramidLevels(3);


        tracker.setKltOpencv(klt);

#endif


        // Depth

        tracker.setDepthNormalFeatureEstimationMethod(vpMbtFaceDepthNormal::ROBUST_FEATURE_ESTIMATION);

        tracker.setDepthNormalPclPlaneEstimationMethod(2);

        tracker.setDepthNormalPclPlaneEstimationRansacMaxIter(200);

        tracker.setDepthNormalPclPlaneEstimationRansacThreshold(0.001);

        tracker.setDepthNormalSamplingStep(2, 2);


        tracker.setDepthDenseSamplingStep(4, 4);


        tracker.setAngleAppear(vpMath::rad(85.0));

        tracker.setAngleDisappear(vpMath::rad(89.0));

        tracker.setNearClippingDistance(0.01);

        tracker.setFarClippingDistance(2.0);

        tracker.setClipping(tracker.getClipping() | vpMbtPolygon::FOV_CLIPPING);

#endif

        tracker.loadModel(input_directory + "/Models/chateau.cao", input_directory + "/Models/chateau.cao", verbose);

        tracker.loadModel(input_directory + "/Models/cube.cao", verbose, T);

        tracker.initFromPose(images.front(), cMo_truth_all.front());


        // Depth map size given to track() for "Camera2"; forced to 0x0 for the monocular configurations.
        // I_depth_raw still holds the last depth map read by the loading loops.
        std::map<std::string, unsigned int> mapOfWidths, mapOfHeights;

        mapOfWidths["Camera2"] = monoculars[idx] ? 0 : I_depth_raw.getWidth();

        mapOfHeights["Camera2"] = monoculars[idx] ? 0 : I_depth_raw.getHeight();


        vpHomogeneousMatrix cMo;

        // Without DEBUG_DISPLAY the braces that follow are the body of the BENCHMARK, which returns cMo.
        // With DEBUG_DISPLAY they form a plain scope executed once, with the tracking results displayed.
#ifndef DEBUG_DISPLAY

        BENCHMARK(benchmarkNames[idx].c_str())

#else

        vpImage<unsigned char> I_depth;

        vpImageConvert::createDepthHistogram(I_depth_raw, I_depth);


        vpDisplayX d_color(I, 0, 0, "Color image");

        vpDisplayX d_depth(I_depth, I.getWidth(), 0, "Depth image");

        tracker.setDisplayFeatures(true);

#endif

        {

          // Re-initialize from the first ground-truth pose before going through the sequence.
          tracker.initFromPose(images.front(), cMo_truth_all.front());


          for (size_t i = 0; i < images.size(); i++) {

            const vpImage<unsigned char> &I_current = images[i];

            const std::vector<vpColVector> &pointcloud_current = pointclouds[i];


#ifdef DEBUG_DISPLAY

            vpImageConvert::createDepthHistogram(depth_raws[i], I_depth);

            I = I_current;

            vpDisplay::display(I);

            vpDisplay::display(I_depth);

#endif


            // The image feeds "Camera1" and the point cloud feeds "Camera2".
            std::map<std::string, const vpImage<unsigned char> *> mapOfImages;

            mapOfImages["Camera1"] = &I_current;


            std::map<std::string, const std::vector<vpColVector> *> mapOfPointclouds;

            mapOfPointclouds["Camera2"] = &pointcloud_current;


            tracker.track(mapOfImages, mapOfPointclouds, mapOfWidths, mapOfHeights);

            cMo = tracker.getPose();


#ifdef DEBUG_DISPLAY

            tracker.display(I, I_depth, cMo, depth_M_color * cMo, cam_color, cam_depth, vpColor::red, 3);

            vpDisplay::displayFrame(I, cMo, cam_color, 0.05, vpColor::none, 3);

            vpDisplay::displayFrame(I_depth, depth_M_color * cMo, cam_depth, 0.05, vpColor::none, 3);

            vpDisplay::displayText(I, 20, 20, benchmarkNames[idx], vpColor::red);

            vpDisplay::displayText(

                I, 40, 20, std::string("Nb features: " + std::to_string(tracker.getError().getRows())), vpColor::red);


            vpDisplay::flush(I);

            vpDisplay::flush(I_depth);

            vpTime::wait(33);

#endif

          }


#ifndef DEBUG_DISPLAY

          return cMo;

        };

#else

      }

#endif


        // Compare the pose estimated on the last frame with cMo_truth, i.e. the pose returned by the last
        // successful read_data() call of the loading loops.
        vpPoseVector pose_est(cMo);

        vpPoseVector pose_truth(cMo_truth);

        // First three pose components go to t_err, last three to tu_err.
        vpColVector t_err(3), tu_err(3);

        for (unsigned int i = 0; i < 3; i++) {

          t_err[i] = pose_est[i] - pose_truth[i];

          tu_err[i] = pose_est[i + 3] - pose_truth[i + 3];

        }


        // Upper bounds on the Euclidean norm of each error vector
        // (presumably meters and radians -- confirm against vpPoseVector).
        const double max_translation_error = 0.006;

        const double max_rotation_error = 0.03;

        CHECK(sqrt(t_err.sumSquare()) < max_translation_error);

        CHECK(sqrt(tu_err.sumSquare()) < max_rotation_error);

    }

  }

} // if (runBenchmark)

}


// Entry point used when Catch2 is available: adds a "--benchmark" flag to the Catch2 command line, bound to
// runBenchmark, then runs the session.
// Returns the code reported by the command line parser when it is non-zero, otherwise the value returned by
// Catch::Session::run().
int main(int argc, char *argv[])
{
  Catch::Session session;

  auto cli = session.cli()         // Get Catch's composite command line parser
    | Catch::Clara::Opt(runBenchmark)   // bind variable to a new option, with a hint string
    ["--benchmark"] // the option names it will respond to
    ("run benchmark comparing naive code with ViSP implementation"); // description string for the help output

  // Now pass the new composite back to Catch so it uses that
  session.cli(cli);

  // Stop here on a command line error instead of running the session with a half-parsed configuration.
  const int returnCode = session.applyCommandLine(argc, argv);
  if (returnCode != 0) {
    return returnCode;
  }

  return session.run();
}


#else

#include <iostream>


// Fallback entry point compiled when VISP_HAVE_CATCH2 is not defined: there is nothing to run, report success.
// Returns 0 directly so that the branch does not depend on <cstdlib> for EXIT_SUCCESS.
int main() { return 0; }

#endif

vpCameraParameters
Generic class defining intrinsic camera parameters.
Definition: vpCameraParameters.h:310

vpCameraParameters::initPersProjWithoutDistortion
void initPersProjWithoutDistortion(double px, double py, double u0, double v0)
Definition: vpCameraParameters.cpp:202

vpColVector
Implementation of column vector and the associated operations.
Definition: vpColVector.h:191

vpColor::red
static const vpColor red
Definition: vpColor.h:217

vpColor::none
static const vpColor none
Definition: vpColor.h:229

vpDisplay::display
static void display(const vpImage< unsigned char > &I)
Definition: vpDisplay_uchar.cpp:830

vpDisplay::displayFrame
static void displayFrame(const vpImage< unsigned char > &I, const vpHomogeneousMatrix &cMo, const vpCameraParameters &cam, double size, const vpColor &color=vpColor::none, unsigned int thickness=1, const vpImagePoint &offset=vpImagePoint(0, 0), const std::string &frameName="", const vpColor &textColor=vpColor::black, const vpImagePoint &textOffset=vpImagePoint(15, 15))
Definition: vpDisplay_uchar.cpp:413

vpDisplay::flush
static void flush(const vpImage< unsigned char > &I)
Definition: vpDisplay_uchar.cpp:806

vpDisplay::displayText
static void displayText(const vpImage< unsigned char > &I, const vpImagePoint &ip, const std::string &s, const vpColor &color)
Definition: vpDisplay_uchar.cpp:750

vpHomogeneousMatrix
Implementation of a homogeneous matrix and the operations on such matrices.
Definition: vpHomogeneousMatrix.h:221

vpImageConvert::createDepthHistogram
static void createDepthHistogram(const vpImage< uint16_t > &src_depth, vpImage< vpRGBa > &dest_rgba)
Definition: vpImageConvert.cpp:253

vpImageIo::read
static void read(vpImage< unsigned char > &I, const std::string &filename, int backend=IO_DEFAULT_BACKEND)
Definition: vpImageIo.cpp:147

vpImage
Definition of the vpImage class member functions.
Definition: vpImage.h:131

vpImage::getWidth
unsigned int getWidth() const
Definition: vpImage.h:242

vpImage::resize
void resize(unsigned int h, unsigned int w)
Resize the image (image initialization).
Definition: vpImage.h:542

vpImage::getHeight
unsigned int getHeight() const
Definition: vpImage.h:181

vpIoTools::getViSPImagesDataPath
static std::string getViSPImagesDataPath()
Definition: vpIoTools.cpp:1053

vpIoTools::checkFilename
static bool checkFilename(const std::string &filename)
Definition: vpIoTools.cpp:786

vpIoTools::readBinaryValueLE
static void readBinaryValueLE(std::ifstream &file, int16_t &short_value)
Definition: vpIoTools_config_file.cpp:469

vpIoTools::createFilePath
static std::string createFilePath(const std::string &parent, const std::string &child)
Definition: vpIoTools.cpp:1427

vpKltOpencv
Wrapper for the KLT (Kanade-Lucas-Tomasi) feature tracker implemented in OpenCV. Thus to enable this ...
Definition: vpKltOpencv.h:74

vpKltOpencv::setBlockSize
void setBlockSize(int blockSize)
Definition: vpKltOpencv.h:267

vpKltOpencv::setQuality
void setQuality(double qualityLevel)
Definition: vpKltOpencv.h:356

vpKltOpencv::setHarrisFreeParameter
void setHarrisFreeParameter(double harris_k)
Definition: vpKltOpencv.h:275

vpKltOpencv::setMaxFeatures
void setMaxFeatures(int maxCount)
Definition: vpKltOpencv.h:315

vpKltOpencv::setMinDistance
void setMinDistance(double minDistance)
Definition: vpKltOpencv.h:324

vpKltOpencv::setWindowSize
void setWindowSize(int winSize)
Definition: vpKltOpencv.h:377

vpKltOpencv::setPyramidLevels
void setPyramidLevels(int pyrMaxLevel)
Definition: vpKltOpencv.h:343

vpMath::rad
static double rad(double deg)
Definition: vpMath.h:129

vpMbGenericTracker
Real-time 6D object pose tracking using its CAD model.
Definition: vpMbGenericTracker.h:201

vpMbGenericTracker::EDGE_TRACKER
@ EDGE_TRACKER
Definition: vpMbGenericTracker.h:205

vpMbGenericTracker::DEPTH_DENSE_TRACKER
@ DEPTH_DENSE_TRACKER
Definition: vpMbGenericTracker.h:210

vpMbtFaceDepthNormal::ROBUST_FEATURE_ESTIMATION
@ ROBUST_FEATURE_ESTIMATION
Robust scheme to estimate the normal of the plane.
Definition: vpMbtFaceDepthNormal.h:71

vpMe
Definition: vpMe.h:134

vpMe::setMu1
void setMu1(const double &mu_1)
Definition: vpMe.h:385

vpMe::setRange
void setRange(const unsigned int &range)
Definition: vpMe.h:415

vpMe::setLikelihoodThresholdType
void setLikelihoodThresholdType(const vpLikelihoodThresholdType likelihood_threshold_type)
Definition: vpMe.h:505

vpMe::setMaskNumber
void setMaskNumber(const unsigned int &mask_number)
Definition: vpMe.cpp:552

vpMe::setThreshold
void setThreshold(const double &threshold)
Definition: vpMe.h:466

vpMe::setSampleStep
void setSampleStep(const double &sample_step)
Definition: vpMe.h:422

vpMe::setMaskSize
void setMaskSize(const unsigned int &mask_size)
Definition: vpMe.cpp:560

vpMe::setMu2
void setMu2(const double &mu_2)
Definition: vpMe.h:392

vpMe::NORMALIZED_THRESHOLD
@ NORMALIZED_THRESHOLD
Definition: vpMe.h:145

vpPixelMeterConversion::convertPoint
static void convertPoint(const vpCameraParameters &cam, const double &u, const double &v, double &x, double &y)
Definition: vpPixelMeterConversion.h:102

vpPolygon3D::FOV_CLIPPING
@ FOV_CLIPPING
Definition: vpPolygon3D.h:68

vpPoseVector
Implementation of a pose vector and operations on poses.
Definition: vpPoseVector.h:203

VISP_NAMESPACE_NAME
Definition: vpEigenConversion.h:44

vpTime::wait
VISP_EXPORT int wait(double t0, double t)