Visual Servoing Platform version 3.6.1 under development (2025-02-20)
tutorial-mb-generic-tracker-rgbd.cpp
#include <iostream>

#include <visp3/core/vpConfig.h>
#include <visp3/core/vpDisplay.h>
#include <visp3/core/vpIoTools.h>
#include <visp3/gui/vpDisplayFactory.h>
#include <visp3/io/vpImageIo.h>
#include <visp3/mbt/vpMbGenericTracker.h>

#if defined(VISP_HAVE_PCL) && defined(VISP_HAVE_PCL_COMMON)
#include <pcl/common/common.h>
#include <pcl/point_cloud.h>
#include <pcl/point_types.h>

#ifdef ENABLE_VISP_NAMESPACE
using namespace VISP_NAMESPACE_NAME;
#endif

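// Depth camera intrinsics, mirroring the librealsense intrinsics layout: principal point (ppx, ppy),
// focal lengths (fx, fy) in pixels, and distortion coefficients. They are used below to deproject
// each depth pixel into a 3D point.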
namespace
{
struct vpRealsenseIntrinsics_t
{
  float ppx;
  float ppy;
  float fx;
  float fy;
  float coeffs[5];
};

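// Deproject a pixel (u, v) with its depth (in meters) into a 3D point expressed in the depth camera
// frame: the pixel is first normalized with the intrinsics, the distortion coefficients are applied
// (all zero in this tutorial, so this step is a no-op), then the result is scaled by the depth
// following the pinhole model. The routine follows the librealsense deprojection convention.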
void rs_deproject_pixel_to_point(float point[3], const vpRealsenseIntrinsics_t &intrin, const float pixel[2], float depth)
{
  float x = (pixel[0] - intrin.ppx) / intrin.fx;
  float y = (pixel[1] - intrin.ppy) / intrin.fy;

  float r2 = x * x + y * y;
  float f = 1 + intrin.coeffs[0] * r2 + intrin.coeffs[1] * r2 * r2 + intrin.coeffs[4] * r2 * r2 * r2;
  float ux = x * f + 2 * intrin.coeffs[2] * x * y + intrin.coeffs[3] * (r2 + 2 * x * x);
  float uy = y * f + 2 * intrin.coeffs[3] * x * y + intrin.coeffs[2] * (r2 + 2 * y * y);

  x = ux;
  y = uy;

  point[0] = depth * x;
  point[1] = depth * y;
  point[2] = depth;
}

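// Read the data stored for frame <cpt>: the color image (color_image_%04d.jpg) and the raw 16-bit depth
// map saved as a binary file (little-endian height and width, then row-major uint16_t depth values).
// The organized point cloud is rebuilt from the depth map using hard-coded SR300 depth intrinsics.
// Returns false when a file is missing, which is used to stop the tracking loop.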
bool read_data(unsigned int cpt, const std::string &input_directory, vpImage<vpRGBa> &I_color,
               vpImage<uint16_t> &I_depth_raw, pcl::PointCloud<pcl::PointXYZ>::Ptr &pointcloud)
{
  char buffer[FILENAME_MAX];
  // Read color
  std::stringstream ss;
  ss << input_directory << "/color_image_%04d.jpg";
  snprintf(buffer, FILENAME_MAX, ss.str().c_str(), cpt);
  std::string filename_color = buffer;

  if (!vpIoTools::checkFilename(filename_color)) {
    std::cerr << "Cannot read: " << filename_color << std::endl;
    return false;
  }
  vpImageIo::read(I_color, filename_color);

  // Read raw depth
  ss.str("");
  ss << input_directory << "/depth_image_%04d.bin";
  snprintf(buffer, FILENAME_MAX, ss.str().c_str(), cpt);
  std::string filename_depth = buffer;

  std::ifstream file_depth(filename_depth.c_str(), std::ios::in | std::ios::binary);
  if (!file_depth.is_open()) {
    return false;
  }

  unsigned int height = 0, width = 0;
  vpIoTools::readBinaryValueLE(file_depth, height);
  vpIoTools::readBinaryValueLE(file_depth, width);
  I_depth_raw.resize(height, width);

  uint16_t depth_value = 0;
  for (unsigned int i = 0; i < height; i++) {
    for (unsigned int j = 0; j < width; j++) {
      vpIoTools::readBinaryValueLE(file_depth, depth_value);
      I_depth_raw[i][j] = depth_value;
    }
  }

  // Transform pointcloud
  pointcloud->width = width;
  pointcloud->height = height;
  pointcloud->resize((size_t)width * height);

  // Only for Creative SR300
  const float depth_scale = 0.00100000005f;
  vpRealsenseIntrinsics_t depth_intrinsic;
  depth_intrinsic.ppx = 320.503509521484f;
  depth_intrinsic.ppy = 235.602951049805f;
  depth_intrinsic.fx = 383.970001220703f;
  depth_intrinsic.fy = 383.970001220703f;
  depth_intrinsic.coeffs[0] = 0.0f;
  depth_intrinsic.coeffs[1] = 0.0f;
  depth_intrinsic.coeffs[2] = 0.0f;
  depth_intrinsic.coeffs[3] = 0.0f;
  depth_intrinsic.coeffs[4] = 0.0f;

  for (unsigned int i = 0; i < height; i++) {
    for (unsigned int j = 0; j < width; j++) {
      float scaled_depth = I_depth_raw[i][j] * depth_scale;
      float point[3];
      float pixel[2] = { (float)j, (float)i };
      rs_deproject_pixel_to_point(point, depth_intrinsic, pixel, scaled_depth);
      pointcloud->points[(size_t)(i * width + j)].x = point[0];
      pointcloud->points[(size_t)(i * width + j)].y = point[1];
      pointcloud->points[(size_t)(i * width + j)].z = point[2];
    }
  }

  return true;
}
} // namespace

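// Command-line options allow overriding the default data directory, the xml configuration files,
// the cao models, the init file, and disabling the depth feature (--disable_depth).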
int main(int argc, char *argv[])
{
  std::string input_directory = "data"; // location of the data (images, depth_map, point_cloud)
  std::string config_color = "model/cube/cube.xml", config_depth = "model/cube/cube_depth.xml";
  std::string model_color = "model/cube/cube.cao", model_depth = "model/cube/cube.cao";
  std::string init_file = "model/cube/cube.init";
  unsigned int frame_cpt = 0;
  bool disable_depth = false;

  for (int i = 1; i < argc; i++) {
    if (std::string(argv[i]) == "--input_directory" && i + 1 < argc) {
      input_directory = std::string(argv[i + 1]);
    }
    else if (std::string(argv[i]) == "--config_color" && i + 1 < argc) {
      config_color = std::string(argv[i + 1]);
    }
    else if (std::string(argv[i]) == "--config_depth" && i + 1 < argc) {
      config_depth = std::string(argv[i + 1]);
    }
    else if (std::string(argv[i]) == "--model_color" && i + 1 < argc) {
      model_color = std::string(argv[i + 1]);
    }
    else if (std::string(argv[i]) == "--model_depth" && i + 1 < argc) {
      model_depth = std::string(argv[i + 1]);
    }
    else if (std::string(argv[i]) == "--init_file" && i + 1 < argc) {
      init_file = std::string(argv[i + 1]);
    }
    else if (std::string(argv[i]) == "--disable_depth") {
      disable_depth = true;
    }
    else if (std::string(argv[i]) == "--help" || std::string(argv[i]) == "-h") {
      std::cout << "Usage: \n"
                << argv[0]
                << " --input_directory <data directory> --config_color <object.xml> --config_depth <object.xml>"
                   " --model_color <object.cao> --model_depth <object.cao> --init_file <object.init> --disable_depth"
                << std::endl;
      std::cout << "\nExample:\n"
                << argv[0]
                << " --config_color model/cube/cube.xml --config_depth model/cube/cube.xml"
                   " --model_color model/cube/cube.cao --model_depth model/cube/cube.cao --init_file model/cube/cube.init\n"
                << std::endl;
      return EXIT_SUCCESS;
    }
  }

  std::cout << "Tracked features: " << std::endl;
#if defined(VISP_HAVE_OPENCV)
  std::cout << " Use edges : 1" << std::endl;
#if defined(HAVE_OPENCV_IMGPROC) && defined(HAVE_OPENCV_VIDEO)
  std::cout << " Use klt : 1" << std::endl;
#else
  std::cout << " Use klt : 0" << std::endl;
#endif
  std::cout << " Use depth : " << !disable_depth << std::endl;
#else
  std::cout << " Use edges : 1" << std::endl;
  std::cout << " Use klt : 0" << std::endl;
  std::cout << " Use depth : 0" << std::endl;
#endif
  std::cout << "Config files: " << std::endl;
  std::cout << " Input directory: " << "\"" << input_directory << "\"" << std::endl;
  std::cout << " Config color: " << "\"" << config_color << "\"" << std::endl;
  std::cout << " Config depth: " << "\"" << config_depth << "\"" << std::endl;
  std::cout << " Model color : " << "\"" << model_color << "\"" << std::endl;
  std::cout << " Model depth : " << "\"" << model_depth << "\"" << std::endl;
  std::cout << " Init file : " << "\"" << init_file << "\"" << std::endl;

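  // Containers updated at each iteration: the color image, its grayscale conversion used by the
  // edge/KLT tracker, the raw 16-bit depth map, its histogram-equalized visualization, and the
  // organized PCL point cloud consumed by the dense depth tracker.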
  vpImage<vpRGBa> I_color;
  vpImage<unsigned char> I_gray, I_depth;
  vpImage<uint16_t> I_depth_raw;
  pcl::PointCloud<pcl::PointXYZ>::Ptr pointcloud(new pcl::PointCloud<pcl::PointXYZ>());
  vpCameraParameters cam_color, cam_depth;

  read_data(frame_cpt, input_directory, I_color, I_depth_raw, pointcloud);
  vpImageConvert::convert(I_color, I_gray);
  vpImageConvert::createDepthHistogram(I_depth_raw, I_depth);

#if defined(VISP_HAVE_DISPLAY)
#if (VISP_CXX_STANDARD >= VISP_CXX_STANDARD_11)
  std::shared_ptr<vpDisplay> display1 = vpDisplayFactory::createDisplay();
  std::shared_ptr<vpDisplay> display2 = vpDisplayFactory::createDisplay();
#else
  vpDisplay *display1 = vpDisplayFactory::allocateDisplay();
  vpDisplay *display2 = vpDisplayFactory::allocateDisplay();
#endif
  unsigned int _posx = 100, _posy = 50, _posdx = 10;
  display1->init(I_gray, _posx, _posy, "Color stream");
  display2->init(I_depth, _posx + I_gray.getWidth() + _posdx, _posy, "Depth stream");
#endif

  vpDisplay::display(I_gray);
  vpDisplay::display(I_depth);
  vpDisplay::flush(I_gray);
  vpDisplay::flush(I_depth);

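  // The generic tracker handles two cameras: "Camera1" is the color camera, tracked with moving edges
  // (and KLT keypoints when OpenCV imgproc/video modules are available), and "Camera2" is the depth
  // camera, tracked with the dense depth feature.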
  std::vector<int> trackerTypes;
#if defined(VISP_HAVE_OPENCV) && defined(HAVE_OPENCV_IMGPROC) && defined(HAVE_OPENCV_VIDEO)
  trackerTypes.push_back(vpMbGenericTracker::EDGE_TRACKER | vpMbGenericTracker::KLT_TRACKER);
#else
  trackerTypes.push_back(vpMbGenericTracker::EDGE_TRACKER);
#endif
  trackerTypes.push_back(vpMbGenericTracker::DEPTH_DENSE_TRACKER);
  vpMbGenericTracker tracker(trackerTypes);
#if defined(VISP_HAVE_PUGIXML)
  tracker.loadConfigFile(config_color, config_depth);
#else
  {
    vpCameraParameters cam_color, cam_depth;
    cam_color.initPersProjWithoutDistortion(614.9, 614.9, 320.2, 241.5);
    cam_depth.initPersProjWithoutDistortion(384.0, 384.0, 320.5, 235.6);
    tracker.setCameraParameters(cam_color, cam_depth);
  }

  // Edge
  vpMe me;
  me.setMaskSize(5);
  me.setMaskNumber(180);
  me.setRange(7);
  me.setLikelihoodThresholdType(vpMe::NORMALIZED_THRESHOLD);
  me.setThreshold(10);
  me.setMu1(0.5);
  me.setMu2(0.5);
  me.setSampleStep(4);
  tracker.setMovingEdge(me);

  // Klt
#if defined(VISP_HAVE_MODULE_KLT) && defined(VISP_HAVE_OPENCV) && defined(HAVE_OPENCV_IMGPROC) && defined(HAVE_OPENCV_VIDEO)
  vpKltOpencv klt;
  tracker.setKltMaskBorder(5);
  klt.setMaxFeatures(300);
  klt.setWindowSize(5);
  klt.setQuality(0.01);
  klt.setMinDistance(5);
  klt.setHarrisFreeParameter(0.01);
  klt.setBlockSize(3);
  klt.setPyramidLevels(3);

  tracker.setKltOpencv(klt);
#endif

  // Depth
  tracker.setDepthNormalFeatureEstimationMethod(vpMbtFaceDepthNormal::ROBUST_FEATURE_ESTIMATION);
  tracker.setDepthNormalPclPlaneEstimationMethod(2);
  tracker.setDepthNormalPclPlaneEstimationRansacMaxIter(200);
  tracker.setDepthNormalPclPlaneEstimationRansacThreshold(0.001);
  tracker.setDepthNormalSamplingStep(2, 2);

  tracker.setDepthDenseSamplingStep(4, 4);

  tracker.setAngleAppear(vpMath::rad(80.0));
  tracker.setAngleDisappear(vpMath::rad(85.0));
  tracker.setNearClippingDistance(0.001);
  tracker.setFarClippingDistance(5.0);
  tracker.setClipping(tracker.getClipping() | vpMbtPolygon::FOV_CLIPPING);
#endif
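  // Load the 3D CAD model (.cao), once for the color tracker and once for the depth tracker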
  tracker.loadModel(model_color, model_depth);

  tracker.getCameraParameters(cam_color, cam_depth);

  std::cout << "Camera parameters for color camera (from XML file): " << cam_color << std::endl;
  std::cout << "Camera parameters for depth camera (from XML file): " << cam_depth << std::endl;

  tracker.setDisplayFeatures(true);

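  // depth_M_color is the constant transformation between the depth and the color camera frames. It is
  // read from the data directory and passed to the tracker so that the pose estimated in the color
  // frame can be transferred to the depth frame.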
  vpHomogeneousMatrix depth_M_color;
  {
    std::ifstream file((std::string(input_directory + "/depth_M_color.txt")).c_str());
    depth_M_color.load(file);
    file.close();
  }
  std::map<std::string, vpHomogeneousMatrix> mapOfCameraTransformations;
  mapOfCameraTransformations["Camera1"] = vpHomogeneousMatrix();
  mapOfCameraTransformations["Camera2"] = depth_M_color;
  tracker.setCameraTransformationMatrix(mapOfCameraTransformations);
  std::cout << "depth_M_color: \n" << depth_M_color << std::endl;

  std::map<std::string, const vpImage<unsigned char> *> mapOfImages;
  mapOfImages["Camera1"] = &I_gray;
  mapOfImages["Camera2"] = &I_depth;

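  // Initialize the pose by clicking in the color image on the points listed in the .init file.
  // Only "Camera1" needs an init file; the depth camera pose is deduced through depth_M_color.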
  std::map<std::string, std::string> mapOfInitFiles;
  mapOfInitFiles["Camera1"] = init_file;
  tracker.initClick(mapOfImages, mapOfInitFiles, true);

  mapOfImages.clear();
  pcl::PointCloud<pcl::PointXYZ>::Ptr empty_pointcloud(new pcl::PointCloud<pcl::PointXYZ>);
  std::vector<double> times_vec;

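  // Main loop: read the next frame, feed the tracker with the grayscale image ("Camera1") and the point
  // cloud ("Camera2", or an empty cloud when --disable_depth is used), then retrieve and display the pose.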
  try {
    bool quit = false;
    while (!quit) {
      double t = vpTime::measureTimeMs();
      quit = !read_data(frame_cpt, input_directory, I_color, I_depth_raw, pointcloud);
      vpImageConvert::convert(I_color, I_gray);
      vpImageConvert::createDepthHistogram(I_depth_raw, I_depth);

      vpDisplay::display(I_gray);
      vpDisplay::display(I_depth);

      mapOfImages["Camera1"] = &I_gray;
      std::map<std::string, pcl::PointCloud<pcl::PointXYZ>::ConstPtr> mapOfPointclouds;
      if (disable_depth)
        mapOfPointclouds["Camera2"] = empty_pointcloud;
      else
        mapOfPointclouds["Camera2"] = pointcloud;

      tracker.track(mapOfImages, mapOfPointclouds);

      vpHomogeneousMatrix cMo = tracker.getPose();

      std::cout << "iter: " << frame_cpt << " cMo:\n" << cMo << std::endl;

      tracker.display(I_gray, I_depth, cMo, depth_M_color * cMo, cam_color, cam_depth, vpColor::red, 3);
      vpDisplay::displayFrame(I_gray, cMo, cam_color, 0.05, vpColor::none, 3);
      vpDisplay::displayFrame(I_depth, depth_M_color * cMo, cam_depth, 0.05, vpColor::none, 3);

      t = vpTime::measureTimeMs() - t;
      times_vec.push_back(t);

      std::stringstream ss;
      ss << "Computation time: " << t << " ms";
      vpDisplay::displayText(I_gray, 20, 20, ss.str(), vpColor::red);
      {
        std::stringstream ss;
        ss << "Nb features: " << tracker.getError().size();
        vpDisplay::displayText(I_gray, I_gray.getHeight() - 50, 20, ss.str(), vpColor::red);
      }
      {
        std::stringstream ss;
        ss << "Features: edges " << tracker.getNbFeaturesEdge() << ", klt " << tracker.getNbFeaturesKlt() << ", depth "
           << tracker.getNbFeaturesDepthDense();
        vpDisplay::displayText(I_gray, I_gray.getHeight() - 30, 20, ss.str(), vpColor::red);
      }

      vpDisplay::flush(I_gray);
      vpDisplay::flush(I_depth);

      vpMouseButton::vpMouseButtonType button;
      if (vpDisplay::getClick(I_gray, button, false)) {
        quit = true;
      }

      frame_cpt++;
    }
  }
  catch (const vpException &e) {
    std::cout << "Catch exception: " << e.getStringMessage() << std::endl;
  }

#if (VISP_CXX_STANDARD < VISP_CXX_STANDARD_11) && defined(VISP_HAVE_DISPLAY)
  if (display1 != nullptr) {
    delete display1;
  }
  if (display2 != nullptr) {
    delete display2;
  }
#endif

  std::cout << "\nProcessing time, Mean: " << vpMath::getMean(times_vec)
            << " ms ; Median: " << vpMath::getMedian(times_vec) << " ms ; Std: " << vpMath::getStdev(times_vec)
            << " ms" << std::endl;

  vpDisplay::displayText(I_gray, 60, 20, "Click to quit", vpColor::red);
  vpDisplay::flush(I_gray);
  vpDisplay::getClick(I_gray);

  return EXIT_SUCCESS;
}
#else
int main()
{
  std::cout << "To run this tutorial, ViSP should be built with the PCL library."
               " Install libpcl, then configure and build ViSP again..."
            << std::endl;
  return EXIT_SUCCESS;
}
#endif