doxygen/visp-daily/tutorial-apriltag-detector-live-rgbd-realsense_8cpp-example.html

#include <memory>

#include <visp3/core/vpConfig.h>

#ifdef VISP_HAVE_MODULE_SENSOR

#include <visp3/sensor/vpRealSense2.h>

#endif

#include <visp3/detection/vpDetectorAprilTag.h>

#include <visp3/core/vpImageConvert.h>

#include <visp3/gui/vpDisplayGDI.h>

#include <visp3/gui/vpDisplayOpenCV.h>

#include <visp3/gui/vpDisplayX.h>

#include <visp3/vision/vpPose.h>


// Live AprilTag detection on a RealSense RGB-D stream.
//
// For every acquired frame the program:
//   1. grabs a color image and a raw depth image (depth is passed through an
//      rs2::align object targeting the color stream),
//   2. converts the raw depth to a float depth map using the device depth scale,
//   3. detects the tags in the grayscale image and draws the pose returned by
//      the detector in the first window,
//   4. recomputes each tag pose with vpPose::computePlanarObjectPoseFromRGBD()
//      and draws it in the second window, colored by confidence index.
//
// The loop stops on a mouse click in the first window; timing statistics are
// then printed.
//
// Command line options are listed by --help.
//
// Returns EXIT_SUCCESS on normal termination (or when the required 3rd parties
// are missing) and EXIT_FAILURE when a vpException is caught.
int main(int argc, const char **argv)
{
#if defined(VISP_HAVE_APRILTAG) && defined(VISP_HAVE_REALSENSE2)
#ifdef ENABLE_VISP_NAMESPACE
  using namespace VISP_NAMESPACE_NAME;
#endif

  // Default settings, overridable from the command line.
  vpDetectorAprilTag::vpAprilTagFamily tagFamily = vpDetectorAprilTag::TAG_36h11;
  vpDetectorAprilTag::vpPoseEstimationMethod poseEstimationMethod = vpDetectorAprilTag::HOMOGRAPHY_VIRTUAL_VS;
  double tagSize = 0.053;
  float quad_decimate = 1.0;
  int nThreads = 1;
  bool display_tag = false;
  int color_id = -1;
  unsigned int thickness = 2;
  bool align_frame = false;
  bool opt_verbose = false;

#if !(defined(VISP_HAVE_X11) || defined(VISP_HAVE_GDI) || defined(VISP_HAVE_OPENCV))
  bool display_off = true;
  std::cout << "Warning: There is no 3rd party (X11, GDI or openCV) to display images..." << std::endl;
#else
  bool display_off = false;
#endif

  // Command line parsing. Options taking a value read it from argv[i + 1].
  for (int i = 1; i < argc; i++) {
    const std::string arg(argv[i]);
    const bool has_value = (i + 1 < argc);

    if (arg == "--pose_method" && has_value) {
      poseEstimationMethod = static_cast<vpDetectorAprilTag::vpPoseEstimationMethod>(atoi(argv[i + 1]));
    }
    else if (arg == "--tag_size" && has_value) {
      tagSize = atof(argv[i + 1]);
    }
    else if (arg == "--quad_decimate" && has_value) {
      quad_decimate = static_cast<float>(atof(argv[i + 1]));
    }
    else if (arg == "--nthreads" && has_value) {
      nThreads = atoi(argv[i + 1]);
    }
    else if (arg == "--display_tag") {
      display_tag = true;
    }
    else if (arg == "--display_off") {
      display_off = true;
    }
    else if (arg == "--color" && has_value) {
      color_id = atoi(argv[i + 1]);
    }
    else if (arg == "--thickness" && has_value) {
      thickness = static_cast<unsigned int>(atoi(argv[i + 1]));
    }
    else if (arg == "--tag_family" && has_value) {
      tagFamily = static_cast<vpDetectorAprilTag::vpAprilTagFamily>(atoi(argv[i + 1]));
    }
    else if (arg == "--z_aligned") {
      align_frame = true;
    }
    else if (arg == "--verbose" || arg == "-v") {
      opt_verbose = true;
    }
    else if (arg == "--help" || arg == "-h") {
      // The advertised pose method default matches the initial value above
      // (HOMOGRAPHY_VIRTUAL_VS, listed as 1 in this same message).
      std::cout << "Usage: " << argv[0]
        << " [--tag_size <tag_size in m> (default: 0.053)]"
        " [--quad_decimate <quad_decimate> (default: 1)]"
        " [--nthreads <nb> (default: 1)]"
        " [--pose_method <method> (0: HOMOGRAPHY, 1: HOMOGRAPHY_VIRTUAL_VS, "
        " 2: DEMENTHON_VIRTUAL_VS, 3: LAGRANGE_VIRTUAL_VS, "
        " 4: BEST_RESIDUAL_VIRTUAL_VS, 5: HOMOGRAPHY_ORTHOGONAL_ITERATION) (default: 1)]"
        " [--tag_family <family> (0: TAG_36h11, 1: TAG_36h10 (DEPRECATED), 2: TAG_36ARTOOLKIT (DEPRECATED),"
        " 3: TAG_25h9, 4: TAG_25h7 (DEPRECATED), 5: TAG_16h5, 6: TAG_CIRCLE21h7, 7: TAG_CIRCLE49h12,"
        " 8: TAG_CUSTOM48h12, 9: TAG_STANDARD41h12, 10: TAG_STANDARD52h13) (default: 0)]"
        " [--display_tag] [--z_aligned]";
#if (defined(VISP_HAVE_X11) || defined(VISP_HAVE_GDI) || defined(VISP_HAVE_OPENCV))
      std::cout << " [--display_off] [--color <color id>] [--thickness <line thickness>]";
#endif
      std::cout << " [--verbose,-v] [--help,-h]" << std::endl;
      return EXIT_SUCCESS;
    }
  }

  try {
    std::cout << "Use Realsense 2 grabber" << std::endl;
    vpRealSense2 g;
    rs2::config config;
    unsigned int width = 640;
    unsigned int height = 480;
    config.enable_stream(RS2_STREAM_COLOR, static_cast<int>(width), static_cast<int>(height), RS2_FORMAT_RGBA8, 30);
    config.enable_stream(RS2_STREAM_DEPTH, static_cast<int>(width), static_cast<int>(height), RS2_FORMAT_Z16, 30);
    config.enable_stream(RS2_STREAM_INFRARED, static_cast<int>(width), static_cast<int>(height), RS2_FORMAT_Y8, 30);

    vpImage<unsigned char> I;
    vpImage<vpRGBa> I_color(height, width);
    vpImage<uint16_t> I_depth_raw(height, width);
    vpImage<vpRGBa> I_depth;

    g.open(config);
    const float depth_scale = g.getDepthScale();
    std::cout << "I_color: " << I_color.getWidth() << " " << I_color.getHeight() << std::endl;
    std::cout << "I_depth_raw: " << I_depth_raw.getWidth() << " " << I_depth_raw.getHeight() << std::endl;

    // First acquisition, done before the displays are created so that the
    // images are filled when the windows open.
    rs2::align align_to_color = RS2_STREAM_COLOR;
    g.acquire(reinterpret_cast<unsigned char *>(I_color.bitmap), reinterpret_cast<unsigned char *>(I_depth_raw.bitmap),
              nullptr, nullptr, &align_to_color);

    std::cout << "Read camera parameters from Realsense device" << std::endl;
    vpCameraParameters cam;
    cam = g.getCameraParameters(RS2_STREAM_COLOR, vpCameraParameters::perspectiveProjWithoutDistortion);

    std::cout << cam << std::endl;
    std::cout << "poseEstimationMethod: " << poseEstimationMethod << std::endl;
    std::cout << "tagFamily: " << tagFamily << std::endl;
    std::cout << "nThreads : " << nThreads << std::endl;
    std::cout << "Z aligned: " << align_frame << std::endl;

    vpImage<vpRGBa> I_color2 = I_color;
    vpImage<float> depthMap;
    vpImageConvert::createDepthHistogram(I_depth_raw, I_depth);

    // Owning pointers: the windows are released on every exit path of the try
    // block, including when an exception is thrown. They are declared after
    // the images, so they are destroyed before them.
    std::unique_ptr<vpDisplay> d1;
    std::unique_ptr<vpDisplay> d2;
    std::unique_ptr<vpDisplay> d3;
    if (!display_off) {
#ifdef VISP_HAVE_X11
      d1.reset(new vpDisplayX(I_color, 100, 30, "Pose from Homography"));
      d2.reset(new vpDisplayX(I_color2, I_color.getWidth() + 120, 30, "Pose from RGBD fusion"));
      d3.reset(new vpDisplayX(I_depth, 100, I_color.getHeight() + 70, "Depth"));
#elif defined(VISP_HAVE_GDI)
      d1.reset(new vpDisplayGDI(I_color, 100, 30, "Pose from Homography"));
      d2.reset(new vpDisplayGDI(I_color2, I_color.getWidth() + 120, 30, "Pose from RGBD fusion"));
      d3.reset(new vpDisplayGDI(I_depth, 100, I_color.getHeight() + 70, "Depth"));
#elif defined(HAVE_OPENCV_HIGHGUI)
      d1.reset(new vpDisplayOpenCV(I_color, 100, 30, "Pose from Homography"));
      d2.reset(new vpDisplayOpenCV(I_color2, I_color.getWidth() + 120, 30, "Pose from RGBD fusion"));
      d3.reset(new vpDisplayOpenCV(I_depth, 100, I_color.getHeight() + 70, "Depth"));
#endif
    }

    vpDetectorAprilTag detector(tagFamily);

    detector.setAprilTagQuadDecimate(quad_decimate);
    detector.setAprilTagPoseEstimationMethod(poseEstimationMethod);
    detector.setAprilTagNbThreads(nThreads);
    detector.setDisplayTag(display_tag, color_id < 0 ? vpColor::none : vpColor::getColor(color_id), thickness);
    detector.setZAlignedWithCameraAxis(align_frame);

    std::vector<double> time_vec;
    for (;;) {
      double t = vpTime::measureTimeMs();

      g.acquire(reinterpret_cast<unsigned char *>(I_color.bitmap),
                reinterpret_cast<unsigned char *>(I_depth_raw.bitmap), nullptr, nullptr, &align_to_color);

      I_color2 = I_color;
      vpImageConvert::convert(I_color, I);
      vpImageConvert::createDepthHistogram(I_depth_raw, I_depth);

      // Convert raw depth values to a float map by applying the device depth
      // scale; a raw value of 0 is stored as 0.
      depthMap.resize(I_depth_raw.getHeight(), I_depth_raw.getWidth());
#ifdef VISP_HAVE_OPENMP
#pragma omp parallel for
#endif
      for (int i = 0; i < static_cast<int>(I_depth_raw.getHeight()); i++) {
        for (int j = 0; j < static_cast<int>(I_depth_raw.getWidth()); j++) {
          if (I_depth_raw[i][j]) {
            float Z = I_depth_raw[i][j] * depth_scale;
            depthMap[i][j] = Z;
          }
          else {
            depthMap[i][j] = 0;
          }
        }
      }

      vpDisplay::display(I_color);
      vpDisplay::display(I_color2);
      vpDisplay::display(I_depth);

      std::vector<vpHomogeneousMatrix> cMo_vec;
      detector.detect(I, tagSize, cam, cMo_vec);

      // Display camera pose for each tag
      for (size_t i = 0; i < cMo_vec.size(); i++) {
        vpDisplay::displayFrame(I_color, cMo_vec[i], cam, tagSize / 2, vpColor::none, 3);
      }

      std::vector<std::vector<vpImagePoint> > tags_corners = detector.getPolygon();
      std::vector<int> tags_id = detector.getTagsId();
      std::map<int, double> tags_size;
      tags_size[-1] = tagSize; // Default tag size
      std::vector<std::vector<vpPoint> > tags_points3d = detector.getTagsPoints3D(tags_id, tags_size);
      for (size_t i = 0; i < tags_corners.size(); i++) {
        vpHomogeneousMatrix cMo;
        double confidence_index = 0.;
        if (vpPose::computePlanarObjectPoseFromRGBD(depthMap, tags_corners[i], cam, tags_points3d[i], cMo,
                                                    &confidence_index)) {
          // Frame color reflects the confidence index: default colors above
          // 0.5, orange above 0.25, red otherwise.
          if (confidence_index > 0.5) {
            vpDisplay::displayFrame(I_color2, cMo, cam, tagSize / 2, vpColor::none, 3);
          }
          else if (confidence_index > 0.25) {
            vpDisplay::displayFrame(I_color2, cMo, cam, tagSize / 2, vpColor::orange, 3);
          }
          else {
            vpDisplay::displayFrame(I_color2, cMo, cam, tagSize / 2, vpColor::red, 3);
          }
          std::stringstream ss;
          ss << "Tag id " << tags_id[i] << " confidence: " << confidence_index;
          vpDisplay::displayText(I_color2, static_cast<int>(35 + i * 15), 20, ss.str(), vpColor::red);

          if (opt_verbose) {
            // NOTE(review): cMo_vec is not guaranteed here to hold one pose
            // per detected polygon, so guard the index before reading it.
            if (i < cMo_vec.size()) {
              std::cout << "cMo[" << i << "]: \n" << cMo_vec[i] << std::endl;
            }
            std::cout << "cMo[" << i << "] using depth: \n" << cMo << std::endl;
          }
        }
      }

      vpDisplay::displayText(I_color, 20, 20, "Pose from homography + VVS", vpColor::red);
      vpDisplay::displayText(I_color2, 20, 20, "Pose from RGBD fusion", vpColor::red);
      vpDisplay::displayText(I_color, 35, 20, "Click to quit.", vpColor::red);
      t = vpTime::measureTimeMs() - t;
      time_vec.push_back(t);

      std::stringstream ss;
      ss << "Detection time: " << t << " ms for " << detector.getNbObjects() << " tags";
      vpDisplay::displayText(I_color, 50, 20, ss.str(), vpColor::red);

      // Non-blocking click test: leave the loop as soon as the user clicks.
      if (vpDisplay::getClick(I_color, false)) {
        break;
      }

      vpDisplay::flush(I_color);
      vpDisplay::flush(I_color2);
      vpDisplay::flush(I_depth);
    }

    std::cout << "Benchmark loop processing time" << std::endl;
    std::cout << "Mean / Median / Std: " << vpMath::getMean(time_vec) << " ms"
      << " ; " << vpMath::getMedian(time_vec) << " ms"
      << " ; " << vpMath::getStdev(time_vec) << " ms" << std::endl;
  }
  catch (const vpException &e) {
    std::cerr << "Catch an exception: " << e.getMessage() << std::endl;
    // Report the failure to the caller instead of exiting with success.
    return EXIT_FAILURE;
  }

  return EXIT_SUCCESS;
#else
  (void)argc;
  (void)argv;
#ifndef VISP_HAVE_APRILTAG
  std::cout << "Enable Apriltag support, configure and build ViSP to run this tutorial" << std::endl;
#else
  std::cout << "Install librealsense 3rd party, configure and build ViSP again to use this example" << std::endl;
#endif
#endif
  return EXIT_SUCCESS;
}

vpCameraParameters
Generic class defining intrinsic camera parameters.
Definition: vpCameraParameters.h:310

vpCameraParameters::perspectiveProjWithoutDistortion
@ perspectiveProjWithoutDistortion
Perspective projection without distortion model.
Definition: vpCameraParameters.h:317

vpColor::getColor
static vpColor getColor(const unsigned int &i)
Definition: vpColor.h:311

vpColor::red
static const vpColor red
Definition: vpColor.h:217

vpColor::none
static const vpColor none
Definition: vpColor.h:229

vpColor::orange
static const vpColor orange
Definition: vpColor.h:227

vpDetectorAprilTag
Definition: vpDetectorAprilTag.h:235

vpDetectorAprilTag::vpPoseEstimationMethod
vpPoseEstimationMethod
Definition: vpDetectorAprilTag.h:253

vpDetectorAprilTag::HOMOGRAPHY_VIRTUAL_VS
@ HOMOGRAPHY_VIRTUAL_VS
Definition: vpDetectorAprilTag.h:255

vpDetectorAprilTag::setZAlignedWithCameraAxis
void setZAlignedWithCameraAxis(bool zAlignedWithCameraFrame)
Definition: vpDetectorAprilTag.cpp:1234

vpDetectorAprilTag::setDisplayTag
void setDisplayTag(bool display, const vpColor &color=vpColor::none, unsigned int thickness=2)
Definition: vpDetectorAprilTag.h:316

vpDetectorAprilTag::setAprilTagQuadDecimate
void setAprilTagQuadDecimate(float quadDecimate)
Definition: vpDetectorAprilTag.cpp:1176

vpDetectorAprilTag::getTagsPoints3D
std::vector< std::vector< vpPoint > > getTagsPoints3D(const std::vector< int > &tagsId, const std::map< int, double > &tagsSize) const
Definition: vpDetectorAprilTag.cpp:1051

vpDetectorAprilTag::detect
bool detect(const vpImage< unsigned char > &I) VP_OVERRIDE
Definition: vpDetectorAprilTag.cpp:885

vpDetectorAprilTag::vpAprilTagFamily
vpAprilTagFamily
Definition: vpDetectorAprilTag.h:238

vpDetectorAprilTag::TAG_36h11
@ TAG_36h11
AprilTag 36h11 pattern (recommended)
Definition: vpDetectorAprilTag.h:239

vpDetectorAprilTag::setAprilTagNbThreads
void setAprilTagNbThreads(int nThreads)
Definition: vpDetectorAprilTag.cpp:1146

vpDetectorAprilTag::setAprilTagPoseEstimationMethod
void setAprilTagPoseEstimationMethod(const vpPoseEstimationMethod &poseEstimationMethod)
Definition: vpDetectorAprilTag.cpp:1158

vpDetectorAprilTag::getTagsId
std::vector< int > getTagsId() const
Definition: vpDetectorAprilTag.cpp:1109

vpDetectorBase::getPolygon
std::vector< std::vector< vpImagePoint > > & getPolygon()
Definition: vpDetectorBase.h:113

vpDetectorBase::getNbObjects
size_t getNbObjects() const
Definition: vpDetectorBase.h:108

vpDisplayGDI
Display for Windows using GDI (available on any Windows 32 platform).
Definition: vpDisplayGDI.h:130

vpDisplayOpenCV
The vpDisplayOpenCV class allows displaying images using the OpenCV library. Thus to enable this class OpenC...
Definition: vpDisplayOpenCV.h:139

vpDisplay
Class that defines generic functionalities for display.
Definition: vpDisplay.h:178

vpDisplay::getClick
static bool getClick(const vpImage< unsigned char > &I, bool blocking=true)
Definition: vpDisplay_uchar.cpp:855

vpDisplay::display
static void display(const vpImage< unsigned char > &I)
Definition: vpDisplay_uchar.cpp:830

vpDisplay::displayFrame
static void displayFrame(const vpImage< unsigned char > &I, const vpHomogeneousMatrix &cMo, const vpCameraParameters &cam, double size, const vpColor &color=vpColor::none, unsigned int thickness=1, const vpImagePoint &offset=vpImagePoint(0, 0), const std::string &frameName="", const vpColor &textColor=vpColor::black, const vpImagePoint &textOffset=vpImagePoint(15, 15))
Definition: vpDisplay_uchar.cpp:413

vpDisplay::flush
static void flush(const vpImage< unsigned char > &I)
Definition: vpDisplay_uchar.cpp:806

vpDisplay::displayText
static void displayText(const vpImage< unsigned char > &I, const vpImagePoint &ip, const std::string &s, const vpColor &color)
Definition: vpDisplay_uchar.cpp:750

vpException
Error that can be emitted by ViSP classes.
Definition: vpException.h:60

vpException::getMessage
const char * getMessage() const
Definition: vpException.cpp:65

vpHomogeneousMatrix
Implementation of a homogeneous matrix and operations on this kind of matrix.
Definition: vpHomogeneousMatrix.h:221

vpImageConvert::createDepthHistogram
static void createDepthHistogram(const vpImage< uint16_t > &src_depth, vpImage< vpRGBa > &dest_rgba)
Definition: vpImageConvert.cpp:257

vpImageConvert::convert
static void convert(const vpImage< unsigned char > &src, vpImage< vpRGBa > &dest)
Definition: vpImageConvert.cpp:73

vpImage< unsigned char >

vpImage::getWidth
unsigned int getWidth() const
Definition: vpImage.h:242

vpImage::resize
void resize(unsigned int h, unsigned int w)
Resize the image: image initialization.
Definition: vpImage.h:544

vpImage::bitmap
Type * bitmap
Points toward the bitmap.
Definition: vpImage.h:135

vpImage::getHeight
unsigned int getHeight() const
Definition: vpImage.h:181

vpMath::getMedian
static double getMedian(const std::vector< double > &v)
Definition: vpMath.cpp:322

vpMath::getStdev
static double getStdev(const std::vector< double > &v, bool useBesselCorrection=false)
Definition: vpMath.cpp:353

vpMath::getMean
static double getMean(const std::vector< double > &v)
Definition: vpMath.cpp:302

vpPose::computePlanarObjectPoseFromRGBD
static bool computePlanarObjectPoseFromRGBD(const vpImage< float > &depthMap, const std::vector< vpImagePoint > &corners, const vpCameraParameters &colorIntrinsics, const std::vector< vpPoint > &point3d, vpHomogeneousMatrix &cMo, double *confidence_index=nullptr)
Definition: vpPoseRGBD.cpp:158

vpRealSense2
Definition: vpRealSense2.h:312

vpRealSense2::getCameraParameters
vpCameraParameters getCameraParameters(const rs2_stream &stream, vpCameraParameters::vpCameraParametersProjType type=vpCameraParameters::perspectiveProjWithDistortion, int index=-1) const
Definition: vpRealSense2.cpp:681

vpRealSense2::acquire
void acquire(vpImage< unsigned char > &grey, double *ts=nullptr)
Definition: vpRealSense2.cpp:90

vpRealSense2::open
bool open(const rs2::config &cfg=rs2::config())
Definition: vpRealSense2.cpp:1363

vpRealSense2::getDepthScale
float getDepthScale()
Definition: vpRealSense2.cpp:763

VISP_NAMESPACE_NAME
Definition: vpEigenConversion.h:44

vpTime::measureTimeMs
VISP_EXPORT double measureTimeMs()