doxygen/visp-daily/tutorial-detection-object-mbt2_8cpp-example.html

#include <visp3/core/vpConfig.h>

#include <visp3/core/vpIoTools.h>

#include <visp3/gui/vpDisplayFactory.h>

#include <visp3/io/vpVideoReader.h>

#include <visp3/mbt/vpMbGenericTracker.h>

#include <visp3/vision/vpKeyPoint.h>


// When ENABLE_VISP_NAMESPACE is defined, pull the ViSP namespace into scope so the
// unqualified vp* names used below resolve.
#ifdef ENABLE_VISP_NAMESPACE

using namespace VISP_NAMESPACE_NAME;

#endif


// NOTE(review): `&&` binds tighter than `||`, so as written the HAVE_OPENCV_IMGPROC and
// VISP_HAVE_DISPLAY requirements only apply to the OpenCV < 5 alternative -- confirm this is intended.
#if defined(HAVE_OPENCV_IMGPROC) && defined(VISP_HAVE_DISPLAY) && \
  ((VISP_HAVE_OPENCV_VERSION < 0x050000) && defined(HAVE_OPENCV_CALIB3D) && defined(HAVE_OPENCV_FEATURES2D)) || \
  ((VISP_HAVE_OPENCV_VERSION >= 0x050000) && defined(HAVE_OPENCV_3D) && defined(HAVE_OPENCV_FEATURES))

/*!
 * Learn the keypoints of one reference image.
 *
 * Keypoints are detected in \e I, their 3D coordinates are computed from the tracker's current pose,
 * camera parameters and polygon faces, and the result is registered in \e keypoint_learning.
 * Every keypoint kept after the 3D computation is drawn on \e I as a red cross.
 *
 * \param I : Image in which keypoints are detected and displayed.
 * \param tracker : Model-based tracker providing the pose, the camera parameters and the polygon faces.
 * \param keypoint_learning : Keypoint container that receives the new reference data.
 * \param id : Identifier forwarded to vpKeyPoint::buildReference() for this image.
 */
void learnCube(const vpImage<unsigned char> &I, vpMbGenericTracker &tracker, vpKeyPoint &keypoint_learning, int id)
{
  // Detect the candidate keypoints in the current image
  double detectionTime;
  std::vector<cv::KeyPoint> trainKeyPoints;
  keypoint_learning.detect(I, trainKeyPoints, detectionTime);

  // Polygons (first) and their 3D corner points (second) as reported by the tracker
  const std::pair<std::vector<vpPolygon>, std::vector<std::vector<vpPoint> > > faces = tracker.getPolygonFaces();

  // Current pose and intrinsics known by the tracker
  vpHomogeneousMatrix cMo;
  tracker.getPose(cMo);
  vpCameraParameters cam;
  tracker.getCameraParameters(cam);

  // trainKeyPoints is passed by non-const reference, so the call may update the candidate list
  std::vector<cv::Point3f> points3f;
  vpKeyPoint::compute3DForPointsInPolygons(cMo, cam, trainKeyPoints, faces.first, faces.second, points3f);

  // The `true` flag is forwarded unchanged (presumably "append to the existing reference" -- confirm
  // against vpKeyPoint::buildReference())
  keypoint_learning.buildReference(I, trainKeyPoints, points3f, true, id);

  // Show the learned keypoints: displayCross() is called with (pt.y, pt.x)
  for (std::vector<cv::KeyPoint>::const_iterator kp = trainKeyPoints.begin(); kp != trainKeyPoints.end(); ++kp) {
    const int row = static_cast<int>(kp->pt.y);
    const int col = static_cast<int>(kp->pt.x);
    vpDisplay::displayCross(I, row, col, 4, vpColor::red);
  }
}

#endif


/*!
 * Tutorial entry point: learn a cube from three reference images, then detect and localize it in
 * each frame of a video.
 *
 * Command line options:
 * - `--name <video name>` : video to process (default "cube.mp4"). The tracker configuration files
 *   are looked up next to the video, using the video name without extension.
 * - `--help`, `-h` : print the usage and exit.
 *
 * \return EXIT_SUCCESS in every case; a vpException raised during processing is caught and printed.
 */
int main(int argc, char **argv)
{
  // learnCube() is only compiled when these modules are available, so the body of main() must not be
  // enabled under a weaker condition. The two OpenCV alternatives are grouped explicitly because `&&`
  // binds tighter than `||`.
#if defined(HAVE_OPENCV_IMGPROC) && defined(VISP_HAVE_DISPLAY) && \
  (((VISP_HAVE_OPENCV_VERSION < 0x050000) && defined(HAVE_OPENCV_CALIB3D) && defined(HAVE_OPENCV_FEATURES2D)) || \
   ((VISP_HAVE_OPENCV_VERSION >= 0x050000) && defined(HAVE_OPENCV_3D) && defined(HAVE_OPENCV_FEATURES)))

#if (VISP_CXX_STANDARD >= VISP_CXX_STANDARD_11)
  std::shared_ptr<vpDisplay> display, display2;
#else
  // Raw pointers are released by hand after the try/catch block
  vpDisplay *display = nullptr;
  vpDisplay *display2 = nullptr;
#endif
  try {
    std::string videoname = "cube.mp4";

    for (int i = 1; i < argc; i++) {
      if (std::string(argv[i]) == "--name" && i + 1 < argc)
        videoname = std::string(argv[++i]);
      else if (std::string(argv[i]) == "--help" || std::string(argv[i]) == "-h") {
        std::cout << "\nUsage: " << argv[0]
          << " [--name <video name>]"
          << " [--help] [-h]\n" << std::endl;
        return EXIT_SUCCESS;
      }
    }

    // Configuration files share the video's folder and base name
    std::string parentname = vpIoTools::getParent(videoname);
    std::string objectname = vpIoTools::getNameWE(videoname);

    if (!parentname.empty())
      objectname = parentname + "/" + objectname;

    std::cout << "Video name: " << videoname << std::endl;
    std::cout << "Tracker requested config files: " << objectname << ".[init,"
      << "xml,"
      << "cao or wrl]" << std::endl;
    std::cout << "Tracker optional config files: " << objectname << ".[ppm]" << std::endl;

    vpImage<unsigned char> I;
    vpHomogeneousMatrix cMo;
    vpCameraParameters cam;

    vpMbGenericTracker tracker(vpMbGenericTracker::EDGE_TRACKER);
    bool usexml = false;
#if defined(VISP_HAVE_PUGIXML)
    if (vpIoTools::checkFilename(objectname + ".xml")) {
      tracker.loadConfigFile(objectname + ".xml");
      tracker.getCameraParameters(cam);
      usexml = true;
    }
#endif
    if (!usexml) {
      // No XML configuration available: fall back to hard-coded tracker settings
      vpMe me;
      me.setMaskSize(5);
      me.setMaskNumber(180);
      me.setRange(7);
      me.setLikelihoodThresholdType(vpMe::NORMALIZED_THRESHOLD);
      me.setThreshold(20);
      me.setMu1(0.5);
      me.setMu2(0.5);
      me.setSampleStep(4);
      me.setNbTotalSample(250);
      tracker.setMovingEdge(me);
      cam.initPersProjWithoutDistortion(547, 542, 339, 235);
      tracker.setCameraParameters(cam);
      tracker.setAngleAppear(vpMath::rad(89));
      tracker.setAngleDisappear(vpMath::rad(89));
      tracker.setNearClippingDistance(0.01);
      tracker.setFarClippingDistance(10.0);
      tracker.setClipping(tracker.getClipping() | vpMbtPolygon::FOV_CLIPPING);
    }

    tracker.setOgreVisibilityTest(false);
    // The .cao model takes precedence over the .wrl one
    if (vpIoTools::checkFilename(objectname + ".cao")) {
      tracker.loadModel(objectname + ".cao");
    }
    else if (vpIoTools::checkFilename(objectname + ".wrl")) {
      tracker.loadModel(objectname + ".wrl");
    }
    tracker.setDisplayFeatures(true);

    vpKeyPoint keypoint_learning("ORB", "ORB", "BruteForce-Hamming");
    // Restrict the ORB detector to a single pyramid level
#if (VISP_HAVE_OPENCV_VERSION < 0x030000)
    keypoint_learning.setDetectorParameter("ORB", "nLevels", 1);
#else
    cv::Ptr<cv::ORB> orb_learning = keypoint_learning.getDetector("ORB").dynamicCast<cv::ORB>();
    if (orb_learning) {
      orb_learning->setNLevels(1);
    }
#endif

    /*
     * Start the part of the code dedicated to object learning from 3 images
     */
    std::string imageName[] = { "cube0001.png", "cube0150.png", "cube0200.png" };
    // One initial pose per learning image, in the same order as imageName
    vpHomogeneousMatrix initPoseTab[] = {
        vpHomogeneousMatrix(0.02143385294, 0.1098083886, 0.5127439561, 2.087159614, 1.141775176, -0.4701291124),
        vpHomogeneousMatrix(0.02651282185, -0.03713587374, 0.6873765919, 2.314744454, 0.3492296488, -0.1226054828),
        vpHomogeneousMatrix(0.02965448956, -0.07283091786, 0.7253526051, 2.300529617, -0.4286674806, 0.1788761025) };
    for (int i = 0; i < 3; i++) {
      vpImageIo::read(I, imageName[i]);
      if (i == 0) {
        // The display is created once, when the first image gives I its size
#if (VISP_CXX_STANDARD >= VISP_CXX_STANDARD_11)
        display = vpDisplayFactory::createDisplay(I, 10, 10);
#else
        display = vpDisplayFactory::allocateDisplay(I, 10, 10);
#endif
      }
      std::stringstream title;
      title << "Learning cube on image: " << imageName[i];
      vpDisplay::setTitle(I, title.str().c_str());

      vpDisplay::display(I);

      // Initialize the tracker with the known pose, then refine it on the image
      tracker.setPose(I, initPoseTab[i]);

      tracker.track(I);

      tracker.getPose(cMo);
      tracker.display(I, cMo, cam, vpColor::red);

      learnCube(I, tracker, keypoint_learning, i);

      vpDisplay::displayText(I, 10, 10, "Learning step: keypoints are detected on visible cube faces", vpColor::red);
      if (i < 2) {
        vpDisplay::displayText(I, 30, 10, "Click to continue the learning...", vpColor::red);
      }
      else {
        vpDisplay::displayText(I, 30, 10, "Click to continue with the detection...", vpColor::red);
      }

      vpDisplay::flush(I);
      vpDisplay::getClick(I, true);
    }

    keypoint_learning.saveLearningData("cube_learning_data.bin", true);

    /*
     * Start the part of the code dedicated to detection and localization
     */
    vpKeyPoint keypoint_detection("ORB", "ORB", "BruteForce-Hamming");
    // Same single-level ORB configuration as for the learning step
#if (VISP_HAVE_OPENCV_VERSION < 0x030000)
    keypoint_detection.setDetectorParameter("ORB", "nLevels", 1);
#else
    cv::Ptr<cv::ORB> orb_detector = keypoint_detection.getDetector("ORB").dynamicCast<cv::ORB>();
    if (orb_detector) {
      orb_detector->setNLevels(1);
    }
#endif

    keypoint_detection.loadLearningData("cube_learning_data.bin", true);

    vpImage<unsigned char> IMatching;
    keypoint_detection.createImageMatching(I, IMatching);

    vpVideoReader g;
    g.setFileName(videoname);
    g.open(I);

#if (VISP_CXX_STANDARD >= VISP_CXX_STANDARD_11)
    display2 = vpDisplayFactory::createDisplay(IMatching, 50, 50, "Display matching between learned and current images");
#else
    display2 = vpDisplayFactory::allocateDisplay(IMatching, 50, 50, "Display matching between learned and current images");
#endif
    vpDisplay::setTitle(I, "Cube detection and localization");

    double error;
    bool click_done = false;

    while (!g.end()) {
      g.acquire(I);
      vpDisplay::display(I);

      keypoint_detection.insertImageMatching(I, IMatching);

      vpDisplay::display(IMatching);
      vpDisplay::displayText(I, 10, 10, "Detection and localization in process...", vpColor::red);

      double elapsedTime;
      if (keypoint_detection.matchPoint(I, cam, cMo, error, elapsedTime)) {

        tracker.setPose(I, cMo);

        tracker.display(I, cMo, cam, vpColor::red, 2);
        vpDisplay::displayFrame(I, cMo, cam, 0.05, vpColor::none, 3);

        keypoint_detection.displayMatching(I, IMatching);

        std::vector<vpImagePoint> ransacInliers = keypoint_detection.getRansacInliers();
        std::vector<vpImagePoint> ransacOutliers = keypoint_detection.getRansacOutliers();

        // RANSAC inliers in green; in IMatching the points are shifted by the size of I
        for (std::vector<vpImagePoint>::const_iterator it = ransacInliers.begin(); it != ransacInliers.end(); ++it) {
          vpDisplay::displayCircle(I, *it, 4, vpColor::green);
          vpImagePoint imPt(*it);
          imPt.set_u(imPt.get_u() + I.getWidth());
          imPt.set_v(imPt.get_v() + I.getHeight());
          vpDisplay::displayCircle(IMatching, imPt, 4, vpColor::green);
        }

        // RANSAC outliers in red, with the same shift in IMatching
        for (std::vector<vpImagePoint>::const_iterator it = ransacOutliers.begin(); it != ransacOutliers.end(); ++it) {
          vpDisplay::displayCircle(I, *it, 4, vpColor::red);
          vpImagePoint imPt(*it);
          imPt.set_u(imPt.get_u() + I.getWidth());
          imPt.set_v(imPt.get_v() + I.getHeight());
          vpDisplay::displayCircle(IMatching, imPt, 4, vpColor::red);
        }

        keypoint_detection.displayMatching(I, IMatching);

        // Camera parameters with the principal point shifted by the size of I, used to draw the
        // model and the object frame in IMatching
        vpCameraParameters cam2;
        cam2.initPersProjWithoutDistortion(cam.get_px(), cam.get_py(), cam.get_u0() + I.getWidth(),
          cam.get_v0() + I.getHeight());
        tracker.setCameraParameters(cam2);
        tracker.setPose(IMatching, cMo);
        tracker.display(IMatching, cMo, cam2, vpColor::red, 2);
        vpDisplay::displayFrame(IMatching, cMo, cam2, 0.05, vpColor::none, 3);
      }

      vpDisplay::flush(I);
      vpDisplay::displayText(IMatching, 30, 10, "A click to exit.", vpColor::red);
      vpDisplay::flush(IMatching);
      // A non-blocking click in either window stops the processing
      if (vpDisplay::getClick(I, false)) {
        click_done = true;
        break;
      }
      if (vpDisplay::getClick(IMatching, false)) {
        click_done = true;
        break;
      }
    }

    // End of video reached without a click: wait for one before leaving
    if (!click_done)
      vpDisplay::getClick(IMatching);
  }
  catch (const vpException &e) {
    std::cout << "Catch an exception: " << e << std::endl;
  }
#if (VISP_CXX_STANDARD < VISP_CXX_STANDARD_11)
  if (display != nullptr) {
    delete display;
  }

  if (display2 != nullptr) {
    delete display2;
  }
#endif
#else
  (void)argc;
  (void)argv;
  std::cout << "Install OpenCV and rebuild ViSP to use this example." << std::endl;
#endif

  return EXIT_SUCCESS;
}

vpCameraParameters
Generic class defining intrinsic camera parameters.
Definition: vpCameraParameters.h:310

vpCameraParameters::initPersProjWithoutDistortion
void initPersProjWithoutDistortion(double px, double py, double u0, double v0)
Definition: vpCameraParameters.cpp:202

vpCameraParameters::get_v0
double get_v0() const
Definition: vpCameraParameters.h:409

vpCameraParameters::get_u0
double get_u0() const
Definition: vpCameraParameters.h:408

vpCameraParameters::get_py
double get_py() const
Definition: vpCameraParameters.h:407

vpCameraParameters::get_px
double get_px() const
Definition: vpCameraParameters.h:404

vpColor::red
static const vpColor red
Definition: vpColor.h:198

vpColor::none
static const vpColor none
Definition: vpColor.h:210

vpColor::green
static const vpColor green
Definition: vpColor.h:201

vpDisplay
Class that defines generic functionalities for display.
Definition: vpDisplay.h:178

vpDisplay::getClick
static bool getClick(const vpImage< unsigned char > &I, bool blocking=true)
Definition: vpDisplay_uchar.cpp:855

vpDisplay::displayCircle
static void displayCircle(const vpImage< unsigned char > &I, const vpImageCircle &circle, const vpColor &color, bool fill=false, unsigned int thickness=1)
Definition: vpDisplay_uchar.cpp:149

vpDisplay::display
static void display(const vpImage< unsigned char > &I)
Definition: vpDisplay_uchar.cpp:830

vpDisplay::displayFrame
static void displayFrame(const vpImage< unsigned char > &I, const vpHomogeneousMatrix &cMo, const vpCameraParameters &cam, double size, const vpColor &color=vpColor::none, unsigned int thickness=1, const vpImagePoint &offset=vpImagePoint(0, 0), const std::string &frameName="", const vpColor &textColor=vpColor::black, const vpImagePoint &textOffset=vpImagePoint(15, 15))
Definition: vpDisplay_uchar.cpp:413

vpDisplay::displayCross
static void displayCross(const vpImage< unsigned char > &I, const vpImagePoint &ip, unsigned int size, const vpColor &color, unsigned int thickness=1)
Definition: vpDisplay_uchar.cpp:199

vpDisplay::setTitle
static void setTitle(const vpImage< unsigned char > &I, const std::string &windowtitle)
Definition: vpDisplay_uchar.cpp:1325

vpDisplay::flush
static void flush(const vpImage< unsigned char > &I)
Definition: vpDisplay_uchar.cpp:806

vpDisplay::displayText
static void displayText(const vpImage< unsigned char > &I, const vpImagePoint &ip, const std::string &s, const vpColor &color)
Definition: vpDisplay_uchar.cpp:750

vpException
Error that can be emitted by ViSP classes.
Definition: vpException.h:60

vpHomogeneousMatrix
Implementation of a homogeneous matrix and operations on such matrices.
Definition: vpHomogeneousMatrix.h:221

vpImageIo::read
static void read(vpImage< unsigned char > &I, const std::string &filename, int backend=IO_DEFAULT_BACKEND)
Definition: vpImageIo.cpp:147

vpImagePoint
Class that defines a 2D point in an image. This class is useful for image processing and stores only ...
Definition: vpImagePoint.h:82

vpImage< unsigned char >

vpImage::getWidth
unsigned int getWidth() const
Definition: vpImage.h:242

vpImage::getHeight
unsigned int getHeight() const
Definition: vpImage.h:181

vpIoTools::checkFilename
static bool checkFilename(const std::string &filename)
Definition: vpIoTools.cpp:786

vpIoTools::getNameWE
static std::string getNameWE(const std::string &pathname)
Definition: vpIoTools.cpp:1227

vpIoTools::getParent
static std::string getParent(const std::string &pathname)
Definition: vpIoTools.cpp:1314

vpKeyPoint
Class that allows 2D keypoint detection (and descriptor extraction) and matching thanks to...
Definition: vpKeyPoint.h:267

vpKeyPoint::detect
void detect(const vpImage< unsigned char > &I, std::vector< cv::KeyPoint > &keyPoints, const vpRect &rectangle=vpRect())
Definition: vpKeyPoint.cpp:989

vpKeyPoint::compute3DForPointsInPolygons
static void compute3DForPointsInPolygons(const vpHomogeneousMatrix &cMo, const vpCameraParameters &cam, std::vector< cv::KeyPoint > &candidates, const std::vector< vpPolygon > &polygons, const std::vector< std::vector< vpPoint > > &roisPt, std::vector< cv::Point3f > &points, cv::Mat *descriptors=nullptr)
Definition: vpKeyPoint.cpp:481

vpKeyPoint::buildReference
unsigned int buildReference(const vpImage< unsigned char > &I)
Definition: vpKeyPoint.cpp:211

vpMath::rad
static double rad(double deg)
Definition: vpMath.h:129

vpMbGenericTracker
Real-time 6D object pose tracking using its CAD model.
Definition: vpMbGenericTracker.h:201

vpMbGenericTracker::EDGE_TRACKER
@ EDGE_TRACKER
Definition: vpMbGenericTracker.h:205

vpMbGenericTracker::getPolygonFaces
virtual std::pair< std::vector< vpPolygon >, std::vector< std::vector< vpPoint > > > getPolygonFaces(bool orderPolygons=true, bool useVisibility=true, bool clipPolygon=false) VP_OVERRIDE
Definition: vpMbGenericTracker.cpp:1711

vpMbGenericTracker::getCameraParameters
virtual void getCameraParameters(vpCameraParameters &camera) const VP_OVERRIDE
Definition: vpMbGenericTracker.cpp:818

vpMbGenericTracker::getPose
virtual void getPose(vpHomogeneousMatrix &cMo) const VP_OVERRIDE
Definition: vpMbGenericTracker.cpp:1762

vpMe
Definition: vpMe.h:134

vpMe::setMu1
void setMu1(const double &mu_1)
Definition: vpMe.h:385

vpMe::setRange
void setRange(const unsigned int &range)
Definition: vpMe.h:415

vpMe::setLikelihoodThresholdType
void setLikelihoodThresholdType(const vpLikelihoodThresholdType likelihood_threshold_type)
Definition: vpMe.h:505

vpMe::setNbTotalSample
void setNbTotalSample(const int &ntotal_sample)
Definition: vpMe.h:399

vpMe::setMaskNumber
void setMaskNumber(const unsigned int &mask_number)
Definition: vpMe.cpp:552

vpMe::setThreshold
void setThreshold(const double &threshold)
Definition: vpMe.h:466

vpMe::setSampleStep
void setSampleStep(const double &sample_step)
Definition: vpMe.h:422

vpMe::setMaskSize
void setMaskSize(const unsigned int &mask_size)
Definition: vpMe.cpp:560

vpMe::setMu2
void setMu2(const double &mu_2)
Definition: vpMe.h:392

vpMe::NORMALIZED_THRESHOLD
@ NORMALIZED_THRESHOLD
Definition: vpMe.h:145

vpPolygon3D::FOV_CLIPPING
@ FOV_CLIPPING
Definition: vpPolygon3D.h:68

vpVideoReader
Class that makes it easy to manipulate a video file or a sequence of images. As it inherits from the...
Definition: vpVideoReader.h:181

vpVideoReader::acquire
void acquire(vpImage< vpRGBa > &I)
Definition: vpVideoReader.cpp:243

vpVideoReader::open
void open(vpImage< vpRGBa > &I)
Definition: vpVideoReader.cpp:174

vpVideoReader::setFileName
void setFileName(const std::string &filename)
Definition: vpVideoReader.cpp:86

vpVideoReader::end
bool end()
Definition: vpVideoReader.h:251

VISP_NAMESPACE_NAME
Definition: vpEigenConversion.h:44

vpDisplayFactory::createDisplay
std::shared_ptr< vpDisplay > createDisplay()
Return a smart pointer vpDisplay specialization if a GUI library is available or nullptr otherwise.
Definition: vpDisplayFactory.h:137

vpDisplayFactory::allocateDisplay
vpDisplay * allocateDisplay()
Return a newly allocated vpDisplay specialization if a GUI library is available or nullptr otherwise.
Definition: vpDisplayFactory.h:63