Visual Servoing Platform  version 3.1.0
tutorial-apriltag-detector.cpp
1 #include <visp3/detection/vpDetectorAprilTag.h>
5 #include <visp3/gui/vpDisplayGDI.h>
6 #include <visp3/gui/vpDisplayOpenCV.h>
7 #include <visp3/gui/vpDisplayX.h>
8 #include <visp3/io/vpImageIo.h>
9 #ifdef VISP_HAVE_XML2
10 #include <visp3/core/vpXmlParserCamera.h>
11 #endif
12 
13 int main(int argc, const char **argv)
14 {
16 #if defined(VISP_HAVE_APRILTAG) && (defined(VISP_HAVE_X11) || defined(VISP_HAVE_GDI) || defined(VISP_HAVE_OPENCV))
17 
19  std::string input_filename = "AprilTag.pgm";
22  double tagSize = 0.053;
23  float quad_decimate = 1.0;
24  int nThreads = 1;
25  std::string intrinsic_file = "";
26  std::string camera_name = "";
27  bool display_tag = false;
28 
29  for (int i = 1; i < argc; i++) {
30  if (std::string(argv[i]) == "--pose_method" && i + 1 < argc) {
31  poseEstimationMethod = (vpDetectorAprilTag::vpPoseEstimationMethod)atoi(argv[i + 1]);
32  } else if (std::string(argv[i]) == "--tag_size" && i + 1 < argc) {
33  tagSize = atof(argv[i + 1]);
34  } else if (std::string(argv[i]) == "--input" && i + 1 < argc) {
35  input_filename = std::string(argv[i + 1]);
36  } else if (std::string(argv[i]) == "--quad_decimate" && i + 1 < argc) {
37  quad_decimate = (float)atof(argv[i + 1]);
38  } else if (std::string(argv[i]) == "--nthreads" && i + 1 < argc) {
39  nThreads = atoi(argv[i + 1]);
40  } else if (std::string(argv[i]) == "--intrinsic" && i + 1 < argc) {
41  intrinsic_file = std::string(argv[i + 1]);
42  } else if (std::string(argv[i]) == "--camera_name" && i + 1 < argc) {
43  camera_name = std::string(argv[i + 1]);
44  } else if (std::string(argv[i]) == "--display_tag") {
45  display_tag = true;
46  } else if (std::string(argv[i]) == "--tag_family" && i + 1 < argc) {
47  tagFamily = (vpDetectorAprilTag::vpAprilTagFamily)atoi(argv[i + 1]);
48  } else if (std::string(argv[i]) == "--help" || std::string(argv[i]) == "-h") {
49  std::cout << "Usage: " << argv[0]
50  << " [--input <input file>] [--tag_size <tag_size in m>]"
51  " [--quad_decimate <quad_decimate>] [--nthreads <nb>]"
52  " [--intrinsic <intrinsic file>] [--camera_name <camera name>]"
53  " [--pose_method <method> (0: HOMOGRAPHY_VIRTUAL_VS, 1: "
54  "DEMENTHON_VIRTUAL_VS,"
55  " 2: LAGRANGE_VIRTUAL_VS, 3: BEST_RESIDUAL_VIRTUAL_VS)]"
56  " [--tag_family <family> (0: TAG_36h11, 1: TAG_36h10, 2: "
57  "TAG_36ARTOOLKIT,"
58  " 3: TAG_25h9, 4: TAG_25h7)]"
59  " [--display_tag] [--help]"
60  << std::endl;
61  return EXIT_SUCCESS;
62  }
63  }
64 
66  cam.initPersProjWithoutDistortion(615.1674805, 615.1675415, 312.1889954, 243.4373779);
67 #ifdef VISP_HAVE_XML2
68  vpXmlParserCamera parser;
69  if (!intrinsic_file.empty() && !camera_name.empty())
70  parser.parse(cam, intrinsic_file, camera_name, vpCameraParameters::perspectiveProjWithoutDistortion);
71 #endif
72  std::cout << "cam:\n" << cam << std::endl;
73  std::cout << "poseEstimationMethod: " << poseEstimationMethod << std::endl;
74  std::cout << "tagFamily: " << tagFamily << std::endl;
75 
76  try {
78  vpImageIo::read(I, input_filename);
79 
80 #ifdef VISP_HAVE_X11
81  vpDisplayX d(I);
82 #elif defined(VISP_HAVE_GDI)
83  vpDisplayGDI d(I);
84 #elif defined(VISP_HAVE_OPENCV)
85  vpDisplayOpenCV d(I);
86 #endif
87 
89  vpDetectorBase *detector = new vpDetectorAprilTag(tagFamily);
91 
93  dynamic_cast<vpDetectorAprilTag *>(detector)->setAprilTagQuadDecimate(quad_decimate);
94  dynamic_cast<vpDetectorAprilTag *>(detector)->setAprilTagPoseEstimationMethod(poseEstimationMethod);
95  dynamic_cast<vpDetectorAprilTag *>(detector)->setAprilTagNbThreads(nThreads);
96  dynamic_cast<vpDetectorAprilTag *>(detector)->setDisplayTag(display_tag);
98 
100 
101  double t = vpTime::measureTimeMs();
103  std::vector<vpHomogeneousMatrix> cMo_vec;
104  dynamic_cast<vpDetectorAprilTag *>(detector)->detect(I, tagSize, cam, cMo_vec);
106  t = vpTime::measureTimeMs() - t;
107 
108  std::stringstream ss;
109  ss << "Detection time: " << t << " ms for " << detector->getNbObjects() << " tags";
110  vpDisplay::displayText(I, 40, 20, ss.str(), vpColor::red);
111 
113  for (size_t i = 0; i < detector->getNbObjects(); i++) {
116  std::vector<vpImagePoint> p = detector->getPolygon(i);
117  vpRect bbox = detector->getBBox(i);
121  vpDisplay::displayText(I, (int)(bbox.getTop() - 10), (int)bbox.getLeft(),
122  "Message: \"" + detector->getMessage(i) + "\"", vpColor::red);
124  for (size_t j = 0; j < p.size(); j++) {
125  vpDisplay::displayCross(I, p[j], 14, vpColor::red, 3);
126  std::ostringstream number;
127  number << j;
128  vpDisplay::displayText(I, p[j] + vpImagePoint(15, 5), number.str(), vpColor::blue);
129  }
130  }
131 
132  vpDisplay::displayText(I, 20, 20, "Click to display tag poses", vpColor::red);
133  vpDisplay::flush(I);
135 
137 
139  for (size_t i = 0; i < cMo_vec.size(); i++) {
140  vpDisplay::displayFrame(I, cMo_vec[i], cam, tagSize / 2, vpColor::none, 3);
141  }
143 
144  vpDisplay::displayText(I, 20, 20, "Click to quit.", vpColor::red);
145  vpDisplay::flush(I);
147 
148  delete detector;
149  } catch (const vpException &e) {
150  std::cerr << "Catch an exception: " << e.getMessage() << std::endl;
151  }
152 
153  return EXIT_SUCCESS;
154 #else
155  (void)argc;
156  (void)argv;
157  return 0;
158 #endif
159 }
vpRect getBBox(size_t i) const
double getTop() const
Definition: vpRect.h:175
static bool getClick(const vpImage< unsigned char > &I, bool blocking=true)
Display for windows using GDI (available on any windows 32 platform).
Definition: vpDisplayGDI.h:129
static void displayText(const vpImage< unsigned char > &I, const vpImagePoint &ip, const std::string &s, const vpColor &color)
Use the X11 console to display images on unix-like OS. Thus to enable this class X11 should be instal...
Definition: vpDisplayX.h:151
static const vpColor none
Definition: vpColor.h:192
error that can be emited by ViSP classes.
Definition: vpException.h:71
size_t getNbObjects() const
XML parser to load and save intrinsic camera parameters.
static const vpColor green
Definition: vpColor.h:183
static void flush(const vpImage< unsigned char > &I)
VISP_EXPORT double measureTimeMs()
Definition: vpTime.cpp:88
static const vpColor red
Definition: vpColor.h:180
void initPersProjWithoutDistortion(const double px, const double py, const double u0, const double v0)
static void display(const vpImage< unsigned char > &I)
The vpDisplayOpenCV allows to display image using the OpenCV library. Thus to enable this class OpenC...
Generic class defining intrinsic camera parameters.
static void displayRectangle(const vpImage< unsigned char > &I, const vpImagePoint &topLeft, unsigned int width, unsigned int height, const vpColor &color, bool fill=false, unsigned int thickness=1)
double getLeft() const
Definition: vpRect.h:156
const char * getMessage(void) const
Definition: vpException.cpp:90
static void displayCross(const vpImage< unsigned char > &I, const vpImagePoint &ip, unsigned int size, const vpColor &color, unsigned int thickness=1)
static void read(vpImage< unsigned char > &I, const std::string &filename)
Definition: vpImageIo.cpp:207
static void displayFrame(const vpImage< unsigned char > &I, const vpHomogeneousMatrix &cMo, const vpCameraParameters &cam, double size, const vpColor &color=vpColor::none, unsigned int thickness=1, const vpImagePoint &offset=vpImagePoint(0, 0))
Defines a rectangle in the plane.
Definition: vpRect.h:78
Class that defines a 2D point in an image. This class is useful for image processing and stores only ...
Definition: vpImagePoint.h:88
std::vector< std::string > & getMessage()
int parse(vpCameraParameters &cam, const std::string &filename, const std::string &camera_name, const vpCameraParameters::vpCameraParametersProjType &projModel, const unsigned int image_width=0, const unsigned int image_height=0)
static const vpColor blue
Definition: vpColor.h:186
std::vector< std::vector< vpImagePoint > > & getPolygon()