Visual Servoing Platform  version 3.6.1 under development (2025-03-13)
tutorial-apriltag-detector.cpp
1 #include <visp3/core/vpConfig.h>
4 #include <visp3/detection/vpDetectorAprilTag.h>
6 #include <visp3/core/vpXmlParserCamera.h>
7 #include <visp3/gui/vpDisplayFactory.h>
8 #include <visp3/io/vpImageIo.h>
9 
10 int main(int argc, const char **argv)
11 {
12 #ifdef ENABLE_VISP_NAMESPACE
13  using namespace VISP_NAMESPACE_NAME;
14 #endif
16 #if defined(VISP_HAVE_APRILTAG) && defined(VISP_HAVE_DISPLAY)
18 #ifdef ENABLE_VISP_NAMESPACE
19  using namespace VISP_NAMESPACE_NAME;
20 #endif
21  std::string input_filename = "AprilTag.pgm";
24  double tagSize = 0.053;
25  float quad_decimate = 1.0;
26  int nThreads = 1;
27  std::string intrinsic_file = "";
28  std::string opt_camera_name = "";
29  bool display_tag = false;
30  int color_id = -1;
31  unsigned int thickness = 2;
32  bool z_aligned = false;
33 
34  for (int i = 1; i < argc; ++i) {
35  if (std::string(argv[i]) == "--pose-method" && i + 1 < argc) {
36  poseEstimationMethod = static_cast<vpDetectorAprilTag::vpPoseEstimationMethod>(atoi(argv[++i]));
37  }
38  else if (std::string(argv[i]) == "--tag-size" && i + 1 < argc) {
39  tagSize = atof(argv[++i]);
40  }
41  else if (std::string(argv[i]) == "--input" && i + 1 < argc) {
42  input_filename = std::string(argv[++i]);
43  }
44  else if (std::string(argv[i]) == "--quad-decimate" && i + 1 < argc) {
45  quad_decimate = static_cast<float>(atof(argv[++i]));
46  }
47  else if (std::string(argv[i]) == "--nthreads" && i + 1 < argc) {
48  nThreads = atoi(argv[++i]);
49  }
50 #if defined(VISP_HAVE_PUGIXML)
51  else if (std::string(argv[i]) == "--intrinsic" && i + 1 < argc) {
52  intrinsic_file = std::string(argv[++i]);
53  }
54  else if (std::string(argv[i]) == "--camera-name" && i + 1 < argc) {
55  opt_camera_name = std::string(argv[++i]);
56  }
57 #endif
58  else if (std::string(argv[i]) == "--display-tag") {
59  display_tag = true;
60  }
61  else if (std::string(argv[i]) == "--color" && i + 1 < argc) {
62  color_id = atoi(argv[++i]);
63  }
64  else if (std::string(argv[i]) == "--thickness" && i + 1 < argc) {
65  thickness = static_cast<unsigned int>(atoi(argv[++i]));
66  }
67  else if (std::string(argv[i]) == "--tag-family" && i + 1 < argc) {
68  tagFamily = static_cast<vpDetectorAprilTag::vpAprilTagFamily>(atoi(argv[++i]));
69  }
70  else if (std::string(argv[i]) == "--z-aligned") {
71  z_aligned = true;
72  }
73  else if (std::string(argv[i]) == "--help" || std::string(argv[i]) == "-h") {
74  std::cout << "Usage: " << argv[0]
75  << " [--input <input file>] [--tag-size <tag_size in m>]"
76  << " [--quad-decimate <quad_decimate>] [--nthreads <nb>]"
77  << " [--intrinsic <intrinsic file>] [--camera-name <camera name>]"
78  << " [--pose-method <method> (0: HOMOGRAPHY, 1: HOMOGRAPHY_VIRTUAL_VS, "
79  << " 2: DEMENTHON_VIRTUAL_VS, 3: LAGRANGE_VIRTUAL_VS, "
80  << " 4: BEST_RESIDUAL_VIRTUAL_VS, 5: HOMOGRAPHY_ORTHOGONAL_ITERATION) (default: 0)]"
81  << " [--tag-family <family> (0: TAG_36h11, 1: TAG_36h10 (DEPRECATED), 2: TAG_36ARTOOLKIT (DEPRECATED),"
82  << " 3: TAG_25h9, 4: TAG_25h7 (DEPRECATED), 5: TAG_16h5, 6: TAG_CIRCLE21h7, 7: TAG_CIRCLE49h12,"
83  << " 8: TAG_CUSTOM48h12, 9: TAG_STANDARD41h12, 10: TAG_STANDARD52h13) (default: 0)]"
84  << " [--display-tag] [--color <color_id (0, 1, ...)>]"
85  << " [--thickness <thickness>] [--z-aligned]"
86  << " [--help,-h]"
87  << std::endl;
88  return EXIT_SUCCESS;
89  }
90  }
91 
93  cam.initPersProjWithoutDistortion(615.1674805, 615.1675415, 312.1889954, 243.4373779);
94 #if defined(VISP_HAVE_PUGIXML)
95  vpXmlParserCamera parser;
96  if (!intrinsic_file.empty() && !opt_camera_name.empty()) {
97  parser.parse(cam, intrinsic_file, opt_camera_name, vpCameraParameters::perspectiveProjWithoutDistortion);
98  }
99 #endif
100 
101  std::cout << cam << std::endl;
102  std::cout << "poseEstimationMethod: " << poseEstimationMethod << std::endl;
103  std::cout << "tagFamily: " << tagFamily << std::endl;
104  std::cout << "nThreads : " << nThreads << std::endl;
105  std::cout << "Z aligned: " << z_aligned << std::endl;
106 
107 #if (VISP_CXX_STANDARD >= VISP_CXX_STANDARD_11)
108  std::shared_ptr<vpDisplay> display, display2;
109 #else
110  vpDisplay *display = nullptr;
111  vpDisplay *display2 = nullptr;
112 #endif
113  try {
114  vpImage<vpRGBa> I_color;
115  vpImageIo::read(I_color, input_filename);
117  vpImageConvert::convert(I_color, I);
118 
119 #if (VISP_CXX_STANDARD >= VISP_CXX_STANDARD_11)
120  display = vpDisplayFactory::createDisplay(I);
121 #else
123 #endif
124 
126  vpDetectorAprilTag detector(tagFamily);
128 
130  detector.setAprilTagQuadDecimate(quad_decimate);
131  detector.setAprilTagPoseEstimationMethod(poseEstimationMethod);
132  detector.setAprilTagNbThreads(nThreads);
133  detector.setDisplayTag(display_tag, color_id < 0 ? vpColor::none : vpColor::getColor(color_id), thickness);
134  detector.setZAlignedWithCameraAxis(z_aligned);
136 
138 
139  double t = vpTime::measureTimeMs();
141  std::vector<vpHomogeneousMatrix> cMo_vec;
142  detector.detect(I, tagSize, cam, cMo_vec);
144  t = vpTime::measureTimeMs() - t;
145 
146  std::stringstream ss;
147  ss << "Detection time: " << t << " ms for " << detector.getNbObjects() << " tags";
148  vpDisplay::displayText(I, 40, 20, ss.str(), vpColor::red);
149 
151  for (size_t i = 0; i < detector.getNbObjects(); i++) {
154  std::vector<vpImagePoint> p = detector.getPolygon(i);
155  vpRect bbox = detector.getBBox(i);
159  std::string message = detector.getMessage(i);
162  std::size_t tag_id_pos = message.find("id: ");
163  if (tag_id_pos != std::string::npos) {
164  int tag_id = atoi(message.substr(tag_id_pos + 4).c_str());
165  ss.str("");
166  ss << "Tag id: " << tag_id;
167  vpDisplay::displayText(I, static_cast<int>(bbox.getTop() - 10), static_cast<int>(bbox.getLeft()), ss.str(), vpColor::red);
168  }
170  for (size_t j = 0; j < p.size(); j++) {
171  vpDisplay::displayCross(I, p[j], 14, vpColor::red, 3);
172  std::ostringstream number;
173  number << j;
174  vpDisplay::displayText(I, p[j] + vpImagePoint(15, 5), number.str(), vpColor::blue);
175  }
176  }
177 
178  vpDisplay::displayText(I, 20, 20, "Click to display tag poses", vpColor::red);
179  vpDisplay::flush(I);
181 
183 
185  for (size_t i = 0; i < cMo_vec.size(); i++) {
186  vpDisplay::displayFrame(I, cMo_vec[i], cam, tagSize / 2, vpColor::none, 3);
187  }
189 
190  vpDisplay::displayText(I, 20, 20, "Click to quit.", vpColor::red);
191  vpDisplay::flush(I);
193 
194 
195 #if (VISP_CXX_STANDARD >= VISP_CXX_STANDARD_11)
196  display2 = vpDisplayFactory::createDisplay(I_color, 50, 50);
197 #else
198  display2 = vpDisplayFactory::allocateDisplay(I_color, 50, 50);
199 #endif
200  // To test the displays on a vpRGBa image
201  vpDisplay::display(I_color);
202 
203  // Display frames and tags but remove the display of the last element
204  std::vector<std::vector<vpImagePoint> > tagsCorners = detector.getTagsCorners();
205  tagsCorners.pop_back();
206  detector.displayTags(I_color, tagsCorners, vpColor::none, 3);
207 
208  cMo_vec.pop_back();
209  detector.displayFrames(I_color, cMo_vec, cam, tagSize / 2, vpColor::none, 3);
210 
211  vpDisplay::displayText(I_color, 20, 20, "Click to quit.", vpColor::red);
212  vpDisplay::flush(I_color);
213  vpDisplay::getClick(I_color);
214  }
215  catch (const vpException &e) {
216  std::cerr << "Catch an exception: " << e.getMessage() << std::endl;
217  }
218 
219 #if (VISP_CXX_STANDARD < VISP_CXX_STANDARD_11)
220  if (display != nullptr) {
221  delete display;
222  }
223  if (display2 != nullptr) {
224  delete display2;
225  }
226 #endif
227 #else
228  (void)argc;
229  (void)argv;
230 #endif
231  return EXIT_SUCCESS;
232 }
Generic class defining intrinsic camera parameters.
void initPersProjWithoutDistortion(double px, double py, double u0, double v0)
@ perspectiveProjWithoutDistortion
Perspective projection without distortion model.
static vpColor getColor(const unsigned int &i)
Definition: vpColor.h:292
static const vpColor red
Definition: vpColor.h:198
static const vpColor none
Definition: vpColor.h:210
static const vpColor blue
Definition: vpColor.h:204
static const vpColor green
Definition: vpColor.h:201
@ TAG_36h11
AprilTag 36h11 pattern (recommended)
Class that defines generic functionalities for display.
Definition: vpDisplay.h:178
static bool getClick(const vpImage< unsigned char > &I, bool blocking=true)
static void display(const vpImage< unsigned char > &I)
static void displayFrame(const vpImage< unsigned char > &I, const vpHomogeneousMatrix &cMo, const vpCameraParameters &cam, double size, const vpColor &color=vpColor::none, unsigned int thickness=1, const vpImagePoint &offset=vpImagePoint(0, 0), const std::string &frameName="", const vpColor &textColor=vpColor::black, const vpImagePoint &textOffset=vpImagePoint(15, 15))
static void displayCross(const vpImage< unsigned char > &I, const vpImagePoint &ip, unsigned int size, const vpColor &color, unsigned int thickness=1)
static void flush(const vpImage< unsigned char > &I)
static void displayRectangle(const vpImage< unsigned char > &I, const vpImagePoint &topLeft, unsigned int width, unsigned int height, const vpColor &color, bool fill=false, unsigned int thickness=1)
static void displayText(const vpImage< unsigned char > &I, const vpImagePoint &ip, const std::string &s, const vpColor &color)
error that can be emitted by ViSP classes.
Definition: vpException.h:60
const char * getMessage() const
Definition: vpException.cpp:65
static void convert(const vpImage< unsigned char > &src, vpImage< vpRGBa > &dest)
static void read(vpImage< unsigned char > &I, const std::string &filename, int backend=IO_DEFAULT_BACKEND)
Definition: vpImageIo.cpp:147
Class that defines a 2D point in an image. This class is useful for image processing and stores only ...
Definition: vpImagePoint.h:82
Defines a rectangle in the plane.
Definition: vpRect.h:79
double getLeft() const
Definition: vpRect.h:173
double getTop() const
Definition: vpRect.h:192
XML parser to load and save intrinsic camera parameters.
int parse(vpCameraParameters &cam, const std::string &filename, const std::string &camera_name, const vpCameraParameters::vpCameraParametersProjType &projModel, unsigned int image_width=0, unsigned int image_height=0, bool verbose=true)
std::shared_ptr< vpDisplay > createDisplay()
Return a smart pointer vpDisplay specialization if a GUI library is available or nullptr otherwise.
vpDisplay * allocateDisplay()
Return a newly allocated vpDisplay specialization if a GUI library is available or nullptr otherwise.
VISP_EXPORT double measureTimeMs()