doxygen/visp-daily/vpDetectorDNNOpenCV_8h_source.html

 /*

  * ViSP, open source Visual Servoing Platform software.

  * Copyright (C) 2005 - 2024 by Inria. All rights reserved.

  *

  * This software is free software; you can redistribute it and/or modify

  * it under the terms of the GNU General Public License as published by

  * the Free Software Foundation; either version 2 of the License, or

  * (at your option) any later version.

  * See the file LICENSE.txt at the root directory of this source

  * distribution for additional information about the GNU GPL.

  *

  * For using ViSP with software that can not be combined with the GNU

  * GPL, please contact Inria about acquiring a ViSP Professional

  * Edition License.

  *

  * See https://visp.inria.fr for more information.

  *

  * This software was developed at:

  * Inria Rennes - Bretagne Atlantique

  * Campus Universitaire de Beaulieu

  * 35042 Rennes Cedex

  * France

  *

  * If you have questions regarding the use of this file, please contact

  * Inria at visp@inria.fr

  *

  * This file is provided AS IS with NO WARRANTY OF ANY KIND, INCLUDING THE

  * WARRANTY OF DESIGN, MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.

  *

  * Description:

  * DNN object detection using OpenCV DNN module.

  */


 #ifndef VP_DETECTOR_DNN_OPENCV_H

 #define VP_DETECTOR_DNN_OPENCV_H


 #include <visp3/core/vpConfig.h>


 // Check if std:c++17 or higher.

 // Here we cannot use (VISP_CXX_STANDARD >= VISP_CXX_STANDARD_17) in the declaration of the class

 #if (VISP_HAVE_OPENCV_VERSION >= 0x030403) && defined(HAVE_OPENCV_DNN) && \

     ((__cplusplus >= 201703L) || (defined(_MSVC_LANG) && (_MSVC_LANG >= 201703L)))


 #include <map>

 #include <string>

 #include <vector>


 #include <opencv2/dnn.hpp>


 #include <visp3/core/vpColor.h>

 #include <visp3/core/vpDisplay.h>

 #include <visp3/core/vpImage.h>

 #include <visp3/core/vpRect.h>


 #include <optional>


 #ifdef VISP_HAVE_NLOHMANN_JSON

 #include VISP_NLOHMANN_JSON(json.hpp)

 #endif


 BEGIN_VISP_NAMESPACE

 class VISP_EXPORT vpDetectorDNNOpenCV

 {

 public:

   /*!
    * Enumeration listing the types of DNN for which vpDetectorDNNOpenCV declares
    * a dedicated result-parsing method (see the postProcess_* member functions).
    * The numeric values are explicit and contiguous, from 0 to COUNT.
    */
   typedef enum DNNResultsParsingType

   {

     USER_SPECIFIED = 0, /*!< Default parsing type of a NetConfig; presumably means the parsing is done by a user-supplied function - confirm in the .cpp. */

     FASTER_RCNN = 1, /*!< Faster-RCNN network (see postProcess_FasterRCNN). */

     SSD_MOBILENET = 2, /*!< SSD MobileNet network (see postProcess_SSD_MobileNet). */

     RESNET_10 = 3, /*!< ResNet-10 network (see postProcess_ResNet_10). */

     YOLO_V3 = 4, /*!< YOLO v3 network (see postProcess_YoloV3_V4). */

     YOLO_V4 = 5, /*!< YOLO v4 network (see postProcess_YoloV3_V4). */

     YOLO_V5 = 6, /*!< YOLO v5 network (see postProcess_YoloV5_V7). */

     YOLO_V7 = 7, /*!< YOLO v7 network (see postProcess_YoloV5_V7). */

     YOLO_V8 = 8, /*!< YOLO v8 network (see postProcess_YoloV8_V11). */

     YOLO_V11 = 9, /*!< YOLO v11 network (see postProcess_YoloV8_V11). */

     COUNT = 10 /*!< Equals the number of enumerators above; not a network type itself. */

   } DNNResultsParsingType;


   /*!
    * Raw detection proposals, passed by reference to the postProcess* methods.
    * NOTE(review): the three vectors are presumably index-aligned (entry i of each
    * describes the same candidate) - confirm against the parsing code in the .cpp.
    */
   typedef struct DetectionCandidates

   {

     std::vector< float > m_confidences; /*!< Confidence of each candidate. */

     std::vector< cv::Rect > m_boxes; /*!< Bounding box of each candidate. */

     std::vector< int > m_classIds; /*!< Class identifier of each candidate. */

   } DetectionCandidates;


   /*!
    * Structure containing the bounding box, expressed in pixels, the confidence
    * and the class information of a detection.
    */
   typedef class DetectedFeatures2D
   {
   protected:
     vpRect m_bbox; /*!< Bounding box of the detection. */
     double m_score; /*!< Confidence score of the detection. */
     unsigned int m_cls; /*!< Class identifier of the detection. */
     std::optional<std::string> m_classname; /*!< Class name, when one is available. */

   public:
     /*!
      * Construct a new DetectedFeatures2D object.
      *
      * \param u_min, u_max : Bounds of the bounding box along u.
      * \param v_min, v_max : Bounds of the bounding box along v.
      * \param cls : Class identifier.
      * \param score : Confidence score.
      * \param classname : Optional class name; stored as given (empty stays empty).
      *
      * The box is built from the corners vpImagePoint(v_min, u_min) and
      * vpImagePoint(v_max, u_max).
      */
     inline explicit DetectedFeatures2D(double u_min, double u_max, double v_min, double v_max,
                                        unsigned int cls, double score,
                                        const std::optional<std::string> &classname)
       : m_bbox(vpImagePoint(v_min, u_min), vpImagePoint(v_max, u_max))
       , m_score(score)
       , m_cls(cls)
       , m_classname(classname)
     { }

     /*! \return A copy of the bounding box. */
     inline vpRect getBoundingBox() const
     {
       return m_bbox;
     }

     /*! \return The confidence score. */
     inline double getConfidenceScore() const
     {
       return m_score;
     }

     /*! \return The class identifier. */
     inline unsigned int getClassId() const
     {
       return m_cls;
     }

     /*! \return A copy of the optional class name. */
     inline std::optional<std::string> getClassName() const
     {
       return m_classname;
     }

     /*!
      * Draw the detection on an image (defined after the enclosing class).
      */
     template < typename Type >
     void display(const vpImage< Type > &img, const vpColor &color = vpColor::blue, unsigned int thickness = 1) const;

     friend vpDetectorDNNOpenCV;
   } DetectedFeatures2D;


   typedef class NetConfig

   {

   private:

     float m_confThreshold; /*!< Confidence threshold; from_json() rejects values <= 0. */

     float m_nmsThreshold; /*!< NMS threshold; from_json() rejects values <= 0. */

     std::vector<std::string> m_classNames; /*!< Names of the classes. */

     cv::Size m_inputSize; /*!< Width x height, serialized under the JSON key "resolution". */

     double m_filterSizeRatio; /*!< Size-filter ratio; toString() reports it as "disabled" when not greater than epsilon. */

     cv::Scalar m_mean; /*!< Mean values; only the first three components are copied, serialized and printed. */

     double m_scaleFactor; /*!< Scale factor, serialized under the JSON key "scale". */

     bool m_swapRB; /*!< If true, swap R and B for mean subtraction, e.g. when a model has been trained on BGR image format.*/

     DNNResultsParsingType m_parsingMethodType; /*!< Type of parsing applied to the DNN results. */

     std::string m_modelFilename; /*!< Model file, serialized under the JSON key "modelFile". */

     std::string m_modelConfigFilename; /*!< Path towards the model additional configuration file, e.g. pbtxt file.*/

     std::string m_framework; /*!< Framework name; optional, printed as "None" when empty. */

 #ifdef VISP_HAVE_NLOHMANN_JSON

     /*!
      * Read the network configuration from JSON. All values are optional: when a key
      * is absent, the value currently stored in \b config is kept.
      *
      * \param j : JSON object to read.
      * \param config : Configuration to update.
      *
      * \throws vpException(vpException::badValue) if the confidence threshold or the
      * NMS threshold is <= 0.
      * \throws vpException(vpException::dimensionError) if "mean" does not hold
      * exactly 3 values.
      */
     friend inline void from_json(const nlohmann::json &j, NetConfig &config)
     {
       config.m_confThreshold = j.value("confidenceThreshold", config.m_confThreshold);
       if (config.m_confThreshold <= 0) {
         throw vpException(vpException::badValue, "Confidence threshold should be > 0");
       }

       config.m_nmsThreshold = j.value("nmsThreshold", config.m_nmsThreshold);
       if (config.m_nmsThreshold <= 0) {
         // The message previously named the confidence threshold (copy-paste slip).
         throw vpException(vpException::badValue, "NMS threshold should be > 0");
       }

       config.m_filterSizeRatio = j.value("filterSizeRatio", config.m_filterSizeRatio);

       config.m_classNames = j.value("classNames", config.m_classNames);

       // The resolution is exchanged as a (width, height) pair.
       std::pair<unsigned int, unsigned int> resolution = j.value("resolution", std::pair<unsigned int, unsigned int>(config.m_inputSize.width, config.m_inputSize.height));
       config.m_inputSize.width = resolution.first;
       config.m_inputSize.height = resolution.second;

       // Only the first three components of the mean are exchanged.
       std::vector<double> v_mean = j.value("mean", std::vector<double>({ config.m_mean[0], config.m_mean[1], config.m_mean[2] }));
       if (v_mean.size() != 3) {
         throw(vpException(vpException::dimensionError, "Mean should have size = 3"));
       }
       config.m_mean = cv::Scalar(v_mean[0], v_mean[1], v_mean[2]);

       config.m_scaleFactor = j.value("scale", config.m_scaleFactor);
       config.m_swapRB = j.value("swapRB", config.m_swapRB);
       // The parsing type is stored as a string and converted back to the enumeration.
       config.m_parsingMethodType = dnnResultsParsingTypeFromString(j.value("parsingType", dnnResultsParsingTypeToString(config.m_parsingMethodType)));
       config.m_modelFilename = j.value("modelFile", config.m_modelFilename);
       config.m_modelConfigFilename = j.value("configurationFile", config.m_modelConfigFilename);
       config.m_framework = j.value("framework", config.m_framework);
     }


     /*!
      * Parse a vpDetectorDNNOpenCV::NetConfig into JSON format.
      *
      * \param j : JSON value that receives the serialized configuration; any previous
      * content is replaced.
      * \param config : Configuration to serialize.
      */
     friend inline void to_json(nlohmann::json &j, const NetConfig &config)
     {
       // The input size is written as a (width, height) pair and the mean as its first 3 components.
       const std::pair<unsigned int, unsigned int> widthHeight(config.m_inputSize.width, config.m_inputSize.height);
       const std::vector<double> meanValues { config.m_mean[0], config.m_mean[1], config.m_mean[2] };

       j = nlohmann::json::object();
       j["confidenceThreshold"] = config.m_confThreshold;
       j["nmsThreshold"] = config.m_nmsThreshold;
       j["filterSizeRatio"] = config.m_filterSizeRatio;
       j["classNames"] = config.m_classNames;
       j["resolution"] = widthHeight;
       j["mean"] = meanValues;
       j["scale"] = config.m_scaleFactor;
       j["swapRB"] = config.m_swapRB;
       j["parsingType"] = dnnResultsParsingTypeToString(config.m_parsingMethodType);
       j["modelFile"] = config.m_modelFilename;
       j["configurationFile"] = config.m_modelConfigFilename;
       j["framework"] = config.m_framework;
     }

 #endif


   public:

     /*!
      * Parse the file containing the list of classes the DNN can detect.
      *
      * Two layouts are accepted, decided line by line:
      * - a line without '[' is taken verbatim as one class name;
      * - a line containing '[' is scanned for double-quoted names, e.g.
      *   ["person", "car"]; every non-empty quoted string becomes a class name.
      *
      * Text that is not inside a pair of double quotes (commas, the closing bracket,
      * trailing spaces or a '\r', an unterminated quote) is ignored, so a malformed
      * line can no longer make the scan loop forever.
      *
      * \param filename : Path of the file to read.
      * \return The class names in file order; empty if the file cannot be read.
      */
     inline static std::vector<std::string> parseClassNamesFile(const std::string &filename)
     {
       std::vector<std::string> classNames;
       std::ifstream ifs(filename);
       std::string line;
       while (std::getline(ifs, line)) {
         const std::string::size_type bracketPos = line.find('[');
         if (bracketPos == std::string::npos) {
           // One class name per line.
           classNames.push_back(line);
           continue;
         }

         // Bracketed list: extract each "..." pair found after the opening bracket.
         std::string::size_type cursor = bracketPos + 1;
         while (cursor < line.size()) {
           const std::string::size_type openQuote = line.find('"', cursor);
           if (openQuote == std::string::npos) {
             break; // Nothing left but separators / closing bracket.
           }
           const std::string::size_type closeQuote = line.find('"', openQuote + 1);
           if (closeQuote == std::string::npos) {
             break; // Unterminated name: ignore it.
           }
           if (closeQuote > openQuote + 1) {
             classNames.push_back(line.substr(openQuote + 1, closeQuote - openQuote - 1));
           }
           // Always advance, even for an empty name, so the scan terminates.
           cursor = closeQuote + 1;
         }
       }
       return classNames;
     }


     /*!
      * Default constructor of the structure vpDetectorDNNOpenCV::NetConfig, required
      * for JSON serialization.
      *
      * Defaults: confidence threshold 0.5, NMS threshold 0.4, 300 x 300 input,
      * size filter ratio 0, mean (127.5, 127.5, 127.5), scale 2/255, R/B swap on,
      * USER_SPECIFIED parsing. The class names and the three file/framework strings
      * are left default-constructed, i.e. empty.
      */
     inline NetConfig()
       : m_confThreshold(0.5f), m_nmsThreshold(0.4f)
       , m_inputSize(300, 300)
       , m_filterSizeRatio(0.)
       , m_mean(127.5, 127.5, 127.5), m_scaleFactor(2.0 / 255.0), m_swapRB(true)
       , m_parsingMethodType(vpDetectorDNNOpenCV::USER_SPECIFIED)
     { }


     /*!
      * Copy constructor.
      *
      * \param config : Configuration to copy. Every member is copied as is, except the
      * mean, of which only the first three components are taken.
      */
     inline NetConfig(const NetConfig &config)
       : m_confThreshold(config.m_confThreshold), m_nmsThreshold(config.m_nmsThreshold)
       , m_classNames(config.m_classNames)
       , m_inputSize(config.m_inputSize.width, config.m_inputSize.height)
       , m_filterSizeRatio(config.m_filterSizeRatio)
       , m_mean(config.m_mean[0], config.m_mean[1], config.m_mean[2])
       , m_scaleFactor(config.m_scaleFactor), m_swapRB(config.m_swapRB)
       , m_parsingMethodType(config.m_parsingMethodType)
       , m_modelFilename(config.m_modelFilename), m_modelConfigFilename(config.m_modelConfigFilename)
       , m_framework(config.m_framework)
     { }


     /*!
      * Construct a new NetConfig object from an in-memory list of class names.
      *
      * \param confThresh : Confidence threshold.
      * \param nmsThresh : NMS threshold.
      * \param classNames : Names of the classes.
      * \param dnnInputSize : Input size of the DNN.
      * \param filterSizeRatio : Size filter ratio (default 0.).
      * \param mean : Mean values (default 127.5 for each of the three components).
      * \param scaleFactor : Scale factor (default 2/255).
      * \param swapRB : Whether R and B are swapped (default true).
      * \param parsingType : Type of parsing of the DNN results (default USER_SPECIFIED).
      * \param modelFilename : Model file (default empty).
      * \param configFilename : Additional configuration file (default empty).
      * \param framework : Framework name (default empty).
      *
      * Every argument is stored as given; no validation is performed here.
      */
     inline NetConfig(float confThresh, const float &nmsThresh, const std::vector<std::string> &classNames, const cv::Size &dnnInputSize, const double &filterSizeRatio = 0.

       , const cv::Scalar &mean = cv::Scalar(127.5, 127.5, 127.5), const double &scaleFactor = 2. / 255., const bool &swapRB = true

       , const DNNResultsParsingType &parsingType = vpDetectorDNNOpenCV::USER_SPECIFIED, const std::string &modelFilename = "", const std::string &configFilename = "", const std::string &framework = "")

       : m_confThreshold(confThresh)

       , m_nmsThreshold(nmsThresh)

       , m_classNames(classNames)

       , m_inputSize(dnnInputSize)

       , m_filterSizeRatio(filterSizeRatio)

       , m_mean(mean)

       , m_scaleFactor(scaleFactor)

       , m_swapRB(swapRB)

       , m_parsingMethodType(parsingType)

       , m_modelFilename(modelFilename)

       , m_modelConfigFilename(configFilename)

       , m_framework(framework)

     { }


     /*!
      * Construct a new NetConfig object, reading the class names from a file.
      *
      * \param confThresh : Confidence threshold.
      * \param nmsThresh : NMS threshold.
      * \param classNamesFile : File parsed with parseClassNamesFile() to get the class names.
      * \param dnnInputSize : Input size of the DNN.
      * \param filterSizeRatio : Size filter ratio (default 0.).
      * \param mean : Mean values (default 127.5 for each of the three components).
      * \param scaleFactor : Scale factor (default 2/255).
      * \param swapRB : Whether R and B are swapped (default true).
      * \param parsingType : Type of parsing of the DNN results (default USER_SPECIFIED).
      * \param modelFilename : Model file (default empty).
      * \param configFilename : Additional configuration file (default empty).
      * \param framework : Framework name (default empty).
      */
     inline NetConfig(const float &confThresh, const float &nmsThresh, const std::string &classNamesFile, const cv::Size &dnnInputSize, const double &filterSizeRatio = 0.
       , const cv::Scalar &mean = cv::Scalar(127.5, 127.5, 127.5), const double &scaleFactor = 2. / 255., const bool &swapRB = true
       , const DNNResultsParsingType &parsingType = vpDetectorDNNOpenCV::USER_SPECIFIED, const std::string &modelFilename = "", const std::string &configFilename = "", const std::string &framework = "")
       : m_confThreshold(confThresh), m_nmsThreshold(nmsThresh)
       , m_classNames(parseClassNamesFile(classNamesFile)) // static helper: no member is read
       , m_inputSize(dnnInputSize)
       , m_filterSizeRatio(filterSizeRatio)
       , m_mean(mean), m_scaleFactor(scaleFactor), m_swapRB(swapRB)
       , m_parsingMethodType(parsingType)
       , m_modelFilename(modelFilename), m_modelConfigFilename(configFilename)
       , m_framework(framework)
     { }


     /*!
      * Build a multi-line, human-readable summary of the configuration.
      *
      * One "label : value" line is produced per setting, each ended by a newline.
      * The optional configuration file and framework are shown as "None" (with the
      * quotes) when empty, and the size filter as "disabled" when its ratio is not
      * greater than the double epsilon.
      *
      * \return The formatted text.
      */
     inline std::string toString() const
     {
       const std::string unset("\"None\"");
       const std::string configShown = m_modelConfigFilename.empty() ? unset : m_modelConfigFilename;
       const std::string frameworkShown = m_framework.empty() ? unset : m_framework;
       const std::string swapShown(m_swapRB ? "true" : "false");
       const bool sizeFilterOn = (m_filterSizeRatio > std::numeric_limits<double>::epsilon());
       const std::string filterShown = sizeFilterOn ? std::to_string(m_filterSizeRatio) : std::string("disabled");
       const std::string eol("\n");

       std::string text;
       text.append("Model                : ").append(m_modelFilename).append(eol);
       text.append("Type                 : ").append(vpDetectorDNNOpenCV::dnnResultsParsingTypeToString(m_parsingMethodType)).append(eol);
       text.append("Config     (optional): ").append(configShown).append(eol);
       text.append("Framework  (optional): ").append(frameworkShown).append(eol);
       text.append("Width x Height       : ").append(std::to_string(m_inputSize.width)).append(" x ").append(std::to_string(m_inputSize.height)).append(eol);
       text.append("Mean RGB             : ").append(std::to_string(m_mean[0])).append(" ").append(std::to_string(m_mean[1])).append(" ").append(std::to_string(m_mean[2])).append(eol);
       text.append("Scale                : ").append(std::to_string(m_scaleFactor)).append(eol);
       text.append("Swap RB?             : ").append(swapShown).append(eol);
       text.append("Confidence threshold : ").append(std::to_string(m_confThreshold)).append(eol);
       text.append("NMS threshold        : ").append(std::to_string(m_nmsThreshold)).append(eol);
       text.append("Filter threshold     : ").append(filterShown).append(eol);
       return text;
     }


     /*!
      * Stream the text produced by toString().
      *
      * \param os : Output stream.
      * \param config : Configuration to print.
      * \return The stream \b os.
      */
     friend inline std::ostream &operator<<(std::ostream &os, const NetConfig &config)
     {
       return os << config.toString();
     }


     /*!
      * Copy assignment.
      *
      * \param config : Configuration to copy. Every member is copied as is, except the
      * mean, which is rebuilt from its first three components only.
      * \return A reference to this object.
      */
     NetConfig &operator=(const NetConfig &config)
     {
       // Detection thresholds and filtering.
       m_confThreshold = config.m_confThreshold;
       m_nmsThreshold = config.m_nmsThreshold;
       m_filterSizeRatio = config.m_filterSizeRatio;

       // Input pre-processing.
       m_inputSize.width = config.m_inputSize.width;
       m_inputSize.height = config.m_inputSize.height;
       m_mean = cv::Scalar(config.m_mean[0], config.m_mean[1], config.m_mean[2]);
       m_scaleFactor = config.m_scaleFactor;
       m_swapRB = config.m_swapRB;

       // Model description.
       m_classNames = config.m_classNames;
       m_parsingMethodType = config.m_parsingMethodType;
       m_modelFilename = config.m_modelFilename;
       m_modelConfigFilename = config.m_modelConfigFilename;
       m_framework = config.m_framework;

       return *this;
     }


     friend vpDetectorDNNOpenCV;

   } NetConfig;


   // --- Helpers on the parsing-type enumeration (defined in the .cpp) ---
   // NOTE(review): presumably returns a printable list of the supported parsing types - confirm.
   static std::string getAvailableDnnResultsParsingTypes();

   // String <-> enumeration conversions; NetConfig uses them for the "parsingType" JSON entry.
   static std::string dnnResultsParsingTypeToString(const DNNResultsParsingType &type);

   static DNNResultsParsingType dnnResultsParsingTypeFromString(const std::string &name);

   // Same signature as NetConfig::parseClassNamesFile(); whether it shares its implementation is not visible here.
   static std::vector<std::string> parseClassNamesFile(const std::string &filename);

   // --- Construction / destruction ---
   vpDetectorDNNOpenCV();

   // parsingMethod defaults to postProcess_unimplemented.
   vpDetectorDNNOpenCV(const NetConfig &config, const DNNResultsParsingType &typeParsingMethod, void (*parsingMethod)(DetectionCandidates &, std::vector<cv::Mat> &, const NetConfig &) = postProcess_unimplemented);

 #ifdef VISP_HAVE_NLOHMANN_JSON

   // JSON-based configuration; only available when ViSP is built with nlohmann JSON.
   vpDetectorDNNOpenCV(const std::string &jsonPath, void (*parsingMethod)(DetectionCandidates &, std::vector<cv::Mat> &, const NetConfig &) = postProcess_unimplemented);

   void initFromJSON(const std::string &jsonPath);

   void saveConfigurationInJSON(const std::string &jsonPath) const;

 #endif

   virtual ~vpDetectorDNNOpenCV();


   // --- Detection ---
   // Overloads for three input image types (grayscale vpImage, color vpImage, cv::Mat) and three
   // output layouts (flat vector, map keyed by a string, vector of (string, detections) pairs).
   // NOTE(review): the string key is presumably the class name, and the meaning of the returned
   // bool is not visible in this header - confirm both in the .cpp.
   virtual bool detect(const vpImage<unsigned char> &I, std::vector<DetectedFeatures2D> &output);

   virtual bool detect(const vpImage<unsigned char> &I, std::map< std::string, std::vector<DetectedFeatures2D>> &output);

   virtual bool detect(const vpImage<unsigned char> &I, std::vector< std::pair<std::string, std::vector<DetectedFeatures2D>>> &output);

   virtual bool detect(const vpImage<vpRGBa> &I, std::vector<DetectedFeatures2D> &output);

   virtual bool detect(const vpImage<vpRGBa> &I, std::map< std::string, std::vector<DetectedFeatures2D>> &output);

   virtual bool detect(const vpImage<vpRGBa> &I, std::vector< std::pair<std::string, std::vector<DetectedFeatures2D>>> &output);

   virtual bool detect(const cv::Mat &I, std::vector<DetectedFeatures2D> &output);

   virtual bool detect(const cv::Mat &I, std::map< std::string, std::vector<DetectedFeatures2D>> &output);

   virtual bool detect(const cv::Mat &I, std::vector< std::pair<std::string, std::vector<DetectedFeatures2D>>> &output);


   // --- Network loading; config and framework are optional (empty by default) ---
   void readNet(const std::string &model, const std::string &config = "", const std::string &framework = "");


   // --- Setters (defined in the .cpp) ---
   // NOTE(review): each presumably updates the matching NetConfig field or cv::dnn::Net option - confirm.
   void setNetConfig(const NetConfig &config);

   void setConfidenceThreshold(const float &confThreshold);

   void setNMSThreshold(const float &nmsThreshold);

   void setDetectionFilterSizeRatio(const double &sizeRatio);

   void setInputSize(const int &width, const int &height);

   void setMean(const double &meanR, const double &meanG, const double &meanB);

   void setPreferableBackend(const int &backendId);

   void setPreferableTarget(const int &targetId);

   void setScaleFactor(const double &scaleFactor);

   void setSwapRB(const bool &swapRB);

   // parsingMethod defaults to postProcess_unimplemented.
   void setParsingMethod(const DNNResultsParsingType &typeParsingMethod, void (*parsingMethod)(DetectionCandidates &, std::vector<cv::Mat> &, const NetConfig &) = postProcess_unimplemented);

   /*!
    * \return A const reference to the configuration stored in the detector.
    */
   inline const NetConfig &getNetConfig() const { return m_netConfig; }


 #ifdef VISP_HAVE_NLOHMANN_JSON

   /*!
    * Read the network configuration from JSON.
    *
    * \param j : JSON object to read.
    * \param network : Detector whose NetConfig is replaced by the "networkSettings"
    * entry; when that key is absent the current configuration is kept.
    */
   friend inline void from_json(const nlohmann::json &j, vpDetectorDNNOpenCV &network)

   {

     network.m_netConfig = j.value("networkSettings", network.m_netConfig);

   }


   /*!
    * Parse the network configuration into JSON format.
    *
    * \param j : JSON value that receives an object with the single key
    * "networkSettings"; any previous content is replaced.
    * \param network : Detector whose NetConfig is serialized.
    */
   friend inline void to_json(nlohmann::json &j, const vpDetectorDNNOpenCV &network)
   {
     j = nlohmann::json::object();
     j["networkSettings"] = network.m_netConfig;
   }

 #endif


   /*!
    * Stream the detector's network configuration.
    *
    * \param os : Output stream.
    * \param network : Detector whose NetConfig is printed.
    * \return The stream \b os.
    */
   friend inline std::ostream &operator<<(std::ostream &os, const vpDetectorDNNOpenCV &network)
   {
     return os << network.m_netConfig;
   }


 protected:

 // Only declared when building against OpenCV 3.4.3 exactly.
 #if (VISP_HAVE_OPENCV_VERSION == 0x030403)

   std::vector<cv::String> getOutputsNames();

 #endif

   // --- Size-based filtering of detections (defined in the .cpp) ---
   // NOTE(review): minRatioOfAreaOk presumably relates to the size filter ratio of NetConfig - confirm.
   std::vector<DetectedFeatures2D>

     filterDetectionSingleClassInput(const std::vector<DetectedFeatures2D> &detected_features, const double minRatioOfAreaOk);


   std::vector<DetectedFeatures2D>

     filterDetectionMultiClassInput(const std::vector<DetectedFeatures2D> &detected_features, const double minRatioOfAreaOk);


   std::map<std::string, std::vector<vpDetectorDNNOpenCV::DetectedFeatures2D>>

     filterDetectionMultiClassInput(const std::map< std::string, std::vector<vpDetectorDNNOpenCV::DetectedFeatures2D>> &detected_features, const double minRatioOfAreaOk);


   // --- Parsing of the raw DNN outputs into DetectionCandidates ---
   // NOTE(review): presumably dispatches to one of the network-specific methods below - confirm.
   void postProcess(DetectionCandidates &proposals);


   // One parser per supported network family; all share the same parameter list.
   void postProcess_YoloV3_V4(DetectionCandidates &proposals, std::vector<cv::Mat> &dnnRes, const NetConfig &netConfig);


   void postProcess_YoloV5_V7(DetectionCandidates &proposals, std::vector<cv::Mat> &dnnRes, const NetConfig &netConfig);


   void postProcess_YoloV8_V11(DetectionCandidates &proposals, std::vector<cv::Mat> &dnnRes, const NetConfig &netConfig);


   void postProcess_FasterRCNN(DetectionCandidates &proposals, std::vector<cv::Mat> &dnnRes, const NetConfig &netConfig);


 // Only declared when ViSP is built with its deprecated functions.
 #if defined(VISP_BUILD_DEPRECATED_FUNCTIONS)

   void postProcess_SSD_MobileNet(DetectionCandidates &proposals, std::vector<cv::Mat> &dnnRes, const NetConfig &netConfig);

 #endif


   void postProcess_ResNet_10(DetectionCandidates &proposals, std::vector<cv::Mat> &dnnRes, const NetConfig &netConfig);


   // Static, so it can serve as the default value of the parsingMethod function-pointer parameters.
   static void postProcess_unimplemented(DetectionCandidates &proposals, std::vector<cv::Mat> &dnnRes, const NetConfig &netConfig);


   bool m_applySizeFilterAfterNMS; /*!< If true, the detections are filtered on the area of their bounding box (NOTE(review): the exact criterion lives in the .cpp). */

   cv::Mat m_blob; /*!< Buffer for the blob in input net. */

   vpImage<vpRGBa> m_I_color; /*!< Buffer for gray to RGBa image conversion. */

   cv::Mat m_img; /*!< Buffer for the input image. */

   std::vector<int> m_indices; /*!< Indices for NMS. */

   cv::dnn::Net m_net; /*!< DNN network. */

   NetConfig m_netConfig; /*!< Configuration of the DNN. */

   std::vector<cv::String> m_outNames; /*!< Names of layers with unconnected outputs. */

   std::vector<cv::Mat> m_dnnRes; /*!< Contains all output blobs for each layer specified in m_outNames. */

   void (*m_parsingMethod)(DetectionCandidates &, std::vector<cv::Mat> &, const NetConfig &); /*!< Function pointer with the signature of the parsingMethod parameters; presumably stores the user-supplied parser - confirm. */

 };


 /*!
  * Draw the detection on an image: its bounding box (not filled), then a text label
  * placed at the top-right corner of the box.
  *
  * The label is the class name when available, the class identifier otherwise,
  * followed by the confidence as a percentage in parentheses (4 significant digits).
  *
  * \param img : Image on which to draw.
  * \param color : Color of the rectangle and of the text.
  * \param thickness : Thickness of the rectangle border.
  */
 template < typename Type >
 inline void
 vpDetectorDNNOpenCV::DetectedFeatures2D::display(const vpImage< Type > &img, const vpColor &color, unsigned int thickness) const
 {
   vpDisplay::displayRectangle(img, m_bbox, color, false, thickness);

   std::stringstream label;
   if (!m_classname.has_value()) {
     label << m_cls;
   }
   else {
     label << m_classname.value();
   }
   const double percent = m_score * 100.;
   label << "(" << std::setprecision(4) << percent << "%)";

   vpDisplay::displayText(img, m_bbox.getTopRight(), label.str(), color);
 }

 END_VISP_NAMESPACE

 #endif

 #endif

vpColor
Class to define RGB colors available for display functionalities.
Definition: vpColor.h:157

vpColor::blue
static const vpColor blue
Definition: vpColor.h:204

vpDetectorDNNOpenCV::DetectedFeatures2D
Structure containing the bounding box, expressed in pixels, confidence and class information about an...
Definition: vpDetectorDNNOpenCV.h:121

vpDetectorDNNOpenCV::DetectedFeatures2D::display
void display(const vpImage< Type > &img, const vpColor &color=vpColor::blue, unsigned int thickness=1) const
Definition: vpDetectorDNNOpenCV.h:609

vpDetectorDNNOpenCV::DetectedFeatures2D::m_bbox
vpRect m_bbox
Definition: vpDetectorDNNOpenCV.h:123

vpDetectorDNNOpenCV::DetectedFeatures2D::vpDetectorDNNOpenCV
friend vpDetectorDNNOpenCV
Definition: vpDetectorDNNOpenCV.h:176

vpDetectorDNNOpenCV::DetectedFeatures2D::getBoundingBox
vpRect getBoundingBox() const
Definition: vpDetectorDNNOpenCV.h:159

vpDetectorDNNOpenCV::DetectedFeatures2D::DetectedFeatures2D
DetectedFeatures2D(double u_min, double u_max, double v_min, double v_max, unsigned int cls, double score, const std::optional< std::string > &classname)
Construct a new DetectedFeatures2D object.
Definition: vpDetectorDNNOpenCV.h:139

vpDetectorDNNOpenCV::DetectedFeatures2D::getClassName
std::optional< std::string > getClassName() const
Definition: vpDetectorDNNOpenCV.h:171

vpDetectorDNNOpenCV::DetectedFeatures2D::m_score
double m_score
Definition: vpDetectorDNNOpenCV.h:124

vpDetectorDNNOpenCV::DetectedFeatures2D::getConfidenceScore
double getConfidenceScore() const
Definition: vpDetectorDNNOpenCV.h:163

vpDetectorDNNOpenCV::DetectedFeatures2D::m_classname
std::optional< std::string > m_classname
Definition: vpDetectorDNNOpenCV.h:126

vpDetectorDNNOpenCV::DetectedFeatures2D::m_cls
unsigned int m_cls
Definition: vpDetectorDNNOpenCV.h:125

vpDetectorDNNOpenCV::DetectedFeatures2D::getClassId
unsigned int getClassId() const
Definition: vpDetectorDNNOpenCV.h:167

vpDetectorDNNOpenCV::NetConfig
Structure containing some information required for the configuration of a vpDetectorDNNOpenCV object.
Definition: vpDetectorDNNOpenCV.h:184

vpDetectorDNNOpenCV::NetConfig::NetConfig
NetConfig(const NetConfig &config)
Definition: vpDetectorDNNOpenCV.h:342

vpDetectorDNNOpenCV::NetConfig::to_json
friend void to_json(nlohmann::json &j, const NetConfig &config)
Parse a vpDetectorDNNOpenCV::NetConfig into JSON format.
Definition: vpDetectorDNNOpenCV.h:248

vpDetectorDNNOpenCV::NetConfig::NetConfig
NetConfig()
Default constructor of the structure vpDetectorDNNOpenCV::NetConfig , required for JSON serialization...
Definition: vpDetectorDNNOpenCV.h:325

vpDetectorDNNOpenCV::NetConfig::vpDetectorDNNOpenCV
friend vpDetectorDNNOpenCV
Definition: vpDetectorDNNOpenCV.h:470

vpDetectorDNNOpenCV::NetConfig::operator<<
friend std::ostream & operator<<(std::ostream &os, const NetConfig &config)
Definition: vpDetectorDNNOpenCV.h:447

vpDetectorDNNOpenCV::NetConfig::toString
std::string toString() const
Definition: vpDetectorDNNOpenCV.h:428

vpDetectorDNNOpenCV::NetConfig::from_json
friend void from_json(const nlohmann::json &j, NetConfig &config)
Read the network configuration from JSON. All values are optional and if an argument is not present,...
Definition: vpDetectorDNNOpenCV.h:208

vpDetectorDNNOpenCV::NetConfig::NetConfig
NetConfig(float confThresh, const float &nmsThresh, const std::vector< std::string > &classNames, const cv::Size &dnnInputSize, const double &filterSizeRatio=0., const cv::Scalar &mean=cv::Scalar(127.5, 127.5, 127.5), const double &scaleFactor=2./255., const bool &swapRB=true, const DNNResultsParsingType &parsingType=vpDetectorDNNOpenCV::USER_SPECIFIED, const std::string &modelFilename="", const std::string &configFilename="", const std::string &framework="")
Construct a new Net Config object.
Definition: vpDetectorDNNOpenCV.h:376

vpDetectorDNNOpenCV::NetConfig::operator=
NetConfig & operator=(const NetConfig &config)
Definition: vpDetectorDNNOpenCV.h:453

vpDetectorDNNOpenCV::NetConfig::parseClassNamesFile
static std::vector< std::string > parseClassNamesFile(const std::string &filename)
Parse the file containing the list of classes the DNN can detect. These classes can be written either...
Definition: vpDetectorDNNOpenCV.h:292

vpDetectorDNNOpenCV::NetConfig::NetConfig
NetConfig(const float &confThresh, const float &nmsThresh, const std::string &classNamesFile, const cv::Size &dnnInputSize, const double &filterSizeRatio=0., const cv::Scalar &mean=cv::Scalar(127.5, 127.5, 127.5), const double &scaleFactor=2./255., const bool &swapRB=true, const DNNResultsParsingType &parsingType=vpDetectorDNNOpenCV::USER_SPECIFIED, const std::string &modelFilename="", const std::string &configFilename="", const std::string &framework="")
Construct a new Net Config object.
Definition: vpDetectorDNNOpenCV.h:410

vpDetectorDNNOpenCV
Definition: vpDetectorDNNOpenCV.h:86

vpDetectorDNNOpenCV::from_json
friend void from_json(const nlohmann::json &j, vpDetectorDNNOpenCV &network)
Read the network configuration from JSON. All values are optional and if an argument is not present,...
Definition: vpDetectorDNNOpenCV.h:522

vpDetectorDNNOpenCV::m_blob
cv::Mat m_blob
Buffer for the blob in input net.
Definition: vpDetectorDNNOpenCV.h:581

vpDetectorDNNOpenCV::operator<<
friend std::ostream & operator<<(std::ostream &os, const vpDetectorDNNOpenCV &network)
Definition: vpDetectorDNNOpenCV.h:541

vpDetectorDNNOpenCV::DNNResultsParsingType
DNNResultsParsingType
Enumeration listing the types of DNN for which the vpDetectorDNNOpenCV furnishes the methods permitti...
Definition: vpDetectorDNNOpenCV.h:94

vpDetectorDNNOpenCV::USER_SPECIFIED
@ USER_SPECIFIED
Definition: vpDetectorDNNOpenCV.h:95

vpDetectorDNNOpenCV::m_outNames
std::vector< cv::String > m_outNames
Names of layers with unconnected outputs.
Definition: vpDetectorDNNOpenCV.h:593

vpDetectorDNNOpenCV::to_json
friend void to_json(nlohmann::json &j, const vpDetectorDNNOpenCV &network)
Parse the network configuration into JSON format.
Definition: vpDetectorDNNOpenCV.h:533

vpDetectorDNNOpenCV::getNetConfig
const NetConfig & getNetConfig() const
Definition: vpDetectorDNNOpenCV.h:509

vpDetectorDNNOpenCV::m_img
cv::Mat m_img
Buffer for the input image.
Definition: vpDetectorDNNOpenCV.h:585

vpDetectorDNNOpenCV::m_indices
std::vector< int > m_indices
Indices for NMS.
Definition: vpDetectorDNNOpenCV.h:587

vpDetectorDNNOpenCV::m_netConfig
NetConfig m_netConfig
Configuration of the DNN.
Definition: vpDetectorDNNOpenCV.h:591

vpDetectorDNNOpenCV::m_dnnRes
std::vector< cv::Mat > m_dnnRes
Contains all output blobs for each layer specified in m_outNames.
Definition: vpDetectorDNNOpenCV.h:595

vpDetectorDNNOpenCV::m_net
cv::dnn::Net m_net
DNN network.
Definition: vpDetectorDNNOpenCV.h:589

vpDetectorDNNOpenCV::m_applySizeFilterAfterNMS
bool m_applySizeFilterAfterNMS
If true, filter the detections removing the ones for which the bbox does not respect area(bbox) ∈ [me...
Definition: vpDetectorDNNOpenCV.h:579

vpDetectorDNNOpenCV::dnnResultsParsingTypeToString
static std::string dnnResultsParsingTypeToString(const DNNResultsParsingType &type)
Definition: vpDetectorDNNOpenCV.cpp:71

vpDetectorDNNOpenCV::m_I_color
vpImage< vpRGBa > m_I_color
Buffer for gray to RGBa image conversion.
Definition: vpDetectorDNNOpenCV.h:583

vpDisplay::displayRectangle
static void displayRectangle(const vpImage< unsigned char > &I, const vpImagePoint &topLeft, unsigned int width, unsigned int height, const vpColor &color, bool fill=false, unsigned int thickness=1)
Definition: vpDisplay_uchar.cpp:630

vpDisplay::displayText
static void displayText(const vpImage< unsigned char > &I, const vpImagePoint &ip, const std::string &s, const vpColor &color)
Definition: vpDisplay_uchar.cpp:750

vpException
error that can be emitted by ViSP classes.
Definition: vpException.h:60

vpException::badValue
@ badValue
Used to indicate that a value is not in the allowed range.
Definition: vpException.h:73

vpException::dimensionError
@ dimensionError
Bad dimension.
Definition: vpException.h:71

vpImagePoint
Class that defines a 2D point in an image. This class is useful for image processing and stores only ...
Definition: vpImagePoint.h:82

vpImage
Definition of the vpImage class member functions.
Definition: vpImage.h:131

vpRect
Defines a rectangle in the plane.
Definition: vpRect.h:79

vpRect::getTopRight
vpImagePoint getTopRight() const
Definition: vpRect.h:212

vpDetectorDNNOpenCV::DetectionCandidates
Definition: vpDetectorDNNOpenCV.h:109

vpDetectorDNNOpenCV::DetectionCandidates::m_classIds
std::vector< int > m_classIds
Definition: vpDetectorDNNOpenCV.h:112

vpDetectorDNNOpenCV::DetectionCandidates::m_confidences
std::vector< float > m_confidences
Definition: vpDetectorDNNOpenCV.h:110

vpDetectorDNNOpenCV::DetectionCandidates::m_boxes
std::vector< cv::Rect > m_boxes
Definition: vpDetectorDNNOpenCV.h:111