Autonomy_Software/TorchObjectDetection_8hpp_source.html

#ifndef TORCH_OBJECT_DETECTION_HPP

#define TORCH_OBJECT_DETECTION_HPP


#include "../../util/vision/ObjectDetectionUtility.hpp"
#include "../../util/vision/YOLOModel.hpp"

#include <chrono>
#include <memory>
#include <string>
#include <utility>
#include <vector>


namespace torchobject

{


    /**
     * @brief Runs the given PyTorch YOLO interpreter on a frame and repackages every
     *      detection it returns as an objectdetectutils::Object.
     *
     * @param cvFrame - The image to run inference on. It must be non-empty and have exactly 3 channels.
     * @param trPyTorchDetector - The interpreter used for inference. It is only used when
     *      IsReadyForInference() returns true.
     * @param fMinObjectConfidence - Minimum confidence threshold, forwarded unchanged to Inference().
     * @param fNMSThreshold - Non-max-suppression threshold, forwarded unchanged to Inference().
     * @return std::vector<objectdetectutils::Object> - One Object per detection returned by the
     *      interpreter. Empty when the frame is rejected (an error is logged) or when the
     *      interpreter is not ready (a warning is logged).
     */
    inline std::vector<objectdetectutils::Object> Detect(const cv::Mat& cvFrame,
                                                         yolomodel::pytorch::PyTorchInterpreter& trPyTorchDetector,
                                                         const float fMinObjectConfidence = 0.40f,
                                                         const float fNMSThreshold        = 0.60f)
    {
        // Reject frames that hold no pixel data or that do not have exactly three channels.
        // The empty() check keeps a zero-sized frame with a 3-channel header away from the interpreter.
        if (cvFrame.empty() || cvFrame.channels() != 3)
        {
            // Submit logger message.
            LOG_ERROR(logging::g_qSharedLogger, "Detect() requires a RGB image.");
            return {};
        }

        // Container for the repackaged detections.
        std::vector<objectdetectutils::Object> vDetectedObjects;

        // Nothing can be detected unless the interpreter reports that it is ready for inference.
        if (!trPyTorchDetector.IsReadyForInference())
        {
            // Submit logger message.
            LOG_WARNING(logging::g_qSharedLogger,
                        "TorchDetect: Unable to detect tags using YOLO torch detection because hardware is not opened or model is not initialized.");
            return vDetectedObjects;
        }

        // Run inference on the YOLO model with the current image.
        const std::vector<yolomodel::Detection> vModelDetections = trPyTorchDetector.Inference(cvFrame, fMinObjectConfidence, fNMSThreshold);

        // The final size is known up front, so allocate once instead of growing inside the loop.
        vDetectedObjects.reserve(vModelDetections.size());

        // Repackage each model detection into the shared Object representation.
        for (const yolomodel::Detection& stDetection : vModelDetections)
        {
            objectdetectutils::Object stObject;
            stObject.dConfidence       = stDetection.fConfidence;
            stObject.pBoundingBox      = std::make_shared<cv::Rect2d>(stDetection.cvBoundingBox);
            stObject.szClassName       = stDetection.szClassName;
            stObject.eDetectionMethod  = objectdetectutils::ObjectDetectionMethod::eTorch;
            stObject.cvImageResolution = cvFrame.size();

            // Move rather than copy: the local is not used again after this point.
            vDetectedObjects.emplace_back(std::move(stObject));
        }

        // Return the detected objects.
        return vDetectedObjects;
    }


    /**
     * @brief Draws every Torch detection in the given list onto the given image: a white
     *      bounding box plus a white-backed label placed directly below the box.
     *
     * The label text is "<class name> <confidence>%", where the confidence is
     * dConfidence * 100 truncated to an integer.
     *
     * @param cvDetectionsFrame - The image to draw on. It must be non-empty and have 1 or 3
     *      channels, otherwise an error is logged and nothing is drawn.
     * @param vDetectedTags - The detections to draw. Entries whose eDetectionMethod is not
     *      eTorch, or whose pBoundingBox is null, are skipped.
     */
    inline void DrawDetections(cv::Mat& cvDetectionsFrame, const std::vector<objectdetectutils::Object>& vDetectedTags)
    {
        // Check if the given frame is a non-empty 1 or 3 channel image. (not BGRA)
        const bool bDrawableFrame = !cvDetectionsFrame.empty() && (cvDetectionsFrame.channels() == 1 || cvDetectionsFrame.channels() == 3);
        if (!bDrawableFrame)
        {
            // Submit logger message.
            LOG_ERROR(logging::g_qSharedLogger,
                      "TorchDetect: Unable to draw markers on image because it is empty or because it has {} channels. (Should be 1 or 3)",
                      cvDetectionsFrame.channels());
            return;
        }

        // Measure and render the label with the same font settings so that the
        // background rectangle actually matches the text drawn on top of it.
        const int nLabelFontFace    = cv::FONT_HERSHEY_SIMPLEX;
        const double dLabelScale    = 0.5;
        const int nLabelThickness   = 1;
        const int nBoxThickness     = 2;
        const cv::Scalar cvBoxColor(255, 255, 255);
        const cv::Scalar cvTextColor(0, 0, 0);

        // Loop through each detection.
        for (const objectdetectutils::Object& stTag : vDetectedTags)
        {
            // Only detections produced by the Torch detector are drawn here.
            if (stTag.eDetectionMethod != objectdetectutils::ObjectDetectionMethod::eTorch)
            {
                continue;
            }

            // A detection without a bounding box cannot be drawn; dereferencing a null pointer would be undefined behavior.
            if (stTag.pBoundingBox == nullptr)
            {
                continue;
            }
            const cv::Rect2d& cvBox = *stTag.pBoundingBox;

            // Draw bounding box onto image.
            cv::rectangle(cvDetectionsFrame, cvBox, cvBoxColor, nBoxThickness);

            // Build the label and measure it using the font settings it will be drawn with.
            const std::string szLabel  = stTag.szClassName + " " + std::to_string(static_cast<int>(stTag.dConfidence * 100)) + "%";
            const cv::Size cvLabelSize = cv::getTextSize(szLabel, nLabelFontFace, dLabelScale, nLabelThickness, nullptr);

            // The label background hangs directly below the bottom-left corner of the bounding box.
            const cv::Point2d cvLabelTopLeft(cvBox.x, cvBox.y + cvBox.height);
            const cv::Point2d cvLabelBottomRight(cvBox.x + cvLabelSize.width, cvBox.y + (cvBox.height + cvLabelSize.height));

            // Draw label background box onto image.
            cv::rectangle(cvDetectionsFrame, cvLabelTopLeft, cvLabelBottomRight, cvBoxColor, cv::FILLED);

            // Draw label text onto image; putText anchors the text at its bottom-left corner.
            const cv::Point2d cvTextOrigin(cvBox.x, cvBox.y + (cvBox.height + cvLabelSize.height));
            cv::putText(cvDetectionsFrame, szLabel, cvTextOrigin, nLabelFontFace, dLabelScale, cvTextColor, nLabelThickness);
        }
    }


}    // namespace torchobject


#endif

cv::Mat

cv::Mat::size
MatSize size

cv::Mat::channels
int channels() const

cv::Mat::empty
bool empty() const

Point_< double >

Scalar_< double >

cv::Size_

cv::Size_::height
_Tp height

cv::Size_::width
_Tp width

yolomodel::pytorch::PyTorchInterpreter
This class is designed to enable quick, easy, and robust inferencing of .pt yolo model.
Definition YOLOModel.hpp:710

yolomodel::pytorch::PyTorchInterpreter::IsReadyForInference
bool IsReadyForInference() const
Check if the model is ready for inference.
Definition YOLOModel.hpp:946

yolomodel::pytorch::PyTorchInterpreter::Inference
std::vector< Detection > Inference(const cv::Mat &cvInputFrame, const float fMinObjectConfidence=0.85, const float fNMSThreshold=0.6)
Given an input image forward the image through the YOLO model to run inference on the PyTorch model,...
Definition YOLOModel.hpp:859

cv::rectangle
void rectangle(InputOutputArray img, Point pt1, Point pt2, const Scalar &color, int thickness=1, int lineType=LINE_8, int shift=0)

cv::getTextSize
Size getTextSize(const String &text, int fontFace, double fontScale, int thickness, int *baseLine)

cv::putText
void putText(InputOutputArray img, const String &text, Point org, int fontFace, double fontScale, Scalar color, int thickness=1, int lineType=LINE_8, bool bottomLeftOrigin=false)

cv::FONT_HERSHEY_SIMPLEX
FONT_HERSHEY_SIMPLEX

cv::FILLED
FILLED

torchobject
Namespace containing functions related to torch object detections operations on images using PyTorch.
Definition TorchObjectDetection.hpp:32

torchobject::DrawDetections
void DrawDetections(cv::Mat &cvDetectionsFrame, const std::vector< objectdetectutils::Object > &vDetectedTags)
Given a vector of objectdetectutils::Object structs draw each tag corner and confidence onto the give...
Definition TorchObjectDetection.hpp:102

torchobject::Detect
std::vector< objectdetectutils::Object > Detect(const cv::Mat &cvFrame, yolomodel::pytorch::PyTorchInterpreter &trPyTorchDetector, const float fMinObjectConfidence=0.40f, const float fNMSThreshold=0.60f)
Detects objects in the given image using a PyTorch model.
Definition TorchObjectDetection.hpp:45

objectdetectutils::Object
Represents a single detected object. Combines attributes from TorchObject and TensorflowObject struct...
Definition ObjectDetectionUtility.hpp:74

yolomodel::Detection
This struct is used to hold a single detection returned by a YOLO model (class name, confidence, and bounding box).
Definition YOLOModel.hpp:45