Lane-and-Object-Detection/_object_detector_8cpp_source.html

#include <cfloat>

#include <cstdint>

#include <format>

#include <string>

#include <vector>


#include <opencv2/core.hpp>

#include <opencv2/core/mat.hpp>

#include <opencv2/core/types.hpp>

#include <opencv2/dnn/dnn.hpp>


#include "helpers/Globals.hpp"


#include "detectors/ObjectDetector.hpp"


namespace LaneAndObjectDetection

{


    ObjectDetector::ObjectDetector() :

        m_blobSize(0),

        m_skipObjectDetection(false)

    {}


    /**
     * @brief Set the properties of the ObjectDetector object.
     *
     * The network is loaded and configured on a local object and is only committed to the member variables once every
     * step has succeeded. If loading the model fails or an unsupported option is given, the detector keeps its previous
     * configuration instead of being left with detection enabled but no usable network.
     *
     * @param p_yoloFolderPath The folder containing the YOLOv7 `.cfg` and `.weights` files. The file names are appended
     * directly to this string so it must end with a path separator.
     * @param p_objectDetectorTypes The type of object detector to use. `NONE` disables object detection and releases
     * any previously loaded network.
     * @param p_objectDetectorBackEnds The backend and target the network should prefer. `NONE` leaves the OpenCV
     * defaults untouched.
     * @param p_objectDetectorBlobSizes The blob size whose underlying value is used as both the width and height of the
     * network input blob.
     * @throws Globals::Exceptions::NotImplementedError If the detector type or the backend is not one of the handled
     * values.
     */
    void ObjectDetector::SetProperties(const std::string& p_yoloFolderPath,
                                       const Globals::ObjectDetectorTypes& p_objectDetectorTypes,
                                       const Globals::ObjectDetectorBackEnds& p_objectDetectorBackEnds,
                                       const Globals::ObjectDetectorBlobSizes& p_objectDetectorBlobSizes)
    {
        // Work on locals so that an exception thrown below cannot leave the members half-updated
        cv::dnn::Net net;
        bool skipObjectDetection = false;

        switch (p_objectDetectorTypes)
        {
        case Globals::ObjectDetectorTypes::NONE:
            skipObjectDetection = true;
            break;

        case Globals::ObjectDetectorTypes::STANDARD:
            net = cv::dnn::readNetFromDarknet(p_yoloFolderPath + "yolov7.cfg", p_yoloFolderPath + "yolov7.weights");
            break;

        case Globals::ObjectDetectorTypes::TINY:
            net = cv::dnn::readNetFromDarknet(p_yoloFolderPath + "yolov7-tiny.cfg", p_yoloFolderPath + "yolov7-tiny.weights");
            break;

        default:
            throw Globals::Exceptions::NotImplementedError();
        }

        switch (p_objectDetectorBackEnds)
        {
        case Globals::ObjectDetectorBackEnds::NONE:
            break;

        case Globals::ObjectDetectorBackEnds::CPU:
            net.setPreferableBackend(cv::dnn::DNN_BACKEND_OPENCV);
            net.setPreferableTarget(cv::dnn::DNN_TARGET_CPU);
            break;

        case Globals::ObjectDetectorBackEnds::GPU:
            net.setPreferableBackend(cv::dnn::DNN_BACKEND_OPENCV);
            net.setPreferableTarget(cv::dnn::DNN_TARGET_OPENCL);
            break;

        case Globals::ObjectDetectorBackEnds::CUDA:
            net.setPreferableBackend(cv::dnn::DNN_BACKEND_CUDA);
            net.setPreferableTarget(cv::dnn::DNN_TARGET_CUDA);
            break;

        default:
            throw Globals::Exceptions::NotImplementedError();
        }

        const auto unconnectedOutputLayerNames = net.getUnconnectedOutLayersNames();

        // Everything succeeded so commit the new configuration in one go
        m_net = net;
        m_skipObjectDetection = skipObjectDetection;
        m_blobSize = static_cast<int32_t>(p_objectDetectorBlobSizes);
        m_unconnectedOutputLayerNames = unconnectedOutputLayerNames;

        // Detections produced with the previous configuration are no longer valid
        m_objectDetectionInformation.m_objectInformation.clear();
    }


    /**
     * @brief Run the object detector against p_frame.
     *
     * The frame is converted to a blob, passed through the network and every output row whose best class score exceeds
     * `Globals::G_OBJECT_DETECTOR_CONFIDENCE_THRESHOLD` becomes a candidate. Candidates whose centre lies at or below
     * `Globals::G_ROI_BOTTOM_HEIGHT` are dropped, and the remainder are reduced with non-maxima suppression. The
     * survivors replace the contents of the stored ObjectDetectionInformation.
     *
     * Nothing is done when object detection is being skipped. When p_frame is empty the stored detections are cleared
     * and no inference is attempted.
     *
     * @param p_frame The frame to run the object detector against. Bounding boxes are scaled using
     * `Globals::G_VIDEO_INPUT_WIDTH` and `Globals::G_VIDEO_INPUT_HEIGHT` rather than the dimensions of p_frame.
     */
    void ObjectDetector::RunObjectDetector(const cv::Mat& p_frame)
    {
        if (m_skipObjectDetection)
        {
            return;
        }

        // Detections from the previous frame must never carry over to this one
        m_objectDetectionInformation.m_objectInformation.clear();

        // An empty frame cannot be turned into a network input blob, so report no detections instead of letting OpenCV raise
        if (p_frame.empty())
        {
            return;
        }

        // Get output blobs from the frame
        std::vector<cv::Mat> outputBlobs;
        const cv::Mat BLOB_FROM_IMAGE = cv::dnn::blobFromImage(p_frame, Globals::G_OBJECT_DETECTOR_SCALE_FACTOR, cv::Size(m_blobSize, m_blobSize), Globals::G_COLOUR_BLACK);
        m_net.setInput(BLOB_FROM_IMAGE);
        m_net.forward(outputBlobs, m_unconnectedOutputLayerNames);

        // Go through all output blobs and only allow those with confidence above threshold. The three vectors are kept in
        // lock-step so that an index returned by non-maxima suppression addresses the same candidate in each of them.
        std::vector<std::string> initialObjectNames;
        std::vector<cv::Rect> initialObjectBoundingBoxes;
        std::vector<float> initialObjectConfidences;

        for (const cv::Mat& outputBlob : outputBlobs)
        {
            for (int32_t rowIndex = 0; rowIndex < outputBlob.rows; rowIndex++)
            {
                // Each row is structured as the following [cx, cy, w, h, box score, object 1 score, object 2 score, ..., object n score]

                // minMaxLoc returns the object index that has the maximum confidence as well as the maximum confidence.
                // Only the class score columns are searched so the x coordinate of the location is the object index.
                cv::Point maxConfidenceObjectIndex;
                double maxConfidence = -DBL_MAX;
                cv::minMaxLoc(outputBlob.row(rowIndex).colRange(Globals::G_OBJECT_DETECTOR_OUTPUT_BLOBS_OBJECT_SCORES_START_INDEX, outputBlob.cols), nullptr, &maxConfidence, nullptr, &maxConfidenceObjectIndex);

                if (maxConfidence > Globals::G_OBJECT_DETECTOR_CONFIDENCE_THRESHOLD)
                {
                    // The box values read from the row are multiplied by the input video dimensions to get pixel values
                    const double CENTER_X = outputBlob.at<float>(rowIndex, Globals::G_OBJECT_DETECTOR_OUTPUT_BLOBS_CENTER_X_COORD_INDEX) * Globals::G_VIDEO_INPUT_WIDTH;
                    const double CENTER_Y = outputBlob.at<float>(rowIndex, Globals::G_OBJECT_DETECTOR_OUTPUT_BLOBS_CENTER_Y_COORD_INDEX) * Globals::G_VIDEO_INPUT_HEIGHT;
                    const double WIDTH = (outputBlob.at<float>(rowIndex, Globals::G_OBJECT_DETECTOR_OUTPUT_BLOBS_WIDTH_INDEX) * Globals::G_VIDEO_INPUT_WIDTH) + Globals::G_OBJECT_DETECTOR_BOUNDING_BOX_BUFFER;
                    const double HEIGHT = (outputBlob.at<float>(rowIndex, Globals::G_OBJECT_DETECTOR_OUTPUT_BLOBS_HEIGHT_INDEX) * Globals::G_VIDEO_INPUT_HEIGHT) + Globals::G_OBJECT_DETECTOR_BOUNDING_BOX_BUFFER;

                    // Remove object detections on the hood of car
                    if (CENTER_Y < Globals::G_ROI_BOTTOM_HEIGHT)
                    {
                        initialObjectNames.push_back(Globals::G_OBJECT_DETECTOR_OBJECT_NAMES.at(maxConfidenceObjectIndex.x));
                        // Convert from centre/size to the top-left/size representation used by cv::Rect
                        initialObjectBoundingBoxes.emplace_back(CENTER_X - (WIDTH / Globals::G_DIVIDE_BY_TWO), CENTER_Y - (HEIGHT / Globals::G_DIVIDE_BY_TWO), WIDTH, HEIGHT);
                        initialObjectConfidences.push_back(static_cast<float>(maxConfidence));
                    }
                }
            }
        }

        // Apply non-maxima suppression to suppress overlapping bounding boxes for objects that overlap, the highest confidence object will be chosen.
        // The candidates were already filtered against the confidence threshold above so no additional score threshold is applied here.
        std::vector<int> nonMaximaSuppressedFilteredIndices;
        cv::dnn::NMSBoxes(initialObjectBoundingBoxes, initialObjectConfidences, 0.0F, static_cast<float>(Globals::G_OBJECT_DETECTOR_NMS_THRESHOLD), nonMaximaSuppressedFilteredIndices);

        for (const int32_t& index : nonMaximaSuppressedFilteredIndices)
        {
            const std::string& objectName = initialObjectNames.at(index);
            const auto CONFIDENCE_PERCENTAGE = static_cast<uint32_t>(initialObjectConfidences.at(index) * Globals::G_CONVERT_DECIMAL_TO_PERCENTAGE);

            m_objectDetectionInformation.m_objectInformation.push_back({.m_boundingBox = initialObjectBoundingBoxes.at(index),
                                                                        .m_boundingBoxColour = Globals::G_OBJECT_DETECTOR_OBJECT_NAMES_AND_COLOURS.at(objectName),
                                                                        .m_objectName = std::format("{} ({} %)", objectName, CONFIDENCE_PERCENTAGE)});
        }
    }


    /**
     * @brief Get the ObjectDetectionInformation struct.
     *
     * The struct is filled by `RunObjectDetector()` and its object list is cleared by `SetProperties()`.
     *
     * @return ObjectDetectionInformation A copy of the stored object detection information.
     */
    ObjectDetectionInformation ObjectDetector::GetInformation()

    {

        return m_objectDetectionInformation;

    }


}

LaneAndObjectDetection::Globals::Exceptions::NotImplementedError
Used for functionality that has not been implemented.
Definition Globals.hpp:32

LaneAndObjectDetection::ObjectDetector::m_objectDetectionInformation
ObjectDetectionInformation m_objectDetectionInformation
The ObjectDetectionInformation struct containing all object detection-related information.
Definition ObjectDetector.hpp:71

LaneAndObjectDetection::ObjectDetector::m_net
cv::dnn::Net m_net
OpenCV object which allows the use of pre-trained neural networks.
Definition ObjectDetector.hpp:66

LaneAndObjectDetection::ObjectDetector::m_unconnectedOutputLayerNames
std::vector< std::string > m_unconnectedOutputLayerNames
The names of layers with unconnected outputs.
Definition ObjectDetector.hpp:76

LaneAndObjectDetection::ObjectDetector::SetProperties
void SetProperties(const std::string &p_yoloFolderPath, const Globals::ObjectDetectorTypes &p_objectDetectorTypes, const Globals::ObjectDetectorBackEnds &p_objectDetectorBackEnds, const Globals::ObjectDetectorBlobSizes &p_objectDetectorBlobSizes)
Set the properties of the ObjectDetector object.
Definition ObjectDetector.cpp:23

LaneAndObjectDetection::ObjectDetector::m_blobSize
int32_t m_blobSize
The spatial size for the output image used by the cv::dnn::blobFromImage function.
Definition ObjectDetector.hpp:81

LaneAndObjectDetection::ObjectDetector::ObjectDetector
ObjectDetector()
Construct a new ObjectDetector object.
Definition ObjectDetector.cpp:18

LaneAndObjectDetection::ObjectDetector::RunObjectDetector
void RunObjectDetector(const cv::Mat &p_frame)
Run the object detector against p_frame.
Definition ObjectDetector.cpp:78

LaneAndObjectDetection::ObjectDetector::m_skipObjectDetection
bool m_skipObjectDetection
Whether to skip object detection.
Definition ObjectDetector.hpp:86

LaneAndObjectDetection::ObjectDetector::GetInformation
ObjectDetectionInformation GetInformation()
Get the ObjectDetectionInformation struct.
Definition ObjectDetector.cpp:140

LaneAndObjectDetection::Globals::G_COLOUR_BLACK
static const cv::Scalar G_COLOUR_BLACK
OpenCV Colours (in BGR format).
Definition Globals.hpp:145

LaneAndObjectDetection::Globals::G_OBJECT_DETECTOR_OUTPUT_BLOBS_CENTER_Y_COORD_INDEX
static const int32_t G_OBJECT_DETECTOR_OUTPUT_BLOBS_CENTER_Y_COORD_INDEX
The indices representing various values in the output blobs.
Definition Globals.hpp:505

LaneAndObjectDetection::Globals::G_OBJECT_DETECTOR_BOUNDING_BOX_BUFFER
static const uint32_t G_OBJECT_DETECTOR_BOUNDING_BOX_BUFFER
Object detection bounding box properties.
Definition Globals.hpp:492

LaneAndObjectDetection::Globals::G_VIDEO_INPUT_HEIGHT
static const uint32_t G_VIDEO_INPUT_HEIGHT
Input video dimensions.
Definition Globals.hpp:103

LaneAndObjectDetection::Globals::G_VIDEO_INPUT_WIDTH
static const uint32_t G_VIDEO_INPUT_WIDTH
Input video dimensions.
Definition Globals.hpp:104

LaneAndObjectDetection::Globals::G_OBJECT_DETECTOR_CONFIDENCE_THRESHOLD
static const double G_OBJECT_DETECTOR_CONFIDENCE_THRESHOLD
Object detection threshold and properties.
Definition Globals.hpp:484

LaneAndObjectDetection::Globals::G_OBJECT_DETECTOR_NMS_THRESHOLD
static const double G_OBJECT_DETECTOR_NMS_THRESHOLD
Object detection threshold and properties.
Definition Globals.hpp:485

LaneAndObjectDetection::Globals::G_DIVIDE_BY_TWO
static const double G_DIVIDE_BY_TWO
Divide by two.
Definition Globals.hpp:176

LaneAndObjectDetection::Globals::G_OBJECT_DETECTOR_OUTPUT_BLOBS_HEIGHT_INDEX
static const int32_t G_OBJECT_DETECTOR_OUTPUT_BLOBS_HEIGHT_INDEX
The indices representing various values in the output blobs.
Definition Globals.hpp:507

LaneAndObjectDetection::Globals::G_OBJECT_DETECTOR_OBJECT_NAMES
static const std::array< std::string, G_OBJECT_DETECTOR_NUMBER_OF_DETECTABLE_OBJECTS > G_OBJECT_DETECTOR_OBJECT_NAMES
Names of detectable objects. The order is significant and should not be changed.
Definition Globals.hpp:516

LaneAndObjectDetection::Globals::G_ROI_BOTTOM_HEIGHT
static const int32_t G_ROI_BOTTOM_HEIGHT
Region-of-interest dimensions.
Definition Globals.hpp:267

LaneAndObjectDetection::Globals::ObjectDetectorTypes
ObjectDetectorTypes
The type of object detector to use with an option to disable object detection. The tiny version is mo...
Definition Globals.hpp:446

LaneAndObjectDetection::Globals::G_OBJECT_DETECTOR_OUTPUT_BLOBS_OBJECT_SCORES_START_INDEX
static const int32_t G_OBJECT_DETECTOR_OUTPUT_BLOBS_OBJECT_SCORES_START_INDEX
The indices representing various values in the output blobs.
Definition Globals.hpp:508

LaneAndObjectDetection::Globals::ObjectDetectorBackEnds
ObjectDetectorBackEnds
The supported backends for the object detector to run on. In theory, GPU should be significantly more...
Definition Globals.hpp:458

LaneAndObjectDetection::Globals::G_OBJECT_DETECTOR_OUTPUT_BLOBS_CENTER_X_COORD_INDEX
static const int32_t G_OBJECT_DETECTOR_OUTPUT_BLOBS_CENTER_X_COORD_INDEX
The indices representing various values in the output blobs.
Definition Globals.hpp:504

LaneAndObjectDetection::Globals::G_OBJECT_DETECTOR_OBJECT_NAMES_AND_COLOURS
static const std::map< std::string, cv::Scalar > G_OBJECT_DETECTOR_OBJECT_NAMES_AND_COLOURS
Object names and bounding box colours. G_OPENCV_WHITE is used as the default colour while custom colo...
Definition Globals.hpp:604

LaneAndObjectDetection::Globals::G_OBJECT_DETECTOR_SCALE_FACTOR
static const double G_OBJECT_DETECTOR_SCALE_FACTOR
Object detection threshold and properties.
Definition Globals.hpp:483

LaneAndObjectDetection::Globals::G_OBJECT_DETECTOR_OUTPUT_BLOBS_WIDTH_INDEX
static const int32_t G_OBJECT_DETECTOR_OUTPUT_BLOBS_WIDTH_INDEX
The indices representing various values in the output blobs.
Definition Globals.hpp:506

LaneAndObjectDetection::Globals::ObjectDetectorBlobSizes
ObjectDetectorBlobSizes
The supported blob sizes for the object detector to run with. The larger the blob size the more perfo...
Definition Globals.hpp:470

LaneAndObjectDetection::Globals::G_CONVERT_DECIMAL_TO_PERCENTAGE
static const uint32_t G_CONVERT_DECIMAL_TO_PERCENTAGE
Convert a decimal value to a percentage.
Definition Globals.hpp:171

LaneAndObjectDetection
Contains all Lane-and-Object-Detection objects.

LaneAndObjectDetection::ObjectDetectionInformation
The information needed by FrameBuilder to update frame with object detection information.
Definition Information.hpp:19