Skip to content

Commit

Permalink
Merge pull request #450 from Nuzhny007/master
Browse files Browse the repository at this point in the history
Add YOLOv10 TensorRT detector
  • Loading branch information
Nuzhny007 authored Jun 9, 2024
2 parents 2cd0a37 + b649f2d commit 7ba7d8a
Show file tree
Hide file tree
Showing 9 changed files with 106 additions and 8 deletions.
2 changes: 2 additions & 0 deletions README.md
Original file line number Diff line number Diff line change
Expand Up @@ -3,6 +3,8 @@

# Last changes

* YOLOv10 detector worked with TensorRT! Export pretrained Pytorch models [here (THU-MIG/yolov10)](https://github.com/THU-MIG/yolov10) to onnx format and run Multitarget-tracker with -e=6 example

* YOLOv9 detector worked with TensorRT! Export pretrained Pytorch models [here (WongKinYiu/yolov9)](https://github.com/WongKinYiu/yolov9) to onnx format and run Multitarget-tracker with -e=6 example

* YOLOv8 instance segmentation models worked with TensorRT! Export pretrained Pytorch models [here (ultralytics/ultralytics)](https://github.com/ultralytics/ultralytics) to onnx format and run Multitarget-tracker with -e=6 example
Expand Down
3 changes: 2 additions & 1 deletion example/examples.h
Original file line number Diff line number Diff line change
Expand Up @@ -650,7 +650,8 @@ class YoloTensorRTExample final : public VideoExample
YOLOv7Mask,
YOLOv8,
YOLOv8Mask,
YOLOv9
YOLOv9,
YOLOv10
};
YOLOModels usedModel = YOLOModels::YOLOv9;
switch (usedModel)
Expand Down
5 changes: 3 additions & 2 deletions src/Detector/OCVDNNDetector.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -140,6 +140,7 @@ bool OCVDNNDetector::Init(const config_t& config)
dictNetType["YOLOV8"] = ModelType::YOLOV8;
dictNetType["YOLOV8Mask"] = ModelType::YOLOV8Mask;
dictNetType["YOLOV9"] = ModelType::YOLOV9;
dictNetType["YOLOV10"] = ModelType::YOLOV10;

auto netType = dictNetType.find(net_type->second);
if (netType != dictNetType.end())
Expand Down Expand Up @@ -346,7 +347,7 @@ void OCVDNNDetector::DetectInCrop(const cv::UMat& colorFrame, const cv::Rect& cr
}
else
{
if (m_netType == ModelType::YOLOV8 || m_netType == ModelType::YOLOV5 || m_netType == ModelType::YOLOV9)
if (m_netType == ModelType::YOLOV8 || m_netType == ModelType::YOLOV5 || m_netType == ModelType::YOLOV9 || m_netType == ModelType::YOLOV10)
{
int rows = detections[0].size[1];
int dimensions = detections[0].size[2];
Expand All @@ -368,7 +369,7 @@ void OCVDNNDetector::DetectInCrop(const cv::UMat& colorFrame, const cv::Rect& cr

for (int i = 0; i < rows; ++i)
{
if (m_netType == ModelType::YOLOV8 || m_netType == ModelType::YOLOV9)
if (m_netType == ModelType::YOLOV8 || m_netType == ModelType::YOLOV9 || m_netType == ModelType::YOLOV10)
{
float* classes_scores = data + 4;

Expand Down
3 changes: 2 additions & 1 deletion src/Detector/OCVDNNDetector.h
Original file line number Diff line number Diff line change
Expand Up @@ -40,7 +40,8 @@ class OCVDNNDetector final : public BaseDetector
YOLOV7Mask,
YOLOV8,
YOLOV8Mask,
YOLOV9
YOLOV9,
YOLOV10
};

cv::dnn::Net m_net;
Expand Down
1 change: 1 addition & 0 deletions src/Detector/YoloTensorRTDetector.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -103,6 +103,7 @@ bool YoloTensorRTDetector::Init(const config_t& config)
dictNetType["YOLOV8"] = tensor_rt::YOLOV8;
dictNetType["YOLOV8Mask"] = tensor_rt::YOLOV8Mask;
dictNetType["YOLOV9"] = tensor_rt::YOLOV9;
dictNetType["YOLOV10"] = tensor_rt::YOLOV10;

auto netType = dictNetType.find(net_type->second);
if (netType != dictNetType.end())
Expand Down
85 changes: 85 additions & 0 deletions src/Detector/tensorrt_yolo/YoloONNXv10_bb.hpp
Original file line number Diff line number Diff line change
@@ -0,0 +1,85 @@
#pragma once

#include "YoloONNX.hpp"

///
/// \brief The YOLOv10_bb_onnx class
///
class YOLOv10_bb_onnx : public YoloONNX
{
protected:
///
/// \brief GetResult
/// \param output
/// \return
///
std::vector<tensor_rt::Result> YoloONNX::GetResult(size_t imgIdx, int /*keep_topk*/, const std::vector<float*>& outputs, cv::Size frameSize)
{
std::vector<tensor_rt::Result> resBoxes;

//0: name: images, size: 1x3x640x640
//1: name: output0, size: 1x300x6

const float fw = static_cast<float>(frameSize.width) / static_cast<float>(m_inputDims.d[3]);
const float fh = static_cast<float>(frameSize.height) / static_cast<float>(m_inputDims.d[2]);

auto output = outputs[0];

size_t ncInd = 2;
size_t lenInd = 1;
size_t len = static_cast<size_t>(m_outpuDims[0].d[lenInd]) / m_params.explicitBatchSize;
//auto Volume = [](const nvinfer1::Dims& d)
//{
// return std::accumulate(d.d, d.d + d.nbDims, 1, std::multiplies<int>());
//};
auto volume = len * m_outpuDims[0].d[ncInd]; // Volume(m_outpuDims[0]);
output += volume * imgIdx;
//std::cout << "len = " << len << ", nc = " << nc << ", m_params.confThreshold = " << m_params.confThreshold << ", volume = " << volume << std::endl;

std::vector<int> classIds;
std::vector<float> confidences;
std::vector<cv::Rect> rectBoxes;
classIds.reserve(len);
confidences.reserve(len);
rectBoxes.reserve(len);

for (size_t i = 0; i < len; ++i)
{
// Box
size_t k = i * 6;

//if (i == 0)
// std::cout << i << ": " << output[k + 0] << " " << output[k + 1] << " " << output[k + 2] << " " << output[k + 3] << " " << output[k + 4] << " " << output[k + 5] << std::endl;

float x = fw * output[k + 0];
float y = fh * output[k + 1];
float width = fw * (output[k + 2] - output[k + 0]);
float height = fh * (output[k + 3] - output[k + 1]);
float objectConf = output[k + 4];
int classId = cvRound(output[k + 5]);
//if (i == 0)
// std::cout << i << ": object_conf = " << objectConf << ", classId = " << classId << ", rect = " << cv::Rect(cvRound(x), cvRound(y), cvRound(width), cvRound(height)) << std::endl;

if (objectConf >= m_params.confThreshold)
{
classIds.push_back(classId);
confidences.push_back(objectConf);

// (center x, center y, width, height) to (x, y, w, h)
rectBoxes.emplace_back(cvRound(x), cvRound(y), cvRound(width), cvRound(height));
}
}

// Non-maximum suppression to eliminate redudant overlapping boxes
std::vector<int> indices;
cv::dnn::NMSBoxes(rectBoxes, confidences, m_params.confThreshold, m_params.nmsThreshold, indices);
resBoxes.reserve(indices.size());

for (size_t bi = 0; bi < indices.size(); ++bi)
{
resBoxes.emplace_back(classIds[indices[bi]], confidences[indices[bi]], rectBoxes[indices[bi]]);
}

return resBoxes;
}
};
8 changes: 7 additions & 1 deletion src/Detector/tensorrt_yolo/class_detector.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,7 @@
#include "YoloONNXv8_bb.hpp"
#include "YoloONNXv8_instance.hpp"
#include "YoloONNXv9_bb.hpp"
#include "YoloONNXv10_bb.hpp"

namespace tensor_rt
{
Expand Down Expand Up @@ -98,6 +99,11 @@ namespace tensor_rt
m_params.outputTensorNames.push_back("output0");
m_detector = std::make_unique<YOLOv9_bb_onnx>();
break;
case ModelType::YOLOV10:
m_params.inputTensorNames.push_back("images");
m_params.outputTensorNames.push_back("output0");
m_detector = std::make_unique<YOLOv10_bb_onnx>();
break;
}

// Threshold values
Expand Down Expand Up @@ -181,7 +187,7 @@ namespace tensor_rt
if (config.net_type == ModelType::YOLOV6 ||
config.net_type == ModelType::YOLOV7 || config.net_type == ModelType::YOLOV7Mask ||
config.net_type == ModelType::YOLOV8 || config.net_type == ModelType::YOLOV8Mask ||
config.net_type == ModelType::YOLOV9)
config.net_type == ModelType::YOLOV9 || config.net_type == ModelType::YOLOV10)
m_impl = new YoloONNXImpl();
else
m_impl = new YoloDectectorImpl();
Expand Down
3 changes: 2 additions & 1 deletion src/Detector/tensorrt_yolo/class_detector.h
Original file line number Diff line number Diff line change
Expand Up @@ -52,7 +52,8 @@ namespace tensor_rt
YOLOV7Mask,
YOLOV8,
YOLOV8Mask,
YOLOV9
YOLOV9,
YOLOV10
};

///
Expand Down
4 changes: 2 additions & 2 deletions src/Detector/tensorrt_yolo/ds_image.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -50,7 +50,7 @@ DsImage::DsImage(const cv::Mat& mat_image_, tensor_rt::ModelType net_type, const
if (tensor_rt::ModelType::YOLOV5 == net_type || tensor_rt::ModelType::YOLOV6 == net_type ||
tensor_rt::ModelType::YOLOV7 == net_type || tensor_rt::ModelType::YOLOV7Mask == net_type ||
tensor_rt::ModelType::YOLOV8 == net_type || tensor_rt::ModelType::YOLOV8Mask == net_type ||
tensor_rt::ModelType::YOLOV9 == net_type)
tensor_rt::ModelType::YOLOV9 == net_type || tensor_rt::ModelType::YOLOV10 == net_type)
{
// resize the DsImage with scale
float r = std::min(static_cast<float>(inputH) / static_cast<float>(m_Height), static_cast<float>(inputW) / static_cast<float>(m_Width));
Expand Down Expand Up @@ -101,7 +101,7 @@ DsImage::DsImage(const std::string& path, tensor_rt::ModelType net_type, const i
if (tensor_rt::ModelType::YOLOV5 == net_type || tensor_rt::ModelType::YOLOV6 == net_type ||
tensor_rt::ModelType::YOLOV7 == net_type || tensor_rt::ModelType::YOLOV7Mask == net_type ||
tensor_rt::ModelType::YOLOV8 == net_type || tensor_rt::ModelType::YOLOV8Mask == net_type ||
tensor_rt::ModelType::YOLOV9 == net_type)
tensor_rt::ModelType::YOLOV9 == net_type || tensor_rt::ModelType::YOLOV10 == net_type)
{
// resize the DsImage with scale
float dim = std::max(m_Height, m_Width);
Expand Down

0 comments on commit 7ba7d8a

Please sign in to comment.