基于Pytorch的YOLO系列网络改进设计源码资源-CSDN文库

共1013个文件

md：456个

py：299个

pyc：99个

版权申诉

Pytorch

改进设计

Python

Shell

70 浏览量 2024-10-27 00:23:53 上传评论收藏 57.5MB ZIP 举报

资源推荐

资源详情

资源评论

收起资源包目录

基于Pytorch的YOLO系列网络改进设计源码（1013个子文件）

main.cc 10KB

CITATION.cff 612B

setup.cfg 2KB

CNAME 21B

inference.cpp 13KB

inference.cpp 11KB

inference.cpp 6KB

main.cpp 5KB

main.cpp 4KB

main.cpp 2KB

style.css 1KB

Dockerfile 4KB

Dockerfile-arm64 2KB

Dockerfile-conda 2KB

Dockerfile-cpu 3KB

Dockerfile-jetson 2KB

Dockerfile-python 2KB

Dockerfile-runner 2KB

.gitignore 2KB

inference.h 2KB

comments.html 2KB

source-file.html 858B

main.html 439B

favicon.ico 9KB

tutorial.ipynb 35KB

tutorial.ipynb 32KB

object_tracking.ipynb 8KB

object_counting.ipynb 6KB

heatmaps.ipynb 6KB

hub.ipynb 4KB

hub.ipynb 3KB

logo.jpg 165KB

bus.jpg 134KB

zidane.jpg 49KB

extra.js 3KB

LICENSE 34KB

predict.md 47KB

cfg.md 42KB

predict.md 37KB

train.md 28KB

README.zh-CN.md 24KB

model-deployment-options.md 23KB

cfg.md 22KB

yolov8.md 20KB

openvino.md 20KB

quickstart.md 19KB

quickstart.md 18KB

train.md 17KB

yolo-common-issues.md 17KB

train_custom_data.md 17KB

track.md 16KB

roboflow.md 16KB

roboflow.md 15KB

model_export.md 15KB

heatmaps.md 15KB

inference-api.md 15KB

model_export.md 15KB

isolating-segmentation-objects.md 15KB

track.md 15KB

inference_api.md 14KB

pytorch_hub_model_loading.md 14KB

simple-utilities.md 14KB

yolov8.md 13KB

sam.md 13KB

models.md 13KB

yolo-world.md 13KB

kfold-cross-validation.md 12KB

pose.md 12KB

kfold-cross-validation.md 12KB

yolov9.md 12KB

sam.md 12KB

python.md 12KB

architecture_description.md 12KB

object-counting.md 12KB

pose.md 12KB

CI.md 12KB

architecture_description.md 12KB

obb.md 12KB

segment.md 12KB

yolo-performance-metrics.md 11KB

multi_gpu_training.md 11KB

CI.md 11KB

multi_gpu_training.md 11KB

projects.md 11KB

classify.md 11KB

共 1013 条

#include "inference.h" #include <regex> #define benchmark #define min(a,b) (((a) < (b)) ? (a) : (b)) YOLO_V8::YOLO_V8() { } YOLO_V8::~YOLO_V8() { delete session; } #ifdef USE_CUDA namespace Ort { template<> struct TypeToTensorType<half> { static constexpr ONNXTensorElementDataType type = ONNX_TENSOR_ELEMENT_DATA_TYPE_FLOAT16; }; } #endif template<typename T> char* BlobFromImage(cv::Mat& iImg, T& iBlob) { int channels = iImg.channels(); int imgHeight = iImg.rows; int imgWidth = iImg.cols; for (int c = 0; c < channels; c++) { for (int h = 0; h < imgHeight; h++) { for (int w = 0; w < imgWidth; w++) { iBlob[c * imgWidth * imgHeight + h * imgWidth + w] = typename std::remove_pointer<T>::type( (iImg.at<cv::Vec3b>(h, w)[c]) / 255.0f); } } } return RET_OK; } char* YOLO_V8::PreProcess(cv::Mat& iImg, std::vector<int> iImgSize, cv::Mat& oImg) { if (iImg.channels() == 3) { oImg = iImg.clone(); cv::cvtColor(oImg, oImg, cv::COLOR_BGR2RGB); } else { cv::cvtColor(iImg, oImg, cv::COLOR_GRAY2RGB); } switch (modelType) { case YOLO_DETECT_V8: case YOLO_POSE: case YOLO_DETECT_V8_HALF: case YOLO_POSE_V8_HALF://LetterBox { if (iImg.cols >= iImg.rows) { resizeScales = iImg.cols / (float)iImgSize.at(0); cv::resize(oImg, oImg, cv::Size(iImgSize.at(0), int(iImg.rows / resizeScales))); } else { resizeScales = iImg.rows / (float)iImgSize.at(0); cv::resize(oImg, oImg, cv::Size(int(iImg.cols / resizeScales), iImgSize.at(1))); } cv::Mat tempImg = cv::Mat::zeros(iImgSize.at(0), iImgSize.at(1), CV_8UC3); oImg.copyTo(tempImg(cv::Rect(0, 0, oImg.cols, oImg.rows))); oImg = tempImg; break; } case YOLO_CLS://CenterCrop { int h = iImg.rows; int w = iImg.cols; int m = min(h, w); int top = (h - m) / 2; int left = (w - m) / 2; cv::resize(oImg(cv::Rect(left, top, m, m)), oImg, cv::Size(iImgSize.at(0), iImgSize.at(1))); break; } } return RET_OK; } char* YOLO_V8::CreateSession(DL_INIT_PARAM& iParams) { char* Ret = RET_OK; std::regex pattern("[\u4e00-\u9fa5]"); bool result = std::regex_search(iParams.modelPath, pattern); if (result) { Ret = "[YOLO_V8]:Your model path is error.Change your model path without chinese characters."; std::cout << Ret << std::endl; return Ret; } try { rectConfidenceThreshold = iParams.rectConfidenceThreshold; iouThreshold = iParams.iouThreshold; imgSize = iParams.imgSize; modelType = iParams.modelType; env = Ort::Env(ORT_LOGGING_LEVEL_WARNING, "Yolo"); Ort::SessionOptions sessionOption; if (iParams.cudaEnable) { cudaEnable = iParams.cudaEnable; OrtCUDAProviderOptions cudaOption; cudaOption.device_id = 0; sessionOption.AppendExecutionProvider_CUDA(cudaOption); } sessionOption.SetGraphOptimizationLevel(GraphOptimizationLevel::ORT_ENABLE_ALL); sessionOption.SetIntraOpNumThreads(iParams.intraOpNumThreads); sessionOption.SetLogSeverityLevel(iParams.logSeverityLevel); #ifdef _WIN32 int ModelPathSize = MultiByteToWideChar(CP_UTF8, 0, iParams.modelPath.c_str(), static_cast<int>(iParams.modelPath.length()), nullptr, 0); wchar_t* wide_cstr = new wchar_t[ModelPathSize + 1]; MultiByteToWideChar(CP_UTF8, 0, iParams.modelPath.c_str(), static_cast<int>(iParams.modelPath.length()), wide_cstr, ModelPathSize); wide_cstr[ModelPathSize] = L'\0'; const wchar_t* modelPath = wide_cstr; #else const char* modelPath = iParams.modelPath.c_str(); #endif // _WIN32 session = new Ort::Session(env, modelPath, sessionOption); Ort::AllocatorWithDefaultOptions allocator; size_t inputNodesNum = session->GetInputCount(); for (size_t i = 0; i < inputNodesNum; i++) { Ort::AllocatedStringPtr input_node_name = session->GetInputNameAllocated(i, allocator); char* temp_buf = new char[50]; strcpy(temp_buf, input_node_name.get()); inputNodeNames.push_back(temp_buf); } size_t OutputNodesNum = session->GetOutputCount(); for (size_t i = 0; i < OutputNodesNum; i++) { Ort::AllocatedStringPtr output_node_name = session->GetOutputNameAllocated(i, allocator); char* temp_buf = new char[10]; strcpy(temp_buf, output_node_name.get()); outputNodeNames.push_back(temp_buf); } options = Ort::RunOptions{ nullptr }; WarmUpSession(); return RET_OK; } catch (const std::exception& e) { const char* str1 = "[YOLO_V8]:"; const char* str2 = e.what(); std::string result = std::string(str1) + std::string(str2); char* merged = new char[result.length() + 1]; std::strcpy(merged, result.c_str()); std::cout << merged << std::endl; delete[] merged; return "[YOLO_V8]:Create session failed."; } } char* YOLO_V8::RunSession(cv::Mat& iImg, std::vector<DL_RESULT>& oResult) { #ifdef benchmark clock_t starttime_1 = clock(); #endif // benchmark char* Ret = RET_OK; cv::Mat processedImg; PreProcess(iImg, imgSize, processedImg); if (modelType < 4) { float* blob = new float[processedImg.total() * 3]; BlobFromImage(processedImg, blob); std::vector<int64_t> inputNodeDims = { 1, 3, imgSize.at(0), imgSize.at(1) }; TensorProcess(starttime_1, iImg, blob, inputNodeDims, oResult); } else { #ifdef USE_CUDA half* blob = new half[processedImg.total() * 3]; BlobFromImage(processedImg, blob); std::vector<int64_t> inputNodeDims = { 1,3,imgSize.at(0),imgSize.at(1) }; TensorProcess(starttime_1, iImg, blob, inputNodeDims, oResult); #endif } return Ret; } template<typename N> char* YOLO_V8::TensorProcess(clock_t& starttime_1, cv::Mat& iImg, N& blob, std::vector<int64_t>& inputNodeDims, std::vector<DL_RESULT>& oResult) { Ort::Value inputTensor = Ort::Value::CreateTensor<typename std::remove_pointer<N>::type>( Ort::MemoryInfo::CreateCpu(OrtDeviceAllocator, OrtMemTypeCPU), blob, 3 * imgSize.at(0) * imgSize.at(1), inputNodeDims.data(), inputNodeDims.size()); #ifdef benchmark clock_t starttime_2 = clock(); #endif // benchmark auto outputTensor = session->Run(options, inputNodeNames.data(), &inputTensor, 1, outputNodeNames.data(), outputNodeNames.size()); #ifdef benchmark clock_t starttime_3 = clock(); #endif // benchmark Ort::TypeInfo typeInfo = outputTensor.front().GetTypeInfo(); auto tensor_info = typeInfo.GetTensorTypeAndShapeInfo(); std::vector<int64_t> outputNodeDims = tensor_info.GetShape(); auto output = outputTensor.front().GetTensorMutableData<typename std::remove_pointer<N>::type>(); delete[] blob; switch (modelType) { case YOLO_DETECT_V8: case YOLO_DETECT_V8_HALF: { int strideNum = outputNodeDims[1];//8400 int signalResultNum = outputNodeDims[2];//84 std::vector<int> class_ids; std::vector<float> confidences; std::vector<cv::Rect> boxes; cv::Mat rawData; if (modelType == YOLO_DETECT_V8) { // FP32 rawData = cv::Mat(strideNum, signalResultNum, CV_32F, output); } else { // FP16 rawData = cv::Mat(strideNum, signalResultNum, CV_16F, output); rawData.convertTo(rawData, CV_32F); } //Note: //ultralytics add transpose operator to the output of yolov8 model.whi

评论收藏

内容反馈

版权申诉