c++调用onnx模型

#include <algorithm>
#include <array>
#include <exception>
#include <filesystem>
#include <fstream>
#include <iostream>
#include <string>
#include <vector>

#include <onnxruntime_cxx_api.h>
#include <opencv2/opencv.hpp>
using namespace cv;
using namespace std;


int main(int argc, char** argv)
{
    //step-1:set filepath and modelpath
    cv::Mat frame = cv::imread("F:/Yolov11-onnx_cpp-main/1.jpg");
    std::string onnxpath = "E:/ultralytics-main/ultralytics-main/runs/train/exp9/weights/best.onnx";

    //step2:load labels
    std::vector<std::string> labels;
    std::ifstream inputFile("E:/classes.names");
    if (inputFile.is_open())
    {
        std::string classLine;
        while (std::getline(inputFile, classLine))
            labels.push_back(classLine);
        inputFile.close();
    }

    //step-3:load onnx model
    int ih = frame.rows;
    int iw = frame.cols;

    std::wstring modelPath = std::wstring(onnxpath.begin(), onnxpath.end());
    Ort::SessionOptions session_options;
    Ort::Env env = Ort::Env(ORT_LOGGING_LEVEL_ERROR, "yolov11-onnx");

    session_options.SetGraphOptimizationLevel(ORT_ENABLE_BASIC);
    //std::cout << "onnxruntime inference try to use GPU Device" << std::endl;
    OrtSessionOptionsAppendExecutionProvider_CUDA(session_options, 0);
    Ort::Session session_(env, modelPath.c_str(), session_options);

    std::vector<std::string> input_node_names;
    std::vector<std::string> output_node_names;

    size_t numInputNodes = session_.GetInputCount();
    size_t numOutputNodes = session_.GetOutputCount();
    Ort::AllocatorWithDefaultOptions allocator;
    input_node_names.reserve(numInputNodes);

    int input_w = 0;
    int input_h = 0;
    for (int i = 0; i < numInputNodes; i++) {
        //onnx newest version-1.14
        auto input_name = session_.GetInputNameAllocated(i, allocator);
        input_node_names.push_back(input_name.get());

        //onnx old version-1.8
        //input_node_names.push_back(session_.GetInputName(i, allocator));

        Ort::TypeInfo input_type_info = session_.GetInputTypeInfo(i);
        auto input_tensor_info = input_type_info.GetTensorTypeAndShapeInfo();
        auto input_dims = input_tensor_info.GetShape();
        input_w = input_dims[3];
        input_h = input_dims[2];
        std::cout << "input format: NxCxHxW = " << input_dims[0] << "x" << input_dims[1] << "x" << input_dims[2] << "x" << input_dims[3] << std::endl;
    }

    //step-4:get output parameter
    int output_h = 0;
    int output_w = 0;
    Ort::TypeInfo output_type_info = session_.GetOutputTypeInfo(0);
    auto output_tensor_info = output_type_info.GetTensorTypeAndShapeInfo();
    auto output_dims = output_tensor_info.GetShape();
    output_h = output_dims[1];
    output_w = output_dims[2];
    std::cout << "output format : HxW = " << output_dims[1] << "x" << output_dims[2] << std::endl;
    for (int i = 0; i < numOutputNodes; i++)
    {
        //onnx newest version-1.14
        auto out_name = session_.GetOutputNameAllocated(i, allocator);
        output_node_names.push_back(out_name.get());

        //onnx old version-1.8
        //output_node_names.push_back(session_.GetOutputName(i, allocator));
    }
    std::cout << "input: " << input_node_names[0] << " output: " << output_node_names[0] << std::endl;

    //step-5:get infer result
    int64 start = cv::getTickCount();
    int w = frame.cols;
    int h = frame.rows;
    int _max = std::max(h, w);
    cv::Mat image = cv::Mat::zeros(cv::Size(_max, _max), CV_8UC3);
    cv::Rect roi(0, 0, w, h);
    frame.copyTo(image(roi));

    // fix bug, boxes consistence!
    float x_factor = image.cols / static_cast<float>(input_w);
    float y_factor = image.rows / static_cast<float>(input_h);

    cv::Mat blob = cv::dnn::blobFromImage(image, 1 / 255.0, cv::Size(input_w, input_h), cv::Scalar(0, 0, 0), true, false);
    size_t tpixels = input_h * input_w * 3;
    std::array<int64_t, 4> input_shape_info{ 1, 3, input_h, input_w };

    // set input data and inference
    auto allocator_info = Ort::MemoryInfo::CreateCpu(OrtDeviceAllocator, OrtMemTypeCPU);
    Ort::Value input_tensor_ = Ort::Value::CreateTensor<float>(allocator_info, blob.ptr<float>(), tpixels, input_shape_info.data(), input_shape_info.size());
    const std::array<const char*, 1> inputNames = { input_node_names[0].c_str() };
    const std::array<const char*, 1> outNames = { output_node_names[0].c_str() };
    std::vector<Ort::Value> ort_outputs;
    try {
        ort_outputs = session_.Run(Ort::RunOptions{ nullptr }, inputNames.data(), &input_tensor_, 1, outNames.data(), outNames.size());
    }
    catch (std::exception e) {
        std::cout << e.what() << std::endl;
    }

    // output data
    const float* pdata = ort_outputs[0].GetTensorMutableData<float>();
    cv::Mat dout(output_h, output_w, CV_32F, (float*)pdata);
    cv::Mat det_output = dout.t(); // 8400x84

    // post-process
    std::vector<cv::Rect> boxes;
    std::vector<int> classIds;
    std::vector<float> confidences;
    int returnValue = 0;
    for (int i = 0; i < det_output.rows; i++) {
        cv::Mat classes_scores = det_output.row(i).colRange(4, 9);
        cv::Point classIdPoint;
        double score;
        minMaxLoc(classes_scores, 0, &score, 0, &classIdPoint);

        //between 0～1
        if (score > 0.25)
        {
            float cx = det_output.at<float>(i, 0);
            float cy = det_output.at<float>(i, 1);
            float ow = det_output.at<float>(i, 2);
            float oh = det_output.at<float>(i, 3);
            int x = static_cast<int>((cx - 0.5 * ow) * x_factor);
            int y = static_cast<int>((cy - 0.5 * oh) * y_factor);
            int width = static_cast<int>(ow * x_factor);
            int height = static_cast<int>(oh * y_factor);
            cv::Rect box;
            box.x = x;
            box.y = y;
            box.width = width;
            box.height = height;

            // 获取类别ID
            int classId = classIdPoint.x;

            // 根据类别ID设置返回值
            if (classId == 0 || classId == 1) {  // 假设类别0为目标类别
                returnValue = 1; // 设置为1
            }
            else {
                returnValue = 0; // 默认值
            }

            boxes.push_back(box);
            classIds.push_back(classIdPoint.x);
            confidences.push_back(score);
        }
    }
    std::cout << "Detection Result: " << returnValue << std::endl;
    // NMS
    std::vector<int> indexes;
    cv::dnn::NMSBoxes(boxes, confidences, 0.25, 0.45, indexes);
    for (size_t i = 0; i < indexes.size(); i++) {
        int index = indexes[i];
        int idx = classIds[index];
        cv::rectangle(frame, boxes[index], cv::Scalar(0, 0, 255), 2, 8);
        cv::rectangle(frame, cv::Point(boxes[index].tl().x, boxes[index].tl().y - 20),
            cv::Point(boxes[index].br().x, boxes[index].tl().y), cv::Scalar(0, 255, 255), -1);

        std::string classString = labels[idx] + ' ' + std::to_string(confidences[idx]).substr(0, 4);
        putText(frame, classString, cv::Point(boxes[index].tl().x, boxes[index].tl().y), cv::FONT_HERSHEY_PLAIN, 2.0, cv::Scalar(255, 0, 0), 2, 8);
        cv::imshow("YOLOv11 onnxrunning", frame);
    }

    //calculate FPS render it
    float t = (cv::getTickCount() - start) / static_cast<float>(cv::getTickFrequency());
    putText(frame, cv::format("FPS: %.2f", 1.0 / t), cv::Point(20, 40), cv::FONT_HERSHEY_PLAIN, 2.0, cv::Scalar(255, 0, 0), 2, 8);
    cv::imshow("YOLOv11 onnxrunning", frame);
    cv::imwrite("result.jpg", frame);
    cv::waitKey(0);

    session_options.release();
    session_.release();
    return 0;
}

上述代码是我使用的c++调用onnx模型的代码，在我使用cpu时代码可以正常运行。但是当我使用gpu运行时它产生了错误：The requested API version [18] is not available, only API versions [1, 17] are supported in this build. Current ORT Version is: 1.17.1
我使用的是 onnxruntime-gpu 1.20.1 版本，OpenCV 是 4.5 版本，CUDA 是 11.8.x，cuDNN 是 8.x。上述问题应该怎么解决？

写回答
好问题 0 提建议
关注问题
分享
邀请回答
编辑收藏删除结题
收藏举报

1条回答默认最新

关注

码龄粉丝数原力等级 --

被采纳

被点赞

采纳率
恐怖如斯恐怖如斯啊 2024-11-23 20:03
关注
以下回复参考：皆我百晓生、券券喵儿等免费微信小程序作答:

从错误信息来看，程序在编译时使用的头文件请求的是 API 版本 18，而运行时实际加载的 ONNX Runtime 动态库是 1.17.1，只支持到 API 版本 17；也就是说，实际被加载的库并不是你以为的 1.20.1。这个问题也可能与 ONNX Runtime 版本和你的 CUDA 或 cuDNN 版本不兼容有关。下面是一些可能的解决方案：

更新 ONNX Runtime 版本：确保你使用的是与 CUDA 和 cuDNN 兼容的 ONNX Runtime 版本。有时，最新版本的 ONNX Runtime 可能包含对新的 CUDA 和 cuDNN 版本的兼容性更新。你可以尝试下载并使用一个更新的版本，确保它与你的 CUDA 和 cuDNN 版本兼容。
检查 CUDA 和 cuDNN 版本：确认你的 CUDA 和 cuDNN 版本是否与你的 ONNX Runtime 版本兼容。有时候，某些版本的 CUDA 或 cuDNN 可能与某些版本的 ONNX Runtime 不完全兼容。你可以查看 ONNX Runtime 的官方文档，找到推荐的 CUDA 和 cuDNN 版本。
重新编译 ONNX Runtime：如果你有条件的话，可以尝试重新编译 ONNX Runtime，确保它是针对你的 CUDA 和 cuDNN 版本优化的。在编译时，确保你设置了正确的 CUDA 和 cuDNN 路径，并使用了正确的版本标志。
使用更低版本的 API：如果你的代码使用了某些新的 API 功能，而这些功能在你的当前构建版本中不可用，你可以尝试修改代码以使用较低版本的 API 功能。这可能意味着你需要修改你的代码中的一些调用或参数设置。

基于你提供的错误信息，我建议首先尝试更新 ONNX Runtime 到一个更新的版本，并确保它与你的 CUDA 和 cuDNN 版本兼容。如果问题仍然存在，你可以考虑重新编译 ONNX Runtime 或使用更低版本的 API。
解决无用
评论打赏
分享
举报

评论

按下Enter换行，Ctrl+Enter发表内容

报告相同问题？

关注问题

基于c++的onnxruntime gpu加速onnx模型推理
2025-05-08 16:06

通过C++调用ONNXRuntime，开发者可以享受到GPU带来的强大性能优势，这对于需要实时处理的场景（如摄像头图像捕捉和识别）尤为重要。具体实现步骤包括准备一个已经训练好的ONNX模型文件，然后通过C++代码加载这个...
人工智能混合编程实践：C++调用Python ONNX进行异常检测推理
2025-03-12 15:33

FriendshipT的博客 C++、Python、ONNX、人工智能、异常检测
基于paddleocr+onnxruntime实现车牌识别C++源码+模型.zip
2024-05-09 14:43

- 推理引擎初始化：在C++代码中，我们需要创建一个ONNXRuntime会话实例，加载转换后的ONNX模型。 - 图像处理：将预处理后的图像数据输入到ONNXRuntime进行推理，得到文字框的位置和识别出的文字。 - 后处理：根据...
基于onnxruntime+opencv部署yolov8的onnx模型支持检测分割旋转框C++源码+使用说明.zip
2024-05-21 07:23

C++是本项目的主要编程语言，它是一种通用且高效的语言，适合处理计算密集型的任务，如深度学习模型的推理。C++的源码设计使项目可移植性强，能够适应多种平台。 7. **软件/插件开发** 提到的“软件/插件”标签...
人工智能混合编程实践：C++调用Python ONNX进行YOLOv8推理
2025-03-11 20:37

FriendshipT的博客 C++、Python、ONNX、人工智能、目标检测
Pytorch导出onnx模型并在C++环境中调用（含python和C++工程）
2025-01-12 21:58

怡步晓心l的博客以表格数据为例-含数据集和PyCharm工程中简单介绍了在python中使用pytorch搭建神经网络模型的步骤和代码工程，此处介绍AI模型的跨平台调用问题，即使用跨平台的ONNX框架，在C++代码中进行模型调用。在机器学习多层...
在C＃中使用可移植的ONNX AI模型
2021-04-08 16:06

而ONNX运行时是执行这些模型的库，它提供了API，让开发者能够在各种语言（如C++、C#、Java等）中加载和运行ONNX模型。首先，让我们详细了解一下ONNX运行时。ONNX运行时是一个轻量级、高性能的库，支持模型的解析、...
C++使用纯opencv部署yolov11-cls图像分类onnx模型源码.7z
2024-10-07 06:59

此外，本项目的文件名称为“yolov11-cls-opencv-cplus”，暗示了本项目的编程语言选择为C++，以及项目与OpenCV和ONNX技术栈的紧密关联。本项目提供了一个实用的案例，展示了如何在C++环境中利用OpenCV库部署和运行...
人工智能混合编程实践：C++调用封装好的DLL进行YOLO26推理
2026-03-13 11:46

在本项目中，我们讨论的是如何利用C++调用预先封装好的DLL（动态链接库）来执行YOLOv26模型的推理任务。YOLO（You Only Look Once）是一种流行的实时对象检测系统，其模型可以准确地识别和定位图像中的对象。项目...
onnx 编程领域 dll动态库
2025-11-03 10:49

开发者在实现时会通过各种编程语言提供的接口调用DLL库中的函数。例如，在C++中，可以使用LoadLibrary和GetProcAddress函数加载和使用DLL中的函数。而在.NET环境中，开发者可以使用P/Invoke（平台调用）功能调用非...
没有解决我的问题, 去提问

问题事件

关注

码龄粉丝数原力等级 --

被采纳

被点赞

采纳率
创建了问题 11月23日

c++调用onnx模型

1条回答 默认 最新

问题事件

1条回答默认最新