When using TensorRT for accelerated inference, the model must first be converted from ONNX format to TensorRT format. The following is the C++ conversion code and the corresponding build file.
Operating system: Ubuntu 20.04
C++ code:
#include <iostream>
#include <memory>
#include <fstream>
#include <cassert>
#include "NvInfer.h"
#include "NvOnnxParser.h"
#include "sampleUtils.h" // for samplesCommon::makeCudaStream (TensorRT samples/common; adjust if your samples version places it elsewhere)

class Logger : public nvinfer1::ILogger
{
    void log(Severity severity, const char* msg) noexcept override
    {
        // suppress info-level messages
        if (severity <= Severity::kWARNING)
            std::cout << msg << std::endl;
    }
} logger;

int main(int argc, char** argv)
{
    if (argc != 2)
    {
        std::cerr << "usage: ./build [onnx_file_path]" << std::endl;
        return -1;
    }
    // Get the onnx file path
    char* onnx_file_path = argv[1];

    // ============= 1. Create builder =============
    auto builder = std::unique_ptr<nvinfer1::IBuilder>(nvinfer1::createInferBuilder(logger));
    if (!builder)
    {
        std::cerr << "Failed to create builder" << std::endl;
        return -1;
    }

    // ============= 2. Create network =============
    const auto explicitBatch = 1U << static_cast<uint32_t>(nvinfer1::NetworkDefinitionCreationFlag::kEXPLICIT_BATCH);
    auto network = std::unique_ptr<nvinfer1::INetworkDefinition>(builder->createNetworkV2(explicitBatch));
    if (!network)
    {
        std::cout << "Failed to create network" << std::endl;
        return -1;
    }

    // ============= 3. Create onnxparser for parsing the onnx file =============
    auto parser = std::unique_ptr<nvonnxparser::IParser>(nvonnxparser::createParser(*network, logger));
    // Call onnxparser's parseFromFile method to parse the onnx file
    auto parsed = parser->parseFromFile(onnx_file_path, static_cast<int>(nvinfer1::ILogger::Severity::kWARNING));
    if (!parsed)
    {
        std::cout << "Failed to parse onnx file" << std::endl;
        return -1;
    }

    // Configure network parameters
    auto input = network->getInput(0);
    auto profile = builder->createOptimizationProfile();
    profile->setDimensions(input->getName(), nvinfer1::OptProfileSelector::kMIN, nvinfer1::Dims4{1, 3, 960, 960}); // Set the minimum size
    profile->setDimensions(input->getName(), nvinfer1::OptProfileSelector::kOPT, nvinfer1::Dims4{1, 3, 960, 960}); // Set the optimal size
    profile->setDimensions(input->getName(), nvinfer1::OptProfileSelector::kMAX, nvinfer1::Dims4{1, 3, 960, 960}); // Set the maximum size

    // ============= 4. Create config =============
    auto config = std::unique_ptr<nvinfer1::IBuilderConfig>(builder->createBuilderConfig());
    if (!config)
    {
        std::cout << "Failed to create config" << std::endl;
        return -1;
    }
    config->addOptimizationProfile(profile);
    // Set the precision to FP16; INT8 would additionally require a calibrator
    config->setFlag(nvinfer1::BuilderFlag::kFP16);
    // Set the maximum batch size (deprecated and has no effect for explicit-batch networks)
    builder->setMaxBatchSize(1);
    // Set the maximum workspace size
    config->setMemoryPoolLimit(nvinfer1::MemoryPoolType::kWORKSPACE, 1 << 30);
    // Create a CUDA stream for profiling
    auto profileStream = samplesCommon::makeCudaStream();
    if (!profileStream)
    {
        return -1;
    }
    config->setProfileStream(*profileStream);

    // ============= 5. Build the engine =============
    auto plan = std::unique_ptr<nvinfer1::IHostMemory>(builder->buildSerializedNetwork(*network, *config));
    if (!plan)
    {
        std::cout << "Failed to create engine" << std::endl;
        return -1;
    }

    // ============= 6. Serialize and save the engine =============
    std::ofstream engine_file("./", std::ios::binary); // output engine path (the file name is left for you to fill in)
    assert(engine_file.is_open() && "Failed to open engine file");
    engine_file.write((char*)plan->data(), plan->size());
    engine_file.close();

    std::cout << "Engine build success!" << std::endl;
    return 0;
}
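As the comment in the config section notes, building an INT8 engine requires a calibrator in addition to setting the precision flag. A minimal hedged sketch of the extra config calls, assuming a calibrator object implementing nvinfer1::IInt8EntropyCalibrator2 already exists (writing one is not covered in this article):

// Hedged sketch: what the config above would additionally need for INT8.
// "calibrator" is a hypothetical object implementing nvinfer1::IInt8EntropyCalibrator2.
config->setFlag(nvinfer1::BuilderFlag::kINT8);
config->setInt8Calibrator(&calibrator);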
CMakeLists.txt:
cmake_minimum_required(VERSION 3.10)
project(TensorRT_Test LANGUAGES CXX CUDA)

set(CMAKE_CUDA_STANDARD 14)
set(CMAKE_CXX_STANDARD 14)

# Add header file paths for CUDA and TensorRT
include_directories(/usr/local/cuda-11.8/include)
include_directories(/xxx/tensorRT/TensorRT-8.6.1.6/include)
include_directories(/xxx/tensorRT/TensorRT-8.6.1.6/samples/common/)

# Add library file paths
link_directories(/usr/local/cuda-11.8/lib64)
link_directories(/xxx/tensorRT/TensorRT-8.6.1.6/lib)

# The source file name is left for you to fill in (the .cpp file containing the code above)
add_executable(build )

target_link_libraries(build nvinfer nvonnxparser cudart)
Notice:
The CUDA and TensorRT header and library paths need to be changed to match your own installation.
How to use:
Taking YOLOv8 as an example: after configuring and building the project with CMake, an executable named build is generated. Run the following command and wait for the engine file to be written:
./build <onnx_path>
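After the engine file has been written, you can quickly check that it deserializes correctly before wiring it into your inference code. The following is a minimal sketch, assuming the engine was saved as ./model.engine (a hypothetical name; the output path in the code above is left for you to fill in):

#include <fstream>
#include <iostream>
#include <iterator>
#include <memory>
#include <vector>
#include "NvInfer.h"

// Reuse a logger like the one defined in the build code above.
class Logger : public nvinfer1::ILogger
{
    void log(Severity severity, const char* msg) noexcept override
    {
        if (severity <= Severity::kWARNING)
            std::cout << msg << std::endl;
    }
} logger;

int main()
{
    // Read the serialized engine back from disk ("./model.engine" is a hypothetical path).
    std::ifstream engine_file("./model.engine", std::ios::binary);
    if (!engine_file)
    {
        std::cerr << "Failed to open engine file" << std::endl;
        return -1;
    }
    std::vector<char> engine_data((std::istreambuf_iterator<char>(engine_file)), std::istreambuf_iterator<char>());

    // Deserialize the plan into an ICudaEngine.
    auto runtime = std::unique_ptr<nvinfer1::IRuntime>(nvinfer1::createInferRuntime(logger));
    auto engine = std::unique_ptr<nvinfer1::ICudaEngine>(
        runtime->deserializeCudaEngine(engine_data.data(), engine_data.size()));
    if (!engine)
    {
        std::cerr << "Failed to deserialize engine" << std::endl;
        return -1;
    }
    std::cout << "Engine loaded, number of IO tensors: " << engine->getNbIOTensors() << std::endl;
    return 0;
}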
This concludes the article on using C++ to convert a YOLOv8 model from ONNX format to TensorRT format. For more related content on converting YOLOv8 ONNX to TensorRT, please search my previous articles or continue browsing the related articles below. I hope you will continue to support me!