API
 
trt_engine_syh.hpp
/*
 * SPDX-FileCopyrightText: Copyright (c) 1993-2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
 * SPDX-License-Identifier: Apache-2.0
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

//!
//! trt_engine_syh.hpp
//! This file contains the implementation of the ONNX MNIST sample. It creates the network using
//! the MNIST ONNX model.
//! It can be run with the following command line:
//! Command: ./sample_onnx_mnist [-h or --help] [-d=/path/to/data/dir or --datadir=/path/to/data/dir]
//! [--useDLACore=<int>]
//!

// Define TRT entrypoints used in common code
#define DEFINE_TRT_ENTRYPOINTS 1
#define DEFINE_TRT_LEGACY_PARSER_ENTRYPOINT 0

#include "argsParser.h"
#include "buffers.h"
#include "common.h"
#include "logger.h"
#include "parserOnnxConfig.h"

#include "NvInfer.h"
#include <cuda_runtime_api.h>

#include <cstdlib>
#include <fstream>
#include <iostream>
#include <sstream>
#include <vector>

using namespace nvinfer1;
using samplesCommon::SampleUniquePtr;

const std::string gSampleName = "TensorRT.deep_learning_AO";

//! \brief The TensorRTEngine class implements a generic TensorRT model
//!
//! \details It creates the network using an ONNX model
//!
class TensorRTEngine
{
public:
    TensorRTEngine(const samplesCommon::OnnxSampleParams& params)
        : mParams(params), mRuntime(nullptr), mEngine(nullptr) {}

    //!
    //! \brief Builds the network engine
    //!
    bool build();

    //!
    //! \brief Runs the TensorRT inference engine for this sample
    //!
    bool infer();

private:
    samplesCommon::OnnxSampleParams mParams; //!< The parameters for the sample.

    nvinfer1::Dims mInputDims;  //!< The dimensions of the input to the network.
    nvinfer1::Dims mOutputDims; //!< The dimensions of the output to the network.
    int mNumber{0};             //!< The number to classify.

    std::shared_ptr<nvinfer1::IRuntime> mRuntime;   //!< The TensorRT runtime used to deserialize the engine.
    std::shared_ptr<nvinfer1::ICudaEngine> mEngine; //!< The TensorRT engine used to run the network.

    //!
    //! \brief Parses an ONNX model for MNIST and creates a TensorRT network
    //!
    bool constructNetwork(SampleUniquePtr<nvinfer1::IBuilder>& builder,
        SampleUniquePtr<nvinfer1::INetworkDefinition>& network, SampleUniquePtr<nvinfer1::IBuilderConfig>& config,
        SampleUniquePtr<nvonnxparser::IParser>& parser);

    //!
    //! \brief Reads the input and stores the result in a managed buffer
    //!
    bool processInput(float* fileData, const samplesCommon::BufferManager& buffers);
};
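
// A minimal usage sketch (not part of the original sample): construct the wrapper with
// samplesCommon::OnnxSampleParams, call build() once to parse the ONNX model and create the
// engine, then call infer() for each inference request. main() at the bottom of this file
// follows exactly this order:
//
//     TensorRTEngine engine(initializeSampleParams(args));
//     if (!engine.build() || !engine.infer()) { /* report failure */ }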

//!
//! \brief Creates the network, configures the builder and creates the network engine
//!
//! \details This function creates the ONNX MNIST network by parsing the ONNX model and builds
//! the engine that will be used to run MNIST (mEngine)
//!
//! \return true if the engine was created successfully and false otherwise
//!
bool TensorRTEngine::build()
{
    auto builder = SampleUniquePtr<nvinfer1::IBuilder>(nvinfer1::createInferBuilder(sample::gLogger.getTRTLogger()));
    if (!builder)
    {
        return false;
    }

    auto network = SampleUniquePtr<nvinfer1::INetworkDefinition>(builder->createNetworkV2(0));
    if (!network)
    {
        return false;
    }

    auto config = SampleUniquePtr<nvinfer1::IBuilderConfig>(builder->createBuilderConfig());
    if (!config)
    {
        return false;
    }

    auto parser = SampleUniquePtr<nvonnxparser::IParser>(
        nvonnxparser::createParser(*network, sample::gLogger.getTRTLogger()));
    if (!parser)
    {
        return false;
    }

    auto constructed = constructNetwork(builder, network, config, parser);
    if (!constructed)
    {
        return false;
    }

    // CUDA stream used for profiling by the builder.
    auto profileStream = samplesCommon::makeCudaStream();
    if (!profileStream)
    {
        return false;
    }
    config->setProfileStream(*profileStream);

    SampleUniquePtr<IHostMemory> plan{builder->buildSerializedNetwork(*network, *config)};
    if (!plan)
    {
        return false;
    }

    mRuntime = std::shared_ptr<nvinfer1::IRuntime>(createInferRuntime(sample::gLogger.getTRTLogger()));
    if (!mRuntime)
    {
        return false;
    }

    mEngine = std::shared_ptr<nvinfer1::ICudaEngine>(
        mRuntime->deserializeCudaEngine(plan->data(), plan->size()), samplesCommon::InferDeleter());
    if (!mEngine)
    {
        return false;
    }

    ASSERT(network->getNbInputs() == 1);
    mInputDims = network->getInput(0)->getDimensions();
    ASSERT(mInputDims.nbDims == 4);

    ASSERT(network->getNbOutputs() == 1);
    mOutputDims = network->getOutput(0)->getDimensions();
    ASSERT(mOutputDims.nbDims == 2);

    return true;
}

//!
//! \brief Uses an ONNX parser to create the ONNX MNIST network and marks the
//! output layers
//!
//! \param builder Pointer to the engine builder
//! \param network Pointer to the network that will be populated with the ONNX MNIST network
//! \param config Pointer to the builder configuration
//! \param parser Pointer to the ONNX parser
//!
bool TensorRTEngine::constructNetwork(SampleUniquePtr<nvinfer1::IBuilder>& builder,
    SampleUniquePtr<nvinfer1::INetworkDefinition>& network, SampleUniquePtr<nvinfer1::IBuilderConfig>& config,
    SampleUniquePtr<nvonnxparser::IParser>& parser)
{
    auto parsed = parser->parseFromFile(locateFile(mParams.onnxFileName, mParams.dataDirs).c_str(),
        static_cast<int>(sample::gLogger.getReportableSeverity()));
    if (!parsed)
    {
        return false;
    }

    if (mParams.fp16)
    {
        config->setFlag(BuilderFlag::kFP16);
    }
    if (mParams.bf16)
    {
        config->setFlag(BuilderFlag::kBF16);
    }
    if (mParams.int8)
    {
        config->setFlag(BuilderFlag::kINT8);
        samplesCommon::setAllDynamicRanges(network.get(), 127.0F, 127.0F);
    }

    samplesCommon::enableDLA(builder.get(), config.get(), mParams.dlaCore);

    return true;
}

//!
//! \brief Runs the TensorRT inference engine for this sample
//!
//! \details This function is the main execution function of the sample. It allocates the buffer,
//! sets inputs and executes the engine.
//!
bool TensorRTEngine::infer()
{
    // Create RAII buffer manager object
    samplesCommon::BufferManager buffers(mEngine);

    auto context = SampleUniquePtr<nvinfer1::IExecutionContext>(mEngine->createExecutionContext());
    if (!context)
    {
        return false;
    }

    for (int32_t i = 0, e = mEngine->getNbIOTensors(); i < e; i++)
    {
        auto const name = mEngine->getIOTensorName(i);
        context->setTensorAddress(name, buffers.getDeviceBuffer(name));
    }

    // Read the input data into the managed buffers. This trimmed sample ships no data loader,
    // so a zero-filled placeholder is used; a real application would pass preprocessed image data.
    ASSERT(mParams.inputTensorNames.size() == 1);
    std::vector<float> fileData(mInputDims.d[1] * mInputDims.d[2] * mInputDims.d[3], 0.0F);
    if (!processInput(fileData.data(), buffers))
    {
        return false;
    }

    // Memcpy from host input buffers to device input buffers
    buffers.copyInputToDevice();

    bool status = context->executeV2(buffers.getDeviceBindings().data());
    if (!status)
    {
        return false;
    }

    // Memcpy from device output buffers to host output buffers
    buffers.copyOutputToHost();

    // The output is now available in the host buffers; result verification and
    // post-processing are omitted in this trimmed sample.
    return true;
}

//!
//! \brief Reads the input and stores the result in a managed buffer
//!
bool TensorRTEngine::processInput(float* fileData, const samplesCommon::BufferManager& buffers)
{
    const int inputC = mInputDims.d[1];
    const int inputH = mInputDims.d[2];
    const int inputW = mInputDims.d[3];

    // Copy data into the host-side input buffer
    float* hostDataBuffer = static_cast<float*>(buffers.getHostBuffer(mParams.inputTensorNames[0]));
    for (int i = 0; i < inputC * inputH * inputW; i++)
    {
        hostDataBuffer[i] = fileData[i];
    }

    return true;
}

//!
//! \brief Initializes members of the params struct using the command line args
//!
samplesCommon::OnnxSampleParams initializeSampleParams(const samplesCommon::Args& args)
{
    samplesCommon::OnnxSampleParams params;
    if (args.dataDirs.empty()) // Use default directories if user hasn't provided directory paths
    {
        params.dataDirs.push_back("data/mnist/");
        params.dataDirs.push_back("data/samples/mnist/");
    }
    else // Use the data directory provided by the user
    {
        params.dataDirs = args.dataDirs;
    }
    params.onnxFileName = "mnist.onnx";
    params.inputTensorNames.push_back("Input3");
    params.outputTensorNames.push_back("Plus214_Output_0");
    params.dlaCore = args.useDLACore;
    params.int8 = args.runInInt8;
    params.fp16 = args.runInFp16;
    params.bf16 = args.runInBf16;

    return params;
}


int main(int argc, char** argv)
{
    samplesCommon::Args args;
    if (!samplesCommon::parseArgs(args, argc, argv))
    {
        sample::gLogError << "Invalid arguments" << std::endl;
        return EXIT_FAILURE;
    }

    auto sampleTest = sample::gLogger.defineTest(gSampleName, argc, argv);

    sample::gLogger.reportTestStart(sampleTest);

    TensorRTEngine sample(initializeSampleParams(args));

    sample::gLogInfo << "Building and running a GPU inference engine for Onnx MNIST" << std::endl;

    if (!sample.build())
    {
        return sample::gLogger.reportFail(sampleTest);
    }
    if (!sample.infer())
    {
        return sample::gLogger.reportFail(sampleTest);
    }

    return sample::gLogger.reportPass(sampleTest);
}
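
The zero-filled placeholder input in infer() marks the spot where an application would supply
real, preprocessed data. As a sketch only (it assumes the readPGMFile and locateFile helpers from
the TensorRT samples' common code and the per-digit .pgm files shipped with the MNIST sample
data), the placeholder could be replaced with something along these lines:

    // Load one MNIST digit image and normalize it the way the original
    // sampleOnnxMNIST does, then hand it to processInput().
    const int inputH = mInputDims.d[2];
    const int inputW = mInputDims.d[3];
    std::vector<uint8_t> pgmData(inputH * inputW);
    mNumber = rand() % 10; // pick a digit file such as "3.pgm"
    readPGMFile(locateFile(std::to_string(mNumber) + ".pgm", mParams.dataDirs),
        pgmData.data(), inputH, inputW);

    std::vector<float> fileData(inputH * inputW);
    for (int i = 0; i < inputH * inputW; i++)
    {
        fileData[i] = 1.0F - float(pgmData[i]) / 255.0F; // invert so ink is ~1 and background ~0
    }
    if (!processInput(fileData.data(), buffers))
    {
        return false;
    }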