TensorRT for RTX 1.3.0
NvOnnxParser.h
Go to the documentation of this file.
1/*
2 * SPDX-FileCopyrightText: Copyright (c) 1993-2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
3 * SPDX-License-Identifier: Apache-2.0
4 *
5 * Licensed under the Apache License, Version 2.0 (the "License");
6 * you may not use this file except in compliance with the License.
7 * You may obtain a copy of the License at
8 *
9 * http://www.apache.org/licenses/LICENSE-2.0
10 *
11 * Unless required by applicable law or agreed to in writing, software
12 * distributed under the License is distributed on an "AS IS" BASIS,
13 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14 * See the License for the specific language governing permissions and
15 * limitations under the License.
16 */
17
18#ifndef NV_ONNX_PARSER_H
19#define NV_ONNX_PARSER_H
20
21#include "NvInfer.h"
22#include <stddef.h>
23#include <string>
24#include <vector>
25
31
//! \name ONNX parser version number components (major.minor.patch).
//! @{
#define NV_ONNX_PARSER_MAJOR 0
#define NV_ONNX_PARSER_MINOR 1
#define NV_ONNX_PARSER_PATCH 0
//! @}
35
36static constexpr int32_t NV_ONNX_PARSER_VERSION
38
//!
//! \brief The data structure containing the parsing capability of a set of nodes
//! in an ONNX graph: a list of node identifiers (presumably node indices -- confirm
//! against getSubgraphNodes()) paired with whether that set of nodes is supported.
//!
using SubGraph_t = std::pair<std::vector<size_t>, bool>;

//!
//! \brief The data structure containing all SubGraph_t partitioned out of an ONNX graph.
//!
using SubGraphCollection_t = std::vector<SubGraph_t>;
54
60namespace nvonnxparser
61{
62
//!
//! \brief Declaration of a helper that returns the maximum valid value of a parser
//! enum type; specialized below for each enum (ErrorCode, OnnxParserFlag).
//!
template <typename T>
constexpr inline int32_t EnumMax() noexcept;
65
71enum class ErrorCode : int
72{
73 kSUCCESS = 0,
74 kINTERNAL_ERROR = 1,
79 kINVALID_NODE = 6,
87 kREFIT_FAILED = 14
88};
89
95template <>
96constexpr inline int32_t EnumMax<ErrorCode>() noexcept
97{
98 return 14;
99}
100
//!
//! \brief Represents one or more OnnxParserFlag values combined using binary OR
//! operations (1U << flag).
//!
using OnnxParserFlags = uint32_t;
108
109enum class OnnxParserFlag : int32_t
110{
123 // This flag is set to be OFF by default.
130};
131
137template <>
138constexpr inline int32_t EnumMax<OnnxParserFlag>() noexcept
139{
140 return 3;
141}
142
149{
150public:
154 virtual ErrorCode code() const = 0;
158 virtual char const* desc() const = 0;
162 virtual char const* file() const = 0;
166 virtual int line() const = 0;
170 virtual char const* func() const = 0;
174 virtual int node() const = 0;
178 virtual char const* nodeName() const = 0;
182 virtual char const* nodeOperator() const = 0;
188 virtual char const* const* localFunctionStack() const = 0;
192 // a stack size of 0.
194 virtual int32_t localFunctionStackSize() const = 0;
195
196protected:
197 virtual ~IParserError() {}
198};
199
211{
212public:
227 virtual bool parse(
228 void const* serialized_onnx_model, size_t serialized_onnx_model_size, const char* model_path = nullptr) noexcept
229 = 0;
230
241 virtual bool parseFromFile(const char* onnxModelFile, int verbosity) noexcept = 0;
242
257 TRT_DEPRECATED virtual bool supportsModel(void const* serialized_onnx_model, size_t serialized_onnx_model_size,
258 SubGraphCollection_t& sub_graph_collection, const char* model_path = nullptr) noexcept = 0;
259
273 void const* serialized_onnx_model, size_t serialized_onnx_model_size) noexcept = 0;
274
284 virtual bool supportsOperator(const char* op_name) const noexcept = 0;
285
292 virtual int getNbErrors() const noexcept = 0;
293
299 virtual IParserError const* getError(int index) const noexcept = 0;
300
306 virtual void clearErrors() noexcept = 0;
307
308 virtual ~IParser() noexcept = default;
309
326 virtual char const* const* getUsedVCPluginLibraries(int64_t& nbPluginLibs) const noexcept = 0;
327
339 virtual void setFlags(OnnxParserFlags onnxParserFlags) noexcept = 0;
340
348 virtual OnnxParserFlags getFlags() const noexcept = 0;
349
357 virtual void clearFlag(OnnxParserFlag onnxParserFlag) noexcept = 0;
358
366 virtual void setFlag(OnnxParserFlag onnxParserFlag) noexcept = 0;
367
375 virtual bool getFlag(OnnxParserFlag onnxParserFlag) const noexcept = 0;
376
389 virtual nvinfer1::ITensor const* getLayerOutputTensor(char const* name, int64_t i) noexcept = 0;
390
403 virtual bool supportsModelV2(
404 void const* serializedOnnxModel, size_t serializedOnnxModelSize, char const* modelPath = nullptr) noexcept = 0;
405
413 virtual int64_t getNbSubgraphs() noexcept = 0;
414
423 virtual bool isSubgraphSupported(int64_t const index) noexcept = 0;
424
435 virtual int64_t* getSubgraphNodes(int64_t const index, int64_t& subgraphLength) noexcept = 0;
436
453 virtual bool loadModelProto(
454 void const* serializedOnnxModel, size_t serializedOnnxModelSize, char const* modelPath = nullptr) noexcept = 0;
455
478 virtual bool loadInitializer(char const* name, void const* data, size_t size) noexcept = 0;
479
485 virtual bool parseModelProto() noexcept = 0;
486
492 virtual bool setBuilderConfig(const nvinfer1::IBuilderConfig* const builderConfig) noexcept = 0;
493};
494
503{
504public:
517 virtual bool refitFromBytes(
518 void const* serializedOnnxModel, size_t serializedOnnxModelSize, char const* modelPath = nullptr) noexcept
519 = 0;
520
531 virtual bool refitFromFile(char const* onnxModelFile) noexcept = 0;
532
538 virtual int32_t getNbErrors() const noexcept = 0;
539
545 virtual IParserError const* getError(int32_t index) const noexcept = 0;
546
552 virtual void clearErrors() = 0;
553
554 virtual ~IParserRefitter() noexcept = default;
555
571 virtual bool loadModelProto(
572 void const* serializedOnnxModel, size_t serializedOnnxModelSize, char const* modelPath = nullptr) noexcept = 0;
573
595 virtual bool loadInitializer(char const* name, void const* data, size_t size) noexcept = 0;
596
602 virtual bool refitModelProto() noexcept = 0;
603};
604
605} // namespace nvonnxparser
606
//! \brief Internal C ABI entry point; called by createParser(). Prefer createParser() in application code.
extern "C" TENSORRTAPI void* createNvOnnxParser_INTERNAL(void* network, void* logger, int version) noexcept;
609 void* refitter, void* logger, int32_t version) noexcept;
//! \brief Returns the ONNX parser version as an integer (presumably derived from NV_ONNX_PARSER_MAJOR/MINOR/PATCH -- confirm).
extern "C" TENSORRTAPI int getNvOnnxParserVersion() noexcept;
611
612namespace nvonnxparser
613{
614
615namespace
616{
617
634{
635 return static_cast<IParser*>(createNvOnnxParser_INTERNAL(&network, &logger, NV_ONNX_PARSER_VERSION));
636}
637
648{
649 return static_cast<IParserRefitter*>(
650 createNvOnnxParserRefitter_INTERNAL(&refitter, &logger, NV_ONNX_PARSER_VERSION));
651}
652
653} // namespace
654
655} // namespace nvonnxparser
656
657#endif // NV_ONNX_PARSER_H
#define TENSORRTAPI
Definition: NvInferRuntimeBase.h:69
#define TRT_DEPRECATED
Definition: NvInferRuntimeBase.h:42
TENSORRTAPI void * createNvOnnxParserRefitter_INTERNAL(void *refitter, void *logger, int32_t version) noexcept
std::vector< SubGraph_t > SubGraphCollection_t
The data structure containing all SubGraph_t partitioned out of an ONNX graph.
Definition: NvOnnxParser.h:53
TENSORRTAPI void * createNvOnnxParser_INTERNAL(void *network, void *logger, int version) noexcept
TENSORRTAPI int getNvOnnxParserVersion() noexcept
#define NV_ONNX_PARSER_PATCH
Definition: NvOnnxParser.h:34
#define NV_ONNX_PARSER_MINOR
Definition: NvOnnxParser.h:33
std::pair< std::vector< size_t >, bool > SubGraph_t
The data structure containing the parsing capability of a set of nodes in an ONNX graph.
Definition: NvOnnxParser.h:45
#define NV_ONNX_PARSER_MAJOR
Definition: NvOnnxParser.h:32
Application-implemented logging interface for the builder, refitter and runtime.
Definition: NvInferRuntime.h:1588
A network definition for input to the builder.
Definition: NvInfer.h:7344
Updates weights in an engine.
Definition: NvInferRuntime.h:2264
An object containing information about an error.
Definition: NvOnnxParser.h:149
virtual char const * nodeOperator() const =0
name of the node operation in which the error occurred.
virtual char const * func() const =0
source function in which the error occurred.
virtual int line() const =0
source line at which the error occurred.
virtual char const * desc() const =0
description of the error.
virtual ~IParserError()
Definition: NvOnnxParser.h:197
virtual ErrorCode code() const =0
the error code.
virtual char const * nodeName() const =0
name of the node in which the error occurred.
virtual char const *const * localFunctionStack() const =0
A list of the local function names, from the top level down, constituting the current stack trace in ...
virtual int node() const =0
index of the ONNX model node in which the error occurred.
virtual char const * file() const =0
source file in which the error occurred.
virtual int32_t localFunctionStackSize() const =0
The size of the stack of local functions at the point where the error occurred. A top-level node that...
An object for parsing ONNX models into a TensorRT network definition.
Definition: NvOnnxParser.h:211
virtual IParserError const * getError(int index) const noexcept=0
Get an error that occurred during prior calls to parse.
virtual char const *const * getUsedVCPluginLibraries(int64_t &nbPluginLibs) const noexcept=0
Query the plugin libraries needed to implement operations used by the parser in a version-compatible ...
virtual void setFlag(OnnxParserFlag onnxParserFlag) noexcept=0
Set a single parser flag.
virtual bool loadInitializer(char const *name, void const *data, size_t size) noexcept=0
Prompt the ONNX parser to load an initializer with user-provided binary data. The lifetime of the dat...
virtual bool supportsOperator(const char *op_name) const noexcept=0
Returns whether the specified operator may be supported by the parser.
virtual bool parseModelProto() noexcept=0
Begin the parsing and conversion process of the loaded ONNX model into a TensorRT INetworkDefinition.
virtual bool supportsModelV2(void const *serializedOnnxModel, size_t serializedOnnxModelSize, char const *modelPath=nullptr) noexcept=0
Check whether TensorRT supports a particular ONNX model. If the function returns True,...
virtual void clearErrors() noexcept=0
Clear errors from prior calls to parse.
virtual TRT_DEPRECATED bool supportsModel(void const *serialized_onnx_model, size_t serialized_onnx_model_size, SubGraphCollection_t &sub_graph_collection, const char *model_path=nullptr) noexcept=0
Check whether TensorRT supports a particular ONNX model. If the function returns True,...
virtual TRT_DEPRECATED bool parseWithWeightDescriptors(void const *serialized_onnx_model, size_t serialized_onnx_model_size) noexcept=0
Parse a serialized ONNX model into the TensorRT network with consideration of user provided weights.
virtual bool getFlag(OnnxParserFlag onnxParserFlag) const noexcept=0
Returns true if the parser flag is set.
virtual void clearFlag(OnnxParserFlag onnxParserFlag) noexcept=0
Clear a single parser flag.
virtual OnnxParserFlags getFlags() const noexcept=0
Get the parser flags. Defaults to 0.
virtual bool parseFromFile(const char *onnxModelFile, int verbosity) noexcept=0
Parse an onnx model file, which can be a binary protobuf or a text onnx model calls parse method insi...
virtual bool isSubgraphSupported(int64_t const index) noexcept=0
Returns whether the subgraph is supported. Calling this function before calling supportsModelV2 resul...
virtual int64_t getNbSubgraphs() noexcept=0
Get the number of subgraphs. Calling this function before calling supportsModelV2 results in undefine...
virtual bool loadModelProto(void const *serializedOnnxModel, size_t serializedOnnxModelSize, char const *modelPath=nullptr) noexcept=0
Load a serialized ONNX model into the parser. Unlike the parse(), parseFromFile(),...
virtual int64_t * getSubgraphNodes(int64_t const index, int64_t &subgraphLength) noexcept=0
Get the nodes of the specified subgraph. Calling this function before calling supportsModelV2 results...
virtual bool setBuilderConfig(const nvinfer1::IBuilderConfig *const builderConfig) noexcept=0
Set the BuilderConfig for the parser.
virtual void setFlags(OnnxParserFlags onnxParserFlags) noexcept=0
Set the parser flags.
virtual bool parse(void const *serialized_onnx_model, size_t serialized_onnx_model_size, const char *model_path=nullptr) noexcept=0
Parse a serialized ONNX model into the TensorRT network. This method has very limited diagnostics....
virtual int getNbErrors() const noexcept=0
Get the number of errors that occurred during prior calls to parse.
virtual nvinfer1::ITensor const * getLayerOutputTensor(char const *name, int64_t i) noexcept=0
Return the i-th output ITensor object for the ONNX layer "name".
An interface designed to refit weights from an ONNX model.
Definition: NvOnnxParser.h:503
virtual bool refitFromBytes(void const *serializedOnnxModel, size_t serializedOnnxModelSize, char const *modelPath=nullptr) noexcept=0
Load a serialized ONNX model from memory and perform weight refit.
The TensorRT API version 1 namespace.
Definition: NvInferPluginBase.h:29
IParser * createParser(nvinfer1::INetworkDefinition &network, nvinfer1::ILogger &logger) noexcept
Create a new parser object.
Definition: NvOnnxParser.h:633
IParserRefitter * createParserRefitter(nvinfer1::IRefitter &refitter, nvinfer1::ILogger &logger) noexcept
Create a new ONNX refitter object.
Definition: NvOnnxParser.h:647
The TensorRT ONNX parser API namespace.
Definition: NvOnnxConfig.h:24
uint32_t OnnxParserFlags
Represents one or more OnnxParserFlag values using binary OR operations, e.g., 1U << OnnxParserFlag::...
Definition: NvOnnxParser.h:107
constexpr int32_t EnumMax() noexcept
ErrorCode
The type of error that the parser or refitter may return.
Definition: NvOnnxParser.h:72
OnnxParserFlag
Definition: NvOnnxParser.h:110
constexpr int32_t EnumMax< ErrorCode >() noexcept
Definition: NvOnnxParser.h:96
constexpr int32_t EnumMax< OnnxParserFlag >() noexcept
Definition: NvOnnxParser.h:138

  Copyright © 2024 NVIDIA Corporation
  Privacy Policy | Manage My Privacy | Do Not Sell or Share My Data | Terms of Service | Accessibility | Corporate Policies | Product Security | Contact