_static/c-api/_nv_infer_runtime_base_8h_source.html

/*

 * SPDX-FileCopyrightText: Copyright (c) 1993-2024 NVIDIA CORPORATION & AFFILIATES. All rights reserved.

 * SPDX-License-Identifier: Apache-2.0

 *

 * Licensed under the Apache License, Version 2.0 (the "License");

 * you may not use this file except in compliance with the License.

 * You may obtain a copy of the License at

 *

 * http://www.apache.org/licenses/LICENSE-2.0

 *

 * Unless required by applicable law or agreed to in writing, software

 * distributed under the License is distributed on an "AS IS" BASIS,

 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

 * See the License for the specific language governing permissions and

 * limitations under the License.

 */


#ifndef NV_INFER_RUNTIME_BASE_H

#define NV_INFER_RUNTIME_BASE_H


#include "NvInferVersion.h"

#include <cstddef>

#include <cstdint>

#include <cuda_runtime_api.h>


// Items that are marked as deprecated will be removed in a future release.
//
// Three markers are defined here:
//   TRT_DEPRECATED      - general deprecation marker.
//   TRT_DEPRECATED_ENUM - marker for enumerators; expands to nothing wherever enumerator
//                         deprecation is not enabled.
//   TRT_DEPRECATED_API  - marker for exported API symbols; also carries the export/visibility
//                         attribute.
#if __cplusplus >= 201402L
// C++14 and later: use the standard [[deprecated]] attribute.
#define TRT_DEPRECATED [[deprecated]]
// Enumerator deprecation is only enabled when __GNUC__ is defined and is at least 6.
// The defined() check keeps the exact same outcome as comparing an undefined __GNUC__ (which the
// preprocessor treats as 0) while avoiding -Wundef / MSVC C4668 diagnostics on non-GNU compilers.
#if !defined(__GNUC__) || __GNUC__ < 6
#define TRT_DEPRECATED_ENUM
#else
#define TRT_DEPRECATED_ENUM TRT_DEPRECATED
#endif
#ifdef _MSC_VER
// On MSVC the API marker only exports the symbol; no deprecation attribute is attached.
#define TRT_DEPRECATED_API __declspec(dllexport)
#else
#define TRT_DEPRECATED_API [[deprecated]] __attribute__((visibility("default")))
#endif
#else
// Before C++14: fall back to compiler-specific spellings.
#ifdef _MSC_VER
// MSVC: the general and enumerator markers expand to nothing; the API marker only exports.
#define TRT_DEPRECATED
#define TRT_DEPRECATED_ENUM
#define TRT_DEPRECATED_API __declspec(dllexport)
#else
// Other compilers: GNU attribute syntax; enumerators are never marked in this branch.
#define TRT_DEPRECATED __attribute__((deprecated))
#define TRT_DEPRECATED_ENUM
#define TRT_DEPRECATED_API __attribute__((deprecated, visibility("default")))
#endif
#endif


// Defines which symbols are exported

//! TENSORRTAPI is the export marker placed on library entry points. It expands to an
//! export/visibility attribute only when TENSORRT_BUILD_LIB is defined, and to nothing otherwise.
#ifdef TENSORRT_BUILD_LIB

#ifdef _MSC_VER

#define TENSORRTAPI __declspec(dllexport)

#else

#define TENSORRTAPI __attribute__((visibility("default")))

#endif

#else

#define TENSORRTAPI

#endif

//! TRTNOEXCEPT expands to nothing.
//! NOTE(review): nothing in the visible part of this header uses it; presumably it is kept for
//! source compatibility with older code - confirm before removing.
#define TRTNOEXCEPT

//! Direct-include guard: unless NV_INFER_INTERNAL_INCLUDE has been defined before this header is
//! processed, compilation fails with the message below.
#if !defined(NV_INFER_INTERNAL_INCLUDE)

static_assert(false, "Do not directly include this file. Include NvInferRuntime.h or NvInferPluginUtils.h");

#endif


//! Forward declarations, with C linkage, of two context structs. Only the names are introduced
//! here; neither struct is defined in this header, so they can only be used as incomplete types.
extern "C"

{

    struct cublasContext;

    struct cudnnContext;

}


//! Pack a (major, minor, patch) version triple into one integer:
//! major * 10000 + minor * 100 + patch. The L-suffixed factors make the result at least a long.
#define NV_TENSORRT_VERSION_INT(major, minor, patch)                                                                   \
    (((major) * 10000L) + ((minor) * 100L) + ((patch) * 1L))


//! The version of this header set as a single integer, built by passing NV_TENSORRT_MAJOR,
//! NV_TENSORRT_MINOR and NV_TENSORRT_PATCH to NV_TENSORRT_VERSION_INT. Those three macros are not
//! defined in this file (presumably they come from NvInferVersion.h, included above - confirm).
#define NV_TENSORRT_VERSION NV_TENSORRT_VERSION_INT(NV_TENSORRT_MAJOR, NV_TENSORRT_MINOR, NV_TENSORRT_PATCH)


namespace nvinfer1

{

//! char_t is the type used by TensorRT to represent all valid characters.
using char_t = char;


//! AsciiChar is an alias of char_t (and therefore of char).
using AsciiChar = char_t;


//! Forward declaration of the versioned error-recorder interface, so that the unversioned name
//! nvinfer1::IErrorRecorder can be used before the class body appears later in this header.
namespace v_1_0

{

class IErrorRecorder;

}

//! Unversioned alias for v_1_0::IErrorRecorder.
using IErrorRecorder = v_1_0::IErrorRecorder;


namespace impl

{

//! Declaration of EnumMaxImpl struct to store maximum number of elements in an enumeration type.
//! The primary template is only declared, never defined: each supported enumeration provides an
//! explicit specialization with a static kVALUE member.
template <typename T>

struct EnumMaxImpl;

} // namespace impl


//! Maximum number of elements in an enumeration type.
//!
//! \tparam T Enumeration type; an impl::EnumMaxImpl<T> specialization must exist, otherwise the
//!           call does not compile because the primary template is left undefined.
//! \return impl::EnumMaxImpl<T>::kVALUE, usable in constant expressions.
template <typename T>

constexpr int32_t EnumMax() noexcept

{

    return impl::EnumMaxImpl<T>::kVALUE;

}


//! The type of weights and tensors.
//! Enumerator values are explicit and contiguous (0..10).
enum class DataType : int32_t

{
    //! 32-bit floating point format.
    kFLOAT = 0,

    //! IEEE 16-bit floating-point format - has a 5 bit exponent and 11 bit significand.
    kHALF = 1,

    //! Signed 8-bit integer representing a quantized floating-point value.
    kINT8 = 2,

    //! Signed 32-bit integer format.
    kINT32 = 3,

    //! 8-bit boolean. 0 = false, 1 = true, other values undefined.
    kBOOL = 4,

    //! NOTE(review): no description is available here; presumably an unsigned 8-bit integer format - confirm.
    kUINT8 = 5,

    //! NOTE(review): no description is available here; presumably an 8-bit floating-point format - confirm.
    kFP8 = 6,

    //! Brain float - has an 8 bit exponent and 8 bit significand.
    kBF16 = 7,

    //! Signed 64-bit integer type.
    kINT64 = 8,

    //! Signed 4-bit integer type.
    kINT4 = 9,

    //! NOTE(review): no description is available here; presumably a 4-bit floating-point format - confirm.
    kFP4 = 10,

};


namespace impl

{

//! EnumMaxImpl specialization for DataType; this is the value returned by EnumMax<DataType>().
template <>

struct EnumMaxImpl<DataType>

{
    // Number of elements in the DataType enum (enumerator values 0 through 10).
    static constexpr int32_t kVALUE = 11;

};

} // namespace impl


//! Tensor dimensions: a rank together with a fixed-capacity array of 64-bit extents.
//! The class declares no constructors, so members are not initialized by default construction.
class Dims64

{

public:
    //! The maximum rank (number of dimensions) supported for a tensor.
    static constexpr int32_t MAX_DIMS{8};

    //! The rank (number of dimensions).
    int32_t nbDims;

    //! The extent of each dimension.
    int64_t d[MAX_DIMS];

};


//! Dims is an alias of Dims64.
using Dims = Dims64;


//! InterfaceKind is a C-style string (pointer to const char); it is the type of InterfaceInfo::kind.
using InterfaceKind = char const*;


//! Version information associated with a TRT interface.
//! Plain aggregate: it can be brace-initialized as {kind, major, minor}.
class InterfaceInfo

{

public:
    // C-style string naming the interface.
    InterfaceKind kind;
    // Major version number of the interface.
    int32_t major;
    // Minor version number of the interface.
    int32_t minor;

};


//! Programming language used in the implementation of a TRT interface.
enum class APILanguage : int32_t

{
    // Implementation written in C++.
    kCPP = 0,
    // Implementation written in Python.
    kPYTHON = 1

};


namespace impl

{

//! EnumMaxImpl specialization for APILanguage; this is the value returned by EnumMax<APILanguage>().
template <>

struct EnumMaxImpl<APILanguage>

{
    // Number of elements in the APILanguage enum (kCPP and kPYTHON).
    static constexpr int32_t kVALUE = 2;

};

} // namespace impl


//! An Interface class for version control.
//!
//! Abstract base class: getInterfaceInfo() is pure virtual. Construction, copy and move are
//! protected, so objects can only be created and copied through derived classes.
class IVersionedInterface

{

public:
    //! The language used to build the implementation of this Interface.
    //! The default implementation reports APILanguage::kCPP.
    virtual APILanguage getAPILanguage() const noexcept

    {

        return APILanguage::kCPP;

    }

    //! Return version information associated with this interface.
    virtual InterfaceInfo getInterfaceInfo() const noexcept = 0;

    //! Virtual destructor, so a derived object can be destroyed through a base pointer.
    virtual ~IVersionedInterface() noexcept = default;


protected:
    // Defaulted special members, accessible to derived classes only. The trailing '&' on the
    // assignment operators restricts assignment to lvalue objects.
    IVersionedInterface() = default;

    IVersionedInterface(IVersionedInterface const&) = default;

    IVersionedInterface(IVersionedInterface&&) = default;

    IVersionedInterface& operator=(IVersionedInterface const&) & = default;

    IVersionedInterface& operator=(IVersionedInterface&&) & = default;

};


//! Error codes that can be returned by TensorRT during execution.
//!
//! Enumerator values are explicit and contiguous (0..10); kSUCCESS is 0.
//! NOTE(review): the per-code descriptions are not available in this extract; consult the
//! upstream API reference before relying on the exact meaning of an individual code.
enum class ErrorCode : int32_t

{

    kSUCCESS = 0,


    kUNSPECIFIED_ERROR = 1,


    kINTERNAL_ERROR = 2,


    kINVALID_ARGUMENT = 3,


    kINVALID_CONFIG = 4,


    kFAILED_ALLOCATION = 5,


    kFAILED_INITIALIZATION = 6,


    kFAILED_EXECUTION = 7,


    kFAILED_COMPUTATION = 8,


    kINVALID_STATE = 9,


    kUNSUPPORTED_STATE = 10,


};


namespace impl

{

//! EnumMaxImpl specialization for ErrorCode; this is the value returned by EnumMax<ErrorCode>().
template <>

struct EnumMaxImpl<ErrorCode>

{
    // Number of elements in the ErrorCode enum (enumerator values 0 through 10).
    static constexpr int32_t kVALUE = 11;

};

} // namespace impl


namespace v_1_0

{

//! Abstract interface for an error recorder: TensorRT reports errors into it through
//! reportError(), and the application reads them back through the query methods below.
//! Every method except getInterfaceInfo() is pure virtual and must be supplied by the implementer.
class IErrorRecorder : public IVersionedInterface

{

public:
    //! Return version information associated with this interface: kind "IErrorRecorder",
    //! major version 1, minor version 0.
    InterfaceInfo getInterfaceInfo() const noexcept override

    {

        return InterfaceInfo{"IErrorRecorder", 1, 0};

    }

    //! A typedef of a C-style string for reporting error descriptions.
    using ErrorDesc = char const*;

    //! NOTE(review): presumably the maximum length of an error description, excluding the
    //! terminating null character - confirm against the upstream documentation.
    static constexpr size_t kMAX_DESC_LENGTH{127U};

    //! A typedef of a 32-bit integer for reference counting.
    using RefCount = int32_t;


    IErrorRecorder() = default;

    ~IErrorRecorder() noexcept override = default;


    // Public API used to retrieve information from the error recorder.

    //! NOTE(review): presumably the number of errors currently held by the recorder - confirm.
    virtual int32_t getNbErrors() const noexcept = 0;

    //! Return the ErrorCode stored at index errorIdx.
    //! NOTE(review): the valid index range is presumably [0, getNbErrors()) - confirm.
    virtual ErrorCode getErrorCode(int32_t errorIdx) const noexcept = 0;

    //! Return the description string stored at index errorIdx.
    //! NOTE(review): the valid index range is presumably [0, getNbErrors()) - confirm.
    virtual ErrorDesc getErrorDesc(int32_t errorIdx) const noexcept = 0;

    //! NOTE(review): presumably true when errors were dropped because the recorder ran out of
    //! capacity - confirm.
    virtual bool hasOverflowed() const noexcept = 0;

    //! NOTE(review): presumably discards all recorded errors - confirm.
    virtual void clear() noexcept = 0;


    // API used by TensorRT to report Error information to the application.

    //! Report an error code together with its description.
    //! NOTE(review): the meaning of the bool result is not visible in this extract - confirm.
    virtual bool reportError(ErrorCode val, ErrorDesc desc) noexcept = 0;

    //! NOTE(review): presumably increments the reference count and returns the new count - confirm.
    virtual RefCount incRefCount() noexcept = 0;

    //! NOTE(review): presumably decrements the reference count and returns the new count - confirm.
    virtual RefCount decRefCount() noexcept = 0;


protected:

    // @cond SuppressDoxyWarnings

    // Copy and move are defaulted but protected, so only derived classes can use them. The
    // trailing '&' on the assignment operators restricts assignment to lvalue objects.
    IErrorRecorder(IErrorRecorder const&) = default;

    IErrorRecorder(IErrorRecorder&&) = default;

    IErrorRecorder& operator=(IErrorRecorder const&) & = default;

    IErrorRecorder& operator=(IErrorRecorder&&) & = default;

    // @endcond

}; // class IErrorRecorder

} // namespace v_1_0


//! Unversioned alias for v_1_0::IErrorRecorder. The same alias is already declared earlier in this
//! header next to the forward declaration; repeating an identical alias-declaration is legal.
using IErrorRecorder = v_1_0::IErrorRecorder;


//! Definition of tensor IO Mode.
enum class TensorIOMode : int32_t

{
    //! NOTE(review): no description is available here; presumably the tensor is neither an input
    //! nor an output - confirm.
    kNONE = 0,

    //! Tensor is input to the engine.
    kINPUT = 1,

    //! Tensor is output by the engine.
    kOUTPUT = 2

};


namespace impl

{

//! EnumMaxImpl specialization for TensorIOMode; this is the value returned by EnumMax<TensorIOMode>().
template <>

struct EnumMaxImpl<TensorIOMode>

{

    // Declaration of kVALUE that represents maximum number of elements in TensorIOMode enum

    static constexpr int32_t kVALUE = 3;

};

} // namespace impl

} // namespace nvinfer1


//! Return the library version number.
//! Declared with C linkage and marked with TENSORRTAPI; the definition is not in this header.
extern "C" TENSORRTAPI int32_t getInferLibVersion() noexcept;


#endif // NV_INFER_RUNTIME_BASE_H

TENSORRTAPI
#define TENSORRTAPI
Definition: NvInferRuntimeBase.h:59

getInferLibVersion
int32_t getInferLibVersion() noexcept
Return the library version number.

NvInferVersion.h

nvinfer1::Dims64
Definition: NvInferRuntimeBase.h:203

nvinfer1::Dims64::MAX_DIMS
static constexpr int32_t MAX_DIMS
The maximum rank (number of dimensions) supported for a tensor.
Definition: NvInferRuntimeBase.h:206

nvinfer1::Dims64::d
int64_t d[MAX_DIMS]
The extent of each dimension.
Definition: NvInferRuntimeBase.h:212

nvinfer1::Dims64::nbDims
int32_t nbDims
The rank (number of dimensions).
Definition: NvInferRuntimeBase.h:209

nvinfer1::IVersionedInterface
An Interface class for version control.
Definition: NvInferRuntimeBase.h:263

nvinfer1::IVersionedInterface::getInterfaceInfo
virtual InterfaceInfo getInterfaceInfo() const noexcept=0
Return version information associated with this interface. Applications must not override this method...

nvinfer1::IVersionedInterface::getAPILanguage
virtual APILanguage getAPILanguage() const noexcept
The language used to build the implementation of this Interface.
Definition: NvInferRuntimeBase.h:270

nvinfer1::InterfaceInfo
Version information associated with a TRT interface.
Definition: NvInferRuntimeBase.h:228

nvinfer1::InterfaceInfo::kind
InterfaceKind kind
Definition: NvInferRuntimeBase.h:230

nvinfer1::InterfaceInfo::major
int32_t major
Definition: NvInferRuntimeBase.h:231

nvinfer1::InterfaceInfo::minor
int32_t minor
Definition: NvInferRuntimeBase.h:232

nvinfer1::v_1_0::IErrorRecorder
Definition: NvInferRuntimeBase.h:400

nvinfer1::v_1_0::IErrorRecorder::ErrorDesc
char const  * ErrorDesc
A typedef of a C-style string for reporting error descriptions.
Definition: NvInferRuntimeBase.h:413

nvinfer1::v_1_0::IErrorRecorder::~IErrorRecorder
~IErrorRecorder() noexcept override=default

nvinfer1::v_1_0::IErrorRecorder::RefCount
int32_t RefCount
A typedef of a 32-bit integer for reference counting.
Definition: NvInferRuntimeBase.h:425

nvinfer1::v_1_0::IErrorRecorder::IErrorRecorder
IErrorRecorder()=default

nvinfer1::v_1_0::IErrorRecorder::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntimeBase.h:405

nvinfer1
The TensorRT API version 1 namespace.

nvinfer1::ErrorCode
ErrorCode
Error codes that can be returned by TensorRT during execution.
Definition: NvInferRuntimeBase.h:296

nvinfer1::ErrorCode::kUNSUPPORTED_STATE
@ kUNSUPPORTED_STATE

nvinfer1::ErrorCode::kINVALID_STATE
@ kINVALID_STATE

nvinfer1::ErrorCode::kFAILED_INITIALIZATION
@ kFAILED_INITIALIZATION

nvinfer1::ErrorCode::kUNSPECIFIED_ERROR
@ kUNSPECIFIED_ERROR

nvinfer1::ErrorCode::kFAILED_ALLOCATION
@ kFAILED_ALLOCATION

nvinfer1::ErrorCode::kFAILED_COMPUTATION
@ kFAILED_COMPUTATION

nvinfer1::ErrorCode::kINTERNAL_ERROR
@ kINTERNAL_ERROR

nvinfer1::ErrorCode::kFAILED_EXECUTION
@ kFAILED_EXECUTION

nvinfer1::ErrorCode::kSUCCESS
@ kSUCCESS

nvinfer1::ErrorCode::kINVALID_CONFIG
@ kINVALID_CONFIG

nvinfer1::ErrorCode::kINVALID_ARGUMENT
@ kINVALID_ARGUMENT

nvinfer1::TensorIOMode
TensorIOMode
Definition of tensor IO Mode.
Definition: NvInferRuntimeBase.h:643

nvinfer1::TensorIOMode::kOUTPUT
@ kOUTPUT
Tensor is output by the engine.

nvinfer1::TensorIOMode::kINPUT
@ kINPUT
Tensor is input to the engine.

nvinfer1::APILanguage
APILanguage
Programming language used in the implementation of a TRT interface.
Definition: NvInferRuntimeBase.h:241

nvinfer1::APILanguage::kPYTHON
@ kPYTHON

nvinfer1::APILanguage::kCPP
@ kCPP

nvinfer1::AsciiChar
char_t AsciiChar
Definition: NvInferRuntimeBase.h:105

nvinfer1::char_t
char char_t
char_t is the type used by TensorRT to represent all valid characters.
Definition: NvInferRuntimeBase.h:101

nvinfer1::DataType
DataType
The type of weights and tensors.
Definition: NvInferRuntimeBase.h:133

nvinfer1::DataType::kUINT8
@ kUINT8

nvinfer1::DataType::kINT64
@ kINT64
Signed 64-bit integer type.

nvinfer1::DataType::kFLOAT
@ kFLOAT
32-bit floating point format.

nvinfer1::DataType::kFP4
@ kFP4

nvinfer1::DataType::kBOOL
@ kBOOL
8-bit boolean. 0 = false, 1 = true, other values undefined.

nvinfer1::DataType::kHALF
@ kHALF
IEEE 16-bit floating-point format – has a 5 bit exponent and 11 bit significand.

nvinfer1::DataType::kINT8
@ kINT8
Signed 8-bit integer representing a quantized floating-point value.

nvinfer1::DataType::kFP8
@ kFP8

nvinfer1::DataType::kBF16
@ kBF16
Brain float – has an 8 bit exponent and 8 bit significand.

nvinfer1::DataType::kINT4
@ kINT4
Signed 4-bit integer type.

nvinfer1::DataType::kINT32
@ kINT32
Signed 32-bit integer format.

nvinfer1::InterfaceKind
char const  * InterfaceKind
Definition: NvInferRuntimeBase.h:220

nvinfer1::EnumMax
constexpr int32_t EnumMax() noexcept
Maximum number of elements in an enumeration type.
Definition: NvInferRuntimeBase.h:123

nvinfer1::MatrixOperation::kNONE
@ kNONE

nvinfer1::IErrorRecorder
v_1_0::IErrorRecorder IErrorRecorder
Definition: NvInferRuntimeBase.h:112

nvinfer1::impl::EnumMaxImpl
Declaration of EnumMaxImpl struct to store maximum number of elements in an enumeration type.
Definition: NvInferRuntimeBase.h:118