api/c_api/_nv_infer_runtime_common_8h_source.html

/*

 * Copyright (c) 1993-2021 NVIDIA Corporation. All rights reserved.

 *

 * NOTICE TO LICENSEE:

 *

 * This source code and/or documentation ("Licensed Deliverables") are

 * subject to NVIDIA intellectual property rights under U.S. and

 * international Copyright laws.

 *

 * These Licensed Deliverables contained herein is PROPRIETARY and

 * CONFIDENTIAL to NVIDIA and is being provided under the terms and

 * conditions of a form of NVIDIA software license agreement by and

 * between NVIDIA and Licensee ("License Agreement") or electronically

 * accepted by Licensee.  Notwithstanding any terms or conditions to

 * the contrary in the License Agreement, reproduction or disclosure

 * of the Licensed Deliverables to any third party without the express

 * written consent of NVIDIA is prohibited.

 *

 * NOTWITHSTANDING ANY TERMS OR CONDITIONS TO THE CONTRARY IN THE

 * LICENSE AGREEMENT, NVIDIA MAKES NO REPRESENTATION ABOUT THE

 * SUITABILITY OF THESE LICENSED DELIVERABLES FOR ANY PURPOSE.  IT IS

 * PROVIDED "AS IS" WITHOUT EXPRESS OR IMPLIED WARRANTY OF ANY KIND.

 * NVIDIA DISCLAIMS ALL WARRANTIES WITH REGARD TO THESE LICENSED

 * DELIVERABLES, INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY,

 * NONINFRINGEMENT, AND FITNESS FOR A PARTICULAR PURPOSE.

 * NOTWITHSTANDING ANY TERMS OR CONDITIONS TO THE CONTRARY IN THE

 * LICENSE AGREEMENT, IN NO EVENT SHALL NVIDIA BE LIABLE FOR ANY

 * SPECIAL, INDIRECT, INCIDENTAL, OR CONSEQUENTIAL DAMAGES, OR ANY

 * DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS,

 * WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS

 * ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE

 * OF THESE LICENSED DELIVERABLES.

 *

 * U.S. Government End Users.  These Licensed Deliverables are a

 * "commercial item" as that term is defined at 48 C.F.R. 2.101 (OCT

 * 1995), consisting of "commercial computer software" and "commercial

 * computer software documentation" as such terms are used in 48

 * C.F.R. 12.212 (SEPT 1995) and is provided to the U.S. Government

 * only as a commercial end item.  Consistent with 48 C.F.R.12.212 and

 * 48 C.F.R. 227.7202-1 through 227.7202-4 (JUNE 1995), all

 * U.S. Government End Users acquire the Licensed Deliverables with

 * only those rights set forth herein.

 *

 * Any use of the Licensed Deliverables in individual and commercial

 * software must include, in the user documentation and internal

 * comments to the code, the above Disclaimer and U.S. Government End

 * Users Notice.

 */


#ifndef NV_INFER_RUNTIME_COMMON_H

#define NV_INFER_RUNTIME_COMMON_H


#include "NvInferVersion.h"

#include <cstddef>

#include <cstdint>

#include <cuda_runtime_api.h>


// Deprecation markers.
//   TRT_DEPRECATED      - items that are marked as deprecated will be removed in
//                         a future release.
//   TRT_DEPRECATED_ENUM - enum flavour of the marker (per its name); it expands
//                         to nothing unless C++14 is available and __GNUC__ >= 6.
//   TRT_DEPRECATED_API  - marker that also carries the export/visibility
//                         annotation; on MSVC it expands to the export
//                         annotation only.
#if __cplusplus >= 201402L
// C++14 or later: use the standard attribute.
#define TRT_DEPRECATED [[deprecated]]
// An undefined __GNUC__ evaluates to 0 inside #if, so compilers that do not
// define it also take the empty definition.
#if __GNUC__ < 6
#define TRT_DEPRECATED_ENUM
#else
#define TRT_DEPRECATED_ENUM TRT_DEPRECATED
#endif
#ifdef _MSC_VER
#define TRT_DEPRECATED_API __declspec(dllexport)
#else
#define TRT_DEPRECATED_API [[deprecated]] __attribute__((visibility("default")))
#endif
#else
// Before C++14: fall back to compiler-specific spellings.
#ifdef _MSC_VER
#define TRT_DEPRECATED
#define TRT_DEPRECATED_ENUM
#define TRT_DEPRECATED_API __declspec(dllexport)
#else
#define TRT_DEPRECATED __attribute__((deprecated))
#define TRT_DEPRECATED_ENUM
#define TRT_DEPRECATED_API __attribute__((deprecated, visibility("default")))
#endif
#endif


// TENSORRTAPI annotates symbols exported by the library. It expands to the
// compiler's export/visibility annotation only when TENSORRT_BUILD_LIB is
// defined; otherwise it expands to nothing.
#ifdef TENSORRT_BUILD_LIB
#ifdef _MSC_VER
#define TENSORRTAPI __declspec(dllexport)
#else
#define TENSORRTAPI __attribute__((visibility("default")))
#endif
#else
#define TENSORRTAPI
#endif
// TRTNOEXCEPT expands to nothing in this header.
#define TRTNOEXCEPT


// Forward declare the cuBLAS and cuDNN context structs to avoid an include
// dependency on those libraries' headers. This header only uses pointers to
// them (see IPluginV2Ext::attachToContext), so incomplete types are enough.
extern "C"
{
    struct cublasContext;
    struct cudnnContext;
}


// Header version as a single integer; forwards to the constexpr constant
// nvinfer1::kNV_TENSORRT_VERSION_IMPL defined below.
#define NV_TENSORRT_VERSION nvinfer1::kNV_TENSORRT_VERSION_IMPL

namespace nvinfer1

{


//! Version of these headers packed into one integer as
//! major * 1000 + minor * 100 + patch, built from the NV_TENSORRT_MAJOR,
//! NV_TENSORRT_MINOR and NV_TENSORRT_PATCH macros.
static constexpr int32_t kNV_TENSORRT_VERSION_IMPL
    = (NV_TENSORRT_MAJOR * 1000) + (NV_TENSORRT_MINOR * 100) + NV_TENSORRT_PATCH; // major, minor, patch


//! char_t is the type used by TensorRT to represent all valid characters.
using char_t = char;
//! AsciiChar is the type used by TensorRT to represent valid ASCII characters.
using AsciiChar = char_t;

// Forward declarations; both classes are defined later in this header.
class IErrorRecorder;
class IGpuAllocator;


namespace impl
{
//! Declaration of EnumMaxImpl struct to store maximum number of elements in an
//! enumeration type. Only declared here; each supported enum provides an
//! explicit specialization exposing a kVALUE constant.
template <typename T>
struct EnumMaxImpl;
} // namespace impl


template <typename T>

constexpr int32_t EnumMax() noexcept

{

    return impl::EnumMaxImpl<T>::kVALUE;

}


//! \brief The type of weights and tensors.
enum class DataType : int32_t
{
    //! 32-bit floating point format.
    kFLOAT = 0,

    //! IEEE 16-bit floating-point format.
    kHALF = 1,

    //! 8-bit integer representing a quantized floating-point value.
    kINT8 = 2,

    //! Signed 32-bit integer format.
    kINT32 = 3,

    //! 8-bit boolean. 0 = false, 1 = true, other values undefined.
    kBOOL = 4
};


namespace impl

{

template <>

struct EnumMaxImpl<DataType>

{

    // Declaration of kVALUE that represents maximum number of elements in DataType enum

    static constexpr int32_t kVALUE = 5;

};

} // namespace impl


//! \brief Tensor dimensions: a rank plus a fixed-capacity array of extents.
class Dims32
{
public:
    //! The maximum rank (number of dimensions) supported for a tensor.
    static constexpr int32_t MAX_DIMS{8};
    //! The rank (number of dimensions).
    int32_t nbDims;
    //! The extent of each dimension.
    int32_t d[MAX_DIMS];
};

//! Dims is an alias for Dims32.
using Dims = Dims32;


//! \brief Format of the input/output tensors.
//!
//! The numeric values are spelled out explicitly. The memory layout each name
//! stands for is not described in this header excerpt.
enum class TensorFormat : int32_t
{
    kLINEAR = 0,

    kCHW2 = 1,

    kHWC8 = 2,

    kCHW4 = 3,

    kCHW16 = 4,

    kCHW32 = 5,

    kDHWC8 = 6,

    kCDHW32 = 7,

    kHWC = 8,

    kDLA_LINEAR = 9,

    kDLA_HWC4 = 10,

    kHWC16 = 11
};

//! PluginFormat is reserved for backward compatibility.
using PluginFormat = TensorFormat;


namespace impl

{

template <>

struct EnumMaxImpl<TensorFormat>

{

    // coverity[autosar_cpp14_m0_1_4_violation] Approved RFD: https://jirasw.nvidia.com/browse/TID-489

    static constexpr int32_t kVALUE = 12;

};

} // namespace impl


//! \brief Fields that a plugin might see for an input or output.
struct PluginTensorDesc
{
    //! Dimensions.
    Dims dims;
    //! Element type of the tensor (a DataType value).
    DataType type;
    //! Tensor format.
    TensorFormat format;
    //! Scale for INT8 data type.
    float scale;
};


//! \brief Definition of plugin versions.
//!
//! The value is placed in the upper byte of the integer returned by the
//! getTensorRTVersion() overrides of the extended plugin interfaces.
enum class PluginVersion : uint8_t
{
    //! IPluginV2.
    kV2 = 0,
    //! IPluginV2Ext.
    kV2_EXT = 1,
    //! IPluginV2IOExt.
    kV2_IOEXT = 2,
    //! IPluginV2DynamicExt.
    kV2_DYNAMICEXT = 3,
};


//! \brief Plugin class for user-implemented layers.
//!
//! Pure interface: every method except getTensorRTVersion() must be provided by
//! the implementer. Copy/move operations are protected, so they are reachable
//! only from derived classes.
class IPluginV2
{
public:
    //! Return the API version with which this plugin was built.
    //! The default implementation returns NV_TENSORRT_VERSION.
    virtual int32_t getTensorRTVersion() const noexcept
    {
        return NV_TENSORRT_VERSION;
    }

    //! Return the plugin type. Should match the plugin name returned by the
    //! corresponding plugin creator.
    virtual AsciiChar const* getPluginType() const noexcept = 0;

    //! Return the plugin version. Should match the plugin version returned by
    //! the corresponding plugin creator.
    virtual AsciiChar const* getPluginVersion() const noexcept = 0;

    //! Get the number of outputs from the layer.
    virtual int32_t getNbOutputs() const noexcept = 0;

    //! Get the dimension of an output tensor.
    //! \param index Index of the output tensor.
    //! \param inputs Input tensor dimensions.
    //! \param nbInputDims Number of entries in \p inputs.
    virtual Dims getOutputDimensions(int32_t index, Dims const* inputs, int32_t nbInputDims) noexcept = 0;

    //! Check format support for the given data type / format pair.
    virtual bool supportsFormat(DataType type, PluginFormat format) const noexcept = 0;

    //! Configure the layer.
    //! Receives the input and output dimensions with their counts, plus a data
    //! type, format and maximum batch size.
    virtual void configureWithFormat(Dims const* inputDims, int32_t nbInputs, Dims const* outputDims, int32_t nbOutputs,
        DataType type, PluginFormat format, int32_t maxBatchSize) noexcept
        = 0;

    //! Initialize the layer for execution. This is called when the engine is created.
    //! NOTE(review): the meaning of the returned int32_t (presumably 0 on
    //! success) is not shown in this header - confirm.
    virtual int32_t initialize() noexcept = 0;

    //! Release resources acquired during plugin layer initialization.
    //! This is called when the engine is destroyed.
    virtual void terminate() noexcept = 0;

    //! Find the workspace size required by the layer.
    virtual size_t getWorkspaceSize(int32_t maxBatchSize) const noexcept = 0;

    //! Execute the layer.
    //! \param batchSize Number of inputs in the batch.
    //! \param inputs Array of input buffer pointers.
    //! \param outputs Array of output buffer pointers.
    //! \param workspace Scratch buffer for the layer.
    //! \param stream CUDA stream handed to the layer.
    //! NOTE(review): the meaning of the returned int32_t is not shown here - confirm.
    virtual int32_t enqueue(int32_t batchSize, void const* const* inputs, void* const* outputs, void* workspace,
        cudaStream_t stream) noexcept
        = 0;

    //! Find the size of the serialization buffer required.
    virtual size_t getSerializationSize() const noexcept = 0;

    //! Serialize the layer into \p buffer.
    virtual void serialize(void* buffer) const noexcept = 0;

    //! Destroy the plugin object. This will be called when the network, builder
    //! or engine is destroyed.
    virtual void destroy() noexcept = 0;

    //! Clone the plugin object. This copies over internal plugin parameters and
    //! returns a new plugin object.
    virtual IPluginV2* clone() const noexcept = 0;

    //! Set the namespace that this plugin object belongs to.
    virtual void setPluginNamespace(AsciiChar const* pluginNamespace) noexcept = 0;

    //! Return the namespace of the plugin object.
    virtual AsciiChar const* getPluginNamespace() const noexcept = 0;

    // @cond SuppressDoxyWarnings
    IPluginV2() = default;
    virtual ~IPluginV2() noexcept = default;
// @endcond

protected:
// @cond SuppressDoxyWarnings
    // Copy and move are available to derived classes only.
    IPluginV2(IPluginV2 const&) = default;
    IPluginV2(IPluginV2&&) = default;
    IPluginV2& operator=(IPluginV2 const&) & = default;
    IPluginV2& operator=(IPluginV2&&) & = default;
// @endcond
};


//! \brief Plugin class for user-implemented layers.
//!
//! Extends IPluginV2 with per-tensor data types, broadcast queries and
//! attach/detach hooks for an execution context.
class IPluginV2Ext : public IPluginV2
{
public:
    //! Return the DataType of the plugin output at the requested index.
    virtual nvinfer1::DataType getOutputDataType(
        int32_t index, nvinfer1::DataType const* inputTypes, int32_t nbInputs) const noexcept
        = 0;

    //! Return true if output tensor is broadcast across a batch.
    virtual bool isOutputBroadcastAcrossBatch(
        int32_t outputIndex, bool const* inputIsBroadcasted, int32_t nbInputs) const noexcept
        = 0;

    //! Return true if plugin can use input that is broadcast across batch
    //! without replication.
    virtual bool canBroadcastInputAcrossBatch(int32_t inputIndex) const noexcept = 0;

    //! Configure the layer with input and output data types.
    virtual void configurePlugin(Dims const* inputDims, int32_t nbInputs, Dims const* outputDims, int32_t nbOutputs,
        DataType const* inputTypes, DataType const* outputTypes, bool const* inputIsBroadcast,
        bool const* outputIsBroadcast, PluginFormat floatFormat, int32_t maxBatchSize) noexcept
        = 0;

    IPluginV2Ext() = default;
    ~IPluginV2Ext() override = default;

    //! Attach the plugin object to an execution context and grant the plugin
    //! access to some context resources (cuDNN handle, cuBLAS handle, GPU
    //! allocator). The default implementation does nothing.
    virtual void attachToContext(
        cudnnContext* /*cudnn*/, cublasContext* /*cublas*/, IGpuAllocator* /*allocator*/) noexcept
    {
    }

    //! Detach the plugin object from its execution context.
    //! The default implementation does nothing.
    virtual void detachFromContext() noexcept {}

    //! Clone the plugin object. This copies over internal plugin parameters as
    //! well and returns a new plugin object. The return type is narrowed to
    //! IPluginV2Ext*.
    IPluginV2Ext* clone() const noexcept override = 0;

protected:
    // @cond SuppressDoxyWarnings
    IPluginV2Ext(IPluginV2Ext const&) = default;
    IPluginV2Ext(IPluginV2Ext&&) = default;
    IPluginV2Ext& operator=(IPluginV2Ext const&) & = default;
    IPluginV2Ext& operator=(IPluginV2Ext&&) & = default;
// @endcond

    //! Return the API version with which this plugin was built.
    //! PluginVersion::kV2_EXT is stored in the upper byte (bits 24-31) and the
    //! low 24 bits of NV_TENSORRT_VERSION in the rest.
    int32_t getTensorRTVersion() const noexcept override
    {
        return static_cast<int32_t>((static_cast<uint32_t>(PluginVersion::kV2_EXT) << 24U)
            | (static_cast<uint32_t>(NV_TENSORRT_VERSION) & 0xFFFFFFU));
    }

    //! Derived classes should not implement this. In a C++11 API it would be
    //! override final. Overridden here as an empty, protected method.
    void configureWithFormat(Dims const* /*inputDims*/, int32_t /*nbInputs*/, Dims const* /*outputDims*/,
        int32_t /*nbOutputs*/, DataType /*type*/, PluginFormat /*format*/, int32_t /*maxBatchSize*/) noexcept override
    {
    }
};


//! \brief Plugin class for user-implemented layers.
//!
//! Extends IPluginV2Ext with configuration and format queries expressed in
//! terms of PluginTensorDesc. The older configurePlugin/supportsFormat
//! overloads are sealed as private final methods.
class IPluginV2IOExt : public IPluginV2Ext
{
public:
    //! Configure the layer.
    //! \param in Descriptors of the input tensors.
    //! \param nbInput Number of entries in \p in.
    //! \param out Descriptors of the output tensors.
    //! \param nbOutput Number of entries in \p out.
    virtual void configurePlugin(
        PluginTensorDesc const* in, int32_t nbInput, PluginTensorDesc const* out, int32_t nbOutput) noexcept
        = 0;

    //! Return true if plugin supports the format and datatype for the
    //! input/output indexed by pos.
    virtual bool supportsFormatCombination(
        int32_t pos, PluginTensorDesc const* inOut, int32_t nbInputs, int32_t nbOutputs) const noexcept
        = 0;

    // @cond SuppressDoxyWarnings
    IPluginV2IOExt() = default;
    ~IPluginV2IOExt() override = default;
// @endcond

protected:
// @cond SuppressDoxyWarnings
    IPluginV2IOExt(IPluginV2IOExt const&) = default;
    IPluginV2IOExt(IPluginV2IOExt&&) = default;
    IPluginV2IOExt& operator=(IPluginV2IOExt const&) & = default;
    IPluginV2IOExt& operator=(IPluginV2IOExt&&) & = default;
// @endcond

    //! Return the API version with which this plugin was built.
    //! PluginVersion::kV2_IOEXT is stored in the upper byte (bits 24-31) and
    //! the low 24 bits of NV_TENSORRT_VERSION in the rest.
    int32_t getTensorRTVersion() const noexcept override
    {
        return static_cast<int32_t>((static_cast<uint32_t>(PluginVersion::kV2_IOEXT) << 24U)
            | (static_cast<uint32_t>(NV_TENSORRT_VERSION) & 0xFFFFFFU));
    }

private:
    // Following are obsolete base class methods, and must not be implemented or used.

    // Sealed no-op replacement for the IPluginV2Ext configurePlugin overload.
    void configurePlugin(Dims const*, int32_t, Dims const*, int32_t, DataType const*, DataType const*, bool const*,
        bool const*, PluginFormat, int32_t) noexcept final
    {
    }

    // Sealed replacement for IPluginV2::supportsFormat; always reports false.
    bool supportsFormat(DataType, PluginFormat) const noexcept final
    {
        return false;
    }
};


//! \brief Type tag for the data referenced by a PluginField.
enum class PluginFieldType : int32_t
{
    //! FP16 field type.
    kFLOAT16 = 0,
    //! FP32 field type.
    kFLOAT32 = 1,
    //! FP64 field type.
    kFLOAT64 = 2,
    //! Presumably the INT8 field type, by analogy with its neighbours - confirm.
    kINT8 = 3,
    //! INT16 field type.
    kINT16 = 4,
    //! Presumably the INT32 field type, by analogy with its neighbours - confirm.
    kINT32 = 5,
    //! char field type.
    kCHAR = 6,
    //! nvinfer1::Dims field type.
    kDIMS = 7,
    //! Unknown field type.
    kUNKNOWN = 8
};


class PluginField

{

public:

    AsciiChar const* name;

    void const* data;

    PluginFieldType type;

    int32_t length;


    PluginField(AsciiChar const* const name_ = nullptr, void const* const data_ = nullptr,

        PluginFieldType const type_ = PluginFieldType::kUNKNOWN, int32_t const length_ = 0) noexcept

        : name(name_)

        , data(data_)

        , type(type_)

        , length(length_)

    {

    }

};


//! \brief Plugin field collection struct.
struct PluginFieldCollection
{
    //! Number of PluginField entries.
    int32_t nbFields;
    //! Pointer to PluginField entries.
    PluginField const* fields;
};


//! \brief Plugin creator class for user implemented layers.
class IPluginCreator
{
public:
    //! Return the version of the API the plugin creator was compiled with.
    //! The default implementation returns NV_TENSORRT_VERSION.
    virtual int32_t getTensorRTVersion() const noexcept
    {
        return NV_TENSORRT_VERSION;
    }

    //! Return the plugin name.
    virtual AsciiChar const* getPluginName() const noexcept = 0;

    //! Return the plugin version string.
    virtual AsciiChar const* getPluginVersion() const noexcept = 0;

    //! Return a PluginFieldCollection describing the creator's fields.
    //! NOTE(review): presumably the fields that must be passed to
    //! createPlugin() - confirm.
    virtual PluginFieldCollection const* getFieldNames() noexcept = 0;

    //! Create a plugin object from a name and a field collection.
    virtual IPluginV2* createPlugin(AsciiChar const* name, PluginFieldCollection const* fc) noexcept = 0;

    //! Create a plugin object from a name and a serialized buffer of
    //! \p serialLength bytes.
    virtual IPluginV2* deserializePlugin(AsciiChar const* name, void const* serialData, size_t serialLength) noexcept
        = 0;

    //! Set the namespace of this plugin creator.
    virtual void setPluginNamespace(AsciiChar const* pluginNamespace) noexcept = 0;

    //! Return the namespace of this plugin creator.
    virtual AsciiChar const* getPluginNamespace() const noexcept = 0;

    IPluginCreator() = default;
    virtual ~IPluginCreator() = default;

protected:
// @cond SuppressDoxyWarnings
    // Copy and move are available to derived classes only.
    IPluginCreator(IPluginCreator const&) = default;
    IPluginCreator(IPluginCreator&&) = default;
    IPluginCreator& operator=(IPluginCreator const&) & = default;
    IPluginCreator& operator=(IPluginCreator&&) & = default;
// @endcond
};


//! \brief Single registration point for all plugins in an application.
//!
//! The class is non-copyable and non-movable, and its destructor is protected,
//! so a registry cannot be deleted through this interface.
class IPluginRegistry
{
public:
    //! Register a plugin creator. Returns false if one with same type is
    //! already registered.
    virtual bool registerCreator(IPluginCreator& creator, AsciiChar const* const pluginNamespace) noexcept = 0;

    //! Return all the registered plugin creators and the number of registered
    //! plugin creators (written through \p numCreators).
    virtual IPluginCreator* const* getPluginCreatorList(int32_t* const numCreators) const noexcept = 0;

    //! Return plugin creator based on plugin name, version, and namespace.
    //! \p pluginNamespace defaults to the empty string.
    virtual IPluginCreator* getPluginCreator(AsciiChar const* const pluginName, AsciiChar const* const pluginVersion,
        AsciiChar const* const pluginNamespace = "") noexcept
        = 0;

    // @cond SuppressDoxyWarnings
    IPluginRegistry() = default;
    IPluginRegistry(IPluginRegistry const&) = delete;
    IPluginRegistry(IPluginRegistry&&) = delete;
    IPluginRegistry& operator=(IPluginRegistry const&) & = delete;
    IPluginRegistry& operator=(IPluginRegistry&&) & = delete;
// @endcond

protected:
    virtual ~IPluginRegistry() noexcept = default;

public:
    // These virtuals are declared after the destructor; keep the declaration
    // order as it is.

    //! Set the error recorder used by this registry.
    virtual void setErrorRecorder(IErrorRecorder* const recorder) noexcept = 0;

    //! Return the error recorder currently assigned to this registry.
    virtual IErrorRecorder* getErrorRecorder() const noexcept = 0;

    //! Deregister a previously registered plugin creator.
    //! NOTE(review): presumably returns true on success - confirm.
    virtual bool deregisterCreator(IPluginCreator const& creator) noexcept = 0;
};


//! \brief Flags passed to IGpuAllocator::allocate().
enum class AllocatorFlag : int32_t
{
    //! TensorRT may call realloc() on this allocation.
    kRESIZABLE = 0,
};


namespace impl

{

template <>

struct EnumMaxImpl<AllocatorFlag>

{

    static constexpr int32_t kVALUE = 1;

};

} // namespace impl


//! Integer type of the flags argument of IGpuAllocator::allocate().
//! NOTE(review): presumably a bitmask built from AllocatorFlag values - confirm.
using AllocatorFlags = uint32_t;


//! \brief Application-implemented class for controlling allocation on the GPU.
class IGpuAllocator
{
public:
    //! Allocate memory.
    //! \param size Requested size.
    //! \param alignment Requested alignment.
    //! \param flags Allocation flags (see AllocatorFlags).
    //! \return Pointer to the allocation.
    //! NOTE(review): units and the failure result (presumably bytes and
    //! nullptr) are not shown in this header - confirm.
    virtual void* allocate(uint64_t const size, uint64_t const alignment, AllocatorFlags const flags) noexcept = 0;

    //! Release \p memory. Marked deprecated, yet still pure virtual, so
    //! implementers must provide it. deallocate() forwards to it by default.
    TRT_DEPRECATED virtual void free(void* const memory) noexcept = 0;

    virtual ~IGpuAllocator() = default;
    IGpuAllocator() = default;

    //! Resize an existing allocation. The default implementation ignores its
    //! arguments and returns nullptr.
    //! Note the parameter order: base address, alignment, then new size.
    virtual void* reallocate(void* /*baseAddr*/, uint64_t /*alignment*/, uint64_t /*newSize*/) noexcept
    {
        return nullptr;
    }

    //! Release \p memory. The default implementation calls free() and then
    //! returns true unconditionally.
    virtual bool deallocate(void* const memory) noexcept
    {
        this->free(memory);
        return true;
    }

protected:
// @cond SuppressDoxyWarnings
    // Copy and move are available to derived classes only.
    IGpuAllocator(IGpuAllocator const&) = default;
    IGpuAllocator(IGpuAllocator&&) = default;
    IGpuAllocator& operator=(IGpuAllocator const&) & = default;
    IGpuAllocator& operator=(IGpuAllocator&&) & = default;
// @endcond
};


//! \brief Application-implemented logging interface for the builder, refitter
//! and runtime.
class ILogger
{
public:
    //! Severity attached to each log message.
    //! The values run from 0 (kINTERNAL_ERROR) to 4 (kVERBOSE).
    enum class Severity : int32_t
    {
        kINTERNAL_ERROR = 0,
        kERROR = 1,
        kWARNING = 2,
        kINFO = 3,
        kVERBOSE = 4,
    };

    //! Receive one log message together with its severity. Implemented by the
    //! application.
    //! \param severity Severity of the message.
    //! \param msg The message text.
    virtual void log(Severity severity, AsciiChar const* msg) noexcept = 0;

    ILogger() = default;
    virtual ~ILogger() = default;

protected:
// @cond SuppressDoxyWarnings
    // Copy and move are available to derived classes only.
    ILogger(ILogger const&) = default;
    ILogger(ILogger&&) = default;
    ILogger& operator=(ILogger const&) & = default;
    ILogger& operator=(ILogger&&) & = default;
// @endcond
};


namespace impl

{

template <>

struct EnumMaxImpl<ILogger::Severity>

{

    static constexpr int32_t kVALUE = 5;

};

} // namespace impl


//! \brief Error codes that can be returned by TensorRT during execution.
//!
//! kSUCCESS is 0; the remaining codes are numbered consecutively up to
//! kUNSUPPORTED_STATE (10).
enum class ErrorCode : int32_t
{
    kSUCCESS = 0,

    kUNSPECIFIED_ERROR = 1,

    kINTERNAL_ERROR = 2,

    kINVALID_ARGUMENT = 3,

    kINVALID_CONFIG = 4,

    kFAILED_ALLOCATION = 5,

    kFAILED_INITIALIZATION = 6,

    kFAILED_EXECUTION = 7,

    kFAILED_COMPUTATION = 8,

    kINVALID_STATE = 9,

    kUNSUPPORTED_STATE = 10,

};


namespace impl

{

template <>

struct EnumMaxImpl<ErrorCode>

{

    static constexpr int32_t kVALUE = 11;

};

} // namespace impl


//! \brief Reference counted application-implemented error reporting interface
//! for TensorRT objects.
class IErrorRecorder
{
public:
    //! Type of an error description: a C string.
    using ErrorDesc = char const*;

    //! NOTE(review): presumably the maximum length of an error description;
    //! whether the terminating NUL is included is not shown here - confirm.
    // coverity[autosar_cpp14_m0_1_4_violation] Approved RFD: https://jirasw.nvidia.com/browse/TID-489
    static constexpr size_t kMAX_DESC_LENGTH{127U};

    //! Type returned by incRefCount() / decRefCount().
    using RefCount = int32_t;

    IErrorRecorder() = default;
    virtual ~IErrorRecorder() noexcept = default;

    // Public API used to retrieve information from the error recorder.

    //! Return the number of errors held by the recorder.
    virtual int32_t getNbErrors() const noexcept = 0;

    //! Return the error code of the error at index \p errorIdx.
    virtual ErrorCode getErrorCode(int32_t errorIdx) const noexcept = 0;

    //! Return the description of the error at index \p errorIdx.
    virtual ErrorDesc getErrorDesc(int32_t errorIdx) const noexcept = 0;

    //! Report whether the recorder has overflowed.
    //! NOTE(review): presumably means errors were dropped - confirm.
    virtual bool hasOverflowed() const noexcept = 0;

    //! Clear the recorder.
    virtual void clear() noexcept = 0;

    // API used by TensorRT to report Error information to the application.

    //! Report an error code and its description to the recorder.
    //! NOTE(review): the meaning of the bool result is not shown here - confirm.
    virtual bool reportError(ErrorCode val, ErrorDesc desc) noexcept = 0;

    //! Increment the reference count and return a RefCount value.
    virtual RefCount incRefCount() noexcept = 0;

    //! Decrement the reference count and return a RefCount value.
    virtual RefCount decRefCount() noexcept = 0;

protected:
    // @cond SuppressDoxyWarnings
    // Copy and move are available to derived classes only.
    IErrorRecorder(IErrorRecorder const&) = default;
    IErrorRecorder(IErrorRecorder&&) = default;
    IErrorRecorder& operator=(IErrorRecorder const&) & = default;
    IErrorRecorder& operator=(IErrorRecorder&&) & = default;
    // @endcond
}; // class IErrorRecorder

} // namespace nvinfer1


//! Return the library version number.
extern "C" TENSORRTAPI int32_t getInferLibVersion() noexcept;


#endif // NV_INFER_RUNTIME_COMMON_H

getInferLibVersion
int32_t getInferLibVersion() noexcept
Return the library version number.

TRT_DEPRECATED
#define TRT_DEPRECATED
Items that are marked as deprecated will be removed in a future release.
Definition: NvInferRuntimeCommon.h:77

NvInferVersion.h

NV_TENSORRT_MINOR
#define NV_TENSORRT_MINOR
TensorRT minor version.
Definition: NvInferVersion.h:60

NV_TENSORRT_MAJOR
#define NV_TENSORRT_MAJOR
TensorRT major version.
Definition: NvInferVersion.h:59

NV_TENSORRT_PATCH
#define NV_TENSORRT_PATCH
TensorRT patch version.
Definition: NvInferVersion.h:61

nvinfer1::Dims32
Definition: NvInferRuntimeCommon.h:190

nvinfer1::Dims32::nbDims
int32_t nbDims
The rank (number of dimensions).
Definition: NvInferRuntimeCommon.h:195

nvinfer1::Dims32::MAX_DIMS
static constexpr int32_t MAX_DIMS
The maximum rank (number of dimensions) supported for a tensor.
Definition: NvInferRuntimeCommon.h:193

nvinfer1::Dims32::d
int32_t d[MAX_DIMS]
The extent of each dimension.
Definition: NvInferRuntimeCommon.h:197

nvinfer1::IErrorRecorder
Reference counted application-implemented error reporting interface for TensorRT objects.
Definition: NvInferRuntimeCommon.h:1693

nvinfer1::IErrorRecorder::ErrorDesc
char const  * ErrorDesc
Definition: NvInferRuntimeCommon.h:1698

nvinfer1::IErrorRecorder::RefCount
int32_t RefCount
Definition: NvInferRuntimeCommon.h:1709

nvinfer1::IGpuAllocator
Application-implemented class for controlling allocation on the GPU.
Definition: NvInferRuntimeCommon.h:1372

nvinfer1::IGpuAllocator::deallocate
virtual bool deallocate(void *const memory) noexcept
Definition: NvInferRuntimeCommon.h:1482

nvinfer1::IGpuAllocator::reallocate
virtual void * reallocate(void *, uint64_t, uint64_t) noexcept
Definition: NvInferRuntimeCommon.h:1457

nvinfer1::IGpuAllocator::~IGpuAllocator
virtual ~IGpuAllocator()=default

nvinfer1::IGpuAllocator::allocate
virtual void * allocate(uint64_t const size, uint64_t const alignment, AllocatorFlags const flags) noexcept=0

nvinfer1::IGpuAllocator::free
virtual TRT_DEPRECATED void free(void *const memory) noexcept=0

nvinfer1::ILogger
Application-implemented logging interface for the builder, refitter and runtime.
Definition: NvInferRuntimeCommon.h:1506

nvinfer1::ILogger::Severity
Severity
Definition: NvInferRuntimeCommon.h:1514

nvinfer1::ILogger::log
virtual void log(Severity severity, AsciiChar const *msg) noexcept=0

nvinfer1::IPluginCreator
Plugin creator class for user implemented layers.
Definition: NvInferRuntimeCommon.h:1108

nvinfer1::IPluginCreator::getTensorRTVersion
virtual int32_t getTensorRTVersion() const noexcept
Return the version of the API the plugin creator was compiled with.
Definition: NvInferRuntimeCommon.h:1117

nvinfer1::IPluginCreator::getPluginName
virtual AsciiChar const * getPluginName() const noexcept=0
Return the plugin name.

nvinfer1::IPluginRegistry
Single registration point for all plugins in an application. It is used to find plugin implementation...
Definition: NvInferRuntimeCommon.h:1244

nvinfer1::IPluginRegistry::registerCreator
virtual bool registerCreator(IPluginCreator &creator, AsciiChar const *const pluginNamespace) noexcept=0
Register a plugin creator. Returns false if one with same type is already registered.

nvinfer1::IPluginRegistry::getPluginCreator
virtual IPluginCreator * getPluginCreator(AsciiChar const *const pluginName, AsciiChar const *const pluginVersion, AsciiChar const *const pluginNamespace="") noexcept=0
Return plugin creator based on plugin name, version, and namespace associated with plugin during netw...

nvinfer1::IPluginRegistry::getPluginCreatorList
virtual IPluginCreator *const * getPluginCreatorList(int32_t *const numCreators) const noexcept=0
Return all the registered plugin creators and the number of registered plugin creators....

nvinfer1::IPluginV2Ext
Plugin class for user-implemented layers.
Definition: NvInferRuntimeCommon.h:714

nvinfer1::IPluginV2Ext::canBroadcastInputAcrossBatch
virtual bool canBroadcastInputAcrossBatch(int32_t inputIndex) const noexcept=0
Return true if plugin can use input that is broadcast across batch without replication.

nvinfer1::IPluginV2Ext::configureWithFormat
void configureWithFormat(Dims const *, int32_t, Dims const *, int32_t, DataType, PluginFormat, int32_t) noexcept override
Derived classes should not implement this. In a C++11 API it would be override final.
Definition: NvInferRuntimeCommon.h:901

nvinfer1::IPluginV2Ext::isOutputBroadcastAcrossBatch
virtual bool isOutputBroadcastAcrossBatch(int32_t outputIndex, bool const *inputIsBroadcasted, int32_t nbInputs) const noexcept=0
Return true if output tensor is broadcast across a batch.

nvinfer1::IPluginV2Ext::clone
IPluginV2Ext * clone() const noexcept override=0
Clone the plugin object. This copies over internal plugin parameters as well and returns a new plugin...

nvinfer1::IPluginV2Ext::configurePlugin
virtual void configurePlugin(Dims const *inputDims, int32_t nbInputs, Dims const *outputDims, int32_t nbOutputs, DataType const *inputTypes, DataType const *outputTypes, bool const *inputIsBroadcast, bool const *outputIsBroadcast, PluginFormat floatFormat, int32_t maxBatchSize) noexcept=0
Configure the layer with input and output data types.

nvinfer1::IPluginV2Ext::detachFromContext
virtual void detachFromContext() noexcept
Detach the plugin object from its execution context.
Definition: NvInferRuntimeCommon.h:857

nvinfer1::IPluginV2Ext::attachToContext
virtual void attachToContext(cudnnContext *, cublasContext *, IGpuAllocator *) noexcept
Attach the plugin object to an execution context and grant the plugin the access to some context reso...
Definition: NvInferRuntimeCommon.h:839

nvinfer1::IPluginV2Ext::getOutputDataType
virtual nvinfer1::DataType getOutputDataType(int32_t index, nvinfer1::DataType const *inputTypes, int32_t nbInputs) const noexcept=0
Return the DataType of the plugin output at the requested index.

nvinfer1::IPluginV2
Plugin class for user-implemented layers.
Definition: NvInferRuntimeCommon.h:411

nvinfer1::IPluginV2::getPluginType
virtual AsciiChar const * getPluginType() const noexcept=0
Return the plugin type. Should match the plugin name returned by the corresponding plugin creator.

nvinfer1::IPluginV2::terminate
virtual void terminate() noexcept=0
Release resources acquired during plugin layer initialization. This is called when the engine is dest...

nvinfer1::IPluginV2::getTensorRTVersion
virtual int32_t getTensorRTVersion() const noexcept
Return the API version with which this plugin was built.
Definition: NvInferRuntimeCommon.h:423

nvinfer1::IPluginV2::setPluginNamespace
virtual void setPluginNamespace(AsciiChar const *pluginNamespace) noexcept=0
Set the namespace that this plugin object belongs to. Ideally, all plugin objects from the same plugi...

nvinfer1::IPluginV2::configureWithFormat
virtual void configureWithFormat(Dims const *inputDims, int32_t nbInputs, Dims const *outputDims, int32_t nbOutputs, DataType type, PluginFormat format, int32_t maxBatchSize) noexcept=0
Configure the layer.

nvinfer1::IPluginV2::serialize
virtual void serialize(void *buffer) const noexcept=0
Serialize the layer.

nvinfer1::IPluginV2::destroy
virtual void destroy() noexcept=0
Destroy the plugin object. This will be called when the network, builder or engine is destroyed.

nvinfer1::IPluginV2::getPluginVersion
virtual AsciiChar const * getPluginVersion() const noexcept=0
Return the plugin version. Should match the plugin version returned by the corresponding plugin creat...

nvinfer1::IPluginV2::getOutputDimensions
virtual Dims getOutputDimensions(int32_t index, Dims const *inputs, int32_t nbInputDims) noexcept=0
Get the dimension of an output tensor.

nvinfer1::IPluginV2::clone
virtual IPluginV2 * clone() const noexcept=0
Clone the plugin object. This copies over internal plugin parameters and returns a new plugin object ...

nvinfer1::IPluginV2::enqueue
virtual int32_t enqueue(int32_t batchSize, void const *const *inputs, void *const *outputs, void *workspace, cudaStream_t stream) noexcept=0
Execute the layer.

nvinfer1::IPluginV2::getSerializationSize
virtual size_t getSerializationSize() const noexcept=0
Find the size of the serialization buffer required.

nvinfer1::IPluginV2::getWorkspaceSize
virtual size_t getWorkspaceSize(int32_t maxBatchSize) const noexcept=0
Find the workspace size required by the layer.

nvinfer1::IPluginV2::getNbOutputs
virtual int32_t getNbOutputs() const noexcept=0
Get the number of outputs from the layer.

nvinfer1::IPluginV2::getPluginNamespace
virtual AsciiChar const * getPluginNamespace() const noexcept=0
Return the namespace of the plugin object.

nvinfer1::IPluginV2::initialize
virtual int32_t initialize() noexcept=0
Initialize the layer for execution. This is called when the engine is created.

nvinfer1::IPluginV2::supportsFormat
virtual bool supportsFormat(DataType type, PluginFormat format) const noexcept=0
Check format support.

nvinfer1::IPluginV2IOExt
Plugin class for user-implemented layers.
Definition: NvInferRuntimeCommon.h:917

nvinfer1::IPluginV2IOExt::getTensorRTVersion
int32_t getTensorRTVersion() const noexcept override
Return the API version with which this plugin was built. The upper byte is reserved by TensorRT and i...
Definition: NvInferRuntimeCommon.h:1005

nvinfer1::IPluginV2IOExt::configurePlugin
virtual void configurePlugin(PluginTensorDesc const *in, int32_t nbInput, PluginTensorDesc const *out, int32_t nbOutput) noexcept=0
Configure the layer.

nvinfer1::IPluginV2IOExt::supportsFormatCombination
virtual bool supportsFormatCombination(int32_t pos, PluginTensorDesc const *inOut, int32_t nbInputs, int32_t nbOutputs) const noexcept=0
Return true if plugin supports the format and datatype for the input/output indexed by pos.

nvinfer1::PluginField
Structure containing plugin attribute field names and associated data. This information can be parsed ...
Definition: NvInferRuntimeCommon.h:1060

nvinfer1::PluginField::name
AsciiChar const  * name
Plugin field attribute name.
Definition: NvInferRuntimeCommon.h:1065

nvinfer1::PluginField::data
void const  * data
Plugin field attribute data.
Definition: NvInferRuntimeCommon.h:1069

nvinfer1::PluginField::length
int32_t length
Number of data entries in the Plugin attribute.
Definition: NvInferRuntimeCommon.h:1078

nvinfer1::PluginField::type
PluginFieldType type
Plugin field attribute type.
Definition: NvInferRuntimeCommon.h:1074

nvinfer1
The TensorRT API version 1 namespace.

nvinfer1::ErrorCode
ErrorCode
Error codes that can be returned by TensorRT during execution.
Definition: NvInferRuntimeCommon.h:1568

nvinfer1::ErrorCode::kUNSUPPORTED_STATE
@ kUNSUPPORTED_STATE

nvinfer1::ErrorCode::kINVALID_STATE
@ kINVALID_STATE

nvinfer1::ErrorCode::kFAILED_INITIALIZATION
@ kFAILED_INITIALIZATION

nvinfer1::ErrorCode::kUNSPECIFIED_ERROR
@ kUNSPECIFIED_ERROR

nvinfer1::ErrorCode::kFAILED_ALLOCATION
@ kFAILED_ALLOCATION

nvinfer1::ErrorCode::kFAILED_COMPUTATION
@ kFAILED_COMPUTATION

nvinfer1::ErrorCode::kINTERNAL_ERROR
@ kINTERNAL_ERROR

nvinfer1::ErrorCode::kFAILED_EXECUTION
@ kFAILED_EXECUTION

nvinfer1::ErrorCode::kSUCCESS
@ kSUCCESS

nvinfer1::ErrorCode::kINVALID_CONFIG
@ kINVALID_CONFIG

nvinfer1::ErrorCode::kINVALID_ARGUMENT
@ kINVALID_ARGUMENT

nvinfer1::PluginFieldType
PluginFieldType
Definition: NvInferRuntimeCommon.h:1031

nvinfer1::PluginFieldType::kUNKNOWN
@ kUNKNOWN
Unknown field type.

nvinfer1::PluginFieldType::kFLOAT32
@ kFLOAT32
FP32 field type.

nvinfer1::PluginFieldType::kCHAR
@ kCHAR
char field type.

nvinfer1::PluginFieldType::kINT16
@ kINT16
INT16 field type.

nvinfer1::PluginFieldType::kDIMS
@ kDIMS
nvinfer1::Dims field type.

nvinfer1::PluginFieldType::kFLOAT64
@ kFLOAT64
FP64 field type.

nvinfer1::PluginFieldType::kFLOAT16
@ kFLOAT16
FP16 field type.

nvinfer1::AsciiChar
char_t AsciiChar
AsciiChar is the type used by TensorRT to represent valid ASCII characters.
Definition: NvInferRuntimeCommon.h:125

nvinfer1::char_t
char char_t
char_t is the type used by TensorRT to represent all valid characters.
Definition: NvInferRuntimeCommon.h:123

nvinfer1::PluginVersion::kV2_DYNAMICEXT
@ kV2_DYNAMICEXT
IPluginV2DynamicExt.

nvinfer1::PluginVersion::kV2
@ kV2
IPluginV2.

nvinfer1::PluginVersion::kV2_IOEXT
@ kV2_IOEXT
IPluginV2IOExt.

nvinfer1::PluginVersion::kV2_EXT
@ kV2_EXT
IPluginV2Ext.

nvinfer1::DataType
DataType
The type of weights and tensors.
Definition: NvInferRuntimeCommon.h:151

nvinfer1::DataType::kFLOAT
@ kFLOAT
32-bit floating point format.

nvinfer1::DataType::kBOOL
@ kBOOL
8-bit boolean. 0 = false, 1 = true, other values undefined.

nvinfer1::DataType::kHALF
@ kHALF
IEEE 16-bit floating-point format.

nvinfer1::DataType::kINT8
@ kINT8
8-bit integer representing a quantized floating-point value.

nvinfer1::DataType::kINT32
@ kINT32
Signed 32-bit integer format.

nvinfer1::PluginFormat
TensorFormat PluginFormat
PluginFormat is reserved for backward compatibility.
Definition: NvInferRuntimeCommon.h:345

nvinfer1::BuilderFlag::kINT8
@ kINT8
Enable Int8 layer selection, with FP32 fallback with FP16 fallback if kFP16 also specified.

nvinfer1::TensorFormat
TensorFormat
Format of the input/output tensors.
Definition: NvInferRuntimeCommon.h:221

nvinfer1::TensorFormat::kCHW4
@ kCHW4

nvinfer1::TensorFormat::kHWC16
@ kHWC16

nvinfer1::TensorFormat::kDHWC8
@ kDHWC8

nvinfer1::TensorFormat::kDLA_LINEAR
@ kDLA_LINEAR

nvinfer1::TensorFormat::kCDHW32
@ kCDHW32

nvinfer1::TensorFormat::kDLA_HWC4
@ kDLA_HWC4

nvinfer1::TensorFormat::kCHW16
@ kCHW16

nvinfer1::TensorFormat::kHWC
@ kHWC

nvinfer1::TensorFormat::kCHW2
@ kCHW2

nvinfer1::TensorFormat::kHWC8
@ kHWC8

nvinfer1::TensorFormat::kLINEAR
@ kLINEAR

nvinfer1::TensorFormat::kCHW32
@ kCHW32

nvinfer1::EnumMax
constexpr int32_t EnumMax() noexcept
Maximum number of elements in an enumeration type.
Definition: NvInferRuntimeCommon.h:141

nvinfer1::AllocatorFlag
AllocatorFlag
Definition: NvInferRuntimeCommon.h:1350

nvinfer1::AllocatorFlag::kRESIZABLE
@ kRESIZABLE
TensorRT may call realloc() on this allocation.

PluginVersion
Definition of plugin versions.

nvinfer1::PluginFieldCollection
Plugin field collection struct.
Definition: NvInferRuntimeCommon.h:1092

nvinfer1::PluginFieldCollection::fields
PluginField const  * fields
Pointer to PluginField entries.
Definition: NvInferRuntimeCommon.h:1096

nvinfer1::PluginFieldCollection::nbFields
int32_t nbFields
Number of PluginField entries.
Definition: NvInferRuntimeCommon.h:1094

nvinfer1::PluginTensorDesc
Fields that a plugin might see for an input or output.
Definition: NvInferRuntimeCommon.h:370

nvinfer1::PluginTensorDesc::type
DataType type
Definition: NvInferRuntimeCommon.h:374

nvinfer1::PluginTensorDesc::dims
Dims dims
Dimensions.
Definition: NvInferRuntimeCommon.h:372

nvinfer1::PluginTensorDesc::format
TensorFormat format
Tensor format.
Definition: NvInferRuntimeCommon.h:376

nvinfer1::PluginTensorDesc::scale
float scale
Scale for INT8 data type.
Definition: NvInferRuntimeCommon.h:378

nvinfer1::impl::EnumMaxImpl
Declaration of EnumMaxImpl struct to store maximum number of elements in an enumeration type.
Definition: NvInferRuntimeCommon.h:136