50 #ifndef NV_INFER_RUNTIME_H 51 #define NV_INFER_RUNTIME_H 64 class IExecutionContext;
119 virtual void* data()
const noexcept = 0;
120 virtual std::size_t size()
const noexcept = 0;
121 virtual DataType type()
const noexcept = 0;
122 virtual void destroy() noexcept = 0;
144 virtual int getNbOutputs()
const TRTNOEXCEPT = 0;
155 virtual Dims getOutputDimensions(
int index,
const Dims* inputs,
int nbInputDims) TRTNOEXCEPT = 0;
173 virtual void configure(
const Dims* inputDims,
int nbInputs,
const Dims* outputDims,
int nbOutputs,
int maxBatchSize) TRTNOEXCEPT = 0;
180 virtual int initialize() TRTNOEXCEPT = 0;
186 virtual void terminate() TRTNOEXCEPT = 0;
196 virtual size_t getWorkspaceSize(
int maxBatchSize)
const TRTNOEXCEPT = 0;
209 virtual int enqueue(
int batchSize,
const void*
const* inputs,
void** outputs,
void* workspace,
cudaStream_t stream) TRTNOEXCEPT = 0;
216 virtual size_t getSerializationSize() TRTNOEXCEPT = 0;
225 virtual void serialize(
void* buffer) TRTNOEXCEPT = 0;
248 return NV_TENSORRT_VERSION;
279 virtual void configureWithFormat(
const Dims* inputDims,
int nbInputs,
const Dims* outputDims,
int nbOutputs,
DataType type,
PluginFormat format,
int maxBatchSize) TRTNOEXCEPT = 0;
333 virtual bool isConstant()
const = 0;
337 virtual int getConstantValue()
const = 0;
456 static constexpr
int kFORMAT_COMBINATION_LIMIT = 100;
489 virtual bool supportsFormatCombination(
int pos,
const PluginTensorDesc* inOut,
int nbInputs,
int nbOutputs) TRTNOEXCEPT = 0;
550 return Dims{-1, {}, {}};
597 const bool* ,
const bool* ,
PluginFormat ,
int ) _TENSORRT_FINAL TRTNOEXCEPT {}
644 virtual void reportLayerTime(
const char* layerName,
float ms) TRTNOEXCEPT = 0;
713 virtual void setDLACore(
int dlaCore) noexcept = 0;
719 virtual int getDLACore()
const noexcept = 0;
724 virtual int getNbDLACores()
const noexcept = 0;
729 virtual void destroy() noexcept = 0;
743 virtual void setGpuAllocator(
IGpuAllocator* allocator) noexcept = 0;
757 virtual void setErrorRecorder(
IErrorRecorder* recorder) noexcept = 0;
781 return deserializeCudaEngine(blob, size,
nullptr);
805 virtual bool setWeights(
const char* layerName,
WeightsRole role,
Weights weights) TRTNOEXCEPT = 0;
812 virtual bool refitCudaEngine() TRTNOEXCEPT = 0;
830 virtual int getMissing(
int size,
const char** layerNames,
WeightsRole* roles) TRTNOEXCEPT = 0;
844 virtual int getAll(
int size,
const char** layerNames,
WeightsRole* roles) TRTNOEXCEPT = 0;
846 virtual void destroy() TRTNOEXCEPT = 0;
864 virtual bool setDynamicRange(
const char* tensorName,
float min,
float max) TRTNOEXCEPT = 0;
873 virtual float getDynamicRangeMin(
const char* tensorName)
const TRTNOEXCEPT = 0;
882 virtual float getDynamicRangeMax(
const char* tensorName)
const TRTNOEXCEPT = 0;
895 virtual int getTensorsWithDynamicRange(
int size,
const char** tensorNames)
const TRTNOEXCEPT = 0;
909 virtual void setErrorRecorder(
IErrorRecorder* recorder) TRTNOEXCEPT = 0;
947 virtual IPlugin* createPlugin(
const char* layerName,
const void* serialData,
size_t serialLength) TRTNOEXCEPT = 0;
1053 virtual bool setShapeValues(
1054 const char* inputName,
OptProfileSelector select,
const int32_t* values,
int nbValues) noexcept = 0;
1062 virtual int getNbShapeValues(
const char* inputName)
const noexcept = 0;
1069 virtual const int32_t* getShapeValues(
const char* inputName,
OptProfileSelector select)
const noexcept = 0;
1084 virtual bool setExtraMemoryTarget(
float target) noexcept = 0;
1089 virtual float getExtraMemoryTarget()
const noexcept = 0;
1102 virtual bool isValid()
const noexcept = 0;
1126 virtual int getNbBindings()
const noexcept = 0;
1141 virtual int getBindingIndex(
const char* name)
const noexcept = 0;
1153 virtual const char* getBindingName(
int bindingIndex)
const noexcept = 0;
1163 virtual bool bindingIsInput(
int bindingIndex)
const noexcept = 0;
1174 virtual Dims getBindingDimensions(
int bindingIndex)
const noexcept = 0;
1184 virtual DataType getBindingDataType(
int bindingIndex)
const noexcept = 0;
1193 virtual int getMaxBatchSize()
const noexcept = 0;
1203 virtual int getNbLayers()
const noexcept = 0;
1212 virtual std::size_t getWorkspaceSize()
const noexcept = 0;
1223 virtual IHostMemory* serialize()
const noexcept = 0;
1235 virtual void destroy() noexcept = 0;
1247 virtual TensorLocation getLocation(
int bindingIndex)
const noexcept = 0;
1259 virtual IExecutionContext* createExecutionContextWithoutDeviceMemory() noexcept = 0;
1266 virtual size_t getDeviceMemorySize()
const noexcept = 0;
1273 virtual bool isRefittable()
const noexcept = 0;
1284 virtual int getBindingBytesPerComponent(
int bindingIndex)
const noexcept = 0;
1295 virtual int getBindingComponentsPerElement(
int bindingIndex)
const noexcept = 0;
1302 virtual TensorFormat getBindingFormat(
int bindingIndex)
const noexcept = 0;
1318 virtual const char* getBindingFormatDesc(
int bindingIndex)
const noexcept = 0;
1327 virtual int getBindingVectorizedDim(
int bindingIndex)
const noexcept = 0;
1339 virtual const char* getName()
const noexcept = 0;
1347 virtual int getNbOptimizationProfiles()
const noexcept = 0;
1359 virtual Dims getProfileDimensions(
int bindingIndex,
int profileIndex,
OptProfileSelector select)
const noexcept = 0;
1376 virtual const int32_t* getProfileShapeValues(
int profileIndex,
int inputIndex,
OptProfileSelector select)
const noexcept = 0; 1411 virtual bool isShapeBinding(
int bindingIndex)
const noexcept = 0;
1422 virtual bool isExecutionBinding(
int bindingIndex)
const noexcept = 0;
1446 virtual void setErrorRecorder(
IErrorRecorder* recorder) noexcept = 0;
1474 virtual bool hasImplicitBatchDimension()
const TRTNOEXCEPT = 0;
1501 virtual bool execute(
int batchSize,
void** bindings) noexcept = 0;
1516 virtual bool enqueue(
int batchSize,
void** bindings,
cudaStream_t stream,
cudaEvent_t* inputConsumed) noexcept = 0;
1525 virtual void setDebugSync(
bool sync) noexcept = 0;
1532 virtual bool getDebugSync()
const noexcept = 0;
1539 virtual void setProfiler(
IProfiler*) noexcept = 0;
1546 virtual IProfiler* getProfiler()
const noexcept = 0;
1553 virtual const ICudaEngine& getEngine()
const noexcept = 0;
1558 virtual void destroy() noexcept = 0;
1571 virtual void setName(
const char* name) noexcept = 0;
1578 virtual const char* getName()
const noexcept = 0;
1591 virtual void setDeviceMemory(
void* memory) noexcept = 0;
1601 virtual Dims getStrides(
int bindingIndex)
const noexcept = 0;
1629 virtual bool setOptimizationProfile(
int profileIndex) noexcept = 0;
1638 virtual int getOptimizationProfile()
const noexcept = 0;
1658 virtual bool setBindingDimensions(
int bindingIndex,
Dims dimensions) noexcept = 0;
1680 virtual Dims getBindingDimensions(
int bindingIndex)
const noexcept = 0;
1697 virtual bool setInputShapeBinding(
int bindingIndex,
const int32_t* data) noexcept = 0;
1715 virtual bool getShapeBinding(
int bindingIndex, int32_t* data)
const noexcept = 0;
1727 virtual bool allInputDimensionsSpecified()
const noexcept = 0;
1738 virtual bool allInputShapesSpecified()
const noexcept = 0;
1752 virtual void setErrorRecorder(
IErrorRecorder* recorder) noexcept = 0;
1778 virtual bool executeV2(
void** bindings) noexcept = 0;
1802 extern "C" TENSORRTAPI
void* createInferRuntime_INTERNAL(
void* logger,
int version);
1808 extern "C" TENSORRTAPI
void* createInferRefitter_INTERNAL(
void* engine,
void* logger,
int version);
1821 return static_cast<IRuntime*
>(createInferRuntime_INTERNAL(&logger, NV_TENSORRT_VERSION));
1831 return static_cast<IRefitter*
>(createInferRefitter_INTERNAL(&engine, &logger, NV_TENSORRT_VERSION));
1836 #endif // NV_INFER_RUNTIME_H
An engine for executing inference on a built network, with functionally unsafe features.
Definition: NvInferRuntime.h:1115
Subtract the second element from the first.
DataType
The type of weights and tensors.
Definition: NvInferRuntimeCommon.h:162
IRuntime * createInferRuntime(ILogger &logger)
Create an instance of an IRuntime class.
Definition: NvInferRuntime.h:1819
Check if an element in the first tensor is less than the corresponding element in the second tensor.
Check if two elements are equal.
PluginTensorDesc desc
Information required to interpret a pointer to tensor data, except that desc.dims has -1 in place of ...
Definition: NvInferRuntime.h:394
Safety restricted capability, TensorRT flow that can only run on GPU devices.
constexpr int EnumMax< WeightsRole >()
Maximum number of elements in WeightsRole enum.
Definition: NvInferRuntime.h:665
OptProfileSelector
When setting or querying optimization profile parameters (such as shape tensor inputs or dynamic dime...
Definition: NvInferRuntime.h:962
struct CUstream_st * cudaStream_t
Forward declaration of cudaStream_t.
Definition: NvInferRuntimeCommon.h:112
TRT_DEPRECATED bool canBroadcastInputAcrossBatch(int) const _TENSORRT_FINAL
Derived classes should not implement this. In a C++11 API it would be override final.
Definition: NvInferRuntime.h:570
const void * values
The weight values, in a contiguous array.
Definition: NvInferRuntime.h:102
void configure(const Dims *, int, const Dims *, int, int) _TENSORRT_FINAL
Derived classes should not implement this. In a C++11 API it would be override final.
Definition: NvInferRuntime.h:287
Definition: NvInferRuntime.h:422
Allows a serialized functionally unsafe engine to be deserialized.
Definition: NvInferRuntime.h:694
Plugin class for user-implemented layers.
Definition: NvInferRuntime.h:134
static const int MAX_DIMS
The maximum number of dimensions supported for a tensor.
Definition: NvInferRuntimeCommon.h:209
TRT_DEPRECATED bool isOutputBroadcastAcrossBatch(int, const bool *, int) const _TENSORRT_FINAL
Derived classes should not implement this. In a C++11 API it would be override final.
Definition: NvInferRuntime.h:559
bias for IConvolutionLayer, IDeconvolutionLayer, or IFullyConnectedLayer
Fail with error when the coordinates are out of bounds. This is the default.
TensorLocation
The location for tensor data storage, device or host.
Definition: NvInferRuntimeCommon.h:926
shift part of IScaleLayer
DataType type
The type of the weights.
Definition: NvInferRuntime.h:101
The TensorRT API version 1 namespace.
Plugin factory for deserialization.
Definition: NvInferRuntime.h:930
nvinfer1::ICudaEngine * deserializeCudaEngine(const void *blob, std::size_t size) noexcept
Deserialize an engine from a stream when plugin factory is not used.
Definition: NvInferRuntime.h:779
This is used to set or get the value that is used in the optimization (kernel selection).
Product of the two elements.
Optimization profile for dynamic input dimensions and shape tensors.
Definition: NvInferRuntime.h:997
TRT_DEPRECATED Dims getOutputDimensions(int, const Dims *, int) _TENSORRT_FINAL
Derived classes should not implement this. In a C++11 API it would be override final.
Definition: NvInferRuntime.h:548
int getTensorRTVersion() const _TENSORRT_OVERRIDE
Return the API version with which this plugin was built.
Definition: NvInferRuntime.h:532
int nbDims
The number of dimensions.
Definition: NvInferRuntime.h:382
constexpr int EnumMax< DimensionOperation >()
Maximum number of elements in DimensionOperation enum.
Definition: NvInferRuntime.h:314
Reference counted application-implemented error reporting interface for TensorRT objects.
Definition: NvInferRuntimeCommon.h:1142
TRT_DEPRECATED int enqueue(int, const void *const *, void **, void *, cudaStream_t) _TENSORRT_FINAL
Derived classes should not implement this. In a C++11 API it would be override final.
Definition: NvInferRuntime.h:619
Structure to define the dimensions of a tensor.
Definition: NvInferRuntimeCommon.h:206
constexpr int EnumMax< DeviceType >()
Maximum number of elements in DeviceType enum.
Definition: NvInferRuntime.h:681
Minimum of the two elements.
int64_t count
The number of weights in the array.
Definition: NvInferRuntime.h:103
Definition: NvInferRuntime.h:360
kernel for IConvolutionLayer, IDeconvolutionLayer, or IFullyConnectedLayer
An array of weights used as a layer parameter.
Definition: NvInferRuntime.h:98
IRefitter * createInferRefitter(ICudaEngine &engine, ILogger &logger)
Create an instance of an IRefitter class.
Definition: NvInferRuntime.h:1829
TensorFormat
Format of the input/output tensors.
Definition: NvInferRuntimeCommon.h:236
Application-implemented logging interface for the builder, engine and runtime.
Definition: NvInferRuntimeCommon.h:986
constexpr int EnumMax< EngineCapability >()
Maximum number of elements in EngineCapability enum.
Definition: NvInferRuntime.h:84
Plugin class for user-implemented layers.
Definition: NvInferRuntime.h:238
Floor division of the first element by the second.
Fields that a plugin might see for an input or output.
Definition: NvInferRuntimeCommon.h:311
EngineCapability
Forward declaration of IPluginFactory for use by other interfaces.
Definition: NvInferRuntime.h:76
Safety restricted capability, TensorRT flow that can only run on DLA devices.
Definition: NvInferRuntime.h:329
Definition: NvInferRuntime.h:391
Class to handle library allocated memory that is accessible to the user.
Definition: NvInferRuntime.h:116
constexpr int EnumMax< OptProfileSelector >()
Number of different values of OptProfileSelector enum.
Definition: NvInferRuntime.h:970
Dims max
Upper bounds on tensor's dimensions.
Definition: NvInferRuntime.h:400
DimensionOperation
An operation on two IDimensionExpr, which represent integer expressions used in dimension computation...
Definition: NvInferRuntime.h:300
virtual int getTensorRTVersion() const
Return the API version with which this plugin was built.
Definition: NvInferRuntime.h:246
#define _TENSORRT_OVERRIDE
Items that are marked as deprecated will be removed in a future release.
Definition: NvInferRuntimeCommon.h:62
Application-implemented class for controlling allocation on the GPU.
Definition: NvInferRuntimeCommon.h:943
Context for executing inference using an engine, with functionally unsafe features.
Definition: NvInferRuntime.h:1487
Updates weights in an engine.
Definition: NvInferRuntime.h:792
Dims min
Lower bounds on tensor's dimensions.
Definition: NvInferRuntime.h:397
DeviceType
The device that this layer/network will execute on.
Definition: NvInferRuntime.h:675
TRT_DEPRECATED size_t getWorkspaceSize(int) const _TENSORRT_FINAL
Derived classes should not implement this. In a C++11 API it would be override final.
Definition: NvInferRuntime.h:609
Definition: NvInferRuntime.h:379
Application-implemented interface for profiling.
Definition: NvInferRuntime.h:635
Plugin class for user-implemented layers.
Definition: NvInferRuntimeCommon.h:514
WeightsRole
How a layer uses particular Weights.
Definition: NvInferRuntime.h:655
TRT_DEPRECATED bool supportsFormat(DataType, PluginFormat) const _TENSORRT_FINAL
Derived classes should not implement this. In a C++11 API it would be override final.
Definition: NvInferRuntime.h:584
struct CUevent_st * cudaEvent_t
Forward declaration of cudaEvent_t.
Definition: NvInferRuntimeCommon.h:113
TRT_DEPRECATED void configurePlugin(const Dims *, int, const Dims *, int, const DataType *, const DataType *, const bool *, const bool *, PluginFormat, int) _TENSORRT_FINAL
Derived classes should not implement this. In a C++11 API it would be override final.
Definition: NvInferRuntime.h:595