TensorRT
 All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Macros Pages
NvInfer.h
Go to the documentation of this file.
1 /*
2  * Copyright 1993-2018 NVIDIA Corporation. All rights reserved.
3  *
4  * NOTICE TO LICENSEE:
5  *
6  * This source code and/or documentation ("Licensed Deliverables") are
7  * subject to NVIDIA intellectual property rights under U.S. and
8  * international Copyright laws.
9  *
10  * These Licensed Deliverables contained herein is PROPRIETARY and
11  * CONFIDENTIAL to NVIDIA and is being provided under the terms and
12  * conditions of a form of NVIDIA software license agreement by and
13  * between NVIDIA and Licensee ("License Agreement") or electronically
14  * accepted by Licensee. Notwithstanding any terms or conditions to
15  * the contrary in the License Agreement, reproduction or disclosure
16  * of the Licensed Deliverables to any third party without the express
17  * written consent of NVIDIA is prohibited.
18  *
19  * NOTWITHSTANDING ANY TERMS OR CONDITIONS TO THE CONTRARY IN THE
20  * LICENSE AGREEMENT, NVIDIA MAKES NO REPRESENTATION ABOUT THE
21  * SUITABILITY OF THESE LICENSED DELIVERABLES FOR ANY PURPOSE. IT IS
22  * PROVIDED "AS IS" WITHOUT EXPRESS OR IMPLIED WARRANTY OF ANY KIND.
23  * NVIDIA DISCLAIMS ALL WARRANTIES WITH REGARD TO THESE LICENSED
24  * DELIVERABLES, INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY,
25  * NONINFRINGEMENT, AND FITNESS FOR A PARTICULAR PURPOSE.
26  * NOTWITHSTANDING ANY TERMS OR CONDITIONS TO THE CONTRARY IN THE
27  * LICENSE AGREEMENT, IN NO EVENT SHALL NVIDIA BE LIABLE FOR ANY
28  * SPECIAL, INDIRECT, INCIDENTAL, OR CONSEQUENTIAL DAMAGES, OR ANY
29  * DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS,
30  * WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS
31  * ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE
32  * OF THESE LICENSED DELIVERABLES.
33  *
34  * U.S. Government End Users. These Licensed Deliverables are a
35  * "commercial item" as that term is defined at 48 C.F.R. 2.101 (OCT
36  * 1995), consisting of "commercial computer software" and "commercial
37  * computer software documentation" as such terms are used in 48
38  * C.F.R. 12.212 (SEPT 1995) and is provided to the U.S. Government
39  * only as a commercial end item. Consistent with 48 C.F.R.12.212 and
40  * 48 C.F.R. 227.7202-1 through 227.7202-4 (JUNE 1995), all
41  * U.S. Government End Users acquire the Licensed Deliverables with
42  * only those rights set forth herein.
43  *
44  * Any use of the Licensed Deliverables in individual and commercial
45  * software must include, in the user documentation and internal
46  * comments to the code, the above Disclaimer and U.S. Government End
47  * Users Notice.
48  */
49 
50 #ifndef NV_INFER_H
51 #define NV_INFER_H
52 
53 #include <cstddef>
54 #include <cstdint>
55 
56 #define NV_TENSORRT_MAJOR 5
57 #define NV_TENSORRT_MINOR 0
58 #define NV_TENSORRT_PATCH 0
59 #define NV_TENSORRT_BUILD 10
60 
61 #define NV_TENSORRT_SONAME_MAJOR 5
62 #define NV_TENSORRT_SONAME_MINOR 0
63 #define NV_TENSORRT_SONAME_PATCH 0
64 
65 #if __cplusplus > 201103L
66 #define _TENSORRT_FINAL final
67 #else
68 #define _TENSORRT_FINAL
69 #endif
70 
72 #ifdef TENSORRT_BUILD_LIB
73 #define TENSORRTAPI __attribute__((visibility("default")))
74 #else
75 #define TENSORRTAPI
76 #endif
77 
86 
92 
93 // forward declare some CUDA types to avoid an include dependency
94 
95 struct cublasContext;
96 struct cudnnContext;
97 
98 typedef struct CUstream_st* cudaStream_t;
99 typedef struct CUevent_st* cudaEvent_t;
100 
101 static const int NV_TENSORRT_VERSION = (NV_TENSORRT_MAJOR * 1000) + (NV_TENSORRT_MINOR * 100) + NV_TENSORRT_PATCH; // major, minor, patch
102 
//!
//! \namespace nvinfer1
//! \brief The TensorRT API namespace.
//!
108 namespace nvinfer1
109 {
110 
//! \brief Maximum number of elements in an enumeration type.
//! Specialized for each enum class later in this header.
111 template <typename T>
112 inline int EnumMax();
113 
//!
//! \enum DataType
//! \brief The type of weights and tensors.
//!
enum class DataType : int
{
    kFLOAT = 0, //!< 32-bit floating point
    kHALF = 1,  //!< 16-bit floating point
    kINT8 = 2,  //!< 8-bit integer (quantized)
    kINT32 = 3  //!< 32-bit signed integer
};

// Primary template is declared earlier in this header; restated here so the
// specialization below is self-contained.
template <typename T>
inline int EnumMax();

//! \brief Maximum number of elements in the DataType enum. \see DataType
template <>
inline int EnumMax<DataType>()
{
    return 4;
}
131 
//!
//! \enum DeviceType
//! \brief Device types that TensorRT can target.
//!
enum class DeviceType : int
{
    kGPU,         //!< GPU device
    kDLA,         //!< DLA core
    kDLA0 = kDLA, //!< DLA core 0 (alias of kDLA)
    kDLA1         //!< DLA core 1
};

// Primary template is declared earlier in this header; restated here so the
// specialization below is self-contained.
template <typename T>
inline int EnumMax();

//! \brief Maximum number of distinct elements in the DeviceType enum.
// NOTE(review): the specialization's signature line (source 145) was dropped
// by this extraction; reconstructed from the `template <>` / body that remain.
template <>
inline int EnumMax<DeviceType>()
{
    return 3;
}
149 
//!
//! \enum DimensionType
//! \brief The type of data stored along a tensor dimension.
//!
enum class DimensionType : int
{
    kSPATIAL = 0,  //!< Spatial dimension
    kCHANNEL = 1,  //!< Channel dimension
    kINDEX = 2,    //!< Index dimension (e.g. batch)
    kSEQUENCE = 3  //!< Sequence dimension
};

// Primary template is declared earlier in this header; restated here so the
// specialization below is self-contained.
template <typename T>
inline int EnumMax();

//! \brief Maximum number of elements in the DimensionType enum.
// NOTE(review): the specialization's signature line (source 163) was dropped
// by this extraction; reconstructed from the `template <>` / body that remain.
template <>
inline int EnumMax<DimensionType>()
{
    return 4;
}
167 
//!
//! \class Dims
//! \brief Base class for tensor dimension descriptors; holds up to
//! MAX_DIMS extents, of which nbDims are in use.
//!
176 class Dims
177 {
178 public:
//! Maximum number of dimensions supported.
179  static const int MAX_DIMS = 8;
//! Number of dimensions currently in use.
180  int nbDims;
//! Extent of each dimension.
181  int d[MAX_DIMS];
// NOTE(review): source line 182 was dropped by this extraction; the shipped
// NvInfer.h also declares a per-dimension type array here
// (DimensionType type[MAX_DIMS]) — confirm against the original header.
183 };
184 
189 class Dims2 : public Dims
190 {
191 public:
196  {
197  nbDims = 2;
198  d[0] = d[1] = 0;
199  }
200 
207  Dims2(int d0, int d1)
208  {
209  nbDims = 2;
210  d[0] = d0;
211  d[1] = d1;
212  }
213 };
214 
219 class DimsHW : public Dims2
220 {
221 public:
226  : Dims2()
227  {
229  }
230 
237  DimsHW(int height, int width)
238  : Dims2(height, width)
239  {
241  }
242 
248  int& h() { return d[0]; }
249 
255  int h() const { return d[0]; }
256 
262  int& w() { return d[1]; }
263 
269  int w() const { return d[1]; }
270 };
271 
276 class Dims3 : public Dims
277 {
278 public:
283  {
284  nbDims = 3;
285  d[0] = d[1] = d[2] = 0;
286  }
287 
295  Dims3(int d0, int d1, int d2)
296  {
297  nbDims = 3;
298  d[0] = d0;
299  d[1] = d1;
300  d[2] = d2;
301  }
302 };
303 
308 class DimsCHW : public Dims3
309 {
310 public:
315  : Dims3()
316  {
319  }
320 
328  DimsCHW(int channels, int height, int width)
329  : Dims3(channels, height, width)
330  {
333  }
334 
340  int& c() { return d[0]; }
341 
347  int c() const { return d[0]; }
348 
354  int& h() { return d[1]; }
355 
361  int h() const { return d[1]; }
362 
368  int& w() { return d[2]; }
369 
375  int w() const { return d[2]; }
376 };
377 
382 class Dims4 : public Dims
383 {
384 public:
389  {
390  nbDims = 4;
391  d[0] = d[1] = d[2] = d[3] = 0;
392  }
393 
402  Dims4(int d0, int d1, int d2, int d3)
403  {
404  nbDims = 4;
405  d[0] = d0;
406  d[1] = d1;
407  d[2] = d2;
408  d[3] = d3;
409  }
410 };
411 
416 class DimsNCHW : public Dims4
417 {
418 public:
423  : Dims4()
424  {
428  }
429 
438  DimsNCHW(int batchSize, int channels, int height, int width)
439  : Dims4(batchSize, channels, height, width)
440  {
444  }
445 
451  int& n() { return d[0]; }
452 
458  int n() const { return d[0]; }
459 
465  int& c() { return d[1]; }
466 
472  int c() const { return d[1]; }
473 
479  int& h() { return d[2]; }
480 
486  int h() const { return d[2]; }
487 
493  int& w() { return d[3]; }
494 
500  int w() const { return d[3]; }
501 };
502 
//!
//! \class Weights
//! \brief An array of constant values used by a layer; the memory is not
//! owned by this class.
//!
511 class Weights
512 {
513 public:
// NOTE(review): source line 514 was dropped by this extraction; the shipped
// NvInfer.h declares `DataType type;` here — confirm against the original
// header before relying on this struct's layout.
//! Pointer to the values (not owned).
515  const void* values;
//! Number of values in the array.
516  int64_t count;
517 };
518 
528 {
529 public:
530  virtual void* data() const = 0;
531  virtual std::size_t size() const = 0;
532  virtual DataType type() const = 0;
533  virtual void destroy() = 0;
534 protected:
535  virtual ~IHostMemory() {}
536 };
537 
//!
//! \enum LayerType
//! \brief The kinds of layer that a network definition may contain.
//!
enum class LayerType : int
{
    kCONVOLUTION = 0,      //!< Convolution layer
    kFULLY_CONNECTED = 1,  //!< Fully connected layer
    kACTIVATION = 2,       //!< Activation layer
    kPOOLING = 3,          //!< Pooling layer
    kLRN = 4,              //!< LRN layer
    kSCALE = 5,            //!< Scale layer
    kSOFTMAX = 6,          //!< SoftMax layer
    kDECONVOLUTION = 7,    //!< Deconvolution layer
    kCONCATENATION = 8,    //!< Concatenation layer
    kELEMENTWISE = 9,      //!< Elementwise layer
    kPLUGIN = 10,          //!< Plugin layer
    kRNN = 11,             //!< RNN layer
    kUNARY = 12,           //!< Unary layer
    kPADDING = 13,         //!< Padding layer
    kSHUFFLE = 14,         //!< Shuffle layer
    kREDUCE = 15,          //!< Reduce layer
    kTOPK = 16,            //!< TopK layer
    kGATHER = 17,          //!< Gather layer
    kMATRIX_MULTIPLY = 18, //!< Matrix-multiply layer
    kRAGGED_SOFTMAX = 19,  //!< Ragged SoftMax layer
    kCONSTANT = 20,        //!< Constant layer
    kRNN_V2 = 21,          //!< RNNv2 layer
    kIDENTITY = 22         //!< Identity layer
};

// Primary template is declared earlier in this header; restated here so the
// specialization below is self-contained.
template <typename T>
inline int EnumMax();

//! \brief Maximum number of elements in the LayerType enum.
//! BUGFIX: the enum has 23 enumerators (0 through 22 inclusive) but this
//! previously returned 22, unlike every other EnumMax specialization in this
//! header, which returns the enumerator count. Arrays sized with
//! EnumMax<LayerType>() would be one element short.
template <>
inline int EnumMax<LayerType>()
{
    return 23;
}
577 
//!
//! \enum TensorLocation
//! \brief Where a tensor's data is stored.
//!
enum class TensorLocation : int
{
    kDEVICE = 0, //!< Data is on the device
    kHOST = 1    //!< Data is on the host
};

// Primary template is declared earlier in this header; restated here so the
// specialization below is self-contained.
template <typename T>
inline int EnumMax();

//! \brief Maximum number of elements in the TensorLocation enum.
// NOTE(review): the specialization's signature line (source 589) was dropped
// by this extraction; reconstructed from the `template <>` / body that remain.
template <>
inline int EnumMax<TensorLocation>()
{
    return 2;
}
593 
601 class ITensor
602 {
603 public:
616  virtual void setName(const char* name) = 0;
617 
625  virtual const char* getName() const = 0;
626 
641  virtual void setDimensions(Dims dimensions) = 0; // only valid for input tensors
642 
650  virtual Dims getDimensions() const = 0;
651 
665  virtual void setType(DataType type) = 0;
666 
674  virtual DataType getType() const = 0;
675 
684  virtual bool setDynamicRange(float min, float max) = 0;
685 
689  virtual bool isNetworkInput() const = 0;
690 
694  virtual bool isNetworkOutput() const = 0;
695 
696 protected:
697  virtual ~ITensor() {}
698 
699 public:
714  virtual void setBroadcastAcrossBatch(bool broadcastAcrossBatch) = 0;
715 
726  virtual bool getBroadcastAcrossBatch() const = 0;
727 
733  virtual TensorLocation getLocation() const = 0;
734 
745  virtual void setLocation(TensorLocation location) = 0;
746 };
747 
753 class ILayer
754 {
755 public:
761  virtual LayerType getType() const = 0;
762 
770  virtual void setName(const char* name) = 0;
771 
775 
778  virtual const char* getName() const = 0;
779 
783  virtual int getNbInputs() const = 0;
784 
792  virtual ITensor* getInput(int index) const = 0;
793 
797  virtual int getNbOutputs() const = 0;
798 
804  virtual ITensor* getOutput(int index) const = 0;
805 
815  virtual void setInput(int index, ITensor& tensor) = 0;
816 
817 
827 
828  virtual void setPrecision(DataType dataType) = 0;
829 
836 
837  virtual DataType getPrecision() const = 0;
838 
845 
846  virtual bool precisionIsSet() const = 0;
847 
852 
853  virtual void resetPrecision() = 0;
854 
865 
866  virtual void setOutputType(int index, DataType dataType) = 0;
867 
875 
876  virtual DataType getOutputType(int index) const = 0;
877 
885 
886  virtual bool outputTypeIsSet(int index) const = 0;
887 
894 
895  virtual void resetOutputType(int index) = 0;
896 
897 protected:
898  virtual ~ILayer() {}
899 };
900 
912 class IConvolutionLayer : public ILayer
913 {
914 public:
922  virtual void setKernelSize(DimsHW kernelSize) = 0;
923 
929  virtual DimsHW getKernelSize() const = 0;
930 
938  virtual void setNbOutputMaps(int nbOutputMaps) = 0;
939 
945  virtual int getNbOutputMaps() const = 0;
946 
956  virtual void setStride(DimsHW stride) = 0;
957 
961  virtual DimsHW getStride() const = 0;
962 
974  virtual void setPadding(DimsHW padding) = 0;
975 
981  virtual DimsHW getPadding() const = 0; // padding defaults to 0
982 
995  virtual void setNbGroups(int nbGroups) = 0;
996 
1002  virtual int getNbGroups() const = 0;
1003 
1012  virtual void setKernelWeights(Weights weights) = 0;
1013 
1019  virtual Weights getKernelWeights() const = 0;
1020 
1030  virtual void setBiasWeights(Weights weights) = 0;
1031 
1037  virtual Weights getBiasWeights() const = 0;
1038 
1046  virtual void setDilation(DimsHW dims) = 0;
1047 
1053  virtual DimsHW getDilation() const = 0;
1054 
1055 protected:
1056  virtual ~IConvolutionLayer() {}
1057 };
1058 
1086 {
1087 public:
1095  virtual void setNbOutputChannels(int nbOutputs) = 0;
1096 
1102  virtual int getNbOutputChannels() const = 0;
1103 
1109  virtual void setKernelWeights(Weights weights) = 0;
1110 
1116  virtual Weights getKernelWeights() const = 0;
1117 
1125  virtual void setBiasWeights(Weights weights) = 0;
1126 
1132  virtual Weights getBiasWeights() const = 0;
1133 
1134 protected:
1135  virtual ~IFullyConnectedLayer() {}
1136 };
1137 
//!
//! \enum ActivationType
//! \brief Activation functions an IActivationLayer can apply.
//!
enum class ActivationType : int
{
    kRELU = 0,    //!< Rectified linear activation
    kSIGMOID = 1, //!< Sigmoid activation
    kTANH = 2     //!< Hyperbolic tangent activation
};

// Primary template is declared earlier in this header; restated here so the
// specialization below is self-contained.
template <typename T>
inline int EnumMax();

//! \brief Maximum number of elements in the ActivationType enum.
// NOTE(review): the specialization's signature line (source 1151) was dropped
// by this extraction; reconstructed from the `template <>` / body that remain.
template <>
inline int EnumMax<ActivationType>()
{
    return 3;
}
1155 
1165 class IActivationLayer : public ILayer
1166 {
1167 public:
1173  virtual void setActivationType(ActivationType type) = 0;
1174 
1180  virtual ActivationType getActivationType() const = 0;
1181 
1182 protected:
1183  virtual ~IActivationLayer() {}
1184 };
1185 
//!
//! \enum PoolingType
//! \brief Pooling functions an IPoolingLayer can apply.
//!
enum class PoolingType : int
{
    kMAX = 0,              //!< Maximum over elements
    kAVERAGE = 1,          //!< Average over elements. If the tensor is padded, the count includes the padding
    kMAX_AVERAGE_BLEND = 2 //!< Blending between max and average pooling: (1-blendFactor)*maxPool + blendFactor*avgPool
};

// Primary template is declared earlier in this header; restated here so the
// specialization below is self-contained.
template <typename T>
inline int EnumMax();

//! \brief Maximum number of elements in the PoolingType enum.
// NOTE(review): the specialization's signature line (source 1199) was dropped
// by this extraction; reconstructed from the `template <>` / body that remain.
template <>
inline int EnumMax<PoolingType>()
{
    return 3;
}
1203 
1212 class IPoolingLayer : public ILayer
1213 {
1214 public:
1222  virtual void setPoolingType(PoolingType type) = 0;
1223 
1229  virtual PoolingType getPoolingType() const = 0;
1230 
1238  virtual void setWindowSize(DimsHW windowSize) = 0;
1239 
1245  virtual DimsHW getWindowSize() const = 0;
1246 
1256  virtual void setStride(DimsHW stride) = 0;
1257 
1263  virtual DimsHW getStride() const = 0;
1264 
1274  virtual void setPadding(DimsHW padding) = 0;
1275 
1283  virtual DimsHW getPadding() const = 0;
1284 
1292  virtual void setBlendFactor(float blendFactor) = 0;
1293 
1301  virtual float getBlendFactor() const = 0;
1302 
1311  virtual void setAverageCountExcludesPadding(bool exclusive) = 0;
1312 
1318  virtual bool getAverageCountExcludesPadding() const = 0;
1319 
1320 protected:
1321  virtual ~IPoolingLayer() {}
1322 };
1323 
1331 class ILRNLayer : public ILayer
1332 {
1333 public:
1340  virtual void setWindowSize(int windowSize) = 0;
1341 
1347  virtual int getWindowSize() const = 0;
1348 
1355  virtual void setAlpha(float alpha) = 0;
1356 
1362  virtual float getAlpha() const = 0;
1363 
1370  virtual void setBeta(float beta) = 0;
1371 
1377  virtual float getBeta() const = 0;
1378 
1385  virtual void setK(float k) = 0;
1386 
1392  virtual float getK() const = 0;
1393 
1394 protected:
1395  virtual ~ILRNLayer() {}
1396 };
1397 
//!
//! \enum ScaleMode
//! \brief Granularity at which an IScaleLayer applies its parameters.
//!
enum class ScaleMode : int
{
    kUNIFORM = 0,    //!< One set of parameters for the whole tensor
    kCHANNEL = 1,    //!< One set of parameters per channel
    kELEMENTWISE = 2 //!< One set of parameters per element
};

// Primary template is declared earlier in this header; restated here so the
// specialization below is self-contained.
template <typename T>
inline int EnumMax();

//! \brief Maximum number of elements in the ScaleMode enum.
// NOTE(review): the specialization's signature line (source 1411) was dropped
// by this extraction; reconstructed from the `template <>` / body that remain.
template <>
inline int EnumMax<ScaleMode>()
{
    return 3;
}
1415 
1436 class IScaleLayer : public ILayer
1437 {
1438 public:
1444  virtual void setMode(ScaleMode mode) = 0;
1445 
1451  virtual ScaleMode getMode() const = 0;
1452 
1458  virtual void setShift(Weights shift) = 0;
1459 
1465  virtual Weights getShift() const = 0;
1466 
1472  virtual void setScale(Weights scale) = 0;
1473 
1479  virtual Weights getScale() const = 0;
1480 
1486  virtual void setPower(Weights power) = 0;
1487 
1493  virtual Weights getPower() const = 0;
1494 
1495 protected:
1496  virtual ~IScaleLayer() {}
1497 };
1498 
1508 class ISoftMaxLayer : public ILayer
1509 {
1510 protected:
1511  virtual ~ISoftMaxLayer() {}
1512 public:
1528  virtual void setAxes(uint32_t axes) = 0;
1529 
1535  virtual uint32_t getAxes() const = 0;
1536 };
1537 
1548 {
1549 protected:
1550  virtual ~IConcatenationLayer() {}
1551 
1552 public:
1561  virtual void setAxis(int axis) = 0;
1562 
1568  virtual int getAxis() const = 0;
1569 };
1570 
1579 {
1580 public:
1588  virtual void setKernelSize(DimsHW kernelSize) = 0;
1589 
1595  virtual DimsHW getKernelSize() const = 0;
1596 
1604  virtual void setNbOutputMaps(int nbOutputMaps) = 0;
1605 
1611  virtual int getNbOutputMaps() const = 0;
1612 
1620  virtual void setStride(DimsHW stride) = 0;
1621 
1627  virtual DimsHW getStride() const = 0;
1628 
1641  virtual void setPadding(DimsHW padding) = 0;
1642 
1648  virtual DimsHW getPadding() const = 0; // padding defaults to 0
1649 
1662  virtual void setNbGroups(int nbGroups) = 0;
1663 
1669  virtual int getNbGroups() const = 0;
1670 
1679  virtual void setKernelWeights(Weights weights) = 0;
1680 
1686  virtual Weights getKernelWeights() const = 0;
1687 
1697  virtual void setBiasWeights(Weights weights) = 0;
1698 
1704  virtual Weights getBiasWeights() const = 0;
1705 
1706 protected:
1707  virtual ~IDeconvolutionLayer() {}
1708 };
1709 
//!
//! \enum ElementWiseOperation
//! \brief Binary operations an IElementWiseLayer can apply.
//!
enum class ElementWiseOperation : int
{
    kSUM = 0,  //!< Sum of the two elements
    kPROD = 1, //!< Product of the two elements
    kMAX = 2,  //!< Maximum of the two elements
    kMIN = 3,  //!< Minimum of the two elements
    kSUB = 4,  //!< Subtract the second element from the first
    kDIV = 5,  //!< Divide the first element by the second
    kPOW = 6   //!< First element raised to the power of the second
};

// Primary template is declared earlier in this header; restated here so the
// specialization below is self-contained.
template <typename T>
inline int EnumMax();

//! \brief Maximum number of elements in the ElementWiseOperation enum.
// NOTE(review): the specialization's signature line (source 1729) was dropped
// by this extraction; reconstructed from the `template <>` / body that remain.
template <>
inline int EnumMax<ElementWiseOperation>()
{
    return 7;
}
1733 
1744 {
1745 public:
1755  virtual void setOperation(ElementWiseOperation type) = 0;
1756 
1764  virtual ElementWiseOperation getOperation() const = 0;
1765 
1766 protected:
1767  virtual ~IElementWiseLayer() {}
1768 };
1769 
1770 class IGatherLayer : public ILayer
1771 {
1772 public:
1779  virtual void setGatherAxis(int axis) = 0;
1780 
1786  virtual int getGatherAxis() const = 0;
1787 
1788 protected:
1789  virtual ~IGatherLayer() {}
1790 };
1791 
//!
//! \enum RNNOperation
//! \brief RNN cell types supported by the RNN layers.
//!
enum class RNNOperation : int
{
    kRELU = 0, //!< Single-gate RNN with ReLU activation
    kTANH = 1, //!< Single-gate RNN with TANH activation
    kLSTM = 2, //!< Four-gate LSTM
    kGRU = 3   //!< Three-gate GRU
};

// Primary template is declared earlier in this header; restated here so the
// specialization below is self-contained.
template <typename T>
inline int EnumMax();

//! \brief Maximum number of elements in the RNNOperation enum.
// NOTE(review): the specialization's signature line (source 1880) was dropped
// by this extraction; reconstructed from the `template <>` / body that remain.
template <>
inline int EnumMax<RNNOperation>()
{
    return 4;
}
1884 
//!
//! \enum RNNDirection
//! \brief Direction modes for the RNN layers.
//!
enum class RNNDirection : int
{
    kUNIDIRECTION = 0, //!< Unidirectional network
    kBIDIRECTION = 1   //!< Bidirectional network
};

// Primary template is declared earlier in this header; restated here so the
// specialization below is self-contained.
template <typename T>
inline int EnumMax();

//! \brief Maximum number of elements in the RNNDirection enum.
// NOTE(review): the specialization's signature line (source 1899) was dropped
// by this extraction; reconstructed from the `template <>` / body that remain.
template <>
inline int EnumMax<RNNDirection>()
{
    return 2;
}
1903 
//!
//! \enum RNNInputMode
//! \brief How the first-layer input is treated by the RNN layers.
//!
enum class RNNInputMode : int
{
    kLINEAR = 0, //!< Apply the input-weight matrix to the input
    kSKIP = 1    //!< Pass the input through unmodified
};

// Primary template is declared earlier in this header; restated here so the
// specialization below is self-contained.
template <typename T>
inline int EnumMax();

//! \brief Maximum number of elements in the RNNInputMode enum.
// NOTE(review): the specialization's signature line (source 1926) was dropped
// by this extraction; reconstructed from the `template <>` / body that remain.
template <>
inline int EnumMax<RNNInputMode>()
{
    return 2;
}
1930 
1940 class IRNNLayer : public ILayer
1941 {
1942 public:
1948  virtual unsigned getLayerCount() const = 0;
1949 
1958  virtual std::size_t getHiddenSize() const = 0;
1959 
1968  virtual int getSeqLength() const = 0;
1969 
1975  virtual void setOperation(RNNOperation op) = 0;
1976 
1982  virtual RNNOperation getOperation() const = 0;
1983 
1989  virtual void setInputMode(RNNInputMode op) = 0;
1990 
1996  virtual RNNInputMode getInputMode() const = 0;
1997 
2009  virtual void setDirection(RNNDirection op) = 0;
2010 
2016  virtual RNNDirection getDirection() const = 0;
2017 
2132  virtual void setWeights(Weights weights) = 0;
2133 
2139  virtual Weights getWeights() const = 0;
2140 
2192  virtual void setBias(Weights bias) = 0;
2193 
2199  virtual Weights getBias() const = 0;
2200 
2207  virtual int getDataLength() const = 0;
2208 
2225  virtual void setHiddenState(ITensor& hidden) = 0;
2226 
2232  virtual ITensor* getHiddenState() const = 0;
2233 
2252  virtual void setCellState(ITensor& cell) = 0;
2253 
2259  virtual ITensor* getCellState() const = 0;
2260 
2261 protected:
2262  virtual ~IRNNLayer() {}
2263 };
2264 
//!
//! \enum RNNGateType
//! \brief Gates of the RNN cells addressed by IRNNv2Layer.
//!
enum class RNNGateType : int
{
    kINPUT = 0,  //!< Input gate (i)
    kOUTPUT = 1, //!< Output gate (o)
    kFORGET = 2, //!< Forget gate (f)
    kUPDATE = 3, //!< Update gate (z)
    kRESET = 4,  //!< Reset gate (r)
    kCELL = 5,   //!< Cell gate (c)
    kHIDDEN = 6  //!< Hidden gate (h)
};

// Primary template is declared earlier in this header; restated here so the
// specialization below is self-contained.
template <typename T>
inline int EnumMax();

//! \brief Maximum number of elements in the RNNGateType enum.
// NOTE(review): the specialization's signature line (source 2284) was dropped
// by this extraction; reconstructed from the `template <>` / body that remain.
template <>
inline int EnumMax<RNNGateType>()
{
    return 7;
}
2288 
2296 class IRNNv2Layer : public ILayer
2297 {
2298 public:
2299  virtual int32_t getLayerCount() const = 0; //< Get the layer count of the RNN
2300  virtual int32_t getHiddenSize() const = 0; //< Get the hidden size of the RNN
2301  virtual int32_t getMaxSeqLength() const = 0; //< Get the maximum sequence length of the RNN
2302  virtual int32_t getDataLength() const = 0; //< Get the maximum data length of the RNN
2303 
2318  virtual void setSequenceLengths(ITensor& seqLengths) = 0;
2319 
2327  virtual ITensor* getSequenceLengths() const = 0;
2328 
2333  virtual void setOperation(RNNOperation op) = 0;
2334 
2339  virtual RNNOperation getOperation() const = 0;
2340 
2345  virtual void setInputMode(RNNInputMode op) = 0;
2346 
2351  virtual RNNInputMode getInputMode() const = 0;
2352 
2357  virtual void setDirection(RNNDirection op) = 0;
2358 
2363  virtual RNNDirection getDirection() const = 0;
2364 
2382  virtual void setWeightsForGate(int layerIndex, RNNGateType gate, bool isW, Weights weights) = 0;
2383 
2388  virtual Weights getWeightsForGate(int layerIndex, RNNGateType gate, bool isW) const = 0;
2389 
2405  virtual void setBiasForGate(int layerIndex, RNNGateType gate, bool isW, Weights bias) = 0;
2406 
2411  virtual Weights getBiasForGate(int layerIndex, RNNGateType gate, bool isW) const = 0;
2412 
2422  virtual void setHiddenState(ITensor& hidden) = 0;
2423 
2428  virtual ITensor* getHiddenState() const = 0;
2429 
2441  virtual void setCellState(ITensor& cell) = 0;
2442 
2447  virtual ITensor* getCellState() const = 0;
2448 
2449 protected:
2450  virtual ~IRNNv2Layer() {}
2451 };
2452 
2459 {
2460 public:
2475  virtual DimsHW compute(DimsHW inputDims, DimsHW kernelSize, DimsHW stride, DimsHW padding, DimsHW dilation, const char* layerName) const = 0;
2476 
2477 protected:
2478  virtual ~IOutputDimensionsFormula() {}
2479 };
2480 
//!
//! \enum PluginFormat
//! \brief Data layouts a plugin may support.
//!
enum class PluginFormat : uint8_t
{
    kNCHW = 0,   //!< NCHW layout
    kNC2HW2 = 1, //!< NC/2HW2 layout
    kNHWC8 = 2   //!< NHWC8 layout
};

// Primary template is declared earlier in this header; restated here so the
// specialization below is self-contained.
template <typename T>
inline int EnumMax();

//! \brief Maximum number of elements in the PluginFormat enum.
// NOTE(review): the specialization's signature line (source 2496) was dropped
// by this extraction; reconstructed from the `template <>` / body that remain.
template <>
inline int EnumMax<PluginFormat>()
{
    return 3;
}
2500 
2508 class IPlugin
2509 {
2510 public:
2518  virtual int getNbOutputs() const = 0;
2519 
2529  virtual Dims getOutputDimensions(int index, const Dims* inputs, int nbInputDims) = 0;
2530 
2547  virtual void configure(const Dims* inputDims, int nbInputs, const Dims* outputDims, int nbOutputs, int maxBatchSize) = 0;
2548 
2554  virtual int initialize() = 0;
2555 
2560  virtual void terminate() = 0;
2561 
2570  virtual size_t getWorkspaceSize(int maxBatchSize) const = 0;
2571 
2583  virtual int enqueue(int batchSize, const void* const* inputs, void** outputs, void* workspace, cudaStream_t stream) = 0;
2584 
2590  virtual size_t getSerializationSize() = 0;
2591 
2599  virtual void serialize(void* buffer) = 0;
2600 
2601 protected:
2602  virtual ~IPlugin() {}
2603 };
2604 
2613 class IPluginExt : public IPlugin
2614 {
2615 public:
2621  virtual int getTensorRTVersion() const
2622  {
2623  return NV_TENSORRT_VERSION;
2624  }
2625 
2636  virtual bool supportsFormat(DataType type, PluginFormat format) const = 0;
2637 
2654  virtual void configureWithFormat(const Dims* inputDims, int nbInputs, const Dims* outputDims, int nbOutputs, DataType type, PluginFormat format, int maxBatchSize) = 0;
2655 
2658  // \see IPluginCreator::getPluginName()
2660  virtual const char* getPluginType() const = 0;
2661 
2664  // \see IPluginCreator::getPluginVersion()
2666  virtual const char* getPluginVersion() const = 0;
2667 
2671  virtual void destroy() = 0;
2672 
2676  virtual IPluginExt* clone() const = 0;
2677 
2678 
2679 protected:
2683  void configure(const Dims* /*inputDims*/, int /*nbInputs*/, const Dims* /*outputDims*/, int /*nbOutputs*/, int /*maxBatchSize*/) _TENSORRT_FINAL {}
2684 
2685  virtual ~IPluginExt() {}
2686 };
2687 
2695 class IPluginLayer : public ILayer
2696 {
2697 public:
2703  virtual IPlugin& getPlugin() = 0;
2704 
2705 protected:
2706  virtual ~IPluginLayer() {}
2707 };
2708 
2713 
//!
//! \enum PluginFieldType
//! \brief The type of data carried by a PluginField.
//!
enum class PluginFieldType : int
{
    kFLOAT16 = 0, //!< 16-bit floating point
    kFLOAT32 = 1, //!< 32-bit floating point
    kFLOAT64 = 2, //!< 64-bit floating point
    kINT8 = 3,    //!< 8-bit integer
    kINT16 = 4,   //!< 16-bit integer
    kINT32 = 5,   //!< 32-bit integer
    kCHAR = 6,    //!< Character
    kDIMS = 7,    //!< Dims structure
    kUNKNOWN = 8  //!< Unknown type
};
2726 
2735 {
2739  const char* name;
2743  const void* data;
2752  int length;
2753 
2754  PluginField(const char* name_ = nullptr, const void* data_ = nullptr, const PluginFieldType type_ = PluginFieldType::kUNKNOWN, int length_ = 0)
2755  : name(name_)
2756  , data(data_)
2757  , type(type_)
2758  , length(length_)
2759  {
2760  }
2761 };
2762 
2764 {
2765  int nbFields;
2767 };
2768 
2776 
2778 {
2779 public:
2783  virtual int getTensorRTVersion() const { return NV_TENSORRT_VERSION; }
2784 
2788  virtual const char* getPluginName() const = 0;
2789 
2793  virtual const char* getPluginVersion() const = 0;
2794 
2799  virtual const PluginFieldCollection* getFieldNames() = 0;
2800 
2804  virtual IPluginExt* createPlugin(const char* name, const PluginFieldCollection* fc) = 0;
2805 
2809  virtual IPluginExt* deserializePlugin(const char* name, const void* serialData, size_t serialLength) = 0;
2810 
2811  virtual ~IPluginCreator() {}
2812 };
2813 
2815 {
2816 public:
2821  virtual bool registerCreator(IPluginCreator&) = 0;
2822 
2827  virtual IPluginCreator* const* getPluginCreatorList(int* numCreators) const = 0;
2828 
2832  virtual IPluginCreator* getPluginCreator(const char* pluginType, const char* pluginVersion) = 0;
2833 
2834 protected:
2835  virtual ~IPluginRegistry() {}
2836 };
2837 
//!
//! \enum UnaryOperation
//! \brief Unary operations an IUnaryLayer can apply.
//!
enum class UnaryOperation : int
{
    kEXP = 0,   //!< Exponentiation
    kLOG = 1,   //!< Logarithm
    kSQRT = 2,  //!< Square root
    kRECIP = 3, //!< Reciprocal
    kABS = 4,   //!< Absolute value
    kNEG = 5,   //!< Negation
};

// Primary template is declared earlier in this header; restated here so the
// specialization below is self-contained.
template <typename T>
inline int EnumMax();

//! \brief Maximum number of elements in the UnaryOperation enum.
// NOTE(review): the specialization's signature line (source 2856) was dropped
// by this extraction; reconstructed from the `template <>` / body that remain.
template <>
inline int EnumMax<UnaryOperation>()
{
    return 6;
}
2860 
2866 class IUnaryLayer : public ILayer
2867 {
2868 public:
2874  virtual void setOperation(UnaryOperation op) = 0;
2875 
2881  virtual UnaryOperation getOperation() const = 0;
2882 
2883 protected:
2884  virtual ~IUnaryLayer() {}
2885 };
2886 
//!
//! \enum ReduceOperation
//! \brief Reduction operations an IReduceLayer can apply.
//!
enum class ReduceOperation : int
{
    kSUM = 0,  //!< Sum of elements
    kPROD = 1, //!< Product of elements
    kMAX = 2,  //!< Maximum element
    kMIN = 3,  //!< Minimum element
    kAVG = 4   //!< Average of elements
};

// Primary template is declared earlier in this header; restated here so the
// specialization below is self-contained.
template <typename T>
inline int EnumMax();

//! \brief Maximum number of elements in the ReduceOperation enum.
// NOTE(review): the specialization's signature line (source 2902) was dropped
// by this extraction; reconstructed from the `template <>` / body that remain.
template <>
inline int EnumMax<ReduceOperation>()
{
    return 5;
}
2906 
2912 class IReduceLayer : public ILayer
2913 {
2914 public:
2920  virtual void setOperation(ReduceOperation op) = 0;
2921 
2927  virtual ReduceOperation getOperation() const = 0;
2928 
2934  virtual void setReduceAxes(uint32_t reduceAxes) = 0;
2935 
2941  virtual uint32_t getReduceAxes() const = 0;
2942 
2948  virtual void setKeepDimensions(bool keepDimensions) = 0;
2949 
2955  virtual bool getKeepDimensions() const = 0;
2956 
2957 protected:
2958  virtual ~IReduceLayer() {}
2959 };
2960 
2969 class IPaddingLayer : public ILayer
2970 {
2971 public:
2979  virtual void setPrePadding(DimsHW padding) = 0;
2980 
2986  virtual DimsHW getPrePadding() const = 0;
2987 
2995  virtual void setPostPadding(DimsHW padding) = 0;
2996 
3002  virtual DimsHW getPostPadding() const = 0;
3003 
3004 protected:
3005  virtual ~IPaddingLayer() {}
3006 };
3007 
3016 {
3024 };
3025 
3026 class IShuffleLayer : public ILayer
3027 {
3028 public:
3038  virtual void setFirstTranspose(Permutation permutation) = 0;
3039 
3047  virtual Permutation getFirstTranspose() const = 0;
3048 
3067  virtual void setReshapeDimensions(Dims dimensions) = 0;
3068 
3074  virtual Dims getReshapeDimensions() const = 0;
3075 
3088  virtual void setSecondTranspose(Permutation permutation) = 0;
3089 
3097  virtual Permutation getSecondTranspose() const = 0;
3098 
3099 protected:
3100  virtual ~IShuffleLayer() {}
3101 };
3102 
//!
//! \enum TopKOperation
//! \brief Operations an ITopKLayer can apply.
//!
enum class TopKOperation : int
{
    kMAX = 0, //!< Select the maximum k elements
    kMIN = 1, //!< Select the minimum k elements
};

// Primary template is declared earlier in this header; restated here so the
// specialization below is self-contained.
template <typename T>
inline int EnumMax();

//! \brief Maximum number of elements in the TopKOperation enum.
// NOTE(review): the specialization's signature line (source 3115) was dropped
// by this extraction; reconstructed from the `template <>` / body that remain.
template <>
inline int EnumMax<TopKOperation>()
{
    return 2;
}
3119 
3125 class ITopKLayer : public ILayer
3126 {
3127 public:
3133  virtual void setOperation(TopKOperation op) = 0;
3134 
3140  virtual TopKOperation getOperation() const = 0;
3141 
3149  virtual void setK(int k) = 0;
3150 
3156  virtual int getK() const = 0;
3157 
3163  virtual void setReduceAxes(uint32_t reduceAxes) = 0;
3164 
3170  virtual uint32_t getReduceAxes() const = 0;
3171 
3172 protected:
3173  virtual ~ITopKLayer() {}
3174 };
3175 
3196 {
3197 public:
3204  virtual void setTranspose(int index, bool val) = 0;
3205 
3211  virtual bool getTranspose(int index) const = 0;
3212 
3213 protected:
3214  virtual ~IMatrixMultiplyLayer() {}
3215 };
3216 
3230 {
3231 protected:
3232  virtual ~IRaggedSoftMaxLayer() {}
3233 };
3234 
3241 class IIdentityLayer : public ILayer
3242 {
3243 protected:
3244  virtual ~IIdentityLayer() {}
3245 };
3246 
3251 class IConstantLayer : public ILayer
3252 {
3253 public:
3259  virtual void setWeights(Weights weights) = 0;
3260 
3266  virtual Weights getWeights() const = 0;
3267 
3275  virtual void setDimensions(Dims dimensions) = 0;
3276 
3284  virtual Dims getDimensions() const = 0;
3285 
3286 protected:
3287  virtual ~IConstantLayer() {}
3288 };
3289 
//!
//! \class INetworkDefinition
//! \brief A network definition for input to the builder.
//!
// NOTE(review): the class declaration line (source ~3295, `class
// INetworkDefinition`) was dropped by this extraction; the destructor below
// confirms the name. Several member declarations between source lines 3573
// and 3647 are also missing from this view (the blank numbered lines below)
// — confirm against the shipped NvInfer.h before relying on the vtable order.
3296 {
3297 public:
//! Add an input tensor with the given name, type and dimensions.
3314  virtual ITensor* addInput(const char* name, DataType type, Dims dimensions) = 0;
3315 
//! Mark a tensor as a network output.
3321  virtual void markOutput(ITensor& tensor) = 0;
3322 
//! Add a convolution layer.
3336  virtual IConvolutionLayer* addConvolution(ITensor& input, int nbOutputMaps, DimsHW kernelSize, Weights kernelWeights, Weights biasWeights) = 0;
3337 
//! Add a fully connected layer.
3350  virtual IFullyConnectedLayer* addFullyConnected(ITensor& input, int nbOutputs, Weights kernelWeights, Weights biasWeights) = 0;
3351 
//! Add an activation layer.
3362  virtual IActivationLayer* addActivation(ITensor& input, ActivationType type) = 0;
3363 
//! Add a pooling layer.
3375  virtual IPoolingLayer* addPooling(ITensor& input, PoolingType type, DimsHW windowSize) = 0;
3376 
//! Add an LRN layer.
3390  virtual ILRNLayer* addLRN(ITensor& input, int window, float alpha, float beta, float k) = 0;
3391 
//! Add a scale layer.
3410  virtual IScaleLayer* addScale(ITensor& input, ScaleMode mode, Weights shift, Weights scale, Weights power) = 0;
3411 
//! Add a SoftMax layer.
3419  virtual ISoftMaxLayer* addSoftMax(ITensor& input) = 0;
3420 
//! Add a concatenation layer over the given inputs.
3433  virtual IConcatenationLayer* addConcatenation(ITensor* const* inputs, int nbInputs) = 0;
3434 
//! Add a deconvolution layer.
3448  virtual IDeconvolutionLayer* addDeconvolution(ITensor& input, int nbOutputMaps, DimsHW kernelSize, Weights kernelWeights, Weights biasWeights) = 0;
3449 
//! Add an elementwise layer.
3469  virtual IElementWiseLayer* addElementWise(ITensor& input1, ITensor& input2, ElementWiseOperation op) = 0;
3470 
//! Add a first-generation RNN layer.
3525  virtual IRNNLayer* addRNN(ITensor& inputs, int layerCount, std::size_t hiddenSize, int maxSeqLen, RNNOperation op, RNNInputMode mode, RNNDirection dir, Weights weights, Weights bias) = 0;
3526 
//! Add a plugin layer.
3538  virtual IPluginLayer* addPlugin(ITensor* const* inputs, int nbInputs, IPlugin& plugin) = 0;
3539 
//! Add a unary layer.
3550  virtual IUnaryLayer* addUnary(ITensor& input, UnaryOperation operation) = 0;
3551 
//! Add a padding layer.
3562  virtual IPaddingLayer* addPadding(ITensor& input, DimsHW prePadding, DimsHW postPadding) = 0;
3563 
//! Add a shuffle layer.
3571  virtual IShuffleLayer* addShuffle(ITensor& input) = 0;
3572 
// NOTE(review): the declarations that belong on the following source lines
// were dropped by this extraction.
3583 
3592 
3605 
3616 
3629 
3640 
//! Number of layers in the network.
3648  virtual int getNbLayers() const = 0;
3649 
//! Get the layer at the given index.
3659  virtual ILayer* getLayer(int index) const = 0;
3660 
//! Number of network inputs.
3668  virtual int getNbInputs() const = 0;
3669 
3679  virtual ITensor* getInput(int index) const = 0; // adding inputs invalidates indexing here
3680 
//! Number of network outputs.
3688  virtual int getNbOutputs() const = 0;
3689 
3699  virtual ITensor* getOutput(int index) const = 0; // adding outputs invalidates indexing here
3700 
//! Destroy this network definition object.
3704  virtual void destroy() = 0;
3705 
3706 protected:
3707  virtual ~INetworkDefinition() {}
3708 
3709 public:
//! Add a reduce layer.
3729  virtual IReduceLayer* addReduce(ITensor& input, ReduceOperation operation, uint32_t reduceAxes, bool keepDimensions) = 0;
3730 
//! Add a TopK layer.
3755  virtual ITopKLayer* addTopK(ITensor& input, TopKOperation op, int k, uint32_t reduceAxes) = 0;
3756 
//! Add a gather layer.
3768  virtual IGatherLayer* addGather(ITensor& data, ITensor& indices, int axis) = 0;
3769 
//! Add a ragged SoftMax layer.
3780  virtual IRaggedSoftMaxLayer* addRaggedSoftMax(ITensor& input, ITensor& bounds) = 0;
3781 
//! Add a matrix-multiply layer.
3794  virtual IMatrixMultiplyLayer* addMatrixMultiply(ITensor& input0, bool transpose0, ITensor& input1, bool transpose1) = 0;
3795 
//! Add a constant layer.
3806  virtual IConstantLayer* addConstant(Dims dimensions, Weights weights) = 0;
3807 
//! Add a second-generation RNN layer.
3862  virtual IRNNv2Layer* addRNNv2(ITensor& input, int32_t layerCount, int32_t hiddenSize, int32_t maxSeqLen, RNNOperation op) = 0;
3863 
//! Add an extended-plugin layer.
3875  virtual IPluginLayer* addPluginExt(ITensor* const* inputs, int nbInputs, IPluginExt& plugin) = 0;
3876 
//! Add an identity layer.
3884  virtual IIdentityLayer* addIdentity(ITensor& input) = 0;
3885 
//! Remove a tensor from the network.
3895  virtual void removeTensor(ITensor& tensor) = 0;
3896 
//! Unmark a tensor as a network output.
3905  virtual void unmarkOutput(ITensor& tensor) = 0;
3906 };
3907 
3919 {
3920 public:
3927  virtual void reportLayerTime(const char* layerName, float ms) = 0;
3928 
3929 protected:
3930  virtual ~IProfiler() {}
3931 };
3932 
3933 class ICudaEngine;
3934 
3944 {
3945 public:
3957  virtual bool execute(int batchSize, void** bindings) = 0;
3958 
3972  virtual bool enqueue(int batchSize, void** bindings, cudaStream_t stream, cudaEvent_t* inputConsumed) = 0;
3973 
3981  virtual void setDebugSync(bool sync) = 0;
3982 
3988  virtual bool getDebugSync() const = 0;
3989 
3995  virtual void setProfiler(IProfiler*) = 0;
3996 
4002  virtual IProfiler* getProfiler() const = 0;
4003 
4009  virtual const ICudaEngine& getEngine() const = 0;
4010 
4014  virtual void destroy() = 0;
4015 
4016 protected:
4017  virtual ~IExecutionContext() {}
4018 
4019 public:
4027  virtual void setName(const char* name) = 0;
4028 
4034  virtual const char* getName() const = 0;
4035 
4047  virtual void setDeviceMemory(void* memory) = 0;
4048 };
4049 
//!
//! \class ICudaEngine
//! \brief An engine for executing inference on a built network.
//!
// NOTE(review): the class declaration line (source ~4055, `class
// ICudaEngine`) was dropped by this extraction; the destructor below confirms
// the name. Declarations around source lines 4158-4163 and 4186-4193 are also
// missing (the blank numbered lines below) — the shipped NvInfer.h declares
// createExecutionContext-style factory methods there; confirm against the
// header before relying on the vtable order.
4056 {
4057 public:
//! Number of binding slots (inputs + outputs).
4063  virtual int getNbBindings() const = 0;
4064 
//! Look up a binding index by tensor name.
4078  virtual int getBindingIndex(const char* name) const = 0;
4079 
//! Name of the tensor at the given binding index.
4090  virtual const char* getBindingName(int bindingIndex) const = 0;
4091 
//! Whether the binding at the given index is an input.
4100  virtual bool bindingIsInput(int bindingIndex) const = 0;
4101 
//! Dimensions of the tensor at the given binding index.
4110  virtual Dims getBindingDimensions(int bindingIndex) const = 0;
4111 
//! Data type of the tensor at the given binding index.
4120  virtual DataType getBindingDataType(int bindingIndex) const = 0;
4121 
//! Maximum batch size the engine was built for.
4127  virtual int getMaxBatchSize() const = 0;
4128 
//! Number of layers in the engine.
4137  virtual int getNbLayers() const = 0;
4138 
//! Workspace size the engine requires.
4145  virtual std::size_t getWorkspaceSize() const = 0;
4146 
//! Serialize the engine to host memory.
4156  virtual IHostMemory* serialize() const = 0;
4157 
4164 
//! Destroy this engine object.
4168  virtual void destroy() = 0;
4169 
//! Storage location (host/device) of the given binding.
4180  virtual TensorLocation getLocation(int bindingIndex) const = 0;
4181 
4182 protected:
4183  virtual ~ICudaEngine() {}
4184 
4185 public:
4194 
//! Device memory size required by an execution context of this engine.
4200  virtual size_t getDeviceMemorySize() const = 0;
4201 };
4202 
//!
//! \enum CalibrationAlgoType
//! \brief INT8 calibration algorithms.
//!
enum class CalibrationAlgoType : int
{
    kLEGACY_CALIBRATION = 0, //!< Legacy (percentile-based) calibration
    kENTROPY_CALIBRATION = 1 //!< Entropy-based calibration
};

// Primary template is declared earlier in this header; restated here so the
// specialization below is self-contained.
template <typename T>
inline int EnumMax();

//! \brief Maximum number of elements in the CalibrationAlgoType enum.
// NOTE(review): the specialization's signature line (source 4215) was dropped
// by this extraction; reconstructed from the `template <>` / body that remain.
template <>
inline int EnumMax<CalibrationAlgoType>()
{
    return 2;
}
4219 
4232 {
4233 public:
4239  virtual int getBatchSize() const = 0;
4240 
4254  virtual bool getBatch(void* bindings[], const char* names[], int nbBindings) = 0; // get a pointer to the input batch
4255 
4268  virtual const void* readCalibrationCache(std::size_t& length) = 0;
4269 
4278  virtual void writeCalibrationCache(const void* ptr, std::size_t length) = 0;
4279 
4285  virtual CalibrationAlgoType getAlgorithm() = 0;
4286 
4287 protected:
4288  virtual ~IInt8Calibrator() {}
4289 };
4290 
4295 {
4296 public:
4300  virtual CalibrationAlgoType getAlgorithm() { return CalibrationAlgoType::kENTROPY_CALIBRATION; }
4301 protected:
4302  virtual ~IInt8EntropyCalibrator() {}
4303 };
4304 
4310 {
4311 public:
4315  virtual CalibrationAlgoType getAlgorithm() { return CalibrationAlgoType::kLEGACY_CALIBRATION; }
4316 
4322  virtual double getQuantile() const = 0;
4323 
4329  virtual double getRegressionCutoff() const = 0;
4330 
4342  virtual const void* readHistogramCache(std::size_t& length) = 0;
4343 
4352  virtual void writeHistogramCache(const void* ptr, std::size_t length) = 0;
4353 
4354 protected:
4355  virtual ~IInt8LegacyCalibrator() {}
4356 };
4357 
4364 {
4365 public:
4380  virtual void* allocate(uint64_t size, uint64_t alignment, uint32_t flags) = 0;
4381 
4389  virtual void free(void* memory) = 0;
4390 };
4391 
4398 {
4399 public:
4406 
4414  virtual void setMaxBatchSize(int batchSize) = 0;
4415 
4424  virtual int getMaxBatchSize() const = 0;
4425 
4433  virtual void setMaxWorkspaceSize(std::size_t workspaceSize) = 0;
4434 
4442  virtual std::size_t getMaxWorkspaceSize() const = 0;
4443 
4455  virtual void setHalf2Mode(bool mode) = 0;
4456 
4464  virtual bool getHalf2Mode() const = 0;
4465 
4471  virtual void setDebugSync(bool sync) = 0;
4472 
4478  virtual bool getDebugSync() const = 0;
4479 
4488  virtual void setMinFindIterations(int minFind) = 0;
4489 
4495  virtual int getMinFindIterations() const = 0;
4496 
4505  virtual void setAverageFindIterations(int avgFind) = 0;
4506 
4512  virtual int getAverageFindIterations() const = 0;
4513 
4520 
4524  virtual bool platformHasFastFp16() const = 0;
4525 
4529  virtual bool platformHasFastInt8() const = 0;
4530 
4534  virtual void destroy() = 0;
4535 
4541  virtual void setInt8Mode(bool mode) = 0;
4542 
4548  virtual bool getInt8Mode() const = 0;
4549 
4553  virtual void setInt8Calibrator(IInt8Calibrator* calibrator) = 0;
4554 
4561  virtual void setDeviceType(ILayer* layer, DeviceType deviceType) = 0;
4562 
4567  virtual DeviceType getDeviceType(const ILayer* layer) const = 0;
4568 
4574  virtual bool isDeviceTypeSet(const ILayer* layer) const = 0;
4575 
4581  virtual void resetDeviceType(ILayer* layer) = 0;
4582 
4587  virtual bool canRunOnDLA(const ILayer* layer) const = 0;
4588 
4593  virtual void setDefaultDeviceType(DeviceType deviceType) = 0;
4594 
4598  virtual DeviceType getDefaultDeviceType() const = 0;
4599 
4604  virtual int getMaxDLABatchSize(DeviceType deviceType) const = 0;
4605 
4610  virtual void allowGPUFallback(bool setFallBackMode) = 0;
4611 
4615  virtual void reset(nvinfer1::INetworkDefinition& network) = 0;
4616 
4617 
4618 protected:
4619  virtual ~IBuilder() {}
4620 
4621 public:
4631  virtual void setGpuAllocator(IGpuAllocator* allocator) = 0;
4632 
4642  virtual void setFp16Mode(bool mode) = 0;
4643 
4649  virtual bool getFp16Mode() const = 0;
4650 
4665  virtual void setStrictTypeConstraints(bool mode) = 0;
4666 
4672  virtual bool getStrictTypeConstraints() const = 0;
4673 
4674 };
4675 
4682 {
4683 public:
4698  virtual IPlugin* createPlugin(const char* layerName, const void* serialData, size_t serialLength) = 0;
4699 };
4700 
4707 {
4708 public:
4718  virtual nvinfer1::ICudaEngine* deserializeCudaEngine(const void* blob, std::size_t size, IPluginFactory* pluginFactory) = 0;
4719 
4723  virtual void destroy() = 0;
4724 
4725 protected:
4726  virtual ~IRuntime() {}
4727 
4728 public:
4737  virtual void setGpuAllocator(IGpuAllocator* allocator) = 0;
4738 };
4739 
4748 class ILogger
4749 {
4750 public:
4756  enum class Severity
4757  {
4758  kINTERNAL_ERROR = 0,
4759  kERROR = 1,
4760  kWARNING = 2,
4761  kINFO = 3
4762  };
4763 
4770  virtual void log(Severity severity, const char* msg) = 0;
4771 
4772 protected:
4773  virtual ~ILogger() {}
4774 };
4775 
4776 template <>
4777 inline int EnumMax<ILogger::Severity>()
4778 {
4779  return 4;
4780 }
4781 
4782 } // namespace nvinfer1
4783 
4784 extern "C" TENSORRTAPI void* createInferBuilder_INTERNAL(void* logger, int version);
4785 extern "C" TENSORRTAPI void* createInferRuntime_INTERNAL(void* logger, int version);
4786 
4790 extern "C" TENSORRTAPI nvinfer1::ILogger* getLogger();
4791 
4797 extern "C" TENSORRTAPI int getInferLibVersion();
4798 
4802 extern "C" TENSORRTAPI nvinfer1::IPluginRegistry* getPluginRegistry();
4803 
4804 namespace nvinfer1
4805 {
4811 namespace // unnamed namespace in case the compiler doesn't inline these
4812 {
4813 inline IBuilder* createInferBuilder(ILogger& logger)
4814 {
4815  return static_cast<IBuilder*>(createInferBuilder_INTERNAL(&logger, NV_TENSORRT_VERSION));
4816 }
4817 
4823 inline IRuntime* createInferRuntime(ILogger& logger)
4824 {
4825  return static_cast<IRuntime*>(createInferRuntime_INTERNAL(&logger, NV_TENSORRT_VERSION));
4826 }
4827 }
4828 
4835 template <typename T>
4837 {
4838 public:
4840 private:
4841  T instance{};
4842 };
4843 
4844 #define REGISTER_TENSORRT_PLUGIN(name) static PluginRegistrar<name> pluginRegistrar##name{}
4845 
4846 }
4847 
4848 #endif
DimensionType type[MAX_DIMS]
The type of each dimension.
Definition: NvInfer.h:182
int EnumMax< PluginFormat >()
Maximum number of elements in PluginFormat enum.
Definition: NvInfer.h:2496
virtual bool enqueue(int batchSize, void **bindings, cudaStream_t stream, cudaEvent_t *inputConsumed)=0
Asynchronously execute inference on a batch.
int w() const
Get the width.
Definition: NvInfer.h:500
int n() const
Get the index count.
Definition: NvInfer.h:458
An engine for executing inference on a built network.
Definition: NvInfer.h:4055
Subtract the second element from the first.
Perform the normal matrix multiplication in the first recurrent layer.
DataType
The type of weights and tensors.
Definition: NvInfer.h:118
virtual void setAverageCountExcludesPadding(bool exclusive)=0
Set whether average pooling uses as a denominator the overlap area between the window and the unpadde...
virtual bool isNetworkInput() const =0
Whether the tensor is a network input.
virtual DimsHW getDilation() const =0
Get the dilation for a convolution.
Severity
Definition: NvInfer.h:4756
virtual void setMinFindIterations(int minFind)=0
Set the number of minimization iterations used when timing layers.
virtual int getMaxBatchSize() const =0
Get the maximum batch size.
int EnumMax< TensorLocation >()
Maximum number of elements in TensorLocation enum.
Definition: NvInfer.h:589
virtual ITensor * getCellState() const =0
Get the initial cell state of the RNN.
virtual IPlugin * createPlugin(const char *layerName, const void *serialData, size_t serialLength)=0
Create a plugin from serialized data.
virtual ITensor * addInput(const char *name, DataType type, Dims dimensions)=0
Add an input tensor to the network.
virtual uint32_t getAxes() const =0
Get the axis along which softmax occurs.
virtual void resetPrecision()=0
Reset the computational precision for this layer.
virtual void setBias(Weights bias)=0
Set the bias parameters for the RNN.
DimsNCHW(int batchSize, int channels, int height, int width)
Construct a DimsNCHW given batch size, channel count, height and width.
Definition: NvInfer.h:438
virtual void setKernelWeights(Weights weights)=0
Set the kernel weights for the deconvolution.
virtual ReduceOperation getOperation() const =0
Get the reduce operation for the layer.
#define NV_TENSORRT_MAJOR
TensorRT major version.
Definition: NvInfer.h:56
virtual IExecutionContext * createExecutionContext()=0
Create an execution context.
virtual int getBatchSize() const =0
Get the batch size used for calibration batches.
RNNOperation
Enumerates the RNN operations that may be performed by an RNN layer.
Definition: NvInfer.h:1871
virtual void setOperation(ElementWiseOperation type)=0
Set the binary operation for the layer.
virtual void setBroadcastAcrossBatch(bool broadcastAcrossBatch)=0
Set whether to enable broadcast of tensor across the batch.
A Softmax layer in a network definition.
Definition: NvInfer.h:1508
virtual int getNbGroups() const =0
Get the number of groups for a convolution.
virtual Weights getPower() const =0
Get the power value.
virtual void setWeightsForGate(int layerIndex, RNNGateType gate, bool isW, Weights weights)=0
Set the weight parameters for an individual gate in the RNN.
Definition: NvInfer.h:3015
virtual double getQuantile() const =0
The quantile (between 0 and 1) that will be used to select the region maximum when the quantile metho...
virtual std::size_t getWorkspaceSize() const =0
Get the amount of workspace the engine uses.
An application error has occurred.
An application error has been discovered, but TensorRT has recovered or fallen back to a default...
virtual Weights getBias() const =0
Get the bias parameter vector for the RNN.
virtual void destroy()=0
Destroy the allocated memory.
virtual IMatrixMultiplyLayer * addMatrixMultiply(ITensor &input0, bool transpose0, ITensor &input1, bool transpose1)=0
Add a MatrixMultiply layer to the network.
virtual bool bindingIsInput(int bindingIndex) const =0
Determine whether a binding is an input binding.
virtual int getGatherAxis() const =0
Get the non-batch dimension axis to gather on.
virtual void setInputMode(RNNInputMode op)=0
Set the input mode of the RNN layer.
virtual const char * getName() const =0
Return the name of a layer.
virtual Weights getScale() const =0
Get the scale value.
virtual DimsHW getKernelSize() const =0
Get the HW kernel size of the deconvolution.
Layer that represents an unary operation.
Definition: NvInfer.h:2866
virtual void destroy()=0
Destroy this object.
virtual DimsHW getStride() const =0
Get the stride of the deconvolution.
virtual IPluginExt * createPlugin(const char *name, const PluginFieldCollection *fc)=0
Return a plugin object. Return nullptr in case of error.
PluginFieldType
Definition: NvInfer.h:2714
Rectified linear activation.
virtual bool getDebugSync() const =0
Get the debug sync flag.
virtual bool execute(int batchSize, void **bindings)=0
Synchronously execute inference on a batch.
virtual void destroy()=0
Destroy this INetworkDefinition object.
virtual const PluginFieldCollection * getFieldNames()=0
Return a list of fields that needs to be passed to createPlugin.
An Activation layer in a network definition.
Definition: NvInfer.h:1165
TENSORRTAPI void * createInferRuntime_INTERNAL(void *logger, int version)
Internal C entry point for creating IRuntime.
int w() const
Get the width.
Definition: NvInfer.h:375
virtual Dims getOutputDimensions(int index, const Dims *inputs, int nbInputDims)=0
Get the dimension of an output tensor.
RNNDirection
Enumerates the RNN direction that may be performed by an RNN layer.
Definition: NvInfer.h:1892
int EnumMax< DataType >()
Maximum number of elements in DataType enum.
Definition: NvInfer.h:127
Layer that represents a Matrix Multiplication.
Definition: NvInfer.h:3195
virtual DimsHW getKernelSize() const =0
Get the HW kernel size of the convolution.
virtual DataType type() const =0
The type of the memory that was allocated.
virtual int getAverageFindIterations() const =0
Query the number of averaging iterations.
DimsCHW()
Construct an empty DimsCHW object.
Definition: NvInfer.h:314
No operation is performed on the first recurrent layer.
const void * values
The weight values, in a contiguous array.
Definition: NvInfer.h:515
int c() const
Get the channel count.
Definition: NvInfer.h:472
void configure(const Dims *, int, const Dims *, int, int) _TENSORRT_FINAL
Derived classes should not implement this. In a C++11 API it would be override final.
Definition: NvInfer.h:2683
virtual bool getDebugSync() const =0
Query whether the builder will use debug synchronization.
virtual void setAlpha(float alpha)=0
Set the LRN alpha value.
struct CUevent_st * cudaEvent_t
Forward declaration of cudaEvent_t.
Definition: NvInfer.h:99
virtual Dims getBindingDimensions(int bindingIndex) const =0
Get the dimensions of a binding.
int h() const
Get the height.
Definition: NvInfer.h:486
virtual void setPrecision(DataType dataType)=0
Set the computational precision of this layer.
A convolution layer in a network definition.
Definition: NvInfer.h:912
virtual ITopKLayer * addTopK(ITensor &input, TopKOperation op, int k, uint32_t reduceAxes)=0
Add a TopK layer to the network.
virtual const char * getPluginVersion() const =0
Return the plugin version. Should match the plugin version returned by the corresponding plugin creat...
Allows a serialized engine to be deserialized.
Definition: NvInfer.h:4706
virtual Dims getReshapeDimensions() const =0
Get the reshaped dimensions.
virtual void writeHistogramCache(const void *ptr, std::size_t length)=0
Save a histogram cache.
NCHW with 2-element packed channels.
virtual void setPoolingOutputDimensionsFormula(IOutputDimensionsFormula *formula)=0
Set the pooling output dimensions formula.
A RaggedSoftmax layer in a network definition.
Definition: NvInfer.h:3229
virtual unsigned getLayerCount() const =0
Get the number of layers in the RNN.
virtual int getNbOutputs() const =0
Get the number of outputs from the layer.
virtual void configure(const Dims *inputDims, int nbInputs, const Dims *outputDims, int nbOutputs, int maxBatchSize)=0
Configure the layer.
ScaleMode
Controls how scale is applied in a Scale layer.
Definition: NvInfer.h:1403
Plugin class for user-implemented layers.
Definition: NvInfer.h:2508
Layer that represents a constant value.
Definition: NvInfer.h:3251
virtual IPluginExt * deserializePlugin(const char *name, const void *serialData, size_t serialLength)=0
Called during deserialization of a plugin layer. Return a plugin object.
virtual DataType getPrecision() const =0
Get the computational precision of this layer.
virtual ILayer * getLayer(int index) const =0
Get the layer specified by the given index.
A Scale layer in a network definition.
Definition: NvInfer.h:1436
virtual bool getBatch(void *bindings[], const char *names[], int nbBindings)=0
Get a batch of input for calibration.
virtual IRaggedSoftMaxLayer * addRaggedSoftMax(ITensor &input, ITensor &bounds)=0
Add a RaggedSoftMax layer to the network.
virtual int getNbGroups() const =0
Get the number of groups for a deconvolution.
NHWC with 8-element packed channels (C must be a multiple of 8).
virtual void setNbOutputMaps(int nbOutputMaps)=0
Set the number of output maps for the convolution.
virtual void log(Severity severity, const char *msg)=0
virtual const char * getBindingName(int bindingIndex) const =0
Retrieve the name corresponding to a binding index.
virtual IRNNv2Layer * addRNNv2(ITensor &input, int32_t layerCount, int32_t hiddenSize, int32_t maxSeqLen, RNNOperation op)=0
Add a layerCount-deep RNN layer to the network with hiddenSize internal states that can take a batch...
const PluginField * fields
Pointer to PluginField entries.
Definition: NvInfer.h:2766
virtual bool getFp16Mode() const =0
Query whether 16-bit kernels are permitted.
virtual IScaleLayer * addScale(ITensor &input, ScaleMode mode, Weights shift, Weights scale, Weights power)=0
Add a Scale layer to the network.
virtual void setHiddenState(ITensor &hidden)=0
Set the initial hidden state of the RNN with the provided hidden ITensor.
int EnumMax< RNNOperation >()
Maximum number of elements in RNNOperation enum.
Definition: NvInfer.h:1880
int EnumMax< LayerType >()
Maximum number of elements in LayerType enum.
Definition: NvInfer.h:573
virtual void setAxes(uint32_t axes)=0
Set the axis along which softmax is computed. Currently, only one axis can be set.
static const int MAX_DIMS
The maximum number of dimensions supported for a tensor.
Definition: NvInfer.h:179
virtual void setPrePadding(DimsHW padding)=0
Set the padding that is applied at the start of the tensor.
virtual DataType getBindingDataType(int bindingIndex) const =0
Determine the required data type for a buffer from its binding index.
A fully connected layer in a network definition. This layer expects an input tensor of three or more ...
Definition: NvInfer.h:1085
virtual ITensor * getSequenceLengths() const =0
Get the sequence lengths specified for the RNN.
virtual void resetDeviceType(ILayer *layer)=0
Reset the DeviceType for this layer.
virtual DataType getType() const =0
Get the data type of a tensor.
PluginFormat
Definition: NvInfer.h:2488
TENSORRTAPI void * createInferBuilder_INTERNAL(void *logger, int version)
Internal C entry point for creating IBuilder.
virtual void setKeepDimensions(bool keepDimensions)=0
Set the boolean that specifies whether or not to keep the reduced dimensions for the layer...
virtual void setBeta(float beta)=0
Set the LRN beta value.
int w() const
Get the width.
Definition: NvInfer.h:269
ReduceOperation
Enumerates the reduce operations that may be performed by a Reduce layer.
Definition: NvInfer.h:2892
Definition: NvInfer.h:2763
An internal error has occurred. Execution is unrecoverable.
virtual const char * getName() const =0
Return the name of the execution context.
A LRN layer in a network definition.
Definition: NvInfer.h:1331
int EnumMax< DeviceType >()
Maximum number of elements in DeviceType enum.
Definition: NvInfer.h:145
Descriptor for three-dimensional data.
Definition: NvInfer.h:276
virtual bool getInt8Mode() const =0
Query whether Int8 mode is used.
virtual int getNbLayers() const =0
Get the number of layers in the network.
virtual ElementWiseOperation getOperation() const =0
Get the binary operation for the layer.
virtual void setOperation(UnaryOperation op)=0
Set the unary operation for the layer.
virtual IPaddingLayer * addPadding(ITensor &input, DimsHW prePadding, DimsHW postPadding)=0
Add a padding layer to the network.
TensorLocation
The location for tensor data storage, device or host.
Definition: NvInfer.h:582
UnaryOp Operation Layer.
Definition: NvInfer.h:1770
Builds an engine from a network definition.
Definition: NvInfer.h:4397
virtual void markOutput(ITensor &tensor)=0
Mark a tensor as a network output.
virtual DimsHW getPadding() const =0
Get the padding of the deconvolution.
virtual void setOperation(RNNOperation op)=0
Set the operation of the RNN layer.
virtual void writeCalibrationCache(const void *ptr, std::size_t length)=0
Save a calibration cache.
virtual void setBiasWeights(Weights weights)=0
Set the bias weights for the convolution.
TENSORRTAPI nvinfer1::ILogger * getLogger()
Return the logger object.
virtual TopKOperation getOperation() const =0
Get the operation for the layer.
Layer that represents a TopK reduction.
Definition: NvInfer.h:3125
virtual RNNInputMode getInputMode() const =0
Get the input mode of the RNN layer.
int EnumMax< ActivationType >()
Maximum number of elements in ActivationType enum.
Definition: NvInfer.h:1151
virtual void setInt8Mode(bool mode)=0
Set whether or not Int8 kernels are permitted.
virtual void setReshapeDimensions(Dims dimensions)=0
Set the reshaped dimensions.
DataType type
The type of the weights.
Definition: NvInfer.h:514
virtual float getBeta() const =0
Get the LRN beta value.
virtual void setPadding(DimsHW padding)=0
Set the padding of the deconvolution.
virtual int enqueue(int batchSize, const void *const *inputs, void **outputs, void *workspace, cudaStream_t stream)=0
Execute the layer.
virtual TensorLocation getLocation() const =0
Get the storage location of a tensor.
An RNN layer in a network definition, version 2.
Definition: NvInfer.h:2296
Register the plugin creator to the registry. The static registry object will be instantiated when the ...
Definition: NvInfer.h:4836
virtual void setType(DataType type)=0
Set the data type of a tensor.
virtual ITensor * getOutput(int index) const =0
Get the output tensor specified by the given index.
virtual Permutation getSecondTranspose() const =0
Get the permutation applied by the second transpose operation.
int & h()
Get the height.
Definition: NvInfer.h:354
Elements correspond to different spatial data.
virtual DimsHW getPadding() const =0
Get the padding of the convolution.
virtual nvinfer1::INetworkDefinition * createNetwork()=0
Create a network definition object.
virtual int getNbOutputChannels() const =0
Get the number of output channels K from the fully connected layer.
virtual bool getTranspose(int index) const =0
Get the transpose flag for an input tensor.
virtual Weights getWeights() const =0
Get the weights for the layer.
virtual void setFp16Mode(bool mode)=0
Set whether or not 16-bit kernels are permitted.
virtual void reportLayerTime(const char *layerName, float ms)=0
Layer time reporting callback.
virtual void setK(int k)=0
Set the k value for the layer.
virtual IDeconvolutionLayer * addDeconvolution(ITensor &input, int nbOutputMaps, DimsHW kernelSize, Weights kernelWeights, Weights biasWeights)=0
Add a deconvolution layer to the network.
virtual IActivationLayer * addActivation(ITensor &input, ActivationType type)=0
Add an activation layer to the network.
virtual Weights getKernelWeights() const =0
Get the kernel weights.
virtual void setName(const char *name)=0
Set the name of the execution context.
virtual int getNbOutputs() const =0
Get the number of outputs in the network.
int & n()
Get the index count.
Definition: NvInfer.h:451
Data stored on device.
int EnumMax< TopKOperation >()
Maximum number of elements in TopKOperation enum.
Definition: NvInfer.h:3115
Elements correspond to different sequence values.
virtual std::size_t size() const =0
The size in bytes of the data that was allocated.
int EnumMax()
Maximum number of elements in an enumeration type.
virtual bool isDeviceTypeSet(const ILayer *layer) const =0
Whether the DeviceType has been explicitly set for this layer.
int c() const
Get the channel count.
Definition: NvInfer.h:347
int & w()
Get the width.
Definition: NvInfer.h:368
virtual IElementWiseLayer * addElementWise(ITensor &input1, ITensor &input2, ElementWiseOperation op)=0
Add an elementwise layer to the network.
virtual bool getAverageCountExcludesPadding() const =0
Get whether exclusive pooling uses as a denominator the overlap area between the window and the unpadd...
Layer that represents a reduction operator.
Definition: NvInfer.h:2912
Definition: NvInfer.h:4309
PoolingType
The type of pooling to perform in a pooling layer.
Definition: NvInfer.h:1191
int h() const
Get the height.
Definition: NvInfer.h:361
Definition: NvInfer.h:2814
Sum of the two elements.
virtual float getBlendFactor() const =0
Get the blending factor for the max_average_blend mode: max_average_blendPool = (1-blendFactor)*maxPo...
int order[Dims::MAX_DIMS]
Definition: NvInfer.h:3023
int EnumMax< RNNGateType >()
Maximum number of elements in RNNGateType enum.
Definition: NvInfer.h:2284
virtual void setMode(ScaleMode mode)=0
Set the scale mode.
virtual ITensor * getInput(int index) const =0
Get the layer input corresponding to the given index.
virtual bool supportsFormat(DataType type, PluginFormat format) const =0
Check format support.
virtual void setConvolutionOutputDimensionsFormula(IOutputDimensionsFormula *formula)=0
Set the convolution output dimensions formula.
Plugin creator class for user implemented layers.
Definition: NvInfer.h:2777
int & w()
Get the width.
Definition: NvInfer.h:262
virtual void setSequenceLengths(ITensor &seqLengths)=0
Specify individual sequence lengths in the batch with the ITensor pointed to by seqLengths.
Plugin factory for deserialization.
Definition: NvInfer.h:4681
virtual int getNbInputs() const =0
Get the number of inputs in the network.
virtual ITensor * getHiddenState() const =0
Get the initial hidden state of the RNN.
int length
Number of data entries in the Plugin attribute.
Definition: NvInfer.h:2752
virtual void setOperation(TopKOperation op)=0
Set the operation for the layer.
Descriptor for data with one channel dimension and two spatial dimensions.
Definition: NvInfer.h:308
virtual DimsHW getWindowSize() const =0
Get the window size for pooling.
The first element to the power of the second element.
A network definition for input to the builder.
Definition: NvInfer.h:3295
virtual int getNbLayers() const =0
Get the number of layers in the network.
virtual IHostMemory * serialize() const =0
Serialize the network to a stream.
virtual CalibrationAlgoType getAlgorithm()
Definition: NvInfer.h:4315
virtual IUnaryLayer * addUnary(ITensor &input, UnaryOperation operation)=0
Add a unary layer to the network.
Structure containing plugin attribute field names and associated data This information can be parsed ...
Definition: NvInfer.h:2734
virtual void setOperation(ReduceOperation op)=0
Set the reduce operation for the layer.
virtual int getTensorRTVersion() const
Return the version of the API the plugin creator was compiled with.
Definition: NvInfer.h:2783
virtual void destroy()=0
Destroy this object.
int EnumMax< CalibrationAlgoType >()
Maximum number of elements in CalibrationAlgoType enum.
Definition: NvInfer.h:4215
virtual RNNDirection getDirection() const =0
Get the direction of the RNN layer.
virtual DimsHW getPadding() const =0
Get the padding for pooling.
virtual size_t getSerializationSize()=0
Find the size of the serialization buffer required.
virtual ITensor * getHiddenState() const =0
Get the initial hidden state of the RNN.
virtual IConstantLayer * addConstant(Dims dimensions, Weights weights)=0
Add a constant layer to the network.
virtual void setGpuAllocator(IGpuAllocator *allocator)=0
Set the GPU allocator.
virtual bool getStrictTypeConstraints() const =0
Query whether or not type constraints are strict.
Divide the first element by the second.
virtual int getMinFindIterations() const =0
Query the number of minimization iterations.
virtual LayerType getType() const =0
Return the type of a layer.
virtual void setDeviceMemory(void *memory)=0
Set the device memory for use by this execution context.
virtual float getK() const =0
Get the LRN K value.
virtual void resetOutputType(int index)=0
Reset the output type for this layer.
virtual RNNDirection getDirection() const =0
Get the direction of the RNN layer.
Product of the two elements.
Dims2()
Construct an empty Dims2 object.
Definition: NvInfer.h:195
virtual IProfiler * getProfiler() const =0
Get the profiler.
TopKOperation
Enumerates the operations that may be performed by a TopK layer.
Definition: NvInfer.h:3108
virtual Weights getWeightsForGate(int layerIndex, RNNGateType gate, bool isW) const =0
Get the weight parameters for an individual gate in the RNN.
struct CUstream_st * cudaStream_t
Forward declaration of cudaStream_t.
Definition: NvInfer.h:98
Dims3(int d0, int d1, int d2)
Construct a Dims3 from 3 elements.
Definition: NvInfer.h:295
virtual void setStride(DimsHW stride)=0
Set the stride for pooling.
virtual int getSeqLength() const =0
Get the sequence length.
Descriptor for four-dimensional data.
Definition: NvInfer.h:382
virtual DimsHW getStride() const =0
Get the stride for pooling.
Elements correspond to different channels.
virtual void setStrictTypeConstraints(bool mode)=0
Set whether or not type constraints are strict.
int EnumMax< ReduceOperation >()
Maximum number of elements in ReduceOperation enum.
Definition: NvInfer.h:2902
int EnumMax< DimensionType >()
Maximum number of elements in DimensionType enum.
Definition: NvInfer.h:163
nvinfer1::Dims field type.
ActivationType
Enumerates the types of activation to perform in an activation layer.
Definition: NvInfer.h:1143
virtual void setDeconvolutionOutputDimensionsFormula(IOutputDimensionsFormula *formula)=0
Set the deconvolution output dimensions formula.
Descriptor for data with one index dimension, one channel dimension and two spatial dimensions...
Definition: NvInfer.h:416
virtual void setKernelWeights(Weights weights)=0
Set the kernel weights, given as a KxC matrix in row-major order.
virtual bool setDynamicRange(float min, float max)=0
Set user calibration scales.
virtual void setMaxBatchSize(int batchSize)=0
Set the maximum batch size.
virtual int getBindingIndex(const char *name) const =0
Retrieve the binding index for a named tensor.
virtual IFullyConnectedLayer * addFullyConnected(ITensor &input, int nbOutputs, Weights kernelWeights, Weights biasWeights)=0
Add a fully connected layer to the network.
TENSORRTAPI nvinfer1::IPluginRegistry * getPluginRegistry()
Return the plugin registry.
virtual void setGatherAxis(int axis)=0
Set the non-batch dimension axis to gather on. The axis must be less than the number of non-batch dim...
virtual int getK() const =0
Get the k value for the layer.
virtual const void * readCalibrationCache(std::size_t &length)=0
Load a calibration cache.
virtual void setBiasForGate(int layerIndex, RNNGateType gate, bool isW, Weights bias)=0
Set the bias parameters for an individual gate in the RNN.
virtual void setDeviceType(ILayer *layer, DeviceType deviceType)=0
Set the device that this layer must execute on.
virtual IReduceLayer * addReduce(ITensor &input, ReduceOperation operation, uint32_t reduceAxes, bool keepDimensions)=0
Add a reduce layer to the network.
Data stored on host.
virtual void setPadding(DimsHW padding)=0
Set the padding for pooling.
DimsHW()
Construct an empty DimsHW object.
Definition: NvInfer.h:225
virtual void setWindowSize(DimsHW windowSize)=0
Set the window size for pooling.
Base class for all layer classes in a network definition.
Definition: NvInfer.h:753
quantized INT8 format.
virtual void setTranspose(int index, bool val)=0
Set the transpose flag for an input tensor.
Dims4(int d0, int d1, int d2, int d3)
Construct a Dims4 from 4 elements.
Definition: NvInfer.h:402
int EnumMax< PoolingType >()
Maximum number of elements in PoolingType enum.
Definition: NvInfer.h:1199
int & h()
Get the height.
Definition: NvInfer.h:479
virtual int getWindowSize() const =0
Get the LRN window size.
int & h()
Get the height.
Definition: NvInfer.h:248
virtual void free(void *memory)=0
virtual void reset(nvinfer1::INetworkDefinition &network)=0
Resets the builder state.
virtual void setActivationType(ActivationType type)=0
Set the type of activation to be performed.
TENSORRTAPI int getInferLibVersion()
Return the library version number.
virtual std::size_t getHiddenSize() const =0
Get the size of the hidden layers.
int & c()
Get the channel count.
Definition: NvInfer.h:465
virtual void setStride(DimsHW stride)=0
Set the stride of the deconvolution.
Structure to define the dimensions of a tensor.
Definition: NvInfer.h:176
Network iterates from first to last and vice versa and outputs concatenated.
#define NV_TENSORRT_PATCH
TensorRT patch version.
Definition: NvInfer.h:58
virtual IRNNLayer * addRNN(ITensor &inputs, int layerCount, std::size_t hiddenSize, int maxSeqLen, RNNOperation op, RNNInputMode mode, RNNDirection dir, Weights weights, Weights bias)=0
Add a layerCount-deep RNN layer to the network with a sequence length of maxSeqLen and hiddenSize in...
virtual bool precisionIsSet() const =0
whether the computational precision has been set for this layer
virtual void setReduceAxes(uint32_t reduceAxes)=0
Set which axes to reduce for the layer.
virtual void setGpuAllocator(IGpuAllocator *allocator)=0
Set the GPU allocator.
Layer type for shuffling data.
Definition: NvInfer.h:3026
virtual bool platformHasFastFp16() const =0
Determine whether the platform has fast native fp16.
DimsCHW(int channels, int height, int width)
Construct a DimsCHW given channel count, height and width.
Definition: NvInfer.h:328
A elementwise layer in a network definition.
Definition: NvInfer.h:1743
A Pooling layer in a network definition.
Definition: NvInfer.h:1212
virtual void setDefaultDeviceType(DeviceType deviceType)=0
Sets the default DeviceType to be used by the builder. It ensures that all the layers that can run on...
#define _TENSORRT_FINAL
Defines which symbols are exported.
Definition: NvInfer.h:68
virtual RNNOperation getOperation() const =0
Get the operation of the RNN layer.
virtual void serialize(void *buffer)=0
Serialize the layer.
virtual void setDilation(DimsHW dims)=0
Set the dilation for a convolution.
virtual void setOperation(RNNOperation op)=0
Set the operation of the RNN layer.
virtual void configureWithFormat(const Dims *inputDims, int nbInputs, const Dims *outputDims, int nbOutputs, DataType type, PluginFormat format, int maxBatchSize)=0
Configure the layer.
virtual DimsHW getPrePadding() const =0
Get the padding that is applied at the start of the tensor.
virtual void setDirection(RNNDirection op)=0
Set the direction of the RNN layer.
int d[MAX_DIMS]
The extent of each dimension.
Definition: NvInfer.h:181
Application-implemented interface to compute layer output sizes.
Definition: NvInfer.h:2458
Minimum of the two elements.
virtual Weights getBiasWeights() const =0
Get the bias weights.
#define NV_TENSORRT_MINOR
TensorRT minor version.
Definition: NvInfer.h:57
virtual int getNbBindings() const =0
Get the number of binding indices.
virtual void setPadding(DimsHW padding)=0
Set the padding of the convolution.
virtual Dims getDimensions() const =0
Get the dimensions of a tensor.
virtual void removeTensor(ITensor &tensor)=0
remove a tensor from the network definition.
ElementWiseOperation
Enumerates the binary operations that may be performed by an ElementWise layer.
Definition: NvInfer.h:1717
int64_t count
The number of weights in the array.
Definition: NvInfer.h:516
Three-gate network consisting of Gated Recurrent Units.
virtual const char * getName() const =0
Get the tensor name.
virtual const char * getPluginType() const =0
Return the plugin type. Should match the plugin name returned by the corresponding plugin creator...
RNNGateType
Identifies an individual gate within an RNN cell.
Definition: NvInfer.h:2272
Network iterates from first input to last input.
virtual void setBiasWeights(Weights weights)=0
Set the bias weights for the deconvolution.
int & c()
Get the channel count.
Definition: NvInfer.h:340
virtual void setSecondTranspose(Permutation permutation)=0
Set the permutation applied by the second transpose operation.
virtual bool getKeepDimensions() const =0
Get the boolean that specifies whether or not to keep the reduced dimensions for the layer...
virtual bool isNetworkOutput() const =0
Whether the tensor is a network output.
Dims3()
Construct an empty Dims3 object.
Definition: NvInfer.h:282
virtual bool getBroadcastAcrossBatch() const =0
Check if tensor is broadcast across the batch.
virtual ITensor * getCellState() const =0
Get the initial cell state of the RNN.
virtual void setCellState(ITensor &cell)=0
Set the initial cell state of the LSTM with the provided cell ITensor.
A tensor in a network definition.
Definition: NvInfer.h:601
virtual void destroy()=0
Destroy this object.
virtual void setLocation(TensorLocation location)=0
Set the storage location of a tensor.
virtual IPluginCreator *const * getPluginCreatorList(int *numCreators) const =0
Return all the registered plugin creators and the number of registered plugin creators. Returns nullptr if none found.
int EnumMax< UnaryOperation >()
Maximum number of elements in UnaryOperation enum.
Definition: NvInfer.h:2856
virtual void setBlendFactor(float blendFactor)=0
Set the blending factor for the max_average_blend mode: max_average_blendPool = (1-blendFactor)*maxPo...
An array of weights used as a layer parameter.
Definition: NvInfer.h:511
int & w()
Get the width.
Definition: NvInfer.h:493
const char * name
Plugin field attribute name.
Definition: NvInfer.h:2739
int h() const
Get the height.
Definition: NvInfer.h:255
virtual int getDataLength() const =0
Get the length of the data being processed by the RNN for use in computing other values.
virtual DeviceType getDeviceType(const ILayer *layer) const =0
Get the device that this layer executes on.
virtual nvinfer1::ICudaEngine * deserializeCudaEngine(const void *blob, std::size_t size, IPluginFactory *pluginFactory)=0
Deserialize an engine from a stream.
virtual bool registerCreator(IPluginCreator &)=0
Register a plugin creator. Returns false if one with same type is already registered.
virtual nvinfer1::ICudaEngine * buildCudaEngine(nvinfer1::INetworkDefinition &network)=0
Build a CUDA engine from a network definition.
Dims2(int d0, int d1)
Construct a Dims2 from 2 elements.
Definition: NvInfer.h:207
virtual Weights getShift() const =0
Get the shift value.
virtual void setAxis(int axis)=0
Set the axis along which concatenation occurs.
virtual int getNbOutputMaps() const =0
Get the number of output feature maps for the deconvolution.
Dims4()
Construct an empty Dims4 object.
Definition: NvInfer.h:388
virtual void setScale(Weights scale)=0
Set the scale value.
virtual void setInput(int index, ITensor &tensor)=0
replace an input of this layer with a specific tensor
virtual IPoolingLayer * addPooling(ITensor &input, PoolingType type, DimsHW windowSize)=0
Add a pooling layer to the network.
int nbDims
The number of dimensions.
Definition: NvInfer.h:180
virtual bool platformHasFastInt8() const =0
Determine whether the platform has fast native int8.
virtual DimsHW getStride() const =0
Get the stride of the convolution.
Application-implemented interface for calibration.
Definition: NvInfer.h:4231
Application-implemented logging interface for the builder, engine and runtime.
Definition: NvInfer.h:4748
virtual DataType getOutputType(int index) const =0
get the output type of this layer
virtual IPluginLayer * addPluginExt(ITensor *const *inputs, int nbInputs, IPluginExt &plugin)=0
Add a plugin layer to the network using an IPluginExt interface.
virtual void setDirection(RNNDirection op)=0
Set the direction of the RNN layer.
virtual void setInt8Calibrator(IInt8Calibrator *calibrator)=0
Set Int8 Calibration interface.
virtual bool outputTypeIsSet(int index) const =0
whether the output type has been set for this layer
DimsHW(int height, int width)
Construct a DimsHW given height and width.
Definition: NvInfer.h:237
virtual void * data() const =0
A pointer to the raw data that is owned by the library.
Identical coefficients across all elements of the tensor.
int EnumMax< ElementWiseOperation >()
Maximum number of elements in ElementWiseOperation enum.
Definition: NvInfer.h:1729
Plugin class for user-implemented layers.
Definition: NvInfer.h:2613
Layer that represents a padding operation.
Definition: NvInfer.h:2969
virtual void setBiasWeights(Weights weights)=0
Set the bias weights.
virtual IIdentityLayer * addIdentity(ITensor &input)=0
Add an identity layer.
virtual void setNbOutputMaps(int nbOutputMaps)=0
Set the number of output feature maps for the deconvolution.
virtual void setNbOutputChannels(int nbOutputs)=0
Set the number of output channels K from the fully connected layer.
virtual void setKernelWeights(Weights weights)=0
Set the kernel weights for the convolution.
virtual Weights getBiasWeights() const =0
Get the bias weights for the convolution.
virtual size_t getWorkspaceSize(int maxBatchSize) const =0
Find the workspace size required by the layer.
virtual uint32_t getReduceAxes() const =0
Get the axes over which to reduce for the layer.
virtual ITensor * getOutput(int index) const =0
Get the layer output corresponding to the given index.
virtual IPlugin & getPlugin()=0
Get the plugin for the layer.
virtual void setInputMode(RNNInputMode op)=0
Set the input mode of the RNN layer.
virtual void setNbGroups(int nbGroups)=0
Set the number of groups for a convolution.
virtual void setCellState(ITensor &cell)=0
Set the initial cell state of the RNN with the provided cell ITensor.
virtual void setKernelSize(DimsHW kernelSize)=0
Set the HW kernel size of the convolution.
CalibrationAlgoType
Version of calibration algorithm to use.
Definition: NvInfer.h:4208
virtual void setStride(DimsHW stride)=0
Set the stride of the convolution.
virtual float getAlpha() const =0
Get the LRN alpha value.
virtual void setReduceAxes(uint32_t reduceAxes)=0
Set the axes over which to reduce.
Informational messages.
virtual CalibrationAlgoType getAlgorithm()
Definition: NvInfer.h:4300
virtual IConvolutionLayer * addConvolution(ITensor &input, int nbOutputMaps, DimsHW kernelSize, Weights kernelWeights, Weights biasWeights)=0
Add a convolution layer to the network.
virtual void setFirstTranspose(Permutation permutation)=0
Set the permutation applied by the first transpose operation.
DimsNCHW()
Construct an empty DimsNCHW object.
Definition: NvInfer.h:422
Class to handle library allocated memory that is accessible to the user.
Definition: NvInfer.h:527
LayerType
The type values of layer classes.
Definition: NvInfer.h:545
int EnumMax< ScaleMode >()
Maximum number of elements in ScaleMode enum.
Definition: NvInfer.h:1411
A layer that represents the identity function.
Definition: NvInfer.h:3241
virtual bool canRunOnDLA(const ILayer *layer) const =0
Checks if a layer can run on DLA.
virtual DimsHW compute(DimsHW inputDims, DimsHW kernelSize, DimsHW stride, DimsHW padding, DimsHW dilation, const char *layerName) const =0
Application-implemented interface to compute the HW output dimensions of a layer from the layer input...
virtual void setDimensions(Dims dimensions)=0
Set the dimensions for the layer.
virtual Weights getBiasWeights() const =0
Get the bias weights for the deconvolution.
virtual void setProfiler(IProfiler *)=0
Set the profiler.
virtual void setWeights(Weights weights)=0
Set the weights for the layer.
RNNInputMode
Enumerates the RNN input modes that may occur with an RNN layer.
Definition: NvInfer.h:1919
A RNN layer in a network definition.
Definition: NvInfer.h:1940
virtual IPluginCreator * getPluginCreator(const char *pluginType, const char *pluginVersion)=0
Return plugin creator based on type and version.
virtual void setName(const char *name)=0
Set the name of a layer.
virtual ActivationType getActivationType() const =0
Get the type of activation to be performed.
virtual Dims getDimensions() const =0
Get the dimensions for the layer.
virtual void setDebugSync(bool sync)=0
Set the debug sync flag.
virtual void destroy()=0
Destroy this object.
virtual void unmarkOutput(ITensor &tensor)=0
unmark a tensor as a network output.
virtual void setPostPadding(DimsHW padding)=0
Set the padding that is applied at the end of the tensor.
Layer type for plugins.
Definition: NvInfer.h:2695
virtual UnaryOperation getOperation() const =0
Get the unary operation for the layer.
DimensionType
The type of data encoded across this dimension.
Definition: NvInfer.h:154
virtual IConcatenationLayer * addConcatenation(ITensor *const *inputs, int nbInputs)=0
Add a concatenation layer to the network.
Four-gate LSTM network w/o peephole connections.
virtual DimsHW getPostPadding() const =0
Get the padding that is applied at the end of the tensor.
virtual const ICudaEngine & getEngine() const =0
Get the associated engine.
virtual void * allocate(uint64_t size, uint64_t alignment, uint32_t flags)=0
virtual void setHiddenState(ITensor &hidden)=0
Set the initial hidden state of the RNN with the provided hidden ITensor.
virtual TensorLocation getLocation(int bindingIndex) const =0
Get location of binding.
virtual ScaleMode getMode() const =0
Get the scale mode.
virtual ILRNLayer * addLRN(ITensor &input, int window, float alpha, float beta, float k)=0
Add a LRN layer to the network.
virtual int getTensorRTVersion() const
Return the API version with which this plugin was built.
Definition: NvInfer.h:2621
virtual void setMaxWorkspaceSize(std::size_t workspaceSize)=0
Set the maximum workspace size.
virtual void setShift(Weights shift)=0
Set the shift value.
virtual size_t getDeviceMemorySize() const =0
Return the amount of device memory required by an execution context.
virtual Weights getKernelWeights() const =0
Get the kernel weights for the deconvolution.
Application-implemented class for controlling allocation on the GPU.
Definition: NvInfer.h:4363
Context for executing inference using an engine.
Definition: NvInfer.h:3943
virtual ITensor * getInput(int index) const =0
Get the input tensor specified by the given index.
virtual int getMaxDLABatchSize(DeviceType deviceType) const =0
Get the maximum batch size DLA can support. For any tensor the total volume of index dimensions combi...
virtual void setPower(Weights power)=0
Set the power value.
virtual double getRegressionCutoff() const =0
The fraction (between 0 and 1) of the maximum used to define the regression cutoff when using regress...
virtual void setHalf2Mode(bool mode)=0
Set whether half2 mode is used.
virtual void setOutputType(int index, DataType dataType)=0
Set the output type of this layer.
virtual std::size_t getMaxWorkspaceSize() const =0
Get the maximum workspace size.
virtual int getAxis() const =0
Get the axis along which concatenation occurs.
Descriptor for two-dimensional spatial data.
Definition: NvInfer.h:219
UnaryOperation
Enumerates the unary operations that may be performed by a Unary layer.
Definition: NvInfer.h:2845
virtual void setAverageFindIterations(int avgFind)=0
Set the number of averaging iterations used when timing layers.
virtual int getNbOutputMaps() const =0
Get the number of output maps for the convolution.
virtual DeviceType getDefaultDeviceType() const =0
Get the default DeviceType which was set by setDefaultDeviceType.
virtual RNNOperation getOperation() const =0
Get the operation of the RNN layer.
DeviceType
The device that this layer/network will execute on.
Definition: NvInfer.h:137
virtual bool getHalf2Mode() const =0
Query whether half2 mode is used.
virtual int getNbInputs() const =0
Get the number of inputs of a layer.
virtual ISoftMaxLayer * addSoftMax(ITensor &input)=0
Add a SoftMax layer to the network.
Elements correspond to different batch index.
virtual Weights getBiasForGate(int layerIndex, RNNGateType gate, bool isW) const =0
Get the bias parameters for an individual gate in the RNN.
Descriptor for two-dimensional data.
Definition: NvInfer.h:189
virtual int getMaxBatchSize() const =0
Get the maximum batch size which can be used for inference.
virtual void setName(const char *name)=0
Set the tensor name.
virtual IOutputDimensionsFormula & getPoolingOutputDimensionsFormula() const =0
Get the pooling output dimensions formula.
virtual int getNbOutputs() const =0
Get the number of outputs of a layer.
virtual IGatherLayer * addGather(ITensor &data, ITensor &indices, int axis)=0
Add a gather layer to the network.
virtual IOutputDimensionsFormula & getDeconvolutionOutputDimensionsFormula() const =0
Get the deconvolution output dimensions formula.
virtual void setDimensions(Dims dimensions)=0
Set the dimensions of a tensor.
virtual void setWindowSize(int windowSize)=0
Set the LRN window size.
virtual Weights getKernelWeights() const =0
Get the kernel weights for the convolution.
virtual CalibrationAlgoType getAlgorithm()=0
Get the algorithm used by this calibrator.
Application-implemented interface for profiling.
Definition: NvInfer.h:3918
virtual RNNInputMode getInputMode() const =0
Get the input mode of the RNN layer.
A concatenation layer in a network definition.
Definition: NvInfer.h:1547
virtual void setK(float k)=0
Set the LRN K value.
virtual void setNbGroups(int nbGroups)=0
Set the number of groups for a deconvolution.
const void * data
Plugin field attribute data.
Definition: NvInfer.h:2743
virtual IPluginLayer * addPlugin(ITensor *const *inputs, int nbInputs, IPlugin &plugin)=0
Add a plugin layer to the network.
int EnumMax< RNNDirection >()
Maximum number of elements in RNNDirection enum.
Definition: NvInfer.h:1899
virtual const void * readHistogramCache(std::size_t &length)=0
Load a histogram.
virtual void allowGPUFallback(bool setFallBackMode)=0
Sets the builder to use GPU if a layer that was supposed to run on DLA can not run on DLA...
int nbFields
Number of PluginField entries.
Definition: NvInfer.h:2765
virtual Permutation getFirstTranspose() const =0
Get the permutation applied by the first transpose operation.
virtual const char * getPluginVersion() const =0
Return the plugin version.
virtual IExecutionContext * createExecutionContextWithoutDeviceMemory()=0
create an execution context without any device memory allocated
virtual void setKernelSize(DimsHW kernelSize)=0
Set the HW kernel size of the convolution.
virtual void setWeights(Weights weights)=0
Set the weight parameters for the RNN.
virtual Weights getWeights() const =0
Get the W weights for the RNN.
virtual const char * getPluginName() const =0
Return the plugin name.
virtual void terminate()=0
Release resources acquired during plugin layer initialization. This is called when the engine is dest...
virtual PoolingType getPoolingType() const =0
Get the type of pooling to be performed.
PluginFieldType type
Plugin field attribute type.
Definition: NvInfer.h:2748
A deconvolution layer in a network definition.
Definition: NvInfer.h:1578
virtual IShuffleLayer * addShuffle(ITensor &input)=0
Add a shuffle layer to the network.
virtual void setPoolingType(PoolingType type)=0
Set the type of pooling to be performed.
virtual IOutputDimensionsFormula & getConvolutionOutputDimensionsFormula() const =0
Get the convolution output dimensions formula.
virtual void setDebugSync(bool sync)=0
Set whether the builder should use debug synchronization.
virtual uint32_t getReduceAxes() const =0
Get the axes to reduce for the layer.
virtual int initialize()=0
Initialize the layer for execution. This is called when the engine is created.
Definition: NvInfer.h:4294
int EnumMax< RNNInputMode >()
Maximum number of elements in RNNInputMode enum.
Definition: NvInfer.h:1926