13#ifndef NV_INFER_RUNTIME_H
14#define NV_INFER_RUNTIME_H
22#include "NvInferImpl.h"
28class IExecutionContext;
31class IEngineInspector;
107 static constexpr int32_t kVALUE = 3;
151 return mImpl->data();
155 std::size_t
size() const noexcept
157 return mImpl->size();
163 return mImpl->type();
227 static constexpr int32_t kVALUE = 2;
249 return mImpl->isConstant();
256 return mImpl->getConstantValue();
287 return mImpl->constant(value);
295 return mImpl->operation(op, first, second);
380 int32_t outputIndex,
DimsExprs const* inputs, int32_t nbInputs,
IExprBuilder& exprBuilder) noexcept = 0;
385 static constexpr int32_t kFORMAT_COMBINATION_LIMIT = 100;
419 virtual
bool supportsFormatCombination(
420 int32_t pos,
PluginTensorDesc const* inOut, int32_t nbInputs, int32_t nbOutputs) noexcept = 0;
473 int32_t nbOutputs) const noexcept = 0;
488 void const* const* inputs,
void* const* outputs,
void* workspace, cudaStream_t stream) noexcept = 0;
498 int32_t getTensorRTVersion() const noexcept
override
509 bool const*,
PluginFormat, int32_t)
noexcept override final
518 Dims getOutputDimensions(int32_t,
Dims const*, int32_t)
noexcept override final
523 bool isOutputBroadcastAcrossBatch(int32_t,
bool const*, int32_t)
const noexcept override final
528 bool canBroadcastInputAcrossBatch(int32_t)
const noexcept override final
533 size_t getWorkspaceSize(int32_t)
const noexcept override final
538 int32_t enqueue(int32_t,
void const*
const*,
void*
const*,
void*, cudaStream_t)
noexcept override final
638 void const* blob, std::
size_t size, IPluginFactory* pluginFactory) noexcept
640 return mImpl->deserializeCudaEngine(blob, size,
nullptr);
655 mImpl->setDLACore(dlaCore);
664 return mImpl->getDLACore();
672 return mImpl->getNbDLACores();
698 mImpl->setGpuAllocator(allocator);
717 mImpl->setErrorRecorder(recorder);
732 return mImpl->getErrorRecorder();
747 return mImpl->deserializeCudaEngine(blob, size,
nullptr);
757 return mImpl->getLogger();
771 return mImpl->setMaxThreads(maxThreads);
785 return mImpl->getMaxThreads();
816 return mImpl->setWeights(layerName, role, weights);
831 return mImpl->refitCudaEngine();
852 return mImpl->getMissing(size, layerNames, roles);
869 return mImpl->getAll(size, layerNames, roles);
896 return mImpl->setDynamicRange(tensorName, min, max);
908 return mImpl->getDynamicRangeMin(tensorName);
920 return mImpl->getDynamicRangeMax(tensorName);
936 return mImpl->getTensorsWithDynamicRange(size, tensorNames);
955 mImpl->setErrorRecorder(recorder);
970 return mImpl->getErrorRecorder();
988 return mImpl->setNamedWeights(name, weights);
1008 return mImpl->getMissingWeights(size, weightsNames);
1024 return mImpl->getAllWeights(size, weightsNames);
1034 return mImpl->getLogger();
1048 return mImpl->setMaxThreads(maxThreads);
1062 return mImpl->getMaxThreads();
1149 return mImpl->setDimensions(inputName, select, dims);
1159 return mImpl->getDimensions(inputName, select);
1201 char const* inputName,
OptProfileSelector select, int32_t
const* values, int32_t nbValues)
noexcept
1203 return mImpl->setShapeValues(inputName, select, values, nbValues);
1214 return mImpl->getNbShapeValues(inputName);
1224 return mImpl->getShapeValues(inputName, select);
1242 return mImpl->setExtraMemoryTarget(target);
1250 return mImpl->getExtraMemoryTarget();
1266 return mImpl->isValid();
1357 int32_t getNbBindings() const noexcept
1359 return mImpl->getNbBindings();
1381 return mImpl->getBindingIndex(name);
1401 return mImpl->getBindingName(bindingIndex);
1414 return mImpl->bindingIsInput(bindingIndex);
1439 return mImpl->getBindingDimensions(bindingIndex);
1452 return mImpl->getBindingDataType(bindingIndex);
1468 return mImpl->getMaxBatchSize();
1482 return mImpl->getNbLayers();
1496 return mImpl->serialize();
1512 return mImpl->createExecutionContext();
1539 return mImpl->getLocation(bindingIndex);
1548 return mImpl->createExecutionContextWithoutDeviceMemory();
1558 return mImpl->getDeviceMemorySize();
1568 return mImpl->isRefittable();
1582 return mImpl->getBindingBytesPerComponent(bindingIndex);
1596 return mImpl->getBindingComponentsPerElement(bindingIndex);
1606 return mImpl->getBindingFormat(bindingIndex);
1625 return mImpl->getBindingFormatDesc(bindingIndex);
1637 return mImpl->getBindingVectorizedDim(bindingIndex);
1652 return mImpl->getName();
1663 return mImpl->getNbOptimizationProfiles();
1690 return mImpl->getProfileDimensions(bindingIndex, profileIndex, select);
1717 return mImpl->getProfileShapeValues(profileIndex, inputIndex, select);
1753 return mImpl->isShapeBinding(bindingIndex);
1767 return mImpl->isExecutionBinding(bindingIndex);
1782 return mImpl->getEngineCapability();
1800 return mImpl->setErrorRecorder(recorder);
1815 return mImpl->getErrorRecorder();
1834 return mImpl->hasImplicitBatchDimension();
1849 return mImpl->getTacticSources();
1860 return mImpl->getProfilingVerbosity();
1870 return mImpl->createEngineInspector();
1916 return mImpl->execute(batchSize, bindings);
1949 int32_t batchSize,
void*
const* bindings, cudaStream_t stream, cudaEvent_t* inputConsumed)
noexcept
1951 return mImpl->enqueue(batchSize, bindings, stream, inputConsumed);
1964 mImpl->setDebugSync(sync);
1974 return mImpl->getDebugSync();
1984 mImpl->setProfiler(profiler);
1994 return mImpl->getProfiler();
2004 return mImpl->getEngine();
2028 mImpl->setName(name);
2038 return mImpl->getName();
2054 mImpl->setDeviceMemory(memory);
2075 return mImpl->getStrides(bindingIndex);
2118 return mImpl->setOptimizationProfile(profileIndex);
2130 return mImpl->getOptimizationProfile();
2167 return mImpl->setBindingDimensions(bindingIndex, dimensions);
2197 return mImpl->getBindingDimensions(bindingIndex);
2227 return mImpl->setInputShapeBinding(bindingIndex, data);
2249 return mImpl->getShapeBinding(bindingIndex, data);
2264 return mImpl->allInputDimensionsSpecified();
2279 return mImpl->allInputShapesSpecified();
2298 mImpl->setErrorRecorder(recorder);
2313 return mImpl->getErrorRecorder();
2330 return mImpl->executeV2(bindings);
2356 bool enqueueV2(
void*
const* bindings, cudaStream_t stream, cudaEvent_t* inputConsumed)
noexcept
2358 return mImpl->enqueueV2(bindings, stream, inputConsumed);
2406 return mImpl->setOptimizationProfileAsync(profileIndex, stream);
2421 mImpl->setEnqueueEmitsProfile(enqueueEmitsProfile);
2432 return mImpl->getEnqueueEmitsProfile();
2461 return mImpl->reportToProfiler();
2523 return mImpl->setExecutionContext(context);
2535 return mImpl->getExecutionContext();
2560 return mImpl->getLayerInformation(layerIndex, format);
2585 return mImpl->getEngineInformation(format);
2604 mImpl->setErrorRecorder(recorder);
2619 return mImpl->getErrorRecorder();
2632extern "C" TENSORRTAPI void* createInferRuntime_INTERNAL(
void* logger, int32_t version)
noexcept;
2638extern "C" TENSORRTAPI void* createInferRefitter_INTERNAL(
void* engine,
void* logger, int32_t version)
noexcept;
2672inline IRefitter* createInferRefitter(ICudaEngine& engine, ILogger& logger)
noexcept
2674 return static_cast<IRefitter*
>(createInferRefitter_INTERNAL(&engine, &logger,
NV_TENSORRT_VERSION));
2690template <
typename T>
2706#define REGISTER_TENSORRT_PLUGIN(name) \
2707 static nvinfer1::PluginRegistrar<name> pluginRegistrar##name {}
nvinfer1::ILogger * getLogger() noexcept
Return the logger object.
nvinfer1::IPluginRegistry * getPluginRegistry() noexcept
Return the plugin registry.
#define TENSORRTAPI
Definition: NvInferRuntimeCommon.h:54
#define NV_TENSORRT_VERSION
Definition: NvInferRuntimeCommon.h:73
#define TRT_DEPRECATED
Definition: NvInferRuntimeCommon.h:40
#define TRT_DEPRECATED_ENUM
Definition: NvInferRuntimeCommon.h:41
Structure to define the dimensions of a tensor.
Definition: NvInferRuntimeCommon.h:153
static constexpr int32_t MAX_DIMS
The maximum rank (number of dimensions) supported for a tensor.
Definition: NvInferRuntimeCommon.h:156
Definition: NvInferRuntime.h:309
int32_t nbDims
The number of dimensions.
Definition: NvInferRuntime.h:311
An engine for executing inference on a built network, with functionally unsafe features.
Definition: NvInferRuntime.h:1343
int32_t getBindingBytesPerComponent(int32_t bindingIndex) const noexcept
Return the number of bytes per component of an element.
Definition: NvInferRuntime.h:1580
int32_t getBindingComponentsPerElement(int32_t bindingIndex) const noexcept
Return the number of components included in one element.
Definition: NvInferRuntime.h:1594
bool isShapeBinding(int32_t bindingIndex) const noexcept
True if tensor is required as input for shape calculations or output from them.
Definition: NvInferRuntime.h:1751
bool hasImplicitBatchDimension() const noexcept
Query whether the engine was built with an implicit batch dimension.
Definition: NvInferRuntime.h:1832
int32_t const * getProfileShapeValues(int32_t profileIndex, int32_t inputIndex, OptProfileSelector select) const noexcept
Get minimum / optimum / maximum values for an input shape binding under an optimization profile.
Definition: NvInferRuntime.h:1714
EngineCapability getEngineCapability() const noexcept
Determine what execution capability this engine has.
Definition: NvInferRuntime.h:1780
TRT_DEPRECATED void destroy() noexcept
Destroy this object.
Definition: NvInferRuntime.h:1522
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:1813
TensorFormat getBindingFormat(int32_t bindingIndex) const noexcept
Return the binding format.
Definition: NvInferRuntime.h:1604
apiv::VCudaEngine * mImpl
Definition: NvInferRuntime.h:1874
TensorLocation getLocation(int32_t bindingIndex) const noexcept
Get location of binding.
Definition: NvInferRuntime.h:1537
Dims getProfileDimensions(int32_t bindingIndex, int32_t profileIndex, OptProfileSelector select) const noexcept
Get the minimum / optimum / maximum dimensions for a particular binding under an optimization profile...
Definition: NvInferRuntime.h:1688
Dims getBindingDimensions(int32_t bindingIndex) const noexcept
Get the dimensions of a binding.
Definition: NvInferRuntime.h:1437
int32_t getBindingVectorizedDim(int32_t bindingIndex) const noexcept
Return the dimension index that the buffer is vectorized.
Definition: NvInferRuntime.h:1635
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:1798
char const * getBindingName(int32_t bindingIndex) const noexcept
Retrieve the name corresponding to a binding index.
Definition: NvInferRuntime.h:1399
size_t getDeviceMemorySize() const noexcept
Return the amount of device memory required by an execution context.
Definition: NvInferRuntime.h:1556
TacticSources getTacticSources() const noexcept
return the tactic sources required by this engine.
Definition: NvInferRuntime.h:1847
virtual ~ICudaEngine() noexcept=default
char const * getName() const noexcept
Returns the name of the network associated with the engine.
Definition: NvInferRuntime.h:1650
ProfilingVerbosity getProfilingVerbosity() const noexcept
Return the ProfilingVerbosity the builder config was set to when the engine was built.
Definition: NvInferRuntime.h:1858
int32_t getBindingIndex(char const *name) const noexcept
Retrieve the binding index for a named tensor.
Definition: NvInferRuntime.h:1379
char const * getBindingFormatDesc(int32_t bindingIndex) const noexcept
Return the human readable description of the tensor format.
Definition: NvInferRuntime.h:1623
IHostMemory * serialize() const noexcept
Serialize the network to a stream.
Definition: NvInferRuntime.h:1494
IExecutionContext * createExecutionContextWithoutDeviceMemory() noexcept
create an execution context without any device memory allocated
Definition: NvInferRuntime.h:1546
DataType getBindingDataType(int32_t bindingIndex) const noexcept
Determine the required data type for a buffer from its binding index.
Definition: NvInferRuntime.h:1450
IExecutionContext * createExecutionContext() noexcept
Create an execution context.
Definition: NvInferRuntime.h:1510
IEngineInspector * createEngineInspector() const noexcept
Create a new engine inspector which prints the layer information in an engine or an execution context...
Definition: NvInferRuntime.h:1868
TRT_DEPRECATED int32_t getMaxBatchSize() const noexcept
Get the maximum batch size which can be used for inference. Should only be called if the engine is bu...
Definition: NvInferRuntime.h:1466
int32_t getNbOptimizationProfiles() const noexcept
Get the number of optimization profiles defined for this engine.
Definition: NvInferRuntime.h:1661
int32_t getNbLayers() const noexcept
Get the number of layers in the network.
Definition: NvInferRuntime.h:1480
bool bindingIsInput(int32_t bindingIndex) const noexcept
Determine whether a binding is an input binding.
Definition: NvInferRuntime.h:1412
bool isExecutionBinding(int32_t bindingIndex) const noexcept
True if pointer to tensor data is required for execution phase, false if nullptr can be supplied.
Definition: NvInferRuntime.h:1765
bool isRefittable() const noexcept
Return true if an engine can be refit.
Definition: NvInferRuntime.h:1566
Definition: NvInferRuntime.h:244
bool isConstant() const noexcept
Return true if expression is a build-time constant.
Definition: NvInferRuntime.h:247
virtual ~IDimensionExpr() noexcept=default
apiv::VDimensionExpr * mImpl
Definition: NvInferRuntime.h:260
int32_t getConstantValue() const noexcept
Definition: NvInferRuntime.h:254
An engine inspector which prints out the layer information of an engine or an execution context.
Definition: NvInferRuntime.h:2505
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:2617
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:2602
AsciiChar const * getEngineInformation(LayerInformationFormat format) const noexcept
Get a string describing the information about all the layers in the current engine or the execution c...
Definition: NvInferRuntime.h:2583
IExecutionContext const * getExecutionContext() const noexcept
Get the context currently being inspected.
Definition: NvInferRuntime.h:2533
apiv::VEngineInspector * mImpl
Definition: NvInferRuntime.h:2623
virtual ~IEngineInspector() noexcept=default
AsciiChar const * getLayerInformation(int32_t layerIndex, LayerInformationFormat format) const noexcept
Get a string describing the information about a specific layer in the current engine or the execution...
Definition: NvInferRuntime.h:2558
Reference counted application-implemented error reporting interface for TensorRT objects.
Definition: NvInferRuntimeCommon.h:1665
Context for executing inference using an engine, with functionally unsafe features.
Definition: NvInferRuntime.h:1888
TRT_DEPRECATED bool enqueue(int32_t batchSize, void *const *bindings, cudaStream_t stream, cudaEvent_t *inputConsumed) noexcept
Asynchronously execute inference on a batch.
Definition: NvInferRuntime.h:1948
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:2311
bool reportToProfiler() const noexcept
Calculate layer timing info for the current optimization profile in IExecutionContext and update the ...
Definition: NvInferRuntime.h:2459
virtual ~IExecutionContext() noexcept=default
void setDeviceMemory(void *memory) noexcept
Set the device memory for use by this execution context.
Definition: NvInferRuntime.h:2052
Dims getBindingDimensions(int32_t bindingIndex) const noexcept
Get the dynamic dimensions of a binding.
Definition: NvInferRuntime.h:2195
bool getShapeBinding(int32_t bindingIndex, int32_t *data) const noexcept
Get values of an input tensor required for shape calculations or an output tensor produced by shape c...
Definition: NvInferRuntime.h:2247
char const * getName() const noexcept
Return the name of the execution context.
Definition: NvInferRuntime.h:2036
void setDebugSync(bool sync) noexcept
Set the debug sync flag.
Definition: NvInferRuntime.h:1962
bool enqueueV2(void *const *bindings, cudaStream_t stream, cudaEvent_t *inputConsumed) noexcept
Asynchronously execute inference.
Definition: NvInferRuntime.h:2356
void setEnqueueEmitsProfile(bool enqueueEmitsProfile) noexcept
Set whether enqueue emits layer timing to the profiler.
Definition: NvInferRuntime.h:2419
bool setBindingDimensions(int32_t bindingIndex, Dims dimensions) noexcept
Set the dynamic dimensions of a binding.
Definition: NvInferRuntime.h:2165
bool setInputShapeBinding(int32_t bindingIndex, int32_t const *data) noexcept
Set values of input tensor required by shape calculations.
Definition: NvInferRuntime.h:2225
bool executeV2(void *const *bindings) noexcept
Synchronously execute inference on a network.
Definition: NvInferRuntime.h:2328
bool getEnqueueEmitsProfile() const noexcept
Get the enqueueEmitsProfile state.
Definition: NvInferRuntime.h:2430
bool setOptimizationProfileAsync(int32_t profileIndex, cudaStream_t stream) noexcept
Select an optimization profile for the current context with async semantics.
Definition: NvInferRuntime.h:2404
apiv::VExecutionContext * mImpl
Definition: NvInferRuntime.h:2465
ICudaEngine const & getEngine() const noexcept
Get the associated engine.
Definition: NvInferRuntime.h:2002
int32_t getOptimizationProfile() const noexcept
Get the index of the currently selected optimization profile.
Definition: NvInferRuntime.h:2128
TRT_DEPRECATED void destroy() noexcept
Destroy this object.
Definition: NvInferRuntime.h:2014
bool getDebugSync() const noexcept
Get the debug sync flag.
Definition: NvInferRuntime.h:1972
Dims getStrides(int32_t bindingIndex) const noexcept
Return the strides of the buffer for the given binding.
Definition: NvInferRuntime.h:2073
IProfiler * getProfiler() const noexcept
Get the profiler.
Definition: NvInferRuntime.h:1992
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:2296
TRT_DEPRECATED bool setOptimizationProfile(int32_t profileIndex) noexcept
Select an optimization profile for the current context.
Definition: NvInferRuntime.h:2116
bool allInputDimensionsSpecified() const noexcept
Whether all dynamic dimensions of input tensors have been specified.
Definition: NvInferRuntime.h:2262
void setProfiler(IProfiler *profiler) noexcept
Set the profiler.
Definition: NvInferRuntime.h:1982
void setName(char const *name) noexcept
Set the name of the execution context.
Definition: NvInferRuntime.h:2026
bool allInputShapesSpecified() const noexcept
Whether all input shape bindings have been specified.
Definition: NvInferRuntime.h:2276
Definition: NvInferRuntime.h:282
IDimensionExpr const * operation(DimensionOperation op, IDimensionExpr const &first, IDimensionExpr const &second) noexcept
Definition: NvInferRuntime.h:292
virtual ~IExprBuilder() noexcept=default
apiv::VExprBuilder * mImpl
Definition: NvInferRuntime.h:299
IDimensionExpr const * constant(int32_t value) noexcept
Return pointer to IDimensionExp for given value.
Definition: NvInferRuntime.h:285
Application-implemented class for controlling allocation on the GPU.
Definition: NvInferRuntimeCommon.h:1338
Class to handle library allocated memory that is accessible to the user.
Definition: NvInferRuntime.h:144
void * data() const noexcept
A pointer to the raw data that is owned by the library.
Definition: NvInferRuntime.h:149
DataType type() const noexcept
The type of the memory that was allocated.
Definition: NvInferRuntime.h:161
TRT_DEPRECATED void destroy() noexcept
Definition: NvInferRuntime.h:172
std::size_t size() const noexcept
The size in bytes of the data that was allocated.
Definition: NvInferRuntime.h:155
apiv::VHostMemory * mImpl
Definition: NvInferRuntime.h:178
virtual ~IHostMemory() noexcept=default
Application-implemented logging interface for the builder, refitter and runtime.
Definition: NvInferRuntimeCommon.h:1476
Forward declaration of IEngineInspector for use by other interfaces.
Definition: NvInferRuntime.h:43
INoCopy & operator=(INoCopy &&other)=delete
INoCopy(INoCopy const &other)=delete
INoCopy(INoCopy &&other)=delete
virtual ~INoCopy()=default
INoCopy & operator=(INoCopy const &other)=delete
Optimization profile for dynamic input dimensions and shape tensors.
Definition: NvInferRuntime.h:1120
int32_t const * getShapeValues(char const *inputName, OptProfileSelector select) const noexcept
Get the minimum / optimum / maximum values for an input shape tensor.
Definition: NvInferRuntime.h:1222
apiv::VOptimizationProfile * mImpl
Definition: NvInferRuntime.h:1270
Dims getDimensions(char const *inputName, OptProfileSelector select) const noexcept
Get the minimum / optimum / maximum dimensions for a dynamic input tensor.
Definition: NvInferRuntime.h:1157
virtual ~IOptimizationProfile() noexcept=default
float getExtraMemoryTarget() const noexcept
Get the extra memory target that has been defined for this profile.
Definition: NvInferRuntime.h:1248
bool setDimensions(char const *inputName, OptProfileSelector select, Dims dims) noexcept
Set the minimum / optimum / maximum dimensions for a dynamic input tensor.
Definition: NvInferRuntime.h:1147
bool setExtraMemoryTarget(float target) noexcept
Set a target for extra GPU memory that may be used by this profile.
Definition: NvInferRuntime.h:1240
bool setShapeValues(char const *inputName, OptProfileSelector select, int32_t const *values, int32_t nbValues) noexcept
Set the minimum / optimum / maximum values for an input shape tensor.
Definition: NvInferRuntime.h:1200
bool isValid() const noexcept
Check whether the optimization profile can be passed to an IBuilderConfig object.
Definition: NvInferRuntime.h:1264
int32_t getNbShapeValues(char const *inputName) const noexcept
Get the number of values for an input shape tensor.
Definition: NvInferRuntime.h:1212
Single registration point for all plugins in an application. It is used to find plugin implementation...
Definition: NvInferRuntimeCommon.h:1210
virtual bool registerCreator(IPluginCreator &creator, AsciiChar const *const pluginNamespace) noexcept=0
Register a plugin creator. Returns false if one with same type is already registered.
Definition: NvInferRuntime.h:351
IPluginV2DynamicExt * clone() const noexcept override=0
Clone the plugin object. This copies over internal plugin parameters as well and returns a new plugin...
virtual ~IPluginV2DynamicExt() noexcept
Definition: NvInferRuntime.h:503
Plugin class for user-implemented layers.
Definition: NvInferRuntimeCommon.h:680
Application-implemented interface for profiling.
Definition: NvInferRuntime.h:556
virtual void reportLayerTime(char const *layerName, float ms) noexcept=0
Layer time reporting callback.
virtual ~IProfiler() noexcept
Definition: NvInferRuntime.h:566
Updates weights in an engine.
Definition: NvInferRuntime.h:800
int32_t getMaxThreads() const noexcept
get the maximum number of threads that can be used by the refitter.
Definition: NvInferRuntime.h:1060
bool setNamedWeights(char const *name, Weights weights) noexcept
Specify new weights of given name.
Definition: NvInferRuntime.h:986
int32_t getAllWeights(int32_t size, char const **weightsNames) noexcept
Get names of all weights that could be refit.
Definition: NvInferRuntime.h:1022
bool setDynamicRange(char const *tensorName, float min, float max) noexcept
Definition: NvInferRuntime.h:894
ILogger * getLogger() const noexcept
get the logger with which the refitter was created
Definition: NvInferRuntime.h:1032
int32_t getTensorsWithDynamicRange(int32_t size, char const **tensorNames) const noexcept
Get names of all tensors that have refittable dynamic ranges.
Definition: NvInferRuntime.h:934
float getDynamicRangeMin(char const *tensorName) const noexcept
Get minimum of dynamic range.
Definition: NvInferRuntime.h:906
bool refitCudaEngine() noexcept
Updates associated engine. Return true if successful.
Definition: NvInferRuntime.h:829
int32_t getMissingWeights(int32_t size, char const **weightsNames) noexcept
Get names of missing weights.
Definition: NvInferRuntime.h:1006
int32_t getMissing(int32_t size, char const **layerNames, WeightsRole *roles) noexcept
Get description of missing weights.
Definition: NvInferRuntime.h:850
TRT_DEPRECATED void destroy() noexcept
Definition: NvInferRuntime.h:877
bool setMaxThreads(int32_t maxThreads) noexcept
Set the maximum number of threads.
Definition: NvInferRuntime.h:1046
float getDynamicRangeMax(char const *tensorName) const noexcept
Get maximum of dynamic range.
Definition: NvInferRuntime.h:918
apiv::VRefitter * mImpl
Definition: NvInferRuntime.h:1066
int32_t getAll(int32_t size, char const **layerNames, WeightsRole *roles) noexcept
Get description of all weights that could be refit.
Definition: NvInferRuntime.h:867
virtual ~IRefitter() noexcept=default
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:953
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:968
Allows a serialized functionally unsafe engine to be deserialized.
Definition: NvInferRuntime.h:618
bool setMaxThreads(int32_t maxThreads) noexcept
Set the maximum number of threads.
Definition: NvInferRuntime.h:769
virtual ~IRuntime() noexcept=default
TRT_DEPRECATED void destroy() noexcept
Destroy this object.
Definition: NvInferRuntime.h:682
apiv::VRuntime * mImpl
Definition: NvInferRuntime.h:789
void setDLACore(int32_t dlaCore) noexcept
Sets the DLA core used by the network. Defaults to -1.
Definition: NvInferRuntime.h:653
int32_t getNbDLACores() const noexcept
Returns number of DLA hardware cores accessible or 0 if DLA is unavailable.
Definition: NvInferRuntime.h:670
ICudaEngine * deserializeCudaEngine(void const *blob, std::size_t size) noexcept
Deserialize an engine from a stream.
Definition: NvInferRuntime.h:745
int32_t getDLACore() const noexcept
Get the DLA core that the engine executes on.
Definition: NvInferRuntime.h:662
void setGpuAllocator(IGpuAllocator *allocator) noexcept
Set the GPU allocator.
Definition: NvInferRuntime.h:696
IErrorRecorder * getErrorRecorder() const noexcept
get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:730
ILogger * getLogger() const noexcept
get the logger with which the runtime was created
Definition: NvInferRuntime.h:755
int32_t getMaxThreads() const noexcept
Get the maximum number of threads that can be used by the runtime.
Definition: NvInferRuntime.h:783
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:715
Register the plugin creator to the registry The static registry object will be instantiated when the ...
Definition: NvInferRuntime.h:2692
PluginRegistrar()
Definition: NvInferRuntime.h:2694
An array of weights used as a layer parameter.
Definition: NvInferRuntime.h:126
DataType type
The type of the weights.
Definition: NvInferRuntime.h:128
int64_t count
The number of weights in the array.
Definition: NvInferRuntime.h:130
void const * values
The weight values, in a contiguous array.
Definition: NvInferRuntime.h:129
IRuntime * createInferRuntime(ILogger &logger) noexcept
Create an instance of a safe::IRuntime class.
The TensorRT API version 1 namespace.
uint32_t TacticSources
Represents a collection of one or more TacticSource values combine using bitwise-OR operations.
Definition: NvInferRuntime.h:1305
EngineCapability
List of supported engine capability flows.
Definition: NvInferRuntime.h:69
DimensionOperation
An operation on two IDimensionExpr, which represent integer expressions used in dimension computation...
Definition: NvInferRuntime.h:192
@ kSUB
Subtract the second element from the first.
@ kSUM
Sum of the two operands.
@ kPROD
Product of the two operands.
@ kFLOOR_DIV
Floor division of the first element by the second.
@ kEQUAL
1 if operands are equal, 0 otherwise.
@ kMIN
Minimum of the two operands.
@ kLESS
1 if first operand is less than second operand, 0 otherwise.
@ kMAX
Maximum of the two operands.
@ kCEIL_DIV
Division rounding up.
constexpr int32_t EnumMax< WeightsRole >() noexcept
Maximum number of elements in WeightsRole enum.
Definition: NvInferRuntime.h:587
char_t AsciiChar
AsciiChar is the type used by TensorRT to represent valid ASCII characters.
Definition: NvInferRuntimeCommon.h:88
@ kV2_DYNAMICEXT
IPluginV2DynamicExt.
constexpr int32_t EnumMax< LayerInformationFormat >() noexcept
Definition: NvInferRuntime.h:2484
DataType
The type of weights and tensors.
Definition: NvInferRuntimeCommon.h:114
DeviceType
The device that this layer/network will execute on.
Definition: NvInferRuntime.h:598
@ kCONSTANT
Constant layer.
@ kDEFAULT
Similar to ONNX Gather.
constexpr int32_t EnumMax< OptProfileSelector >() noexcept
Number of different values of OptProfileSelector enum.
Definition: NvInferRuntime.h:1092
WeightsRole
How a layer uses particular Weights.
Definition: NvInferRuntime.h:576
@ kSHIFT
shift part of IScaleLayer
@ kANY
Any other weights role.
@ kBIAS
bias for IConvolutionLayer, IDeconvolutionLayer, or IFullyConnectedLayer
@ kKERNEL
kernel for IConvolutionLayer, IDeconvolutionLayer, or IFullyConnectedLayer
constexpr int32_t EnumMax< ProfilingVerbosity >() noexcept
Maximum number of profile verbosity levels in ProfilingVerbosity enum.
Definition: NvInferRuntime.h:1330
ProfilingVerbosity
List of verbosity levels of layer information exposed in NVTX annotations and in IEngineInspector.
Definition: NvInferRuntime.h:1317
@ kLAYER_NAMES_ONLY
Print only the layer names. This is the default setting.
@ kDETAILED
Print detailed layer information including layer names and layer parameters.
TacticSource
List of tactic sources for TensorRT.
Definition: NvInferRuntime.h:1282
@ kCUBLAS_LT
cuBLAS LT tactics
@ kEDGE_MASK_CONVOLUTIONS
TensorFormat PluginFormat
PluginFormat is reserved for backward compatibility.
Definition: NvInferRuntimeCommon.h:308
@ kMIN
Minimum of the two elements.
TensorFormat
Format of the input/output tensors.
Definition: NvInferRuntimeCommon.h:183
constexpr int32_t EnumMax< TacticSource >() noexcept
Maximum number of tactic sources in TacticSource enum.
Definition: NvInferRuntime.h:1294
LayerInformationFormat
The format in which the IEngineInspector prints the layer information.
Definition: NvInferRuntime.h:2476
@ kJSON
Print layer information in JSON format.
@ kONELINE
Print layer information in one line per layer.
constexpr int32_t EnumMax< DeviceType >() noexcept
Maximum number of elements in DeviceType enum.
Definition: NvInferRuntime.h:605
constexpr int32_t EnumMax< DimensionOperation >() noexcept
Maximum number of elements in DimensionOperation enum.
Definition: NvInferRuntime.h:206
TensorLocation
The location for tensor data storage, device or host.
Definition: NvInferRuntime.h:216
@ kHOST
Data stored on host.
@ kDEVICE
Data stored on device.
OptProfileSelector
When setting or querying optimization profile parameters (such as shape tensor inputs or dynamic dime...
Definition: NvInferRuntime.h:1080
@ kOPT
This is used to set or get the value that is used in the optimization (kernel selection).
Definition: NvInferRuntime.h:321
Dims min
Lower bounds on tensor’s dimensions.
Definition: NvInferRuntime.h:326
Dims max
Upper bounds on tensor’s dimensions.
Definition: NvInferRuntime.h:329
PluginTensorDesc desc
Information required to interpret a pointer to tensor data, except that desc.dims has -1 in place of ...
Definition: NvInferRuntime.h:323
Fields that a plugin might see for an input or output.
Definition: NvInferRuntimeCommon.h:332
Declaration of EnumMaxImpl struct to store maximum number of elements in an enumeration type.
Definition: NvInferRuntimeCommon.h:99