13#ifndef NV_INFER_RUNTIME_H
14#define NV_INFER_RUNTIME_H
22#include "NvInferImpl.h"
28class IExecutionContext;
31class IEngineInspector;
107 static constexpr int32_t kVALUE = 3;
151 return mImpl->data();
155 std::size_t
size() const noexcept
157 return mImpl->size();
163 return mImpl->type();
227 static constexpr int32_t kVALUE = 2;
249 return mImpl->isConstant();
256 return mImpl->getConstantValue();
287 return mImpl->constant(value);
295 return mImpl->operation(op, first, second);
380 int32_t outputIndex,
DimsExprs const* inputs, int32_t nbInputs,
IExprBuilder& exprBuilder) noexcept = 0;
385 static constexpr int32_t kFORMAT_COMBINATION_LIMIT = 100;
419 virtual
bool supportsFormatCombination(
420 int32_t pos,
PluginTensorDesc const* inOut, int32_t nbInputs, int32_t nbOutputs) noexcept = 0;
473 int32_t nbOutputs) const noexcept = 0;
488 void const* const* inputs,
void* const* outputs,
void* workspace, cudaStream_t stream) noexcept = 0;
498 int32_t getTensorRTVersion() const noexcept
override
509 bool const*,
PluginFormat, int32_t)
noexcept override final
518 Dims getOutputDimensions(int32_t,
Dims const*, int32_t)
noexcept override final
523 bool isOutputBroadcastAcrossBatch(int32_t,
bool const*, int32_t)
const noexcept override final
528 bool canBroadcastInputAcrossBatch(int32_t)
const noexcept override final
533 size_t getWorkspaceSize(int32_t)
const noexcept override final
538 int32_t enqueue(int32_t,
void const*
const*,
void*
const*,
void*, cudaStream_t)
noexcept override final
674 void const* blob, std::
size_t size, IPluginFactory* pluginFactory) noexcept
676 return mImpl->deserializeCudaEngine(blob, size,
nullptr);
691 mImpl->setDLACore(dlaCore);
700 return mImpl->getDLACore();
708 return mImpl->getNbDLACores();
734 mImpl->setGpuAllocator(allocator);
753 mImpl->setErrorRecorder(recorder);
768 return mImpl->getErrorRecorder();
783 return mImpl->deserializeCudaEngine(blob, size,
nullptr);
793 return mImpl->getLogger();
807 return mImpl->setMaxThreads(maxThreads);
821 return mImpl->getMaxThreads();
856 return mImpl->setTemporaryDirectory(path);
867 return mImpl->getTemporaryDirectory();
883 return mImpl->setTempfileControlFlags(flags);
895 return mImpl->getTempfileControlFlags();
905 return mImpl->getPluginRegistry();
923 return mImpl->loadRuntime(path);
935 return mImpl->setEngineHostCodeAllowed(allowed);
945 return mImpl->getEngineHostCodeAllowed();
979 return mImpl->setWeights(layerName, role, weights);
994 return mImpl->refitCudaEngine();
1015 return mImpl->getMissing(size, layerNames, roles);
1032 return mImpl->getAll(size, layerNames, roles);
1062 return mImpl->setDynamicRange(tensorName, min, max);
1076 return mImpl->getDynamicRangeMin(tensorName);
1090 return mImpl->getDynamicRangeMax(tensorName);
1106 return mImpl->getTensorsWithDynamicRange(size, tensorNames);
1125 mImpl->setErrorRecorder(recorder);
1140 return mImpl->getErrorRecorder();
1161 return mImpl->setNamedWeights(name, weights);
1181 return mImpl->getMissingWeights(size, weightsNames);
1197 return mImpl->getAllWeights(size, weightsNames);
1207 return mImpl->getLogger();
1221 return mImpl->setMaxThreads(maxThreads);
1235 return mImpl->getMaxThreads();
1324 return mImpl->setDimensions(inputName, select, dims);
1336 return mImpl->getDimensions(inputName, select);
1381 char const* inputName,
OptProfileSelector select, int32_t
const* values, int32_t nbValues)
noexcept
1383 return mImpl->setShapeValues(inputName, select, values, nbValues);
1396 return mImpl->getNbShapeValues(inputName);
1408 return mImpl->getShapeValues(inputName, select);
1426 return mImpl->setExtraMemoryTarget(target);
1438 return mImpl->getExtraMemoryTarget();
1455 return mImpl->isValid();
1561 return mImpl->getNbBindings();
1589 return mImpl->getBindingIndex(name);
1612 return mImpl->getBindingName(bindingIndex);
1627 return mImpl->bindingIsInput(bindingIndex);
1654 return mImpl->getBindingDimensions(bindingIndex);
1669 return mImpl->getTensorShape(tensorName);
1684 return mImpl->getBindingDataType(bindingIndex);
1699 return mImpl->getTensorDataType(tensorName);
1715 return mImpl->getMaxBatchSize();
1729 return mImpl->getNbLayers();
1743 return mImpl->serialize();
1760 return mImpl->createExecutionContext();
1790 return mImpl->getLocation(bindingIndex);
1807 return mImpl->getTensorLocation(tensorName);
1827 return mImpl->isShapeInferenceIO(tensorName);
1841 return mImpl->getTensorIOMode(tensorName);
1850 return mImpl->createExecutionContextWithoutDeviceMemory();
1860 return mImpl->getDeviceMemorySize();
1870 return mImpl->isRefittable();
1887 return mImpl->getBindingBytesPerComponent(bindingIndex);
1904 return mImpl->getTensorBytesPerComponent(tensorName);
1920 return mImpl->getBindingComponentsPerElement(bindingIndex);
1937 return mImpl->getTensorComponentsPerElement(tensorName);
1951 return mImpl->getBindingFormat(bindingIndex);
1964 return mImpl->getTensorFormat(tensorName);
1988 return mImpl->getBindingFormatDesc(bindingIndex);
2010 return mImpl->getTensorFormatDesc(tensorName);
2026 return mImpl->getBindingVectorizedDim(bindingIndex);
2041 return mImpl->getTensorVectorizedDim(tensorName);
2056 return mImpl->getName();
2067 return mImpl->getNbOptimizationProfiles();
2098 int32_t bindingIndex, int32_t profileIndex,
OptProfileSelector select)
const noexcept
2100 return mImpl->getProfileDimensions(bindingIndex, profileIndex, select);
2120 return mImpl->getProfileShape(tensorName, profileIndex, select);
2150 return mImpl->getProfileShapeValues(profileIndex, inputIndex, select);
2188 return mImpl->isShapeBinding(bindingIndex);
2205 return mImpl->isExecutionBinding(bindingIndex);
2220 return mImpl->getEngineCapability();
2238 return mImpl->setErrorRecorder(recorder);
2253 return mImpl->getErrorRecorder();
2272 return mImpl->hasImplicitBatchDimension();
2287 return mImpl->getTacticSources();
2298 return mImpl->getProfilingVerbosity();
2308 return mImpl->createEngineInspector();
2321 return mImpl->getNbIOTensors();
2333 return mImpl->getIOTensorName(index);
2345 return mImpl->getHardwareCompatibilityLevel();
2360 return mImpl->getNbAuxStreams();
2407 virtual void*
reallocateOutput(
char const* tensorName,
void* currentMemory, uint64_t size, uint64_t alignment)
noexcept = 0;
2461 return mImpl->execute(batchSize, bindings);
2494 int32_t batchSize,
void*
const* bindings, cudaStream_t stream, cudaEvent_t* inputConsumed)
noexcept
2496 return mImpl->enqueue(batchSize, bindings, stream, inputConsumed);
2509 mImpl->setDebugSync(sync);
2519 return mImpl->getDebugSync();
2529 mImpl->setProfiler(profiler);
2539 return mImpl->getProfiler();
2549 return mImpl->getEngine();
2575 mImpl->setName(name);
2585 return mImpl->getName();
2602 mImpl->setDeviceMemory(memory);
2625 return mImpl->getStrides(bindingIndex);
2646 return mImpl->getTensorStrides(tensorName);
2684 return mImpl->setOptimizationProfile(profileIndex);
2698 return mImpl->getOptimizationProfile();
2737 return mImpl->setBindingDimensions(bindingIndex, dimensions);
2755 return mImpl->setInputShape(tensorName, dims);
2788 return mImpl->getBindingDimensions(bindingIndex);
2825 return mImpl->getTensorShape(tensorName);
2860 return mImpl->setInputShapeBinding(bindingIndex, data);
2884 return mImpl->getShapeBinding(bindingIndex, data);
2902 return mImpl->allInputDimensionsSpecified();
2919 return mImpl->allInputShapesSpecified();
2938 mImpl->setErrorRecorder(recorder);
2953 return mImpl->getErrorRecorder();
2970 return mImpl->executeV2(bindings);
3000 return mImpl->enqueueV2(bindings, stream, inputConsumed);
3047 return mImpl->setOptimizationProfileAsync(profileIndex, stream);
3062 mImpl->setEnqueueEmitsProfile(enqueueEmitsProfile);
3073 return mImpl->getEnqueueEmitsProfile();
3102 return mImpl->reportToProfiler();
3144 return mImpl->setTensorAddress(tensorName, data);
3161 return mImpl->getTensorAddress(tensorName);
3183 return mImpl->setInputTensorAddress(tensorName, data);
3202 return mImpl->getOutputTensorAddress(tensorName);
3233 int32_t
inferShapes(int32_t nbMaxNames,
char const** tensorNames)
noexcept
3235 return mImpl->inferShapes(nbMaxNames, tensorNames);
3251 return mImpl->setInputConsumedEvent(event);
3261 return mImpl->getInputConsumedEvent();
3280 return mImpl->setOutputAllocator(tensorName, outputAllocator);
3293 return mImpl->getOutputAllocator(tensorName);
3311 return mImpl->getMaxOutputSize(tensorName);
3331 return mImpl->setTemporaryStorageAllocator(allocator);
3341 return mImpl->getTemporaryStorageAllocator();
3359 return mImpl->enqueueV3(stream);
3374 mImpl->setPersistentCacheLimit(size);
3385 return mImpl->getPersistentCacheLimit();
3409 return mImpl->setNvtxVerbosity(verbosity);
3421 return mImpl->getNvtxVerbosity();
3452 mImpl->setAuxStreams(auxStreams, nbStreams);
3514 return mImpl->setExecutionContext(context);
3526 return mImpl->getExecutionContext();
3551 return mImpl->getLayerInformation(layerIndex, format);
3574 return mImpl->getEngineInformation(format);
3593 mImpl->setErrorRecorder(recorder);
3608 return mImpl->getErrorRecorder();
3621extern "C" TENSORRTAPI void* createInferRuntime_INTERNAL(
void* logger, int32_t version)
noexcept;
3627extern "C" TENSORRTAPI void* createInferRefitter_INTERNAL(
void* engine,
void* logger, int32_t version)
noexcept;
3661inline IRefitter* createInferRefitter(ICudaEngine& engine, ILogger& logger)
noexcept
3663 return static_cast<IRefitter*
>(createInferRefitter_INTERNAL(&engine, &logger,
NV_TENSORRT_VERSION));
3679template <
typename T>
3695#define REGISTER_TENSORRT_PLUGIN(name) \
3696 static nvinfer1::PluginRegistrar<name> pluginRegistrar##name {}
nvinfer1::ILogger * getLogger() noexcept
Return the logger object.
nvinfer1::IPluginRegistry * getPluginRegistry() noexcept
Return the plugin registry.
#define TENSORRTAPI
Definition: NvInferRuntimeBase.h:54
#define NV_TENSORRT_VERSION
Definition: NvInferRuntimeBase.h:76
#define TRT_DEPRECATED
Definition: NvInferRuntimeBase.h:40
#define TRT_DEPRECATED_ENUM
Definition: NvInferRuntimeBase.h:41
Structure to define the dimensions of a tensor.
Definition: NvInferRuntimeBase.h:179
static constexpr int32_t MAX_DIMS
The maximum rank (number of dimensions) supported for a tensor.
Definition: NvInferRuntimeBase.h:182
Definition: NvInferRuntime.h:309
int32_t nbDims
The number of dimensions.
Definition: NvInferRuntime.h:311
An engine for executing inference on a built network, with functionally unsafe features.
Definition: NvInferRuntime.h:1543
int32_t getTensorBytesPerComponent(char const *tensorName) const noexcept
Return the number of bytes per component of an element, or -1 if the provided name does not map to an...
Definition: NvInferRuntime.h:1902
bool hasImplicitBatchDimension() const noexcept
Query whether the engine was built with an implicit batch dimension.
Definition: NvInferRuntime.h:2270
char const * getIOTensorName(int32_t index) const noexcept
Return name of an IO tensor.
Definition: NvInferRuntime.h:2331
EngineCapability getEngineCapability() const noexcept
Determine what execution capability this engine has.
Definition: NvInferRuntime.h:2218
TRT_DEPRECATED bool isExecutionBinding(int32_t bindingIndex) const noexcept
True if pointer to tensor data is required for execution phase, false if nullptr can be supplied.
Definition: NvInferRuntime.h:2203
TRT_DEPRECATED int32_t getBindingIndex(char const *name) const noexcept
Retrieve the binding index for a named tensor.
Definition: NvInferRuntime.h:1587
TRT_DEPRECATED void destroy() noexcept
Destroy this object;.
Definition: NvInferRuntime.h:1770
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:2251
TRT_DEPRECATED char const * getBindingName(int32_t bindingIndex) const noexcept
Retrieve the name corresponding to a binding index.
Definition: NvInferRuntime.h:1610
apiv::VCudaEngine * mImpl
Definition: NvInferRuntime.h:2364
char const * getTensorFormatDesc(char const *tensorName) const noexcept
Return the human readable description of the tensor format, or empty string if the provided name does...
Definition: NvInferRuntime.h:2008
Dims getProfileShape(char const *tensorName, int32_t profileIndex, OptProfileSelector select) const noexcept
Get the minimum / optimum / maximum dimensions for an input tensor given its name under an optimizati...
Definition: NvInferRuntime.h:2118
TRT_DEPRECATED int32_t const * getProfileShapeValues(int32_t profileIndex, int32_t inputIndex, OptProfileSelector select) const noexcept
Get minimum / optimum / maximum values for an input shape binding under an optimization profile.
Definition: NvInferRuntime.h:2147
int32_t getNbAuxStreams() const noexcept
Return the number of auxiliary streams used by this engine.
Definition: NvInferRuntime.h:2358
TRT_DEPRECATED bool bindingIsInput(int32_t bindingIndex) const noexcept
Determine whether a binding is an input binding.
Definition: NvInferRuntime.h:1625
TRT_DEPRECATED Dims getBindingDimensions(int32_t bindingIndex) const noexcept
Get the dimensions of a binding.
Definition: NvInferRuntime.h:1652
DataType getTensorDataType(char const *tensorName) const noexcept
Determine the required data type for a buffer from its tensor name.
Definition: NvInferRuntime.h:1697
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:2236
size_t getDeviceMemorySize() const noexcept
Return the amount of device memory required by an execution context.
Definition: NvInferRuntime.h:1858
TacticSources getTacticSources() const noexcept
return the tactic sources required by this engine.
Definition: NvInferRuntime.h:2285
TRT_DEPRECATED TensorFormat getBindingFormat(int32_t bindingIndex) const noexcept
Return the binding format.
Definition: NvInferRuntime.h:1949
virtual ~ICudaEngine() noexcept=default
TRT_DEPRECATED int32_t getBindingComponentsPerElement(int32_t bindingIndex) const noexcept
Return the number of components included in one element.
Definition: NvInferRuntime.h:1918
char const * getName() const noexcept
Returns the name of the network associated with the engine.
Definition: NvInferRuntime.h:2054
ProfilingVerbosity getProfilingVerbosity() const noexcept
Return the ProfilingVerbosity the builder config was set to when the engine was built.
Definition: NvInferRuntime.h:2296
bool isShapeInferenceIO(char const *tensorName) const noexcept
True if tensor is required as input for shape calculations or is output from shape calculations.
Definition: NvInferRuntime.h:1825
TRT_DEPRECATED bool isShapeBinding(int32_t bindingIndex) const noexcept
True if tensor is required as input for shape calculations or output from them.
Definition: NvInferRuntime.h:2186
int32_t getTensorVectorizedDim(char const *tensorName) const noexcept
Return the dimension index that the buffer is vectorized, or -1 if the provided name does not map to ...
Definition: NvInferRuntime.h:2039
TRT_DEPRECATED DataType getBindingDataType(int32_t bindingIndex) const noexcept
Determine the required data type for a buffer from its binding index.
Definition: NvInferRuntime.h:1682
TRT_DEPRECATED int32_t getBindingVectorizedDim(int32_t bindingIndex) const noexcept
Return the dimension index that the buffer is vectorized, or -1 is the name is not found.
Definition: NvInferRuntime.h:2024
TRT_DEPRECATED char const * getBindingFormatDesc(int32_t bindingIndex) const noexcept
Return the human readable description of the tensor format, or nullptr if the provided name does not ...
Definition: NvInferRuntime.h:1986
TensorFormat getTensorFormat(char const *tensorName) const noexcept
Return the binding format, or TensorFormat::kLINEAR if the provided name does not map to an input or ...
Definition: NvInferRuntime.h:1962
IHostMemory * serialize() const noexcept
Serialize the network to a stream.
Definition: NvInferRuntime.h:1741
IExecutionContext * createExecutionContextWithoutDeviceMemory() noexcept
create an execution context without any device memory allocated
Definition: NvInferRuntime.h:1848
TensorLocation getTensorLocation(char const *tensorName) const noexcept
Get whether an input or output tensor must be on GPU or CPU.
Definition: NvInferRuntime.h:1805
IExecutionContext * createExecutionContext() noexcept
Create an execution context.
Definition: NvInferRuntime.h:1758
IEngineInspector * createEngineInspector() const noexcept
Create a new engine inspector which prints the layer information in an engine or an execution context...
Definition: NvInferRuntime.h:2306
HardwareCompatibilityLevel getHardwareCompatibilityLevel() const noexcept
Return the hardware compatibility level of this engine.
Definition: NvInferRuntime.h:2343
TRT_DEPRECATED int32_t getMaxBatchSize() const noexcept
Get the maximum batch size which can be used for inference. Should only be called if the engine is bu...
Definition: NvInferRuntime.h:1713
int32_t getNbOptimizationProfiles() const noexcept
Get the number of optimization profiles defined for this engine.
Definition: NvInferRuntime.h:2065
TensorIOMode getTensorIOMode(char const *tensorName) const noexcept
Determine whether a tensor is an input or output tensor.
Definition: NvInferRuntime.h:1839
int32_t getNbLayers() const noexcept
Get the number of layers in the network.
Definition: NvInferRuntime.h:1727
TRT_DEPRECATED TensorLocation getLocation(int32_t bindingIndex) const noexcept
Get location of binding.
Definition: NvInferRuntime.h:1788
int32_t getNbIOTensors() const noexcept
Return number of IO tensors.
Definition: NvInferRuntime.h:2319
TRT_DEPRECATED Dims getProfileDimensions(int32_t bindingIndex, int32_t profileIndex, OptProfileSelector select) const noexcept
Get the minimum / optimum / maximum dimensions for a particular input binding under an optimization p...
Definition: NvInferRuntime.h:2097
TRT_DEPRECATED int32_t getBindingBytesPerComponent(int32_t bindingIndex) const noexcept
Return the number of bytes per component of an element.
Definition: NvInferRuntime.h:1885
Dims getTensorShape(char const *tensorName) const noexcept
Get shape of an input or output tensor.
Definition: NvInferRuntime.h:1667
int32_t getTensorComponentsPerElement(char const *tensorName) const noexcept
Return the number of components included in one element, or -1 if the provided name does not map to a...
Definition: NvInferRuntime.h:1935
bool isRefittable() const noexcept
Return true if an engine can be refit.
Definition: NvInferRuntime.h:1868
Definition: NvInferRuntime.h:244
bool isConstant() const noexcept
Return true if expression is a build-time constant.
Definition: NvInferRuntime.h:247
virtual ~IDimensionExpr() noexcept=default
apiv::VDimensionExpr * mImpl
Definition: NvInferRuntime.h:260
int32_t getConstantValue() const noexcept
Definition: NvInferRuntime.h:254
An engine inspector which prints out the layer information of an engine or an execution context.
Definition: NvInferRuntime.h:3496
char const * getLayerInformation(int32_t layerIndex, LayerInformationFormat format) const noexcept
Get a string describing the information about a specific layer in the current engine or the execution...
Definition: NvInferRuntime.h:3549
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:3606
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:3591
IExecutionContext const * getExecutionContext() const noexcept
Get the context currently being inspected.
Definition: NvInferRuntime.h:3524
apiv::VEngineInspector * mImpl
Definition: NvInferRuntime.h:3612
virtual ~IEngineInspector() noexcept=default
char const * getEngineInformation(LayerInformationFormat format) const noexcept
Get a string describing the information about all the layers in the current engine or the execution c...
Definition: NvInferRuntime.h:3572
Reference counted application-implemented error reporting interface for TensorRT objects.
Definition: NvInferRuntimeBase.h:694
Context for executing inference using an engine, with functionally unsafe features.
Definition: NvInferRuntime.h:2433
TRT_DEPRECATED bool enqueue(int32_t batchSize, void *const *bindings, cudaStream_t stream, cudaEvent_t *inputConsumed) noexcept
Enqueue inference of a batch on a stream.
Definition: NvInferRuntime.h:2493
IOutputAllocator * getOutputAllocator(char const *tensorName) const noexcept
Get output allocator associated with output tensor of given name, or nullptr if the provided name doe...
Definition: NvInferRuntime.h:3291
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:2951
bool reportToProfiler() const noexcept
Calculate layer timing info for the current optimization profile in IExecutionContext and update the ...
Definition: NvInferRuntime.h:3100
virtual ~IExecutionContext() noexcept=default
void setDeviceMemory(void *memory) noexcept
Set the device memory for use by this execution context.
Definition: NvInferRuntime.h:2600
char const * getName() const noexcept
Return the name of the execution context.
Definition: NvInferRuntime.h:2583
void setDebugSync(bool sync) noexcept
Set the debug sync flag.
Definition: NvInferRuntime.h:2507
IGpuAllocator * getTemporaryStorageAllocator() const noexcept
Get allocator set by setTemporaryStorageAllocator.
Definition: NvInferRuntime.h:3339
void setEnqueueEmitsProfile(bool enqueueEmitsProfile) noexcept
Set whether enqueue emits layer timing to the profiler.
Definition: NvInferRuntime.h:3060
Dims getTensorShape(char const *tensorName) const noexcept
Return the shape of the given input or output.
Definition: NvInferRuntime.h:2823
bool setInputShape(char const *tensorName, Dims const &dims) noexcept
Set shape of given input.
Definition: NvInferRuntime.h:2753
bool executeV2(void *const *bindings) noexcept
Synchronously execute inference a network.
Definition: NvInferRuntime.h:2968
bool getEnqueueEmitsProfile() const noexcept
Get the enqueueEmitsProfile state.
Definition: NvInferRuntime.h:3071
TRT_DEPRECATED bool setBindingDimensions(int32_t bindingIndex, Dims dimensions) noexcept
Set the dynamic dimensions of an input binding.
Definition: NvInferRuntime.h:2735
void const * getTensorAddress(char const *tensorName) const noexcept
Get memory address bound to given input or output tensor, or nullptr if the provided name does not ma...
Definition: NvInferRuntime.h:3159
bool setOutputAllocator(char const *tensorName, IOutputAllocator *outputAllocator) noexcept
Set output allocator to use for output tensor of given name. Pass nullptr to outputAllocator to unset...
Definition: NvInferRuntime.h:3278
TRT_DEPRECATED bool enqueueV2(void *const *bindings, cudaStream_t stream, cudaEvent_t *inputConsumed) noexcept
Enqueue inference on a stream.
Definition: NvInferRuntime.h:2998
bool setOptimizationProfileAsync(int32_t profileIndex, cudaStream_t stream) noexcept
Select an optimization profile for the current context with async semantics.
Definition: NvInferRuntime.h:3045
TRT_DEPRECATED bool setInputShapeBinding(int32_t bindingIndex, int32_t const *data) noexcept
Set values of input tensor required by shape calculations.
Definition: NvInferRuntime.h:2858
apiv::VExecutionContext * mImpl
Definition: NvInferRuntime.h:3456
void setPersistentCacheLimit(size_t size) noexcept
Set the maximum size for persistent cache usage.
Definition: NvInferRuntime.h:3372
size_t getPersistentCacheLimit() const noexcept
Get the maximum size for persistent cache usage.
Definition: NvInferRuntime.h:3383
ICudaEngine const & getEngine() const noexcept
Get the associated engine.
Definition: NvInferRuntime.h:2547
ProfilingVerbosity getNvtxVerbosity() const noexcept
Get the NVTX verbosity of the execution context.
Definition: NvInferRuntime.h:3419
void setAuxStreams(cudaStream_t *auxStreams, int32_t nbStreams) noexcept
Set the auxiliary streams that TensorRT should launch kernels on in the next enqueueV3() call.
Definition: NvInferRuntime.h:3450
int64_t getMaxOutputSize(char const *tensorName) const noexcept
Get upper bound on an output tensor's size, in bytes, based on the current optimization profile and i...
Definition: NvInferRuntime.h:3309
int32_t inferShapes(int32_t nbMaxNames, char const **tensorNames) noexcept
Run shape calculations.
Definition: NvInferRuntime.h:3233
bool setTensorAddress(char const *tensorName, void *data) noexcept
Set memory address for given input or output tensor.
Definition: NvInferRuntime.h:3142
bool setTemporaryStorageAllocator(IGpuAllocator *allocator) noexcept
Specify allocator to use for internal temporary storage.
Definition: NvInferRuntime.h:3329
void * getOutputTensorAddress(char const *tensorName) const noexcept
Get memory address for given output.
Definition: NvInferRuntime.h:3200
bool enqueueV3(cudaStream_t stream) noexcept
Enqueue inference on a stream.
Definition: NvInferRuntime.h:3357
int32_t getOptimizationProfile() const noexcept
Get the index of the currently selected optimization profile.
Definition: NvInferRuntime.h:2696
bool setInputTensorAddress(char const *tensorName, void const *data) noexcept
Set memory address for given input.
Definition: NvInferRuntime.h:3181
TRT_DEPRECATED void destroy() noexcept
Destroy this object.
Definition: NvInferRuntime.h:2559
bool getDebugSync() const noexcept
Get the debug sync flag.
Definition: NvInferRuntime.h:2517
TRT_DEPRECATED Dims getBindingDimensions(int32_t bindingIndex) const noexcept
Get the dynamic dimensions of a binding.
Definition: NvInferRuntime.h:2786
bool setInputConsumedEvent(cudaEvent_t event) noexcept
Mark input as consumed.
Definition: NvInferRuntime.h:3249
Dims getTensorStrides(char const *tensorName) const noexcept
Return the strides of the buffer for the given tensor name.
Definition: NvInferRuntime.h:2644
bool setNvtxVerbosity(ProfilingVerbosity verbosity) noexcept
Set the verbosity of the NVTX markers in the execution context.
Definition: NvInferRuntime.h:3407
IProfiler * getProfiler() const noexcept
Get the profiler.
Definition: NvInferRuntime.h:2537
TRT_DEPRECATED Dims getStrides(int32_t bindingIndex) const noexcept
Return the strides of the buffer for the given binding.
Definition: NvInferRuntime.h:2623
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:2936
TRT_DEPRECATED bool setOptimizationProfile(int32_t profileIndex) noexcept
Select an optimization profile for the current context.
Definition: NvInferRuntime.h:2682
bool allInputDimensionsSpecified() const noexcept
Whether all dynamic dimensions of input tensors have been specified.
Definition: NvInferRuntime.h:2900
void setProfiler(IProfiler *profiler) noexcept
Set the profiler.
Definition: NvInferRuntime.h:2527
TRT_DEPRECATED bool getShapeBinding(int32_t bindingIndex, int32_t *data) const noexcept
Get values of an input tensor required for shape calculations or an output tensor produced by shape c...
Definition: NvInferRuntime.h:2882
void setName(char const *name) noexcept
Set the name of the execution context.
Definition: NvInferRuntime.h:2573
cudaEvent_t getInputConsumedEvent() const noexcept
The event associated with consuming the input.
Definition: NvInferRuntime.h:3259
bool allInputShapesSpecified() const noexcept
Whether all input shape bindings have been specified.
Definition: NvInferRuntime.h:2917
Definition: NvInferRuntime.h:282
IDimensionExpr const * operation(DimensionOperation op, IDimensionExpr const &first, IDimensionExpr const &second) noexcept
Definition: NvInferRuntime.h:292
virtual ~IExprBuilder() noexcept=default
apiv::VExprBuilder * mImpl
Definition: NvInferRuntime.h:299
IDimensionExpr const * constant(int32_t value) noexcept
Return pointer to IDimensionExp for given value.
Definition: NvInferRuntime.h:285
Application-implemented class for controlling allocation on the GPU.
Definition: NvInferRuntimeBase.h:367
Class to handle library allocated memory that is accessible to the user.
Definition: NvInferRuntime.h:144
void * data() const noexcept
A pointer to the raw data that is owned by the library.
Definition: NvInferRuntime.h:149
DataType type() const noexcept
The type of the memory that was allocated.
Definition: NvInferRuntime.h:161
TRT_DEPRECATED void destroy() noexcept
Definition: NvInferRuntime.h:172
std::size_t size() const noexcept
The size in bytes of the data that was allocated.
Definition: NvInferRuntime.h:155
apiv::VHostMemory * mImpl
Definition: NvInferRuntime.h:178
virtual ~IHostMemory() noexcept=default
A virtual base class to find a logger. Allows a plugin to find an instance of a logger if it needs to...
Definition: NvInferRuntime.h:3709
virtual ILogger * findLogger()=0
Get the logger used by the engine or execution context which called the plugin method.
virtual ~ILoggerFinder()=default
Application-implemented logging interface for the builder, refitter and runtime.
Definition: NvInferRuntimeBase.h:505
Forward declaration of IEngineInspector for use by other interfaces.
Definition: NvInferRuntime.h:43
INoCopy & operator=(INoCopy &&other)=delete
INoCopy(INoCopy const &other)=delete
INoCopy(INoCopy &&other)=delete
virtual ~INoCopy()=default
INoCopy & operator=(INoCopy const &other)=delete
Optimization profile for dynamic input dimensions and shape tensors.
Definition: NvInferRuntime.h:1293
int32_t const * getShapeValues(char const *inputName, OptProfileSelector select) const noexcept
Get the minimum / optimum / maximum values for an input shape tensor.
Definition: NvInferRuntime.h:1406
apiv::VOptimizationProfile * mImpl
Definition: NvInferRuntime.h:1459
Dims getDimensions(char const *inputName, OptProfileSelector select) const noexcept
Get the minimum / optimum / maximum dimensions for a dynamic input tensor.
Definition: NvInferRuntime.h:1334
virtual ~IOptimizationProfile() noexcept=default
float getExtraMemoryTarget() const noexcept
Get the extra memory target that has been defined for this profile.
Definition: NvInferRuntime.h:1436
bool setDimensions(char const *inputName, OptProfileSelector select, Dims dims) noexcept
Set the minimum / optimum / maximum dimensions for a dynamic input tensor.
Definition: NvInferRuntime.h:1322
bool setExtraMemoryTarget(float target) noexcept
Set a target for extra GPU memory that may be used by this profile.
Definition: NvInferRuntime.h:1424
bool setShapeValues(char const *inputName, OptProfileSelector select, int32_t const *values, int32_t nbValues) noexcept
Set the minimum / optimum / maximum values for an input shape tensor.
Definition: NvInferRuntime.h:1380
bool isValid() const noexcept
Check whether the optimization profile can be passed to an IBuilderConfig object.
Definition: NvInferRuntime.h:1453
int32_t getNbShapeValues(char const *inputName) const noexcept
Get the number of values for an input shape tensor.
Definition: NvInferRuntime.h:1394
Callback from ExecutionContext::enqueueV3()
Definition: NvInferRuntime.h:2377
virtual void notifyShape(char const *tensorName, Dims const &dims) noexcept=0
Called by TensorRT when the shape of the output tensor is known.
virtual ~IOutputAllocator()=default
virtual int32_t getInterfaceVersion() const noexcept
Return the API version of this IOutputAllocator.
Definition: NvInferRuntime.h:2386
virtual void * reallocateOutput(char const *tensorName, void *currentMemory, uint64_t size, uint64_t alignment) noexcept=0
Return a pointer to memory for an output tensor, or nullptr if memory cannot be allocated.
Single registration point for all plugins in an application. It is used to find plugin implementation...
Definition: NvInferRuntimeCommon.h:50
virtual bool registerCreator(IPluginCreator &creator, AsciiChar const *const pluginNamespace) noexcept=0
Register a plugin creator. Returns false if one with same type is already registered.
Definition: NvInferRuntime.h:351
IPluginV2DynamicExt * clone() const noexcept override=0
Clone the plugin object. This copies over internal plugin parameters as well and returns a new plugin...
virtual ~IPluginV2DynamicExt() noexcept
Definition: NvInferRuntime.h:503
Plugin class for user-implemented layers.
Definition: NvInferRuntimePlugin.h:408
Application-implemented interface for profiling.
Definition: NvInferRuntime.h:556
virtual void reportLayerTime(char const *layerName, float ms) noexcept=0
Layer time reporting callback.
virtual ~IProfiler() noexcept
Definition: NvInferRuntime.h:567
Updates weights in an engine.
Definition: NvInferRuntime.h:960
int32_t getMaxThreads() const noexcept
get the maximum number of threads that can be used by the refitter.
Definition: NvInferRuntime.h:1233
bool setNamedWeights(char const *name, Weights weights) noexcept
Specify new weights of given name.
Definition: NvInferRuntime.h:1159
int32_t getAllWeights(int32_t size, char const **weightsNames) noexcept
Get names of all weights that could be refit.
Definition: NvInferRuntime.h:1195
bool setDynamicRange(char const *tensorName, float min, float max) noexcept
Definition: NvInferRuntime.h:1060
ILogger * getLogger() const noexcept
Get the logger with which the refitter was created.
Definition: NvInferRuntime.h:1205
int32_t getTensorsWithDynamicRange(int32_t size, char const **tensorNames) const noexcept
Get names of all tensors that have refittable dynamic ranges.
Definition: NvInferRuntime.h:1104
float getDynamicRangeMin(char const *tensorName) const noexcept
Get minimum of dynamic range.
Definition: NvInferRuntime.h:1074
bool refitCudaEngine() noexcept
Updates associated engine. Return true if successful.
Definition: NvInferRuntime.h:992
int32_t getMissingWeights(int32_t size, char const **weightsNames) noexcept
Get names of missing weights.
Definition: NvInferRuntime.h:1179
int32_t getMissing(int32_t size, char const **layerNames, WeightsRole *roles) noexcept
Get description of missing weights.
Definition: NvInferRuntime.h:1013
TRT_DEPRECATED void destroy() noexcept
Definition: NvInferRuntime.h:1040
bool setMaxThreads(int32_t maxThreads) noexcept
Set the maximum number of threads.
Definition: NvInferRuntime.h:1219
float getDynamicRangeMax(char const *tensorName) const noexcept
Get maximum of dynamic range.
Definition: NvInferRuntime.h:1088
apiv::VRefitter * mImpl
Definition: NvInferRuntime.h:1239
int32_t getAll(int32_t size, char const **layerNames, WeightsRole *roles) noexcept
Get description of all weights that could be refit.
Definition: NvInferRuntime.h:1030
virtual ~IRefitter() noexcept=default
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:1123
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:1138
Allows a serialized functionally unsafe engine to be deserialized.
Definition: NvInferRuntime.h:654
bool setMaxThreads(int32_t maxThreads) noexcept
Set the maximum number of threads.
Definition: NvInferRuntime.h:805
IRuntime * loadRuntime(char const *path) noexcept
Load IRuntime from the file.
Definition: NvInferRuntime.h:921
bool getEngineHostCodeAllowed() const noexcept
Get whether the runtime is allowed to deserialize engines with host executable code.
Definition: NvInferRuntime.h:943
TempfileControlFlags getTempfileControlFlags() const noexcept
Get the tempfile control flags for this runtime.
Definition: NvInferRuntime.h:893
void setEngineHostCodeAllowed(bool allowed) noexcept
Set whether the runtime is allowed to deserialize engines with host executable code.
Definition: NvInferRuntime.h:933
virtual ~IRuntime() noexcept=default
void setTemporaryDirectory(char const *path) noexcept
Set the directory that will be used by this runtime for temporary files.
Definition: NvInferRuntime.h:854
IPluginRegistry & getPluginRegistry() noexcept
Get the local plugin registry that can be used by the runtime.
Definition: NvInferRuntime.h:903
TRT_DEPRECATED void destroy() noexcept
Destroy this object.
Definition: NvInferRuntime.h:718
apiv::VRuntime * mImpl
Definition: NvInferRuntime.h:949
void setDLACore(int32_t dlaCore) noexcept
Sets the DLA core used by the network. Defaults to -1.
Definition: NvInferRuntime.h:689
int32_t getNbDLACores() const noexcept
Returns number of DLA hardware cores accessible or 0 if DLA is unavailable.
Definition: NvInferRuntime.h:706
ICudaEngine * deserializeCudaEngine(void const *blob, std::size_t size) noexcept
Deserialize an engine from a stream.
Definition: NvInferRuntime.h:781
void setTempfileControlFlags(TempfileControlFlags flags) noexcept
Set the tempfile control flags for this runtime.
Definition: NvInferRuntime.h:881
int32_t getDLACore() const noexcept
Get the DLA core that the engine executes on.
Definition: NvInferRuntime.h:698
void setGpuAllocator(IGpuAllocator *allocator) noexcept
Set the GPU allocator.
Definition: NvInferRuntime.h:732
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:766
ILogger * getLogger() const noexcept
Get the logger with which the runtime was created.
Definition: NvInferRuntime.h:791
int32_t getMaxThreads() const noexcept
Get the maximum number of threads that can be used by the runtime.
Definition: NvInferRuntime.h:819
char const * getTemporaryDirectory() const noexcept
Get the directory that will be used by this runtime for temporary files.
Definition: NvInferRuntime.h:865
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:751
Register the plugin creator to the registry The static registry object will be instantiated when the ...
Definition: NvInferRuntime.h:3681
PluginRegistrar()
Definition: NvInferRuntime.h:3683
An array of weights used as a layer parameter.
Definition: NvInferRuntime.h:126
DataType type
The type of the weights.
Definition: NvInferRuntime.h:128
int64_t count
The number of weights in the array.
Definition: NvInferRuntime.h:130
void const * values
The weight values, in a contiguous array.
Definition: NvInferRuntime.h:129
IRuntime * createInferRuntime(ILogger &logger) noexcept
Create an instance of a safe::IRuntime class.
The TensorRT API version 1 namespace.
uint32_t TacticSources
Represents a collection of one or more TacticSource values combined using bitwise-OR operations.
Definition: NvInferRuntime.h:1505
EngineCapability
List of supported engine capability flows.
Definition: NvInferRuntime.h:69
DimensionOperation
An operation on two IDimensionExpr, which represent integer expressions used in dimension computation...
Definition: NvInferRuntime.h:192
@ kSUB
Subtract the second element from the first.
@ kSUM
Sum of the two operands.
@ kPROD
Product of the two operands.
@ kFLOOR_DIV
Floor division of the first element by the second.
@ kEQUAL
1 if operands are equal, 0 otherwise.
@ kMIN
Minimum of the two operands.
@ kLESS
1 if first operand is less than second operand, 0 otherwise.
@ kMAX
Maximum of the two operands.
@ kCEIL_DIV
Division rounding up.
TensorIOMode
Definition of tensor IO Mode.
Definition: NvInferRuntimeBase.h:883
HardwareCompatibilityLevel
Definition: NvInfer.h:9057
uint32_t TempfileControlFlags
Represents a collection of one or more TempfileControlFlag values combined using bitwise-OR operation...
Definition: NvInferRuntime.h:644
constexpr int32_t EnumMax< WeightsRole >() noexcept
Maximum number of elements in WeightsRole enum.
Definition: NvInferRuntime.h:588
@ kV2_DYNAMICEXT
IPluginV2DynamicExt.
constexpr int32_t EnumMax< LayerInformationFormat >() noexcept
Definition: NvInferRuntime.h:3475
DataType
The type of weights and tensors.
Definition: NvInferRuntimeBase.h:120
DeviceType
The device that this layer/network will execute on.
Definition: NvInferRuntime.h:599
@ kCONSTANT
Constant layer.
@ kDEFAULT
Similar to ONNX Gather.
TempfileControlFlag
Flags used to control TensorRT's behavior when creating executable temporary files.
Definition: NvInferRuntime.h:622
@ kALLOW_IN_MEMORY_FILES
Allow creating and loading files in-memory (or unnamed files).
constexpr int32_t EnumMax< OptProfileSelector >() noexcept
Number of different values of OptProfileSelector enum.
Definition: NvInferRuntime.h:1265
WeightsRole
How a layer uses particular Weights.
Definition: NvInferRuntime.h:577
@ kSHIFT
shift part of IScaleLayer
@ kANY
Any other weights role.
@ kBIAS
bias for IConvolutionLayer, IDeconvolutionLayer, or IFullyConnectedLayer
@ kKERNEL
kernel for IConvolutionLayer, IDeconvolutionLayer, or IFullyConnectedLayer
constexpr int32_t EnumMax< ProfilingVerbosity >() noexcept
Maximum number of profile verbosity levels in ProfilingVerbosity enum.
Definition: NvInferRuntime.h:1530
ProfilingVerbosity
List of verbosity levels of layer information exposed in NVTX annotations and in IEngineInspector.
Definition: NvInferRuntime.h:1517
@ kLAYER_NAMES_ONLY
Print only the layer names. This is the default setting.
@ kDETAILED
Print detailed layer information including layer names and layer parameters.
TacticSource
List of tactic sources for TensorRT.
Definition: NvInferRuntime.h:1472
@ kEDGE_MASK_CONVOLUTIONS
TensorFormat PluginFormat
PluginFormat is reserved for backward compatibility.
Definition: NvInferRuntimePlugin.h:41
@ kMIN
Minimum of the two elements.
constexpr int32_t EnumMax< TempfileControlFlag >() noexcept
Maximum number of elements in TempfileControlFlag enum.
Definition: NvInferRuntime.h:634
TensorFormat
Format of the input/output tensors.
Definition: NvInferRuntimeBase.h:209
constexpr int32_t EnumMax< TacticSource >() noexcept
Maximum number of tactic sources in TacticSource enum.
Definition: NvInferRuntime.h:1494
LayerInformationFormat
The format in which the IEngineInspector prints the layer information.
Definition: NvInferRuntime.h:3467
@ kJSON
Print layer information in JSON format.
@ kONELINE
Print layer information in one line per layer.
constexpr int32_t EnumMax< DeviceType >() noexcept
Maximum number of elements in DeviceType enum.
Definition: NvInferRuntime.h:606
constexpr int32_t EnumMax< DimensionOperation >() noexcept
Maximum number of elements in DimensionOperation enum.
Definition: NvInferRuntime.h:206
TensorLocation
The location for tensor data storage, device or host.
Definition: NvInferRuntime.h:216
@ kHOST
Data stored on host.
@ kDEVICE
Data stored on device.
OptProfileSelector
When setting or querying optimization profile parameters (such as shape tensor inputs or dynamic dime...
Definition: NvInferRuntime.h:1253
@ kOPT
This is used to set or get the value that is used in the optimization (kernel selection).
Definition: NvInferRuntime.h:321
Dims min
Lower bounds on tensor’s dimensions.
Definition: NvInferRuntime.h:326
Dims max
Upper bounds on tensor’s dimensions.
Definition: NvInferRuntime.h:329
PluginTensorDesc desc
Information required to interpret a pointer to tensor data, except that desc.dims has -1 in place of ...
Definition: NvInferRuntime.h:323
Fields that a plugin might see for an input or output.
Definition: NvInferRuntimePlugin.h:54
Declaration of EnumMaxImpl struct to store maximum number of elements in an enumeration type.
Definition: NvInferRuntimeBase.h:105