api/c_api/_nv_infer_runtime_8h_source.html

/*

 * Copyright (c) 1993-2022, NVIDIA CORPORATION. All rights reserved.

 *

 * NOTICE TO LICENSEE:

 *

 * This source code and/or documentation ("Licensed Deliverables") are

 * subject to NVIDIA intellectual property rights under U.S. and

 * international Copyright laws.

 *

 * These Licensed Deliverables contained herein is PROPRIETARY and

 * CONFIDENTIAL to NVIDIA and is being provided under the terms and

 * conditions of a form of NVIDIA software license agreement by and

 * between NVIDIA and Licensee ("License Agreement") or electronically

 * accepted by Licensee.  Notwithstanding any terms or conditions to

 * the contrary in the License Agreement, reproduction or disclosure

 * of the Licensed Deliverables to any third party without the express

 * written consent of NVIDIA is prohibited.

 *

 * NOTWITHSTANDING ANY TERMS OR CONDITIONS TO THE CONTRARY IN THE

 * LICENSE AGREEMENT, NVIDIA MAKES NO REPRESENTATION ABOUT THE

 * SUITABILITY OF THESE LICENSED DELIVERABLES FOR ANY PURPOSE.  IT IS

 * PROVIDED "AS IS" WITHOUT EXPRESS OR IMPLIED WARRANTY OF ANY KIND.

 * NVIDIA DISCLAIMS ALL WARRANTIES WITH REGARD TO THESE LICENSED

 * DELIVERABLES, INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY,

 * NONINFRINGEMENT, AND FITNESS FOR A PARTICULAR PURPOSE.

 * NOTWITHSTANDING ANY TERMS OR CONDITIONS TO THE CONTRARY IN THE

 * LICENSE AGREEMENT, IN NO EVENT SHALL NVIDIA BE LIABLE FOR ANY

 * SPECIAL, INDIRECT, INCIDENTAL, OR CONSEQUENTIAL DAMAGES, OR ANY

 * DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS,

 * WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS

 * ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE

 * OF THESE LICENSED DELIVERABLES.

 *

 * U.S. Government End Users.  These Licensed Deliverables are a

 * "commercial item" as that term is defined at 48 C.F.R. 2.101 (OCT

 * 1995), consisting of "commercial computer software" and "commercial

 * computer software documentation" as such terms are used in 48

 * C.F.R. 12.212 (SEPT 1995) and is provided to the U.S. Government

 * only as a commercial end item.  Consistent with 48 C.F.R.12.212 and

 * 48 C.F.R. 227.7202-1 through 227.7202-4 (JUNE 1995), all

 * U.S. Government End Users acquire the Licensed Deliverables with

 * only those rights set forth herein.

 *

 * Any use of the Licensed Deliverables in individual and commercial

 * software must include, in the user documentation and internal

 * comments to the code, the above Disclaimer and U.S. Government End

 * Users Notice.

 */


#ifndef NV_INFER_RUNTIME_H

#define NV_INFER_RUNTIME_H


#include "NvInferImpl.h"

#include "NvInferRuntimeCommon.h"


namespace nvinfer1

{


class IExecutionContext;

class ICudaEngine;

class IPluginFactory;

class IEngineInspector;


//!
//! \class INoCopy
//!
//! \brief Base class that disables copying and moving for every type derived from it.
//!
//! All special member functions are protected, so an INoCopy can only be created and destroyed
//! as part of a derived object.
//!
class INoCopy
{
protected:
    INoCopy() = default;
    virtual ~INoCopy() = default;

    // Copying is disabled.
    INoCopy(INoCopy const&) = delete;
    INoCopy& operator=(INoCopy const&) = delete;

    // Moving is disabled as well.
    INoCopy(INoCopy&&) = delete;
    INoCopy& operator=(INoCopy&&) = delete;
};


//!
//! \enum EngineCapability
//!
//! \brief Execution capability of an engine, as returned by ICudaEngine::getEngineCapability().
//!
//! Three distinct values exist (0, 1, 2). Each one also has a deprecated alias that maps to the
//! same numeric value.
//!
enum class EngineCapability : int32_t
{
    kSTANDARD = 0,
    //! Deprecated alias of kSTANDARD.
    kDEFAULT TRT_DEPRECATED_ENUM = kSTANDARD,

    kSAFETY = 1,
    //! Deprecated alias of kSAFETY.
    kSAFE_GPU TRT_DEPRECATED_ENUM = kSAFETY,

    kDLA_STANDALONE = 2,
    //! Deprecated alias of kDLA_STANDALONE.
    kSAFE_DLA TRT_DEPRECATED_ENUM = kDLA_STANDALONE,
};


namespace impl

{

template <>

struct EnumMaxImpl<EngineCapability>

{

    static constexpr int32_t kVALUE = 3;

};

} // namespace impl


//!
//! \class Weights
//!
//! \brief Plain aggregate with three public fields describing a block of weight values.
//!
//! Passed by value to IRefitter::setWeights() and IRefitter::setNamedWeights().
//!
class Weights
{
public:
    DataType type;      //!< Data type tag for the values.
    void const* values; //!< Read-only pointer to the weight data.
    int64_t count;      //!< Element count (presumably the number of entries behind \p values -- confirm).
};


//!
//! \class IHostMemory
//!
//! \brief Accessor interface over a typed memory buffer, e.g. the object returned by
//! ICudaEngine::serialize().
//!
//! Every query forwards to the implementation object mImpl.
//!
class IHostMemory : public INoCopy
{
public:
    virtual ~IHostMemory() noexcept = default;

    //! \return The data pointer reported by the implementation.
    void* data() const noexcept { return mImpl->data(); }

    //! \return The size reported by the implementation.
    std::size_t size() const noexcept { return mImpl->size(); }

    //! \return The data type reported by the implementation.
    DataType type() const noexcept { return mImpl->type(); }

    //! \deprecated Marked TRT_DEPRECATED. Deletes this object, so it must not be used afterwards.
    TRT_DEPRECATED void destroy() noexcept { delete this; }

protected:
    apiv::VHostMemory* mImpl; //!< Implementation object that the accessors delegate to.
};


//!
//! \enum DimensionOperation
//!
//! \brief Operation selector accepted by IExprBuilder::operation().
//!
//! The numeric values are pinned explicitly. EnumMax<DimensionOperation>() reports their count (9).
//!
enum class DimensionOperation : int32_t
{
    kSUM = 0,
    kPROD = 1,
    kMAX = 2,
    kMIN = 3,
    kSUB = 4,
    kEQUAL = 5,
    kLESS = 6,
    kFLOOR_DIV = 7,
    kCEIL_DIV = 8,
};


//! Number of DimensionOperation values: one more than the last enumerator (kCEIL_DIV == 8), i.e. 9.
template <>
inline constexpr int32_t EnumMax<DimensionOperation>() noexcept
{
    return static_cast<int32_t>(DimensionOperation::kCEIL_DIV) + 1;
}


//!
//! \enum TensorLocation
//!
//! \brief Location of a binding, as returned by ICudaEngine::getLocation().
//!
enum class TensorLocation : int32_t
{
    kDEVICE = 0,
    kHOST = 1,
};


namespace impl

{

template <>

struct EnumMaxImpl<TensorLocation>

{

    static constexpr int32_t kVALUE = 2;

};

} // namespace impl


//!
//! \class IDimensionExpr
//!
//! \brief Read-only handle to a dimension expression, as produced by IExprBuilder.
//!
//! The destructor is protected, so holders of an IDimensionExpr pointer cannot delete it.
//!
class IDimensionExpr : public INoCopy
{
public:
    //! \brief Return true if expression is a build-time constant.
    bool isConstant() const noexcept { return mImpl->isConstant(); }

    //!
    //! \brief Return the constant value reported by the implementation.
    //!
    //! NOTE(review): the result for a non-constant expression is not visible in this header --
    //! confirm against the API documentation before relying on it.
    //!
    int32_t getConstantValue() const noexcept { return mImpl->getConstantValue(); }

protected:
    apiv::VDimensionExpr* mImpl; //!< Implementation object that the queries delegate to.
    virtual ~IDimensionExpr() noexcept = default;
};


//!
//! \class IExprBuilder
//!
//! \brief Factory for IDimensionExpr objects; handed to IPluginV2DynamicExt::getOutputDimensions().
//!
//! Both factory functions forward to the implementation object mImpl and return whatever pointer
//! it produces. The destructor is protected, so users cannot delete a builder.
//!
class IExprBuilder : public INoCopy
{
public:
    //! \brief Request an expression for the constant \p value.
    IDimensionExpr const* constant(int32_t value) noexcept { return mImpl->constant(value); }

    //! \brief Request an expression that applies \p op to the operands \p first and \p second.
    IDimensionExpr const* operation(
        DimensionOperation op, IDimensionExpr const& first, IDimensionExpr const& second) noexcept
    {
        return mImpl->operation(op, first, second);
    }

protected:
    apiv::VExprBuilder* mImpl; //!< Implementation object that creates the expressions.
    virtual ~IExprBuilder() noexcept = default;
};


//!
//! \class DimsExprs
//!
//! \brief Fixed-capacity list of dimension expressions.
//!
//! The array capacity is Dims::MAX_DIMS, the maximum rank supported for a tensor.
//!
class DimsExprs
{
public:
    int32_t nbDims;                          //!< The number of dimensions.
    IDimensionExpr const* d[Dims::MAX_DIMS]; //!< One expression pointer per dimension slot.
};


//!
//! \struct DynamicPluginTensorDesc
//!
//! \brief A PluginTensorDesc bundled with two extra Dims values; passed to
//! IPluginV2DynamicExt::configurePlugin().
//!
struct DynamicPluginTensorDesc
{
    PluginTensorDesc desc; //!< The tensor description itself.
    Dims min;              //!< NOTE(review): presumably the lower bound on the tensor's dimensions -- confirm.
    Dims max;              //!< NOTE(review): presumably the upper bound on the tensor's dimensions -- confirm.
};


class IPluginV2DynamicExt : public nvinfer1::IPluginV2Ext

{

public:

    IPluginV2DynamicExt* clone() const noexcept override = 0;


    virtual DimsExprs getOutputDimensions(

        int32_t outputIndex, const DimsExprs* inputs, int32_t nbInputs, IExprBuilder& exprBuilder) noexcept

        = 0;


    static constexpr int32_t kFORMAT_COMBINATION_LIMIT = 100;


    virtual bool supportsFormatCombination(

        int32_t pos, const PluginTensorDesc* inOut, int32_t nbInputs, int32_t nbOutputs) noexcept

        = 0;


    virtual void configurePlugin(const DynamicPluginTensorDesc* in, int32_t nbInputs,

        const DynamicPluginTensorDesc* out, int32_t nbOutputs) noexcept

        = 0;


    virtual size_t getWorkspaceSize(const PluginTensorDesc* inputs, int32_t nbInputs, const PluginTensorDesc* outputs,

        int32_t nbOutputs) const noexcept

        = 0;


    virtual int32_t enqueue(const PluginTensorDesc* inputDesc, const PluginTensorDesc* outputDesc,

        const void* const* inputs, void* const* outputs, void* workspace, cudaStream_t stream) noexcept

        = 0;


protected:

    int32_t getTensorRTVersion() const noexcept override

    {

        return (static_cast<int32_t>(PluginVersion::kV2_DYNAMICEXT) << 24 | (NV_TENSORRT_VERSION & 0xFFFFFF));

    }


    virtual ~IPluginV2DynamicExt() noexcept {}


private:

    // Following are obsolete base class methods, and must not be implemented or used.


    void configurePlugin(Dims const*, int32_t, Dims const*, int32_t, DataType const*, DataType const*, bool const*,

        bool const*, PluginFormat, int32_t) noexcept override final

    {

    }


    bool supportsFormat(DataType, PluginFormat) const noexcept override final

    {

        return false;

    }


    Dims getOutputDimensions(int32_t, Dims const*, int32_t) noexcept override final

    {

        return Dims{-1, {}};

    }


    bool isOutputBroadcastAcrossBatch(int32_t, bool const*, int32_t) const noexcept override final

    {

        return false;

    }


    bool canBroadcastInputAcrossBatch(int32_t) const noexcept override final

    {

        return true;

    }


    size_t getWorkspaceSize(int32_t) const noexcept override final

    {

        return 0;

    }


    int32_t enqueue(int32_t, const void* const*, void* const*, void*, cudaStream_t) noexcept override final

    {

        return 1;

    }

};


//!
//! \class IProfiler
//!
//! \brief Callback interface for receiving per-layer timing reports.
//!
//! An implementation is attached to a context with IExecutionContext::setProfiler().
//!
class IProfiler
{
public:
    //!
    //! \brief Timing callback for one layer.
    //!
    //! \param layerName Name of the layer being reported.
    //! \param ms Reported time (presumably in milliseconds, going by the parameter name -- confirm).
    //!
    virtual void reportLayerTime(char const* layerName, float ms) noexcept = 0;

    virtual ~IProfiler() noexcept {}
};


//!
//! \enum WeightsRole
//!
//! \brief Role tag for a set of weights; used by IRefitter::setWeights(), getMissing() and getAll().
//!
//! The numeric values are pinned explicitly. EnumMax<WeightsRole>() reports their count (6).
//!
enum class WeightsRole : int32_t
{
    kKERNEL = 0,
    kBIAS = 1,
    kSHIFT = 2,
    kSCALE = 3,
    kCONSTANT = 4,
    kANY = 5,
};


//! Number of WeightsRole values: one more than the last enumerator (kANY == 5), i.e. 6.
template <>
inline constexpr int32_t EnumMax<WeightsRole>() noexcept
{
    return static_cast<int32_t>(WeightsRole::kANY) + 1;
}


//!
//! \enum DeviceType
//!
//! \brief Device selector with two values, kGPU and kDLA.
//!
//! The values are spelled out explicitly; they equal the implicit numbering (0, 1).
//!
enum class DeviceType : int32_t
{
    kGPU = 0,
    kDLA = 1,
};


//! Number of DeviceType values: one more than the last enumerator (kDLA == 1), i.e. 2.
template <>
inline constexpr int32_t EnumMax<DeviceType>() noexcept
{
    return static_cast<int32_t>(DeviceType::kDLA) + 1;
}


//!
//! \class IRuntime
//!
//! \brief Runtime interface used to deserialize engines; instances are obtained from
//! nvinfer1::createInferRuntime().
//!
//! Every member function is a thin inline wrapper that forwards to the implementation object mImpl.
//!
class IRuntime : public INoCopy
{
public:
    virtual ~IRuntime() noexcept = default;

    //!
    //! \brief Deserialize an engine from the \p size bytes starting at \p blob.
    //!
    //! \param pluginFactory Ignored: this overload always forwards nullptr in its place.
    //!
    //! \deprecated Marked TRT_DEPRECATED; the two-argument overload performs the same call.
    //!
    TRT_DEPRECATED nvinfer1::ICudaEngine* deserializeCudaEngine(
        void const* blob, std::size_t size, IPluginFactory* pluginFactory) noexcept
    {
        // The factory is never read. The cast keeps -Wunused-parameter quiet for every
        // translation unit that includes this header.
        static_cast<void>(pluginFactory);
        return mImpl->deserializeCudaEngine(blob, size, nullptr);
    }

    //! \brief Pass the DLA core index \p dlaCore to the implementation.
    void setDLACore(int32_t dlaCore) noexcept { mImpl->setDLACore(dlaCore); }

    //! \brief Return the DLA core index reported by the implementation.
    int32_t getDLACore() const noexcept { return mImpl->getDLACore(); }

    //! \brief Return the number of DLA cores reported by the implementation.
    int32_t getNbDLACores() const noexcept { return mImpl->getNbDLACores(); }

    //! \deprecated Marked TRT_DEPRECATED. Deletes this object, so it must not be used afterwards.
    TRT_DEPRECATED void destroy() noexcept { delete this; }

    //! \brief Pass the GPU allocator \p allocator to the implementation.
    void setGpuAllocator(IGpuAllocator* allocator) noexcept { mImpl->setGpuAllocator(allocator); }

    //! \brief Set the ErrorRecorder for this interface.
    void setErrorRecorder(IErrorRecorder* recorder) noexcept { mImpl->setErrorRecorder(recorder); }

    //! \brief Get the ErrorRecorder assigned to this interface.
    IErrorRecorder* getErrorRecorder() const noexcept { return mImpl->getErrorRecorder(); }

    //!
    //! \brief Deserialize an engine from the \p size bytes starting at \p blob.
    //!
    //! \return The engine pointer produced by the implementation.
    //!
    ICudaEngine* deserializeCudaEngine(void const* blob, std::size_t size) noexcept
    {
        return mImpl->deserializeCudaEngine(blob, size, nullptr);
    }

    //! \brief Return the logger reported by the implementation.
    ILogger* getLogger() const noexcept { return mImpl->getLogger(); }

    //! \brief Pass the thread limit \p maxThreads to the implementation and return its status flag.
    bool setMaxThreads(int32_t maxThreads) noexcept { return mImpl->setMaxThreads(maxThreads); }

    //! \brief Return the thread limit reported by the implementation.
    int32_t getMaxThreads() const noexcept { return mImpl->getMaxThreads(); }

protected:
    apiv::VRuntime* mImpl; //!< Implementation object that every wrapper delegates to.
};


//!
//! \class IRefitter
//!
//! \brief Interface for updating the weights of an engine; instances are obtained from
//! nvinfer1::createInferRefitter().
//!
//! Every member function is a thin inline wrapper that forwards to the implementation object mImpl.
//!
class IRefitter : public INoCopy
{
public:
    virtual ~IRefitter() noexcept = default;

    //! \brief Supply \p weights for the (\p layerName, \p role) pair; returns the implementation's status flag.
    bool setWeights(char const* layerName, WeightsRole role, Weights weights) noexcept
    {
        return mImpl->setWeights(layerName, role, weights);
    }

    //! \brief Ask the implementation to refit the engine; returns its status flag.
    bool refitCudaEngine() noexcept { return mImpl->refitCudaEngine(); }

    //!
    //! \brief Query missing weights as (layer name, role) pairs.
    //!
    //! \param size Capacity argument forwarded to the implementation.
    //! \param layerNames Output array for layer names.
    //! \param roles Output array for roles.
    //!
    //! \return The count reported by the implementation.
    //!
    int32_t getMissing(int32_t size, char const** layerNames, WeightsRole* roles) noexcept
    {
        return mImpl->getMissing(size, layerNames, roles);
    }

    //! \brief Same calling convention as getMissing(), forwarded to the implementation's getAll().
    int32_t getAll(int32_t size, char const** layerNames, WeightsRole* roles) noexcept
    {
        return mImpl->getAll(size, layerNames, roles);
    }

    //! \deprecated Marked TRT_DEPRECATED. Deletes this object, so it must not be used afterwards.
    TRT_DEPRECATED void destroy() noexcept { delete this; }

    //! \brief Set the dynamic range [\p min, \p max] for tensor \p tensorName; returns the status flag.
    bool setDynamicRange(char const* tensorName, float min, float max) noexcept
    {
        return mImpl->setDynamicRange(tensorName, min, max);
    }

    //! \brief Return the dynamic-range minimum reported for \p tensorName.
    float getDynamicRangeMin(char const* tensorName) const noexcept
    {
        return mImpl->getDynamicRangeMin(tensorName);
    }

    //! \brief Return the dynamic-range maximum reported for \p tensorName.
    float getDynamicRangeMax(char const* tensorName) const noexcept
    {
        return mImpl->getDynamicRangeMax(tensorName);
    }

    //! \brief Query tensor names with a dynamic range into \p tensorNames; returns the reported count.
    int32_t getTensorsWithDynamicRange(int32_t size, char const** tensorNames) const noexcept
    {
        return mImpl->getTensorsWithDynamicRange(size, tensorNames);
    }

    //! \brief Set the ErrorRecorder for this interface.
    void setErrorRecorder(IErrorRecorder* recorder) noexcept { mImpl->setErrorRecorder(recorder); }

    //! \brief Get the ErrorRecorder assigned to this interface.
    IErrorRecorder* getErrorRecorder() const noexcept { return mImpl->getErrorRecorder(); }

    //! \brief Supply \p weights for the weights called \p name; returns the implementation's status flag.
    bool setNamedWeights(char const* name, Weights weights) noexcept { return mImpl->setNamedWeights(name, weights); }

    //! \brief Query names of missing weights into \p weightsNames; returns the reported count.
    int32_t getMissingWeights(int32_t size, char const** weightsNames) noexcept
    {
        return mImpl->getMissingWeights(size, weightsNames);
    }

    //! \brief Same calling convention as getMissingWeights(), forwarded to the implementation's getAllWeights().
    int32_t getAllWeights(int32_t size, char const** weightsNames) noexcept
    {
        return mImpl->getAllWeights(size, weightsNames);
    }

    //! \brief Return the logger reported by the implementation.
    ILogger* getLogger() const noexcept { return mImpl->getLogger(); }

    //! \brief Pass the thread limit \p maxThreads to the implementation and return its status flag.
    bool setMaxThreads(int32_t maxThreads) noexcept { return mImpl->setMaxThreads(maxThreads); }

    //! \brief Return the thread limit reported by the implementation.
    int32_t getMaxThreads() const noexcept { return mImpl->getMaxThreads(); }

protected:
    apiv::VRefitter* mImpl; //!< Implementation object that every wrapper delegates to.
};


//!
//! \enum OptProfileSelector
//!
//! \brief Selects the minimum, optimum or maximum entry of an optimization profile.
//!
enum class OptProfileSelector : int32_t
{
    kMIN = 0,
    kOPT = 1,
    kMAX = 2,
};


//! Number of OptProfileSelector values: one more than the last enumerator (kMAX == 2), i.e. 3.
template <>
inline constexpr int32_t EnumMax<OptProfileSelector>() noexcept
{
    return static_cast<int32_t>(OptProfileSelector::kMAX) + 1;
}


//!
//! \class IOptimizationProfile
//!
//! \brief Holds per-input dimensions and shape values for each OptProfileSelector entry.
//!
//! Every member function forwards to the implementation object mImpl. The destructor is
//! protected, so users cannot delete a profile.
//!
class IOptimizationProfile : public INoCopy
{
public:
    //! \brief Store \p dims for input \p inputName under selector \p select; returns the status flag.
    bool setDimensions(char const* inputName, OptProfileSelector select, Dims dims) noexcept
    {
        return mImpl->setDimensions(inputName, select, dims);
    }

    //! \brief Return the dimensions reported for input \p inputName under selector \p select.
    Dims getDimensions(char const* inputName, OptProfileSelector select) const noexcept
    {
        return mImpl->getDimensions(inputName, select);
    }

    //! \brief Store \p nbValues shape values from \p values for \p inputName under \p select; returns the status flag.
    bool setShapeValues(
        char const* inputName, OptProfileSelector select, int32_t const* values, int32_t nbValues) noexcept
    {
        return mImpl->setShapeValues(inputName, select, values, nbValues);
    }

    //! \brief Return the number of shape values reported for input \p inputName.
    int32_t getNbShapeValues(char const* inputName) const noexcept { return mImpl->getNbShapeValues(inputName); }

    //! \brief Return the shape-value pointer reported for input \p inputName under selector \p select.
    int32_t const* getShapeValues(char const* inputName, OptProfileSelector select) const noexcept
    {
        return mImpl->getShapeValues(inputName, select);
    }

    //! \brief Pass the extra-memory target \p target to the implementation; returns the status flag.
    bool setExtraMemoryTarget(float target) noexcept { return mImpl->setExtraMemoryTarget(target); }

    //! \brief Return the extra-memory target reported by the implementation.
    float getExtraMemoryTarget() const noexcept { return mImpl->getExtraMemoryTarget(); }

    //! \brief Return the implementation's validity verdict for this profile.
    bool isValid() const noexcept { return mImpl->isValid(); }

protected:
    apiv::VOptimizationProfile* mImpl; //!< Implementation object that every wrapper delegates to.
    virtual ~IOptimizationProfile() noexcept = default;
};


//!
//! \enum TacticSource
//!
//! \brief Identifies a tactic source; see also the TacticSources alias declared after this enum.
//!
enum class TacticSource : int32_t
{
    kCUBLAS = 0,
    kCUBLAS_LT = 1,
    kCUDNN = 2,
};


//! Number of TacticSource values: one more than the last enumerator (kCUDNN == 2), i.e. 3.
template <>
inline constexpr int32_t EnumMax<TacticSource>() noexcept
{
    return static_cast<int32_t>(TacticSource::kCUDNN) + 1;
}


//! Unsigned 32-bit integer type returned by ICudaEngine::getTacticSources().
//! NOTE(review): presumably a bitmask with one bit per TacticSource value -- confirm.
using TacticSources = uint32_t;


//!
//! \enum ProfilingVerbosity
//!
//! \brief Profiling verbosity setting, as returned by ICudaEngine::getProfilingVerbosity().
//!
//! Three distinct values exist (0, 1, 2), plus two deprecated aliases.
//!
enum class ProfilingVerbosity : int32_t
{
    kLAYER_NAMES_ONLY = 0,
    kNONE = 1,
    kDETAILED = 2,

    //! Deprecated alias of kLAYER_NAMES_ONLY.
    kDEFAULT TRT_DEPRECATED_ENUM = kLAYER_NAMES_ONLY,
    //! Deprecated alias of kDETAILED.
    kVERBOSE TRT_DEPRECATED_ENUM = kDETAILED
};


//! Number of distinct ProfilingVerbosity values: one more than the largest enumerator (kDETAILED == 2), i.e. 3.
template <>
inline constexpr int32_t EnumMax<ProfilingVerbosity>() noexcept
{
    return static_cast<int32_t>(ProfilingVerbosity::kDETAILED) + 1;
}


//!
//! \class ICudaEngine
//!
//! \brief An engine for executing inference on a built network, with functionally unsafe features.
//!
//! Every member function is a thin inline wrapper that forwards to the implementation object mImpl.
//!
class ICudaEngine : public INoCopy
{
public:
    virtual ~ICudaEngine() noexcept = default;

    //! \brief Return the number of bindings reported by the implementation.
    int32_t getNbBindings() const noexcept { return mImpl->getNbBindings(); }

    //! \brief Retrieve the binding index for a named tensor.
    int32_t getBindingIndex(char const* name) const noexcept { return mImpl->getBindingIndex(name); }

    //! \brief Retrieve the name corresponding to a binding index.
    char const* getBindingName(int32_t bindingIndex) const noexcept { return mImpl->getBindingName(bindingIndex); }

    //! \brief Determine whether a binding is an input binding.
    bool bindingIsInput(int32_t bindingIndex) const noexcept { return mImpl->bindingIsInput(bindingIndex); }

    //! \brief Get the dimensions of a binding.
    Dims getBindingDimensions(int32_t bindingIndex) const noexcept
    {
        return mImpl->getBindingDimensions(bindingIndex);
    }

    //! \brief Determine the required data type for a buffer from its binding index.
    DataType getBindingDataType(int32_t bindingIndex) const noexcept
    {
        return mImpl->getBindingDataType(bindingIndex);
    }

    //! \brief Get the maximum batch size which can be used for inference.
    int32_t getMaxBatchSize() const noexcept { return mImpl->getMaxBatchSize(); }

    //! \brief Get the number of layers in the network.
    int32_t getNbLayers() const noexcept { return mImpl->getNbLayers(); }

    //! \brief Serialize the network to a stream.
    IHostMemory* serialize() const noexcept { return mImpl->serialize(); }

    //! \brief Create an execution context.
    IExecutionContext* createExecutionContext() noexcept { return mImpl->createExecutionContext(); }

    //! \brief Destroy this object.
    //! \deprecated Marked TRT_DEPRECATED. Deletes this object, so it must not be used afterwards.
    TRT_DEPRECATED void destroy() noexcept { delete this; }

    //! \brief Get location of binding.
    TensorLocation getLocation(int32_t bindingIndex) const noexcept { return mImpl->getLocation(bindingIndex); }

    //! \brief Create an execution context without any device memory allocated.
    IExecutionContext* createExecutionContextWithoutDeviceMemory() noexcept
    {
        return mImpl->createExecutionContextWithoutDeviceMemory();
    }

    //! \brief Return the amount of device memory required by an execution context.
    size_t getDeviceMemorySize() const noexcept { return mImpl->getDeviceMemorySize(); }

    //! \brief Return true if an engine can be refit.
    bool isRefittable() const noexcept { return mImpl->isRefittable(); }

    //! \brief Return the number of bytes per component of an element.
    int32_t getBindingBytesPerComponent(int32_t bindingIndex) const noexcept
    {
        return mImpl->getBindingBytesPerComponent(bindingIndex);
    }

    //! \brief Return the number of components included in one element.
    int32_t getBindingComponentsPerElement(int32_t bindingIndex) const noexcept
    {
        return mImpl->getBindingComponentsPerElement(bindingIndex);
    }

    //! \brief Return the binding format.
    TensorFormat getBindingFormat(int32_t bindingIndex) const noexcept
    {
        return mImpl->getBindingFormat(bindingIndex);
    }

    //! \brief Return the human readable description of the tensor format.
    char const* getBindingFormatDesc(int32_t bindingIndex) const noexcept
    {
        return mImpl->getBindingFormatDesc(bindingIndex);
    }

    //! \brief Return the dimension index along which the buffer is vectorized.
    int32_t getBindingVectorizedDim(int32_t bindingIndex) const noexcept
    {
        return mImpl->getBindingVectorizedDim(bindingIndex);
    }

    //! \brief Returns the name of the network associated with the engine.
    char const* getName() const noexcept { return mImpl->getName(); }

    //! \brief Get the number of optimization profiles defined for this engine.
    int32_t getNbOptimizationProfiles() const noexcept { return mImpl->getNbOptimizationProfiles(); }

    //! \brief Get the minimum / optimum / maximum dimensions for a particular binding under an
    //! optimization profile.
    Dims getProfileDimensions(int32_t bindingIndex, int32_t profileIndex, OptProfileSelector select) const noexcept
    {
        return mImpl->getProfileDimensions(bindingIndex, profileIndex, select);
    }

    //!
    //! \brief Get minimum / optimum / maximum values for an input shape binding under an
    //! optimization profile.
    //!
    //! Note the argument order: the profile index comes first here, unlike getProfileDimensions().
    //!
    int32_t const* getProfileShapeValues(int32_t profileIndex, int32_t inputIndex, OptProfileSelector select) const
        noexcept
    {
        return mImpl->getProfileShapeValues(profileIndex, inputIndex, select);
    }

    //! \brief True if tensor is required as input for shape calculations or output from them.
    bool isShapeBinding(int32_t bindingIndex) const noexcept { return mImpl->isShapeBinding(bindingIndex); }

    //! \brief True if pointer to tensor data is required for execution phase, false if nullptr can be supplied.
    bool isExecutionBinding(int32_t bindingIndex) const noexcept { return mImpl->isExecutionBinding(bindingIndex); }

    //! \brief Determine what execution capability this engine has.
    EngineCapability getEngineCapability() const noexcept { return mImpl->getEngineCapability(); }

    //! \brief Set the ErrorRecorder for this interface.
    void setErrorRecorder(IErrorRecorder* recorder) noexcept
    {
        // Plain call, no `return`: this is a void function, and this form matches the other
        // setErrorRecorder wrappers in this header.
        mImpl->setErrorRecorder(recorder);
    }

    //! \brief Get the ErrorRecorder assigned to this interface.
    IErrorRecorder* getErrorRecorder() const noexcept { return mImpl->getErrorRecorder(); }

    //! \brief Query whether the engine was built with an implicit batch dimension.
    bool hasImplicitBatchDimension() const noexcept { return mImpl->hasImplicitBatchDimension(); }

    //! \brief Return the tactic sources required by this engine.
    TacticSources getTacticSources() const noexcept { return mImpl->getTacticSources(); }

    //! \brief Return the ProfilingVerbosity the builder config was set to when the engine was built.
    ProfilingVerbosity getProfilingVerbosity() const noexcept { return mImpl->getProfilingVerbosity(); }

    //! \brief Create a new engine inspector which prints the layer information in an engine or an
    //! execution context.
    IEngineInspector* createEngineInspector() const noexcept { return mImpl->createEngineInspector(); }

protected:
    apiv::VCudaEngine* mImpl; //!< Implementation object that every wrapper delegates to.
};


//!
//! \class IExecutionContext
//!
//! \brief Context for running inference with an engine; created by
//! ICudaEngine::createExecutionContext() or createExecutionContextWithoutDeviceMemory().
//!
//! Every member function is a thin inline wrapper that forwards to the implementation object mImpl.
//!
class IExecutionContext : public INoCopy
{
public:
    virtual ~IExecutionContext() noexcept = default;

    //! \brief Forward \p batchSize and the binding pointers to the implementation's execute(); returns its status flag.
    bool execute(int32_t batchSize, void* const* bindings) noexcept { return mImpl->execute(batchSize, bindings); }

    //! \brief Forward to the implementation's enqueue() with the given CUDA stream and event pointer;
    //! returns its status flag.
    bool enqueue(int32_t batchSize, void* const* bindings, cudaStream_t stream, cudaEvent_t* inputConsumed) noexcept
    {
        return mImpl->enqueue(batchSize, bindings, stream, inputConsumed);
    }

    //! \brief Pass the debug-sync flag \p sync to the implementation.
    void setDebugSync(bool sync) noexcept { mImpl->setDebugSync(sync); }

    //! \brief Return the debug-sync flag reported by the implementation.
    bool getDebugSync() const noexcept { return mImpl->getDebugSync(); }

    //! \brief Attach the profiler \p profiler.
    void setProfiler(IProfiler* profiler) noexcept { mImpl->setProfiler(profiler); }

    //! \brief Return the profiler reported by the implementation.
    IProfiler* getProfiler() const noexcept { return mImpl->getProfiler(); }

    //! \brief Return the engine reported by the implementation.
    ICudaEngine const& getEngine() const noexcept { return mImpl->getEngine(); }

    //! \deprecated Marked TRT_DEPRECATED. Deletes this object, so it must not be used afterwards.
    TRT_DEPRECATED void destroy() noexcept { delete this; }

    //! \brief Pass the context name \p name to the implementation.
    void setName(char const* name) noexcept { mImpl->setName(name); }

    //! \brief Return the context name reported by the implementation.
    char const* getName() const noexcept { return mImpl->getName(); }

    //! \brief Pass the device memory pointer \p memory to the implementation.
    void setDeviceMemory(void* memory) noexcept { mImpl->setDeviceMemory(memory); }

    //! \brief Return the strides reported for binding \p bindingIndex.
    Dims getStrides(int32_t bindingIndex) const noexcept { return mImpl->getStrides(bindingIndex); }

    //! \brief Select optimization profile \p profileIndex; returns the implementation's status flag.
    //! \deprecated Marked TRT_DEPRECATED; setOptimizationProfileAsync() is the stream-taking variant.
    TRT_DEPRECATED bool setOptimizationProfile(int32_t profileIndex) noexcept
    {
        return mImpl->setOptimizationProfile(profileIndex);
    }

    //! \brief Return the optimization profile index reported by the implementation.
    int32_t getOptimizationProfile() const noexcept { return mImpl->getOptimizationProfile(); }

    //! \brief Set \p dimensions for binding \p bindingIndex; returns the implementation's status flag.
    bool setBindingDimensions(int32_t bindingIndex, Dims dimensions) noexcept
    {
        return mImpl->setBindingDimensions(bindingIndex, dimensions);
    }

    //! \brief Return the dimensions reported for binding \p bindingIndex.
    Dims getBindingDimensions(int32_t bindingIndex) const noexcept
    {
        return mImpl->getBindingDimensions(bindingIndex);
    }

    //! \brief Pass the shape values at \p data for binding \p bindingIndex; returns the status flag.
    bool setInputShapeBinding(int32_t bindingIndex, int32_t const* data) noexcept
    {
        return mImpl->setInputShapeBinding(bindingIndex, data);
    }

    //! \brief Ask the implementation to write the shape values of binding \p bindingIndex to \p data;
    //! returns the status flag.
    bool getShapeBinding(int32_t bindingIndex, int32_t* data) const noexcept
    {
        return mImpl->getShapeBinding(bindingIndex, data);
    }

    //! \brief Return the implementation's answer to whether all input dimensions are specified.
    bool allInputDimensionsSpecified() const noexcept { return mImpl->allInputDimensionsSpecified(); }

    //! \brief Return the implementation's answer to whether all input shapes are specified.
    bool allInputShapesSpecified() const noexcept { return mImpl->allInputShapesSpecified(); }

    //! \brief Set the ErrorRecorder for this interface.
    void setErrorRecorder(IErrorRecorder* recorder) noexcept { mImpl->setErrorRecorder(recorder); }

    //! \brief Get the ErrorRecorder assigned to this interface.
    IErrorRecorder* getErrorRecorder() const noexcept { return mImpl->getErrorRecorder(); }

    //! \brief Forward the binding pointers to the implementation's executeV2(); returns its status flag.
    bool executeV2(void* const* bindings) noexcept { return mImpl->executeV2(bindings); }

    //! \brief Forward to the implementation's enqueueV2() with the given CUDA stream and event pointer;
    //! returns its status flag.
    bool enqueueV2(void* const* bindings, cudaStream_t stream, cudaEvent_t* inputConsumed) noexcept
    {
        return mImpl->enqueueV2(bindings, stream, inputConsumed);
    }

    //! \brief Select optimization profile \p profileIndex, passing \p stream along; returns the status flag.
    bool setOptimizationProfileAsync(int32_t profileIndex, cudaStream_t stream) noexcept
    {
        return mImpl->setOptimizationProfileAsync(profileIndex, stream);
    }

    //! \brief Pass the enqueue-emits-profile flag to the implementation.
    void setEnqueueEmitsProfile(bool enqueueEmitsProfile) noexcept
    {
        mImpl->setEnqueueEmitsProfile(enqueueEmitsProfile);
    }

    //! \brief Return the enqueue-emits-profile flag reported by the implementation.
    bool getEnqueueEmitsProfile() const noexcept { return mImpl->getEnqueueEmitsProfile(); }

    //! \brief Forward to the implementation's reportToProfiler(); returns its status flag.
    bool reportToProfiler() const noexcept { return mImpl->reportToProfiler(); }

protected:
    apiv::VExecutionContext* mImpl; //!< Implementation object that every wrapper delegates to.
}; // class IExecutionContext


//!
//! \enum LayerInformationFormat
//!
//! \brief Output format selector for IEngineInspector::getLayerInformation() and
//! IEngineInspector::getEngineInformation().
//!
enum class LayerInformationFormat : int32_t
{
    kONELINE = 0,
    kJSON = 1,
};


//! Number of LayerInformationFormat values: one more than the last enumerator (kJSON == 1), i.e. 2.
template <>
inline constexpr int32_t EnumMax<LayerInformationFormat>() noexcept
{
    return static_cast<int32_t>(LayerInformationFormat::kJSON) + 1;
}


//!
//! \class IEngineInspector
//!
//! \brief An engine inspector which prints out the layer information of an engine or an execution context.
//!
//! Instances are created by ICudaEngine::createEngineInspector(). Every member function forwards
//! to the implementation object mImpl.
//!
class IEngineInspector : public INoCopy
{
public:
    virtual ~IEngineInspector() noexcept = default;

    //! \brief Pass the execution context \p context to the implementation; returns its status flag.
    bool setExecutionContext(IExecutionContext const* context) noexcept
    {
        return mImpl->setExecutionContext(context);
    }

    //! \brief Return the execution context reported by the implementation.
    IExecutionContext const* getExecutionContext() const noexcept { return mImpl->getExecutionContext(); }

    //! \brief Return the information string for layer \p layerIndex in the requested \p format.
    AsciiChar const* getLayerInformation(int32_t layerIndex, LayerInformationFormat format) const noexcept
    {
        return mImpl->getLayerInformation(layerIndex, format);
    }

    //! \brief Return the information string for the engine in the requested \p format.
    AsciiChar const* getEngineInformation(LayerInformationFormat format) const noexcept
    {
        return mImpl->getEngineInformation(format);
    }

    //! \brief Set the ErrorRecorder for this interface.
    void setErrorRecorder(IErrorRecorder* recorder) noexcept { mImpl->setErrorRecorder(recorder); }

    //! \brief Get the ErrorRecorder assigned to this interface.
    IErrorRecorder* getErrorRecorder() const noexcept { return mImpl->getErrorRecorder(); }

protected:
    apiv::VEngineInspector* mImpl; //!< Implementation object that every wrapper delegates to.
}; // class IEngineInspector


} // namespace nvinfer1


//! Internal C entry point behind nvinfer1::createInferRuntime(). That wrapper passes the address
//! of an ILogger and NV_TENSORRT_VERSION, and casts the returned pointer to IRuntime*.
extern "C" TENSORRTAPI void* createInferRuntime_INTERNAL(void* logger, int32_t version) noexcept;


//! Internal C entry point behind nvinfer1::createInferRefitter(). That wrapper passes the addresses
//! of an ICudaEngine and an ILogger plus NV_TENSORRT_VERSION, and casts the returned pointer to
//! IRefitter*.
extern "C" TENSORRTAPI void* createInferRefitter_INTERNAL(void* engine, void* logger, int32_t version) noexcept;


//! Return the plugin registry.
extern "C" TENSORRTAPI nvinfer1::IPluginRegistry* getPluginRegistry() noexcept;


//! Return the logger object.
extern "C" TENSORRTAPI nvinfer1::ILogger* getLogger() noexcept;


namespace nvinfer1

{

namespace // unnamed namespace avoids linkage surprises when linking objects built with different versions of this
          // header.
{

//!
//! \brief Create an IRuntime that uses \p logger.
//!
//! Calls createInferRuntime_INTERNAL() with the address of \p logger and the NV_TENSORRT_VERSION
//! this header was compiled with, then casts the untyped result to IRuntime*.
//!
inline IRuntime* createInferRuntime(ILogger& logger) noexcept
{
    void* const untypedRuntime = createInferRuntime_INTERNAL(&logger, NV_TENSORRT_VERSION);
    return static_cast<IRuntime*>(untypedRuntime);
}

//!
//! \brief Create an IRefitter for \p engine that uses \p logger.
//!
//! Calls createInferRefitter_INTERNAL() with the addresses of \p engine and \p logger and the
//! NV_TENSORRT_VERSION this header was compiled with, then casts the untyped result to IRefitter*.
//!
inline IRefitter* createInferRefitter(ICudaEngine& engine, ILogger& logger) noexcept
{
    void* const untypedRefitter = createInferRefitter_INTERNAL(&engine, &logger, NV_TENSORRT_VERSION);
    return static_cast<IRefitter*>(untypedRefitter);
}

} // namespace


//!
//! \class PluginRegistrar
//!
//! \brief Helper whose constructor registers an owned creator object with the plugin registry.
//!
//! \tparam T Creator type; it must be value-initializable because the object is held as a member.
//!
//! The creator is registered under an empty string as the second argument of registerCreator().
//! The result of registerCreator() is not inspected.
//!
template <typename T>
class PluginRegistrar
{
public:
    PluginRegistrar()
    {
        auto* const registry = getPluginRegistry();
        registry->registerCreator(instance, "");
    }

private:
    T instance{}; //!< The creator handed to the registry; it lives as long as this registrar.
};


} // namespace nvinfer1


//!
//! \brief Define a static nvinfer1::PluginRegistrar<name> object called pluginRegistrar<name>.
//!
//! The PluginRegistrar constructor performs the registration. The expansion has no trailing
//! semicolon; the caller supplies it.
//!
//! The macro body must directly follow the backslash continuation. A blank line after the
//! backslash would end the macro there, leaving it empty and the body as a stray declaration.
//!
#define REGISTER_TENSORRT_PLUGIN(name)                                                                                 \
    static nvinfer1::PluginRegistrar<name> pluginRegistrar##name {}

#endif // NV_INFER_RUNTIME_H

getLogger
nvinfer1::ILogger * getLogger() noexcept
Return the logger object.

getPluginRegistry
nvinfer1::IPluginRegistry * getPluginRegistry() noexcept
Return the plugin registry.

NvInferRuntimeCommon.h

TENSORRTAPI
#define TENSORRTAPI
Definition: NvInferRuntimeCommon.h:91

NV_TENSORRT_VERSION
#define NV_TENSORRT_VERSION
Definition: NvInferRuntimeCommon.h:110

TRT_DEPRECATED
#define TRT_DEPRECATED
Definition: NvInferRuntimeCommon.h:77

TRT_DEPRECATED_ENUM
#define TRT_DEPRECATED_ENUM
Definition: NvInferRuntimeCommon.h:78

Dims
Structure to define the dimensions of a tensor.

nvinfer1::Dims32
Definition: NvInferRuntimeCommon.h:190

nvinfer1::Dims32::MAX_DIMS
static constexpr int32_t MAX_DIMS
The maximum rank (number of dimensions) supported for a tensor.
Definition: NvInferRuntimeCommon.h:193

nvinfer1::DimsExprs
Definition: NvInferRuntime.h:346

nvinfer1::DimsExprs::nbDims
int32_t nbDims
The number of dimensions.
Definition: NvInferRuntime.h:348

nvinfer1::ICudaEngine
An engine for executing inference on a built network, with functionally unsafe features.
Definition: NvInferRuntime.h:1379

nvinfer1::ICudaEngine::getBindingBytesPerComponent
int32_t getBindingBytesPerComponent(int32_t bindingIndex) const noexcept
Return the number of bytes per component of an element.
Definition: NvInferRuntime.h:1612

nvinfer1::ICudaEngine::getBindingComponentsPerElement
int32_t getBindingComponentsPerElement(int32_t bindingIndex) const noexcept
Return the number of components included in one element.
Definition: NvInferRuntime.h:1626

nvinfer1::ICudaEngine::isShapeBinding
bool isShapeBinding(int32_t bindingIndex) const noexcept
True if tensor is required as input for shape calculations or output from them.
Definition: NvInferRuntime.h:1783

nvinfer1::ICudaEngine::hasImplicitBatchDimension
bool hasImplicitBatchDimension() const noexcept
Query whether the engine was built with an implicit batch dimension.
Definition: NvInferRuntime.h:1864

nvinfer1::ICudaEngine::getName
const char * getName() const noexcept
Returns the name of the network associated with the engine.
Definition: NvInferRuntime.h:1682

nvinfer1::ICudaEngine::getEngineCapability
EngineCapability getEngineCapability() const noexcept
Determine what execution capability this engine has.
Definition: NvInferRuntime.h:1812

nvinfer1::ICudaEngine::destroy
TRT_DEPRECATED void destroy() noexcept
Destroy this object.
Definition: NvInferRuntime.h:1554

nvinfer1::ICudaEngine::getErrorRecorder
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:1845

nvinfer1::ICudaEngine::getBindingFormat
TensorFormat getBindingFormat(int32_t bindingIndex) const noexcept
Return the binding format.
Definition: NvInferRuntime.h:1636

nvinfer1::ICudaEngine::mImpl
apiv::VCudaEngine * mImpl
Definition: NvInferRuntime.h:1900

nvinfer1::ICudaEngine::getProfileShapeValues
const int32_t * getProfileShapeValues(int32_t profileIndex, int32_t inputIndex, OptProfileSelector select) const noexcept
Get minimum / optimum / maximum values for an input shape binding under an optimization profile.
Definition: NvInferRuntime.h:1746

nvinfer1::ICudaEngine::getLocation
TensorLocation getLocation(int32_t bindingIndex) const noexcept
Get location of binding.
Definition: NvInferRuntime.h:1569

nvinfer1::ICudaEngine::getProfileDimensions
Dims getProfileDimensions(int32_t bindingIndex, int32_t profileIndex, OptProfileSelector select) const noexcept
Get the minimum / optimum / maximum dimensions for a particular binding under an optimization profile...
Definition: NvInferRuntime.h:1720

nvinfer1::ICudaEngine::getBindingDimensions
Dims getBindingDimensions(int32_t bindingIndex) const noexcept
Get the dimensions of a binding.
Definition: NvInferRuntime.h:1473

nvinfer1::ICudaEngine::getBindingVectorizedDim
int32_t getBindingVectorizedDim(int32_t bindingIndex) const noexcept
Return the dimension index along which the buffer is vectorized.
Definition: NvInferRuntime.h:1667

nvinfer1::ICudaEngine::getMaxBatchSize
int32_t getMaxBatchSize() const noexcept
Get the maximum batch size which can be used for inference.
Definition: NvInferRuntime.h:1498

nvinfer1::ICudaEngine::setErrorRecorder
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:1830

nvinfer1::ICudaEngine::getDeviceMemorySize
size_t getDeviceMemorySize() const noexcept
Return the amount of device memory required by an execution context.
Definition: NvInferRuntime.h:1588

nvinfer1::ICudaEngine::getTacticSources
TacticSources getTacticSources() const noexcept
Return the tactic sources required by this engine.
Definition: NvInferRuntime.h:1873

nvinfer1::ICudaEngine::~ICudaEngine
virtual ~ICudaEngine() noexcept=default

nvinfer1::ICudaEngine::getProfilingVerbosity
ProfilingVerbosity getProfilingVerbosity() const noexcept
Return the ProfilingVerbosity the builder config was set to when the engine was built.
Definition: NvInferRuntime.h:1884

nvinfer1::ICudaEngine::serialize
IHostMemory * serialize() const noexcept
Serialize the network to a stream.
Definition: NvInferRuntime.h:1526

nvinfer1::ICudaEngine::createExecutionContextWithoutDeviceMemory
IExecutionContext * createExecutionContextWithoutDeviceMemory() noexcept
Create an execution context without any device memory allocated.
Definition: NvInferRuntime.h:1578

nvinfer1::ICudaEngine::getBindingIndex
int32_t getBindingIndex(const char *name) const noexcept
Retrieve the binding index for a named tensor.
Definition: NvInferRuntime.h:1415

nvinfer1::ICudaEngine::getBindingDataType
DataType getBindingDataType(int32_t bindingIndex) const noexcept
Determine the required data type for a buffer from its binding index.
Definition: NvInferRuntime.h:1486

nvinfer1::ICudaEngine::createExecutionContext
IExecutionContext * createExecutionContext() noexcept
Create an execution context.
Definition: NvInferRuntime.h:1542

nvinfer1::ICudaEngine::createEngineInspector
IEngineInspector * createEngineInspector() const noexcept
Create a new engine inspector which prints the layer information in an engine or an execution context...
Definition: NvInferRuntime.h:1894

nvinfer1::ICudaEngine::getBindingName
const char * getBindingName(int32_t bindingIndex) const noexcept
Retrieve the name corresponding to a binding index.
Definition: NvInferRuntime.h:1435

nvinfer1::ICudaEngine::getNbOptimizationProfiles
int32_t getNbOptimizationProfiles() const noexcept
Get the number of optimization profiles defined for this engine.
Definition: NvInferRuntime.h:1693

nvinfer1::ICudaEngine::getNbLayers
int32_t getNbLayers() const noexcept
Get the number of layers in the network.
Definition: NvInferRuntime.h:1512

nvinfer1::ICudaEngine::getBindingFormatDesc
const char * getBindingFormatDesc(int32_t bindingIndex) const noexcept
Return the human readable description of the tensor format.
Definition: NvInferRuntime.h:1655

nvinfer1::ICudaEngine::bindingIsInput
bool bindingIsInput(int32_t bindingIndex) const noexcept
Determine whether a binding is an input binding.
Definition: NvInferRuntime.h:1448

nvinfer1::ICudaEngine::isExecutionBinding
bool isExecutionBinding(int32_t bindingIndex) const noexcept
True if pointer to tensor data is required for execution phase, false if nullptr can be supplied.
Definition: NvInferRuntime.h:1797

nvinfer1::ICudaEngine::isRefittable
bool isRefittable() const noexcept
Return true if an engine can be refit.
Definition: NvInferRuntime.h:1598

nvinfer1::IDimensionExpr
Definition: NvInferRuntime.h:281

nvinfer1::IDimensionExpr::isConstant
bool isConstant() const noexcept
Return true if expression is a build-time constant.
Definition: NvInferRuntime.h:284

nvinfer1::IDimensionExpr::~IDimensionExpr
virtual ~IDimensionExpr() noexcept=default

nvinfer1::IDimensionExpr::mImpl
apiv::VDimensionExpr * mImpl
Definition: NvInferRuntime.h:297

nvinfer1::IDimensionExpr::getConstantValue
int32_t getConstantValue() const noexcept
Definition: NvInferRuntime.h:291

nvinfer1::IEngineInspector
An engine inspector which prints out the layer information of an engine or an execution context.
Definition: NvInferRuntime.h:2518

nvinfer1::IEngineInspector::getErrorRecorder
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:2630

nvinfer1::IEngineInspector::setErrorRecorder
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:2615

nvinfer1::IEngineInspector::getEngineInformation
AsciiChar const * getEngineInformation(LayerInformationFormat format) const noexcept
Get a string describing the information about all the layers in the current engine or the execution c...
Definition: NvInferRuntime.h:2596

nvinfer1::IEngineInspector::getExecutionContext
IExecutionContext const * getExecutionContext() const noexcept
Get the context currently being inspected.
Definition: NvInferRuntime.h:2546

nvinfer1::IEngineInspector::mImpl
apiv::VEngineInspector * mImpl
Definition: NvInferRuntime.h:2636

nvinfer1::IEngineInspector::~IEngineInspector
virtual ~IEngineInspector() noexcept=default

nvinfer1::IEngineInspector::getLayerInformation
AsciiChar const * getLayerInformation(int32_t layerIndex, LayerInformationFormat format) const noexcept
Get a string describing the information about a specific layer in the current engine or the execution...
Definition: NvInferRuntime.h:2571

nvinfer1::IErrorRecorder
Reference counted application-implemented error reporting interface for TensorRT objects.
Definition: NvInferRuntimeCommon.h:1699

nvinfer1::IExecutionContext
Context for executing inference using an engine, with functionally unsafe features.
Definition: NvInferRuntime.h:1914

nvinfer1::IExecutionContext::getErrorRecorder
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:2326

nvinfer1::IExecutionContext::reportToProfiler
bool reportToProfiler() const noexcept
Calculate layer timing info for the current optimization profile in IExecutionContext and update the ...
Definition: NvInferRuntime.h:2472

nvinfer1::IExecutionContext::~IExecutionContext
virtual ~IExecutionContext() noexcept=default

nvinfer1::IExecutionContext::setDeviceMemory
void setDeviceMemory(void *memory) noexcept
Set the device memory for use by this execution context.
Definition: NvInferRuntime.h:2067

nvinfer1::IExecutionContext::getBindingDimensions
Dims getBindingDimensions(int32_t bindingIndex) const noexcept
Get the dynamic dimensions of a binding.
Definition: NvInferRuntime.h:2210

nvinfer1::IExecutionContext::getShapeBinding
bool getShapeBinding(int32_t bindingIndex, int32_t *data) const noexcept
Get values of an input tensor required for shape calculations or an output tensor produced by shape c...
Definition: NvInferRuntime.h:2262

nvinfer1::IExecutionContext::setDebugSync
void setDebugSync(bool sync) noexcept
Set the debug sync flag.
Definition: NvInferRuntime.h:1977

nvinfer1::IExecutionContext::enqueueV2
bool enqueueV2(void *const *bindings, cudaStream_t stream, cudaEvent_t *inputConsumed) noexcept
Asynchronously execute inference.
Definition: NvInferRuntime.h:2371

nvinfer1::IExecutionContext::setEnqueueEmitsProfile
void setEnqueueEmitsProfile(bool enqueueEmitsProfile) noexcept
Set whether enqueue emits layer timing to the profiler.
Definition: NvInferRuntime.h:2434

nvinfer1::IExecutionContext::setBindingDimensions
bool setBindingDimensions(int32_t bindingIndex, Dims dimensions) noexcept
Set the dynamic dimensions of a binding.
Definition: NvInferRuntime.h:2180

nvinfer1::IExecutionContext::setInputShapeBinding
bool setInputShapeBinding(int32_t bindingIndex, int32_t const *data) noexcept
Set values of input tensor required by shape calculations.
Definition: NvInferRuntime.h:2240

nvinfer1::IExecutionContext::executeV2
bool executeV2(void *const *bindings) noexcept
Synchronously execute inference on a network.
Definition: NvInferRuntime.h:2343

nvinfer1::IExecutionContext::getEnqueueEmitsProfile
bool getEnqueueEmitsProfile() const noexcept
Get the enqueueEmitsProfile state.
Definition: NvInferRuntime.h:2445

nvinfer1::IExecutionContext::setOptimizationProfileAsync
bool setOptimizationProfileAsync(int32_t profileIndex, cudaStream_t stream) noexcept
Select an optimization profile for the current context with async semantics.
Definition: NvInferRuntime.h:2419

nvinfer1::IExecutionContext::mImpl
apiv::VExecutionContext * mImpl
Definition: NvInferRuntime.h:2478

nvinfer1::IExecutionContext::getOptimizationProfile
int32_t getOptimizationProfile() const noexcept
Get the index of the currently selected optimization profile.
Definition: NvInferRuntime.h:2143

nvinfer1::IExecutionContext::enqueue
bool enqueue(int32_t batchSize, void *const *bindings, cudaStream_t stream, cudaEvent_t *inputConsumed) noexcept
Asynchronously execute inference on a batch.
Definition: NvInferRuntime.h:1964

nvinfer1::IExecutionContext::destroy
TRT_DEPRECATED void destroy() noexcept
Destroy this object.
Definition: NvInferRuntime.h:2029

nvinfer1::IExecutionContext::getDebugSync
bool getDebugSync() const noexcept
Get the debug sync flag.
Definition: NvInferRuntime.h:1987

nvinfer1::IExecutionContext::getName
const char * getName() const noexcept
Return the name of the execution context.
Definition: NvInferRuntime.h:2051

nvinfer1::IExecutionContext::getStrides
Dims getStrides(int32_t bindingIndex) const noexcept
Return the strides of the buffer for the given binding.
Definition: NvInferRuntime.h:2088

nvinfer1::IExecutionContext::getProfiler
IProfiler * getProfiler() const noexcept
Get the profiler.
Definition: NvInferRuntime.h:2007

nvinfer1::IExecutionContext::setErrorRecorder
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:2311

nvinfer1::IExecutionContext::setOptimizationProfile
TRT_DEPRECATED bool setOptimizationProfile(int32_t profileIndex) noexcept
Select an optimization profile for the current context.
Definition: NvInferRuntime.h:2131

nvinfer1::IExecutionContext::allInputDimensionsSpecified
bool allInputDimensionsSpecified() const noexcept
Whether all dynamic dimensions of input tensors have been specified.
Definition: NvInferRuntime.h:2277

nvinfer1::IExecutionContext::getEngine
const ICudaEngine & getEngine() const noexcept
Get the associated engine.
Definition: NvInferRuntime.h:2017

nvinfer1::IExecutionContext::setProfiler
void setProfiler(IProfiler *profiler) noexcept
Set the profiler.
Definition: NvInferRuntime.h:1997

nvinfer1::IExecutionContext::allInputShapesSpecified
bool allInputShapesSpecified() const noexcept
Whether all input shape bindings have been specified.
Definition: NvInferRuntime.h:2291

nvinfer1::IExecutionContext::setName
void setName(const char *name) noexcept
Set the name of the execution context.
Definition: NvInferRuntime.h:2041

nvinfer1::IExprBuilder
Definition: NvInferRuntime.h:319

nvinfer1::IExprBuilder::constant
const IDimensionExpr * constant(int32_t value) noexcept
Return a pointer to the IDimensionExpr for the given value.
Definition: NvInferRuntime.h:322

nvinfer1::IExprBuilder::~IExprBuilder
virtual ~IExprBuilder() noexcept=default

nvinfer1::IExprBuilder::mImpl
apiv::VExprBuilder * mImpl
Definition: NvInferRuntime.h:336

nvinfer1::IExprBuilder::operation
const IDimensionExpr * operation(DimensionOperation op, const IDimensionExpr &first, const IDimensionExpr &second) noexcept
Definition: NvInferRuntime.h:329

nvinfer1::IGpuAllocator
Application-implemented class for controlling allocation on the GPU.
Definition: NvInferRuntimeCommon.h:1372

nvinfer1::IHostMemory
Class to handle library allocated memory that is accessible to the user.
Definition: NvInferRuntime.h:181

nvinfer1::IHostMemory::data
void * data() const noexcept
A pointer to the raw data that is owned by the library.
Definition: NvInferRuntime.h:186

nvinfer1::IHostMemory::type
DataType type() const noexcept
The type of the memory that was allocated.
Definition: NvInferRuntime.h:198

nvinfer1::IHostMemory::destroy
TRT_DEPRECATED void destroy() noexcept
Definition: NvInferRuntime.h:209

nvinfer1::IHostMemory::size
std::size_t size() const noexcept
The size in bytes of the data that was allocated.
Definition: NvInferRuntime.h:192

nvinfer1::IHostMemory::mImpl
apiv::VHostMemory * mImpl
Definition: NvInferRuntime.h:215

nvinfer1::IHostMemory::~IHostMemory
virtual ~IHostMemory() noexcept=default

nvinfer1::ILogger
Application-implemented logging interface for the builder, refitter and runtime.
Definition: NvInferRuntimeCommon.h:1510

nvinfer1::INoCopy
Forward declaration of IEngineInspector for use by other interfaces.
Definition: NvInferRuntime.h:80

nvinfer1::INoCopy::operator=
INoCopy & operator=(INoCopy &&other)=delete

nvinfer1::INoCopy::operator=
INoCopy & operator=(const INoCopy &other)=delete

nvinfer1::INoCopy::INoCopy
INoCopy(INoCopy &&other)=delete

nvinfer1::INoCopy::INoCopy
INoCopy()=default

nvinfer1::INoCopy::~INoCopy
virtual ~INoCopy()=default

nvinfer1::INoCopy::INoCopy
INoCopy(const INoCopy &other)=delete

nvinfer1::IOptimizationProfile
Optimization profile for dynamic input dimensions and shape tensors.
Definition: NvInferRuntime.h:1160

nvinfer1::IOptimizationProfile::mImpl
apiv::VOptimizationProfile * mImpl
Definition: NvInferRuntime.h:1310

nvinfer1::IOptimizationProfile::setDimensions
bool setDimensions(const char *inputName, OptProfileSelector select, Dims dims) noexcept
Set the minimum / optimum / maximum dimensions for a dynamic input tensor.
Definition: NvInferRuntime.h:1187

nvinfer1::IOptimizationProfile::getNbShapeValues
int32_t getNbShapeValues(const char *inputName) const noexcept
Get the number of values for an input shape tensor.
Definition: NvInferRuntime.h:1252

nvinfer1::IOptimizationProfile::~IOptimizationProfile
virtual ~IOptimizationProfile() noexcept=default

nvinfer1::IOptimizationProfile::getExtraMemoryTarget
float getExtraMemoryTarget() const noexcept
Get the extra memory target that has been defined for this profile.
Definition: NvInferRuntime.h:1288

nvinfer1::IOptimizationProfile::getDimensions
Dims getDimensions(const char *inputName, OptProfileSelector select) const noexcept
Get the minimum / optimum / maximum dimensions for a dynamic input tensor.
Definition: NvInferRuntime.h:1197

nvinfer1::IOptimizationProfile::setExtraMemoryTarget
bool setExtraMemoryTarget(float target) noexcept
Set a target for extra GPU memory that may be used by this profile.
Definition: NvInferRuntime.h:1280

nvinfer1::IOptimizationProfile::getShapeValues
int32_t const * getShapeValues(const char *inputName, OptProfileSelector select) const noexcept
Get the minimum / optimum / maximum values for an input shape tensor.
Definition: NvInferRuntime.h:1262

nvinfer1::IOptimizationProfile::setShapeValues
bool setShapeValues(const char *inputName, OptProfileSelector select, const int32_t *values, int32_t nbValues) noexcept
Set the minimum / optimum / maximum values for an input shape tensor.
Definition: NvInferRuntime.h:1240

nvinfer1::IOptimizationProfile::isValid
bool isValid() const noexcept
Check whether the optimization profile can be passed to an IBuilderConfig object.
Definition: NvInferRuntime.h:1304

nvinfer1::IPluginRegistry
Single registration point for all plugins in an application. It is used to find plugin implementation...
Definition: NvInferRuntimeCommon.h:1244

nvinfer1::IPluginRegistry::registerCreator
virtual bool registerCreator(IPluginCreator &creator, AsciiChar const *const pluginNamespace) noexcept=0
Register a plugin creator. Returns false if one with same type is already registered.

nvinfer1::IPluginV2DynamicExt
Definition: NvInferRuntime.h:388

nvinfer1::IPluginV2DynamicExt::clone
IPluginV2DynamicExt * clone() const noexcept override=0
Clone the plugin object. This copies over internal plugin parameters as well and returns a new plugin...

nvinfer1::IPluginV2DynamicExt::~IPluginV2DynamicExt
virtual ~IPluginV2DynamicExt() noexcept
Definition: NvInferRuntime.h:545

nvinfer1::IPluginV2Ext
Plugin class for user-implemented layers.
Definition: NvInferRuntimeCommon.h:714

nvinfer1::IProfiler
Application-implemented interface for profiling.
Definition: NvInferRuntime.h:597

nvinfer1::IProfiler::reportLayerTime
virtual void reportLayerTime(const char *layerName, float ms) noexcept=0
Layer time reporting callback.

nvinfer1::IProfiler::~IProfiler
virtual ~IProfiler() noexcept
Definition: NvInferRuntime.h:607

nvinfer1::IRefitter
Updates weights in an engine.
Definition: NvInferRuntime.h:840

nvinfer1::IRefitter::getMaxThreads
int32_t getMaxThreads() const noexcept
Get the maximum number of threads that can be used by the refitter.
Definition: NvInferRuntime.h:1100

nvinfer1::IRefitter::getDynamicRangeMin
float getDynamicRangeMin(const char *tensorName) const noexcept
Get minimum of dynamic range.
Definition: NvInferRuntime.h:946

nvinfer1::IRefitter::setDynamicRange
bool setDynamicRange(const char *tensorName, float min, float max) noexcept
Definition: NvInferRuntime.h:934

nvinfer1::IRefitter::getLogger
ILogger * getLogger() const noexcept
Get the logger with which the refitter was created.
Definition: NvInferRuntime.h:1072

nvinfer1::IRefitter::refitCudaEngine
bool refitCudaEngine() noexcept
Updates associated engine. Return true if successful.
Definition: NvInferRuntime.h:869

nvinfer1::IRefitter::getMissing
int32_t getMissing(int32_t size, const char **layerNames, WeightsRole *roles) noexcept
Get description of missing weights.
Definition: NvInferRuntime.h:890

nvinfer1::IRefitter::getTensorsWithDynamicRange
int32_t getTensorsWithDynamicRange(int32_t size, const char **tensorNames) const noexcept
Get names of all tensors that have refittable dynamic ranges.
Definition: NvInferRuntime.h:974

nvinfer1::IRefitter::destroy
TRT_DEPRECATED void destroy() noexcept
Definition: NvInferRuntime.h:917

nvinfer1::IRefitter::setMaxThreads
bool setMaxThreads(int32_t maxThreads) noexcept
Set the maximum number of threads.
Definition: NvInferRuntime.h:1086

nvinfer1::IRefitter::getAll
int32_t getAll(int32_t size, const char **layerNames, WeightsRole *roles) noexcept
Get description of all weights that could be refit.
Definition: NvInferRuntime.h:907

nvinfer1::IRefitter::getMissingWeights
int32_t getMissingWeights(int32_t size, const char **weightsNames) noexcept
Get names of missing weights.
Definition: NvInferRuntime.h:1046

nvinfer1::IRefitter::setNamedWeights
bool setNamedWeights(const char *name, Weights weights) noexcept
Specify new weights of given name.
Definition: NvInferRuntime.h:1026

nvinfer1::IRefitter::mImpl
apiv::VRefitter * mImpl
Definition: NvInferRuntime.h:1106

nvinfer1::IRefitter::~IRefitter
virtual ~IRefitter() noexcept=default

nvinfer1::IRefitter::getDynamicRangeMax
float getDynamicRangeMax(const char *tensorName) const noexcept
Get maximum of dynamic range.
Definition: NvInferRuntime.h:958

nvinfer1::IRefitter::setErrorRecorder
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:993

nvinfer1::IRefitter::getAllWeights
int32_t getAllWeights(int32_t size, const char **weightsNames) noexcept
Get names of all weights that could be refit.
Definition: NvInferRuntime.h:1062

nvinfer1::IRefitter::getErrorRecorder
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:1008

nvinfer1::IRuntime
Allows a serialized functionally unsafe engine to be deserialized.
Definition: NvInferRuntime.h:659

nvinfer1::IRuntime::setMaxThreads
bool setMaxThreads(int32_t maxThreads) noexcept
Set the maximum number of threads.
Definition: NvInferRuntime.h:809

nvinfer1::IRuntime::~IRuntime
virtual ~IRuntime() noexcept=default

nvinfer1::IRuntime::deserializeCudaEngine
ICudaEngine * deserializeCudaEngine(const void *blob, std::size_t size) noexcept
Deserialize an engine from a stream.
Definition: NvInferRuntime.h:785

nvinfer1::IRuntime::destroy
TRT_DEPRECATED void destroy() noexcept
Destroy this object.
Definition: NvInferRuntime.h:722

nvinfer1::IRuntime::mImpl
apiv::VRuntime * mImpl
Definition: NvInferRuntime.h:829

nvinfer1::IRuntime::setDLACore
void setDLACore(int32_t dlaCore) noexcept
Set the DLA core that the deserialized engine must execute on.
Definition: NvInferRuntime.h:691

nvinfer1::IRuntime::getNbDLACores
int32_t getNbDLACores() const noexcept
Returns number of DLA hardware cores accessible.
Definition: NvInferRuntime.h:710

nvinfer1::IRuntime::getDLACore
int32_t getDLACore() const noexcept
Get the DLA core that the engine executes on.
Definition: NvInferRuntime.h:702

nvinfer1::IRuntime::setGpuAllocator
void setGpuAllocator(IGpuAllocator *allocator) noexcept
Set the GPU allocator.
Definition: NvInferRuntime.h:736

nvinfer1::IRuntime::getErrorRecorder
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:770

nvinfer1::IRuntime::getLogger
ILogger * getLogger() const noexcept
Get the logger with which the runtime was created.
Definition: NvInferRuntime.h:795

nvinfer1::IRuntime::getMaxThreads
int32_t getMaxThreads() const noexcept
Get the maximum number of threads that can be used by the runtime.
Definition: NvInferRuntime.h:823

nvinfer1::IRuntime::setErrorRecorder
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:755

nvinfer1::PluginRegistrar
Register the plugin creator to the registry. The static registry object will be instantiated when the ...
Definition: NvInferRuntime.h:2705

nvinfer1::PluginRegistrar::PluginRegistrar
PluginRegistrar()
Definition: NvInferRuntime.h:2707

nvinfer1::Weights
An array of weights used as a layer parameter.
Definition: NvInferRuntime.h:163

nvinfer1::Weights::type
DataType type
The type of the weights.
Definition: NvInferRuntime.h:165

nvinfer1::Weights::count
int64_t count
The number of weights in the array.
Definition: NvInferRuntime.h:167

nvinfer1::Weights::values
const void * values
The weight values, in a contiguous array.
Definition: NvInferRuntime.h:166

nvinfer1::safe::createInferRuntime
IRuntime * createInferRuntime(ILogger &logger) noexcept
Create an instance of a safe::IRuntime class.

nvinfer1
The TensorRT API version 1 namespace.

nvinfer1::TacticSources
uint32_t TacticSources
Represents a collection of one or more TacticSource values combined using bitwise-OR operations.
Definition: NvInferRuntime.h:1341

nvinfer1::EngineCapability
EngineCapability
List of supported engine capability flows.
Definition: NvInferRuntime.h:106

nvinfer1::EngineCapability::kDEFAULT
@ kDEFAULT

nvinfer1::EngineCapability::kSAFETY
@ kSAFETY

nvinfer1::EngineCapability::kSTANDARD
@ kSTANDARD

nvinfer1::EngineCapability::kSAFE_DLA
@ kSAFE_DLA

nvinfer1::EngineCapability::kDLA_STANDALONE
@ kDLA_STANDALONE

nvinfer1::EngineCapability::kSAFE_GPU
@ kSAFE_GPU

nvinfer1::DimensionOperation
DimensionOperation
An operation on two IDimensionExpr, which represent integer expressions used in dimension computation...
Definition: NvInferRuntime.h:229

nvinfer1::DimensionOperation::kSUB
@ kSUB
Subtract the second element from the first.

nvinfer1::DimensionOperation::kSUM
@ kSUM
Sum of the two operands.

nvinfer1::DimensionOperation::kPROD
@ kPROD
Product of the two operands.

nvinfer1::DimensionOperation::kFLOOR_DIV
@ kFLOOR_DIV
Floor division of the first element by the second.

nvinfer1::DimensionOperation::kEQUAL
@ kEQUAL
1 if operands are equal, 0 otherwise.

nvinfer1::DimensionOperation::kMIN
@ kMIN
Minimum of the two operands.

nvinfer1::DimensionOperation::kLESS
@ kLESS
1 if first operand is less than second operand, 0 otherwise.

nvinfer1::DimensionOperation::kMAX
@ kMAX
Maximum of the two operands.

nvinfer1::DimensionOperation::kCEIL_DIV
@ kCEIL_DIV
Division rounding up.

nvinfer1::EnumMax< WeightsRole >
constexpr int32_t EnumMax< WeightsRole >() noexcept
Maximum number of elements in WeightsRole enum.
Definition: NvInferRuntime.h:628

nvinfer1::AsciiChar
char_t AsciiChar
AsciiChar is the type used by TensorRT to represent valid ASCII characters.
Definition: NvInferRuntimeCommon.h:125

nvinfer1::PluginVersion::kV2_DYNAMICEXT
@ kV2_DYNAMICEXT
IPluginV2DynamicExt.

nvinfer1::EnumMax< LayerInformationFormat >
constexpr int32_t EnumMax< LayerInformationFormat >() noexcept
Definition: NvInferRuntime.h:2497

nvinfer1::DataType
DataType
The type of weights and tensors.
Definition: NvInferRuntimeCommon.h:151

nvinfer1::DeviceType
DeviceType
The device that this layer/network will execute on.
Definition: NvInferRuntime.h:639

nvinfer1::DeviceType::kGPU
@ kGPU
GPU Device.

nvinfer1::DeviceType::kDLA
@ kDLA
DLA Core.

nvinfer1::LayerType::kSCALE
@ kSCALE
Scale layer.

nvinfer1::LayerType::kCONSTANT
@ kCONSTANT
Constant layer.

nvinfer1::GatherMode::kDEFAULT
@ kDEFAULT
Similar to ONNX Gather.

nvinfer1::EnumMax< OptProfileSelector >
constexpr int32_t EnumMax< OptProfileSelector >() noexcept
Number of different values of OptProfileSelector enum.
Definition: NvInferRuntime.h:1132

nvinfer1::WeightsRole
WeightsRole
How a layer uses particular Weights.
Definition: NvInferRuntime.h:617

nvinfer1::WeightsRole::kSHIFT
@ kSHIFT
shift part of IScaleLayer

nvinfer1::WeightsRole::kANY
@ kANY
Any other weights role.

nvinfer1::WeightsRole::kBIAS
@ kBIAS
bias for IConvolutionLayer, IDeconvolutionLayer, or IFullyConnectedLayer

nvinfer1::WeightsRole::kKERNEL
@ kKERNEL
kernel for IConvolutionLayer, IDeconvolutionLayer, or IFullyConnectedLayer

nvinfer1::EnumMax< ProfilingVerbosity >
constexpr int32_t EnumMax< ProfilingVerbosity >() noexcept
Maximum number of profile verbosity levels in ProfilingVerbosity enum.
Definition: NvInferRuntime.h:1366

nvinfer1::ProfilingVerbosity
ProfilingVerbosity
List of verbosity levels of layer information exposed in NVTX annotations and in IEngineInspector.
Definition: NvInferRuntime.h:1353

nvinfer1::ProfilingVerbosity::kLAYER_NAMES_ONLY
@ kLAYER_NAMES_ONLY
Print only the layer names. This is the default setting.

nvinfer1::ProfilingVerbosity::kDETAILED
@ kDETAILED
Print detailed layer information including layer names and layer parameters.

nvinfer1::ProfilingVerbosity::kVERBOSE
@ kVERBOSE

nvinfer1::TacticSource
TacticSource
List of tactic sources for TensorRT.
Definition: NvInferRuntime.h:1322

nvinfer1::TacticSource::kCUBLAS_LT
@ kCUBLAS_LT
cuBLAS LT tactics

nvinfer1::TacticSource::kCUDNN
@ kCUDNN
cuDNN tactics

nvinfer1::TacticSource::kCUBLAS
@ kCUBLAS
cuBLAS tactics.

nvinfer1::PluginFormat
TensorFormat PluginFormat
PluginFormat is reserved for backward compatibility.
Definition: NvInferRuntimeCommon.h:345

nvinfer1::ElementWiseOperation::kMIN
@ kMIN
Minimum of the two elements.

nvinfer1::TensorFormat
TensorFormat
Format of the input/output tensors.
Definition: NvInferRuntimeCommon.h:221

nvinfer1::EnumMax< TacticSource >
constexpr int32_t EnumMax< TacticSource >() noexcept
Maximum number of tactic sources in TacticSource enum.
Definition: NvInferRuntime.h:1330

nvinfer1::LayerInformationFormat
LayerInformationFormat
The format in which the IEngineInspector prints the layer information.
Definition: NvInferRuntime.h:2489

nvinfer1::LayerInformationFormat::kJSON
@ kJSON
Print layer information in JSON format.

nvinfer1::LayerInformationFormat::kONELINE
@ kONELINE
Print layer information in one line per layer.

nvinfer1::MatrixOperation::kNONE
@ kNONE

nvinfer1::PoolingType::kMAX
@ kMAX

nvinfer1::EnumMax< DeviceType >
constexpr int32_t EnumMax< DeviceType >() noexcept
Maximum number of elements in DeviceType enum.
Definition: NvInferRuntime.h:646

nvinfer1::EnumMax< DimensionOperation >
constexpr int32_t EnumMax< DimensionOperation >() noexcept
Maximum number of elements in DimensionOperation enum.
Definition: NvInferRuntime.h:243

nvinfer1::TensorLocation
TensorLocation
The location for tensor data storage, device or host.
Definition: NvInferRuntime.h:253

nvinfer1::TensorLocation::kHOST
@ kHOST
Data stored on host.

nvinfer1::TensorLocation::kDEVICE
@ kDEVICE
Data stored on device.

nvinfer1::OptProfileSelector
OptProfileSelector
When setting or querying optimization profile parameters (such as shape tensor inputs or dynamic dime...
Definition: NvInferRuntime.h:1120

nvinfer1::OptProfileSelector::kOPT
@ kOPT
This is used to set or get the value that is used in the optimization (kernel selection).

nvinfer1::DynamicPluginTensorDesc
Definition: NvInferRuntime.h:358

nvinfer1::DynamicPluginTensorDesc::min
Dims min
Lower bounds on tensor’s dimensions.
Definition: NvInferRuntime.h:363

nvinfer1::DynamicPluginTensorDesc::max
Dims max
Upper bounds on tensor’s dimensions.
Definition: NvInferRuntime.h:366

nvinfer1::DynamicPluginTensorDesc::desc
PluginTensorDesc desc
Information required to interpret a pointer to tensor data, except that desc.dims has -1 in place of ...
Definition: NvInferRuntime.h:360

nvinfer1::PluginTensorDesc
Fields that a plugin might see for an input or output.
Definition: NvInferRuntimeCommon.h:370

nvinfer1::impl::EnumMaxImpl
Declaration of EnumMaxImpl struct to store maximum number of elements in an enumeration type.
Definition: NvInferRuntimeCommon.h:136