// Extracted from: _static/c-api/_nv_infer_runtime_8h_source.html

/*

 * SPDX-FileCopyrightText: Copyright (c) 1993-2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.

 * SPDX-License-Identifier: Apache-2.0

 *

 * Licensed under the Apache License, Version 2.0 (the "License");

 * you may not use this file except in compliance with the License.

 * You may obtain a copy of the License at

 *

 * http://www.apache.org/licenses/LICENSE-2.0

 *

 * Unless required by applicable law or agreed to in writing, software

 * distributed under the License is distributed on an "AS IS" BASIS,

 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

 * See the License for the specific language governing permissions and

 * limitations under the License.

 */


#ifndef NV_INFER_RUNTIME_H

#define NV_INFER_RUNTIME_H


#include "NvInferImpl.h"

#define NV_INFER_INTERNAL_INCLUDE 1

#include "NvInferPluginBase.h"

#undef NV_INFER_INTERNAL_INCLUDE

#include "NvInferRuntimeCommon.h"


namespace nvinfer1

{


// Forward declarations of types that this header only uses through pointers or references
// before (or without) their full definition.
// NOTE(review): IPluginFactory is not referenced in the visible part of this header — confirm it is still needed.
class IExecutionContext;

class ICudaEngine;

class IPluginFactory;

class IEngineInspector;


// Base class that forbids copying and moving of everything derived from it.
// All special members are protected, so INoCopy can only live as a base sub-object.
class INoCopy
{
protected:
    // Lifetime is controlled by derived classes only; the destructor is virtual.
    INoCopy() = default;
    virtual ~INoCopy() = default;

    // Construction from another instance is disabled, both by copy and by move.
    INoCopy(INoCopy const&) = delete;
    INoCopy(INoCopy&&) = delete;

    // Assignment from another instance is disabled, both by copy and by move.
    INoCopy& operator=(INoCopy const&) = delete;
    INoCopy& operator=(INoCopy&&) = delete;
};


// Engine capability selector. ICudaEngine::getEngineCapability() returns a value of this type.
// Every enumerator carries an explicit numeric value.
enum class EngineCapability : int32_t

{

    kSTANDARD = 0,


    kSAFETY = 1,


    kDLA_STANDALONE = 2,

};


namespace impl

{

// Number of EngineCapability enumerators (values 0..2 above); update it whenever the enum grows.
template <>

struct EnumMaxImpl<EngineCapability>

{

    static constexpr int32_t kVALUE = 3;

};

} // namespace impl


// Plain aggregate describing a block of weight values. IRefitter takes and returns it by value.
// It declares no constructor or destructor, so it does not manage the memory behind `values`.
class Weights

{

public:

    // Data type tag of the values.
    DataType type;

    // Read-only pointer to the values.
    void const* values;

    // presumably the number of values (elements, not bytes) — TODO confirm
    int64_t count;

};


// Handle to a host memory buffer. Every accessor forwards to the apiv::VHostMemory object behind mImpl.
// ICudaEngine::serialize() and serializeWithConfig() return a pointer to this type.
class IHostMemory : public INoCopy

{

public:

    virtual ~IHostMemory() noexcept = default;


    // Pointer reported by the implementation; it is non-const even though the accessor is const.
    void* data() const noexcept

    {

        return mImpl->data();

    }


    // Size reported by the implementation (presumably in bytes — TODO confirm).
    std::size_t size() const noexcept

    {

        return mImpl->size();

    }


    // Data type tag reported by the implementation.
    DataType type() const noexcept

    {

        return mImpl->type();

    }


protected:

    // Not initialized in this header; presumably set by the concrete implementation — verify.
    apiv::VHostMemory* mImpl;

};


// Operation selector passed as the first argument of IExprBuilder::operation(),
// which combines two IDimensionExpr operands.
enum class DimensionOperation : int32_t

{

    kSUM = 0,

    kPROD = 1,

    kMAX = 2,

    kMIN = 3,

    kSUB = 4,

    kEQUAL = 5,

    kLESS = 6,

    kFLOOR_DIV = 7,

    kCEIL_DIV = 8

};


// Number of DimensionOperation enumerators (values 0..8 above); update it whenever the enum grows.
template <>

constexpr inline int32_t EnumMax<DimensionOperation>() noexcept

{

    return 9;

}


// Device/host location tag. Used in this header by ICudaEngine::getTensorLocation(),
// IRefitter::setNamedWeights(name, weights, location), IRefitter::getWeightsLocation()
// and IDebugListener::processDebugTensor().
enum class TensorLocation : int32_t

{

    kDEVICE = 0,

    kHOST = 1,

};


namespace impl

{

// Number of TensorLocation enumerators (values 0..1 above).
template <>

struct EnumMaxImpl<TensorLocation>

{

    static constexpr int32_t kVALUE = 2;

};

} // namespace impl


// Opaque dimension expression. Instances are handed out as `IDimensionExpr const*` by IExprBuilder
// and stored in DimsExprs::d. All queries forward to the apiv::VDimensionExpr object behind mImpl.
class IDimensionExpr : public INoCopy

{

public:

    // Forwards to the implementation's isConstant().
    bool isConstant() const noexcept

    {

        return mImpl->isConstant();

    }


    // Forwards to the implementation's getConstantValue().
    // NOTE(review): the result for a non-constant expression cannot be determined from this header.
    int64_t getConstantValue() const noexcept

    {

        return mImpl->getConstantValue();

    }


protected:

    apiv::VDimensionExpr* mImpl;

    // Protected destructor: code outside the class hierarchy cannot delete an IDimensionExpr.
    virtual ~IDimensionExpr() noexcept = default;


public:

    // Forwards to the implementation's isSizeTensor().
    // See IExprBuilder::declareSizeTensor(), which also returns an IDimensionExpr.
    bool isSizeTensor() const noexcept

    {

        return mImpl->isSizeTensor();

    }

};


// Factory for IDimensionExpr objects. Plugins receive it by reference in
// IPluginV2DynamicExt::getOutputDimensions() and IPluginV3OneBuild::getOutputShapes().
// All calls forward to the apiv::VExprBuilder object behind mImpl.
class IExprBuilder : public INoCopy

{

public:

    // Returns the expression the implementation creates for the given constant value.
    IDimensionExpr const* constant(int64_t value) noexcept

    {

        return mImpl->constant(value);

    }


    // Returns the expression the implementation creates for `op` applied to `first` and `second`.
    IDimensionExpr const* operation(

        DimensionOperation op, IDimensionExpr const& first, IDimensionExpr const& second) noexcept

    {

        return mImpl->operation(op, first, second);

    }


protected:

    apiv::VExprBuilder* mImpl;

    // Protected destructor: code outside the class hierarchy cannot delete an IExprBuilder.
    virtual ~IExprBuilder() noexcept = default;


public:

    // Forwards outputIndex, opt and upper to the implementation's declareSizeTensor().
    // NOTE(review): unlike constant() and operation(), this wrapper is not declared noexcept — confirm this is intended.
    IDimensionExpr const* declareSizeTensor(int32_t outputIndex, IDimensionExpr const& opt, IDimensionExpr const& upper)

    {

        return mImpl->declareSizeTensor(outputIndex, opt, upper);

    }

};


// Symbolic counterpart of Dims: a fixed-capacity array of dimension expressions.
// The pointers are non-owning as far as this class is concerned (no destructor is declared).
class DimsExprs

{

public:

    // presumably the number of valid entries in d — TODO confirm
    int32_t nbDims;

    // Storage for up to Dims::MAX_DIMS expression pointers.
    IDimensionExpr const* d[Dims::MAX_DIMS];

};


// Tensor description handed to plugins at configuration time: a PluginTensorDesc plus three Dims values.
// presumably min/max/opt are the dimension bounds and optimum of an optimization profile
// (compare OptProfileSelector) — TODO confirm
struct DynamicPluginTensorDesc

{

    PluginTensorDesc desc;


    Dims min;


    Dims max;


    Dims opt;

};


// Deprecated plugin interface (whole class is marked TRT_DEPRECATED) layered on IPluginV2Ext.
// It adds DimsExprs/PluginTensorDesc based virtual functions and seals the corresponding
// Dims/DataType based base-class functions as private `final` stubs.
// The declaration order of the virtual functions determines the vtable layout; do not reorder them.
class TRT_DEPRECATED IPluginV2DynamicExt : public nvinfer1::IPluginV2Ext

{

public:

    // Covariant override: clone() returns the derived interface type.
    IPluginV2DynamicExt* clone() const noexcept override = 0;


    // Returns the symbolic dimensions of output `outputIndex`, built from the `nbInputs` input
    // descriptions with the help of `exprBuilder`.
    virtual DimsExprs getOutputDimensions(

        int32_t outputIndex, DimsExprs const* inputs, int32_t nbInputs, IExprBuilder& exprBuilder) noexcept = 0;


    // NOTE(review): not referenced in this header; presumably an upper bound on format combinations — confirm.
    static constexpr int32_t kFORMAT_COMBINATION_LIMIT = 100;


    // presumably inOut holds nbInputs + nbOutputs descriptors and pos indexes into it — TODO confirm
    virtual bool supportsFormatCombination(

        int32_t pos, PluginTensorDesc const* inOut, int32_t nbInputs, int32_t nbOutputs) noexcept = 0;


    // Replacement for the sealed Dims-based configurePlugin() below.
    virtual void configurePlugin(DynamicPluginTensorDesc const* in, int32_t nbInputs,

        DynamicPluginTensorDesc const* out, int32_t nbOutputs) noexcept = 0;


    // Replacement for the sealed getWorkspaceSize(int32_t) below.
    virtual size_t getWorkspaceSize(PluginTensorDesc const* inputs, int32_t nbInputs, PluginTensorDesc const* outputs,

        int32_t nbOutputs) const noexcept = 0;


    // Replacement for the sealed batch-size based enqueue() below.
    virtual int32_t enqueue(PluginTensorDesc const* inputDesc, PluginTensorDesc const* outputDesc,

        void const* const* inputs, void* const* outputs, void* workspace, cudaStream_t stream) noexcept = 0;


protected:

    // Packs the plugin kind into the top byte (PluginVersion::kV2_DYNAMICEXT << 24) and the
    // low 24 bits of NV_TENSORRT_VERSION into the rest. `<<` binds tighter than `|`.
    int32_t getTensorRTVersion() const noexcept override

    {

        return (static_cast<int32_t>(PluginVersion::kV2_DYNAMICEXT) << 24 | (NV_TENSORRT_VERSION & 0xFFFFFF));

    }


    virtual ~IPluginV2DynamicExt() noexcept {}


private:

    // Following are obsolete base class methods, and must not be implemented or used.
    // They are private and `final`, so derived plugins can neither call nor override them;
    // each one returns a fixed value.


    // No-op.
    void configurePlugin(Dims const*, int32_t, Dims const*, int32_t, DataType const*, DataType const*, bool const*,

        bool const*, PluginFormat, int32_t) noexcept override final

    {

    }


    // Always false.
    bool supportsFormat(DataType, PluginFormat) const noexcept override final

    {

        return false;

    }


    // Always a Dims whose first member is -1 and whose remaining members are value-initialized.
    Dims getOutputDimensions(int32_t, Dims const*, int32_t) noexcept override final

    {

        return Dims{-1, {}};

    }


    // Always false.
    TRT_DEPRECATED bool isOutputBroadcastAcrossBatch(int32_t, bool const*, int32_t) const noexcept override final

    {

        return false;

    }


    // Always true.
    TRT_DEPRECATED bool canBroadcastInputAcrossBatch(int32_t) const noexcept override final

    {

        return true;

    }


    // Always 0.
    size_t getWorkspaceSize(int32_t) const noexcept override final

    {

        return 0;

    }


    // Always 1 (presumably a non-zero error status — TODO confirm).
    int32_t enqueue(int32_t, void const* const*, void* const*, void*, cudaStream_t) noexcept override final

    {

        return 1;

    }

};


namespace v_1_0
{
// User-implemented reader interface, reported as "IStreamReader" version 1.0.
// IRuntime::deserializeCudaEngine(IStreamReader&) accepts it (that overload is marked TRT_DEPRECATED).
class IStreamReader : public IVersionedInterface
{
public:
    IStreamReader() = default;
    ~IStreamReader() override = default;

    // Name and version under which this interface identifies itself.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return {"IStreamReader", 1, 0};
    }

    // Implemented by the user. Receives a destination pointer and a byte count and returns an int64_t
    // (presumably the number of bytes actually read — TODO confirm). Not declared noexcept.
    virtual int64_t read(void* destination, int64_t nbBytes) = 0;

protected:
    // Copy and move are available to derived classes only; assignment is restricted to lvalues.
    IStreamReader(IStreamReader const&) = default;
    IStreamReader& operator=(IStreamReader const&) & = default;
    IStreamReader(IStreamReader&&) = default;
    IStreamReader& operator=(IStreamReader&&) & = default;
};
} // namespace v_1_0

using IStreamReader = v_1_0::IStreamReader;


// Reference point selector for IStreamReaderV2::seek(offset, where).
// presumably kSET/kCUR/kEND mirror SEEK_SET/SEEK_CUR/SEEK_END (start, current position, end) — TODO confirm
enum class SeekPosition : int32_t

{

    kSET = 0,


    kCUR = 1,


    kEND = 2,

};


namespace v_1_0
{
// User-implemented reader interface, reported as "IStreamReaderV2" version 1.0.
// IRuntime::deserializeCudaEngine(IStreamReaderV2&) accepts it.
class IStreamReaderV2 : public IVersionedInterface
{
public:
    IStreamReaderV2() = default;
    ~IStreamReaderV2() override = default;

    // Name and version under which this interface identifies itself.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return {"IStreamReaderV2", 1, 0};
    }

    // Implemented by the user. Receives a destination pointer, a byte count and a CUDA stream and
    // returns an int64_t (presumably the number of bytes read — TODO confirm).
    virtual int64_t read(void* destination, int64_t nbBytes, cudaStream_t stream) noexcept = 0;

    // Implemented by the user. Repositions the reader by `offset` relative to `where`;
    // the bool result presumably signals success — TODO confirm.
    virtual bool seek(int64_t offset, SeekPosition where) noexcept = 0;

protected:
    // Copy and move are available to derived classes only; assignment is restricted to lvalues.
    IStreamReaderV2(IStreamReaderV2 const&) = default;
    IStreamReaderV2& operator=(IStreamReaderV2 const&) & = default;
    IStreamReaderV2(IStreamReaderV2&&) = default;
    IStreamReaderV2& operator=(IStreamReaderV2&&) & = default;
};
} // namespace v_1_0

using IStreamReaderV2 = v_1_0::IStreamReaderV2;


// Read-only access to per-context resources for plugins.
// IPluginV3OneRuntime::attachToContext() receives a pointer to this interface.
class IPluginResourceContext
{
protected:
    // Construction, copy and move are available to derived classes only; assignment is restricted to lvalues.
    IPluginResourceContext() = default;
    IPluginResourceContext(IPluginResourceContext const&) = default;
    IPluginResourceContext& operator=(IPluginResourceContext const&) & = default;
    IPluginResourceContext(IPluginResourceContext&&) = default;
    IPluginResourceContext& operator=(IPluginResourceContext&&) & = default;

public:
    // The virtual functions below are kept in their original declaration order (vtable layout).

    // GPU allocator associated with this context.
    virtual IGpuAllocator* getGpuAllocator() const noexcept = 0;

    // Error recorder associated with this context.
    virtual IErrorRecorder* getErrorRecorder() const noexcept = 0;

    virtual ~IPluginResourceContext() noexcept = default;
};


namespace v_1_0

{

// Core capability of a V3 plugin, reported as "PLUGIN_V3ONE_CORE" version 1.0.
// It exposes the three strings that identify a plugin: name, version and namespace.
class IPluginV3OneCore : public IPluginCapability
{
public:
    // Name and version under which this capability identifies itself.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return {"PLUGIN_V3ONE_CORE", 1, 0};
    }

    // Implemented by the plugin: its name.
    virtual AsciiChar const* getPluginName() const noexcept = 0;

    // Implemented by the plugin: its version string.
    virtual AsciiChar const* getPluginVersion() const noexcept = 0;

    // Implemented by the plugin: its namespace string.
    virtual AsciiChar const* getPluginNamespace() const noexcept = 0;
};


// Build-time capability of a V3 plugin, reported as "PLUGIN_V3ONE_BUILD" version 1.0.
// Pure virtual functions must be implemented by the plugin; the others come with a default body.
// The virtual functions are declared in their original order so the vtable layout is unchanged.
// Parameters that a default body ignores have their names commented out (the same idiom as
// IGpuAllocator::reallocate in this header) so that including code built with
// -Wunused-parameter / -Werror stays warning-free.
class IPluginV3OneBuild : public IPluginCapability
{
public:
    // Value returned by the default getFormatCombinationLimit().
    static constexpr int32_t kDEFAULT_FORMAT_COMBINATION_LIMIT = 100;

    // Name and version under which this capability identifies itself.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return InterfaceInfo{"PLUGIN_V3ONE_BUILD", 1, 0};
    }

    // Implemented by the plugin. Receives nbInputs input and nbOutputs output descriptions.
    // The int32_t result is presumably a status code (0 = success) — TODO confirm.
    virtual int32_t configurePlugin(DynamicPluginTensorDesc const* in, int32_t nbInputs,
        DynamicPluginTensorDesc const* out, int32_t nbOutputs) noexcept = 0;

    // Implemented by the plugin. Writes nbOutputs entries to outputTypes given nbInputs inputTypes.
    virtual int32_t getOutputDataTypes(
        DataType* outputTypes, int32_t nbOutputs, const DataType* inputTypes, int32_t nbInputs) const noexcept = 0;

    // Implemented by the plugin. Writes nbOutputs symbolic shapes to `outputs`, using exprBuilder
    // to build expressions from the input and shape-input descriptions.
    virtual int32_t getOutputShapes(DimsExprs const* inputs, int32_t nbInputs, DimsExprs const* shapeInputs,
        int32_t nbShapeInputs, DimsExprs* outputs, int32_t nbOutputs, IExprBuilder& exprBuilder) noexcept = 0;

    // Implemented by the plugin.
    // presumably inOut holds nbInputs + nbOutputs descriptors and pos indexes into it — TODO confirm
    virtual bool supportsFormatCombination(
        int32_t pos, DynamicPluginTensorDesc const* inOut, int32_t nbInputs, int32_t nbOutputs) noexcept = 0;

    // Implemented by the plugin: number of outputs.
    virtual int32_t getNbOutputs() const noexcept = 0;

    // Default: 0, regardless of the arguments.
    virtual size_t getWorkspaceSize(DynamicPluginTensorDesc const* /*inputs*/, int32_t /*nbInputs*/,
        DynamicPluginTensorDesc const* /*outputs*/, int32_t /*nbOutputs*/) const noexcept
    {
        return 0;
    }

    // Default: returns 0 and leaves the `tactics` buffer untouched.
    virtual int32_t getValidTactics(int32_t* /*tactics*/, int32_t /*nbTactics*/) noexcept
    {
        return 0;
    }

    // Default: 0.
    virtual int32_t getNbTactics() noexcept
    {
        return 0;
    }

    // Default: nullptr.
    virtual char const* getTimingCacheID() noexcept
    {
        return nullptr;
    }

    // Default: kDEFAULT_FORMAT_COMBINATION_LIMIT.
    virtual int32_t getFormatCombinationLimit() noexcept
    {
        return kDEFAULT_FORMAT_COMBINATION_LIMIT;
    }

    // Default: nullptr.
    virtual char const* getMetadataString() noexcept
    {
        return nullptr;
    }
};


// Runtime capability of a V3 plugin, reported as "PLUGIN_V3ONE_RUNTIME" version 1.0.
// The virtual functions are declared in their original order so the vtable layout is unchanged.
class IPluginV3OneRuntime : public IPluginCapability
{
public:
    // Name and version under which this capability identifies itself.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return InterfaceInfo{"PLUGIN_V3ONE_RUNTIME", 1, 0};
    }

    // Default: returns 0 and ignores the tactic. The parameter name is commented out (the same
    // idiom as IGpuAllocator::reallocate in this header) to avoid -Wunused-parameter in including code.
    virtual int32_t setTactic(int32_t /*tactic*/) noexcept
    {
        return 0;
    }

    // Implemented by the plugin. Receives nbInputs input and nbOutputs output descriptions.
    // The int32_t result is presumably a status code (0 = success) — TODO confirm.
    virtual int32_t onShapeChange(
        PluginTensorDesc const* in, int32_t nbInputs, PluginTensorDesc const* out, int32_t nbOutputs) noexcept = 0;

    // Implemented by the plugin. Receives tensor descriptions, input/output pointer arrays,
    // a workspace pointer and the CUDA stream to use.
    virtual int32_t enqueue(PluginTensorDesc const* inputDesc, PluginTensorDesc const* outputDesc,
        void const* const* inputs, void* const* outputs, void* workspace, cudaStream_t stream) noexcept = 0;

    // Implemented by the plugin. Receives the resource context and returns an IPluginV3 pointer.
    virtual IPluginV3* attachToContext(IPluginResourceContext* context) noexcept = 0;

    // Implemented by the plugin: the collection of fields to serialize.
    virtual PluginFieldCollection const* getFieldsToSerialize() noexcept = 0;
};

} // namespace v_1_0


namespace v_2_0
{

// Version 2.0 of the "PLUGIN_V3ONE_BUILD" capability: everything from v_1_0::IPluginV3OneBuild
// plus getAliasedInput().
class IPluginV3OneBuild : public v_1_0::IPluginV3OneBuild
{
public:
    // Same interface name as v_1_0, with the major version raised to 2.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return InterfaceInfo{"PLUGIN_V3ONE_BUILD", 2, 0};
    }

    // Default: -1 for every output index (presumably "no input is aliased" — TODO confirm).
    // The parameter name is commented out (the same idiom as IGpuAllocator::reallocate in this
    // header) to avoid -Wunused-parameter in including code.
    virtual int32_t getAliasedInput(int32_t /*outputIndex*/) noexcept
    {
        return -1;
    }
};

} // namespace v_2_0


// Unversioned names for the plugin capability interfaces.
// Note that IPluginV3OneBuild refers to the v_1_0 class; the v_2_0 class is exposed as IPluginV3OneBuildV2.
using IPluginV3OneCore = v_1_0::IPluginV3OneCore;


using IPluginV3OneBuild = v_1_0::IPluginV3OneBuild;


using IPluginV3OneRuntime = v_1_0::IPluginV3OneRuntime;


using IPluginV3OneBuildV2 = v_2_0::IPluginV3OneBuild;


namespace v_1_0
{
// Callback interface implemented by the application.
// IExecutionContext::setProfiler() accepts a pointer to it.
class IProfiler
{
public:
    // Implemented by the application. Receives a layer name and a time value
    // (the parameter name suggests milliseconds — not verifiable from this header).
    virtual void reportLayerTime(char const* layerName, float ms) noexcept = 0;

    // Virtual, so implementations can be destroyed through an IProfiler pointer.
    virtual ~IProfiler() noexcept = default;
};
} // namespace v_1_0

using IProfiler = v_1_0::IProfiler;


// Role tag for a layer's weights. Used by IRefitter::setWeights(), getMissing() and getAll().
enum class WeightsRole : int32_t

{

    kKERNEL = 0,

    kBIAS = 1,

    kSHIFT = 2,

    kSCALE = 3,

    kCONSTANT = 4,

    kANY = 5,

};


// Number of WeightsRole enumerators (values 0..5 above); update it whenever the enum grows.
template <>

constexpr inline int32_t EnumMax<WeightsRole>() noexcept

{

    return 6;

}


// Device kind selector (GPU or DLA).
// NOTE(review): not referenced in the visible part of this header.
enum class DeviceType : int32_t

{

    kGPU = 0,

    kDLA = 1,

};


// Number of DeviceType enumerators (values 0..1 above).
template <>

constexpr inline int32_t EnumMax<DeviceType>() noexcept

{

    return 2;

}


// Individual temp-file control flags. See the TempfileControlFlags alias below and
// IRuntime::setTempfileControlFlags() / getTempfileControlFlags().
enum class TempfileControlFlag : int32_t

{

    kALLOW_IN_MEMORY_FILES = 0,


    kALLOW_TEMPORARY_FILES = 1,

};


// Number of TempfileControlFlag enumerators (values 0..1 above).
template <>

constexpr inline int32_t EnumMax<TempfileControlFlag>() noexcept

{

    return 2;

}


// Integer type that carries a set of flags.
// presumably bit i corresponds to the TempfileControlFlag with value i — TODO confirm
using TempfileControlFlags = uint32_t;


// Tensor memory format selector. ICudaEngine::getTensorFormat() returns a value of this type.
// Every enumerator carries an explicit numeric value.
enum class TensorFormat : int32_t

{

    kLINEAR = 0,


    kCHW2 = 1,


    kHWC8 = 2,


    kCHW4 = 3,


    kCHW16 = 4,


    kCHW32 = 5,


    kDHWC8 = 6,


    kCDHW32 = 7,


    kHWC = 8,


    kDLA_LINEAR = 9,


    kDLA_HWC4 = 10,


    kHWC16 = 11,


    kDHWC = 12

};


namespace impl

{

// Number of TensorFormat enumerators (values 0..12 above); update it whenever the enum grows.
template <>

struct EnumMaxImpl<TensorFormat>

{

    static constexpr int32_t kVALUE = 13;

};

} // namespace impl


// Individual allocator flags. See the AllocatorFlags alias below, which is the `flags`
// parameter type of IGpuAllocator::allocate() and allocateAsync().
enum class AllocatorFlag : int32_t

{

    kRESIZABLE = 0,

};


namespace impl

{

// Number of AllocatorFlag enumerators (only value 0 above).
template <>

struct EnumMaxImpl<AllocatorFlag>

{

    static constexpr int32_t kVALUE = 1;

};

} // namespace impl


// Integer type that carries a set of flags.
// presumably bit i corresponds to the AllocatorFlag with value i — TODO confirm
using AllocatorFlags = uint32_t;


// Logging sink implemented by the application.
// IRuntime::getLogger() and IRefitter::getLogger() return a pointer to this interface.
class ILogger
{
public:
    // Message severity, numbered 0..4 in the order listed.
    enum class Severity : int32_t
    {
        kINTERNAL_ERROR = 0,
        kERROR = 1,
        kWARNING = 2,
        kINFO = 3,
        kVERBOSE = 4,
    };

    ILogger() = default;

    // The two virtual functions below stay in their original order (log, then destructor)
    // so the vtable layout is unchanged.

    // Implemented by the application. Receives the severity and the message text.
    virtual void log(Severity severity, AsciiChar const* msg) noexcept = 0;

    virtual ~ILogger() = default;

protected:
    // Copy and move are available to derived classes only; assignment is restricted to lvalues.
    // @cond SuppressDoxyWarnings
    ILogger(ILogger const&) = default;
    ILogger& operator=(ILogger const&) & = default;
    ILogger(ILogger&&) = default;
    ILogger& operator=(ILogger&&) & = default;
    // @endcond
};


namespace impl

{

// Number of ILogger::Severity enumerators (values 0..4); update it whenever the enum grows.
template <>

struct EnumMaxImpl<ILogger::Severity>

{

    static constexpr int32_t kVALUE = 5;

};

} // namespace impl


namespace v_1_0

{


// User-implemented GPU memory allocator, reported as "IGpuAllocator" version 1.0.
// IRuntime::setGpuAllocator() accepts it and IPluginResourceContext::getGpuAllocator() returns it.
// The two deprecated pure virtual functions (allocate, deallocate) still have to be implemented,
// because the default async variants forward to them.
// The declaration order of the virtual functions determines the vtable layout; do not reorder them.
class IGpuAllocator : public IVersionedInterface

{

public:

    // Implemented by the user. Receives a size, an alignment and a set of AllocatorFlags;
    // returns the allocated pointer (presumably nullptr on failure — TODO confirm).
    TRT_DEPRECATED virtual void* allocate(

        uint64_t const size, uint64_t const alignment, AllocatorFlags const flags) noexcept = 0;


    ~IGpuAllocator() override = default;

    IGpuAllocator() = default;


    // Default: returns nullptr and ignores all arguments.
    virtual void* reallocate(void* const /*baseAddr*/, uint64_t /*alignment*/, uint64_t /*newSize*/) noexcept

    {

        return nullptr;

    }


    // Implemented by the user. Receives a pointer; the bool result presumably signals success — TODO confirm.
    TRT_DEPRECATED virtual bool deallocate(void* const memory) noexcept = 0;


    // Default: ignores the stream and forwards to allocate().
    virtual void* allocateAsync(

        uint64_t const size, uint64_t const alignment, AllocatorFlags const flags, cudaStream_t /*stream*/) noexcept

    {

        return allocate(size, alignment, flags);

    }

    // Default: ignores the stream and forwards to deallocate().
    virtual bool deallocateAsync(void* const memory, cudaStream_t /*stream*/) noexcept

    {

        return deallocate(memory);

    }


    // Name and version under which this interface identifies itself.
    InterfaceInfo getInterfaceInfo() const noexcept override

    {

        return {"IGpuAllocator", 1, 0};

    }


protected:

    // Copy and move are available to derived classes only; assignment is restricted to lvalues.
    // @cond SuppressDoxyWarnings

    IGpuAllocator(IGpuAllocator const&) = default;

    IGpuAllocator(IGpuAllocator&&) = default;

    IGpuAllocator& operator=(IGpuAllocator const&) & = default;

    IGpuAllocator& operator=(IGpuAllocator&&) & = default;

    // @endcond

};


} // namespace v_1_0


using IGpuAllocator = v_1_0::IGpuAllocator;


// Runtime object used to deserialize engines. Every member function is a thin inline wrapper that
// forwards to the apiv::VRuntime object behind mImpl. Several void wrappers are written as
// `return mImpl->f(...)`, which is equivalent to a plain call for a void function.
class IRuntime : public INoCopy

{

public:

    virtual ~IRuntime() noexcept = default;


    // --- DLA core selection ---

    void setDLACore(int32_t dlaCore) noexcept

    {

        mImpl->setDLACore(dlaCore);

    }


    int32_t getDLACore() const noexcept

    {

        return mImpl->getDLACore();

    }


    int32_t getNbDLACores() const noexcept

    {

        return mImpl->getNbDLACores();

    }


    // Hands a user-implemented IGpuAllocator to the implementation.
    // NOTE(review): ownership and lifetime requirements of the pointer are not visible here.
    void setGpuAllocator(IGpuAllocator* allocator) noexcept

    {

        mImpl->setGpuAllocator(allocator);

    }


    // --- Error recorder ---

    void setErrorRecorder(IErrorRecorder* recorder) noexcept

    {

        mImpl->setErrorRecorder(recorder);

    }


    IErrorRecorder* getErrorRecorder() const noexcept

    {

        return mImpl->getErrorRecorder();

    }


    // --- Engine deserialization (three overloads) ---

    // From a memory blob of `size` bytes.
    ICudaEngine* deserializeCudaEngine(void const* blob, std::size_t size) noexcept

    {

        return mImpl->deserializeCudaEngine(blob, size);

    }


    // From an IStreamReader. Deprecated, and not declared noexcept.
    TRT_DEPRECATED ICudaEngine* deserializeCudaEngine(IStreamReader& streamReader)

    {

        return mImpl->deserializeCudaEngine(streamReader);

    }


    // From an IStreamReaderV2; forwards to the implementation's deserializeCudaEngineV2().
    // Not declared noexcept.
    ICudaEngine* deserializeCudaEngine(IStreamReaderV2& streamReader)

    {

        return mImpl->deserializeCudaEngineV2(streamReader);

    }


    ILogger* getLogger() const noexcept

    {

        return mImpl->getLogger();

    }


    // --- Thread limit ---

    // The bool result is whatever the implementation returns (presumably success — TODO confirm).
    bool setMaxThreads(int32_t maxThreads) noexcept

    {

        return mImpl->setMaxThreads(maxThreads);

    }


    int32_t getMaxThreads() const noexcept

    {

        return mImpl->getMaxThreads();

    }


    // --- Temporary files ---

    void setTemporaryDirectory(char const* path) noexcept

    {

        return mImpl->setTemporaryDirectory(path);

    }


    char const* getTemporaryDirectory() const noexcept

    {

        return mImpl->getTemporaryDirectory();

    }


    void setTempfileControlFlags(TempfileControlFlags flags) noexcept

    {

        return mImpl->setTempfileControlFlags(flags);

    }


    TempfileControlFlags getTempfileControlFlags() const noexcept

    {

        return mImpl->getTempfileControlFlags();

    }


    // Returns the plugin registry by reference (never null by construction of the type).
    IPluginRegistry& getPluginRegistry() noexcept

    {

        return mImpl->getPluginRegistry();

    }


    // Returns another IRuntime obtained from the implementation for the given path.
    // NOTE(review): what the path must point to and who owns the result are not visible here.
    IRuntime* loadRuntime(char const* path) noexcept

    {

        return mImpl->loadRuntime(path);

    }


    // --- Engine host code permission ---

    void setEngineHostCodeAllowed(bool allowed) noexcept

    {

        return mImpl->setEngineHostCodeAllowed(allowed);

    }


    bool getEngineHostCodeAllowed() const noexcept

    {

        return mImpl->getEngineHostCodeAllowed();

    }


protected:

    // Not initialized in this header; presumably set by the concrete implementation — verify.
    apiv::VRuntime* mImpl;

};


// Object used to replace the weights of an engine. Every member function is a thin inline wrapper
// that forwards to the apiv::VRefitter object behind mImpl.
// The `int32_t f(int32_t size, char const** ...)` functions follow one calling pattern: the caller
// supplies output arrays with room for `size` entries
// (presumably the result is the total number of available entries — TODO confirm).
class IRefitter : public INoCopy

{

public:

    virtual ~IRefitter() noexcept = default;


    // --- Weights addressed by (layer name, role) ---

    bool setWeights(char const* layerName, WeightsRole role, Weights weights) noexcept

    {

        return mImpl->setWeights(layerName, role, weights);

    }


    // Applies the supplied weights; see refitCudaEngineAsync() for the stream-based variant.
    bool refitCudaEngine() noexcept

    {

        return mImpl->refitCudaEngine();

    }


    int32_t getMissing(int32_t size, char const** layerNames, WeightsRole* roles) noexcept

    {

        return mImpl->getMissing(size, layerNames, roles);

    }


    int32_t getAll(int32_t size, char const** layerNames, WeightsRole* roles) noexcept

    {

        return mImpl->getAll(size, layerNames, roles);

    }


    // --- Dynamic range (all four functions are deprecated) ---

    TRT_DEPRECATED bool setDynamicRange(char const* tensorName, float min, float max) noexcept

    {

        return mImpl->setDynamicRange(tensorName, min, max);

    }


    TRT_DEPRECATED float getDynamicRangeMin(char const* tensorName) const noexcept

    {

        return mImpl->getDynamicRangeMin(tensorName);

    }


    TRT_DEPRECATED float getDynamicRangeMax(char const* tensorName) const noexcept

    {

        return mImpl->getDynamicRangeMax(tensorName);

    }


    TRT_DEPRECATED int32_t getTensorsWithDynamicRange(int32_t size, char const** tensorNames) const noexcept

    {

        return mImpl->getTensorsWithDynamicRange(size, tensorNames);

    }


    // --- Error recorder ---

    void setErrorRecorder(IErrorRecorder* recorder) noexcept

    {

        mImpl->setErrorRecorder(recorder);

    }


    IErrorRecorder* getErrorRecorder() const noexcept

    {

        return mImpl->getErrorRecorder();

    }


    // --- Weights addressed by name ---

    bool setNamedWeights(char const* name, Weights weights) noexcept

    {

        return mImpl->setNamedWeights(name, weights);

    }


    int32_t getMissingWeights(int32_t size, char const** weightsNames) noexcept

    {

        return mImpl->getMissingWeights(size, weightsNames);

    }


    int32_t getAllWeights(int32_t size, char const** weightsNames) noexcept

    {

        return mImpl->getAllWeights(size, weightsNames);

    }


    ILogger* getLogger() const noexcept

    {

        return mImpl->getLogger();

    }


    // --- Thread limit ---

    bool setMaxThreads(int32_t maxThreads) noexcept

    {

        return mImpl->setMaxThreads(maxThreads);

    }


    int32_t getMaxThreads() const noexcept

    {

        return mImpl->getMaxThreads();

    }


    // Overload with an explicit TensorLocation; forwards to the implementation's
    // setNamedWeightsWithLocation().
    bool setNamedWeights(char const* name, Weights weights, TensorLocation location) noexcept

    {

        return mImpl->setNamedWeightsWithLocation(name, weights, location);

    }


    Weights getNamedWeights(char const* weightsName) const noexcept

    {

        return mImpl->getNamedWeights(weightsName);

    }


    TensorLocation getWeightsLocation(char const* weightsName) const noexcept

    {

        return mImpl->getWeightsLocation(weightsName);

    }


    bool unsetNamedWeights(char const* weightsName) noexcept

    {

        return mImpl->unsetNamedWeights(weightsName);

    }


    // --- Weights validation switch ---

    // `return` of a void call: equivalent to a plain call.
    void setWeightsValidation(bool weightsValidation) noexcept

    {

        return mImpl->setWeightsValidation(weightsValidation);

    }


    bool getWeightsValidation() const noexcept

    {

        return mImpl->getWeightsValidation();

    }


    // Stream-based variant of refitCudaEngine().
    // NOTE(review): completion/synchronization semantics are not visible in this header.
    bool refitCudaEngineAsync(cudaStream_t stream) noexcept

    {

        return mImpl->refitCudaEngineAsync(stream);

    }


    Weights getWeightsPrototype(char const* weightsName) const noexcept

    {

        return mImpl->getWeightsPrototype(weightsName);

    }


protected:

    // Not initialized in this header; presumably set by the concrete implementation — verify.
    apiv::VRefitter* mImpl;

};


// Selects which of the three values of an optimization profile entry is meant (min, opt or max).
// Used by IOptimizationProfile and by ICudaEngine::getProfileShape() / getProfileTensorValues().
enum class OptProfileSelector : int32_t

{

    kMIN = 0,

    kOPT = 1,

    kMAX = 2

};


// Number of OptProfileSelector enumerators (values 0..2 above).
template <>

constexpr inline int32_t EnumMax<OptProfileSelector>() noexcept

{

    return 3;

}


// Optimization profile: per-input dimensions and shape values for each OptProfileSelector.
// Every member function forwards to the apiv::VOptimizationProfile object behind mImpl.
// The destructor is protected, so code outside the class hierarchy cannot delete a profile.
class IOptimizationProfile : public INoCopy

{

public:

    // Stores `dims` for the given input name and selector; the bool result comes from the implementation.
    bool setDimensions(char const* inputName, OptProfileSelector select, Dims const& dims) noexcept

    {

        return mImpl->setDimensions(inputName, select, dims);

    }


    Dims getDimensions(char const* inputName, OptProfileSelector select) const noexcept

    {

        return mImpl->getDimensions(inputName, select);

    }


    // Stores `nbValues` int32_t values read from `values` for the given input name and selector.
    bool setShapeValues(

        char const* inputName, OptProfileSelector select, int32_t const* values, int32_t nbValues) noexcept

    {

        return mImpl->setShapeValues(inputName, select, values, nbValues);

    }


    int32_t getNbShapeValues(char const* inputName) const noexcept

    {

        return mImpl->getNbShapeValues(inputName);

    }


    // presumably points to getNbShapeValues(inputName) values, or is nullptr if none were set — TODO confirm
    int32_t const* getShapeValues(char const* inputName, OptProfileSelector select) const noexcept

    {

        return mImpl->getShapeValues(inputName, select);

    }


    // NOTE(review): valid range and meaning of `target` are not visible in this header.
    bool setExtraMemoryTarget(float target) noexcept

    {

        return mImpl->setExtraMemoryTarget(target);

    }


    float getExtraMemoryTarget() const noexcept

    {

        return mImpl->getExtraMemoryTarget();

    }


    bool isValid() const noexcept

    {

        return mImpl->isValid();

    }


protected:

    // Not initialized in this header; presumably set by the concrete implementation — verify.
    apiv::VOptimizationProfile* mImpl;

    virtual ~IOptimizationProfile() noexcept = default;

};


// Individual tactic sources. The first three enumerators are marked with TRT_DEPRECATED_ENUM.
// See the TacticSources alias below and ICudaEngine::getTacticSources().
enum class TacticSource : int32_t

{

    kCUBLAS TRT_DEPRECATED_ENUM = 0,


    kCUBLAS_LT TRT_DEPRECATED_ENUM = 1,


    kCUDNN TRT_DEPRECATED_ENUM = 2,


    kEDGE_MASK_CONVOLUTIONS = 3,


    kJIT_CONVOLUTIONS = 4,

};


// Number of TacticSource enumerators (values 0..4 above, deprecated ones included).
template <>

constexpr inline int32_t EnumMax<TacticSource>() noexcept

{

    return 5;

}


// Integer type that carries a set of tactic sources.
// presumably bit i corresponds to the TacticSource with value i — TODO confirm
using TacticSources = uint32_t;


// Profiling verbosity level. ICudaEngine::getProfilingVerbosity() returns a value of this type.
// Note that the numeric order is not an ordering by verbosity: kLAYER_NAMES_ONLY is 0 and kNONE is 1.
enum class ProfilingVerbosity : int32_t

{

    kLAYER_NAMES_ONLY = 0,

    kNONE = 1,

    kDETAILED = 2,

};


// Number of ProfilingVerbosity enumerators (values 0..2 above).
template <>

constexpr inline int32_t EnumMax<ProfilingVerbosity>() noexcept

{

    return 3;

}


// Integer type that carries a set of serialization flags; used by ISerializationConfig::setFlags() / getFlags().
// presumably bit i corresponds to the SerializationFlag with value i — TODO confirm
using SerializationFlags = uint32_t;


// Individual serialization flags; used by ISerializationConfig::setFlag(), clearFlag() and getFlag().
enum class SerializationFlag : int32_t

{

    kEXCLUDE_WEIGHTS = 0,

    kEXCLUDE_LEAN_RUNTIME = 1,

};


// Number of SerializationFlag enumerators (values 0..1 above).
template <>

constexpr inline int32_t EnumMax<SerializationFlag>() noexcept

{

    return 2;

}


// Holds the flags that control engine serialization. Created by ICudaEngine::createSerializationConfig()
// and consumed by ICudaEngine::serializeWithConfig(). Every member function forwards to the
// apiv::VSerializationConfig object behind mImpl; the bool results come from the implementation.
class ISerializationConfig : public INoCopy

{

public:

    virtual ~ISerializationConfig() noexcept = default;


    // Replaces the whole flag set.
    bool setFlags(SerializationFlags serializationFlags) noexcept

    {

        return mImpl->setFlags(serializationFlags);

    }


    // Returns the whole flag set.
    SerializationFlags getFlags() const noexcept

    {

        return mImpl->getFlags();

    }


    // Clears a single flag.
    bool clearFlag(SerializationFlag serializationFlag) noexcept

    {

        return mImpl->clearFlag(serializationFlag);

    }


    // Sets a single flag.
    bool setFlag(SerializationFlag serializationFlag) noexcept

    {

        return mImpl->setFlag(serializationFlag);

    }


    // Queries a single flag.
    bool getFlag(SerializationFlag serializationFlag) const noexcept

    {

        return mImpl->getFlag(serializationFlag);

    }


protected:

    // Not initialized in this header; presumably set by the concrete implementation — verify.
    apiv::VSerializationConfig* mImpl;

};


// Strategy selector passed to ICudaEngine::createExecutionContext(), whose default argument is kSTATIC.
enum class ExecutionContextAllocationStrategy : int32_t

{

    kSTATIC = 0,

    kON_PROFILE_CHANGE = 1,

    kUSER_MANAGED = 2,

};


// Number of ExecutionContextAllocationStrategy enumerators (values 0..2 above).
template <>

constexpr inline int32_t EnumMax<ExecutionContextAllocationStrategy>() noexcept

{

    return 3;

}


// Deserialized engine. IRuntime::deserializeCudaEngine() returns a pointer to this type.
// Every member function is a thin inline wrapper that forwards to the apiv::VCudaEngine object behind mImpl.
// Several tensor queries come as an overload pair: f(tensorName) forwards to the implementation's f(),
// while f(tensorName, profileIndex) forwards to the implementation's fV2().
class ICudaEngine : public INoCopy

{

public:

    virtual ~ICudaEngine() noexcept = default;


    // --- Basic tensor queries by name ---

    Dims getTensorShape(char const* tensorName) const noexcept

    {

        return mImpl->getTensorShape(tensorName);

    }


    DataType getTensorDataType(char const* tensorName) const noexcept

    {

        return mImpl->getTensorDataType(tensorName);

    }


    int32_t getNbLayers() const noexcept

    {

        return mImpl->getNbLayers();

    }


    // Returns the serialized engine as an IHostMemory.
    // NOTE(review): ownership of the returned object is not visible in this header.
    IHostMemory* serialize() const noexcept

    {

        return mImpl->serialize();

    }


    // Creates an execution context; the strategy defaults to kSTATIC.
    IExecutionContext* createExecutionContext(

        ExecutionContextAllocationStrategy strategy = ExecutionContextAllocationStrategy::kSTATIC) noexcept

    {

        return mImpl->createExecutionContext(strategy);

    }


    TensorLocation getTensorLocation(char const* tensorName) const noexcept

    {

        return mImpl->getTensorLocation(tensorName);

    }


    bool isShapeInferenceIO(char const* tensorName) const noexcept

    {

        return mImpl->isShapeInferenceIO(tensorName);

    }


    TensorIOMode getTensorIOMode(char const* tensorName) const noexcept

    {

        return mImpl->getTensorIOMode(tensorName);

    }


    // Deprecated; createExecutionContext() takes an allocation strategy instead.
    TRT_DEPRECATED IExecutionContext* createExecutionContextWithoutDeviceMemory() noexcept

    {

        return mImpl->createExecutionContextWithoutDeviceMemory();

    }


    // --- Device memory size: deprecated size_t variants and their int64_t V2 counterparts ---

    TRT_DEPRECATED size_t getDeviceMemorySize() const noexcept

    {

        return mImpl->getDeviceMemorySize();

    }


    TRT_DEPRECATED size_t getDeviceMemorySizeForProfile(int32_t profileIndex) const noexcept

    {

        return mImpl->getDeviceMemorySizeForProfile(profileIndex);

    }


    int64_t getDeviceMemorySizeV2() const noexcept

    {

        return mImpl->getDeviceMemorySizeV2();

    }


    int64_t getDeviceMemorySizeForProfileV2(int32_t profileIndex) const noexcept

    {

        return mImpl->getDeviceMemorySizeForProfileV2(profileIndex);

    }


    bool isRefittable() const noexcept

    {

        return mImpl->isRefittable();

    }


    // --- Tensor format queries: overload pairs (name) / (name, profileIndex) ---

    int32_t getTensorBytesPerComponent(char const* tensorName) const noexcept

    {

        return mImpl->getTensorBytesPerComponent(tensorName);

    }


    int32_t getTensorBytesPerComponent(char const* tensorName, int32_t profileIndex) const noexcept

    {

        return mImpl->getTensorBytesPerComponentV2(tensorName, profileIndex);

    }


    int32_t getTensorComponentsPerElement(char const* tensorName) const noexcept

    {

        return mImpl->getTensorComponentsPerElement(tensorName);

    }


    int32_t getTensorComponentsPerElement(char const* tensorName, int32_t profileIndex) const noexcept

    {

        return mImpl->getTensorComponentsPerElementV2(tensorName, profileIndex);

    }


    TensorFormat getTensorFormat(char const* tensorName) const noexcept

    {

        return mImpl->getTensorFormat(tensorName);

    }


    TensorFormat getTensorFormat(char const* tensorName, int32_t profileIndex) const noexcept

    {

        return mImpl->getTensorFormatV2(tensorName, profileIndex);

    }


    char const* getTensorFormatDesc(char const* tensorName) const noexcept

    {

        return mImpl->getTensorFormatDesc(tensorName);

    }


    char const* getTensorFormatDesc(char const* tensorName, int32_t profileIndex) const noexcept

    {

        return mImpl->getTensorFormatDescV2(tensorName, profileIndex);

    }


    int32_t getTensorVectorizedDim(char const* tensorName) const noexcept

    {

        return mImpl->getTensorVectorizedDim(tensorName);

    }


    int32_t getTensorVectorizedDim(char const* tensorName, int32_t profileIndex) const noexcept

    {

        return mImpl->getTensorVectorizedDimV2(tensorName, profileIndex);

    }


    char const* getName() const noexcept

    {

        return mImpl->getName();

    }


    // --- Optimization profiles ---

    int32_t getNbOptimizationProfiles() const noexcept

    {

        return mImpl->getNbOptimizationProfiles();

    }


    Dims getProfileShape(char const* tensorName, int32_t profileIndex, OptProfileSelector select) const noexcept

    {

        return mImpl->getProfileShape(tensorName, profileIndex, select);

    }


    // NOTE(review): the number of values behind the returned pointer is not visible in this header.
    int32_t const* getProfileTensorValues(char const* tensorName, int32_t profileIndex, OptProfileSelector select) const

        noexcept

    {

        return mImpl->getProfileTensorValues(tensorName, profileIndex, select);

    }


    EngineCapability getEngineCapability() const noexcept

    {

        return mImpl->getEngineCapability();

    }


    // --- Error recorder ---

    // `return` of a void call: equivalent to a plain call.
    void setErrorRecorder(IErrorRecorder* recorder) noexcept

    {

        return mImpl->setErrorRecorder(recorder);

    }


    IErrorRecorder* getErrorRecorder() const noexcept

    {

        return mImpl->getErrorRecorder();

    }


    TRT_DEPRECATED bool hasImplicitBatchDimension() const noexcept

    {

        return mImpl->hasImplicitBatchDimension();

    }


    TacticSources getTacticSources() const noexcept

    {

        return mImpl->getTacticSources();

    }


    ProfilingVerbosity getProfilingVerbosity() const noexcept

    {

        return mImpl->getProfilingVerbosity();

    }


    // NOTE(review): ownership of the returned inspector is not visible in this header.
    IEngineInspector* createEngineInspector() const noexcept

    {

        return mImpl->createEngineInspector();

    }


    // --- I/O tensor enumeration ---

    int32_t getNbIOTensors() const noexcept

    {

        return mImpl->getNbIOTensors();

    }


    // presumably valid for index in [0, getNbIOTensors()) — TODO confirm
    char const* getIOTensorName(int32_t index) const noexcept

    {

        return mImpl->getIOTensorName(index);

    }


    HardwareCompatibilityLevel getHardwareCompatibilityLevel() const noexcept

    {

        return mImpl->getHardwareCompatibilityLevel();

    }


    int32_t getNbAuxStreams() const noexcept

    {

        return mImpl->getNbAuxStreams();

    }


    // --- Serialization with explicit configuration ---

    ISerializationConfig* createSerializationConfig() noexcept

    {

        return mImpl->createSerializationConfig();

    }


    IHostMemory* serializeWithConfig(ISerializationConfig& config) const noexcept

    {

        return mImpl->serializeWithConfig(config);

    }


    // --- Weight streaming: three deprecated functions, followed by the current V2 set ---

    TRT_DEPRECATED bool setWeightStreamingBudget(int64_t gpuMemoryBudget) noexcept

    {

        return mImpl->setWeightStreamingBudget(gpuMemoryBudget);

    }


    TRT_DEPRECATED int64_t getWeightStreamingBudget() const noexcept

    {

        return mImpl->getWeightStreamingBudget();

    }


    TRT_DEPRECATED int64_t getMinimumWeightStreamingBudget() const noexcept

    {

        return mImpl->getMinimumWeightStreamingBudget();

    }


    int64_t getStreamableWeightsSize() const noexcept

    {

        return mImpl->getStreamableWeightsSize();

    }


    bool setWeightStreamingBudgetV2(int64_t gpuMemoryBudget) noexcept

    {

        return mImpl->setWeightStreamingBudgetV2(gpuMemoryBudget);

    }


    int64_t getWeightStreamingBudgetV2() const noexcept

    {

        return mImpl->getWeightStreamingBudgetV2();

    }


    int64_t getWeightStreamingAutomaticBudget() const noexcept

    {

        return mImpl->getWeightStreamingAutomaticBudget();

    }


    int64_t getWeightStreamingScratchMemorySize() const noexcept

    {

        return mImpl->getWeightStreamingScratchMemorySize();

    }


    bool isDebugTensor(char const* name) const noexcept

    {

        return mImpl->isDebugTensor(name);

    }


protected:

    // Not initialized in this header; presumably set by the concrete implementation — verify.
    apiv::VCudaEngine* mImpl;

};


namespace v_1_0
{
//! \brief Callback interface that can be attached to an output tensor through
//! IExecutionContext::setOutputAllocator().
//!
//! Only notifyShape() is pure virtual; both reallocation hooks ship with default bodies.
class IOutputAllocator : public IVersionedInterface
{
public:
    //! \brief Report the interface descriptor {"IOutputAllocator", 1, 0}.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return {"IOutputAllocator", 1, 0};
    }

    //! \brief Deprecated synchronous reallocation hook.
    //!
    //! The default implementation ignores all of its arguments and returns nullptr.
    TRT_DEPRECATED virtual void* reallocateOutput(
        char const* tensorName, void* currentMemory, uint64_t size, uint64_t alignment) noexcept
    {
        return nullptr;
    }

    //! \brief Stream-aware reallocation hook.
    //!
    //! The default implementation drops the stream argument and delegates to reallocateOutput()
    //! with the remaining four arguments.
    //!
    //! NOTE(review): unlike its siblings, this virtual is not declared noexcept.
    virtual void* reallocateOutputAsync(
        char const* tensorName, void* currentMemory, uint64_t size, uint64_t alignment, cudaStream_t /*stream*/)
    {
        void* const fallbackResult = reallocateOutput(tensorName, currentMemory, size, alignment);
        return fallbackResult;
    }

    //! \brief Shape notification hook; must be provided by every concrete allocator.
    //!
    //! \param tensorName Name of the tensor the shape belongs to.
    //! \param dims Shape being reported.
    virtual void notifyShape(char const* tensorName, Dims const& dims) noexcept = 0;
};
} // namespace v_1_0

//! Expose the v_1_0 definition under the unversioned nvinfer1 name.
using IOutputAllocator = v_1_0::IOutputAllocator;


namespace v_1_0
{
//! \brief Callback interface that can be installed on an execution context through
//! IExecutionContext::setDebugListener().
class IDebugListener : public IVersionedInterface
{
public:
    //! \brief Report the interface descriptor {"IDebugListener", 1, 0}.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return {"IDebugListener", 1, 0};
    }

    //! \brief Debug-tensor callback; must be provided by every concrete listener.
    //!
    //! \param addr Address of the tensor data.
    //! \param location Location of the tensor data.
    //! \param type Data type of the tensor.
    //! \param shape Shape of the tensor.
    //! \param name Name of the tensor.
    //! \param stream CUDA stream associated with the call.
    //!
    //! NOTE(review): this pure virtual is not declared noexcept.
    virtual bool processDebugTensor(void const* addr, TensorLocation location, DataType type, Dims const& shape,
        char const* name, cudaStream_t stream) = 0;

    ~IDebugListener() override = default;
};
} // namespace v_1_0

//! Expose the v_1_0 definition under the unversioned nvinfer1 name.
using IDebugListener = v_1_0::IDebugListener;


//! \brief Context for executing inference using an engine, with functionally unsafe features.
//!
//! Derives from INoCopy, so instances can be neither copied nor moved. Every public member is a
//! thin inline wrapper that forwards its arguments to the implementation object held in mImpl.
class IExecutionContext : public INoCopy
{
public:
    virtual ~IExecutionContext() noexcept = default;

    //! \brief Forward the debug-sync flag to the implementation.
    void setDebugSync(bool sync) noexcept
    {
        mImpl->setDebugSync(sync);
    }

    //! \brief Return the debug-sync flag reported by the implementation.
    bool getDebugSync() const noexcept
    {
        return mImpl->getDebugSync();
    }

    //! \brief Hand a profiler pointer to the implementation.
    void setProfiler(IProfiler* profiler) noexcept
    {
        mImpl->setProfiler(profiler);
    }

    //! \brief Return the profiler pointer reported by the implementation.
    IProfiler* getProfiler() const noexcept
    {
        return mImpl->getProfiler();
    }

    //! \brief Get the associated engine.
    ICudaEngine const& getEngine() const noexcept
    {
        return mImpl->getEngine();
    }

    //! \brief Forward a name for this execution context to the implementation.
    void setName(char const* name) noexcept
    {
        mImpl->setName(name);
    }

    //! \brief Return the name of the execution context.
    char const* getName() const noexcept
    {
        return mImpl->getName();
    }

    //! \brief Set the device memory for use by this execution context.
    void setDeviceMemory(void* memory) noexcept
    {
        mImpl->setDeviceMemory(memory);
    }

    //! \brief Variant of setDeviceMemory() that additionally forwards a size.
    //!
    //! \param memory Device memory pointer, forwarded unchanged.
    //! \param size Size value, forwarded unchanged.
    void setDeviceMemoryV2(void* memory, int64_t size) noexcept
    {
        // Plain call, matching the other void forwarders (no `return` on a void expression).
        mImpl->setDeviceMemoryV2(memory, size);
    }

    //! \brief Return the strides the implementation reports for the named tensor.
    Dims getTensorStrides(char const* tensorName) const noexcept
    {
        return mImpl->getTensorStrides(tensorName);
    }

    //! \brief Return the optimization profile value reported by the implementation.
    int32_t getOptimizationProfile() const noexcept
    {
        return mImpl->getOptimizationProfile();
    }

    //! \brief Set shape of given input.
    //!
    //! \return The boolean reported by the implementation.
    bool setInputShape(char const* tensorName, Dims const& dims) noexcept
    {
        return mImpl->setInputShape(tensorName, dims);
    }

    //! \brief Return the shape of the given input or output.
    Dims getTensorShape(char const* tensorName) const noexcept
    {
        return mImpl->getTensorShape(tensorName);
    }

    //! \brief Return the implementation's answer to allInputDimensionsSpecified().
    bool allInputDimensionsSpecified() const noexcept
    {
        return mImpl->allInputDimensionsSpecified();
    }

    //! \brief Whether all input shape bindings have been specified.
    //!
    //! Marked TRT_DEPRECATED.
    TRT_DEPRECATED bool allInputShapesSpecified() const noexcept
    {
        return mImpl->allInputShapesSpecified();
    }

    //! \brief Set the ErrorRecorder for this interface.
    void setErrorRecorder(IErrorRecorder* recorder) noexcept
    {
        mImpl->setErrorRecorder(recorder);
    }

    //! \brief Get the ErrorRecorder assigned to this interface.
    IErrorRecorder* getErrorRecorder() const noexcept
    {
        return mImpl->getErrorRecorder();
    }

    //! \brief Synchronously execute a network.
    //!
    //! \param bindings Array of buffer pointers, forwarded unchanged.
    //! \return The boolean reported by the implementation.
    bool executeV2(void* const* bindings) noexcept
    {
        return mImpl->executeV2(bindings);
    }

    //! \brief Select an optimization profile for the current context with async semantics.
    bool setOptimizationProfileAsync(int32_t profileIndex, cudaStream_t stream) noexcept
    {
        return mImpl->setOptimizationProfileAsync(profileIndex, stream);
    }

    //! \brief Set whether enqueue emits layer timing to the profiler.
    void setEnqueueEmitsProfile(bool enqueueEmitsProfile) noexcept
    {
        mImpl->setEnqueueEmitsProfile(enqueueEmitsProfile);
    }

    //! \brief Get the enqueueEmitsProfile state.
    bool getEnqueueEmitsProfile() const noexcept
    {
        return mImpl->getEnqueueEmitsProfile();
    }

    //! \brief Calculate layer timing info for the current optimization profile in
    //! IExecutionContext (see the implementation for what is updated).
    bool reportToProfiler() const noexcept
    {
        return mImpl->reportToProfiler();
    }

    //! \brief Set memory address for given input or output tensor.
    bool setTensorAddress(char const* tensorName, void* data) noexcept
    {
        return mImpl->setTensorAddress(tensorName, data);
    }

    //! \brief Get memory address bound to given input or output tensor.
    void const* getTensorAddress(char const* tensorName) const noexcept
    {
        return mImpl->getTensorAddress(tensorName);
    }

    //! \brief Set the memory address for a given output tensor.
    bool setOutputTensorAddress(char const* tensorName, void* data) noexcept
    {
        return mImpl->setOutputTensorAddress(tensorName, data);
    }

    //! \brief Input-tensor counterpart of setOutputTensorAddress(); takes a pointer to const data.
    bool setInputTensorAddress(char const* tensorName, void const* data) noexcept
    {
        return mImpl->setInputTensorAddress(tensorName, data);
    }

    //! \brief Return the mutable address the implementation reports for the named output tensor.
    void* getOutputTensorAddress(char const* tensorName) const noexcept
    {
        return mImpl->getOutputTensorAddress(tensorName);
    }

    //! \brief Run shape calculations.
    //!
    //! \param nbMaxNames Forwarded unchanged to the implementation.
    //! \param tensorNames Forwarded unchanged to the implementation.
    //! \return The integer reported by the implementation.
    int32_t inferShapes(int32_t nbMaxNames, char const** tensorNames) noexcept
    {
        return mImpl->inferShapes(nbMaxNames, tensorNames);
    }

    //! \brief Recompute the internal activation buffer sizes based on the current input shapes.
    //!
    //! \return The size value reported by the implementation.
    size_t updateDeviceMemorySizeForShapes() noexcept
    {
        return mImpl->updateDeviceMemorySizeForShapes();
    }

    //! \brief Forward an input-consumed CUDA event to the implementation.
    bool setInputConsumedEvent(cudaEvent_t event) noexcept
    {
        return mImpl->setInputConsumedEvent(event);
    }

    //! \brief Return the input-consumed CUDA event reported by the implementation.
    cudaEvent_t getInputConsumedEvent() const noexcept
    {
        return mImpl->getInputConsumedEvent();
    }

    //! \brief Set output allocator to use for output tensor of given name.
    bool setOutputAllocator(char const* tensorName, IOutputAllocator* outputAllocator) noexcept
    {
        return mImpl->setOutputAllocator(tensorName, outputAllocator);
    }

    //! \brief Get output allocator associated with output tensor of given name.
    IOutputAllocator* getOutputAllocator(char const* tensorName) const noexcept
    {
        return mImpl->getOutputAllocator(tensorName);
    }

    //! \brief Get upper bound on an output tensor's size, in bytes.
    int64_t getMaxOutputSize(char const* tensorName) const noexcept
    {
        return mImpl->getMaxOutputSize(tensorName);
    }

    //! \brief Specify allocator to use for internal temporary storage.
    bool setTemporaryStorageAllocator(IGpuAllocator* allocator) noexcept
    {
        return mImpl->setTemporaryStorageAllocator(allocator);
    }

    //! \brief Get allocator set by setTemporaryStorageAllocator.
    IGpuAllocator* getTemporaryStorageAllocator() const noexcept
    {
        return mImpl->getTemporaryStorageAllocator();
    }

    //! \brief Forward an enqueue request on the given CUDA stream to the implementation.
    //!
    //! \return The boolean reported by the implementation.
    bool enqueueV3(cudaStream_t stream) noexcept
    {
        return mImpl->enqueueV3(stream);
    }

    //! \brief Set the maximum size for persistent cache usage.
    void setPersistentCacheLimit(size_t size) noexcept
    {
        mImpl->setPersistentCacheLimit(size);
    }

    //! \brief Get the maximum size for persistent cache usage.
    size_t getPersistentCacheLimit() const noexcept
    {
        return mImpl->getPersistentCacheLimit();
    }

    //! \brief Forward an NVTX verbosity setting to the implementation.
    bool setNvtxVerbosity(ProfilingVerbosity verbosity) noexcept
    {
        return mImpl->setNvtxVerbosity(verbosity);
    }

    //! \brief Get the NVTX verbosity of the execution context.
    ProfilingVerbosity getNvtxVerbosity() const noexcept
    {
        return mImpl->getNvtxVerbosity();
    }

    //! \brief Set the auxiliary streams that TensorRT should launch kernels on in the next
    //! enqueueV3() call.
    void setAuxStreams(cudaStream_t* auxStreams, int32_t nbStreams) noexcept
    {
        mImpl->setAuxStreams(auxStreams, nbStreams);
    }

    //! \brief Set DebugListener for this execution context.
    bool setDebugListener(IDebugListener* listener) noexcept
    {
        return mImpl->setDebugListener(listener);
    }

    //! \brief Return the debug listener pointer reported by the implementation.
    IDebugListener* getDebugListener() noexcept
    {
        return mImpl->getDebugListener();
    }

    //! \brief Set debug state of tensor given the tensor name.
    bool setTensorDebugState(char const* name, bool flag) noexcept
    {
        return mImpl->setTensorDebugState(name, flag);
    }

    //! \brief Forward a single debug-state flag for all tensors to the implementation.
    bool setAllTensorsDebugState(bool flag) noexcept
    {
        return mImpl->setAllTensorsDebugState(flag);
    }

    //! \brief Return the debug state the implementation reports for the named tensor.
    bool getDebugState(char const* name) const noexcept
    {
        return mImpl->getDebugState(name);
    }

protected:
    //! Implementation object that every wrapper above forwards to.
    apiv::VExecutionContext* mImpl;
}; // class IExecutionContext


//! \brief Format selector accepted by IEngineInspector::getLayerInformation() and
//! IEngineInspector::getEngineInformation().
enum class LayerInformationFormat : int32_t
{
    kONELINE = 0, //!< Underlying value 0.
    kJSON = 1,    //!< Underlying value 1.
};


//! \brief EnumMax specialization for LayerInformationFormat.
//!
//! Returns 2, matching the two enumerators (kONELINE, kJSON) declared for that enum.
template <>
inline constexpr int32_t EnumMax<LayerInformationFormat>() noexcept
{
    return 2;
}


//! \brief An engine inspector which prints out the layer information of an engine or an
//! execution context.
//!
//! Derives from INoCopy, so instances can be neither copied nor moved. Every public member
//! forwards to the implementation object held in mImpl.
class IEngineInspector : public INoCopy
{
public:
    virtual ~IEngineInspector() noexcept = default;

    //! \brief Hand the execution context to inspect to the implementation.
    //!
    //! \return The boolean reported by the implementation.
    bool setExecutionContext(IExecutionContext const* context) noexcept
    {
        return mImpl->setExecutionContext(context);
    }

    //! \brief Get the context currently being inspected.
    IExecutionContext const* getExecutionContext() const noexcept
    {
        return mImpl->getExecutionContext();
    }

    //! \brief Get a string describing the information about a specific layer.
    //!
    //! \param layerIndex Index of the layer, forwarded unchanged.
    //! \param format Requested output format.
    char const* getLayerInformation(int32_t layerIndex, LayerInformationFormat format) const noexcept
    {
        return mImpl->getLayerInformation(layerIndex, format);
    }

    //! \brief Get a string describing the information about all the layers.
    //!
    //! \param format Requested output format.
    char const* getEngineInformation(LayerInformationFormat format) const noexcept
    {
        return mImpl->getEngineInformation(format);
    }

    //! \brief Set the ErrorRecorder for this interface.
    void setErrorRecorder(IErrorRecorder* recorder) noexcept
    {
        mImpl->setErrorRecorder(recorder);
    }

    //! \brief Get the ErrorRecorder assigned to this interface.
    IErrorRecorder* getErrorRecorder() const noexcept
    {
        return mImpl->getErrorRecorder();
    }

protected:
    //! Implementation object that every wrapper above forwards to.
    apiv::VEngineInspector* mImpl;
}; // class IEngineInspector


} // namespace nvinfer1


extern "C"
{
    //! Internal C entry point; called by nvinfer1::createInferRuntime() with the address of an
    //! ILogger and NV_TENSORRT_VERSION.
    TENSORRTAPI void* createInferRuntime_INTERNAL(void* logger, int32_t version) noexcept;

    //! Internal C entry point; called by nvinfer1::createInferRefitter() with the addresses of an
    //! ICudaEngine and an ILogger plus NV_TENSORRT_VERSION.
    TENSORRTAPI void* createInferRefitter_INTERNAL(void* engine, void* logger, int32_t version) noexcept;

    //! Return the plugin registry.
    TENSORRTAPI nvinfer1::IPluginRegistry* getPluginRegistry() noexcept;

    //! Return the logger object.
    TENSORRTAPI nvinfer1::ILogger* getLogger() noexcept;
} // extern "C"


namespace nvinfer1

{

// The unnamed namespace avoids linkage surprises when linking objects built with different
// versions of this header.
namespace
{
//! \brief Create an IRuntime through the C entry point createInferRuntime_INTERNAL().
//!
//! \param logger Logger whose address is passed to the entry point.
//! \return The entry point's void* result, cast to IRuntime*.
inline IRuntime* createInferRuntime(ILogger& logger) noexcept
{
    // The header's own version macro is sent along with the request.
    void* const rawRuntime = createInferRuntime_INTERNAL(&logger, NV_TENSORRT_VERSION);
    return static_cast<IRuntime*>(rawRuntime);
}

//! \brief Create an IRefitter through the C entry point createInferRefitter_INTERNAL().
//!
//! \param engine Engine whose address is passed to the entry point.
//! \param logger Logger whose address is passed to the entry point.
//! \return The entry point's void* result, cast to IRefitter*.
inline IRefitter* createInferRefitter(ICudaEngine& engine, ILogger& logger) noexcept
{
    void* const rawRefitter = createInferRefitter_INTERNAL(&engine, &logger, NV_TENSORRT_VERSION);
    return static_cast<IRefitter*>(rawRefitter);
}

} // namespace


//! \brief Helper whose constructor registers an instance of \p T with the plugin registry.
//!
//! \tparam T Type held by value and value-initialized as the member `instance`.
template <typename T>
class PluginRegistrar
{
public:
    //! Register `instance` with the registry returned by getPluginRegistry(), passing the empty
    //! string as the second argument. The result of registerCreator() is not inspected.
    PluginRegistrar()
    {
        // `instance` is already constructed here: members are initialized before the body runs.
        auto* const registry = getPluginRegistry();
        registry->registerCreator(instance, "");
    }

private:
    //! Object handed to the registry; lives as long as this registrar.
    T instance{};
};


} // namespace nvinfer1


//! \brief Define a static nvinfer1::PluginRegistrar<name> object called pluginRegistrar<name>.
//!
//! The terminating semicolon is supplied at the point of use.
//! The continuation backslash must be followed directly by the replacement text: a blank line in
//! between would end the macro with an empty body.
#define REGISTER_TENSORRT_PLUGIN(name)                                                                                 \
    static nvinfer1::PluginRegistrar<name> pluginRegistrar##name {}


namespace nvinfer1

{

//! \brief Abstract interface exposing a single hook that yields an ILogger pointer.
class ILoggerFinder
{
public:
    //! \brief Return an ILogger pointer; must be provided by every concrete finder.
    //!
    //! NOTE(review): this pure virtual is not declared noexcept.
    virtual ILogger* findLogger() = 0;

protected:
    //! Protected, so a finder cannot be deleted through an ILoggerFinder pointer from outside
    //! the class hierarchy.
    virtual ~ILoggerFinder() = default;
};


namespace v_1_0

{


//! \brief IGpuAllocator refinement in which the stream-aware entry points are the ones a
//! subclass must implement.
//!
//! allocateAsync() and deallocateAsync() are re-declared pure virtual here, while the deprecated
//! synchronous entry points are implemented on top of them.
class IGpuAsyncAllocator : public IGpuAllocator
{
public:
    IGpuAsyncAllocator() = default;
    ~IGpuAsyncAllocator() override = default;

    //! \brief Stream-aware allocation hook; must be provided by every concrete allocator.
    void* allocateAsync(uint64_t const size, uint64_t const alignment, AllocatorFlags const flags,
        cudaStream_t /*stream*/) noexcept override = 0;

    //! \brief Stream-aware deallocation hook; must be provided by every concrete allocator.
    bool deallocateAsync(void* const memory, cudaStream_t /*stream*/) noexcept override = 0;

    //! \brief Deprecated synchronous allocation; delegates to allocateAsync() with a null stream.
    TRT_DEPRECATED void* allocate(
        uint64_t const size, uint64_t const alignment, AllocatorFlags const flags) noexcept override
    {
        void* const allocation = allocateAsync(size, alignment, flags, nullptr);
        return allocation;
    }

    //! \brief Deprecated synchronous deallocation; delegates to deallocateAsync() with a null
    //! stream.
    TRT_DEPRECATED bool deallocate(void* const memory) noexcept override
    {
        bool const result = deallocateAsync(memory, nullptr);
        return result;
    }

    //! \brief Report the interface descriptor {"IGpuAllocator", 1, 0}.
    //!
    //! NOTE(review): the reported name is that of the base interface, not "IGpuAsyncAllocator";
    //! presumably intentional for compatibility, confirm before changing.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return {"IGpuAllocator", 1, 0};
    }
};


//! \brief Plugin creator interface whose factory method produces IPluginV3 objects.
//!
//! Everything except getInterfaceInfo() is pure virtual. Copy and move operations are
//! protected, so only derived classes can copy or move the base subobject.
class IPluginCreatorV3One : public IPluginCreatorInterface
{
public:
    //! \brief Report the interface descriptor {"PLUGIN CREATOR_V3ONE", 1, 0}.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return {"PLUGIN CREATOR_V3ONE", 1, 0};
    }

    //! \brief Factory hook returning an IPluginV3 pointer.
    //!
    //! \param name Name argument supplied by the caller.
    //! \param fc Field collection supplied by the caller.
    //! \param phase TensorRT phase supplied by the caller.
    virtual IPluginV3* createPlugin(
        AsciiChar const* name, PluginFieldCollection const* fc, TensorRTPhase phase) noexcept = 0;

    //! \brief Return a pointer to a PluginFieldCollection.
    virtual PluginFieldCollection const* getFieldNames() noexcept = 0;

    //! \brief Return the plugin name string.
    virtual AsciiChar const* getPluginName() const noexcept = 0;

    //! \brief Return the plugin version string.
    virtual AsciiChar const* getPluginVersion() const noexcept = 0;

    //! \brief Return the plugin namespace string.
    virtual AsciiChar const* getPluginNamespace() const noexcept = 0;

    IPluginCreatorV3One() = default;
    virtual ~IPluginCreatorV3One() = default;

protected:
    // Copy/move stay available to subclasses only; the assignment operators are
    // lvalue-ref-qualified, so they cannot be invoked on temporaries.
    IPluginCreatorV3One(IPluginCreatorV3One const&) = default;
    IPluginCreatorV3One(IPluginCreatorV3One&&) = default;
    IPluginCreatorV3One& operator=(IPluginCreatorV3One const&) & = default;
    IPluginCreatorV3One& operator=(IPluginCreatorV3One&&) & = default;
};


} // namespace v_1_0


//! Expose the v_1_0 definition under the unversioned nvinfer1 name.
using IGpuAsyncAllocator = v_1_0::IGpuAsyncAllocator;


//! Expose the v_1_0 definition under the unversioned nvinfer1 name.
using IPluginCreatorV3One = v_1_0::IPluginCreatorV3One;


} // namespace nvinfer1


extern "C"
{
    //! Return the library major version number.
    TENSORRTAPI int32_t getInferLibMajorVersion() noexcept;

    //! Return the library minor version number.
    TENSORRTAPI int32_t getInferLibMinorVersion() noexcept;

    //! Return the library patch version number.
    TENSORRTAPI int32_t getInferLibPatchVersion() noexcept;

    //! Return the library build version number.
    TENSORRTAPI int32_t getInferLibBuildVersion() noexcept;
} // extern "C"


#endif // NV_INFER_RUNTIME_H

NvInferImpl.h

NvInferPluginBase.h

getLogger
nvinfer1::ILogger * getLogger() noexcept
Return the logger object.

getInferLibMajorVersion
int32_t getInferLibMajorVersion() noexcept
Return the library major version number.

getPluginRegistry
nvinfer1::IPluginRegistry * getPluginRegistry() noexcept
Return the plugin registry.

getInferLibPatchVersion
int32_t getInferLibPatchVersion() noexcept
Return the library patch version number.

getInferLibMinorVersion
int32_t getInferLibMinorVersion() noexcept
Return the library minor version number.

getInferLibBuildVersion
int32_t getInferLibBuildVersion() noexcept
Return the library build version number.

TENSORRTAPI
#define TENSORRTAPI
Definition: NvInferRuntimeBase.h:55

NV_TENSORRT_VERSION
#define NV_TENSORRT_VERSION
Definition: NvInferRuntimeBase.h:87

TRT_DEPRECATED
#define TRT_DEPRECATED
Definition: NvInferRuntimeBase.h:41

TRT_DEPRECATED_ENUM
#define TRT_DEPRECATED_ENUM
Definition: NvInferRuntimeBase.h:42

NvInferRuntimeCommon.h

Dims
Structure to define the dimensions of a tensor.

nvinfer1::Dims64
Definition: NvInferRuntimeBase.h:200

nvinfer1::Dims64::MAX_DIMS
static constexpr int32_t MAX_DIMS
The maximum rank (number of dimensions) supported for a tensor.
Definition: NvInferRuntimeBase.h:203

nvinfer1::DimsExprs
Analog of class Dims with expressions instead of constants for the dimensions.
Definition: NvInferRuntime.h:350

nvinfer1::DimsExprs::d
IDimensionExpr const  * d[Dims::MAX_DIMS]
The extent of each dimension.
Definition: NvInferRuntime.h:353

nvinfer1::DimsExprs::nbDims
int32_t nbDims
The number of dimensions.
Definition: NvInferRuntime.h:352

nvinfer1::ICudaEngine
An engine for executing inference on a built network, with functionally unsafe features.
Definition: NvInferRuntime.h:3004

nvinfer1::ICudaEngine::getTensorBytesPerComponent
int32_t getTensorBytesPerComponent(char const *tensorName) const noexcept
Return the number of bytes per component of an element, or -1 if the tensor is not vectorized or prov...
Definition: NvInferRuntime.h:3229

nvinfer1::ICudaEngine::createSerializationConfig
ISerializationConfig * createSerializationConfig() noexcept
Create a serialization configuration object.
Definition: NvInferRuntime.h:3626

nvinfer1::ICudaEngine::getWeightStreamingBudget
TRT_DEPRECATED int64_t getWeightStreamingBudget() const noexcept
Returns the current weight streaming device memory budget in bytes.
Definition: NvInferRuntime.h:3707

nvinfer1::ICudaEngine::getProfileTensorValues
int32_t const * getProfileTensorValues(char const *tensorName, int32_t profileIndex, OptProfileSelector select) const noexcept
Get the minimum / optimum / maximum values (not dimensions) for an input tensor given its name under ...
Definition: NvInferRuntime.h:3463

nvinfer1::ICudaEngine::getIOTensorName
char const * getIOTensorName(int32_t index) const noexcept
Return name of an IO tensor.
Definition: NvInferRuntime.h:3590

nvinfer1::ICudaEngine::getWeightStreamingBudgetV2
int64_t getWeightStreamingBudgetV2() const noexcept
Returns the current weight streaming device memory budget in bytes.
Definition: NvInferRuntime.h:3806

nvinfer1::ICudaEngine::getEngineCapability
EngineCapability getEngineCapability() const noexcept
Determine what execution capability this engine has.
Definition: NvInferRuntime.h:3479

nvinfer1::ICudaEngine::getErrorRecorder
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:3513

nvinfer1::ICudaEngine::getTensorFormat
TensorFormat getTensorFormat(char const *tensorName, int32_t profileIndex) const noexcept
Return the tensor format of given profile, or TensorFormat::kLINEAR if the provided name does not map...
Definition: NvInferRuntime.h:3315

nvinfer1::ICudaEngine::hasImplicitBatchDimension
TRT_DEPRECATED bool hasImplicitBatchDimension() const noexcept
Query whether the engine was built with an implicit batch dimension.
Definition: NvInferRuntime.h:3527

nvinfer1::ICudaEngine::mImpl
apiv::VCudaEngine * mImpl
Definition: NvInferRuntime.h:3879

nvinfer1::ICudaEngine::getDeviceMemorySizeForProfile
TRT_DEPRECATED size_t getDeviceMemorySizeForProfile(int32_t profileIndex) const noexcept
Return the maximum device memory required by the context for a profile.
Definition: NvInferRuntime.h:3166

nvinfer1::ICudaEngine::createExecutionContext
IExecutionContext * createExecutionContext(ExecutionContextAllocationStrategy strategy=ExecutionContextAllocationStrategy::kSTATIC) noexcept
Create an execution context and specify the strategy for allocating internal activation memory.
Definition: NvInferRuntime.h:3078

nvinfer1::ICudaEngine::getTensorFormatDesc
char const * getTensorFormatDesc(char const *tensorName) const noexcept
Return the human readable description of the tensor format, or empty string if the provided name does...
Definition: NvInferRuntime.h:3339

nvinfer1::ICudaEngine::getProfileShape
Dims getProfileShape(char const *tensorName, int32_t profileIndex, OptProfileSelector select) const noexcept
Get the minimum / optimum / maximum dimensions for an input tensor given its name under an optimizati...
Definition: NvInferRuntime.h:3441

nvinfer1::ICudaEngine::setWeightStreamingBudgetV2
bool setWeightStreamingBudgetV2(int64_t gpuMemoryBudget) noexcept
Limit the maximum amount of GPU memory usable for network weights in bytes.
Definition: NvInferRuntime.h:3788

nvinfer1::ICudaEngine::getNbAuxStreams
int32_t getNbAuxStreams() const noexcept
Return the number of auxiliary streams used by this engine.
Definition: NvInferRuntime.h:3616

nvinfer1::ICudaEngine::getStreamableWeightsSize
int64_t getStreamableWeightsSize() const noexcept
Get the total size in bytes of all streamable weights.
Definition: NvInferRuntime.h:3746

nvinfer1::ICudaEngine::getTensorDataType
DataType getTensorDataType(char const *tensorName) const noexcept
Determine the required data type for a buffer from its tensor name.
Definition: NvInferRuntime.h:3033

nvinfer1::ICudaEngine::setErrorRecorder
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:3498

nvinfer1::ICudaEngine::getTacticSources
TacticSources getTacticSources() const noexcept
Return the tactic sources required by this engine.
Definition: NvInferRuntime.h:3543

nvinfer1::ICudaEngine::serializeWithConfig
IHostMemory * serializeWithConfig(ISerializationConfig &config) const noexcept
Serialize the network to a stream with the provided SerializationConfig.
Definition: NvInferRuntime.h:3642

nvinfer1::ICudaEngine::~ICudaEngine
virtual ~ICudaEngine() noexcept=default

nvinfer1::ICudaEngine::getWeightStreamingAutomaticBudget
int64_t getWeightStreamingAutomaticBudget() const noexcept
TensorRT automatically determines a device memory budget for the model to run. The budget is close to...
Definition: NvInferRuntime.h:3831

nvinfer1::ICudaEngine::isDebugTensor
bool isDebugTensor(char const *name) const noexcept
Check if a tensor is marked as a debug tensor.
Definition: NvInferRuntime.h:3873

nvinfer1::ICudaEngine::getTensorVectorizedDim
int32_t getTensorVectorizedDim(char const *tensorName, int32_t profileIndex) const noexcept
Return the dimension index that the buffer is vectorized of given profile, or -1 if the provided name...
Definition: NvInferRuntime.h:3395

nvinfer1::ICudaEngine::getName
char const * getName() const noexcept
Returns the name of the network associated with the engine.
Definition: NvInferRuntime.h:3410

nvinfer1::ICudaEngine::getProfilingVerbosity
ProfilingVerbosity getProfilingVerbosity() const noexcept
Return the ProfilingVerbosity the builder config was set to when the engine was built.
Definition: NvInferRuntime.h:3555

nvinfer1::ICudaEngine::isShapeInferenceIO
bool isShapeInferenceIO(char const *tensorName) const noexcept
True if tensor is required as input for shape calculations or is output from shape calculations.
Definition: NvInferRuntime.h:3116

nvinfer1::ICudaEngine::getWeightStreamingScratchMemorySize
int64_t getWeightStreamingScratchMemorySize() const noexcept
Returns the size of the scratch memory required by the current weight streaming budget.
Definition: NvInferRuntime.h:3859

nvinfer1::ICudaEngine::setWeightStreamingBudget
TRT_DEPRECATED bool setWeightStreamingBudget(int64_t gpuMemoryBudget) noexcept
Limit the maximum amount of GPU memory usable for network weights in bytes.
Definition: NvInferRuntime.h:3687

nvinfer1::ICudaEngine::getDeviceMemorySizeV2
int64_t getDeviceMemorySizeV2() const noexcept
Return the maximum device memory required by the context over all profiles.
Definition: NvInferRuntime.h:3182

nvinfer1::ICudaEngine::getTensorVectorizedDim
int32_t getTensorVectorizedDim(char const *tensorName) const noexcept
Return the dimension index that the buffer is vectorized, or -1 if the provided name does not map to ...
Definition: NvInferRuntime.h:3379

nvinfer1::ICudaEngine::getDeviceMemorySize
TRT_DEPRECATED size_t getDeviceMemorySize() const noexcept
Return the maximum device memory required by the context over all profiles.
Definition: NvInferRuntime.h:3154

nvinfer1::ICudaEngine::getTensorComponentsPerElement
int32_t getTensorComponentsPerElement(char const *tensorName, int32_t profileIndex) const noexcept
Return the number of components included in one element of given profile, or -1 if tensor is not vect...
Definition: NvInferRuntime.h:3286

nvinfer1::ICudaEngine::getDeviceMemorySizeForProfileV2
int64_t getDeviceMemorySizeForProfileV2(int32_t profileIndex) const noexcept
Return the maximum device memory required by the context for a profile.
Definition: NvInferRuntime.h:3198

nvinfer1::ICudaEngine::getTensorFormat
TensorFormat getTensorFormat(char const *tensorName) const noexcept
Return the tensor format, or TensorFormat::kLINEAR if the provided name does not map to an input or o...
Definition: NvInferRuntime.h:3301

nvinfer1::ICudaEngine::serialize
IHostMemory * serialize() const noexcept
Serialize the network to a stream.
Definition: NvInferRuntime.h:3061

nvinfer1::ICudaEngine::getTensorLocation
TensorLocation getTensorLocation(char const *tensorName) const noexcept
Get whether an input or output tensor must be on GPU or CPU.
Definition: NvInferRuntime.h:3096

nvinfer1::ICudaEngine::createEngineInspector
IEngineInspector * createEngineInspector() const noexcept
Create a new engine inspector which prints the layer information in an engine or an execution context...
Definition: NvInferRuntime.h:3565

nvinfer1::ICudaEngine::getTensorBytesPerComponent
int32_t getTensorBytesPerComponent(char const *tensorName, int32_t profileIndex) const noexcept
Return the number of bytes per component of an element of given profile, or -1 if the tensor is...
Definition: NvInferRuntime.h:3247

nvinfer1::ICudaEngine::getHardwareCompatibilityLevel
HardwareCompatibilityLevel getHardwareCompatibilityLevel() const noexcept
Return the hardware compatibility level of this engine.
Definition: NvInferRuntime.h:3601

nvinfer1::ICudaEngine::getNbOptimizationProfiles
int32_t getNbOptimizationProfiles() const noexcept
Get the number of optimization profiles defined for this engine.
Definition: NvInferRuntime.h:3421

nvinfer1::ICudaEngine::createExecutionContextWithoutDeviceMemory
TRT_DEPRECATED IExecutionContext * createExecutionContextWithoutDeviceMemory() noexcept
Create an execution context without any device memory allocated.
Definition: NvInferRuntime.h:3142

nvinfer1::ICudaEngine::getTensorFormatDesc
char const * getTensorFormatDesc(char const *tensorName, int32_t profileIndex) const noexcept
Return the human readable description of the tensor format of given profile, or empty string if the p...
Definition: NvInferRuntime.h:3362

nvinfer1::ICudaEngine::getMinimumWeightStreamingBudget
TRT_DEPRECATED int64_t getMinimumWeightStreamingBudget() const noexcept
The minimum number of bytes of GPU memory required by network weights for successful weight streaming...
Definition: NvInferRuntime.h:3730

nvinfer1::ICudaEngine::getTensorIOMode
TensorIOMode getTensorIOMode(char const *tensorName) const noexcept
Determine whether a tensor is an input or output tensor.
Definition: NvInferRuntime.h:3130

nvinfer1::ICudaEngine::getNbLayers
int32_t getNbLayers() const noexcept
Get the number of layers in the network.
Definition: NvInferRuntime.h:3047

nvinfer1::ICudaEngine::getNbIOTensors
int32_t getNbIOTensors() const noexcept
Return number of IO tensors.
Definition: NvInferRuntime.h:3578

nvinfer1::ICudaEngine::getTensorComponentsPerElement
int32_t getTensorComponentsPerElement(char const *tensorName) const noexcept
Return the number of components included in one element, or -1 if tensor is not vectorized or if the ...
Definition: NvInferRuntime.h:3268

nvinfer1::ICudaEngine::isRefittable
bool isRefittable() const noexcept
Return true if an engine can be refit.
Definition: NvInferRuntime.h:3208

nvinfer1::IDimensionExpr
An IDimensionExpr represents an integer expression constructed from constants, input dimensions,...
Definition: NvInferRuntime.h:232

nvinfer1::IDimensionExpr::isConstant
bool isConstant() const noexcept
Return true if expression is a build-time constant.
Definition: NvInferRuntime.h:237

nvinfer1::IDimensionExpr::isSizeTensor
bool isSizeTensor() const noexcept
Return true if this denotes the value of a size tensor.
Definition: NvInferRuntime.h:263

nvinfer1::IDimensionExpr::~IDimensionExpr
virtual ~IDimensionExpr() noexcept=default

nvinfer1::IDimensionExpr::mImpl
apiv::VDimensionExpr * mImpl
Definition: NvInferRuntime.h:254

nvinfer1::IDimensionExpr::getConstantValue
int64_t getConstantValue() const noexcept
Get the value of the constant.
Definition: NvInferRuntime.h:248

nvinfer1::IEngineInspector
An engine inspector which prints out the layer information of an engine or an execution context.
Definition: NvInferRuntime.h:4932

nvinfer1::IEngineInspector::getLayerInformation
char const * getLayerInformation(int32_t layerIndex, LayerInformationFormat format) const noexcept
Get a string describing the information about a specific layer in the current engine or the execution...
Definition: NvInferRuntime.h:4985

nvinfer1::IEngineInspector::getErrorRecorder
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:5042

nvinfer1::IEngineInspector::setErrorRecorder
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:5027

nvinfer1::IEngineInspector::getExecutionContext
IExecutionContext const * getExecutionContext() const noexcept
Get the context currently being inspected.
Definition: NvInferRuntime.h:4960

nvinfer1::IEngineInspector::mImpl
apiv::VEngineInspector * mImpl
Definition: NvInferRuntime.h:5048

nvinfer1::IEngineInspector::~IEngineInspector
virtual ~IEngineInspector() noexcept=default

nvinfer1::IEngineInspector::getEngineInformation
char const * getEngineInformation(LayerInformationFormat format) const noexcept
Get a string describing the information about all the layers in the current engine or the execution c...
Definition: NvInferRuntime.h:5008

nvinfer1::IExecutionContext
Context for executing inference using an engine, with functionally unsafe features.
Definition: NvInferRuntime.h:4021

nvinfer1::IExecutionContext::getOutputAllocator
IOutputAllocator * getOutputAllocator(char const *tensorName) const noexcept
Get output allocator associated with output tensor of given name, or nullptr if the provided name doe...
Definition: NvInferRuntime.h:4656

nvinfer1::IExecutionContext::getErrorRecorder
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:4304

nvinfer1::IExecutionContext::reportToProfiler
bool reportToProfiler() const noexcept
Calculate layer timing info for the current optimization profile in IExecutionContext and update the ...
Definition: NvInferRuntime.h:4423

nvinfer1::IExecutionContext::~IExecutionContext
virtual ~IExecutionContext() noexcept=default

nvinfer1::IExecutionContext::setDeviceMemory
void setDeviceMemory(void *memory) noexcept
Set the device memory for use by this execution context.
Definition: NvInferRuntime.h:4124

nvinfer1::IExecutionContext::allInputShapesSpecified
TRT_DEPRECATED bool allInputShapesSpecified() const noexcept
Whether all input shape bindings have been specified.
Definition: NvInferRuntime.h:4270

nvinfer1::IExecutionContext::setTensorDebugState
bool setTensorDebugState(char const *name, bool flag) noexcept
Set debug state of tensor given the tensor name.
Definition: NvInferRuntime.h:4863

nvinfer1::IExecutionContext::getName
char const * getName() const noexcept
Return the name of the execution context.
Definition: NvInferRuntime.h:4097

nvinfer1::IExecutionContext::getTemporaryStorageAllocator
IGpuAllocator * getTemporaryStorageAllocator() const noexcept
Get allocator set by setTemporaryStorageAllocator.
Definition: NvInferRuntime.h:4704

nvinfer1::IExecutionContext::setEnqueueEmitsProfile
void setEnqueueEmitsProfile(bool enqueueEmitsProfile) noexcept
Set whether enqueue emits layer timing to the profiler.
Definition: NvInferRuntime.h:4381

nvinfer1::IExecutionContext::getTensorShape
Dims getTensorShape(char const *tensorName) const noexcept
Return the shape of the given input or output.
Definition: NvInferRuntime.h:4237

nvinfer1::IExecutionContext::getDebugState
bool getDebugState(char const *name) const noexcept
Definition: NvInferRuntime.h:4886

nvinfer1::IExecutionContext::setInputShape
bool setInputShape(char const *tensorName, Dims const &dims) noexcept
Set shape of given input.
Definition: NvInferRuntime.h:4200

nvinfer1::IExecutionContext::executeV2
bool executeV2(void *const *bindings) noexcept
Synchronously execute a network.
Definition: NvInferRuntime.h:4321

nvinfer1::IExecutionContext::getEnqueueEmitsProfile
bool getEnqueueEmitsProfile() const noexcept
Get the enqueueEmitsProfile state.
Definition: NvInferRuntime.h:4393

nvinfer1::IExecutionContext::getTensorAddress
void const * getTensorAddress(char const *tensorName) const noexcept
Get memory address bound to given input or output tensor, or nullptr if the provided name does not ma...
Definition: NvInferRuntime.h:4484

nvinfer1::IExecutionContext::setOutputAllocator
bool setOutputAllocator(char const *tensorName, IOutputAllocator *outputAllocator) noexcept
Set output allocator to use for output tensor of given name. Pass nullptr to outputAllocator to unset...
Definition: NvInferRuntime.h:4643

nvinfer1::IExecutionContext::setOptimizationProfileAsync
bool setOptimizationProfileAsync(int32_t profileIndex, cudaStream_t stream) noexcept
Select an optimization profile for the current context with async semantics.
Definition: NvInferRuntime.h:4365

nvinfer1::IExecutionContext::mImpl
apiv::VExecutionContext * mImpl
Definition: NvInferRuntime.h:4892

nvinfer1::IExecutionContext::setOutputTensorAddress
bool setOutputTensorAddress(char const *tensorName, void *data) noexcept
Set the memory address for a given output tensor.
Definition: NvInferRuntime.h:4507

nvinfer1::IExecutionContext::setPersistentCacheLimit
void setPersistentCacheLimit(size_t size) noexcept
Set the maximum size for persistent cache usage.
Definition: NvInferRuntime.h:4744

nvinfer1::IExecutionContext::getPersistentCacheLimit
size_t getPersistentCacheLimit() const noexcept
Get the maximum size for persistent cache usage.
Definition: NvInferRuntime.h:4755

nvinfer1::IExecutionContext::setAllTensorsDebugState
bool setAllTensorsDebugState(bool flag) noexcept
Definition: NvInferRuntime.h:4876

nvinfer1::IExecutionContext::getEngine
ICudaEngine const & getEngine() const noexcept
Get the associated engine.
Definition: NvInferRuntime.h:4073

nvinfer1::IExecutionContext::getNvtxVerbosity
ProfilingVerbosity getNvtxVerbosity() const noexcept
Get the NVTX verbosity of the execution context.
Definition: NvInferRuntime.h:4791

nvinfer1::IExecutionContext::updateDeviceMemorySizeForShapes
size_t updateDeviceMemorySizeForShapes() noexcept
Recompute the internal activation buffer sizes based on the current input shapes, and return the tota...
Definition: NvInferRuntime.h:4598

nvinfer1::IExecutionContext::setAuxStreams
void setAuxStreams(cudaStream_t *auxStreams, int32_t nbStreams) noexcept
Set the auxiliary streams that TensorRT should launch kernels on in the next enqueueV3() call.
Definition: NvInferRuntime.h:4822

nvinfer1::IExecutionContext::getMaxOutputSize
int64_t getMaxOutputSize(char const *tensorName) const noexcept
Get upper bound on an output tensor's size, in bytes, based on the current optimization profile and i...
Definition: NvInferRuntime.h:4674

nvinfer1::IExecutionContext::inferShapes
int32_t inferShapes(int32_t nbMaxNames, char const **tensorNames) noexcept
Run shape calculations.
Definition: NvInferRuntime.h:4581

nvinfer1::IExecutionContext::setDebugListener
bool setDebugListener(IDebugListener *listener) noexcept
Set DebugListener for this execution context.
Definition: NvInferRuntime.h:4834

nvinfer1::IExecutionContext::setTensorAddress
bool setTensorAddress(char const *tensorName, void *data) noexcept
Set memory address for given input or output tensor.
Definition: NvInferRuntime.h:4467

nvinfer1::IExecutionContext::setTemporaryStorageAllocator
bool setTemporaryStorageAllocator(IGpuAllocator *allocator) noexcept
Specify allocator to use for internal temporary storage.
Definition: NvInferRuntime.h:4694

nvinfer1::IExecutionContext::getOutputTensorAddress
void * getOutputTensorAddress(char const *tensorName) const noexcept
Get memory address for given output.
Definition: NvInferRuntime.h:4548

nvinfer1::IExecutionContext::enqueueV3
bool enqueueV3(cudaStream_t stream) noexcept
Enqueue inference on a stream.
Definition: NvInferRuntime.h:4728

nvinfer1::IExecutionContext::getDebugListener
IDebugListener * getDebugListener() noexcept
Get the DebugListener of this execution context.
Definition: NvInferRuntime.h:4844

nvinfer1::IExecutionContext::getOptimizationProfile
int32_t getOptimizationProfile() const noexcept
Get the index of the currently selected optimization profile.
Definition: NvInferRuntime.h:4182

nvinfer1::IExecutionContext::setInputTensorAddress
bool setInputTensorAddress(char const *tensorName, void const *data) noexcept
Set memory address for given input.
Definition: NvInferRuntime.h:4529

nvinfer1::IExecutionContext::getDebugSync
bool getDebugSync() const noexcept
Get the debug sync flag.
Definition: NvInferRuntime.h:4043

nvinfer1::IExecutionContext::setInputConsumedEvent
bool setInputConsumedEvent(cudaEvent_t event) noexcept
Mark input as consumed.
Definition: NvInferRuntime.h:4614

nvinfer1::IExecutionContext::getTensorStrides
Dims getTensorStrides(char const *tensorName) const noexcept
Return the strides of the buffer for the given tensor name.
Definition: NvInferRuntime.h:4167

nvinfer1::IExecutionContext::setNvtxVerbosity
bool setNvtxVerbosity(ProfilingVerbosity verbosity) noexcept
Set the verbosity of the NVTX markers in the execution context.
Definition: NvInferRuntime.h:4779

nvinfer1::IExecutionContext::getProfiler
IProfiler * getProfiler() const noexcept
Get the profiler.
Definition: NvInferRuntime.h:4063

nvinfer1::IExecutionContext::setErrorRecorder
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:4289

nvinfer1::IExecutionContext::setDeviceMemoryV2
void setDeviceMemoryV2(void *memory, int64_t size) noexcept
Set the device memory and its corresponding size for use by this execution context.
Definition: NvInferRuntime.h:4146

nvinfer1::IExecutionContext::allInputDimensionsSpecified
bool allInputDimensionsSpecified() const noexcept
Whether all dynamic dimensions of input tensors have been specified.
Definition: NvInferRuntime.h:4253

nvinfer1::IExecutionContext::setProfiler
void setProfiler(IProfiler *profiler) noexcept
Set the profiler.
Definition: NvInferRuntime.h:4053

nvinfer1::IExecutionContext::setName
void setName(char const *name) noexcept
Set the name of the execution context.
Definition: NvInferRuntime.h:4087

nvinfer1::IExecutionContext::getInputConsumedEvent
cudaEvent_t getInputConsumedEvent() const noexcept
The event associated with consuming the input.
Definition: NvInferRuntime.h:4624

nvinfer1::IExprBuilder
Object for constructing IDimensionExpr.
Definition: NvInferRuntime.h:287

nvinfer1::IExprBuilder::operation
IDimensionExpr const * operation(DimensionOperation op, IDimensionExpr const &first, IDimensionExpr const &second) noexcept
Get the operation.
Definition: NvInferRuntime.h:303

nvinfer1::IExprBuilder::~IExprBuilder
virtual ~IExprBuilder() noexcept=default

nvinfer1::IExprBuilder::constant
IDimensionExpr const * constant(int64_t value) noexcept
Return pointer to IDimensionExpr for given value.
Definition: NvInferRuntime.h:292

nvinfer1::IExprBuilder::mImpl
apiv::VExprBuilder * mImpl
Definition: NvInferRuntime.h:310

nvinfer1::IExprBuilder::declareSizeTensor
IDimensionExpr const * declareSizeTensor(int32_t outputIndex, IDimensionExpr const &opt, IDimensionExpr const &upper)
Declare a size tensor at the given output index, with the specified auto-tuning formula and upper bou...
Definition: NvInferRuntime.h:338

nvinfer1::IHostMemory
Class to handle library allocated memory that is accessible to the user.
Definition: NvInferRuntime.h:142

nvinfer1::IHostMemory::data
void * data() const noexcept
A pointer to the raw data that is owned by the library.
Definition: NvInferRuntime.h:147

nvinfer1::IHostMemory::type
DataType type() const noexcept
The type of the memory that was allocated.
Definition: NvInferRuntime.h:159

nvinfer1::IHostMemory::size
std::size_t size() const noexcept
The size in bytes of the data that was allocated.
Definition: NvInferRuntime.h:153

nvinfer1::IHostMemory::mImpl
apiv::VHostMemory * mImpl
Definition: NvInferRuntime.h:165

nvinfer1::IHostMemory::~IHostMemory
virtual ~IHostMemory() noexcept=default

nvinfer1::ILoggerFinder
A virtual base class to find a logger. Allows a plugin to find an instance of a logger if it needs to...
Definition: NvInferRuntime.h:5146

nvinfer1::ILoggerFinder::findLogger
virtual ILogger * findLogger()=0
Get the logger used by the engine or execution context which called the plugin method.

nvinfer1::ILoggerFinder::~ILoggerFinder
virtual ~ILoggerFinder()=default

nvinfer1::ILogger
Application-implemented logging interface for the builder, refitter and runtime.
Definition: NvInferRuntime.h:1542

nvinfer1::ILogger::ILogger
ILogger()=default

nvinfer1::ILogger::~ILogger
virtual ~ILogger()=default

nvinfer1::ILogger::Severity
Severity
The severity corresponding to a log message.
Definition: NvInferRuntime.h:1550

nvinfer1::ILogger::log
virtual void log(Severity severity, AsciiChar const *msg) noexcept=0
A callback implemented by the application to handle logging messages.

nvinfer1::INoCopy
Base class that deletes its copy and move constructors and assignment operators, so derived interfaces cannot be copied or moved.
Definition: NvInferRuntime.h:51

nvinfer1::INoCopy::operator=
INoCopy & operator=(INoCopy &&other)=delete

nvinfer1::INoCopy::INoCopy
INoCopy(INoCopy const &other)=delete

nvinfer1::INoCopy::INoCopy
INoCopy(INoCopy &&other)=delete

nvinfer1::INoCopy::INoCopy
INoCopy()=default

nvinfer1::INoCopy::~INoCopy
virtual ~INoCopy()=default

nvinfer1::INoCopy::operator=
INoCopy & operator=(INoCopy const &other)=delete

nvinfer1::IOptimizationProfile
Optimization profile for dynamic input dimensions and shape tensors.
Definition: NvInferRuntime.h:2618

nvinfer1::IOptimizationProfile::getShapeValues
int32_t const * getShapeValues(char const *inputName, OptProfileSelector select) const noexcept
Get the minimum / optimum / maximum values for an input shape tensor.
Definition: NvInferRuntime.h:2732

nvinfer1::IOptimizationProfile::mImpl
apiv::VOptimizationProfile * mImpl
Definition: NvInferRuntime.h:2785

nvinfer1::IOptimizationProfile::getDimensions
Dims getDimensions(char const *inputName, OptProfileSelector select) const noexcept
Get the minimum / optimum / maximum dimensions for a dynamic input tensor.
Definition: NvInferRuntime.h:2659

nvinfer1::IOptimizationProfile::~IOptimizationProfile
virtual ~IOptimizationProfile() noexcept=default

nvinfer1::IOptimizationProfile::getExtraMemoryTarget
float getExtraMemoryTarget() const noexcept
Get the extra memory target that has been defined for this profile.
Definition: NvInferRuntime.h:2762

nvinfer1::IOptimizationProfile::setExtraMemoryTarget
bool setExtraMemoryTarget(float target) noexcept
Set a target for extra GPU memory that may be used by this profile.
Definition: NvInferRuntime.h:2750

nvinfer1::IOptimizationProfile::setDimensions
bool setDimensions(char const *inputName, OptProfileSelector select, Dims const &dims) noexcept
Set the minimum / optimum / maximum dimensions for a dynamic input tensor.
Definition: NvInferRuntime.h:2647

nvinfer1::IOptimizationProfile::setShapeValues
bool setShapeValues(char const *inputName, OptProfileSelector select, int32_t const *values, int32_t nbValues) noexcept
Set the minimum / optimum / maximum values for an input shape tensor.
Definition: NvInferRuntime.h:2706

nvinfer1::IOptimizationProfile::isValid
bool isValid() const noexcept
Check whether the optimization profile can be passed to an IBuilderConfig object.
Definition: NvInferRuntime.h:2779

nvinfer1::IOptimizationProfile::getNbShapeValues
int32_t getNbShapeValues(char const *inputName) const noexcept
Get the number of values for an input shape tensor.
Definition: NvInferRuntime.h:2720

nvinfer1::IPluginRegistry
Single registration point for all plugins in an application. It is used to find plugin implementation...
Definition: NvInferRuntimeCommon.h:56

nvinfer1::IPluginRegistry::registerCreator
virtual TRT_DEPRECATED bool registerCreator(IPluginCreator &creator, AsciiChar const *const pluginNamespace) noexcept=0
Register a plugin creator implementing IPluginCreator. Returns false if any plugin creator with the s...

nvinfer1::IPluginResourceContext
Interface for plugins to access per context resources provided by TensorRT.
Definition: NvInferRuntime.h:767

nvinfer1::IPluginResourceContext::getErrorRecorder
virtual IErrorRecorder * getErrorRecorder() const noexcept=0
Get the error recorder associated with the resource context.

nvinfer1::IPluginResourceContext::operator=
IPluginResourceContext & operator=(IPluginResourceContext const &) &=default

nvinfer1::IPluginResourceContext::getGpuAllocator
virtual IGpuAllocator * getGpuAllocator() const noexcept=0
Get the GPU allocator associated with the resource context.

nvinfer1::IPluginV2DynamicExt
Similar to IPluginV2Ext, but with support for dynamic shapes.
Definition: NvInferRuntime.h:407

nvinfer1::IPluginV2DynamicExt::clone
IPluginV2DynamicExt * clone() const noexcept override=0
Clone the plugin object. This copies over internal plugin parameters as well and returns a new plugin...

nvinfer1::IPluginV2DynamicExt::~IPluginV2DynamicExt
virtual ~IPluginV2DynamicExt() noexcept
Definition: NvInferRuntime.h:558

nvinfer1::IPluginV2Ext
Plugin class for user-implemented layers.
Definition: NvInferRuntimePlugin.h:474

nvinfer1::IRefitter
Updates weights in an engine.
Definition: NvInferRuntime.h:2138

nvinfer1::IRefitter::refitCudaEngineAsync
bool refitCudaEngineAsync(cudaStream_t stream) noexcept
Enqueue weights refitting of the associated engine on the given stream.
Definition: NvInferRuntime.h:2540

nvinfer1::IRefitter::getMaxThreads
int32_t getMaxThreads() const noexcept
Get the maximum number of threads that can be used by the refitter.
Definition: NvInferRuntime.h:2419

nvinfer1::IRefitter::getWeightsLocation
TensorLocation getWeightsLocation(char const *weightsName) const noexcept
Get location for the weights associated with the given name.
Definition: NvInferRuntime.h:2478

nvinfer1::IRefitter::setNamedWeights
bool setNamedWeights(char const *name, Weights weights) noexcept
Specify new weights of given name.
Definition: NvInferRuntime.h:2343

nvinfer1::IRefitter::getAllWeights
int32_t getAllWeights(int32_t size, char const **weightsNames) noexcept
Get names of all weights that could be refit.
Definition: NvInferRuntime.h:2379

nvinfer1::IRefitter::getLogger
ILogger * getLogger() const noexcept
Get the logger with which the refitter was created.
Definition: NvInferRuntime.h:2389

nvinfer1::IRefitter::refitCudaEngine
bool refitCudaEngine() noexcept
Refits associated engine.
Definition: NvInferRuntime.h:2174

nvinfer1::IRefitter::getMissingWeights
int32_t getMissingWeights(int32_t size, char const **weightsNames) noexcept
Get names of missing weights.
Definition: NvInferRuntime.h:2363

nvinfer1::IRefitter::getDynamicRangeMax
TRT_DEPRECATED float getDynamicRangeMax(char const *tensorName) const noexcept
Get maximum of dynamic range.
Definition: NvInferRuntime.h:2266

nvinfer1::IRefitter::getMissing
int32_t getMissing(int32_t size, char const **layerNames, WeightsRole *roles) noexcept
Get description of missing weights.
Definition: NvInferRuntime.h:2195

nvinfer1::IRefitter::getNamedWeights
Weights getNamedWeights(char const *weightsName) const noexcept
Get weights associated with the given name.
Definition: NvInferRuntime.h:2462

nvinfer1::IRefitter::unsetNamedWeights
bool unsetNamedWeights(char const *weightsName) noexcept
Unset weights associated with the given name.
Definition: NvInferRuntime.h:2494

nvinfer1::IRefitter::getWeightsPrototype
Weights getWeightsPrototype(char const *weightsName) const noexcept
Get the Weights prototype associated with the given name.
Definition: NvInferRuntime.h:2558

nvinfer1::IRefitter::setMaxThreads
bool setMaxThreads(int32_t maxThreads) noexcept
Set the maximum number of threads.
Definition: NvInferRuntime.h:2405

nvinfer1::IRefitter::getDynamicRangeMin
TRT_DEPRECATED float getDynamicRangeMin(char const *tensorName) const noexcept
Get minimum of dynamic range.
Definition: NvInferRuntime.h:2250

nvinfer1::IRefitter::getTensorsWithDynamicRange
TRT_DEPRECATED int32_t getTensorsWithDynamicRange(int32_t size, char const **tensorNames) const noexcept
Get names of all tensors that have refittable dynamic ranges.
Definition: NvInferRuntime.h:2284

nvinfer1::IRefitter::setNamedWeights
bool setNamedWeights(char const *name, Weights weights, TensorLocation location) noexcept
Specify new weights on a specified device of given name.
Definition: NvInferRuntime.h:2446

nvinfer1::IRefitter::setWeightsValidation
void setWeightsValidation(bool weightsValidation) noexcept
Set whether to validate weights during refitting.
Definition: NvInferRuntime.h:2510

nvinfer1::IRefitter::setDynamicRange
TRT_DEPRECATED bool setDynamicRange(char const *tensorName, float min, float max) noexcept
Definition: NvInferRuntime.h:2234

nvinfer1::IRefitter::mImpl
apiv::VRefitter * mImpl
Definition: NvInferRuntime.h:2564

nvinfer1::IRefitter::getAll
int32_t getAll(int32_t size, char const **layerNames, WeightsRole *roles) noexcept
Get description of all weights that could be refit.
Definition: NvInferRuntime.h:2212

nvinfer1::IRefitter::~IRefitter
virtual ~IRefitter() noexcept=default

nvinfer1::IRefitter::getWeightsValidation
bool getWeightsValidation() const noexcept
Get whether to validate weights values during refitting.
Definition: NvInferRuntime.h:2518

nvinfer1::IRefitter::setErrorRecorder
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:2303

nvinfer1::IRefitter::getErrorRecorder
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:2318

nvinfer1::IRuntime
Allows a serialized functionally unsafe engine to be deserialized.
Definition: NvInferRuntime.h:1819

nvinfer1::IRuntime::setMaxThreads
bool setMaxThreads(int32_t maxThreads) noexcept
Set the maximum number of threads.
Definition: NvInferRuntime.h:1983

nvinfer1::IRuntime::loadRuntime
IRuntime * loadRuntime(char const *path) noexcept
Load IRuntime from the file.
Definition: NvInferRuntime.h:2099

nvinfer1::IRuntime::getEngineHostCodeAllowed
bool getEngineHostCodeAllowed() const noexcept
Get whether the runtime is allowed to deserialize engines with host executable code.
Definition: NvInferRuntime.h:2121

nvinfer1::IRuntime::getTempfileControlFlags
TempfileControlFlags getTempfileControlFlags() const noexcept
Get the tempfile control flags for this runtime.
Definition: NvInferRuntime.h:2071

nvinfer1::IRuntime::setEngineHostCodeAllowed
void setEngineHostCodeAllowed(bool allowed) noexcept
Set whether the runtime is allowed to deserialize engines with host executable code.
Definition: NvInferRuntime.h:2111

nvinfer1::IRuntime::~IRuntime
virtual ~IRuntime() noexcept=default

nvinfer1::IRuntime::setTemporaryDirectory
void setTemporaryDirectory(char const *path) noexcept
Set the directory that will be used by this runtime for temporary files.
Definition: NvInferRuntime.h:2032

nvinfer1::IRuntime::getPluginRegistry
IPluginRegistry & getPluginRegistry() noexcept
Get the local plugin registry that can be used by the runtime.
Definition: NvInferRuntime.h:2081

nvinfer1::IRuntime::mImpl
apiv::VRuntime * mImpl
Definition: NvInferRuntime.h:2127

nvinfer1::IRuntime::getNbDLACores
int32_t getNbDLACores() const noexcept
Returns number of DLA hardware cores accessible or 0 if DLA is unavailable.
Definition: NvInferRuntime.h:1852

nvinfer1::IRuntime::deserializeCudaEngine
ICudaEngine * deserializeCudaEngine(void const *blob, std::size_t size) noexcept
Deserialize an engine from host memory.
Definition: NvInferRuntime.h:1917

nvinfer1::IRuntime::setTempfileControlFlags
void setTempfileControlFlags(TempfileControlFlags flags) noexcept
Set the tempfile control flags for this runtime.
Definition: NvInferRuntime.h:2059

nvinfer1::IRuntime::getDLACore
int32_t getDLACore() const noexcept
Get the DLA core that the engine executes on.
Definition: NvInferRuntime.h:1844

nvinfer1::IRuntime::setGpuAllocator
void setGpuAllocator(IGpuAllocator *allocator) noexcept
Set the GPU allocator.
Definition: NvInferRuntime.h:1868

nvinfer1::IRuntime::getErrorRecorder
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:1902

nvinfer1::IRuntime::deserializeCudaEngine
ICudaEngine * deserializeCudaEngine(IStreamReaderV2 &streamReader)
Deserialize an engine from a stream. IStreamReaderV2 is expected to support reading to both host and ...
Definition: NvInferRuntime.h:1958

nvinfer1::IRuntime::getLogger
ILogger * getLogger() const noexcept
Get the logger with which the runtime was created.
Definition: NvInferRuntime.h:1968

nvinfer1::IRuntime::getMaxThreads
int32_t getMaxThreads() const noexcept
Get the maximum number of threads that can be used by the runtime.
Definition: NvInferRuntime.h:1997

nvinfer1::IRuntime::getTemporaryDirectory
char const * getTemporaryDirectory() const noexcept
Get the directory that will be used by this runtime for temporary files.
Definition: NvInferRuntime.h:2043

nvinfer1::IRuntime::deserializeCudaEngine
TRT_DEPRECATED ICudaEngine * deserializeCudaEngine(IStreamReader &streamReader)
Deserialize an engine from a stream.
Definition: NvInferRuntime.h:1938

nvinfer1::IRuntime::setErrorRecorder
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:1887

nvinfer1::ISerializationConfig
Holds properties for configuring an engine to serialize the binary.
Definition: NvInferRuntime.h:2895

nvinfer1::ISerializationConfig::~ISerializationConfig
virtual ~ISerializationConfig() noexcept=default

nvinfer1::ISerializationConfig::clearFlag
bool clearFlag(SerializationFlag serializationFlag) noexcept
Clear a serialization flag.
Definition: NvInferRuntime.h:2934

nvinfer1::ISerializationConfig::setFlag
bool setFlag(SerializationFlag serializationFlag) noexcept
Set a serialization flag.
Definition: NvInferRuntime.h:2946

nvinfer1::ISerializationConfig::getFlags
SerializationFlags getFlags() const noexcept
Get the serialization flags for this config.
Definition: NvInferRuntime.h:2922

nvinfer1::ISerializationConfig::getFlag
bool getFlag(SerializationFlag serializationFlag) const noexcept
Returns true if the serialization flag is set.
Definition: NvInferRuntime.h:2958

nvinfer1::ISerializationConfig::mImpl
apiv::VSerializationConfig * mImpl
Definition: NvInferRuntime.h:2964

nvinfer1::IVersionedInterface
An Interface class for version control.
Definition: NvInferRuntimeBase.h:260

nvinfer1::InterfaceInfo
Version information associated with a TRT interface.
Definition: NvInferRuntimeBase.h:225

nvinfer1::PluginRegistrar
Register the plugin creator to the registry. The static registry object will be instantiated when the ...
Definition: NvInferRuntime.h:5118

nvinfer1::PluginRegistrar::PluginRegistrar
PluginRegistrar()
Definition: NvInferRuntime.h:5120

nvinfer1::Weights
An array of weights used as a layer parameter.
Definition: NvInferRuntime.h:124

nvinfer1::Weights::type
DataType type
The type of the weights.
Definition: NvInferRuntime.h:126

nvinfer1::Weights::count
int64_t count
The number of weights in the array.
Definition: NvInferRuntime.h:128

nvinfer1::Weights::values
void const  * values
The weight values, in a contiguous array.
Definition: NvInferRuntime.h:127

nvinfer1::v_1_0::IDebugListener
Definition: NvInferRuntime.h:3972

nvinfer1::v_1_0::IDebugListener::processDebugTensor
virtual bool processDebugTensor(void const *addr, TensorLocation location, DataType type, Dims const &shape, char const *name, cudaStream_t stream)=0
Callback function that is called when a debug tensor’s value is updated and the debug state of the te...

nvinfer1::v_1_0::IDebugListener::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:3977

nvinfer1::v_1_0::IDebugListener::~IDebugListener
~IDebugListener() override=default

nvinfer1::v_1_0::IErrorRecorder
Definition: NvInferRuntimeBase.h:397

nvinfer1::v_1_0::IGpuAllocator
Definition: NvInferRuntime.h:1610

nvinfer1::v_1_0::IGpuAllocator::allocateAsync
virtual void * allocateAsync(uint64_t const size, uint64_t const alignment, AllocatorFlags const flags, cudaStream_t) noexcept
A thread-safe callback implemented by the application to handle stream-ordered acquisition of GPU mem...
Definition: NvInferRuntime.h:1732

nvinfer1::v_1_0::IGpuAllocator::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:1773

nvinfer1::v_1_0::IGpuAllocator::deallocate
virtual TRT_DEPRECATED bool deallocate(void *const memory) noexcept=0
A thread-safe callback implemented by the application to handle release of GPU memory.

nvinfer1::v_1_0::IGpuAllocator::~IGpuAllocator
~IGpuAllocator() override=default

nvinfer1::v_1_0::IGpuAllocator::IGpuAllocator
IGpuAllocator()=default

nvinfer1::v_1_0::IGpuAllocator::reallocate
virtual void * reallocate(void *const, uint64_t, uint64_t) noexcept
A thread-safe callback implemented by the application to resize an existing allocation.
Definition: NvInferRuntime.h:1679

nvinfer1::v_1_0::IGpuAllocator::allocate
virtual TRT_DEPRECATED void * allocate(uint64_t const size, uint64_t const alignment, AllocatorFlags const flags) noexcept=0
A thread-safe callback implemented by the application to handle acquisition of GPU memory.

nvinfer1::v_1_0::IGpuAllocator::deallocateAsync
virtual bool deallocateAsync(void *const memory, cudaStream_t) noexcept
A thread-safe callback implemented by the application to handle stream-ordered release of GPU memory.
Definition: NvInferRuntime.h:1765

nvinfer1::v_1_0::IGpuAsyncAllocator
Definition: NvInferRuntime.h:5167

nvinfer1::v_1_0::IGpuAsyncAllocator::deallocateAsync
bool deallocateAsync(void *const memory, cudaStream_t) noexcept override=0
A thread-safe callback implemented by the application to handle stream-ordered asynchronous release o...

nvinfer1::v_1_0::IGpuAsyncAllocator::IGpuAsyncAllocator
IGpuAsyncAllocator()=default

nvinfer1::v_1_0::IGpuAsyncAllocator::allocateAsync
void * allocateAsync(uint64_t const size, uint64_t const alignment, AllocatorFlags const flags, cudaStream_t) noexcept override=0
A thread-safe callback implemented by the application to handle stream-ordered asynchronous acquisiti...

nvinfer1::v_1_0::IGpuAsyncAllocator::allocate
TRT_DEPRECATED void * allocate(uint64_t const size, uint64_t const alignment, AllocatorFlags const flags) noexcept override
A thread-safe callback implemented by the application to handle acquisition of GPU memory.
Definition: NvInferRuntime.h:5253

nvinfer1::v_1_0::IGpuAsyncAllocator::deallocate
TRT_DEPRECATED bool deallocate(void *const memory) noexcept override
A thread-safe callback implemented by the application to handle release of GPU memory.
Definition: NvInferRuntime.h:5277

nvinfer1::v_1_0::IGpuAsyncAllocator::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:5285

nvinfer1::v_1_0::IGpuAsyncAllocator::~IGpuAsyncAllocator
~IGpuAsyncAllocator() override=default

nvinfer1::v_1_0::IOutputAllocator
Definition: NvInferRuntime.h:3885

nvinfer1::v_1_0::IOutputAllocator::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:3890

nvinfer1::v_1_0::IOutputAllocator::reallocateOutputAsync
virtual void * reallocateOutputAsync(char const *tensorName, void *currentMemory, uint64_t size, uint64_t alignment, cudaStream_t)
Return a pointer to memory for an output tensor, or nullptr if memory cannot be allocated....
Definition: NvInferRuntime.h:3942

nvinfer1::v_1_0::IOutputAllocator::notifyShape
virtual void notifyShape(char const *tensorName, Dims const &dims) noexcept=0
Called by TensorRT when the shape of the output tensor is known.

nvinfer1::v_1_0::IOutputAllocator::reallocateOutput
virtual TRT_DEPRECATED void * reallocateOutput(char const *tensorName, void *currentMemory, uint64_t size, uint64_t alignment) noexcept
Return a pointer to memory for an output tensor, or nullptr if memory cannot be allocated....
Definition: NvInferRuntime.h:3914

nvinfer1::v_1_0::IPluginCapability
Definition: NvInferPluginBase.h:141

nvinfer1::v_1_0::IPluginCreatorInterface
Definition: NvInferPluginBase.h:193

nvinfer1::v_1_0::IPluginCreatorV3One
Definition: NvInferRuntime.h:5292

nvinfer1::v_1_0::IPluginCreatorV3One::getFieldNames
virtual PluginFieldCollection const * getFieldNames() noexcept=0
Return a list of fields that need to be passed to createPlugin() when creating a plugin for use in th...

nvinfer1::v_1_0::IPluginCreatorV3One::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:5297

nvinfer1::v_1_0::IPluginCreatorV3One::createPlugin
virtual IPluginV3 * createPlugin(AsciiChar const *name, PluginFieldCollection const *fc, TensorRTPhase phase) noexcept=0
Return a plugin object. Return nullptr in case of error.

nvinfer1::v_1_0::IPluginV3
Definition: NvInferPluginBase.h:206

nvinfer1::v_1_0::IPluginV3OneBuild
Definition: NvInferRuntime.h:836

nvinfer1::v_1_0::IPluginV3OneBuild::getFormatCombinationLimit
virtual int32_t getFormatCombinationLimit() noexcept
Return the maximum number of format combinations that will be timed by TensorRT during the build phas...
Definition: NvInferRuntime.h:1040

nvinfer1::v_1_0::IPluginV3OneBuild::getNbOutputs
virtual int32_t getNbOutputs() const noexcept=0
Get the number of outputs from the plugin.

nvinfer1::v_1_0::IPluginV3OneBuild::configurePlugin
virtual int32_t configurePlugin(DynamicPluginTensorDesc const *in, int32_t nbInputs, DynamicPluginTensorDesc const *out, int32_t nbOutputs) noexcept=0
Configure the plugin.

nvinfer1::v_1_0::IPluginV3OneBuild::getNbTactics
virtual int32_t getNbTactics() noexcept
Query for the number of custom tactics the plugin intends to use.
Definition: NvInferRuntime.h:1016

nvinfer1::v_1_0::IPluginV3OneBuild::getMetadataString
virtual char const * getMetadataString() noexcept
Query for a string representing the configuration of the plugin. May be called anytime after plugin c...
Definition: NvInferRuntime.h:1051

nvinfer1::v_1_0::IPluginV3OneBuild::getTimingCacheID
virtual char const * getTimingCacheID() noexcept
Called to query the suffix to use for the timing cache ID. May be called anytime after plugin creatio...
Definition: NvInferRuntime.h:1032

nvinfer1::v_1_0::IPluginV3OneBuild::supportsFormatCombination
virtual bool supportsFormatCombination(int32_t pos, DynamicPluginTensorDesc const *inOut, int32_t nbInputs, int32_t nbOutputs) noexcept=0
Return true if plugin supports the format and datatype for the input/output indexed by pos.

nvinfer1::v_1_0::IPluginV3OneBuild::getOutputDataTypes
virtual int32_t getOutputDataTypes(DataType *outputTypes, int32_t nbOutputs, const DataType *inputTypes, int32_t nbInputs) const noexcept=0
Provide the data types of the plugin outputs if the input tensors have the data types provided.

nvinfer1::v_1_0::IPluginV3OneBuild::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:848

nvinfer1::v_1_0::IPluginV3OneBuild::getOutputShapes
virtual int32_t getOutputShapes(DimsExprs const *inputs, int32_t nbInputs, DimsExprs const *shapeInputs, int32_t nbShapeInputs, DimsExprs *outputs, int32_t nbOutputs, IExprBuilder &exprBuilder) noexcept=0
Provide expressions for computing dimensions of the output tensors from dimensions of the input tenso...

nvinfer1::v_1_0::IPluginV3OneBuild::getValidTactics
virtual int32_t getValidTactics(int32_t *tactics, int32_t nbTactics) noexcept
Query for any custom tactics that the plugin intends to use.
Definition: NvInferRuntime.h:1008

nvinfer1::v_1_0::IPluginV3OneCore
Definition: NvInferRuntime.h:793

nvinfer1::v_1_0::IPluginV3OneCore::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:798

nvinfer1::v_1_0::IPluginV3OneCore::getPluginName
virtual AsciiChar const * getPluginName() const noexcept=0
Return the plugin name. Should match the plugin name returned by the corresponding plugin creator.

nvinfer1::v_1_0::IPluginV3OneRuntime
Definition: NvInferRuntime.h:1058

nvinfer1::v_1_0::IPluginV3OneRuntime::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:1063

nvinfer1::v_1_0::IPluginV3OneRuntime::onShapeChange
virtual int32_t onShapeChange(PluginTensorDesc const *in, int32_t nbInputs, PluginTensorDesc const *out, int32_t nbOutputs) noexcept=0
Called when a plugin is being prepared for execution for specific dimensions. This could happen multi...

nvinfer1::v_1_0::IPluginV3OneRuntime::getFieldsToSerialize
virtual PluginFieldCollection const * getFieldsToSerialize() noexcept=0
Get the plugin fields which should be serialized.

nvinfer1::v_1_0::IPluginV3OneRuntime::setTactic
virtual int32_t setTactic(int32_t tactic) noexcept
Set the tactic to be used in the subsequent call to enqueue(). If no custom tactics were advertised,...
Definition: NvInferRuntime.h:1075

nvinfer1::v_1_0::IPluginV3OneRuntime::enqueue
virtual int32_t enqueue(PluginTensorDesc const *inputDesc, PluginTensorDesc const *outputDesc, void const *const *inputs, void *const *outputs, void *workspace, cudaStream_t stream) noexcept=0
Execute the layer.

nvinfer1::v_1_0::IPluginV3OneRuntime::attachToContext
virtual IPluginV3 * attachToContext(IPluginResourceContext *context) noexcept=0
Clone the plugin, attach the cloned plugin object to an execution context and grant the cloned plugin ...

nvinfer1::v_1_0::IProfiler
Definition: NvInferRuntime.h:1246

nvinfer1::v_1_0::IProfiler::~IProfiler
virtual ~IProfiler() noexcept
Definition: NvInferRuntime.h:1257

nvinfer1::v_1_0::IProfiler::reportLayerTime
virtual void reportLayerTime(char const *layerName, float ms) noexcept=0
Layer time reporting callback.

nvinfer1::v_1_0::IStreamReader
Definition: NvInferRuntime.h:631

nvinfer1::v_1_0::IStreamReader::~IStreamReader
~IStreamReader() override=default

nvinfer1::v_1_0::IStreamReader::operator=
IStreamReader & operator=(IStreamReader const &) &=default

nvinfer1::v_1_0::IStreamReader::operator=
IStreamReader & operator=(IStreamReader &&) &=default

nvinfer1::v_1_0::IStreamReader::read
virtual int64_t read(void *destination, int64_t nbBytes)=0
Read the next number of bytes in the stream.

nvinfer1::v_1_0::IStreamReader::IStreamReader
IStreamReader(IStreamReader &&)=default

nvinfer1::v_1_0::IStreamReader::IStreamReader
IStreamReader(IStreamReader const &)=default

nvinfer1::v_1_0::IStreamReader::IStreamReader
IStreamReader()=default

nvinfer1::v_1_0::IStreamReader::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:643

nvinfer1::v_1_0::IStreamReaderV2
Definition: NvInferRuntime.h:695

nvinfer1::v_1_0::IStreamReaderV2::operator=
IStreamReaderV2 & operator=(IStreamReaderV2 const &) &=default

nvinfer1::v_1_0::IStreamReaderV2::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:707

nvinfer1::v_1_0::IStreamReaderV2::IStreamReaderV2
IStreamReaderV2(IStreamReaderV2 &&)=default

nvinfer1::v_1_0::IStreamReaderV2::~IStreamReaderV2
~IStreamReaderV2() override=default

nvinfer1::v_1_0::IStreamReaderV2::read
virtual int64_t read(void *destination, int64_t nbBytes, cudaStream_t stream) noexcept=0
Read the next number of bytes in the stream asynchronously.

nvinfer1::v_1_0::IStreamReaderV2::IStreamReaderV2
IStreamReaderV2()=default

nvinfer1::v_1_0::IStreamReaderV2::IStreamReaderV2
IStreamReaderV2(IStreamReaderV2 const &)=default

nvinfer1::v_1_0::IStreamReaderV2::seek
virtual bool seek(int64_t offset, SeekPosition where) noexcept=0
Sets the position of the stream to the given offset.

nvinfer1::v_1_0::IStreamReaderV2::operator=
IStreamReaderV2 & operator=(IStreamReaderV2 &&) &=default

nvinfer1::v_2_0::IPluginV3OneBuild
Definition: NvInferRuntime.h:1155

nvinfer1::v_2_0::IPluginV3OneBuild::getAliasedInput
virtual int32_t getAliasedInput(int32_t outputIndex) noexcept
Communicates to TensorRT that the output at the specified output index is aliased to the input at the...
Definition: NvInferRuntime.h:1191

nvinfer1::v_2_0::IPluginV3OneBuild::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:1157

nvinfer1::anonymous_namespace{NvInferRuntime.h}::createInferRefitter
IRefitter * createInferRefitter(ICudaEngine &engine, ILogger &logger) noexcept
Create an instance of an IRefitter class.
Definition: NvInferRuntime.h:5098

nvinfer1::anonymous_namespace{NvInferRuntime.h}::createInferRuntime
IRuntime * createInferRuntime(ILogger &logger) noexcept
Create an instance of an IRuntime class.
Definition: NvInferRuntime.h:5087

nvinfer1
The TensorRT API version 1 namespace.

nvinfer1::ErrorCode::kINTERNAL_ERROR
@ kINTERNAL_ERROR

nvinfer1::TacticSources
uint32_t TacticSources
Represents a collection of one or more TacticSource values combined using bitwise-OR operations.
Definition: NvInferRuntime.h:2834

nvinfer1::IOutputAllocator
v_1_0::IOutputAllocator IOutputAllocator
Definition: NvInferRuntime.h:3967

nvinfer1::EngineCapability
EngineCapability
List of supported engine capability flows.
Definition: NvInferRuntime.h:76

nvinfer1::EngineCapability::kSAFETY
@ kSAFETY

nvinfer1::EngineCapability::kSTANDARD
@ kSTANDARD

nvinfer1::EngineCapability::kDLA_STANDALONE
@ kDLA_STANDALONE

nvinfer1::DimensionOperation
DimensionOperation
An operation on two IDimensionExpr, which represent integer expressions used in dimension computation...
Definition: NvInferRuntime.h:179

nvinfer1::DimensionOperation::kSUB
@ kSUB
Subtract the second element from the first.

nvinfer1::DimensionOperation::kSUM
@ kSUM
Sum of the two operands.

nvinfer1::DimensionOperation::kPROD
@ kPROD
Product of the two operands.

nvinfer1::DimensionOperation::kFLOOR_DIV
@ kFLOOR_DIV
Floor division of the first element by the second.

nvinfer1::DimensionOperation::kEQUAL
@ kEQUAL
1 if operands are equal, 0 otherwise.

nvinfer1::DimensionOperation::kMIN
@ kMIN
Minimum of the two operands.

nvinfer1::DimensionOperation::kLESS
@ kLESS
1 if first operand is less than second operand, 0 otherwise.

nvinfer1::DimensionOperation::kMAX
@ kMAX
Maximum of the two operands.

nvinfer1::DimensionOperation::kCEIL_DIV
@ kCEIL_DIV
Division rounding up.

nvinfer1::IPluginV3OneCore
v_1_0::IPluginV3OneCore IPluginV3OneCore
Definition: NvInferRuntime.h:1208

nvinfer1::TensorIOMode
TensorIOMode
Definition of tensor IO Mode.
Definition: NvInferRuntimeBase.h:640

nvinfer1::HardwareCompatibilityLevel
HardwareCompatibilityLevel
Describes requirements of compatibility with GPU architectures other than that of the GPU on which th...
Definition: NvInfer.h:9216

nvinfer1::SerializationFlag
SerializationFlag
List of valid flags that the engine can enable when serializing the bytes.
Definition: NvInferRuntime.h:2875

nvinfer1::SerializationFlag::kEXCLUDE_WEIGHTS
@ kEXCLUDE_WEIGHTS
Exclude the weights that can be refitted.

nvinfer1::IProfiler
v_1_0::IProfiler IProfiler
Definition: NvInferRuntime.h:1272

nvinfer1::SeekPosition
SeekPosition
Controls the seek mode of IStreamReaderV2.
Definition: NvInferRuntime.h:681

nvinfer1::SeekPosition::kSET
@ kSET
From the beginning of the file.

nvinfer1::SeekPosition::kCUR
@ kCUR
From the current position of the file.

nvinfer1::SeekPosition::kEND
@ kEND
From the tail of the file.

nvinfer1::IStreamReaderV2
v_1_0::IStreamReaderV2 IStreamReaderV2
Definition: NvInferRuntime.h:751

nvinfer1::TempfileControlFlags
uint32_t TempfileControlFlags
Represents a collection of one or more TempfileControlFlag values combined using bitwise-OR operation...
Definition: NvInferRuntime.h:1350

nvinfer1::IGpuAllocator
v_1_0::IGpuAllocator IGpuAllocator
Definition: NvInferRuntime.h:1809

nvinfer1::EnumMax< WeightsRole >
constexpr int32_t EnumMax< WeightsRole >() noexcept
Maximum number of elements in WeightsRole enum.
Definition: NvInferRuntime.h:1293

nvinfer1::AsciiChar
char_t AsciiChar
Definition: NvInferRuntimeBase.h:101

nvinfer1::TensorRTPhase
TensorRTPhase
Indicates a phase of operation of TensorRT.
Definition: NvInferPluginBase.h:116

nvinfer1::PluginVersion::kV2_DYNAMICEXT
@ kV2_DYNAMICEXT
IPluginV2DynamicExt.

nvinfer1::EnumMax< LayerInformationFormat >
constexpr int32_t EnumMax< LayerInformationFormat >() noexcept
Definition: NvInferRuntime.h:4911

nvinfer1::DataType
DataType
The type of weights and tensors.
Definition: NvInferRuntimeBase.h:129

nvinfer1::DeviceType
DeviceType
The device that this layer/network will execute on.
Definition: NvInferRuntime.h:1304

nvinfer1::DeviceType::kGPU
@ kGPU
GPU Device.

nvinfer1::DeviceType::kDLA
@ kDLA
DLA Core.

nvinfer1::LayerType::kSCALE
@ kSCALE
Scale layer.

nvinfer1::LayerType::kCONSTANT
@ kCONSTANT
Constant layer.

nvinfer1::IDebugListener
v_1_0::IDebugListener IDebugListener
Definition: NvInferRuntime.h:4008

nvinfer1::TempfileControlFlag
TempfileControlFlag
Flags used to control TensorRT's behavior when creating executable temporary files.
Definition: NvInferRuntime.h:1327

nvinfer1::TempfileControlFlag::kALLOW_TEMPORARY_FILES
@ kALLOW_TEMPORARY_FILES

nvinfer1::TempfileControlFlag::kALLOW_IN_MEMORY_FILES
@ kALLOW_IN_MEMORY_FILES
Allow creating and loading files in-memory (or unnamed files).

nvinfer1::EnumMax< OptProfileSelector >
constexpr int32_t EnumMax< OptProfileSelector >() noexcept
Number of different values of OptProfileSelector enum.
Definition: NvInferRuntime.h:2590

nvinfer1::WeightsRole
WeightsRole
How a layer uses particular Weights.
Definition: NvInferRuntime.h:1282

nvinfer1::WeightsRole::kSHIFT
@ kSHIFT
shift part of IScaleLayer

nvinfer1::WeightsRole::kANY
@ kANY
Any other weights role.

nvinfer1::WeightsRole::kBIAS
@ kBIAS
bias for IConvolutionLayer or IDeconvolutionLayer

nvinfer1::WeightsRole::kKERNEL
@ kKERNEL
kernel for IConvolutionLayer or IDeconvolutionLayer

nvinfer1::EnumMax< ProfilingVerbosity >
constexpr int32_t EnumMax< ProfilingVerbosity >() noexcept
Maximum number of profile verbosity levels in ProfilingVerbosity enum.
Definition: NvInferRuntime.h:2854

nvinfer1::ProfilingVerbosity
ProfilingVerbosity
List of verbosity levels of layer information exposed in NVTX annotations and in IEngineInspector.
Definition: NvInferRuntime.h:2846

nvinfer1::ProfilingVerbosity::kLAYER_NAMES_ONLY
@ kLAYER_NAMES_ONLY
Print only the layer names. This is the default setting.

nvinfer1::ProfilingVerbosity::kDETAILED
@ kDETAILED
Print detailed layer information including layer names and layer parameters.

nvinfer1::TacticSource
TacticSource
List of tactic sources for TensorRT.
Definition: NvInferRuntime.h:2797

nvinfer1::TacticSource::kCUBLAS_LT
@ kCUBLAS_LT

nvinfer1::TacticSource::kEDGE_MASK_CONVOLUTIONS
@ kEDGE_MASK_CONVOLUTIONS

nvinfer1::TacticSource::kCUDNN
@ kCUDNN

nvinfer1::TacticSource::kJIT_CONVOLUTIONS
@ kJIT_CONVOLUTIONS

nvinfer1::TacticSource::kCUBLAS
@ kCUBLAS

nvinfer1::PluginFormat
TensorFormat PluginFormat
PluginFormat is reserved for backward compatibility.
Definition: NvInferRuntimePlugin.h:54

nvinfer1::IPluginV3OneRuntime
v_1_0::IPluginV3OneRuntime IPluginV3OneRuntime
Definition: NvInferRuntime.h:1232

nvinfer1::ElementWiseOperation::kMIN
@ kMIN
Minimum of the two elements.

nvinfer1::EnumMax< TempfileControlFlag >
constexpr int32_t EnumMax< TempfileControlFlag >() noexcept
Maximum number of elements in TempfileControlFlag enum.
Definition: NvInferRuntime.h:1339

nvinfer1::SerializationFlags
uint32_t SerializationFlags
Represents one or more SerializationFlag values using binary OR operations, e.g., 1U << Serialization...
Definition: NvInferRuntime.h:2865

nvinfer1::InterpolationMode::kLINEAR
@ kLINEAR
Supports linear (1D), bilinear (2D), and trilinear (3D) interpolation.

nvinfer1::IPluginV3OneBuild
v_1_0::IPluginV3OneBuild IPluginV3OneBuild
Definition: NvInferRuntime.h:1220

nvinfer1::BuilderFlag::kEXCLUDE_LEAN_RUNTIME
@ kEXCLUDE_LEAN_RUNTIME

nvinfer1::TensorFormat
TensorFormat
Format of the input/output tensors.
Definition: NvInferRuntime.h:1383

nvinfer1::TensorFormat::kCHW4
@ kCHW4

nvinfer1::TensorFormat::kDHWC
@ kDHWC

nvinfer1::TensorFormat::kHWC16
@ kHWC16

nvinfer1::TensorFormat::kDHWC8
@ kDHWC8

nvinfer1::TensorFormat::kDLA_LINEAR
@ kDLA_LINEAR

nvinfer1::TensorFormat::kCDHW32
@ kCDHW32

nvinfer1::TensorFormat::kDLA_HWC4
@ kDLA_HWC4

nvinfer1::TensorFormat::kCHW16
@ kCHW16

nvinfer1::TensorFormat::kHWC
@ kHWC

nvinfer1::TensorFormat::kCHW2
@ kCHW2

nvinfer1::TensorFormat::kHWC8
@ kHWC8

nvinfer1::TensorFormat::kCHW32
@ kCHW32

nvinfer1::ExecutionContextAllocationStrategy
ExecutionContextAllocationStrategy
Different memory allocation behaviors for IExecutionContext.
Definition: NvInferRuntime.h:2979

nvinfer1::ExecutionContextAllocationStrategy::kSTATIC
@ kSTATIC
Default static allocation with the maximum size across all profiles.

nvinfer1::ExecutionContextAllocationStrategy::kUSER_MANAGED
@ kUSER_MANAGED
The user supplies custom allocation to the execution context.

nvinfer1::ExecutionContextAllocationStrategy::kON_PROFILE_CHANGE
@ kON_PROFILE_CHANGE
Reallocate for a profile when it's selected.

nvinfer1::EnumMax< TacticSource >
constexpr int32_t EnumMax< TacticSource >() noexcept
Maximum number of tactic sources in TacticSource enum.
Definition: NvInferRuntime.h:2823

nvinfer1::LayerInformationFormat
LayerInformationFormat
The format in which the IEngineInspector prints the layer information.
Definition: NvInferRuntime.h:4903

nvinfer1::LayerInformationFormat::kJSON
@ kJSON
Print layer information in JSON format.

nvinfer1::LayerInformationFormat::kONELINE
@ kONELINE
Print layer information in one line per layer.

nvinfer1::MatrixOperation::kNONE
@ kNONE

nvinfer1::IStreamReader
v_1_0::IStreamReader IStreamReader
Definition: NvInferRuntime.h:674

nvinfer1::AllocatorFlag
AllocatorFlag
Allowed type of memory allocation.
Definition: NvInferRuntime.h:1508

nvinfer1::AllocatorFlag::kRESIZABLE
@ kRESIZABLE
TensorRT may call realloc() on this allocation.

nvinfer1::PoolingType::kMAX
@ kMAX
Maximum over elements.

nvinfer1::EnumMax< DeviceType >
constexpr int32_t EnumMax< DeviceType >() noexcept
Maximum number of elements in DeviceType enum.
Definition: NvInferRuntime.h:1311

nvinfer1::EnumMax< DimensionOperation >
constexpr int32_t EnumMax< DimensionOperation >() noexcept
Maximum number of elements in DimensionOperation enum.
Definition: NvInferRuntime.h:193

nvinfer1::EnumMax< ExecutionContextAllocationStrategy >
constexpr int32_t EnumMax< ExecutionContextAllocationStrategy >() noexcept
Maximum number of memory allocation strategies in ExecutionContextAllocationStrategy enum.
Definition: NvInferRuntime.h:2991

nvinfer1::EnumMax< SerializationFlag >
constexpr int32_t EnumMax< SerializationFlag >() noexcept
Maximum number of serialization flags in SerializationFlag enum.
Definition: NvInferRuntime.h:2882

nvinfer1::TensorLocation
TensorLocation
The location for tensor data storage, device or host.
Definition: NvInferRuntime.h:204

nvinfer1::TensorLocation::kHOST
@ kHOST
Data stored on host.

nvinfer1::TensorLocation::kDEVICE
@ kDEVICE
Data stored on device.

nvinfer1::OptProfileSelector
OptProfileSelector
When setting or querying optimization profile parameters (such as shape tensor inputs or dynamic dime...
Definition: NvInferRuntime.h:2578

nvinfer1::OptProfileSelector::kOPT
@ kOPT
This is used to set or get the value that is used in the optimization (kernel selection).

nvinfer1::AllocatorFlags
uint32_t AllocatorFlags
Definition: NvInferRuntime.h:1524

nvinfer1::DynamicPluginTensorDesc
Summarizes tensors that a plugin might see for an input or output.
Definition: NvInferRuntime.h:362

nvinfer1::DynamicPluginTensorDesc::min
Dims min
Lower bounds on tensor’s dimensions.
Definition: NvInferRuntime.h:367

nvinfer1::DynamicPluginTensorDesc::max
Dims max
Upper bounds on tensor’s dimensions.
Definition: NvInferRuntime.h:370

nvinfer1::DynamicPluginTensorDesc::opt
Dims opt
Optimum value of tensor’s dimensions specified for auto-tuning.
Definition: NvInferRuntime.h:373

nvinfer1::DynamicPluginTensorDesc::desc
PluginTensorDesc desc
Information required to interpret a pointer to tensor data, except that desc.dims has -1 in place of ...
Definition: NvInferRuntime.h:364

nvinfer1::PluginFieldCollection
Plugin field collection struct.
Definition: NvInferPluginBase.h:103

nvinfer1::PluginTensorDesc
Fields that a plugin might see for an input or output.
Definition: NvInferRuntimePlugin.h:73

nvinfer1::impl::EnumMaxImpl
Declaration of EnumMaxImpl struct to store maximum number of elements in an enumeration type.
Definition: NvInferRuntimeBase.h:114