_static/c-api/_nv_infer_runtime_8h_source.html

/*

 * SPDX-FileCopyrightText: Copyright (c) 1993-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.

 * SPDX-License-Identifier: Apache-2.0

 *

 * Licensed under the Apache License, Version 2.0 (the "License");

 * you may not use this file except in compliance with the License.

 * You may obtain a copy of the License at

 *

 * http://www.apache.org/licenses/LICENSE-2.0

 *

 * Unless required by applicable law or agreed to in writing, software

 * distributed under the License is distributed on an "AS IS" BASIS,

 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

 * See the License for the specific language governing permissions and

 * limitations under the License.

 */


#ifndef NV_INFER_RUNTIME_H

#define NV_INFER_RUNTIME_H


#include "NvInferImpl.h" // IWYU pragma: export

#define NV_INFER_INTERNAL_INCLUDE 1

#include "NvInferPluginBase.h" // IWYU pragma: export

#undef NV_INFER_INTERNAL_INCLUDE

#include "NvInferRuntimeCommon.h" // IWYU pragma: export


namespace nvinfer1

{


class IExecutionContext;

class ICudaEngine;

class IPluginFactory;

class IEngineInspector;


//!
//! \class INoCopy
//! \brief Base class for interfaces that must be neither copied nor moved.
//!
//! Every special member is protected, so only derived classes can construct or destroy
//! an INoCopy sub-object. All four copy/move operations are deleted, which in turn
//! deletes the implicit copy/move operations of every derived class.
//!
class INoCopy
{
protected:
    INoCopy() = default;
    virtual ~INoCopy() = default;

    // Construction from another instance is disabled (copy and move).
    INoCopy(INoCopy const&) = delete;
    INoCopy(INoCopy&&) = delete;

    // Assignment from another instance is disabled (copy and move).
    INoCopy& operator=(INoCopy const&) = delete;
    INoCopy& operator=(INoCopy&&) = delete;
};


//!
//! \enum EngineCapability
//! \brief Engine capability selector, stored as int32_t.
//!
//! The three enumerators are explicitly numbered 0..2; the EnumMaxImpl specialization
//! for this enum reports the matching count of 3.
//!
enum class EngineCapability : int32_t
{
    kSTANDARD = 0,
    kSAFETY = 1,
    kDLA_STANDALONE = 2,
};


//! EnumMaxImpl specialization for EngineCapability: kVALUE is 3, the number of
//! enumerators (values 0..2) that enum declares in this file.
template <>
struct impl::EnumMaxImpl<EngineCapability>
{
    static constexpr int32_t kVALUE{3};
};


//!
//! \class Weights
//! \brief Plain aggregate of three public fields: a type tag, a read-only pointer and a count.
//!
//! The class declares no constructors or destructor, so it neither allocates nor frees
//! whatever \p values points to.
//!
class Weights

{

public:

    //! Type tag accompanying \p values.
    DataType type;

    //! Read-only pointer to the data; never released by this class.
    void const* values;

    //! 64-bit count. NOTE(review): presumably the number of elements of \p type
    //! reachable through \p values - confirm against the TensorRT API reference.
    int64_t count;

};


//!
//! \class IHostMemory
//! \brief Non-copyable interface exposing a typed memory block through an implementation object.
//!
//! Each accessor forwards to the apiv::VHostMemory referenced by mImpl. The destructor
//! is pure virtual (making the class abstract) and is defined inline after the class so
//! that derived destructors can chain to it.
//!
class IHostMemory : public INoCopy
{
public:
    virtual ~IHostMemory() noexcept = 0;

    //! \return The pointer reported by the implementation's data().
    void* data() const noexcept
    {
        return mImpl->data();
    }

    //! \return The value reported by the implementation's size().
    std::size_t size() const noexcept
    {
        return mImpl->size();
    }

    //! \return The DataType reported by the implementation's type().
    DataType type() const noexcept
    {
        return mImpl->type();
    }

protected:
    //! Implementation object every accessor forwards to. Value-initialized to nullptr,
    //! matching IRuntime::mImpl in this file, so the pointer is never indeterminate
    //! before a derived class assigns it.
    apiv::VHostMemory* mImpl{};
};

//! Out-of-line definition required because the destructor is declared pure virtual.
inline IHostMemory::~IHostMemory() noexcept = default;


//!
//! \enum DimensionOperation
//! \brief Operation selector passed to IExprBuilder::operation(), stored as int32_t.
//!
//! Nine enumerators, explicitly numbered 0..8; the EnumMaxImpl specialization for this
//! enum reports 9.
//!
enum class DimensionOperation : int32_t
{
    kSUM = 0,
    kPROD = 1,
    kMAX = 2,
    kMIN = 3,
    kSUB = 4,
    kEQUAL = 5,
    kLESS = 6,
    kFLOOR_DIV = 7,
    kCEIL_DIV = 8,
};


//! EnumMaxImpl specialization for DimensionOperation: kVALUE is 9, the number of
//! enumerators (values 0..8) that enum declares in this file.
template <>
struct impl::EnumMaxImpl<DimensionOperation>
{
    static constexpr int32_t kVALUE{9};
};


//!
//! \enum TensorLocation
//! \brief Two-valued location tag (device = 0, host = 1), stored as int32_t.
//!
enum class TensorLocation : int32_t
{
    kDEVICE = 0,
    kHOST = 1,
};


//! EnumMaxImpl specialization for TensorLocation: kVALUE is 2, the number of
//! enumerators (values 0..1) that enum declares in this file.
template <>
struct impl::EnumMaxImpl<TensorLocation>
{
    static constexpr int32_t kVALUE{2};
};


//!
//! \class IDimensionExpr
//! \brief Non-copyable handle to a dimension expression held by an implementation object.
//!
//! All queries forward to the apiv::VDimensionExpr referenced by mImpl. The destructor
//! is protected and pure virtual, so client code can neither instantiate nor delete
//! objects through this interface.
//!
class IDimensionExpr : public INoCopy
{
public:
    //! \return The result of the implementation's isConstant().
    bool isConstant() const noexcept
    {
        return mImpl->isConstant();
    }

    //! \return The result of the implementation's getConstantValue().
    //! NOTE(review): presumably only meaningful when isConstant() is true - confirm.
    int64_t getConstantValue() const noexcept
    {
        return mImpl->getConstantValue();
    }

protected:
    //! Implementation object every query forwards to. Value-initialized to nullptr,
    //! matching IRuntime::mImpl in this file, so the pointer is never indeterminate
    //! before a derived class assigns it.
    apiv::VDimensionExpr* mImpl{};
    virtual ~IDimensionExpr() noexcept = 0;

public:
    //! \return The result of the implementation's isSizeTensor().
    bool isSizeTensor() const noexcept
    {
        return mImpl->isSizeTensor();
    }
};

//! Out-of-line definition required because the destructor is declared pure virtual.
inline IDimensionExpr::~IDimensionExpr() noexcept = default;


//!
//! \class IExprBuilder
//! \brief Non-copyable factory interface for IDimensionExpr objects.
//!
//! Every method forwards to the apiv::VExprBuilder referenced by mImpl and returns the
//! pointer the implementation produces. The destructor is protected and pure virtual.
//!
class IExprBuilder : public INoCopy
{
public:
    //! Forward \p value to the implementation's constant().
    //! \return The expression pointer returned by the implementation.
    IDimensionExpr const* constant(int64_t value) noexcept
    {
        return mImpl->constant(value);
    }

    //! Forward \p op and both operands to the implementation's operation().
    //! \return The expression pointer returned by the implementation.
    IDimensionExpr const* operation(
        DimensionOperation op, IDimensionExpr const& first, IDimensionExpr const& second) noexcept
    {
        return mImpl->operation(op, first, second);
    }

protected:
    //! Implementation object every method forwards to. Value-initialized to nullptr,
    //! matching IRuntime::mImpl in this file, so the pointer is never indeterminate
    //! before a derived class assigns it.
    apiv::VExprBuilder* mImpl{};
    virtual ~IExprBuilder() noexcept = 0;

public:
    //! Forward \p outputIndex, \p opt and \p upper to the implementation's declareSizeTensor().
    //! \return The expression pointer returned by the implementation.
    //! NOTE(review): unlike constant() and operation(), this wrapper is not declared
    //! noexcept - confirm whether that is intentional.
    IDimensionExpr const* declareSizeTensor(int32_t outputIndex, IDimensionExpr const& opt, IDimensionExpr const& upper)
    {
        return mImpl->declareSizeTensor(outputIndex, opt, upper);
    }
};

//! Out-of-line definition required because the destructor is declared pure virtual.
inline IExprBuilder::~IExprBuilder() noexcept = default;


//!
//! \class DimsExprs
//! \brief Plain aggregate pairing a dimension count with a fixed-size array of expression pointers.
//!
class DimsExprs

{

public:

    //! Dimension count. NOTE(review): presumably the number of leading entries of
    //! \p d that are meaningful - confirm.
    int32_t nbDims;

    //! Fixed-capacity array of Dims::MAX_DIMS pointers to read-only IDimensionExpr objects.
    IDimensionExpr const* d[Dims::MAX_DIMS];

};


//!
//! \struct DynamicPluginTensorDesc
//! \brief Aggregate bundling a PluginTensorDesc with three Dims values (min, max, opt).
//!
struct DynamicPluginTensorDesc

{

    //! Tensor descriptor.
    PluginTensorDesc desc;


    //! NOTE(review): presumably the lower bound on the tensor's dimensions - confirm.
    Dims min;


    //! NOTE(review): presumably the upper bound on the tensor's dimensions - confirm.
    Dims max;


    //! NOTE(review): presumably the dimensions the build optimizes for - confirm.
    Dims opt;

};


//!
//! \class IPluginV2DynamicExt
//! \brief Deprecated plugin interface derived from IPluginV2Ext that works with
//! expression-based output dimensions and tensor descriptors.
//!
//! Implementers override the pure virtual methods in the public section. The Dims-based
//! base-class methods are overridden privately as `final` stubs so that derived
//! plugins can neither implement nor call them.
//!
class TRT_DEPRECATED IPluginV2DynamicExt : public nvinfer1::IPluginV2Ext
{
public:
    //! Covariant override: the returned clone is an IPluginV2DynamicExt.
    IPluginV2DynamicExt* clone() const noexcept override = 0;

    //! Produce the dimensions of output \p outputIndex as expressions over the
    //! \p nbInputs entries of \p inputs, using \p exprBuilder to create new expressions.
    virtual DimsExprs getOutputDimensions(
        int32_t outputIndex, DimsExprs const* inputs, int32_t nbInputs, IExprBuilder& exprBuilder) noexcept = 0;

    //! Constant 100 exposed as the format-combination limit.
    static constexpr int32_t kFORMAT_COMBINATION_LIMIT = 100;

    //! Report whether the descriptor at index \p pos of \p inOut is supported.
    //! NOTE(review): \p inOut presumably holds nbInputs + nbOutputs entries - confirm.
    virtual bool supportsFormatCombination(
        int32_t pos, PluginTensorDesc const* inOut, int32_t nbInputs, int32_t nbOutputs) noexcept = 0;

    //! Configure the plugin from dynamic descriptors of its inputs and outputs.
    virtual void configurePlugin(DynamicPluginTensorDesc const* in, int32_t nbInputs,
        DynamicPluginTensorDesc const* out, int32_t nbOutputs) noexcept = 0;

    //! Report the workspace size for the given input and output descriptors.
    virtual size_t getWorkspaceSize(PluginTensorDesc const* inputs, int32_t nbInputs, PluginTensorDesc const* outputs,
        int32_t nbOutputs) const noexcept = 0;

    //! Execute the plugin on \p stream using the given descriptors, buffers and workspace.
    virtual int32_t enqueue(PluginTensorDesc const* inputDesc, PluginTensorDesc const* outputDesc,
        void const* const* inputs, void* const* outputs, void* workspace, cudaStream_t stream) noexcept = 0;

protected:
    //! Pack PluginVersion::kV2_DYNAMICEXT into the top byte and the low 24 bits of
    //! NV_TENSORRT_VERSION into the remainder.
    int32_t getTensorRTVersion() const noexcept override
    {
        int32_t const versionTag = static_cast<int32_t>(PluginVersion::kV2_DYNAMICEXT) << 24;
        return versionTag | (NV_TENSORRT_VERSION & 0xFFFFFF);
    }

    virtual ~IPluginV2DynamicExt() noexcept = default;

private:
    // The methods below are obsolete base-class entry points. They are sealed with
    // `final` and return fixed placeholder values; they must not be implemented or used.

    void configurePlugin(Dims const*, int32_t, Dims const*, int32_t, DataType const*, DataType const*, bool const*,
        bool const*, PluginFormat, int32_t) noexcept final
    {
    }

    bool supportsFormat(DataType, PluginFormat) const noexcept final
    {
        return false;
    }

    Dims getOutputDimensions(int32_t, Dims const*, int32_t) noexcept final
    {
        return Dims{-1, {}};
    }

    size_t getWorkspaceSize(int32_t) const noexcept final
    {
        return 0;
    }

    int32_t enqueue(int32_t, void const* const*, void* const*, void*, cudaStream_t) noexcept final
    {
        return 1;
    }
};


namespace v_1_0

{

//!
//! \class IStreamReader
//! \brief Deprecated user-implemented interface for reading bytes from a stream.
//!
//! Identifies itself as {"IStreamReader", 1, 0}. Copy and move operations are protected,
//! so they are only available to derived classes.
//!
class TRT_DEPRECATED IStreamReader : public IVersionedInterface
{
public:
    ~IStreamReader() override = default;
    IStreamReader() = default;

    //! \return Interface name "IStreamReader" with version 1.0.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return {"IStreamReader", 1, 0};
    }

    //! Read up to \p nbBytes bytes into \p destination.
    //! NOTE(review): the return value is presumably the number of bytes read - confirm.
    //! This method is not declared noexcept.
    virtual int64_t read(void* destination, int64_t nbBytes) = 0;

protected:
    IStreamReader(IStreamReader const&) = default;
    IStreamReader(IStreamReader&&) = default;
    IStreamReader& operator=(IStreamReader const&) & = default;
    IStreamReader& operator=(IStreamReader&&) & = default;
};


//!
//! \class IStreamWriter
//! \brief User-implemented interface for writing bytes to a stream.
//!
//! Identifies itself as {"IStreamWriter", 1, 0}. Copy and move operations are protected,
//! so they are only available to derived classes.
//!
class IStreamWriter : public IVersionedInterface
{
public:
    ~IStreamWriter() override = default;
    IStreamWriter() = default;

    //! \return Interface name "IStreamWriter" with version 1.0.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return {"IStreamWriter", 1, 0};
    }

    //! Write \p nbBytes bytes starting at \p data.
    //! NOTE(review): the return value is presumably the number of bytes written - confirm.
    //! This method is not declared noexcept.
    virtual int64_t write(void const* data, int64_t nbBytes) = 0;

protected:
    IStreamWriter(IStreamWriter const&) = default;
    IStreamWriter(IStreamWriter&&) = default;
    IStreamWriter& operator=(IStreamWriter const&) & = default;
    IStreamWriter& operator=(IStreamWriter&&) & = default;
};

} // namespace v_1_0


using IStreamReader = v_1_0::IStreamReader;


using IStreamWriter = v_1_0::IStreamWriter;


//!
//! \enum SeekPosition
//! \brief Origin selector passed to IStreamReaderV2::seek(), stored as int32_t.
//!
//! NOTE(review): kSET/kCUR/kEND presumably mirror the C SEEK_SET/SEEK_CUR/SEEK_END
//! origins - confirm.
//!
enum class SeekPosition : int32_t
{
    kSET = 0,
    kCUR = 1,
    kEND = 2,
};


namespace v_1_0

{

//!
//! \class IStreamReaderV2
//! \brief User-implemented stream reader with a CUDA-stream-aware read and a seek operation.
//!
//! Identifies itself as {"IStreamReaderV2", 1, 0}. Copy and move operations are
//! protected, so they are only available to derived classes.
//!
class IStreamReaderV2 : public IVersionedInterface
{
public:
    ~IStreamReaderV2() override = default;
    IStreamReaderV2() = default;

    //! \return Interface name "IStreamReaderV2" with version 1.0.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return {"IStreamReaderV2", 1, 0};
    }

    //! Read up to \p nbBytes bytes into \p destination; \p stream is supplied for the transfer.
    //! NOTE(review): the return value is presumably the number of bytes read - confirm.
    virtual int64_t read(void* destination, int64_t nbBytes, cudaStream_t stream) noexcept = 0;

    //! Move the read position by \p offset relative to the origin selected by \p where.
    //! \return Implementation-defined success flag.
    virtual bool seek(int64_t offset, SeekPosition where) noexcept = 0;

protected:
    IStreamReaderV2(IStreamReaderV2 const&) = default;
    IStreamReaderV2(IStreamReaderV2&&) = default;
    IStreamReaderV2& operator=(IStreamReaderV2 const&) & = default;
    IStreamReaderV2& operator=(IStreamReaderV2&&) & = default;
};

} // namespace v_1_0


using IStreamReaderV2 = v_1_0::IStreamReaderV2;


//!
//! \class IPluginResourceContext
//! \brief Abstract accessor for the GPU allocator and error recorder available to a plugin.
//!
//! Construction, copy and move are protected; the destructor is public, pure virtual,
//! and defined inline after the class.
//!
class IPluginResourceContext
{
public:
    //! \return The IGpuAllocator associated with this context.
    virtual IGpuAllocator* getGpuAllocator() const noexcept = 0;

    //! \return The IErrorRecorder associated with this context.
    virtual IErrorRecorder* getErrorRecorder() const noexcept = 0;

    virtual ~IPluginResourceContext() noexcept = 0;

protected:
    IPluginResourceContext() = default;
    IPluginResourceContext(IPluginResourceContext const&) = default;
    IPluginResourceContext(IPluginResourceContext&&) = default;
    IPluginResourceContext& operator=(IPluginResourceContext const&) & = default;
    IPluginResourceContext& operator=(IPluginResourceContext&&) & = default;
};

//! Out-of-line definition required because the destructor is declared pure virtual.
inline IPluginResourceContext::~IPluginResourceContext() noexcept = default;


namespace v_1_0

{

//!
//! \class IPluginV3OneCore
//! \brief Plugin capability that reports the plugin's name, version and namespace.
//!
//! Identifies itself as {"PLUGIN_V3ONE_CORE", 1, 0}.
//!
class IPluginV3OneCore : public IPluginCapability
{
public:
    //! \return Interface name "PLUGIN_V3ONE_CORE" with version 1.0.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return {"PLUGIN_V3ONE_CORE", 1, 0};
    }

    //! \return The plugin name as a C string.
    virtual AsciiChar const* getPluginName() const noexcept = 0;

    //! \return The plugin version as a C string.
    virtual AsciiChar const* getPluginVersion() const noexcept = 0;

    //! \return The plugin namespace as a C string.
    virtual AsciiChar const* getPluginNamespace() const noexcept = 0;
};


//!
//! \class IPluginV3OneBuild
//! \brief Plugin capability containing the build-phase entry points.
//!
//! Identifies itself as {"PLUGIN_V3ONE_BUILD", 1, 0}. Pure virtual methods must be
//! implemented by the plugin; the remaining virtual methods have defaults that return
//! 0, nullptr or kDEFAULT_FORMAT_COMBINATION_LIMIT.
//!
class IPluginV3OneBuild : public IPluginCapability
{
public:
    //! Value returned by the default getFormatCombinationLimit().
    static constexpr int32_t kDEFAULT_FORMAT_COMBINATION_LIMIT = 100;

    //! \return Interface name "PLUGIN_V3ONE_BUILD" with version 1.0.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return {"PLUGIN_V3ONE_BUILD", 1, 0};
    }

    //! Configure the plugin from dynamic descriptors of its inputs and outputs.
    //! \return int32_t status. NOTE(review): presumably 0 on success - confirm.
    virtual int32_t configurePlugin(DynamicPluginTensorDesc const* in, int32_t nbInputs,
        DynamicPluginTensorDesc const* out, int32_t nbOutputs) noexcept = 0;

    //! Fill \p outputTypes (\p nbOutputs entries) based on \p inputTypes (\p nbInputs entries).
    virtual int32_t getOutputDataTypes(
        DataType* outputTypes, int32_t nbOutputs, DataType const* inputTypes, int32_t nbInputs) const noexcept = 0;

    //! Fill \p outputs with shape expressions derived from \p inputs and \p shapeInputs,
    //! using \p exprBuilder to create new expressions.
    virtual int32_t getOutputShapes(DimsExprs const* inputs, int32_t nbInputs, DimsExprs const* shapeInputs,
        int32_t nbShapeInputs, DimsExprs* outputs, int32_t nbOutputs, IExprBuilder& exprBuilder) noexcept = 0;

    //! Report whether the descriptor at index \p pos of \p inOut is supported.
    virtual bool supportsFormatCombination(
        int32_t pos, DynamicPluginTensorDesc const* inOut, int32_t nbInputs, int32_t nbOutputs) noexcept = 0;

    //! \return The number of outputs of the plugin.
    virtual int32_t getNbOutputs() const noexcept = 0;

    //! Default: ignores all arguments and reports a workspace size of 0.
    virtual size_t getWorkspaceSize(DynamicPluginTensorDesc const* /* inputs */, int32_t /* nbInputs */,
        DynamicPluginTensorDesc const* /* outputs */, int32_t /* nbOutputs */) const noexcept
    {
        return 0;
    }

    //! Default: ignores its arguments and returns 0.
    virtual int32_t getValidTactics(int32_t* /* tactics */, int32_t /* nbTactics */) noexcept
    {
        return 0;
    }

    //! Default: returns 0.
    virtual int32_t getNbTactics() noexcept
    {
        return 0;
    }

    //! Default: returns nullptr.
    virtual char const* getTimingCacheID() noexcept
    {
        return nullptr;
    }

    //! Default: returns kDEFAULT_FORMAT_COMBINATION_LIMIT (100).
    virtual int32_t getFormatCombinationLimit() noexcept
    {
        return kDEFAULT_FORMAT_COMBINATION_LIMIT;
    }

    //! Default: returns nullptr.
    virtual char const* getMetadataString() noexcept
    {
        return nullptr;
    }
};


//!
//! \class IPluginV3OneRuntime
//! \brief Plugin capability containing the runtime-phase entry points.
//!
//! Identifies itself as {"PLUGIN_V3ONE_RUNTIME", 1, 0}.
//!
class IPluginV3OneRuntime : public IPluginCapability
{
public:
    //! \return Interface name "PLUGIN_V3ONE_RUNTIME" with version 1.0.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return {"PLUGIN_V3ONE_RUNTIME", 1, 0};
    }

    //! Default: ignores the tactic and returns 0.
    virtual int32_t setTactic(int32_t /* tactic */) noexcept
    {
        return 0;
    }

    //! Called with the descriptors of the \p nbInputs inputs and \p nbOutputs outputs.
    virtual int32_t onShapeChange(
        PluginTensorDesc const* in, int32_t nbInputs, PluginTensorDesc const* out, int32_t nbOutputs) noexcept = 0;

    //! Execute the plugin on \p stream using the given descriptors, buffers and workspace.
    virtual int32_t enqueue(PluginTensorDesc const* inputDesc, PluginTensorDesc const* outputDesc,
        void const* const* inputs, void* const* outputs, void* workspace, cudaStream_t stream) noexcept = 0;

    //! Produce the IPluginV3 instance to be used with the resource context \p context.
    virtual IPluginV3* attachToContext(IPluginResourceContext* context) noexcept = 0;

    //! \return The collection of plugin fields to serialize.
    virtual PluginFieldCollection const* getFieldsToSerialize() noexcept = 0;
};

} // namespace v_1_0


namespace v_2_0

{


//!
//! \class IPluginV3OneBuild
//! \brief Version 2.0 of the build capability; extends v_1_0::IPluginV3OneBuild with
//! getAliasedInput().
//!
//! Identifies itself as {"PLUGIN_V3ONE_BUILD", 2, 0}.
//!
class IPluginV3OneBuild : public v_1_0::IPluginV3OneBuild
{
public:
    //! \return Interface name "PLUGIN_V3ONE_BUILD" with version 2.0.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return {"PLUGIN_V3ONE_BUILD", 2, 0};
    }

    //! Default: ignores the output index and returns -1.
    //! NOTE(review): -1 presumably means "this output aliases no input" - confirm.
    virtual int32_t getAliasedInput(int32_t /* outputIndex */) noexcept
    {
        return -1;
    }
};


} // namespace v_2_0


using IPluginV3OneCore = v_1_0::IPluginV3OneCore;


using IPluginV3OneBuild = v_1_0::IPluginV3OneBuild;


using IPluginV3OneRuntime = v_1_0::IPluginV3OneRuntime;


using IPluginV3OneBuildV2 = v_2_0::IPluginV3OneBuild;


namespace v_1_0

{

//!
//! \class IProfiler
//! \brief User-implemented callback interface that receives per-layer timings.
//!
//! Identifies itself as {"IProfiler", 1, 0}.
//!
class IProfiler : public IVersionedInterface
{
public:
    //! \return Interface name "IProfiler" with version 1.0.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return InterfaceInfo{"IProfiler", 1, 0};
    }

    //! Receive the time \p ms (milliseconds, per the parameter name) for layer \p layerName.
    virtual void reportLayerTime(char const* layerName, float ms) noexcept = 0;

    ~IProfiler() override = default;
};

} // namespace v_1_0


using IProfiler = v_1_0::IProfiler;


//!
//! \enum WeightsRole
//! \brief Role tag used with IRefitter::setWeights/getMissing/getAll, stored as int32_t.
//!
//! Six enumerators, explicitly numbered 0..5; the EnumMaxImpl specialization for this
//! enum reports 6.
//!
enum class WeightsRole : int32_t
{
    kKERNEL = 0,
    kBIAS = 1,
    kSHIFT = 2,
    kSCALE = 3,
    kCONSTANT = 4,
    kANY = 5,
};


//! EnumMaxImpl specialization for WeightsRole: kVALUE is 6, the number of
//! enumerators (values 0..5) that enum declares in this file.
template <>
struct impl::EnumMaxImpl<WeightsRole>
{
    static constexpr int32_t kVALUE{6};
};


//!
//! \enum DeviceType
//! \brief Two-valued device selector (GPU = 0, DLA = 1), stored as int32_t.
//!
enum class DeviceType : int32_t
{
    kGPU = 0,
    kDLA = 1,
};


//! EnumMaxImpl specialization for DeviceType: kVALUE is 2, the number of
//! enumerators (values 0..1) that enum declares in this file.
template <>
struct impl::EnumMaxImpl<DeviceType>
{
    static constexpr int32_t kVALUE{2};
};


//!
//! \enum TempfileControlFlag
//! \brief Flag identifiers for temporary-file control, stored as int32_t.
//!
//! NOTE(review): each enumerator is presumably a bit position within the
//! TempfileControlFlags (uint32_t) mask - confirm.
//!
enum class TempfileControlFlag : int32_t
{
    kALLOW_IN_MEMORY_FILES = 0,
    kALLOW_TEMPORARY_FILES = 1,
};


//! EnumMaxImpl specialization for TempfileControlFlag: kVALUE is 2, the number of
//! enumerators (values 0..1) that enum declares in this file.
template <>
struct impl::EnumMaxImpl<TempfileControlFlag>
{
    static constexpr int32_t kVALUE{2};
};


using TempfileControlFlags = uint32_t;


//!
//! \enum TensorFormat
//! \brief Tensor memory-format identifier, stored as int32_t.
//!
//! Thirteen enumerators, explicitly numbered 0..12; the EnumMaxImpl specialization for
//! this enum reports 13. NOTE(review): the names suggest axis orders and vector widths
//! (e.g. CHW4, HWC8) - see the TensorRT API reference for the exact layouts.
//!
enum class TensorFormat : int32_t
{
    kLINEAR = 0,
    kCHW2 = 1,
    kHWC8 = 2,
    kCHW4 = 3,
    kCHW16 = 4,
    kCHW32 = 5,
    kDHWC8 = 6,
    kCDHW32 = 7,
    kHWC = 8,
    kDLA_LINEAR = 9,
    kDLA_HWC4 = 10,
    kHWC16 = 11,
    kDHWC = 12,
};


//! EnumMaxImpl specialization for TensorFormat: kVALUE is 13, the number of
//! enumerators (values 0..12) that enum declares in this file.
template <>
struct impl::EnumMaxImpl<TensorFormat>
{
    static constexpr int32_t kVALUE{13};
};


//!
//! \enum AllocatorFlag
//! \brief Allocation flag identifiers, stored as int32_t; currently a single value.
//!
//! NOTE(review): presumably a bit position within the AllocatorFlags (uint32_t) mask
//! accepted by IGpuAllocator - confirm.
//!
enum class AllocatorFlag : int32_t
{
    kRESIZABLE = 0,
};


//! EnumMaxImpl specialization for AllocatorFlag: kVALUE is 1, the number of
//! enumerators that enum declares in this file.
template <>
struct impl::EnumMaxImpl<AllocatorFlag>
{
    static constexpr int32_t kVALUE{1};
};


using AllocatorFlags = uint32_t;


namespace v_1_0

{


//!
//! \class ILogger
//! \brief User-implemented logging sink.
//!
//! Identifies itself as {"ILogger", 1, 0}. Copy and move operations are protected, so
//! they are only available to derived classes.
//!
class ILogger : public IVersionedInterface
{
public:
    //! \return Interface name "ILogger" with version 1.0.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return InterfaceInfo{"ILogger", 1, 0};
    }

    //!
    //! \enum Severity
    //! \brief Message severity passed to log(); five levels explicitly numbered 0..4.
    //!
    enum class Severity : int32_t
    {
        kINTERNAL_ERROR = 0,
        kERROR = 1,
        kWARNING = 2,
        kINFO = 3,
        kVERBOSE = 4,
    };

    //! Receive the message \p msg tagged with \p severity.
    virtual void log(Severity severity, AsciiChar const* msg) noexcept = 0;

    ILogger() = default;
    ~ILogger() override = default;

protected:
    // @cond SuppressDoxyWarnings
    ILogger(ILogger const&) = default;
    ILogger(ILogger&&) = default;
    ILogger& operator=(ILogger const&) & = default;
    ILogger& operator=(ILogger&&) & = default;
    // @endcond
};


} // namespace v_1_0


using ILogger = v_1_0::ILogger;


//! EnumMaxImpl specialization for ILogger::Severity: kVALUE is 5, the number of
//! enumerators (values 0..4) that enum declares in this file.
template <>
struct impl::EnumMaxImpl<ILogger::Severity>
{
    static constexpr int32_t kVALUE{5};
};


namespace v_1_0

{


//!
//! \class IGpuAllocator
//! \brief User-implemented allocator interface.
//!
//! Identifies itself as {"IGpuAllocator", 1, 0}. The synchronous allocate()/deallocate()
//! pair is pure virtual and marked deprecated; the asynchronous variants have default
//! implementations that drop the stream argument and call the synchronous pair.
//! Copy and move operations are protected.
//!
class IGpuAllocator : public IVersionedInterface
{
public:
    //! Allocate \p size bytes with the requested \p alignment and \p flags.
    //! \return Pointer to the allocation. NOTE(review): presumably nullptr on failure - confirm.
    TRT_DEPRECATED virtual void* allocate(
        uint64_t const size, uint64_t const alignment, AllocatorFlags const flags) noexcept = 0;

    ~IGpuAllocator() override = default;
    IGpuAllocator() = default;

    //! Default: ignores all arguments and returns nullptr.
    virtual void* reallocate(void* const /*baseAddr*/, uint64_t /*alignment*/, uint64_t /*newSize*/) noexcept
    {
        return nullptr;
    }

    //! Release \p memory.
    //! \return Implementation-defined success flag.
    TRT_DEPRECATED virtual bool deallocate(void* const memory) noexcept = 0;

    //! Default: ignores the stream and returns allocate(size, alignment, flags).
    virtual void* allocateAsync(
        uint64_t const size, uint64_t const alignment, AllocatorFlags const flags, cudaStream_t /*stream*/) noexcept
    {
        return allocate(size, alignment, flags);
    }

    //! Default: ignores the stream and returns deallocate(memory).
    virtual bool deallocateAsync(void* const memory, cudaStream_t /*stream*/) noexcept
    {
        return deallocate(memory);
    }

    //! \return Interface name "IGpuAllocator" with version 1.0.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return InterfaceInfo{"IGpuAllocator", 1, 0};
    }

protected:
    // @cond SuppressDoxyWarnings
    IGpuAllocator(IGpuAllocator const&) = default;
    IGpuAllocator(IGpuAllocator&&) = default;
    IGpuAllocator& operator=(IGpuAllocator const&) & = default;
    IGpuAllocator& operator=(IGpuAllocator&&) & = default;
    // @endcond
};


} // namespace v_1_0


using IGpuAllocator = v_1_0::IGpuAllocator;


//!
//! \class IRuntime
//! \brief Non-copyable runtime interface; every method forwards to an apiv::VRuntime.
//!
//! The class is abstract (pure virtual destructor, defined inline after the class).
//! Unless noted otherwise, a method passes its arguments unchanged to the same-named
//! implementation method and returns that method's result.
//!
class IRuntime : public INoCopy
{
public:
    virtual ~IRuntime() noexcept = 0;

    // --- DLA core selection ---
    void setDLACore(int32_t dlaCore) noexcept { mImpl->setDLACore(dlaCore); }
    int32_t getDLACore() const noexcept { return mImpl->getDLACore(); }
    int32_t getNbDLACores() const noexcept { return mImpl->getNbDLACores(); }

    // --- Allocator and error recorder ---
    void setGpuAllocator(IGpuAllocator* allocator) noexcept { mImpl->setGpuAllocator(allocator); }
    void setErrorRecorder(IErrorRecorder* recorder) noexcept { mImpl->setErrorRecorder(recorder); }
    IErrorRecorder* getErrorRecorder() const noexcept { return mImpl->getErrorRecorder(); }

    // --- Engine deserialization ---
    //! Deserialize an engine from \p size bytes at \p blob.
    ICudaEngine* deserializeCudaEngine(void const* blob, std::size_t size) noexcept
    {
        return mImpl->deserializeCudaEngine(blob, size);
    }

    //! Deserialize an engine from \p streamReader; forwards to deserializeCudaEngineV2().
    //! NOTE(review): unlike its siblings this overload is not declared noexcept - confirm
    //! whether that is intentional.
    ICudaEngine* deserializeCudaEngine(IStreamReaderV2& streamReader)
    {
        return mImpl->deserializeCudaEngineV2(streamReader);
    }

    // --- Logger and threading ---
    ILogger* getLogger() const noexcept { return mImpl->getLogger(); }
    bool setMaxThreads(int32_t maxThreads) noexcept { return mImpl->setMaxThreads(maxThreads); }
    int32_t getMaxThreads() const noexcept { return mImpl->getMaxThreads(); }

    // --- Temporary files ---
    void setTemporaryDirectory(char const* path) noexcept { mImpl->setTemporaryDirectory(path); }
    char const* getTemporaryDirectory() const noexcept { return mImpl->getTemporaryDirectory(); }
    void setTempfileControlFlags(TempfileControlFlags flags) noexcept { mImpl->setTempfileControlFlags(flags); }
    TempfileControlFlags getTempfileControlFlags() const noexcept { return mImpl->getTempfileControlFlags(); }

    // --- Plugin registry and nested runtimes ---
    IPluginRegistry& getPluginRegistry() noexcept { return mImpl->getPluginRegistry(); }
    IRuntime* loadRuntime(char const* path) noexcept { return mImpl->loadRuntime(path); }

    // --- Engine host code ---
    void setEngineHostCodeAllowed(bool allowed) noexcept { mImpl->setEngineHostCodeAllowed(allowed); }
    bool getEngineHostCodeAllowed() const noexcept { return mImpl->getEngineHostCodeAllowed(); }

protected:
    //! Implementation object every method forwards to; value-initialized to nullptr.
    apiv::VRuntime* mImpl{};
};

//! Out-of-line definition required because the destructor is declared pure virtual.
inline IRuntime::~IRuntime() noexcept = default;


//!
//! \class IRefitter
//! \brief Non-copyable refitting interface; every method forwards to an apiv::VRefitter.
//!
//! The class is abstract (pure virtual destructor, defined inline after the class).
//! Unless noted otherwise, a method passes its arguments unchanged to the same-named
//! implementation method and returns that method's result.
//!
class IRefitter : public INoCopy
{
public:
    virtual ~IRefitter() noexcept = 0;

    // --- Weights addressed by (layer name, role) ---
    bool setWeights(char const* layerName, WeightsRole role, Weights weights) noexcept
    {
        return mImpl->setWeights(layerName, role, weights);
    }

    bool refitCudaEngine() noexcept { return mImpl->refitCudaEngine(); }

    //! Forward the output arrays \p layerNames and \p roles together with their capacity \p size.
    int32_t getMissing(int32_t size, char const** layerNames, WeightsRole* roles) noexcept
    {
        return mImpl->getMissing(size, layerNames, roles);
    }

    //! Forward the output arrays \p layerNames and \p roles together with their capacity \p size.
    int32_t getAll(int32_t size, char const** layerNames, WeightsRole* roles) noexcept
    {
        return mImpl->getAll(size, layerNames, roles);
    }

    // --- Error recorder ---
    void setErrorRecorder(IErrorRecorder* recorder) noexcept { mImpl->setErrorRecorder(recorder); }
    IErrorRecorder* getErrorRecorder() const noexcept { return mImpl->getErrorRecorder(); }

    // --- Weights addressed by name ---
    bool setNamedWeights(char const* name, Weights weights) noexcept { return mImpl->setNamedWeights(name, weights); }

    int32_t getMissingWeights(int32_t size, char const** weightsNames) noexcept
    {
        return mImpl->getMissingWeights(size, weightsNames);
    }

    int32_t getAllWeights(int32_t size, char const** weightsNames) noexcept
    {
        return mImpl->getAllWeights(size, weightsNames);
    }

    // --- Logger and threading ---
    ILogger* getLogger() const noexcept { return mImpl->getLogger(); }
    bool setMaxThreads(int32_t maxThreads) noexcept { return mImpl->setMaxThreads(maxThreads); }
    int32_t getMaxThreads() const noexcept { return mImpl->getMaxThreads(); }

    //! Overload carrying a \p location; forwards to setNamedWeightsWithLocation().
    bool setNamedWeights(char const* name, Weights weights, TensorLocation location) noexcept
    {
        return mImpl->setNamedWeightsWithLocation(name, weights, location);
    }

    Weights getNamedWeights(char const* weightsName) const noexcept { return mImpl->getNamedWeights(weightsName); }

    TensorLocation getWeightsLocation(char const* weightsName) const noexcept
    {
        return mImpl->getWeightsLocation(weightsName);
    }

    bool unsetNamedWeights(char const* weightsName) noexcept { return mImpl->unsetNamedWeights(weightsName); }

    // --- Validation and asynchronous refit ---
    void setWeightsValidation(bool weightsValidation) noexcept { mImpl->setWeightsValidation(weightsValidation); }
    bool getWeightsValidation() const noexcept { return mImpl->getWeightsValidation(); }
    bool refitCudaEngineAsync(cudaStream_t stream) noexcept { return mImpl->refitCudaEngineAsync(stream); }

    Weights getWeightsPrototype(char const* weightsName) const noexcept
    {
        return mImpl->getWeightsPrototype(weightsName);
    }

protected:
    //! Implementation object every method forwards to. Value-initialized to nullptr,
    //! matching IRuntime::mImpl in this file, so the pointer is never indeterminate
    //! before a derived class assigns it.
    apiv::VRefitter* mImpl{};
};

//! Out-of-line definition required because the destructor is declared pure virtual.
inline IRefitter::~IRefitter() noexcept = default;


//!
//! \enum OptProfileSelector
//! \brief Selects the minimum (0), optimum (1) or maximum (2) entry of an optimization
//! profile; stored as int32_t.
//!
enum class OptProfileSelector : int32_t
{
    kMIN = 0,
    kOPT = 1,
    kMAX = 2,
};


//! EnumMaxImpl specialization for OptProfileSelector: kVALUE is 3, the number of
//! enumerators (values 0..2) that enum declares in this file.
template <>
struct impl::EnumMaxImpl<OptProfileSelector>
{
    static constexpr int32_t kVALUE{3};
};


//!
//! \class IOptimizationProfile
//! \brief Non-copyable optimization-profile interface; every method forwards to an
//! apiv::VOptimizationProfile.
//!
//! The destructor is protected and pure virtual, so client code can neither instantiate
//! nor delete objects through this interface. Each method passes its arguments
//! unchanged to the same-named implementation method and returns that method's result.
//!
class IOptimizationProfile : public INoCopy
{
public:
    // --- Dimensions per input ---
    bool setDimensions(char const* inputName, OptProfileSelector select, Dims const& dims) noexcept
    {
        return mImpl->setDimensions(inputName, select, dims);
    }

    Dims getDimensions(char const* inputName, OptProfileSelector select) const noexcept
    {
        return mImpl->getDimensions(inputName, select);
    }

    int32_t getNbShapeValues(char const* inputName) const noexcept { return mImpl->getNbShapeValues(inputName); }

    // --- Extra memory target ---
    bool setExtraMemoryTarget(float target) noexcept { return mImpl->setExtraMemoryTarget(target); }
    float getExtraMemoryTarget() const noexcept { return mImpl->getExtraMemoryTarget(); }

    bool isValid() const noexcept { return mImpl->isValid(); }

    // --- 64-bit shape values per input ---
    //! Forward \p nbValues 64-bit values at \p values for the selected entry of \p inputName.
    bool setShapeValuesV2(
        char const* inputName, OptProfileSelector select, int64_t const* values, int32_t nbValues) noexcept
    {
        return mImpl->setShapeValuesV2(inputName, select, values, nbValues);
    }

    int64_t const* getShapeValuesV2(char const* inputName, OptProfileSelector select) const noexcept
    {
        return mImpl->getShapeValuesV2(inputName, select);
    }

protected:
    //! Implementation object every method forwards to. Value-initialized to nullptr,
    //! matching IRuntime::mImpl in this file, so the pointer is never indeterminate
    //! before a derived class assigns it.
    apiv::VOptimizationProfile* mImpl{};
    virtual ~IOptimizationProfile() noexcept = 0;
};

//! Out-of-line definition required because the destructor is declared pure virtual.
inline IOptimizationProfile::~IOptimizationProfile() noexcept = default;


//!
//! \enum TacticSource
//! \brief Tactic source identifiers, stored as int32_t.
//!
//! NOTE(review): each enumerator is presumably a bit position within the TacticSources
//! (uint32_t) mask - confirm.
//!
enum class TacticSource : int32_t
{
    kEDGE_MASK_CONVOLUTIONS = 0,
    kJIT_CONVOLUTIONS = 1,
};


//! EnumMaxImpl specialization for TacticSource: kVALUE is 2, the number of
//! enumerators (values 0..1) that enum declares in this file.
template <>
struct impl::EnumMaxImpl<TacticSource>
{
    static constexpr int32_t kVALUE{2};
};


using TacticSources = uint32_t;


//!
//! \enum ProfilingVerbosity
//! \brief Profiling verbosity level, stored as int32_t.
//!
//! Note the numbering: kLAYER_NAMES_ONLY is 0 and kNONE is 1, so the values are not
//! ordered by increasing verbosity.
//!
enum class ProfilingVerbosity : int32_t
{
    kLAYER_NAMES_ONLY = 0,
    kNONE = 1,
    kDETAILED = 2,
};


//! EnumMaxImpl specialization for ProfilingVerbosity: kVALUE is 3, the number of
//! enumerators (values 0..2) that enum declares in this file.
template <>
struct impl::EnumMaxImpl<ProfilingVerbosity>
{
    static constexpr int32_t kVALUE{3};
};


using SerializationFlags = uint32_t;


//!
//! \enum SerializationFlag
//! \brief Serialization flag identifiers used with ISerializationConfig, stored as int32_t.
//!
//! NOTE(review): each enumerator is presumably a bit position within the
//! SerializationFlags (uint32_t) mask - confirm.
//!
enum class SerializationFlag : int32_t
{
    kEXCLUDE_WEIGHTS = 0,
    kEXCLUDE_LEAN_RUNTIME = 1,
    kINCLUDE_REFIT = 2,
};


//! EnumMaxImpl specialization for SerializationFlag: kVALUE is 3, the number of
//! enumerators (values 0..2) that enum declares in this file.
template <>
struct impl::EnumMaxImpl<SerializationFlag>
{
    static constexpr int32_t kVALUE{3};
};


//!
//! \class ISerializationConfig
//! \brief Non-copyable holder of serialization flags; every method forwards to an
//! apiv::VSerializationConfig.
//!
//! The class is abstract (pure virtual destructor, defined inline after the class).
//! Each method passes its argument unchanged to the same-named implementation method
//! and returns that method's result.
//!
class ISerializationConfig : public INoCopy
{
public:
    virtual ~ISerializationConfig() noexcept = 0;

    // --- Whole-mask access ---
    bool setFlags(SerializationFlags serializationFlags) noexcept { return mImpl->setFlags(serializationFlags); }
    SerializationFlags getFlags() const noexcept { return mImpl->getFlags(); }

    // --- Single-flag access ---
    bool clearFlag(SerializationFlag serializationFlag) noexcept { return mImpl->clearFlag(serializationFlag); }
    bool setFlag(SerializationFlag serializationFlag) noexcept { return mImpl->setFlag(serializationFlag); }
    bool getFlag(SerializationFlag serializationFlag) const noexcept { return mImpl->getFlag(serializationFlag); }

protected:
    //! Implementation object every method forwards to. Value-initialized to nullptr,
    //! matching IRuntime::mImpl in this file, so the pointer is never indeterminate
    //! before a derived class assigns it.
    apiv::VSerializationConfig* mImpl{};
};

//! Out-of-line definition required because the destructor is declared pure virtual.
inline ISerializationConfig::~ISerializationConfig() noexcept = default;


//!
//! \enum ExecutionContextAllocationStrategy
//! \brief Allocation strategy selector for execution contexts, stored as int32_t.
//!
//! kSTATIC (0) is the default argument of ICudaEngine::createExecutionContext().
//!
enum class ExecutionContextAllocationStrategy : int32_t
{
    kSTATIC = 0,
    kON_PROFILE_CHANGE = 1,
    kUSER_MANAGED = 2,
};


//! EnumMaxImpl specialization for ExecutionContextAllocationStrategy: kVALUE is 3, the
//! number of enumerators (values 0..2) that enum declares in this file.
template <>
struct impl::EnumMaxImpl<ExecutionContextAllocationStrategy>
{
    static constexpr int32_t kVALUE{3};
};


//!
//! \class IRuntimeConfig
//! \brief Non-copyable runtime configuration; every method forwards to an apiv::VRuntimeConfig.
//!
//! The class is abstract (pure virtual destructor, defined inline after the class).
//!
class IRuntimeConfig : public INoCopy
{
public:
    virtual ~IRuntimeConfig() noexcept = 0;

    //! Forward \p strategy to the implementation's setExecutionContextAllocationStrategy().
    void setExecutionContextAllocationStrategy(ExecutionContextAllocationStrategy strategy) noexcept
    {
        mImpl->setExecutionContextAllocationStrategy(strategy);
    }

    //! \return The strategy reported by the implementation.
    ExecutionContextAllocationStrategy getExecutionContextAllocationStrategy() const noexcept
    {
        return mImpl->getExecutionContextAllocationStrategy();
    }

protected:
    //! Implementation object every method forwards to. Value-initialized to nullptr,
    //! matching IRuntime::mImpl in this file, so the pointer is never indeterminate
    //! before a derived class assigns it.
    apiv::VRuntimeConfig* mImpl{};
}; // class IRuntimeConfig

//! Out-of-line definition required because the destructor is declared pure virtual.
inline IRuntimeConfig::~IRuntimeConfig() noexcept = default;


//!
//! \enum EngineStat
//! \brief Statistic selector passed to ICudaEngine::getEngineStat(), stored as int32_t.
//!
enum class EngineStat : int32_t
{
    kTOTAL_WEIGHTS_SIZE = 0,
    kSTRIPPED_WEIGHTS_SIZE = 1,
};


//! EnumMaxImpl specialization for EngineStat: kVALUE is 2, the number of
//! enumerators (values 0..1) that enum declares in this file.
template <>
struct impl::EnumMaxImpl<EngineStat>
{
    static constexpr int32_t kVALUE{2};
};


//!
//! \class ICudaEngine
//! \brief Non-copyable engine interface; every method forwards to an apiv::VCudaEngine.
//!
//! The class is abstract (pure virtual destructor, defined inline after the class).
//! Unless noted otherwise, a method passes its arguments unchanged to the same-named
//! implementation method and returns that method's result. Overloads that take an
//! extra \p profileIndex forward to the implementation method with a "V2" suffix.
//!
class ICudaEngine : public INoCopy
{
public:
    virtual ~ICudaEngine() noexcept = 0;

    // --- Basic tensor and engine queries ---
    Dims getTensorShape(char const* tensorName) const noexcept { return mImpl->getTensorShape(tensorName); }
    DataType getTensorDataType(char const* tensorName) const noexcept { return mImpl->getTensorDataType(tensorName); }
    int32_t getNbLayers() const noexcept { return mImpl->getNbLayers(); }
    IHostMemory* serialize() const noexcept { return mImpl->serialize(); }

    //! Create an execution context using \p strategy (kSTATIC when omitted).
    IExecutionContext* createExecutionContext(
        ExecutionContextAllocationStrategy strategy = ExecutionContextAllocationStrategy::kSTATIC) noexcept
    {
        return mImpl->createExecutionContext(strategy);
    }

    TensorLocation getTensorLocation(char const* tensorName) const noexcept
    {
        return mImpl->getTensorLocation(tensorName);
    }

    bool isShapeInferenceIO(char const* tensorName) const noexcept { return mImpl->isShapeInferenceIO(tensorName); }
    TensorIOMode getTensorIOMode(char const* tensorName) const noexcept { return mImpl->getTensorIOMode(tensorName); }

    TRT_NODISCARD char const* getAliasedInputTensor(char const* tensorName) const noexcept
    {
        return mImpl->getAliasedInputTensor(tensorName);
    }

    //! Create an execution context from \p runtimeConfig; forwards to
    //! createExecutionContextWithRuntimeConfig().
    IExecutionContext* createExecutionContext(IRuntimeConfig* runtimeConfig) noexcept
    {
        return mImpl->createExecutionContextWithRuntimeConfig(runtimeConfig);
    }

    IRuntimeConfig* createRuntimeConfig() noexcept { return mImpl->createRuntimeConfig(); }

    // --- Memory sizes and refit capability ---
    int64_t getDeviceMemorySizeV2() const noexcept { return mImpl->getDeviceMemorySizeV2(); }

    int64_t getDeviceMemorySizeForProfileV2(int32_t profileIndex) const noexcept
    {
        return mImpl->getDeviceMemorySizeForProfileV2(profileIndex);
    }

    bool isRefittable() const noexcept { return mImpl->isRefittable(); }

    // --- Tensor format queries (each has a per-profile overload) ---
    int32_t getTensorBytesPerComponent(char const* tensorName) const noexcept
    {
        return mImpl->getTensorBytesPerComponent(tensorName);
    }

    //! Per-profile overload; forwards to getTensorBytesPerComponentV2().
    int32_t getTensorBytesPerComponent(char const* tensorName, int32_t profileIndex) const noexcept
    {
        return mImpl->getTensorBytesPerComponentV2(tensorName, profileIndex);
    }

    int32_t getTensorComponentsPerElement(char const* tensorName) const noexcept
    {
        return mImpl->getTensorComponentsPerElement(tensorName);
    }

    //! Per-profile overload; forwards to getTensorComponentsPerElementV2().
    int32_t getTensorComponentsPerElement(char const* tensorName, int32_t profileIndex) const noexcept
    {
        return mImpl->getTensorComponentsPerElementV2(tensorName, profileIndex);
    }

    TensorFormat getTensorFormat(char const* tensorName) const noexcept { return mImpl->getTensorFormat(tensorName); }

    //! Per-profile overload; forwards to getTensorFormatV2().
    TensorFormat getTensorFormat(char const* tensorName, int32_t profileIndex) const noexcept
    {
        return mImpl->getTensorFormatV2(tensorName, profileIndex);
    }

    char const* getTensorFormatDesc(char const* tensorName) const noexcept
    {
        return mImpl->getTensorFormatDesc(tensorName);
    }

    //! Per-profile overload; forwards to getTensorFormatDescV2().
    char const* getTensorFormatDesc(char const* tensorName, int32_t profileIndex) const noexcept
    {
        return mImpl->getTensorFormatDescV2(tensorName, profileIndex);
    }

    int32_t getTensorVectorizedDim(char const* tensorName) const noexcept
    {
        return mImpl->getTensorVectorizedDim(tensorName);
    }

    //! Per-profile overload; forwards to getTensorVectorizedDimV2().
    int32_t getTensorVectorizedDim(char const* tensorName, int32_t profileIndex) const noexcept
    {
        return mImpl->getTensorVectorizedDimV2(tensorName, profileIndex);
    }

    // --- Engine identity and optimization profiles ---
    char const* getName() const noexcept { return mImpl->getName(); }
    int32_t getNbOptimizationProfiles() const noexcept { return mImpl->getNbOptimizationProfiles(); }

    Dims getProfileShape(char const* tensorName, int32_t profileIndex, OptProfileSelector select) const noexcept
    {
        return mImpl->getProfileShape(tensorName, profileIndex, select);
    }

    EngineCapability getEngineCapability() const noexcept { return mImpl->getEngineCapability(); }

    // --- Error recorder ---
    void setErrorRecorder(IErrorRecorder* recorder) noexcept { mImpl->setErrorRecorder(recorder); }
    IErrorRecorder* getErrorRecorder() const noexcept { return mImpl->getErrorRecorder(); }

    // --- Build-time settings recorded in the engine ---
    TacticSources getTacticSources() const noexcept { return mImpl->getTacticSources(); }
    ProfilingVerbosity getProfilingVerbosity() const noexcept { return mImpl->getProfilingVerbosity(); }
    IEngineInspector* createEngineInspector() const noexcept { return mImpl->createEngineInspector(); }

    // --- I/O tensor enumeration ---
    int32_t getNbIOTensors() const noexcept { return mImpl->getNbIOTensors(); }
    char const* getIOTensorName(int32_t index) const noexcept { return mImpl->getIOTensorName(index); }

    HardwareCompatibilityLevel getHardwareCompatibilityLevel() const noexcept
    {
        return mImpl->getHardwareCompatibilityLevel();
    }

    int32_t getNbAuxStreams() const noexcept { return mImpl->getNbAuxStreams(); }

    // --- Serialization with a configuration ---
    ISerializationConfig* createSerializationConfig() noexcept { return mImpl->createSerializationConfig(); }

    IHostMemory* serializeWithConfig(ISerializationConfig& config) const noexcept
    {
        return mImpl->serializeWithConfig(config);
    }

    // --- Weight streaming ---
    int64_t getStreamableWeightsSize() const noexcept { return mImpl->getStreamableWeightsSize(); }

    bool setWeightStreamingBudgetV2(int64_t gpuMemoryBudget) noexcept
    {
        return mImpl->setWeightStreamingBudgetV2(gpuMemoryBudget);
    }

    int64_t getWeightStreamingBudgetV2() const noexcept { return mImpl->getWeightStreamingBudgetV2(); }
    int64_t getWeightStreamingAutomaticBudget() const noexcept { return mImpl->getWeightStreamingAutomaticBudget(); }

    int64_t getWeightStreamingScratchMemorySize() const noexcept
    {
        return mImpl->getWeightStreamingScratchMemorySize();
    }

    // --- Debug tensors, profile tensor values and statistics ---
    bool isDebugTensor(char const* name) const noexcept { return mImpl->isDebugTensor(name); }

    int64_t const* getProfileTensorValuesV2(
        char const* tensorName, int32_t profileIndex, OptProfileSelector select) const noexcept
    {
        return mImpl->getProfileTensorValuesV2(tensorName, profileIndex, select);
    }

    int64_t getEngineStat(EngineStat stat) const noexcept { return mImpl->getEngineStat(stat); }

protected:
    //! Implementation object every method forwards to. Value-initialized to nullptr,
    //! matching IRuntime::mImpl in this file, so the pointer is never indeterminate
    //! before a derived class assigns it.
    apiv::VCudaEngine* mImpl{};
};

//! Out-of-line definition required because the destructor is declared pure virtual.
inline ICudaEngine::~ICudaEngine() noexcept = default;


namespace v_1_0

{

//! \class IOutputAllocator
//!
//! \brief Versioned callback interface for allocating output tensor memory.
//!
//! An instance can be attached to an output tensor via IExecutionContext::setOutputAllocator().
//! Implementations must provide notifyShape(); the two reallocate functions have default bodies.
class IOutputAllocator : public IVersionedInterface

{

public:

    //! \brief Identify this interface as "IOutputAllocator", version 1.0.
    InterfaceInfo getInterfaceInfo() const noexcept override

    {

        return {"IOutputAllocator", 1, 0};

    }


    //! \brief Deprecated synchronous reallocation hook.
    //!
    //! The default implementation ignores all of its arguments and returns nullptr.
    //! Marked TRT_DEPRECATED; reallocateOutputAsync() is the stream-aware counterpart.
    //!
    //! \return Pointer to the memory to use for the output; nullptr in this default implementation.
    TRT_DEPRECATED virtual void* reallocateOutput(

        char const* /* tensorName */, void* /* currentMemory */, uint64_t /* size */, uint64_t /* alignment */) noexcept

    {

        return nullptr;

    }


    //! \brief Stream-aware reallocation hook.
    //!
    //! The default implementation drops the stream argument and delegates to reallocateOutput(),
    //! so an implementation that only overrides reallocateOutput() keeps working.
    //! Note that, unlike reallocateOutput(), this function is not declared noexcept.
    //!
    //! \param tensorName Name of the output tensor.
    //! \param currentMemory Memory currently associated with the tensor.
    //! \param size Requested size (presumably in bytes - confirm).
    //! \param alignment Requested alignment (presumably in bytes - confirm).
    //! \return Whatever reallocateOutput() returns in this default implementation.
    virtual void* reallocateOutputAsync(

        [[maybe_unused]] char const* tensorName, [[maybe_unused]] void* currentMemory, [[maybe_unused]] uint64_t size,

        [[maybe_unused]] uint64_t alignment, cudaStream_t /* stream */)

    {

        return reallocateOutput(tensorName, currentMemory, size, alignment);

    }


    //! \brief Callback receiving the name and dimensions of an output tensor.
    //!
    //! Pure virtual: every concrete allocator must implement it.
    //! NOTE(review): when exactly this is invoked is not visible here - confirm against the API reference.
    virtual void notifyShape(char const* tensorName, Dims const& dims) noexcept = 0;

};

} // namespace v_1_0


//! Unversioned alias for the current IOutputAllocator interface version.
using IOutputAllocator = v_1_0::IOutputAllocator;


namespace v_1_0

{

//! \class IDebugListener
//!
//! \brief Versioned callback interface that receives debug tensors.
//!
//! An instance can be attached to an execution context via IExecutionContext::setDebugListener().
class IDebugListener : public IVersionedInterface

{

public:

    //! \brief Identify this interface as "IDebugListener", version 1.0.
    InterfaceInfo getInterfaceInfo() const noexcept override

    {

        return {"IDebugListener", 1, 0};

    }


    //! \brief Callback invoked with one debug tensor; must be implemented by the listener.
    //!
    //! \param addr Address of the tensor data.
    //! \param location Where the tensor data lives, as a TensorLocation value.
    //! \param type Data type of the tensor.
    //! \param shape Shape of the tensor.
    //! \param name Name of the tensor.
    //! \param stream CUDA stream associated with the call.
    //! \return A bool status (presumably true on success - confirm against the API reference).
    //!
    //! Note that this function is not declared noexcept.
    virtual bool processDebugTensor(void const* addr, TensorLocation location, DataType type, Dims const& shape,

        char const* name, cudaStream_t stream)

        = 0;


    //! Public defaulted destructor overriding the base interface's destructor.
    ~IDebugListener() override = default;

};

} // namespace v_1_0


//! Unversioned alias for the current IDebugListener interface version.
using IDebugListener = v_1_0::IDebugListener;


class IExecutionContext : public INoCopy

{

public:

    virtual ~IExecutionContext() noexcept = 0;


    void setDebugSync(bool sync) noexcept

    {

        mImpl->setDebugSync(sync);

    }


    bool getDebugSync() const noexcept

    {

        return mImpl->getDebugSync();

    }


    void setProfiler(IProfiler* profiler) noexcept

    {

        mImpl->setProfiler(profiler);

    }


    IProfiler* getProfiler() const noexcept

    {

        return mImpl->getProfiler();

    }


    ICudaEngine const& getEngine() const noexcept

    {

        return mImpl->getEngine();

    }


    void setName(char const* name) noexcept

    {

        mImpl->setName(name);

    }


    char const* getName() const noexcept

    {

        return mImpl->getName();

    }


    void setDeviceMemory(void* memory) noexcept

    {

        mImpl->setDeviceMemory(memory);

    }


    void setDeviceMemoryV2(void* memory, int64_t size) noexcept

    {

        return mImpl->setDeviceMemoryV2(memory, size);

    }


    Dims getTensorStrides(char const* tensorName) const noexcept

    {

        return mImpl->getTensorStrides(tensorName);

    }


public:

    int32_t getOptimizationProfile() const noexcept

    {

        return mImpl->getOptimizationProfile();

    }


    bool setInputShape(char const* tensorName, Dims const& dims) noexcept

    {

        return mImpl->setInputShape(tensorName, dims);

    }


    Dims getTensorShape(char const* tensorName) const noexcept

    {

        return mImpl->getTensorShape(tensorName);

    }


    bool allInputDimensionsSpecified() const noexcept

    {

        return mImpl->allInputDimensionsSpecified();

    }


    void setErrorRecorder(IErrorRecorder* recorder) noexcept

    {

        mImpl->setErrorRecorder(recorder);

    }


    IErrorRecorder* getErrorRecorder() const noexcept

    {

        return mImpl->getErrorRecorder();

    }


    bool executeV2(void* const* bindings) noexcept

    {

        return mImpl->executeV2(bindings);

    }


    bool setOptimizationProfileAsync(int32_t profileIndex, cudaStream_t stream) noexcept

    {

        return mImpl->setOptimizationProfileAsync(profileIndex, stream);

    }


    void setEnqueueEmitsProfile(bool enqueueEmitsProfile) noexcept

    {

        mImpl->setEnqueueEmitsProfile(enqueueEmitsProfile);

    }


    bool getEnqueueEmitsProfile() const noexcept

    {

        return mImpl->getEnqueueEmitsProfile();

    }


    bool reportToProfiler() const noexcept

    {

        return mImpl->reportToProfiler();

    }


    bool setTensorAddress(char const* tensorName, void* data) noexcept

    {

        return mImpl->setTensorAddress(tensorName, data);

    }


    void const* getTensorAddress(char const* tensorName) const noexcept

    {

        return mImpl->getTensorAddress(tensorName);

    }


    bool setOutputTensorAddress(char const* tensorName, void* data) noexcept

    {

        return mImpl->setOutputTensorAddress(tensorName, data);

    }


    bool setInputTensorAddress(char const* tensorName, void const* data) noexcept

    {

        return mImpl->setInputTensorAddress(tensorName, data);

    }


    void* getOutputTensorAddress(char const* tensorName) const noexcept

    {

        return mImpl->getOutputTensorAddress(tensorName);

    }


    int32_t inferShapes(int32_t nbMaxNames, char const** tensorNames) noexcept

    {

        return mImpl->inferShapes(nbMaxNames, tensorNames);

    }


    size_t updateDeviceMemorySizeForShapes() noexcept

    {

        return mImpl->updateDeviceMemorySizeForShapes();

    }


    bool setInputConsumedEvent(cudaEvent_t event) noexcept

    {

        return mImpl->setInputConsumedEvent(event);

    }


    cudaEvent_t getInputConsumedEvent() const noexcept

    {

        return mImpl->getInputConsumedEvent();

    }


    bool setOutputAllocator(char const* tensorName, IOutputAllocator* outputAllocator) noexcept

    {

        return mImpl->setOutputAllocator(tensorName, outputAllocator);

    }


    IOutputAllocator* getOutputAllocator(char const* tensorName) const noexcept

    {

        return mImpl->getOutputAllocator(tensorName);

    }


    int64_t getMaxOutputSize(char const* tensorName) const noexcept

    {

        return mImpl->getMaxOutputSize(tensorName);

    }


    bool setTemporaryStorageAllocator(IGpuAllocator* allocator) noexcept

    {

        return mImpl->setTemporaryStorageAllocator(allocator);

    }


    IGpuAllocator* getTemporaryStorageAllocator() const noexcept

    {

        return mImpl->getTemporaryStorageAllocator();

    }


    bool enqueueV3(cudaStream_t stream) noexcept

    {

        return mImpl->enqueueV3(stream);

    }


    void setPersistentCacheLimit(size_t size) noexcept

    {

        mImpl->setPersistentCacheLimit(size);

    }


    size_t getPersistentCacheLimit() const noexcept

    {

        return mImpl->getPersistentCacheLimit();

    }


    bool setNvtxVerbosity(ProfilingVerbosity verbosity) noexcept

    {

        return mImpl->setNvtxVerbosity(verbosity);

    }


    ProfilingVerbosity getNvtxVerbosity() const noexcept

    {

        return mImpl->getNvtxVerbosity();

    }


    void setAuxStreams(cudaStream_t* auxStreams, int32_t nbStreams) noexcept

    {

        mImpl->setAuxStreams(auxStreams, nbStreams);

    }


    bool setDebugListener(IDebugListener* listener) noexcept

    {

        return mImpl->setDebugListener(listener);

    }


    IDebugListener* getDebugListener() noexcept

    {

        return mImpl->getDebugListener();

    }


    bool setTensorDebugState(char const* name, bool flag) noexcept

    {

        return mImpl->setTensorDebugState(name, flag);

    }


    bool getDebugState(char const* name) const noexcept

    {

        return mImpl->getDebugState(name);

    }


    IRuntimeConfig* getRuntimeConfig() const noexcept

    {

        return mImpl->getRuntimeConfig();

    }


    bool setAllTensorsDebugState(bool flag) noexcept

    {

        return mImpl->setAllTensorsDebugState(flag);

    }


    bool setUnfusedTensorsDebugState(bool flag) noexcept

    {

        return mImpl->setUnfusedTensorsDebugState(flag);

    }


    bool getUnfusedTensorsDebugState() const noexcept

    {

        return mImpl->getUnfusedTensorsDebugState();

    }


    bool setCommunicator(void* communicator) noexcept

    {

        return mImpl->setCommunicator(communicator);

    }


protected:

    apiv::VExecutionContext* mImpl;

}; // class IExecutionContext


inline IExecutionContext::~IExecutionContext() noexcept = default;


//! \enum LayerInformationFormat
//!
//! \brief Output format selector accepted by IEngineInspector::getLayerInformation() and
//!        IEngineInspector::getEngineInformation().
//!
//! When adding an enumerator, keep impl::EnumMaxImpl<LayerInformationFormat>::kVALUE in sync.
enum class LayerInformationFormat : int32_t

{

    //! One-line format (presumably one line of text per layer - confirm).
    kONELINE = 0,

    //! JSON format.
    kJSON = 1,

};


//! Specialization recording how many enumerators LayerInformationFormat has:
//! kVALUE is 2, matching kONELINE and kJSON.
template <>

struct impl::EnumMaxImpl<LayerInformationFormat>

{

    //! Number of LayerInformationFormat enumerators (one past the largest value, 1).
    static constexpr int32_t kVALUE = 2;

};


//! \class IEngineInspector
//!
//! \brief An engine inspector which prints out the layer information of an engine or an execution context.
//!
//! Every member function is a thin inline wrapper that forwards to the implementation object behind mImpl.
class IEngineInspector : public INoCopy

{

public:

    //! Pure virtual destructor; its defaulted body is defined right after the class.
    virtual ~IEngineInspector() noexcept = 0;


    //! \brief Forward the execution context pointer \p context to the implementation.
    //!
    //! \return The bool reported by the implementation (presumably true on success - confirm).
    bool setExecutionContext(IExecutionContext const* context) noexcept

    {

        return mImpl->setExecutionContext(context);

    }


    //! \brief Get the context currently being inspected.
    IExecutionContext const* getExecutionContext() const noexcept

    {

        return mImpl->getExecutionContext();

    }


    //! \brief Get a string describing the information about a specific layer in the current engine
    //!        or the execution context.
    //!
    //! \param layerIndex Index of the layer to describe.
    //! \param format Output format of the description.
    //! \return The string pointer reported by the implementation.
    //!         NOTE(review): lifetime of the returned string is not visible here - confirm.
    char const* getLayerInformation(int32_t layerIndex, LayerInformationFormat format) const noexcept

    {

        return mImpl->getLayerInformation(layerIndex, format);

    }


    //! \brief Get a string describing the information about all the layers in the current engine
    //!        or the execution context.
    //!
    //! \param format Output format of the description.
    //! \return The string pointer reported by the implementation.
    char const* getEngineInformation(LayerInformationFormat format) const noexcept

    {

        return mImpl->getEngineInformation(format);

    }


    //! \brief Set the ErrorRecorder for this interface.
    void setErrorRecorder(IErrorRecorder* recorder) noexcept

    {

        mImpl->setErrorRecorder(recorder);

    }


    //! \brief Get the ErrorRecorder assigned to this interface.
    IErrorRecorder* getErrorRecorder() const noexcept

    {

        return mImpl->getErrorRecorder();

    }


protected:

    //! Implementation object that every wrapper above forwards to.
    apiv::VEngineInspector* mImpl;

}; // class IEngineInspector


//! Out-of-class, defaulted definition of the pure virtual destructor declared above;
//! required because destructors of derived classes call it.
inline IEngineInspector::~IEngineInspector() noexcept = default;


} // namespace nvinfer1


//! C-linkage entry point behind nvinfer1::createInferRuntime(), which passes the address of an
//! ILogger as \p logger and NV_TENSORRT_VERSION as \p version and casts the result to IRuntime*.
extern "C" TENSORRTAPI void* createInferRuntime_INTERNAL(void* logger, int32_t version) noexcept;


//! C-linkage entry point behind nvinfer1::createInferRefitter(), which passes the addresses of an
//! ICudaEngine and an ILogger plus NV_TENSORRT_VERSION and casts the result to IRefitter*.
extern "C" TENSORRTAPI void* createInferRefitter_INTERNAL(void* engine, void* logger, int32_t version) noexcept;


//! Return the plugin registry.
extern "C" TENSORRTAPI nvinfer1::IPluginRegistry* getPluginRegistry() noexcept;


//! Return the logger object.
extern "C" TENSORRTAPI nvinfer1::ILogger* getLogger() noexcept;


namespace nvinfer1

{

namespace // unnamed namespace avoids linkage surprises when linking objects built with different versions of this

          // header.

{

//! \brief Create an IRuntime through the library's C entry point.
//!
//! Hands the address of \p logger and NV_TENSORRT_VERSION to createInferRuntime_INTERNAL() and
//! casts the untyped pointer it returns to IRuntime*.
//!
//! \param logger Logger whose address is passed to the library.
//! \return The pointer returned by createInferRuntime_INTERNAL(), typed as IRuntime*.
inline IRuntime* createInferRuntime(ILogger& logger) noexcept
{
    void* const rawRuntime = createInferRuntime_INTERNAL(&logger, NV_TENSORRT_VERSION);
    return static_cast<IRuntime*>(rawRuntime);
}


//! \brief Create an IRefitter for \p engine through the library's C entry point.
//!
//! Hands the addresses of \p engine and \p logger plus NV_TENSORRT_VERSION to
//! createInferRefitter_INTERNAL() and casts the untyped pointer it returns to IRefitter*.
//!
//! \param engine Engine whose address is passed to the library.
//! \param logger Logger whose address is passed to the library.
//! \return The pointer returned by createInferRefitter_INTERNAL(), typed as IRefitter*.
inline IRefitter* createInferRefitter(ICudaEngine& engine, ILogger& logger) noexcept
{
    void* const rawRefitter = createInferRefitter_INTERNAL(&engine, &logger, NV_TENSORRT_VERSION);
    return static_cast<IRefitter*>(rawRefitter);
}


} // namespace


//! \class PluginRegistrar
//!
//! \brief Registers a value-initialized creator of type T with the plugin registry on construction.
//!
//! The creator object is stored inside the registrar, so it lives exactly as long as the registrar.
//! It is registered under the empty plugin namespace "". The result of registerCreator() is not
//! inspected.
//!
//! \tparam T Plugin creator type; must be default-constructible.
template <typename T>
class PluginRegistrar
{
public:
    PluginRegistrar()
    {
        // `instance` is already constructed here: members are initialized before the constructor body.
        auto* const registry = getPluginRegistry();
        registry->registerCreator(instance, "");
    }

private:
    //! The creator handed to the registry.
    T instance{};
};


} // namespace nvinfer1


//! \brief Define a file-local static nvinfer1::PluginRegistrar<name>, so that a creator of type
//!        `name` is registered with the plugin registry during static initialization.
//!
//! \param name Plugin creator type. It is also pasted into the variable name (pluginRegistrar##name),
//!        so it must be a plain identifier rather than a qualified or templated type name.
//!
//! The replacement text must directly follow the line continuation: an empty line after the
//! backslash would end the macro with an empty body.
#define REGISTER_TENSORRT_PLUGIN(name)                                                                                 \
    static nvinfer1::PluginRegistrar<name> pluginRegistrar##name {}


namespace nvinfer1

{

namespace v_1_0

{

//! \class ILoggerFinder
//!
//! \brief Versioned interface whose single operation, findLogger(), yields an ILogger pointer.
class ILoggerFinder : public IVersionedInterface

{

public:

    //! \brief Identify this interface as "ILoggerFinder", version 1.0.
    InterfaceInfo getInterfaceInfo() const noexcept override

    {

        return {"ILoggerFinder", 1, 0};

    }


    //! \brief Return a logger; must be implemented by the concrete finder.
    //!
    //! Note that this function is not declared noexcept.
    virtual ILogger* findLogger() = 0;


protected:

    //! Protected destructor: a finder cannot be deleted through an ILoggerFinder pointer by outside code.
    ~ILoggerFinder() override = default;

};


} // namespace v_1_0


//! Unversioned alias for the current ILoggerFinder interface version.
using ILoggerFinder = v_1_0::ILoggerFinder;


namespace v_1_0

{


//! \class IGpuAsyncAllocator
//!
//! \brief IGpuAllocator variant whose required operations are the stream-aware ones.
//!
//! Implementations provide allocateAsync() and deallocateAsync(); the synchronous allocate() and
//! deallocate() inherited from IGpuAllocator are implemented here on top of them.
class IGpuAsyncAllocator : public IGpuAllocator

{

public:

    IGpuAsyncAllocator() = default;

    ~IGpuAsyncAllocator() override = default;


    //! \brief Stream-aware allocation; must be implemented by the concrete allocator.
    //!
    //! \param size Requested size (presumably in bytes - confirm).
    //! \param alignment Requested alignment (presumably in bytes - confirm).
    //! \param flags Allocator flags.
    //! \return Pointer to the allocated memory (failure convention not visible here - confirm).
    void* allocateAsync(uint64_t const size, uint64_t const alignment, AllocatorFlags const flags,

        cudaStream_t /*stream*/) noexcept override = 0;


    //! \brief Stream-aware deallocation; must be implemented by the concrete allocator.
    //!
    //! \param memory Memory to release.
    //! \return A bool status (presumably true on success - confirm).
    bool deallocateAsync(void* const memory, cudaStream_t /*stream*/) noexcept override = 0;


    //! \brief Deprecated synchronous allocation, implemented as allocateAsync() with a null stream.
    TRT_DEPRECATED void* allocate(

        uint64_t const size, uint64_t const alignment, AllocatorFlags const flags) noexcept override

    {

        return allocateAsync(size, alignment, flags, nullptr);

    }


    //! \brief Deprecated synchronous deallocation, implemented as deallocateAsync() with a null stream.
    TRT_DEPRECATED bool deallocate(void* const memory) noexcept override

    {

        return deallocateAsync(memory, nullptr);

    }


    //! \brief Identify this interface as "IGpuAllocator", version 1.0.
    //!
    //! NOTE(review): the reported name is "IGpuAllocator", not "IGpuAsyncAllocator". Presumably this is
    //! intentional so the object is accepted wherever an IGpuAllocator is expected - confirm before changing.
    InterfaceInfo getInterfaceInfo() const noexcept override

    {

        return {"IGpuAllocator", 1, 0};

    }

};


//! \class IPluginCreatorV3One
//!
//! \brief Plugin creator interface that produces IPluginV3 plugins.
//!
//! Concrete creators implement the five pure virtual functions below. Copy and move operations are
//! protected, so only derived classes can copy or move the base subobject.
class IPluginCreatorV3One : public IPluginCreatorInterface

{

public:

    //! \brief Identify this interface as "PLUGIN CREATOR_V3ONE", version 1.0.
    InterfaceInfo getInterfaceInfo() const noexcept override

    {

        return InterfaceInfo{"PLUGIN CREATOR_V3ONE", 1, 0};

    }


    //! \brief Create a plugin instance.
    //!
    //! \param name Name for the plugin (presumably the instance/layer name - confirm).
    //! \param fc Collection of plugin fields used to configure the plugin.
    //! \param phase TensorRT phase the plugin is being created for.
    //! \return The created plugin (failure convention not visible here - confirm).
    virtual IPluginV3* createPlugin(

        AsciiChar const* name, PluginFieldCollection const* fc, TensorRTPhase phase) noexcept = 0;


    //! \brief Return the collection of fields this creator understands.
    virtual PluginFieldCollection const* getFieldNames() noexcept = 0;


    //! \brief Return the plugin name.
    virtual AsciiChar const* getPluginName() const noexcept = 0;


    //! \brief Return the plugin version.
    virtual AsciiChar const* getPluginVersion() const noexcept = 0;


    //! \brief Return the plugin namespace.
    virtual AsciiChar const* getPluginNamespace() const noexcept = 0;


    IPluginCreatorV3One() = default;

    virtual ~IPluginCreatorV3One() = default;


protected:

    // Copy/move are defaulted but protected. The assignment operators are lvalue-ref-qualified (&),
    // so they cannot be invoked on temporaries.
    IPluginCreatorV3One(IPluginCreatorV3One const&) = default;

    IPluginCreatorV3One(IPluginCreatorV3One&&) = default;

    IPluginCreatorV3One& operator=(IPluginCreatorV3One const&) & = default;

    IPluginCreatorV3One& operator=(IPluginCreatorV3One&&) & = default;

};


} // namespace v_1_0


//! Unversioned alias for the current IGpuAsyncAllocator interface version.
using IGpuAsyncAllocator = v_1_0::IGpuAsyncAllocator;


//! Unversioned alias for the current IPluginCreatorV3One interface version.
using IPluginCreatorV3One = v_1_0::IPluginCreatorV3One;


} // namespace nvinfer1


//! Return the library major version number.
extern "C" TENSORRTAPI int32_t getInferLibMajorVersion() noexcept;

//! Return the library minor version number.
extern "C" TENSORRTAPI int32_t getInferLibMinorVersion() noexcept;

//! Return the library patch version number.
extern "C" TENSORRTAPI int32_t getInferLibPatchVersion() noexcept;

//! Return the library build version number.
extern "C" TENSORRTAPI int32_t getInferLibBuildVersion() noexcept;


#endif // NV_INFER_RUNTIME_H

NvInferImpl.h

NvInferPluginBase.h

getPluginRegistry
TENSORRTAPI nvinfer1::IPluginRegistry * getPluginRegistry() noexcept
Return the plugin registry.

getLogger
TENSORRTAPI nvinfer1::ILogger * getLogger() noexcept
Return the logger object.

getInferLibMinorVersion
TENSORRTAPI int32_t getInferLibMinorVersion() noexcept
Return the library minor version number.

getInferLibMajorVersion
TENSORRTAPI int32_t getInferLibMajorVersion() noexcept
Return the library major version number.

getInferLibPatchVersion
TENSORRTAPI int32_t getInferLibPatchVersion() noexcept
Return the library patch version number.

getInferLibBuildVersion
TENSORRTAPI int32_t getInferLibBuildVersion() noexcept
Return the library build version number.

TENSORRTAPI
#define TENSORRTAPI
Definition: NvInferRuntimeBase.h:70

NV_TENSORRT_VERSION
#define NV_TENSORRT_VERSION
Definition: NvInferRuntimeBase.h:102

TRT_NODISCARD
#define TRT_NODISCARD
A stand-in for [[nodiscard]] and [[nodiscard(REASON)]] that works with older compilers.
Definition: NvInferRuntimeBase.h:57

TRT_DEPRECATED
#define TRT_DEPRECATED
Definition: NvInferRuntimeBase.h:42

NvInferRuntimeCommon.h

Dims
Structure to define the dimensions of a tensor.

nvinfer1::Dims64
Definition: NvInferRuntimeBase.h:222

nvinfer1::Dims64::MAX_DIMS
static constexpr int32_t MAX_DIMS
The maximum rank (number of dimensions) supported for a tensor.
Definition: NvInferRuntimeBase.h:225

nvinfer1::DimsExprs
Analog of class Dims with expressions instead of constants for the dimensions.
Definition: NvInferRuntime.h:350

nvinfer1::DimsExprs::nbDims
int32_t nbDims
The number of dimensions.
Definition: NvInferRuntime.h:352

nvinfer1::ICudaEngine
An engine for executing inference on a built network, with functionally unsafe features.
Definition: NvInferRuntime.h:3013

nvinfer1::ICudaEngine::getTensorBytesPerComponent
int32_t getTensorBytesPerComponent(char const *tensorName) const noexcept
Return the number of bytes per component of an element, or -1 if the tensor is not vectorized or prov...
Definition: NvInferRuntime.h:3242

nvinfer1::ICudaEngine::createSerializationConfig
ISerializationConfig * createSerializationConfig() noexcept
Create a serialization configuration object.
Definition: NvInferRuntime.h:3602

nvinfer1::ICudaEngine::getIOTensorName
char const * getIOTensorName(int32_t index) const noexcept
Return name of an IO tensor.
Definition: NvInferRuntime.h:3566

nvinfer1::ICudaEngine::getWeightStreamingBudgetV2
int64_t getWeightStreamingBudgetV2() const noexcept
Returns the current weight streaming device memory budget in bytes.
Definition: NvInferRuntime.h:3693

nvinfer1::ICudaEngine::getEngineCapability
EngineCapability getEngineCapability() const noexcept
Determine what execution capability this engine has.
Definition: NvInferRuntime.h:3469

nvinfer1::ICudaEngine::getErrorRecorder
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:3503

nvinfer1::ICudaEngine::getTensorFormat
TensorFormat getTensorFormat(char const *tensorName, int32_t profileIndex) const noexcept
Return the tensor format of given profile, or TensorFormat::kLINEAR if the provided name does not map...
Definition: NvInferRuntime.h:3328

nvinfer1::ICudaEngine::getProfileTensorValuesV2
int64_t const * getProfileTensorValuesV2(char const *tensorName, int32_t profileIndex, OptProfileSelector select) const noexcept
Get the minimum / optimum / maximum values (not dimensions) for an input tensor given its name under ...
Definition: NvInferRuntime.h:3778

nvinfer1::ICudaEngine::mImpl
apiv::VCudaEngine * mImpl
Definition: NvInferRuntime.h:3812

nvinfer1::ICudaEngine::createExecutionContext
IExecutionContext * createExecutionContext(ExecutionContextAllocationStrategy strategy=ExecutionContextAllocationStrategy::kSTATIC) noexcept
Create an execution context and specify the strategy for allocating internal activation memory.
Definition: NvInferRuntime.h:3087

nvinfer1::ICudaEngine::getTensorFormatDesc
char const * getTensorFormatDesc(char const *tensorName) const noexcept
Return the human readable description of the tensor format, or empty string if the provided name does...
Definition: NvInferRuntime.h:3352

nvinfer1::ICudaEngine::getProfileShape
Dims getProfileShape(char const *tensorName, int32_t profileIndex, OptProfileSelector select) const noexcept
Get the minimum / optimum / maximum dimensions for an input tensor given its name under an optimizati...
Definition: NvInferRuntime.h:3454

nvinfer1::ICudaEngine::setWeightStreamingBudgetV2
bool setWeightStreamingBudgetV2(int64_t gpuMemoryBudget) noexcept
Limit the maximum amount of GPU memory usable for network weights in bytes.
Definition: NvInferRuntime.h:3677

nvinfer1::ICudaEngine::createExecutionContext
IExecutionContext * createExecutionContext(IRuntimeConfig *runtimeConfig) noexcept
Create an execution context with TensorRT JIT runtime config.
Definition: NvInferRuntime.h:3170

nvinfer1::ICudaEngine::getNbAuxStreams
int32_t getNbAuxStreams() const noexcept
Return the number of auxiliary streams used by this engine.
Definition: NvInferRuntime.h:3592

nvinfer1::ICudaEngine::getStreamableWeightsSize
int64_t getStreamableWeightsSize() const noexcept
Get the total size in bytes of all streamable weights.
Definition: NvInferRuntime.h:3638

nvinfer1::ICudaEngine::getTensorDataType
DataType getTensorDataType(char const *tensorName) const noexcept
Determine the required data type for a buffer from its tensor name.
Definition: NvInferRuntime.h:3042

nvinfer1::ICudaEngine::setErrorRecorder
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:3488

nvinfer1::ICudaEngine::getTacticSources
TacticSources getTacticSources() const noexcept
Return the tactic sources required by this engine.
Definition: NvInferRuntime.h:3519

nvinfer1::ICudaEngine::getAliasedInputTensor
TRT_NODISCARD char const * getAliasedInputTensor(char const *tensorName) const noexcept
Get the input tensor name that an output tensor should alias with.
Definition: NvInferRuntime.h:3158

nvinfer1::ICudaEngine::serializeWithConfig
IHostMemory * serializeWithConfig(ISerializationConfig &config) const noexcept
Serialize the network to a stream with the provided SerializationConfig.
Definition: NvInferRuntime.h:3622

nvinfer1::ICudaEngine::getWeightStreamingAutomaticBudget
int64_t getWeightStreamingAutomaticBudget() const noexcept
TensorRT automatically determines a device memory budget for the model to run. The budget is close to...
Definition: NvInferRuntime.h:3716

nvinfer1::ICudaEngine::isDebugTensor
bool isDebugTensor(char const *name) const noexcept
Check if a tensor is marked as a debug tensor.
Definition: NvInferRuntime.h:3756

nvinfer1::ICudaEngine::getTensorVectorizedDim
int32_t getTensorVectorizedDim(char const *tensorName, int32_t profileIndex) const noexcept
Return the dimension index along which the buffer is vectorized for the given profile, or -1 if the provided name...
Definition: NvInferRuntime.h:3408

nvinfer1::ICudaEngine::getName
char const * getName() const noexcept
Returns the name of the network associated with the engine.
Definition: NvInferRuntime.h:3423

nvinfer1::ICudaEngine::getProfilingVerbosity
ProfilingVerbosity getProfilingVerbosity() const noexcept
Return the ProfilingVerbosity the builder config was set to when the engine was built.
Definition: NvInferRuntime.h:3531

nvinfer1::ICudaEngine::isShapeInferenceIO
bool isShapeInferenceIO(char const *tensorName) const noexcept
True if tensor is required as input for shape calculations or is output from shape calculations.
Definition: NvInferRuntime.h:3125

nvinfer1::ICudaEngine::getWeightStreamingScratchMemorySize
int64_t getWeightStreamingScratchMemorySize() const noexcept
Returns the size of the scratch memory required by the current weight streaming budget.
Definition: NvInferRuntime.h:3742

nvinfer1::ICudaEngine::getDeviceMemorySizeV2
int64_t getDeviceMemorySizeV2() const noexcept
Return the maximum device memory required by the context over all profiles.
Definition: NvInferRuntime.h:3197

nvinfer1::ICudaEngine::getTensorVectorizedDim
int32_t getTensorVectorizedDim(char const *tensorName) const noexcept
Return the dimension index along which the buffer is vectorized, or -1 if the provided name does not map to ...
Definition: NvInferRuntime.h:3392

nvinfer1::ICudaEngine::getTensorComponentsPerElement
int32_t getTensorComponentsPerElement(char const *tensorName, int32_t profileIndex) const noexcept
Return the number of components included in one element of given profile, or -1 if tensor is not vect...
Definition: NvInferRuntime.h:3299

nvinfer1::ICudaEngine::getDeviceMemorySizeForProfileV2
int64_t getDeviceMemorySizeForProfileV2(int32_t profileIndex) const noexcept
Return the maximum device memory required by the context for a profile.
Definition: NvInferRuntime.h:3211

nvinfer1::ICudaEngine::createRuntimeConfig
IRuntimeConfig * createRuntimeConfig() noexcept
Create a runtime config for TensorRT JIT. The caller is responsible for ownership of the returned IRu...
Definition: NvInferRuntime.h:3183

nvinfer1::ICudaEngine::getTensorFormat
TensorFormat getTensorFormat(char const *tensorName) const noexcept
Return the tensor format, or TensorFormat::kLINEAR if the provided name does not map to an input or o...
Definition: NvInferRuntime.h:3314

nvinfer1::ICudaEngine::serialize
IHostMemory * serialize() const noexcept
Serialize the network to a stream.
Definition: NvInferRuntime.h:3070

nvinfer1::ICudaEngine::getEngineStat
int64_t getEngineStat(EngineStat stat) const noexcept
Get engine statistics according to the given enum value.
Definition: NvInferRuntime.h:3806

nvinfer1::ICudaEngine::getTensorLocation
TensorLocation getTensorLocation(char const *tensorName) const noexcept
Get whether an input or output tensor must be on GPU or CPU.
Definition: NvInferRuntime.h:3105

nvinfer1::ICudaEngine::createEngineInspector
IEngineInspector * createEngineInspector() const noexcept
Create a new engine inspector which prints the layer information in an engine or an execution context...
Definition: NvInferRuntime.h:3541

nvinfer1::ICudaEngine::getTensorBytesPerComponent
int32_t getTensorBytesPerComponent(char const *tensorName, int32_t profileIndex) const noexcept
Return the number of bytes per component of an element for the given profile, or -1 if the tensor is...
Definition: NvInferRuntime.h:3260

nvinfer1::ICudaEngine::getHardwareCompatibilityLevel
HardwareCompatibilityLevel getHardwareCompatibilityLevel() const noexcept
Return the hardware compatibility level of this engine.
Definition: NvInferRuntime.h:3577

nvinfer1::ICudaEngine::getNbOptimizationProfiles
int32_t getNbOptimizationProfiles() const noexcept
Get the number of optimization profiles defined for this engine.
Definition: NvInferRuntime.h:3434

nvinfer1::ICudaEngine::getTensorFormatDesc
char const * getTensorFormatDesc(char const *tensorName, int32_t profileIndex) const noexcept
Return the human readable description of the tensor format of given profile, or empty string if the p...
Definition: NvInferRuntime.h:3375

nvinfer1::ICudaEngine::getTensorIOMode
TensorIOMode getTensorIOMode(char const *tensorName) const noexcept
Determine whether a tensor is an input or output tensor.
Definition: NvInferRuntime.h:3139

nvinfer1::ICudaEngine::getNbLayers
int32_t getNbLayers() const noexcept
Get the number of layers in the network.
Definition: NvInferRuntime.h:3056

nvinfer1::ICudaEngine::getNbIOTensors
int32_t getNbIOTensors() const noexcept
Return number of IO tensors.
Definition: NvInferRuntime.h:3554

nvinfer1::ICudaEngine::~ICudaEngine
virtual ~ICudaEngine() noexcept=0

nvinfer1::ICudaEngine::getTensorComponentsPerElement
int32_t getTensorComponentsPerElement(char const *tensorName) const noexcept
Return the number of components included in one element, or -1 if tensor is not vectorized or if the ...
Definition: NvInferRuntime.h:3281

nvinfer1::ICudaEngine::isRefittable
bool isRefittable() const noexcept
Return true if an engine can be refit.
Definition: NvInferRuntime.h:3221

nvinfer1::IDimensionExpr
An IDimensionExpr represents an integer expression constructed from constants, input dimensions,...
Definition: NvInferRuntime.h:228

nvinfer1::IDimensionExpr::isConstant
bool isConstant() const noexcept
Return true if expression is a build-time constant.
Definition: NvInferRuntime.h:233

nvinfer1::IDimensionExpr::isSizeTensor
bool isSizeTensor() const noexcept
Return true if this denotes the value of a size tensor.
Definition: NvInferRuntime.h:259

nvinfer1::IDimensionExpr::~IDimensionExpr
virtual ~IDimensionExpr() noexcept=0

nvinfer1::IDimensionExpr::mImpl
apiv::VDimensionExpr * mImpl
Definition: NvInferRuntime.h:250

nvinfer1::IDimensionExpr::getConstantValue
int64_t getConstantValue() const noexcept
Get the value of the constant.
Definition: NvInferRuntime.h:244

nvinfer1::IEngineInspector
An engine inspector which prints out the layer information of an engine or an execution context.
Definition: NvInferRuntime.h:4906

nvinfer1::IEngineInspector::getLayerInformation
char const * getLayerInformation(int32_t layerIndex, LayerInformationFormat format) const noexcept
Get a string describing the information about a specific layer in the current engine or the execution...
Definition: NvInferRuntime.h:4959

nvinfer1::IEngineInspector::getErrorRecorder
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:5016

nvinfer1::IEngineInspector::setErrorRecorder
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:5001

nvinfer1::IEngineInspector::~IEngineInspector
virtual ~IEngineInspector() noexcept=0

nvinfer1::IEngineInspector::getExecutionContext
IExecutionContext const * getExecutionContext() const noexcept
Get the context currently being inspected.
Definition: NvInferRuntime.h:4934

nvinfer1::IEngineInspector::mImpl
apiv::VEngineInspector * mImpl
Definition: NvInferRuntime.h:5022

nvinfer1::IEngineInspector::getEngineInformation
char const * getEngineInformation(LayerInformationFormat format) const noexcept
Get a string describing the information about all the layers in the current engine or the execution c...
Definition: NvInferRuntime.h:4982

nvinfer1::IExecutionContext
Context for executing inference using an engine, with functionally unsafe features.
Definition: NvInferRuntime.h:3957

nvinfer1::IExecutionContext::getOutputAllocator
IOutputAllocator * getOutputAllocator(char const *tensorName) const noexcept
Get output allocator associated with output tensor of given name, or nullptr if the provided name doe...
Definition: NvInferRuntime.h:4573

nvinfer1::IExecutionContext::getErrorRecorder
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:4221

nvinfer1::IExecutionContext::reportToProfiler
bool reportToProfiler() const noexcept
Calculate layer timing info for the current optimization profile in IExecutionContext and update the ...
Definition: NvInferRuntime.h:4340

nvinfer1::IExecutionContext::setDeviceMemory
void setDeviceMemory(void *memory) noexcept
Set the device memory for use by this execution context.
Definition: NvInferRuntime.h:4059

nvinfer1::IExecutionContext::setTensorDebugState
bool setTensorDebugState(char const *name, bool flag) noexcept
Set debug state of tensor given the tensor name.
Definition: NvInferRuntime.h:4780

nvinfer1::IExecutionContext::getName
char const * getName() const noexcept
Return the name of the execution context.
Definition: NvInferRuntime.h:4033

nvinfer1::IExecutionContext::getTemporaryStorageAllocator
IGpuAllocator * getTemporaryStorageAllocator() const noexcept
Get allocator set by setTemporaryStorageAllocator.
Definition: NvInferRuntime.h:4621

nvinfer1::IExecutionContext::setEnqueueEmitsProfile
void setEnqueueEmitsProfile(bool enqueueEmitsProfile) noexcept
Set whether enqueue emits layer timing to the profiler.
Definition: NvInferRuntime.h:4298

nvinfer1::IExecutionContext::setUnfusedTensorsDebugState
bool setUnfusedTensorsDebugState(bool flag) noexcept
Turn the debug state of unfused tensors on or off.
Definition: NvInferRuntime.h:4831

nvinfer1::IExecutionContext::getTensorShape
Dims getTensorShape(char const *tensorName) const noexcept
Return the shape of the given input or output.
Definition: NvInferRuntime.h:4171

nvinfer1::IExecutionContext::getDebugState
bool getDebugState(char const *name) const noexcept
Get the debug state.
Definition: NvInferRuntime.h:4792

nvinfer1::IExecutionContext::setInputShape
bool setInputShape(char const *tensorName, Dims const &dims) noexcept
Set shape of given input.
Definition: NvInferRuntime.h:4134

nvinfer1::IExecutionContext::executeV2
bool executeV2(void *const *bindings) noexcept
Synchronously execute a network.
Definition: NvInferRuntime.h:4238

nvinfer1::IExecutionContext::getEnqueueEmitsProfile
bool getEnqueueEmitsProfile() const noexcept
Get the enqueueEmitsProfile state.
Definition: NvInferRuntime.h:4310

nvinfer1::IExecutionContext::getTensorAddress
void const * getTensorAddress(char const *tensorName) const noexcept
Get memory address bound to given input or output tensor, or nullptr if the provided name does not ma...
Definition: NvInferRuntime.h:4401

nvinfer1::IExecutionContext::setOutputAllocator
bool setOutputAllocator(char const *tensorName, IOutputAllocator *outputAllocator) noexcept
Set output allocator to use for output tensor of given name. Pass nullptr to outputAllocator to unset...
Definition: NvInferRuntime.h:4560

nvinfer1::IExecutionContext::setOptimizationProfileAsync
bool setOptimizationProfileAsync(int32_t profileIndex, cudaStream_t stream) noexcept
Select an optimization profile for the current context with async semantics.
Definition: NvInferRuntime.h:4282

nvinfer1::IExecutionContext::mImpl
apiv::VExecutionContext * mImpl
Definition: NvInferRuntime.h:4865

nvinfer1::IExecutionContext::setOutputTensorAddress
bool setOutputTensorAddress(char const *tensorName, void *data) noexcept
Set the memory address for a given output tensor.
Definition: NvInferRuntime.h:4424

nvinfer1::IExecutionContext::setPersistentCacheLimit
void setPersistentCacheLimit(size_t size) noexcept
Set the maximum size for persistent cache usage.
Definition: NvInferRuntime.h:4661

nvinfer1::IExecutionContext::~IExecutionContext
virtual ~IExecutionContext() noexcept=0

nvinfer1::IExecutionContext::getPersistentCacheLimit
size_t getPersistentCacheLimit() const noexcept
Get the maximum size for persistent cache usage.
Definition: NvInferRuntime.h:4672

nvinfer1::IExecutionContext::setAllTensorsDebugState
bool setAllTensorsDebugState(bool flag) noexcept
Turn the debug state of all debug tensors on or off.
Definition: NvInferRuntime.h:4815

nvinfer1::IExecutionContext::getEngine
ICudaEngine const & getEngine() const noexcept
Get the associated engine.
Definition: NvInferRuntime.h:4009

nvinfer1::IExecutionContext::getNvtxVerbosity
ProfilingVerbosity getNvtxVerbosity() const noexcept
Get the NVTX verbosity of the execution context.
Definition: NvInferRuntime.h:4708

nvinfer1::IExecutionContext::updateDeviceMemorySizeForShapes
size_t updateDeviceMemorySizeForShapes() noexcept
Recompute the internal activation buffer sizes based on the current input shapes, and return the tota...
Definition: NvInferRuntime.h:4515

nvinfer1::IExecutionContext::setAuxStreams
void setAuxStreams(cudaStream_t *auxStreams, int32_t nbStreams) noexcept
Set the auxiliary streams that TensorRT should launch kernels on in the next enqueueV3() call.
Definition: NvInferRuntime.h:4739

nvinfer1::IExecutionContext::getMaxOutputSize
int64_t getMaxOutputSize(char const *tensorName) const noexcept
Get upper bound on an output tensor's size, in bytes, based on the current optimization profile and i...
Definition: NvInferRuntime.h:4591

nvinfer1::IExecutionContext::inferShapes
int32_t inferShapes(int32_t nbMaxNames, char const **tensorNames) noexcept
Run shape calculations.
Definition: NvInferRuntime.h:4498

nvinfer1::IExecutionContext::setDebugListener
bool setDebugListener(IDebugListener *listener) noexcept
Set DebugListener for this execution context.
Definition: NvInferRuntime.h:4751

nvinfer1::IExecutionContext::setTensorAddress
bool setTensorAddress(char const *tensorName, void *data) noexcept
Set memory address for given input or output tensor.
Definition: NvInferRuntime.h:4384

nvinfer1::IExecutionContext::setTemporaryStorageAllocator
bool setTemporaryStorageAllocator(IGpuAllocator *allocator) noexcept
Specify allocator to use for internal temporary storage.
Definition: NvInferRuntime.h:4611

nvinfer1::IExecutionContext::getOutputTensorAddress
void * getOutputTensorAddress(char const *tensorName) const noexcept
Get memory address for given output.
Definition: NvInferRuntime.h:4465

nvinfer1::IExecutionContext::enqueueV3
bool enqueueV3(cudaStream_t stream) noexcept
Enqueue inference on a stream.
Definition: NvInferRuntime.h:4645

nvinfer1::IExecutionContext::getDebugListener
IDebugListener * getDebugListener() noexcept
Get the DebugListener of this execution context.
Definition: NvInferRuntime.h:4761

nvinfer1::IExecutionContext::getOptimizationProfile
int32_t getOptimizationProfile() const noexcept
Get the index of the currently selected optimization profile.
Definition: NvInferRuntime.h:4116

nvinfer1::IExecutionContext::setInputTensorAddress
bool setInputTensorAddress(char const *tensorName, void const *data) noexcept
Set memory address for given input.
Definition: NvInferRuntime.h:4446

nvinfer1::IExecutionContext::getDebugSync
bool getDebugSync() const noexcept
Get the debug sync flag.
Definition: NvInferRuntime.h:3979

nvinfer1::IExecutionContext::setInputConsumedEvent
bool setInputConsumedEvent(cudaEvent_t event) noexcept
Mark input as consumed.
Definition: NvInferRuntime.h:4531

nvinfer1::IExecutionContext::getTensorStrides
Dims getTensorStrides(char const *tensorName) const noexcept
Return the strides of the buffer for the given tensor name.
Definition: NvInferRuntime.h:4101

nvinfer1::IExecutionContext::setNvtxVerbosity
bool setNvtxVerbosity(ProfilingVerbosity verbosity) noexcept
Set the verbosity of the NVTX markers in the execution context.
Definition: NvInferRuntime.h:4696

nvinfer1::IExecutionContext::getProfiler
IProfiler * getProfiler() const noexcept
Get the profiler.
Definition: NvInferRuntime.h:3999

nvinfer1::IExecutionContext::setErrorRecorder
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:4206

nvinfer1::IExecutionContext::setCommunicator
bool setCommunicator(void *communicator) noexcept
Set the NCCL communicator for the execution context.
Definition: NvInferRuntime.h:4859

nvinfer1::IExecutionContext::setDeviceMemoryV2
void setDeviceMemoryV2(void *memory, int64_t size) noexcept
Set the device memory and its corresponding size for use by this execution context.
Definition: NvInferRuntime.h:4080

nvinfer1::IExecutionContext::allInputDimensionsSpecified
bool allInputDimensionsSpecified() const noexcept
Whether all dynamic dimensions of input tensors have been specified.
Definition: NvInferRuntime.h:4187

nvinfer1::IExecutionContext::getUnfusedTensorsDebugState
bool getUnfusedTensorsDebugState() const noexcept
Get the debug state of unfused tensors.
Definition: NvInferRuntime.h:4841

nvinfer1::IExecutionContext::setProfiler
void setProfiler(IProfiler *profiler) noexcept
Set the profiler.
Definition: NvInferRuntime.h:3989

nvinfer1::IExecutionContext::setName
void setName(char const *name) noexcept
Set the name of the execution context.
Definition: NvInferRuntime.h:4023

nvinfer1::IExecutionContext::getInputConsumedEvent
cudaEvent_t getInputConsumedEvent() const noexcept
The event associated with consuming the input.
Definition: NvInferRuntime.h:4541

nvinfer1::IExecutionContext::getRuntimeConfig
IRuntimeConfig * getRuntimeConfig() const noexcept
Get the runtime config object used during execution context creation.
Definition: NvInferRuntime.h:4802

nvinfer1::IExprBuilder
Object for constructing IDimensionExpr.
Definition: NvInferRuntime.h:285

nvinfer1::IExprBuilder::operation
IDimensionExpr const * operation(DimensionOperation op, IDimensionExpr const &first, IDimensionExpr const &second) noexcept
Get the operation.
Definition: NvInferRuntime.h:301

nvinfer1::IExprBuilder::constant
IDimensionExpr const * constant(int64_t value) noexcept
Return pointer to IDimensionExpr for given value.
Definition: NvInferRuntime.h:290

nvinfer1::IExprBuilder::mImpl
apiv::VExprBuilder * mImpl
Definition: NvInferRuntime.h:308

nvinfer1::IExprBuilder::~IExprBuilder
virtual ~IExprBuilder() noexcept=0

nvinfer1::IHostMemory
Class to handle library allocated memory that is accessible to the user.
Definition: NvInferRuntime.h:139

nvinfer1::IHostMemory::data
void * data() const noexcept
A pointer to the raw data that is owned by the library.
Definition: NvInferRuntime.h:144

nvinfer1::IHostMemory::~IHostMemory
virtual ~IHostMemory() noexcept=0

nvinfer1::IHostMemory::type
DataType type() const noexcept
The type of the memory that was allocated.
Definition: NvInferRuntime.h:156

nvinfer1::IHostMemory::size
std::size_t size() const noexcept
The size in bytes of the data that was allocated.
Definition: NvInferRuntime.h:150

nvinfer1::IHostMemory::mImpl
apiv::VHostMemory * mImpl
Definition: NvInferRuntime.h:162

nvinfer1::INoCopy
Base class for TensorRT interfaces; objects of derived classes are neither copyable nor movable.
Definition: NvInferRuntime.h:51

nvinfer1::INoCopy::operator=
INoCopy & operator=(INoCopy &&other)=delete

nvinfer1::INoCopy::INoCopy
INoCopy(INoCopy const &other)=delete

nvinfer1::INoCopy::INoCopy
INoCopy(INoCopy &&other)=delete

nvinfer1::INoCopy::INoCopy
INoCopy()=default

nvinfer1::INoCopy::~INoCopy
virtual ~INoCopy()=default

nvinfer1::INoCopy::operator=
INoCopy & operator=(INoCopy const &other)=delete

nvinfer1::IOptimizationProfile
Optimization profile for dynamic input dimensions and shape tensors.
Definition: NvInferRuntime.h:2575

nvinfer1::IOptimizationProfile::mImpl
apiv::VOptimizationProfile * mImpl
Definition: NvInferRuntime.h:2742

nvinfer1::IOptimizationProfile::getDimensions
Dims getDimensions(char const *inputName, OptProfileSelector select) const noexcept
Get the minimum / optimum / maximum dimensions for a dynamic input tensor.
Definition: NvInferRuntime.h:2616

nvinfer1::IOptimizationProfile::getExtraMemoryTarget
float getExtraMemoryTarget() const noexcept
Get the extra memory target that has been defined for this profile.
Definition: NvInferRuntime.h:2659

nvinfer1::IOptimizationProfile::setExtraMemoryTarget
bool setExtraMemoryTarget(float target) noexcept
Set a target for extra GPU memory that may be used by this profile.
Definition: NvInferRuntime.h:2647

nvinfer1::IOptimizationProfile::setDimensions
bool setDimensions(char const *inputName, OptProfileSelector select, Dims const &dims) noexcept
Set the minimum / optimum / maximum dimensions for a dynamic input tensor.
Definition: NvInferRuntime.h:2604

nvinfer1::IOptimizationProfile::~IOptimizationProfile
virtual ~IOptimizationProfile() noexcept=0

nvinfer1::IOptimizationProfile::isValid
bool isValid() const noexcept
Check whether the optimization profile can be passed to an IBuilderConfig object.
Definition: NvInferRuntime.h:2676

nvinfer1::IOptimizationProfile::getShapeValuesV2
int64_t const * getShapeValuesV2(char const *inputName, OptProfileSelector select) const noexcept
Get the minimum / optimum / maximum values for an input shape tensor.
Definition: NvInferRuntime.h:2736

nvinfer1::IOptimizationProfile::setShapeValuesV2
bool setShapeValuesV2(char const *inputName, OptProfileSelector select, int64_t const *values, int32_t nbValues) noexcept
Set the minimum / optimum / maximum values for an input shape tensor.
Definition: NvInferRuntime.h:2723

nvinfer1::IOptimizationProfile::getNbShapeValues
int32_t getNbShapeValues(char const *inputName) const noexcept
Get the number of values for an input shape tensor.
Definition: NvInferRuntime.h:2629

nvinfer1::IPluginRegistry
Single registration point for all plugins in an application. It is used to find plugin implementation...
Definition: NvInferRuntimeCommon.h:56

nvinfer1::IPluginRegistry::registerCreator
virtual bool registerCreator(IPluginCreatorInterface &creator, AsciiChar const *const pluginNamespace) noexcept=0
Register a plugin creator. Returns false if a plugin creator with the same type is already registered...

nvinfer1::IPluginResourceContext
Interface for plugins to access per context resources provided by TensorRT.
Definition: NvInferRuntime.h:792

nvinfer1::IPluginResourceContext::getErrorRecorder
virtual IErrorRecorder * getErrorRecorder() const noexcept=0
Get the error recorder associated with the resource context.

nvinfer1::IPluginResourceContext::operator=
IPluginResourceContext & operator=(IPluginResourceContext const &) &=default

nvinfer1::IPluginResourceContext::getGpuAllocator
virtual IGpuAllocator * getGpuAllocator() const noexcept=0
Get the GPU allocator associated with the resource context.

nvinfer1::IPluginV2DynamicExt
Similar to IPluginV2Ext, but with support for dynamic shapes.
Definition: NvInferRuntime.h:407

nvinfer1::IPluginV2DynamicExt::clone
IPluginV2DynamicExt * clone() const noexcept override=0
Clone the plugin object. This copies over internal plugin parameters as well and returns a new plugin...

nvinfer1::IPluginV2DynamicExt::~IPluginV2DynamicExt
virtual ~IPluginV2DynamicExt() noexcept
Definition: NvInferRuntime.h:556

nvinfer1::IPluginV2Ext
Plugin class for user-implemented layers.
Definition: NvInferRuntimePlugin.h:474

nvinfer1::IRefitter
Updates weights in an engine.
Definition: NvInferRuntime.h:2169

nvinfer1::IRefitter::refitCudaEngineAsync
bool refitCudaEngineAsync(cudaStream_t stream) noexcept
Enqueue weights refitting of the associated engine on the given stream.
Definition: NvInferRuntime.h:2499

nvinfer1::IRefitter::getMaxThreads
int32_t getMaxThreads() const noexcept
Get the maximum number of threads that can be used by the refitter.
Definition: NvInferRuntime.h:2378

nvinfer1::IRefitter::getWeightsLocation
TensorLocation getWeightsLocation(char const *weightsName) const noexcept
Get location for the weights associated with the given name.
Definition: NvInferRuntime.h:2437

nvinfer1::IRefitter::setNamedWeights
bool setNamedWeights(char const *name, Weights weights) noexcept
Specify new weights of given name.
Definition: NvInferRuntime.h:2302

nvinfer1::IRefitter::getAllWeights
int32_t getAllWeights(int32_t size, char const **weightsNames) noexcept
Get names of all weights that could be refit.
Definition: NvInferRuntime.h:2338

nvinfer1::IRefitter::~IRefitter
virtual ~IRefitter() noexcept=0

nvinfer1::IRefitter::getLogger
ILogger * getLogger() const noexcept
Get the logger with which the refitter was created.
Definition: NvInferRuntime.h:2348

nvinfer1::IRefitter::refitCudaEngine
bool refitCudaEngine() noexcept
Refits associated engine.
Definition: NvInferRuntime.h:2205

nvinfer1::IRefitter::getMissingWeights
int32_t getMissingWeights(int32_t size, char const **weightsNames) noexcept
Get names of missing weights.
Definition: NvInferRuntime.h:2322

nvinfer1::IRefitter::getMissing
int32_t getMissing(int32_t size, char const **layerNames, WeightsRole *roles) noexcept
Get description of missing weights.
Definition: NvInferRuntime.h:2226

nvinfer1::IRefitter::getNamedWeights
Weights getNamedWeights(char const *weightsName) const noexcept
Get weights associated with the given name.
Definition: NvInferRuntime.h:2421

nvinfer1::IRefitter::unsetNamedWeights
bool unsetNamedWeights(char const *weightsName) noexcept
Unset weights associated with the given name.
Definition: NvInferRuntime.h:2453

nvinfer1::IRefitter::getWeightsPrototype
Weights getWeightsPrototype(char const *weightsName) const noexcept
Get the Weights prototype associated with the given name.
Definition: NvInferRuntime.h:2517

nvinfer1::IRefitter::setMaxThreads
bool setMaxThreads(int32_t maxThreads) noexcept
Set the maximum number of threads.
Definition: NvInferRuntime.h:2364

nvinfer1::IRefitter::setNamedWeights
bool setNamedWeights(char const *name, Weights weights, TensorLocation location) noexcept
Specify new weights on a specified device of given name.
Definition: NvInferRuntime.h:2405

nvinfer1::IRefitter::setWeightsValidation
void setWeightsValidation(bool weightsValidation) noexcept
Set whether to validate weights during refitting.
Definition: NvInferRuntime.h:2469

nvinfer1::IRefitter::mImpl
apiv::VRefitter * mImpl
Definition: NvInferRuntime.h:2523

nvinfer1::IRefitter::getAll
int32_t getAll(int32_t size, char const **layerNames, WeightsRole *roles) noexcept
Get description of all weights that could be refit.
Definition: NvInferRuntime.h:2243

nvinfer1::IRefitter::getWeightsValidation
bool getWeightsValidation() const noexcept
Get whether to validate weights values during refitting.
Definition: NvInferRuntime.h:2477

nvinfer1::IRefitter::setErrorRecorder
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:2262

nvinfer1::IRefitter::getErrorRecorder
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:2277

nvinfer1::IRuntimeConfig
A class for runtime configuration. This class is used during execution context creation.
Definition: NvInferRuntime.h:2950

nvinfer1::IRuntimeConfig::mImpl
apiv::VRuntimeConfig * mImpl
Definition: NvInferRuntime.h:2976

nvinfer1::IRuntimeConfig::~IRuntimeConfig
virtual ~IRuntimeConfig() noexcept=0

nvinfer1::IRuntimeConfig::getExecutionContextAllocationStrategy
ExecutionContextAllocationStrategy getExecutionContextAllocationStrategy() const noexcept
Get the execution context allocation strategy.
Definition: NvInferRuntime.h:2969

nvinfer1::IRuntime
Allows a serialized functionally unsafe engine to be deserialized.
Definition: NvInferRuntime.h:1862

nvinfer1::IRuntime::setMaxThreads
bool setMaxThreads(int32_t maxThreads) noexcept
Set the maximum number of threads.
Definition: NvInferRuntime.h:2011

nvinfer1::IRuntime::loadRuntime
IRuntime * loadRuntime(char const *path) noexcept
Load IRuntime from the file.
Definition: NvInferRuntime.h:2127

nvinfer1::IRuntime::getEngineHostCodeAllowed
bool getEngineHostCodeAllowed() const noexcept
Get whether the runtime is allowed to deserialize engines with host executable code.
Definition: NvInferRuntime.h:2149

nvinfer1::IRuntime::getTempfileControlFlags
TempfileControlFlags getTempfileControlFlags() const noexcept
Get the tempfile control flags for this runtime.
Definition: NvInferRuntime.h:2099

nvinfer1::IRuntime::setEngineHostCodeAllowed
void setEngineHostCodeAllowed(bool allowed) noexcept
Set whether the runtime is allowed to deserialize engines with host executable code.
Definition: NvInferRuntime.h:2139

nvinfer1::IRuntime::setTemporaryDirectory
void setTemporaryDirectory(char const *path) noexcept
Set the directory that will be used by this runtime for temporary files.
Definition: NvInferRuntime.h:2060

nvinfer1::IRuntime::getPluginRegistry
IPluginRegistry & getPluginRegistry() noexcept
Get the local plugin registry that can be used by the runtime.
Definition: NvInferRuntime.h:2109

nvinfer1::IRuntime::getNbDLACores
int32_t getNbDLACores() const noexcept
Returns number of DLA hardware cores accessible or 0 if DLA is unavailable.
Definition: NvInferRuntime.h:1895

nvinfer1::IRuntime::deserializeCudaEngine
ICudaEngine * deserializeCudaEngine(void const *blob, std::size_t size) noexcept
Deserialize an engine from host memory.
Definition: NvInferRuntime.h:1963

nvinfer1::IRuntime::~IRuntime
virtual ~IRuntime() noexcept=0

nvinfer1::IRuntime::setTempfileControlFlags
void setTempfileControlFlags(TempfileControlFlags flags) noexcept
Set the tempfile control flags for this runtime.
Definition: NvInferRuntime.h:2087

nvinfer1::IRuntime::getDLACore
int32_t getDLACore() const noexcept
Get the DLA core that the engine executes on.
Definition: NvInferRuntime.h:1887

nvinfer1::IRuntime::setGpuAllocator
void setGpuAllocator(IGpuAllocator *allocator) noexcept
Set the GPU allocator.
Definition: NvInferRuntime.h:1911

nvinfer1::IRuntime::getErrorRecorder
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:1945

nvinfer1::IRuntime::deserializeCudaEngine
ICudaEngine * deserializeCudaEngine(IStreamReaderV2 &streamReader)
Deserialize an engine from a stream. IStreamReaderV2 is expected to support reading to both host and ...
Definition: NvInferRuntime.h:1986

nvinfer1::IRuntime::getLogger
ILogger * getLogger() const noexcept
Get the logger with which the runtime was created.
Definition: NvInferRuntime.h:1996

nvinfer1::IRuntime::getMaxThreads
int32_t getMaxThreads() const noexcept
Get the maximum number of threads that can be used by the runtime.
Definition: NvInferRuntime.h:2025

nvinfer1::IRuntime::getTemporaryDirectory
char const * getTemporaryDirectory() const noexcept
Get the directory that will be used by this runtime for temporary files.
Definition: NvInferRuntime.h:2071

nvinfer1::IRuntime::setErrorRecorder
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:1930

nvinfer1::ISerializationConfig
Holds properties for configuring an engine to serialize the binary.
Definition: NvInferRuntime.h:2842

nvinfer1::ISerializationConfig::clearFlag
bool clearFlag(SerializationFlag serializationFlag) noexcept
Clear a serialization flag.
Definition: NvInferRuntime.h:2881

nvinfer1::ISerializationConfig::~ISerializationConfig
virtual ~ISerializationConfig() noexcept=0

nvinfer1::ISerializationConfig::setFlag
bool setFlag(SerializationFlag serializationFlag) noexcept
Set a serialization flag.
Definition: NvInferRuntime.h:2893

nvinfer1::ISerializationConfig::getFlags
SerializationFlags getFlags() const noexcept
Get the serialization flags for this config.
Definition: NvInferRuntime.h:2869

nvinfer1::ISerializationConfig::getFlag
bool getFlag(SerializationFlag serializationFlag) const noexcept
Returns true if the serialization flag is set.
Definition: NvInferRuntime.h:2905

nvinfer1::ISerializationConfig::mImpl
apiv::VSerializationConfig * mImpl
Definition: NvInferRuntime.h:2911

nvinfer1::IVersionedInterface
An Interface class for version control.
Definition: NvInferRuntimeBase.h:282

nvinfer1::InterfaceInfo
Version information associated with a TRT interface.
Definition: NvInferRuntimeBase.h:247

nvinfer1::PluginRegistrar
Register the plugin creator to the registry. The static registry object will be instantiated when the ...
Definition: NvInferRuntime.h:5094

nvinfer1::PluginRegistrar::PluginRegistrar
PluginRegistrar()
Definition: NvInferRuntime.h:5096

nvinfer1::Weights
An array of weights used as a layer parameter.
Definition: NvInferRuntime.h:121

nvinfer1::Weights::type
DataType type
The type of the weights.
Definition: NvInferRuntime.h:123

nvinfer1::Weights::count
int64_t count
The number of weights in the array.
Definition: NvInferRuntime.h:125

nvinfer1::Weights::values
void const  * values
The weight values, in a contiguous array.
Definition: NvInferRuntime.h:124

nvinfer1::v_1_0::IDebugListener
Definition: NvInferRuntime.h:3908

nvinfer1::v_1_0::IDebugListener::processDebugTensor
virtual bool processDebugTensor(void const *addr, TensorLocation location, DataType type, Dims const &shape, char const *name, cudaStream_t stream)=0
Callback function that is called when a debug tensor’s value is updated and the debug state of the te...

nvinfer1::v_1_0::IDebugListener::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:3913

nvinfer1::v_1_0::IDebugListener::~IDebugListener
~IDebugListener() override=default

nvinfer1::v_1_0::IErrorRecorder
Definition: NvInferRuntimeBase.h:419

nvinfer1::v_1_0::IGpuAllocator
Definition: NvInferRuntime.h:1652

nvinfer1::v_1_0::IGpuAllocator::allocateAsync
virtual void * allocateAsync(uint64_t const size, uint64_t const alignment, AllocatorFlags const flags, cudaStream_t) noexcept
A thread-safe callback implemented by the application to handle stream-ordered acquisition of GPU mem...
Definition: NvInferRuntime.h:1774

nvinfer1::v_1_0::IGpuAllocator::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:1815

nvinfer1::v_1_0::IGpuAllocator::deallocate
virtual TRT_DEPRECATED bool deallocate(void *const memory) noexcept=0
A thread-safe callback implemented by the application to handle release of GPU memory.

nvinfer1::v_1_0::IGpuAllocator::~IGpuAllocator
~IGpuAllocator() override=default

nvinfer1::v_1_0::IGpuAllocator::IGpuAllocator
IGpuAllocator()=default

nvinfer1::v_1_0::IGpuAllocator::reallocate
virtual void * reallocate(void *const, uint64_t, uint64_t) noexcept
A thread-safe callback implemented by the application to resize an existing allocation.
Definition: NvInferRuntime.h:1721

nvinfer1::v_1_0::IGpuAllocator::allocate
virtual TRT_DEPRECATED void * allocate(uint64_t const size, uint64_t const alignment, AllocatorFlags const flags) noexcept=0
A thread-safe callback implemented by the application to handle acquisition of GPU memory.

nvinfer1::v_1_0::IGpuAllocator::deallocateAsync
virtual bool deallocateAsync(void *const memory, cudaStream_t) noexcept
A thread-safe callback implemented by the application to handle stream-ordered release of GPU memory.
Definition: NvInferRuntime.h:1807

nvinfer1::v_1_0::IGpuAsyncAllocator
Definition: NvInferRuntime.h:5160

nvinfer1::v_1_0::IGpuAsyncAllocator::deallocateAsync
bool deallocateAsync(void *const memory, cudaStream_t) noexcept override=0
A thread-safe callback implemented by the application to handle stream-ordered asynchronous release o...

nvinfer1::v_1_0::IGpuAsyncAllocator::IGpuAsyncAllocator
IGpuAsyncAllocator()=default

nvinfer1::v_1_0::IGpuAsyncAllocator::allocateAsync
void * allocateAsync(uint64_t const size, uint64_t const alignment, AllocatorFlags const flags, cudaStream_t) noexcept override=0
A thread-safe callback implemented by the application to handle stream-ordered asynchronous acquisiti...

nvinfer1::v_1_0::IGpuAsyncAllocator::allocate
TRT_DEPRECATED void * allocate(uint64_t const size, uint64_t const alignment, AllocatorFlags const flags) noexcept override
A thread-safe callback implemented by the application to handle acquisition of GPU memory.
Definition: NvInferRuntime.h:5247

nvinfer1::v_1_0::IGpuAsyncAllocator::deallocate
TRT_DEPRECATED bool deallocate(void *const memory) noexcept override
A thread-safe callback implemented by the application to handle release of GPU memory.
Definition: NvInferRuntime.h:5271

nvinfer1::v_1_0::IGpuAsyncAllocator::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:5279

nvinfer1::v_1_0::IGpuAsyncAllocator::~IGpuAsyncAllocator
~IGpuAsyncAllocator() override=default

nvinfer1::v_1_0::ILoggerFinder
A virtual base class to find a logger. Allows a plugin to find an instance of a logger if it needs to...
Definition: NvInferRuntime.h:5126

nvinfer1::v_1_0::ILoggerFinder::findLogger
virtual ILogger * findLogger()=0
Get the logger used by the engine or execution context which called the plugin method.

nvinfer1::v_1_0::ILoggerFinder::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:5131

nvinfer1::v_1_0::ILoggerFinder::~ILoggerFinder
~ILoggerFinder() override=default
Protected: TRT owns ILoggerFinder instances and passes non-owning pointers to plugins.

nvinfer1::v_1_0::ILogger
Application-implemented logging interface for the builder, refitter and runtime.
Definition: NvInferRuntime.h:1575

nvinfer1::v_1_0::ILogger::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:1580

nvinfer1::v_1_0::ILogger::~ILogger
~ILogger() override=default

nvinfer1::v_1_0::ILogger::Severity
Severity
The severity corresponding to a log message.
Definition: NvInferRuntime.h:1591

nvinfer1::v_1_0::ILogger::log
virtual void log(Severity severity, AsciiChar const *msg) noexcept=0
A callback implemented by the application to handle logging messages.

nvinfer1::v_1_0::ILogger::ILogger
ILogger()=default

nvinfer1::v_1_0::IOutputAllocator
Definition: NvInferRuntime.h:3820

nvinfer1::v_1_0::IOutputAllocator::reallocateOutput
virtual TRT_DEPRECATED void * reallocateOutput(char const *, void *, uint64_t, uint64_t) noexcept
Return a pointer to memory for an output tensor, or nullptr if memory cannot be allocated....
Definition: NvInferRuntime.h:3849

nvinfer1::v_1_0::IOutputAllocator::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:3825

nvinfer1::v_1_0::IOutputAllocator::reallocateOutputAsync
virtual void * reallocateOutputAsync(char const *tensorName, void *currentMemory, uint64_t size, uint64_t alignment, cudaStream_t)
Return a pointer to memory for an output tensor, or nullptr if memory cannot be allocated....
Definition: NvInferRuntime.h:3877

nvinfer1::v_1_0::IOutputAllocator::notifyShape
virtual void notifyShape(char const *tensorName, Dims const &dims) noexcept=0
Called by TensorRT when the shape of the output tensor is known.

nvinfer1::v_1_0::IPluginCapability
Definition: NvInferPluginBase.h:141

nvinfer1::v_1_0::IPluginCreatorInterface
Definition: NvInferPluginBase.h:193

nvinfer1::v_1_0::IPluginCreatorV3One
Definition: NvInferRuntime.h:5286

nvinfer1::v_1_0::IPluginCreatorV3One::getFieldNames
virtual PluginFieldCollection const * getFieldNames() noexcept=0
Return a list of fields that need to be passed to createPlugin() when creating a plugin for use in th...

nvinfer1::v_1_0::IPluginCreatorV3One::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:5291

nvinfer1::v_1_0::IPluginCreatorV3One::createPlugin
virtual IPluginV3 * createPlugin(AsciiChar const *name, PluginFieldCollection const *fc, TensorRTPhase phase) noexcept=0
Return a plugin object. Return nullptr in case of error.

nvinfer1::v_1_0::IPluginV3
Definition: NvInferPluginBase.h:206

nvinfer1::v_1_0::IPluginV3OneBuild
Definition: NvInferRuntime.h:863

nvinfer1::v_1_0::IPluginV3OneBuild::getFormatCombinationLimit
virtual int32_t getFormatCombinationLimit() noexcept
Return the maximum number of format combinations that will be timed by TensorRT during the build phas...
Definition: NvInferRuntime.h:1067

nvinfer1::v_1_0::IPluginV3OneBuild::getNbOutputs
virtual int32_t getNbOutputs() const noexcept=0
Get the number of outputs from the plugin.

nvinfer1::v_1_0::IPluginV3OneBuild::configurePlugin
virtual int32_t configurePlugin(DynamicPluginTensorDesc const *in, int32_t nbInputs, DynamicPluginTensorDesc const *out, int32_t nbOutputs) noexcept=0
Configure the plugin.

nvinfer1::v_1_0::IPluginV3OneBuild::getNbTactics
virtual int32_t getNbTactics() noexcept
Query for the number of custom tactics the plugin intends to use.
Definition: NvInferRuntime.h:1043

nvinfer1::v_1_0::IPluginV3OneBuild::getMetadataString
virtual char const * getMetadataString() noexcept
Query for a string representing the configuration of the plugin. May be called anytime after plugin c...
Definition: NvInferRuntime.h:1078

nvinfer1::v_1_0::IPluginV3OneBuild::getTimingCacheID
virtual char const * getTimingCacheID() noexcept
Called to query the suffix to use for the timing cache ID. May be called anytime after plugin creatio...
Definition: NvInferRuntime.h:1059

nvinfer1::v_1_0::IPluginV3OneBuild::supportsFormatCombination
virtual bool supportsFormatCombination(int32_t pos, DynamicPluginTensorDesc const *inOut, int32_t nbInputs, int32_t nbOutputs) noexcept=0
Return true if plugin supports the format and datatype for the input/output indexed by pos.

nvinfer1::v_1_0::IPluginV3OneBuild::getValidTactics
virtual int32_t getValidTactics(int32_t *, int32_t) noexcept
Query for any custom tactics that the plugin intends to use.
Definition: NvInferRuntime.h:1035

nvinfer1::v_1_0::IPluginV3OneBuild::getOutputDataTypes
virtual int32_t getOutputDataTypes(DataType *outputTypes, int32_t nbOutputs, const DataType *inputTypes, int32_t nbInputs) const noexcept=0
Provide the data types of the plugin outputs if the input tensors have the data types provided.

nvinfer1::v_1_0::IPluginV3OneBuild::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:875

nvinfer1::v_1_0::IPluginV3OneBuild::getOutputShapes
virtual int32_t getOutputShapes(DimsExprs const *inputs, int32_t nbInputs, DimsExprs const *shapeInputs, int32_t nbShapeInputs, DimsExprs *outputs, int32_t nbOutputs, IExprBuilder &exprBuilder) noexcept=0
Provide expressions for computing dimensions of the output tensors from dimensions of the input tenso...

nvinfer1::v_1_0::IPluginV3OneCore
Definition: NvInferRuntime.h:820

nvinfer1::v_1_0::IPluginV3OneCore::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:825

nvinfer1::v_1_0::IPluginV3OneCore::getPluginName
virtual AsciiChar const * getPluginName() const noexcept=0
Return the plugin name. Should match the plugin name returned by the corresponding plugin creator.

nvinfer1::v_1_0::IPluginV3OneRuntime
Definition: NvInferRuntime.h:1085

nvinfer1::v_1_0::IPluginV3OneRuntime::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:1090

nvinfer1::v_1_0::IPluginV3OneRuntime::onShapeChange
virtual int32_t onShapeChange(PluginTensorDesc const *in, int32_t nbInputs, PluginTensorDesc const *out, int32_t nbOutputs) noexcept=0
Called when a plugin is being prepared for execution for specific dimensions. This could happen multi...

nvinfer1::v_1_0::IPluginV3OneRuntime::getFieldsToSerialize
virtual PluginFieldCollection const * getFieldsToSerialize() noexcept=0
Get the plugin fields which should be serialized.

nvinfer1::v_1_0::IPluginV3OneRuntime::setTactic
virtual int32_t setTactic(int32_t) noexcept
Set the tactic to be used in the subsequent call to enqueue(). If no custom tactics were advertised,...
Definition: NvInferRuntime.h:1102

nvinfer1::v_1_0::IPluginV3OneRuntime::enqueue
virtual int32_t enqueue(PluginTensorDesc const *inputDesc, PluginTensorDesc const *outputDesc, void const *const *inputs, void *const *outputs, void *workspace, cudaStream_t stream) noexcept=0
Execute the layer.

nvinfer1::v_1_0::IPluginV3OneRuntime::attachToContext
virtual IPluginV3 * attachToContext(IPluginResourceContext *context) noexcept=0
Clone the plugin, attach the cloned plugin object to an execution context and grant the cloned plugin ...

nvinfer1::v_1_0::IProfiler
Definition: NvInferRuntime.h:1275

nvinfer1::v_1_0::IProfiler::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:1280

nvinfer1::v_1_0::IProfiler::~IProfiler
~IProfiler() override=default

nvinfer1::v_1_0::IProfiler::reportLayerTime
virtual void reportLayerTime(char const *layerName, float ms) noexcept=0
Layer time reporting callback.

nvinfer1::v_1_0::IStreamReader
Definition: NvInferRuntime.h:608

nvinfer1::v_1_0::IStreamReader::~IStreamReader
~IStreamReader() override=default

nvinfer1::v_1_0::IStreamReader::operator=
IStreamReader & operator=(IStreamReader const &) &=default

nvinfer1::v_1_0::IStreamReader::operator=
IStreamReader & operator=(IStreamReader &&) &=default

nvinfer1::v_1_0::IStreamReader::read
virtual int64_t read(void *destination, int64_t nbBytes)=0
Read the next number of bytes in the stream.

nvinfer1::v_1_0::IStreamReader::IStreamReader
IStreamReader(IStreamReader &&)=default

nvinfer1::v_1_0::IStreamReader::IStreamReader
IStreamReader(IStreamReader const &)=default

nvinfer1::v_1_0::IStreamReader::IStreamReader
IStreamReader()=default

nvinfer1::v_1_0::IStreamReader::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:620

nvinfer1::v_1_0::IStreamReaderV2
Definition: NvInferRuntime.h:720

nvinfer1::v_1_0::IStreamReaderV2::operator=
IStreamReaderV2 & operator=(IStreamReaderV2 const &) &=default

nvinfer1::v_1_0::IStreamReaderV2::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:732

nvinfer1::v_1_0::IStreamReaderV2::IStreamReaderV2
IStreamReaderV2(IStreamReaderV2 &&)=default

nvinfer1::v_1_0::IStreamReaderV2::~IStreamReaderV2
~IStreamReaderV2() override=default

nvinfer1::v_1_0::IStreamReaderV2::read
virtual int64_t read(void *destination, int64_t nbBytes, cudaStream_t stream) noexcept=0
Read the next number of bytes in the stream asynchronously.

nvinfer1::v_1_0::IStreamReaderV2::IStreamReaderV2
IStreamReaderV2()=default

nvinfer1::v_1_0::IStreamReaderV2::IStreamReaderV2
IStreamReaderV2(IStreamReaderV2 const &)=default

nvinfer1::v_1_0::IStreamReaderV2::seek
virtual bool seek(int64_t offset, SeekPosition where) noexcept=0
Sets the position of the stream to the given offset.

nvinfer1::v_1_0::IStreamReaderV2::operator=
IStreamReaderV2 & operator=(IStreamReaderV2 &&) &=default

nvinfer1::v_1_0::IStreamWriter
Definition: NvInferRuntime.h:643

nvinfer1::v_1_0::IStreamWriter::operator=
IStreamWriter & operator=(IStreamWriter const &) &=default

nvinfer1::v_1_0::IStreamWriter::IStreamWriter
IStreamWriter(IStreamWriter &&)=default

nvinfer1::v_1_0::IStreamWriter::write
virtual int64_t write(void const *data, int64_t nbBytes)=0
Write nbBytes of data into the stream.

nvinfer1::v_1_0::IStreamWriter::IStreamWriter
IStreamWriter(IStreamWriter const &)=default

nvinfer1::v_1_0::IStreamWriter::IStreamWriter
IStreamWriter()=default

nvinfer1::v_1_0::IStreamWriter::operator=
IStreamWriter & operator=(IStreamWriter &&) &=default

nvinfer1::v_1_0::IStreamWriter::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:655

nvinfer1::v_1_0::IStreamWriter::~IStreamWriter
~IStreamWriter() override=default

nvinfer1::v_2_0::IPluginV3OneBuild
Definition: NvInferRuntime.h:1182

nvinfer1::v_2_0::IPluginV3OneBuild::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:1184

nvinfer1::v_2_0::IPluginV3OneBuild::getAliasedInput
virtual int32_t getAliasedInput(int32_t) noexcept
Communicates to TensorRT that the output at the specified output index is aliased to the input at the...
Definition: NvInferRuntime.h:1218

nvinfer1::anonymous_namespace{NvInferRuntime.h}::createInferRefitter
IRefitter * createInferRefitter(ICudaEngine &engine, ILogger &logger) noexcept
Create an instance of an IRefitter class.
Definition: NvInferRuntime.h:5074

nvinfer1::anonymous_namespace{NvInferRuntime.h}::createInferRuntime
IRuntime * createInferRuntime(ILogger &logger) noexcept
Create an instance of an IRuntime class.
Definition: NvInferRuntime.h:5063

nvinfer1
The TensorRT API version 1 namespace.
Definition: NvInferSafePlugin.h:33

nvinfer1::TacticSources
uint32_t TacticSources
Represents a collection of one or more TacticSource values combined using bitwise-OR operations.
Definition: NvInferRuntime.h:2780

nvinfer1::IOutputAllocator
v_1_0::IOutputAllocator IOutputAllocator
Definition: NvInferRuntime.h:3903

nvinfer1::EngineCapability
EngineCapability
List of supported engine capability flows.
Definition: NvInferRuntime.h:76

nvinfer1::EngineCapability::kSAFETY
@ kSAFETY

nvinfer1::EngineCapability::kSTANDARD
@ kSTANDARD

nvinfer1::EngineCapability::kDLA_STANDALONE
@ kDLA_STANDALONE

nvinfer1::DimensionOperation
DimensionOperation
An operation on two IDimensionExpr, which represent integer expressions used in dimension computation...
Definition: NvInferRuntime.h:178

nvinfer1::DimensionOperation::kCEIL_DIV
@ kCEIL_DIV
Division rounding up.

nvinfer1::IPluginV3OneCore
v_1_0::IPluginV3OneCore IPluginV3OneCore
Definition: NvInferRuntime.h:1235

nvinfer1::TensorIOMode
TensorIOMode
Definition of tensor IO Mode.
Definition: NvInferRuntimeBase.h:662

nvinfer1::HardwareCompatibilityLevel
HardwareCompatibilityLevel
Describes requirements of compatibility with GPU architectures other than that of the GPU on which th...
Definition: NvInfer.h:10397

nvinfer1::SerializationFlag
SerializationFlag
List of valid flags that the engine can enable when serializing the bytes.
Definition: NvInferRuntime.h:2821

nvinfer1::SerializationFlag::kEXCLUDE_WEIGHTS
@ kEXCLUDE_WEIGHTS
Exclude the weights that can be refitted.

nvinfer1::SerializationFlag::kINCLUDE_REFIT
@ kINCLUDE_REFIT
Remain refittable if originally so.

nvinfer1::IStreamWriter
v_1_0::IStreamWriter IStreamWriter
Definition: NvInferRuntime.h:699

nvinfer1::IProfiler
v_1_0::IProfiler IProfiler
Definition: NvInferRuntime.h:1309

nvinfer1::SeekPosition
SeekPosition
Controls the seek mode of IStreamReaderV2.
Definition: NvInferRuntime.h:706

nvinfer1::SeekPosition::kSET
@ kSET
From the beginning of the file.

nvinfer1::SeekPosition::kCUR
@ kCUR
From the current position of the file.

nvinfer1::SeekPosition::kEND
@ kEND
From the tail of the file.

nvinfer1::IStreamReaderV2
v_1_0::IStreamReaderV2 IStreamReaderV2
Definition: NvInferRuntime.h:776

nvinfer1::TempfileControlFlags
uint32_t TempfileControlFlags
Represents a collection of one or more TempfileControlFlag values combined using bitwise-OR operation...
Definition: NvInferRuntime.h:1387

nvinfer1::EngineStat
EngineStat
The kind of engine statistics that can be queried from the ICudaEngine.
Definition: NvInferRuntime.h:2990

nvinfer1::EngineStat::kTOTAL_WEIGHTS_SIZE
@ kTOTAL_WEIGHTS_SIZE
Return the total weight size in bytes.

nvinfer1::EngineStat::kSTRIPPED_WEIGHTS_SIZE
@ kSTRIPPED_WEIGHTS_SIZE
Return the stripped weight size in bytes for engines built with BuilderFlag::kSTRIP_PLAN.

nvinfer1::IGpuAllocator
v_1_0::IGpuAllocator IGpuAllocator
Definition: NvInferRuntime.h:1851

nvinfer1::ILogger
v_1_0::ILogger ILogger
Definition: NvInferRuntimeBase.h:125

nvinfer1::AsciiChar
char_t AsciiChar
Definition: NvInferRuntimeBase.h:116

nvinfer1::TensorRTPhase
TensorRTPhase
Indicates a phase of operation of TensorRT.
Definition: NvInferPluginBase.h:116

nvinfer1::PluginVersion::kV2_DYNAMICEXT
@ kV2_DYNAMICEXT
IPluginV2DynamicExt.

nvinfer1::DataType
DataType
The type of weights and tensors. The datatypes other than kBOOL, kINT32, and kINT64 are "activation d...
Definition: NvInferRuntimeBase.h:149

nvinfer1::DeviceType
DeviceType
The device that this layer/network will execute on.
Definition: NvInferRuntime.h:1341

nvinfer1::DeviceType::kDLA
@ kDLA
DLA Core.

nvinfer1::LayerType::kSCALE
@ kSCALE
Scale layer.

nvinfer1::LayerType::kCONSTANT
@ kCONSTANT
Constant layer.

nvinfer1::IDebugListener
v_1_0::IDebugListener IDebugListener
Definition: NvInferRuntime.h:3944

nvinfer1::TempfileControlFlag
TempfileControlFlag
Flags used to control TensorRT's behavior when creating executable temporary files.
Definition: NvInferRuntime.h:1364

nvinfer1::TempfileControlFlag::kALLOW_TEMPORARY_FILES
@ kALLOW_TEMPORARY_FILES

nvinfer1::TempfileControlFlag::kALLOW_IN_MEMORY_FILES
@ kALLOW_IN_MEMORY_FILES
Allow creating and loading files in-memory (or unnamed files).

nvinfer1::WeightsRole
WeightsRole
How a layer uses particular Weights.
Definition: NvInferRuntime.h:1319

nvinfer1::WeightsRole::kSHIFT
@ kSHIFT
shift part of IScaleLayer

nvinfer1::WeightsRole::kANY
@ kANY
Any other weights role.

nvinfer1::WeightsRole::kBIAS
@ kBIAS
bias for IConvolutionLayer or IDeconvolutionLayer

nvinfer1::WeightsRole::kKERNEL
@ kKERNEL
kernel for IConvolutionLayer or IDeconvolutionLayer

nvinfer1::ProfilingVerbosity
ProfilingVerbosity
List of verbosity levels of layer information exposed in NVTX annotations and in IEngineInspector.
Definition: NvInferRuntime.h:2792

nvinfer1::ProfilingVerbosity::kLAYER_NAMES_ONLY
@ kLAYER_NAMES_ONLY
Print only the layer names. This is the default setting.

nvinfer1::ProfilingVerbosity::kDETAILED
@ kDETAILED
Print detailed layer information including layer names and layer parameters.

nvinfer1::TacticSource
TacticSource
List of tactic sources for TensorRT.
Definition: NvInferRuntime.h:2756

nvinfer1::TacticSource::kEDGE_MASK_CONVOLUTIONS
@ kEDGE_MASK_CONVOLUTIONS

nvinfer1::TacticSource::kJIT_CONVOLUTIONS
@ kJIT_CONVOLUTIONS

nvinfer1::PluginFormat
TensorFormat PluginFormat
PluginFormat is reserved for backward compatibility.
Definition: NvInferRuntimePlugin.h:54

nvinfer1::IPluginV3OneRuntime
v_1_0::IPluginV3OneRuntime IPluginV3OneRuntime
Definition: NvInferRuntime.h:1259

nvinfer1::ElementWiseOperation::kSUB
@ kSUB
Subtract the second element from the first.

nvinfer1::ElementWiseOperation::kSUM
@ kSUM
Sum of the two elements.

nvinfer1::ElementWiseOperation::kPROD
@ kPROD
Product of the two elements.

nvinfer1::ElementWiseOperation::kFLOOR_DIV
@ kFLOOR_DIV
Floor division of the first element by the second.

nvinfer1::ElementWiseOperation::kEQUAL
@ kEQUAL
Check if two elements are equal.

nvinfer1::ElementWiseOperation::kMIN
@ kMIN
Minimum of the two elements.

nvinfer1::ElementWiseOperation::kLESS
@ kLESS
Check if element in first tensor is less than corresponding element in second tensor.

nvinfer1::SerializationFlags
uint32_t SerializationFlags
Represents one or more SerializationFlag values using binary OR operations, e.g., 1U << Serialization...
Definition: NvInferRuntime.h:2811

nvinfer1::InterpolationMode::kLINEAR
@ kLINEAR
Supports linear (1D), bilinear (2D), and trilinear (3D) interpolation.

nvinfer1::IPluginV3OneBuild
v_1_0::IPluginV3OneBuild IPluginV3OneBuild
Definition: NvInferRuntime.h:1247

nvinfer1::BuilderFlag::kEXCLUDE_LEAN_RUNTIME
@ kEXCLUDE_LEAN_RUNTIME

nvinfer1::TensorFormat
TensorFormat
Format of the input/output tensors.
Definition: NvInferRuntime.h:1421

nvinfer1::TensorFormat::kCHW4
@ kCHW4

nvinfer1::TensorFormat::kDHWC
@ kDHWC

nvinfer1::TensorFormat::kHWC16
@ kHWC16

nvinfer1::TensorFormat::kDHWC8
@ kDHWC8

nvinfer1::TensorFormat::kDLA_LINEAR
@ kDLA_LINEAR

nvinfer1::TensorFormat::kCDHW32
@ kCDHW32

nvinfer1::TensorFormat::kDLA_HWC4
@ kDLA_HWC4

nvinfer1::TensorFormat::kCHW16
@ kCHW16

nvinfer1::TensorFormat::kHWC
@ kHWC

nvinfer1::TensorFormat::kCHW2
@ kCHW2

nvinfer1::TensorFormat::kHWC8
@ kHWC8

nvinfer1::TensorFormat::kCHW32
@ kCHW32

nvinfer1::ExecutionContextAllocationStrategy
ExecutionContextAllocationStrategy
Different memory allocation behaviors for IExecutionContext.
Definition: NvInferRuntime.h:2928

nvinfer1::ExecutionContextAllocationStrategy::kSTATIC
@ kSTATIC
Default static allocation with the maximum size across all profiles.

nvinfer1::ExecutionContextAllocationStrategy::kUSER_MANAGED
@ kUSER_MANAGED
The user supplies custom allocation to the execution context.

nvinfer1::ExecutionContextAllocationStrategy::kON_PROFILE_CHANGE
@ kON_PROFILE_CHANGE
Reallocate for a profile when it's selected.

nvinfer1::ILoggerFinder
v_1_0::ILoggerFinder ILoggerFinder
Definition: NvInferRuntime.h:5152

nvinfer1::LayerInformationFormat
LayerInformationFormat
The format in which the IEngineInspector prints the layer information.
Definition: NvInferRuntime.h:4878

nvinfer1::LayerInformationFormat::kJSON
@ kJSON
Print layer information in JSON format.

nvinfer1::LayerInformationFormat::kONELINE
@ kONELINE
Print layer information in one line per layer.

nvinfer1::IStreamReader
v_1_0::IStreamReader IStreamReader
Definition: NvInferRuntime.h:689

nvinfer1::AllocatorFlag
AllocatorFlag
Allowed type of memory allocation.
Definition: NvInferRuntime.h:1542

nvinfer1::AllocatorFlag::kRESIZABLE
@ kRESIZABLE
TensorRT may call realloc() on this allocation.

nvinfer1::PoolingType::kMAX
@ kMAX
Maximum over elements.

nvinfer1::TensorLocation
TensorLocation
The location for tensor data storage, device or host.
Definition: NvInferRuntime.h:203

nvinfer1::TensorLocation::kHOST
@ kHOST
Data stored on host.

nvinfer1::TensorLocation::kDEVICE
@ kDEVICE
Data stored on device.

nvinfer1::OptProfileSelector
OptProfileSelector
When setting or querying optimization profile parameters (such as shape tensor inputs or dynamic dime...
Definition: NvInferRuntime.h:2539

nvinfer1::OptProfileSelector::kOPT
@ kOPT
This is used to set or get the value that is used in the optimization (kernel selection).

nvinfer1::AllocatorFlags
uint32_t AllocatorFlags
Definition: NvInferRuntime.h:1555

nvinfer2::safe::Severity
Severity
Enumerates severity levels for messages issued by the message recorder.
Definition: NvInferSafeRecorder.h:55

nvinfer1::DynamicPluginTensorDesc
Summarizes tensors that a plugin might see for an input or output.
Definition: NvInferRuntime.h:362

nvinfer1::DynamicPluginTensorDesc::min
Dims min
Lower bounds on tensor’s dimensions.
Definition: NvInferRuntime.h:367

nvinfer1::DynamicPluginTensorDesc::max
Dims max
Upper bounds on tensor’s dimensions.
Definition: NvInferRuntime.h:370

nvinfer1::DynamicPluginTensorDesc::opt
Dims opt
Optimum value of tensor’s dimensions specified for auto-tuning.
Definition: NvInferRuntime.h:373

nvinfer1::DynamicPluginTensorDesc::desc
PluginTensorDesc desc
Information required to interpret a pointer to tensor data, except that desc.dims has -1 in place of ...
Definition: NvInferRuntime.h:364

nvinfer1::PluginFieldCollection
Plugin field collection struct.
Definition: NvInferPluginBase.h:103

nvinfer1::PluginTensorDesc
Fields that a plugin might see for an input or output.
Definition: NvInferRuntimePlugin.h:73

nvinfer1::impl::EnumMaxImpl
Declaration of EnumMaxImpl struct to store the exclusive upper bound of an enumeration type.
Definition: NvInferRuntimeBase.h:131