_static/cpp-api/_nv_infer_runtime_8h_source.html

/*

 * SPDX-FileCopyrightText: Copyright (c) 1993-2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.

 * SPDX-License-Identifier: Apache-2.0

 *

 * Licensed under the Apache License, Version 2.0 (the "License");

 * you may not use this file except in compliance with the License.

 * You may obtain a copy of the License at

 *

 * http://www.apache.org/licenses/LICENSE-2.0

 *

 * Unless required by applicable law or agreed to in writing, software

 * distributed under the License is distributed on an "AS IS" BASIS,

 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

 * See the License for the specific language governing permissions and

 * limitations under the License.

 */


#ifndef NV_INFER_RUNTIME_H

#define NV_INFER_RUNTIME_H


#include "NvInferImpl.h" // IWYU pragma: export

#define NV_INFER_INTERNAL_INCLUDE 1

#include "NvInferPluginBase.h" // IWYU pragma: export

#undef NV_INFER_INTERNAL_INCLUDE

#include "NvInferRuntimeCommon.h" // IWYU pragma: export


namespace nvinfer1

{


class IExecutionContext;

class ICudaEngine;

class IPluginFactory;

class IEngineInspector;


class INoCopy

{

protected:

    INoCopy() = default;

    virtual ~INoCopy() = default;

    INoCopy(INoCopy const& other) = delete;

    INoCopy& operator=(INoCopy const& other) = delete;

    INoCopy(INoCopy&& other) = delete;

    INoCopy& operator=(INoCopy&& other) = delete;

};


enum class EngineCapability : int32_t

{

    kSTANDARD = 0,


    kSAFETY = 1,


    kDLA_STANDALONE = 2,

};


namespace impl

{

template <>

struct EnumMaxImpl<EngineCapability>

{

    static constexpr int32_t kVALUE = 3;

};

} // namespace impl


class Weights

{

public:

    DataType type;

    void const* values;

    int64_t count;

};


class IHostMemory : public INoCopy

{

public:

    virtual ~IHostMemory() noexcept = default;


    void* data() const noexcept

    {

        return mImpl->data();

    }


    std::size_t size() const noexcept

    {

        return mImpl->size();

    }


    DataType type() const noexcept

    {

        return mImpl->type();

    }


protected:

    apiv::VHostMemory* mImpl;

};


enum class DimensionOperation : int32_t

{

    kSUM = 0,

    kPROD = 1,

    kMAX = 2,

    kMIN = 3,

    kSUB = 4,

    kEQUAL = 5,

    kLESS = 6,

    kFLOOR_DIV = 7,

    kCEIL_DIV = 8

};


template <>

constexpr inline int32_t EnumMax<DimensionOperation>() noexcept

{

    return 9;

}


enum class TensorLocation : int32_t

{

    kDEVICE = 0,

    kHOST = 1,

};


namespace impl

{

template <>

struct EnumMaxImpl<TensorLocation>

{

    static constexpr int32_t kVALUE = 2;

};

} // namespace impl


class IDimensionExpr : public INoCopy

{

public:

    bool isConstant() const noexcept

    {

        return mImpl->isConstant();

    }


    int64_t getConstantValue() const noexcept

    {

        return mImpl->getConstantValue();

    }


protected:

    apiv::VDimensionExpr* mImpl;

    virtual ~IDimensionExpr() noexcept = default;


public:

    bool isSizeTensor() const noexcept

    {

        return mImpl->isSizeTensor();

    }

};


class IExprBuilder : public INoCopy

{

public:

    IDimensionExpr const* constant(int64_t value) noexcept

    {

        return mImpl->constant(value);

    }


    IDimensionExpr const* operation(

        DimensionOperation op, IDimensionExpr const& first, IDimensionExpr const& second) noexcept

    {

        return mImpl->operation(op, first, second);

    }


protected:

    apiv::VExprBuilder* mImpl;

    virtual ~IExprBuilder() noexcept = default;


public:

    IDimensionExpr const* declareSizeTensor(int32_t outputIndex, IDimensionExpr const& opt, IDimensionExpr const& upper)

    {

        return mImpl->declareSizeTensor(outputIndex, opt, upper);

    }

};


class DimsExprs

{

public:

    int32_t nbDims;

    IDimensionExpr const* d[Dims::MAX_DIMS];

};


struct DynamicPluginTensorDesc

{

    PluginTensorDesc desc;


    Dims min;


    Dims max;


    Dims opt;

};


class TRT_DEPRECATED IPluginV2DynamicExt : public nvinfer1::IPluginV2Ext

{

public:

    IPluginV2DynamicExt* clone() const noexcept override = 0;


    virtual DimsExprs getOutputDimensions(

        int32_t outputIndex, DimsExprs const* inputs, int32_t nbInputs, IExprBuilder& exprBuilder) noexcept = 0;


    static constexpr int32_t kFORMAT_COMBINATION_LIMIT = 100;


    virtual bool supportsFormatCombination(

        int32_t pos, PluginTensorDesc const* inOut, int32_t nbInputs, int32_t nbOutputs) noexcept = 0;


    virtual void configurePlugin(DynamicPluginTensorDesc const* in, int32_t nbInputs,

        DynamicPluginTensorDesc const* out, int32_t nbOutputs) noexcept = 0;


    virtual size_t getWorkspaceSize(PluginTensorDesc const* inputs, int32_t nbInputs, PluginTensorDesc const* outputs,

        int32_t nbOutputs) const noexcept = 0;


    virtual int32_t enqueue(PluginTensorDesc const* inputDesc, PluginTensorDesc const* outputDesc,

        void const* const* inputs, void* const* outputs, void* workspace, cudaStream_t stream) noexcept = 0;


protected:

    int32_t getTensorRTVersion() const noexcept override

    {

        return (static_cast<int32_t>(PluginVersion::kV2_DYNAMICEXT) << 24 | (NV_TENSORRT_VERSION & 0xFFFFFF));

    }


    virtual ~IPluginV2DynamicExt() noexcept {}


private:

    // Following are obsolete base class methods, and must not be implemented or used.


    void configurePlugin(Dims const*, int32_t, Dims const*, int32_t, DataType const*, DataType const*, bool const*,

        bool const*, PluginFormat, int32_t) noexcept override final

    {

    }


    bool supportsFormat(DataType, PluginFormat) const noexcept override final

    {

        return false;

    }


    Dims getOutputDimensions(int32_t, Dims const*, int32_t) noexcept override final

    {

        return Dims{-1, {}};

    }


    TRT_DEPRECATED bool isOutputBroadcastAcrossBatch(int32_t, bool const*, int32_t) const noexcept override final

    {

        return false;

    }


    TRT_DEPRECATED bool canBroadcastInputAcrossBatch(int32_t) const noexcept override final

    {

        return true;

    }


    size_t getWorkspaceSize(int32_t) const noexcept override final

    {

        return 0;

    }


    int32_t enqueue(int32_t, void const* const*, void* const*, void*, cudaStream_t) noexcept override final

    {

        return 1;

    }

};


namespace v_1_0

{

class IStreamReader : public IVersionedInterface

{

public:

    ~IStreamReader() override = default;

    IStreamReader() = default;


    InterfaceInfo getInterfaceInfo() const noexcept override

    {

        return InterfaceInfo{"IStreamReader", 1, 0};

    }


    virtual int64_t read(void* destination, int64_t nbBytes) = 0;


protected:

    IStreamReader(IStreamReader const&) = default;

    IStreamReader(IStreamReader&&) = default;

    IStreamReader& operator=(IStreamReader const&) & = default;

    IStreamReader& operator=(IStreamReader&&) & = default;

};


class IStreamWriter : public IVersionedInterface

{

public:

    ~IStreamWriter() override = default;

    IStreamWriter() = default;


    InterfaceInfo getInterfaceInfo() const noexcept final

    {

        return InterfaceInfo{"IStreamWriter", 1, 0};

    }


    virtual int64_t write(void const* data, int64_t nbBytes) = 0;


protected:

    IStreamWriter(IStreamWriter const&) = default;

    IStreamWriter(IStreamWriter&&) = default;

    IStreamWriter& operator=(IStreamWriter const&) & = default;

    IStreamWriter& operator=(IStreamWriter&&) & = default;

};

} // namespace v_1_0


using IStreamReader = v_1_0::IStreamReader;


using IStreamWriter = v_1_0::IStreamWriter;


enum class SeekPosition : int32_t

{

    kSET = 0,


    kCUR = 1,


    kEND = 2,

};


namespace v_1_0

{

class IStreamReaderV2 : public IVersionedInterface

{

public:

    ~IStreamReaderV2() override = default;

    IStreamReaderV2() = default;


    InterfaceInfo getInterfaceInfo() const noexcept override

    {

        return InterfaceInfo{"IStreamReaderV2", 1, 0};

    }


    virtual int64_t read(void* destination, int64_t nbBytes, cudaStream_t stream) noexcept = 0;


    virtual bool seek(int64_t offset, SeekPosition where) noexcept = 0;


protected:

    IStreamReaderV2(IStreamReaderV2 const&) = default;

    IStreamReaderV2(IStreamReaderV2&&) = default;

    IStreamReaderV2& operator=(IStreamReaderV2 const&) & = default;

    IStreamReaderV2& operator=(IStreamReaderV2&&) & = default;

};

} // namespace v_1_0


using IStreamReaderV2 = v_1_0::IStreamReaderV2;


class IPluginResourceContext

{

public:

    virtual IGpuAllocator* getGpuAllocator() const noexcept = 0;


    virtual IErrorRecorder* getErrorRecorder() const noexcept = 0;

    virtual ~IPluginResourceContext() noexcept = default;


protected:

    IPluginResourceContext() = default;

    IPluginResourceContext(IPluginResourceContext const&) = default;

    IPluginResourceContext(IPluginResourceContext&&) = default;

    IPluginResourceContext& operator=(IPluginResourceContext const&) & = default;

    IPluginResourceContext& operator=(IPluginResourceContext&&) & = default;

};


namespace v_1_0

{

class IPluginV3OneCore : public IPluginCapability

{

public:

    InterfaceInfo getInterfaceInfo() const noexcept override

    {

        return InterfaceInfo{"PLUGIN_V3ONE_CORE", 1, 0};

    }


    virtual AsciiChar const* getPluginName() const noexcept = 0;


    virtual AsciiChar const* getPluginVersion() const noexcept = 0;


    virtual AsciiChar const* getPluginNamespace() const noexcept = 0;

};


class IPluginV3OneBuild : public IPluginCapability

{

public:

    static constexpr int32_t kDEFAULT_FORMAT_COMBINATION_LIMIT = 100;


    InterfaceInfo getInterfaceInfo() const noexcept override

    {

        return InterfaceInfo{"PLUGIN_V3ONE_BUILD", 1, 0};

    }


    virtual int32_t configurePlugin(DynamicPluginTensorDesc const* in, int32_t nbInputs,

        DynamicPluginTensorDesc const* out, int32_t nbOutputs) noexcept = 0;


    virtual int32_t getOutputDataTypes(

        DataType* outputTypes, int32_t nbOutputs, const DataType* inputTypes, int32_t nbInputs) const noexcept = 0;


    virtual int32_t getOutputShapes(DimsExprs const* inputs, int32_t nbInputs, DimsExprs const* shapeInputs,

        int32_t nbShapeInputs, DimsExprs* outputs, int32_t nbOutputs, IExprBuilder& exprBuilder) noexcept = 0;


    virtual bool supportsFormatCombination(

        int32_t pos, DynamicPluginTensorDesc const* inOut, int32_t nbInputs, int32_t nbOutputs) noexcept = 0;


    virtual int32_t getNbOutputs() const noexcept = 0;


    virtual size_t getWorkspaceSize(DynamicPluginTensorDesc const* inputs, int32_t nbInputs,

        DynamicPluginTensorDesc const* outputs, int32_t nbOutputs) const noexcept

    {

        return 0;

    }


    virtual int32_t getValidTactics(int32_t* tactics, int32_t nbTactics) noexcept

    {

        return 0;

    }


    virtual int32_t getNbTactics() noexcept

    {

        return 0;

    }


    virtual char const* getTimingCacheID() noexcept

    {

        return nullptr;

    }


    virtual int32_t getFormatCombinationLimit() noexcept

    {

        return kDEFAULT_FORMAT_COMBINATION_LIMIT;

    }


    virtual char const* getMetadataString() noexcept

    {

        return nullptr;

    }

};


class IPluginV3OneRuntime : public IPluginCapability

{

public:

    InterfaceInfo getInterfaceInfo() const noexcept override

    {

        return InterfaceInfo{"PLUGIN_V3ONE_RUNTIME", 1, 0};

    }


    virtual int32_t setTactic(int32_t tactic) noexcept

    {

        return 0;

    }


    virtual int32_t onShapeChange(

        PluginTensorDesc const* in, int32_t nbInputs, PluginTensorDesc const* out, int32_t nbOutputs) noexcept = 0;


    virtual int32_t enqueue(PluginTensorDesc const* inputDesc, PluginTensorDesc const* outputDesc,

        void const* const* inputs, void* const* outputs, void* workspace, cudaStream_t stream) noexcept = 0;


    virtual IPluginV3* attachToContext(IPluginResourceContext* context) noexcept = 0;


    virtual PluginFieldCollection const* getFieldsToSerialize() noexcept = 0;

};

} // namespace v_1_0


namespace v_2_0

{


class IPluginV3OneBuild : public v_1_0::IPluginV3OneBuild

{

public:

    InterfaceInfo getInterfaceInfo() const noexcept override

    {

        return InterfaceInfo{"PLUGIN_V3ONE_BUILD", 2, 0};

    }


    virtual int32_t getAliasedInput(int32_t outputIndex) noexcept

    {

        return -1;

    }

};


} // namespace v_2_0


using IPluginV3OneCore = v_1_0::IPluginV3OneCore;


using IPluginV3OneBuild = v_1_0::IPluginV3OneBuild;


using IPluginV3OneRuntime = v_1_0::IPluginV3OneRuntime;


using IPluginV3OneBuildV2 = v_2_0::IPluginV3OneBuild;


namespace v_1_0

{

class IProfiler

{

public:

    virtual void reportLayerTime(char const* layerName, float ms) noexcept = 0;


    virtual ~IProfiler() noexcept {}

};

} // namespace v_1_0


using IProfiler = v_1_0::IProfiler;


enum class WeightsRole : int32_t

{

    kKERNEL = 0,

    kBIAS = 1,

    kSHIFT = 2,

    kSCALE = 3,

    kCONSTANT = 4,

    kANY = 5,

};


template <>

constexpr inline int32_t EnumMax<WeightsRole>() noexcept

{

    return 6;

}


enum class DeviceType : int32_t

{

    kGPU = 0,

    kDLA = 1,

};


template <>

constexpr inline int32_t EnumMax<DeviceType>() noexcept

{

    return 2;

}


enum class TempfileControlFlag : int32_t

{

    kALLOW_IN_MEMORY_FILES = 0,


    kALLOW_TEMPORARY_FILES = 1,

};


template <>

constexpr inline int32_t EnumMax<TempfileControlFlag>() noexcept

{

    return 2;

}


using TempfileControlFlags = uint32_t;


enum class TensorFormat : int32_t

{

    kLINEAR = 0,


    kCHW2 = 1,


    kHWC8 = 2,


    kCHW4 = 3,


    kCHW16 = 4,


    kCHW32 = 5,


    kDHWC8 = 6,


    kCDHW32 = 7,


    kHWC = 8,


    kDLA_LINEAR = 9,


    kDLA_HWC4 = 10,


    kHWC16 = 11,


    kDHWC = 12

};


namespace impl

{

template <>

struct EnumMaxImpl<TensorFormat>

{

    static constexpr int32_t kVALUE = 13;

};

} // namespace impl


enum class AllocatorFlag : int32_t

{

    kRESIZABLE = 0,

};


namespace impl

{

template <>

struct EnumMaxImpl<AllocatorFlag>

{

    static constexpr int32_t kVALUE = 1;

};

} // namespace impl


using AllocatorFlags = uint32_t;


class ILogger

{

public:

    enum class Severity : int32_t

    {

        kINTERNAL_ERROR = 0,

        kERROR = 1,

        kWARNING = 2,

        kINFO = 3,

        kVERBOSE = 4,

    };


    virtual void log(Severity severity, AsciiChar const* msg) noexcept = 0;


    ILogger() = default;

    virtual ~ILogger() = default;


protected:

    // @cond SuppressDoxyWarnings

    ILogger(ILogger const&) = default;

    ILogger(ILogger&&) = default;

    ILogger& operator=(ILogger const&) & = default;

    ILogger& operator=(ILogger&&) & = default;

    // @endcond

};


namespace impl

{

template <>

struct EnumMaxImpl<ILogger::Severity>

{

    static constexpr int32_t kVALUE = 5;

};

} // namespace impl


namespace v_1_0

{


class IGpuAllocator : public IVersionedInterface

{

public:

    TRT_DEPRECATED virtual void* allocate(

        uint64_t const size, uint64_t const alignment, AllocatorFlags const flags) noexcept = 0;


    ~IGpuAllocator() override = default;

    IGpuAllocator() = default;


    virtual void* reallocate(void* const /*baseAddr*/, uint64_t /*alignment*/, uint64_t /*newSize*/) noexcept

    {

        return nullptr;

    }


    TRT_DEPRECATED virtual bool deallocate(void* const memory) noexcept = 0;


    virtual void* allocateAsync(

        uint64_t const size, uint64_t const alignment, AllocatorFlags const flags, cudaStream_t /*stream*/) noexcept

    {

        return allocate(size, alignment, flags);

    }

    virtual bool deallocateAsync(void* const memory, cudaStream_t /*stream*/) noexcept

    {

        return deallocate(memory);

    }


    InterfaceInfo getInterfaceInfo() const noexcept override

    {

        return {"IGpuAllocator", 1, 0};

    }


protected:

    // @cond SuppressDoxyWarnings

    IGpuAllocator(IGpuAllocator const&) = default;

    IGpuAllocator(IGpuAllocator&&) = default;

    IGpuAllocator& operator=(IGpuAllocator const&) & = default;

    IGpuAllocator& operator=(IGpuAllocator&&) & = default;

    // @endcond

};


} // namespace v_1_0


using IGpuAllocator = v_1_0::IGpuAllocator;


enum class EngineValidity : int32_t

{

    kVALID = 0,


    kSUBOPTIMAL = 1,


    kINVALID = 2,

};


namespace impl

{

template <>

struct EnumMaxImpl<EngineValidity>

{

    static constexpr int32_t kVALUE = 3;

};

} // namespace impl


enum class EngineInvalidityDiagnostics : uint64_t

{

    kVERSION_MISMATCH = 1ULL << 0,


    kUNSUPPORTED_CC = 1ULL << 1,


    kOLD_CUDA_DRIVER = 1ULL << 2,


    kOLD_CUDA_RUNTIME = 1ULL << 3,


    kINSUFFICIENT_GPU_MEMORY = 1ULL << 4,


    kMALFORMED_ENGINE = 1ULL << 5,


    kCUDA_ERROR = 1ULL << 6,

};


class IRuntime : public INoCopy

{

public:

    virtual ~IRuntime() noexcept = default;


    void setDLACore(int32_t dlaCore) noexcept

    {

        mImpl->setDLACore(dlaCore);

    }


    int32_t getDLACore() const noexcept

    {

        return mImpl->getDLACore();

    }


    int32_t getNbDLACores() const noexcept

    {

        return mImpl->getNbDLACores();

    }


    void setGpuAllocator(IGpuAllocator* allocator) noexcept

    {

        mImpl->setGpuAllocator(allocator);

    }


    //

    void setErrorRecorder(IErrorRecorder* recorder) noexcept

    {

        mImpl->setErrorRecorder(recorder);

    }


    IErrorRecorder* getErrorRecorder() const noexcept

    {

        return mImpl->getErrorRecorder();

    }


    ICudaEngine* deserializeCudaEngine(void const* blob, std::size_t size) noexcept

    {

        return mImpl->deserializeCudaEngine(blob, size);

    }


    ICudaEngine* deserializeCudaEngine(IStreamReaderV2& streamReader)

    {

        return mImpl->deserializeCudaEngineV2(streamReader);

    }


    ILogger* getLogger() const noexcept

    {

        return mImpl->getLogger();

    }


    bool setMaxThreads(int32_t maxThreads) noexcept

    {

        return mImpl->setMaxThreads(maxThreads);

    }


    int32_t getMaxThreads() const noexcept

    {

        return mImpl->getMaxThreads();

    }


    void setTemporaryDirectory(char const* path) noexcept

    {

        return mImpl->setTemporaryDirectory(path);

    }


    char const* getTemporaryDirectory() const noexcept

    {

        return mImpl->getTemporaryDirectory();

    }


    void setTempfileControlFlags(TempfileControlFlags flags) noexcept

    {

        return mImpl->setTempfileControlFlags(flags);

    }


    TempfileControlFlags getTempfileControlFlags() const noexcept

    {

        return mImpl->getTempfileControlFlags();

    }


    IPluginRegistry& getPluginRegistry() noexcept

    {

        return mImpl->getPluginRegistry();

    }


    IRuntime* loadRuntime(char const* path) noexcept

    {

        return mImpl->loadRuntime(path);

    }


    void setEngineHostCodeAllowed(bool allowed) noexcept

    {

        return mImpl->setEngineHostCodeAllowed(allowed);

    }


    bool getEngineHostCodeAllowed() const noexcept

    {

        return mImpl->getEngineHostCodeAllowed();

    }


  int64_t getEngineHeaderSize() const noexcept {

    return mImpl->getEngineHeaderSize();

  }


  EngineValidity getEngineValidity(void const* blob, int64_t blobSize, uint64_t* diagnostics) const noexcept {

    return mImpl->getEngineValidity(blob, blobSize, diagnostics);

  }


protected:

    apiv::VRuntime* mImpl;

};


class IRefitter : public INoCopy

{

public:

    virtual ~IRefitter() noexcept = default;


    bool setWeights(char const* layerName, WeightsRole role, Weights weights) noexcept

    {

        return mImpl->setWeights(layerName, role, weights);

    }


    bool refitCudaEngine() noexcept

    {

        return mImpl->refitCudaEngine();

    }


    int32_t getMissing(int32_t size, char const** layerNames, WeightsRole* roles) noexcept

    {

        return mImpl->getMissing(size, layerNames, roles);

    }


    int32_t getAll(int32_t size, char const** layerNames, WeightsRole* roles) noexcept

    {

        return mImpl->getAll(size, layerNames, roles);

    }


    //

    void setErrorRecorder(IErrorRecorder* recorder) noexcept

    {

        mImpl->setErrorRecorder(recorder);

    }


    IErrorRecorder* getErrorRecorder() const noexcept

    {

        return mImpl->getErrorRecorder();

    }


    bool setNamedWeights(char const* name, Weights weights) noexcept

    {

        return mImpl->setNamedWeights(name, weights);

    }


    int32_t getMissingWeights(int32_t size, char const** weightsNames) noexcept

    {

        return mImpl->getMissingWeights(size, weightsNames);

    }


    int32_t getAllWeights(int32_t size, char const** weightsNames) noexcept

    {

        return mImpl->getAllWeights(size, weightsNames);

    }


    ILogger* getLogger() const noexcept

    {

        return mImpl->getLogger();

    }


    bool setMaxThreads(int32_t maxThreads) noexcept

    {

        return mImpl->setMaxThreads(maxThreads);

    }


    int32_t getMaxThreads() const noexcept

    {

        return mImpl->getMaxThreads();

    }


    bool setNamedWeights(char const* name, Weights weights, TensorLocation location) noexcept

    {

        return mImpl->setNamedWeightsWithLocation(name, weights, location);

    }


    Weights getNamedWeights(char const* weightsName) const noexcept

    {

        return mImpl->getNamedWeights(weightsName);

    }


    TensorLocation getWeightsLocation(char const* weightsName) const noexcept

    {

        return mImpl->getWeightsLocation(weightsName);

    }


    bool unsetNamedWeights(char const* weightsName) noexcept

    {

        return mImpl->unsetNamedWeights(weightsName);

    }


    void setWeightsValidation(bool weightsValidation) noexcept

    {

        return mImpl->setWeightsValidation(weightsValidation);

    }


    bool getWeightsValidation() const noexcept

    {

        return mImpl->getWeightsValidation();

    }


    bool refitCudaEngineAsync(cudaStream_t stream) noexcept

    {

        return mImpl->refitCudaEngineAsync(stream);

    }


    Weights getWeightsPrototype(char const* weightsName) const noexcept

    {

        return mImpl->getWeightsPrototype(weightsName);

    }


protected:

    apiv::VRefitter* mImpl;

};


enum class OptProfileSelector : int32_t

{

    kMIN = 0,

    kOPT = 1,

    kMAX = 2

};


template <>

constexpr inline int32_t EnumMax<OptProfileSelector>() noexcept

{

    return 3;

}


class IOptimizationProfile : public INoCopy

{

public:

    bool setDimensions(char const* inputName, OptProfileSelector select, Dims const& dims) noexcept

    {

        return mImpl->setDimensions(inputName, select, dims);

    }


    Dims getDimensions(char const* inputName, OptProfileSelector select) const noexcept

    {

        return mImpl->getDimensions(inputName, select);

    }


    TRT_DEPRECATED bool setShapeValues(

        char const* inputName, OptProfileSelector select, int32_t const* values, int32_t nbValues) noexcept

    {

        return mImpl->setShapeValues(inputName, select, values, nbValues);

    }


    int32_t getNbShapeValues(char const* inputName) const noexcept

    {

        return mImpl->getNbShapeValues(inputName);

    }


    TRT_DEPRECATED int32_t const* getShapeValues(char const* inputName, OptProfileSelector select) const noexcept

    {

        return mImpl->getShapeValues(inputName, select);

    }


    bool setExtraMemoryTarget(float target) noexcept

    {

        return mImpl->setExtraMemoryTarget(target);

    }


    float getExtraMemoryTarget() const noexcept

    {

        return mImpl->getExtraMemoryTarget();

    }


    bool isValid() const noexcept

    {

        return mImpl->isValid();

    }


    bool setShapeValuesV2(

        char const* inputName, OptProfileSelector select, int64_t const* values, int32_t nbValues) noexcept

    {

        return mImpl->setShapeValuesV2(inputName, select, values, nbValues);

    }


    int64_t const* getShapeValuesV2(char const* inputName, OptProfileSelector select) const noexcept

    {

        return mImpl->getShapeValuesV2(inputName, select);

    }


protected:

    apiv::VOptimizationProfile* mImpl;

    virtual ~IOptimizationProfile() noexcept = default;

};


enum class TacticSource : int32_t

{

    kCUBLAS TRT_DEPRECATED_ENUM = 0,


    kCUBLAS_LT TRT_DEPRECATED_ENUM = 1,


    kCUDNN TRT_DEPRECATED_ENUM = 2,


    kEDGE_MASK_CONVOLUTIONS = 3,


    kJIT_CONVOLUTIONS = 4,

};


template <>

constexpr inline int32_t EnumMax<TacticSource>() noexcept

{

    return 5;

}


using TacticSources = uint32_t;


enum class ProfilingVerbosity : int32_t

{

    kLAYER_NAMES_ONLY = 0,

    kNONE = 1,

    kDETAILED = 2,

};


template <>

constexpr inline int32_t EnumMax<ProfilingVerbosity>() noexcept

{

    return 3;

}


using SerializationFlags = uint32_t;


enum class SerializationFlag : int32_t

{

    kEXCLUDE_WEIGHTS = 0,

    kEXCLUDE_LEAN_RUNTIME = 1,

    kINCLUDE_REFIT = 2,

};


template <>

constexpr inline int32_t EnumMax<SerializationFlag>() noexcept

{

    return 3;

}


class ISerializationConfig : public INoCopy

{

public:

    virtual ~ISerializationConfig() noexcept = default;


    bool setFlags(SerializationFlags serializationFlags) noexcept

    {

        return mImpl->setFlags(serializationFlags);

    }


    SerializationFlags getFlags() const noexcept

    {

        return mImpl->getFlags();

    }


    bool clearFlag(SerializationFlag serializationFlag) noexcept

    {

        return mImpl->clearFlag(serializationFlag);

    }


    bool setFlag(SerializationFlag serializationFlag) noexcept

    {

        return mImpl->setFlag(serializationFlag);

    }


    bool getFlag(SerializationFlag serializationFlag) const noexcept

    {

        return mImpl->getFlag(serializationFlag);

    }


protected:

    apiv::VSerializationConfig* mImpl;

};


enum class ExecutionContextAllocationStrategy : int32_t

{

    kSTATIC = 0,

    kON_PROFILE_CHANGE = 1,

    kUSER_MANAGED = 2,

};


template <>

constexpr inline int32_t EnumMax<ExecutionContextAllocationStrategy>() noexcept

{

    return 3;

}


class IRuntimeCache : public INoCopy

{

public:

    virtual ~IRuntimeCache() noexcept = default;


    IHostMemory* serialize() const noexcept

    {

        return mImpl->serialize();

    }


    bool deserialize(void const* blob, size_t size) noexcept

    {

        return mImpl->deserialize(blob, size);

    }


    bool reset() noexcept

    {

        return mImpl->reset();

    }


protected:

    apiv::VRuntimeCache* mImpl;

};


enum class DynamicShapesKernelSpecializationStrategy : int32_t

{

    kLAZY = 0,


    kEAGER = 1,


    kNONE = 2,

};


template <>

constexpr inline int32_t EnumMax<DynamicShapesKernelSpecializationStrategy>() noexcept

{

    return 3;

}


enum class CudaGraphStrategy : int32_t

{

    kDISABLED = 0,


    kWHOLE_GRAPH_CAPTURE = 1,

};


template <>

constexpr inline int32_t EnumMax<CudaGraphStrategy>() noexcept

{

    return 2;

}


class IRuntimeConfig : public INoCopy

{

public:

    virtual ~IRuntimeConfig() noexcept = default;


    void setExecutionContextAllocationStrategy(ExecutionContextAllocationStrategy strategy) noexcept

    {

        return mImpl->setExecutionContextAllocationStrategy(strategy);

    }


    ExecutionContextAllocationStrategy getExecutionContextAllocationStrategy() const noexcept

    {

        return mImpl->getExecutionContextAllocationStrategy();

    }


    IRuntimeCache* createRuntimeCache() const noexcept

    {

        return mImpl->createRuntimeCache();

    }


    bool setRuntimeCache(IRuntimeCache const& cache) noexcept

    {

        return mImpl->setRuntimeCache(cache);

    }


    IRuntimeCache* getRuntimeCache() const noexcept

    {

        return mImpl->getRuntimeCache();

    }


    void setDynamicShapesKernelSpecializationStrategy(

        DynamicShapesKernelSpecializationStrategy dynamicShapesKernelSpecializationStrategy) noexcept

    {

        return mImpl->setDynamicShapesKernelSpecializationStrategy(dynamicShapesKernelSpecializationStrategy);

    }


    DynamicShapesKernelSpecializationStrategy getDynamicShapesKernelSpecializationStrategy() const noexcept

    {

        return mImpl->getDynamicShapesKernelSpecializationStrategy();

    }


    bool setCudaGraphStrategy(CudaGraphStrategy strategy) noexcept

    {

        return mImpl->setCudaGraphStrategy(strategy);

    }


    CudaGraphStrategy getCudaGraphStrategy() const noexcept

    {

        return mImpl->getCudaGraphStrategy();

    }


protected:

    apiv::VRuntimeConfig* mImpl;

}; // class IRuntimeConfig


enum class EngineStat : int32_t

{

    kTOTAL_WEIGHTS_SIZE = 0,


    kSTRIPPED_WEIGHTS_SIZE = 1,

};


template <>

constexpr inline int32_t EnumMax<EngineStat>() noexcept

{

    return 2;

}


class ICudaEngine : public INoCopy

{

public:

    virtual ~ICudaEngine() noexcept = default;


    Dims getTensorShape(char const* tensorName) const noexcept

    {

        return mImpl->getTensorShape(tensorName);

    }


    DataType getTensorDataType(char const* tensorName) const noexcept

    {

        return mImpl->getTensorDataType(tensorName);

    }


    int32_t getNbLayers() const noexcept

    {

        return mImpl->getNbLayers();

    }


    IHostMemory* serialize() const noexcept

    {

        return mImpl->serialize();

    }


    IExecutionContext* createExecutionContext(

        ExecutionContextAllocationStrategy strategy = ExecutionContextAllocationStrategy::kSTATIC) noexcept

    {

        return mImpl->createExecutionContext(strategy);

    }


    TensorLocation getTensorLocation(char const* tensorName) const noexcept

    {

        return mImpl->getTensorLocation(tensorName);

    }


    bool isShapeInferenceIO(char const* tensorName) const noexcept

    {

        return mImpl->isShapeInferenceIO(tensorName);

    }


    TensorIOMode getTensorIOMode(char const* tensorName) const noexcept

    {

        return mImpl->getTensorIOMode(tensorName);

    }


    TRT_NODISCARD char const* getAliasedInputTensor(char const* tensorName) const noexcept

    {

        return mImpl->getAliasedInputTensor(tensorName);

    }


    IExecutionContext* createExecutionContext(IRuntimeConfig* runtimeConfig) noexcept

    {

        return mImpl->createExecutionContextWithRuntimeConfig(runtimeConfig);

    }


    IRuntimeConfig* createRuntimeConfig() noexcept

    {

        return mImpl->createRuntimeConfig();

    }


    int64_t getDeviceMemorySizeV2() const noexcept

    {

        return mImpl->getDeviceMemorySizeV2();

    }


    int64_t getDeviceMemorySizeForProfileV2(int32_t profileIndex) const noexcept

    {

        return mImpl->getDeviceMemorySizeForProfileV2(profileIndex);

    }


    bool isRefittable() const noexcept

    {

        return mImpl->isRefittable();

    }


    int32_t getTensorBytesPerComponent(char const* tensorName) const noexcept

    {

        return mImpl->getTensorBytesPerComponent(tensorName);

    }


    int32_t getTensorBytesPerComponent(char const* tensorName, int32_t profileIndex) const noexcept

    {

        return mImpl->getTensorBytesPerComponentV2(tensorName, profileIndex);

    }


    int32_t getTensorComponentsPerElement(char const* tensorName) const noexcept

    {

        return mImpl->getTensorComponentsPerElement(tensorName);

    }


    int32_t getTensorComponentsPerElement(char const* tensorName, int32_t profileIndex) const noexcept

    {

        return mImpl->getTensorComponentsPerElementV2(tensorName, profileIndex);

    }


    TensorFormat getTensorFormat(char const* tensorName) const noexcept

    {

        return mImpl->getTensorFormat(tensorName);

    }


    TensorFormat getTensorFormat(char const* tensorName, int32_t profileIndex) const noexcept

    {

        return mImpl->getTensorFormatV2(tensorName, profileIndex);

    }


    char const* getTensorFormatDesc(char const* tensorName) const noexcept

    {

        return mImpl->getTensorFormatDesc(tensorName);

    }


    char const* getTensorFormatDesc(char const* tensorName, int32_t profileIndex) const noexcept

    {

        return mImpl->getTensorFormatDescV2(tensorName, profileIndex);

    }


    int32_t getTensorVectorizedDim(char const* tensorName) const noexcept

    {

        return mImpl->getTensorVectorizedDim(tensorName);

    }


    int32_t getTensorVectorizedDim(char const* tensorName, int32_t profileIndex) const noexcept

    {

        return mImpl->getTensorVectorizedDimV2(tensorName, profileIndex);

    }


    char const* getName() const noexcept

    {

        return mImpl->getName();

    }


    int32_t getNbOptimizationProfiles() const noexcept

    {

        return mImpl->getNbOptimizationProfiles();

    }


    Dims getProfileShape(char const* tensorName, int32_t profileIndex, OptProfileSelector select) const noexcept

    {

        return mImpl->getProfileShape(tensorName, profileIndex, select);

    }


    EngineCapability getEngineCapability() const noexcept

    {

        return mImpl->getEngineCapability();

    }


    void setErrorRecorder(IErrorRecorder* recorder) noexcept

    {

        return mImpl->setErrorRecorder(recorder);

    }


    IErrorRecorder* getErrorRecorder() const noexcept

    {

        return mImpl->getErrorRecorder();

    }


    TRT_DEPRECATED bool hasImplicitBatchDimension() const noexcept

    {

        return mImpl->hasImplicitBatchDimension();

    }


    TacticSources getTacticSources() const noexcept

    {

        return mImpl->getTacticSources();

    }


    ProfilingVerbosity getProfilingVerbosity() const noexcept

    {

        return mImpl->getProfilingVerbosity();

    }


    IEngineInspector* createEngineInspector() const noexcept

    {

        return mImpl->createEngineInspector();

    }


    int32_t getNbIOTensors() const noexcept

    {

        return mImpl->getNbIOTensors();

    }


    char const* getIOTensorName(int32_t index) const noexcept

    {

        return mImpl->getIOTensorName(index);

    }


    HardwareCompatibilityLevel getHardwareCompatibilityLevel() const noexcept

    {

        return mImpl->getHardwareCompatibilityLevel();

    }


    int32_t getNbAuxStreams() const noexcept

    {

        return mImpl->getNbAuxStreams();

    }


    ISerializationConfig* createSerializationConfig() noexcept

    {

        return mImpl->createSerializationConfig();

    }


    IHostMemory* serializeWithConfig(ISerializationConfig& config) const noexcept

    {

        return mImpl->serializeWithConfig(config);

    }


    int64_t getStreamableWeightsSize() const noexcept

    {

        return mImpl->getStreamableWeightsSize();

    }


    bool setWeightStreamingBudgetV2(int64_t gpuMemoryBudget) noexcept

    {

        return mImpl->setWeightStreamingBudgetV2(gpuMemoryBudget);

    }


    int64_t getWeightStreamingBudgetV2() const noexcept

    {

        return mImpl->getWeightStreamingBudgetV2();

    }


    int64_t getWeightStreamingAutomaticBudget() const noexcept

    {

        return mImpl->getWeightStreamingAutomaticBudget();

    }


    int64_t getWeightStreamingScratchMemorySize() const noexcept

    {

        return mImpl->getWeightStreamingScratchMemorySize();

    }


    bool isDebugTensor(char const* name) const noexcept

    {

        return mImpl->isDebugTensor(name);

    }


    int64_t const* getProfileTensorValuesV2(

        char const* tensorName, int32_t profileIndex, OptProfileSelector select) const noexcept

    {

        return mImpl->getProfileTensorValuesV2(tensorName, profileIndex, select);

    }


    int64_t getEngineStat(EngineStat stat) const noexcept

    {

        return mImpl->getEngineStat(stat);

    }


protected:

    apiv::VCudaEngine* mImpl;

};


namespace v_1_0

{

class IOutputAllocator : public IVersionedInterface

{

public:

    InterfaceInfo getInterfaceInfo() const noexcept override

    {

        return {"IOutputAllocator", 1, 0};

    }


    virtual void* reallocateOutputAsync(

        char const* tensorName, void* currentMemory, uint64_t size, uint64_t alignment, cudaStream_t /*stream*/)

    {

        return nullptr;

    }


    virtual void notifyShape(char const* tensorName, Dims const& dims) noexcept = 0;

};

} // namespace v_1_0


using IOutputAllocator = v_1_0::IOutputAllocator;


namespace v_1_0

{

class IDebugListener : public IVersionedInterface

{

public:

    InterfaceInfo getInterfaceInfo() const noexcept override

    {

        return {"IDebugListener", 1, 0};

    }


    virtual bool processDebugTensor(void const* addr, TensorLocation location, DataType type, Dims const& shape,

        char const* name, cudaStream_t stream)

        = 0;


    ~IDebugListener() override = default;

};

} // namespace v_1_0


using IDebugListener = v_1_0::IDebugListener;


class IExecutionContext : public INoCopy

{

public:

    virtual ~IExecutionContext() noexcept = default;


    void setDebugSync(bool sync) noexcept

    {

        mImpl->setDebugSync(sync);

    }


    bool getDebugSync() const noexcept

    {

        return mImpl->getDebugSync();

    }


    void setProfiler(IProfiler* profiler) noexcept

    {

        mImpl->setProfiler(profiler);

    }


    IProfiler* getProfiler() const noexcept

    {

        return mImpl->getProfiler();

    }


    ICudaEngine const& getEngine() const noexcept

    {

        return mImpl->getEngine();

    }


    void setName(char const* name) noexcept

    {

        mImpl->setName(name);

    }


    char const* getName() const noexcept

    {

        return mImpl->getName();

    }


    void setDeviceMemory(void* memory) noexcept

    {

        mImpl->setDeviceMemory(memory);

    }


    void setDeviceMemoryV2(void* memory, int64_t size) noexcept

    {

        return mImpl->setDeviceMemoryV2(memory, size);

    }


    Dims getTensorStrides(char const* tensorName) const noexcept

    {

        return mImpl->getTensorStrides(tensorName);

    }


public:

    int32_t getOptimizationProfile() const noexcept

    {

        return mImpl->getOptimizationProfile();

    }


    bool setInputShape(char const* tensorName, Dims const& dims) noexcept

    {

        return mImpl->setInputShape(tensorName, dims);

    }


    Dims getTensorShape(char const* tensorName) const noexcept

    {

        return mImpl->getTensorShape(tensorName);

    }


    bool allInputDimensionsSpecified() const noexcept

    {

        return mImpl->allInputDimensionsSpecified();

    }


    void setErrorRecorder(IErrorRecorder* recorder) noexcept

    {

        mImpl->setErrorRecorder(recorder);

    }


    IErrorRecorder* getErrorRecorder() const noexcept

    {

        return mImpl->getErrorRecorder();

    }


    bool executeV2(void* const* bindings) noexcept

    {

        return mImpl->executeV2(bindings);

    }


    bool setOptimizationProfileAsync(int32_t profileIndex, cudaStream_t stream) noexcept

    {

        return mImpl->setOptimizationProfileAsync(profileIndex, stream);

    }


    void setEnqueueEmitsProfile(bool enqueueEmitsProfile) noexcept

    {

        mImpl->setEnqueueEmitsProfile(enqueueEmitsProfile);

    }


    bool getEnqueueEmitsProfile() const noexcept

    {

        return mImpl->getEnqueueEmitsProfile();

    }


    bool reportToProfiler() const noexcept

    {

        return mImpl->reportToProfiler();

    }


    bool setTensorAddress(char const* tensorName, void* data) noexcept

    {

        return mImpl->setTensorAddress(tensorName, data);

    }


    void const* getTensorAddress(char const* tensorName) const noexcept

    {

        return mImpl->getTensorAddress(tensorName);

    }


    bool setOutputTensorAddress(char const* tensorName, void* data) noexcept

    {

        return mImpl->setOutputTensorAddress(tensorName, data);

    }


    bool setInputTensorAddress(char const* tensorName, void const* data) noexcept

    {

        return mImpl->setInputTensorAddress(tensorName, data);

    }


    void* getOutputTensorAddress(char const* tensorName) const noexcept

    {

        return mImpl->getOutputTensorAddress(tensorName);

    }


    int32_t inferShapes(int32_t nbMaxNames, char const** tensorNames) noexcept

    {

        return mImpl->inferShapes(nbMaxNames, tensorNames);

    }


    size_t updateDeviceMemorySizeForShapes() noexcept

    {

        return mImpl->updateDeviceMemorySizeForShapes();

    }


    bool setInputConsumedEvent(cudaEvent_t event) noexcept

    {

        return mImpl->setInputConsumedEvent(event);

    }


    cudaEvent_t getInputConsumedEvent() const noexcept

    {

        return mImpl->getInputConsumedEvent();

    }


    bool setOutputAllocator(char const* tensorName, IOutputAllocator* outputAllocator) noexcept

    {

        return mImpl->setOutputAllocator(tensorName, outputAllocator);

    }


    IOutputAllocator* getOutputAllocator(char const* tensorName) const noexcept

    {

        return mImpl->getOutputAllocator(tensorName);

    }


    int64_t getMaxOutputSize(char const* tensorName) const noexcept

    {

        return mImpl->getMaxOutputSize(tensorName);

    }


    bool setTemporaryStorageAllocator(IGpuAllocator* allocator) noexcept

    {

        return mImpl->setTemporaryStorageAllocator(allocator);

    }


    IGpuAllocator* getTemporaryStorageAllocator() const noexcept

    {

        return mImpl->getTemporaryStorageAllocator();

    }


    bool enqueueV3(cudaStream_t stream) noexcept

    {

        return mImpl->enqueueV3(stream);

    }


    void setPersistentCacheLimit(size_t size) noexcept

    {

        mImpl->setPersistentCacheLimit(size);

    }


    size_t getPersistentCacheLimit() const noexcept

    {

        return mImpl->getPersistentCacheLimit();

    }


    bool setNvtxVerbosity(ProfilingVerbosity verbosity) noexcept

    {

        return mImpl->setNvtxVerbosity(verbosity);

    }


    ProfilingVerbosity getNvtxVerbosity() const noexcept

    {

        return mImpl->getNvtxVerbosity();

    }


    void setAuxStreams(cudaStream_t* auxStreams, int32_t nbStreams) noexcept

    {

        mImpl->setAuxStreams(auxStreams, nbStreams);

    }


    bool setDebugListener(IDebugListener* listener) noexcept

    {

        return mImpl->setDebugListener(listener);

    }


    IDebugListener* getDebugListener() noexcept

    {

        return mImpl->getDebugListener();

    }


    bool setTensorDebugState(char const* name, bool flag) noexcept

    {

        return mImpl->setTensorDebugState(name, flag);

    }


    bool getDebugState(char const* name) const noexcept

    {

        return mImpl->getDebugState(name);

    }


    IRuntimeConfig* getRuntimeConfig() const noexcept

    {

        return mImpl->getRuntimeConfig();

    }


    bool setAllTensorsDebugState(bool flag) noexcept

    {

        return mImpl->setAllTensorsDebugState(flag);

    }


    bool setUnfusedTensorsDebugState(bool flag) noexcept

    {

        return mImpl->setUnfusedTensorsDebugState(flag);

    }


    bool getUnfusedTensorsDebugState() const noexcept

    {

        return mImpl->getUnfusedTensorsDebugState();

    }

#if ENABLE_FEATURE_DISABLE_RUNTIME_ALLOCATION

    bool isStreamCapturable(cudaStream_t stream) const noexcept {

        return mImpl->isStreamCapturable(stream);

    }

#endif // ENABLE_FEATURE_DISABLE_RUNTIME_ALLOCATION


protected:

    apiv::VExecutionContext* mImpl;

}; // class IExecutionContext


enum class LayerInformationFormat : int32_t

{

    kONELINE = 0,

    kJSON = 1,

};


template <>

constexpr inline int32_t EnumMax<LayerInformationFormat>() noexcept

{

    return 2;

}


class IEngineInspector : public INoCopy

{

public:

    virtual ~IEngineInspector() noexcept = default;


    bool setExecutionContext(IExecutionContext const* context) noexcept

    {

        return mImpl->setExecutionContext(context);

    }


    IExecutionContext const* getExecutionContext() const noexcept

    {

        return mImpl->getExecutionContext();

    }


    char const* getLayerInformation(int32_t layerIndex, LayerInformationFormat format) const noexcept

    {

        return mImpl->getLayerInformation(layerIndex, format);

    }


    char const* getEngineInformation(LayerInformationFormat format) const noexcept

    {

        return mImpl->getEngineInformation(format);

    }


    void setErrorRecorder(IErrorRecorder* recorder) noexcept

    {

        mImpl->setErrorRecorder(recorder);

    }


    IErrorRecorder* getErrorRecorder() const noexcept

    {

        return mImpl->getErrorRecorder();

    }


protected:

    apiv::VEngineInspector* mImpl;

}; // class IEngineInspector


} // namespace nvinfer1


extern "C" TENSORRTAPI void* createInferRuntime_INTERNAL(void* logger, int32_t version) noexcept;


extern "C" TENSORRTAPI void* createInferRefitter_INTERNAL(void* engine, void* logger, int32_t version) noexcept;


extern "C" TENSORRTAPI nvinfer1::IPluginRegistry* getPluginRegistry() noexcept;


extern "C" TENSORRTAPI nvinfer1::ILogger* getLogger() noexcept;


namespace nvinfer1

{

namespace // unnamed namespace avoids linkage surprises when linking objects built with different versions of this

          // header.

{

inline IRuntime* createInferRuntime(ILogger& logger) noexcept

{

    return static_cast<IRuntime*>(createInferRuntime_INTERNAL(&logger, NV_TENSORRT_VERSION));

}


inline IRefitter* createInferRefitter(ICudaEngine& engine, ILogger& logger) noexcept

{

    return static_cast<IRefitter*>(createInferRefitter_INTERNAL(&engine, &logger, NV_TENSORRT_VERSION));

}


} // namespace


template <typename T>

class PluginRegistrar

{

public:

    PluginRegistrar()

    {

        getPluginRegistry()->registerCreator(instance, "");

    }


private:

    T instance{};

};


} // namespace nvinfer1


#define REGISTER_TENSORRT_PLUGIN(name)                                                                                 \

    static nvinfer1::PluginRegistrar<name> pluginRegistrar##name {}


namespace nvinfer1

{

class ILoggerFinder

{

public:

    virtual ILogger* findLogger() = 0;


protected:

    virtual ~ILoggerFinder() = default;

};


namespace v_1_0

{


class IGpuAsyncAllocator : public IGpuAllocator

{

public:

    IGpuAsyncAllocator() = default;

    ~IGpuAsyncAllocator() override = default;


    void* allocateAsync(uint64_t const size, uint64_t const alignment, AllocatorFlags const flags,

        cudaStream_t /*stream*/) noexcept override = 0;


    bool deallocateAsync(void* const memory, cudaStream_t /*stream*/) noexcept override = 0;


    TRT_DEPRECATED void* allocate(

        uint64_t const size, uint64_t const alignment, AllocatorFlags const flags) noexcept override

    {

        return allocateAsync(size, alignment, flags, nullptr);

    }


    TRT_DEPRECATED bool deallocate(void* const memory) noexcept override

    {

        return deallocateAsync(memory, nullptr);

    }


    InterfaceInfo getInterfaceInfo() const noexcept override

    {

        return {"IGpuAllocator", 1, 0};

    }

};


class IPluginCreatorV3One : public IPluginCreatorInterface

{

public:

    InterfaceInfo getInterfaceInfo() const noexcept override

    {

        return InterfaceInfo{"PLUGIN CREATOR_V3ONE", 1, 0};

    }


    virtual IPluginV3* createPlugin(

        AsciiChar const* name, PluginFieldCollection const* fc, TensorRTPhase phase) noexcept = 0;


    virtual PluginFieldCollection const* getFieldNames() noexcept = 0;


    virtual AsciiChar const* getPluginName() const noexcept = 0;


    virtual AsciiChar const* getPluginVersion() const noexcept = 0;


    virtual AsciiChar const* getPluginNamespace() const noexcept = 0;


    IPluginCreatorV3One() = default;

    virtual ~IPluginCreatorV3One() = default;


protected:

    IPluginCreatorV3One(IPluginCreatorV3One const&) = default;

    IPluginCreatorV3One(IPluginCreatorV3One&&) = default;

    IPluginCreatorV3One& operator=(IPluginCreatorV3One const&) & = default;

    IPluginCreatorV3One& operator=(IPluginCreatorV3One&&) & = default;

};


} // namespace v_1_0


using IGpuAsyncAllocator = v_1_0::IGpuAsyncAllocator;


using IPluginCreatorV3One = v_1_0::IPluginCreatorV3One;


} // namespace nvinfer1


extern "C" TENSORRTAPI int32_t getInferLibMajorVersion() noexcept;

extern "C" TENSORRTAPI int32_t getInferLibMinorVersion() noexcept;

extern "C" TENSORRTAPI int32_t getInferLibPatchVersion() noexcept;

extern "C" TENSORRTAPI int32_t getInferLibBuildVersion() noexcept;


#endif // NV_INFER_RUNTIME_H

NvInferImpl.h

NvInferPluginBase.h

getPluginRegistry
TENSORRTAPI nvinfer1::IPluginRegistry * getPluginRegistry() noexcept
Return the plugin registry.

getLogger
TENSORRTAPI nvinfer1::ILogger * getLogger() noexcept
Return the logger object.

getInferLibMinorVersion
TENSORRTAPI int32_t getInferLibMinorVersion() noexcept
Return the library minor version number.

getInferLibMajorVersion
TENSORRTAPI int32_t getInferLibMajorVersion() noexcept
Return the library major version number.

getInferLibPatchVersion
TENSORRTAPI int32_t getInferLibPatchVersion() noexcept
Return the library patch version number.

getInferLibBuildVersion
TENSORRTAPI int32_t getInferLibBuildVersion() noexcept
Return the library build version number.

TENSORRTAPI
#define TENSORRTAPI
Definition: NvInferRuntimeBase.h:69

NV_TENSORRT_VERSION
#define NV_TENSORRT_VERSION
Definition: NvInferRuntimeBase.h:101

TRT_NODISCARD
#define TRT_NODISCARD
A stand-in for [[nodiscard]] and [[nodiscard(REASON)]] that works with older compilers.
Definition: NvInferRuntimeBase.h:57

TRT_DEPRECATED
#define TRT_DEPRECATED
Definition: NvInferRuntimeBase.h:42

TRT_DEPRECATED_ENUM
#define TRT_DEPRECATED_ENUM
Definition: NvInferRuntimeBase.h:43

NvInferRuntimeCommon.h

Dims
Structure to define the dimensions of a tensor.

nvinfer1::Dims64
Definition: NvInferRuntimeBase.h:218

nvinfer1::Dims64::MAX_DIMS
static constexpr int32_t MAX_DIMS
The maximum rank (number of dimensions) supported for a tensor.
Definition: NvInferRuntimeBase.h:221

nvinfer1::DimsExprs
Analog of class Dims with expressions instead of constants for the dimensions.
Definition: NvInferRuntime.h:350

nvinfer1::DimsExprs::d
IDimensionExpr const  * d[Dims::MAX_DIMS]
The extent of each dimension.
Definition: NvInferRuntime.h:353

nvinfer1::DimsExprs::nbDims
int32_t nbDims
The number of dimensions.
Definition: NvInferRuntime.h:352

nvinfer1::ICudaEngine
An engine for executing inference on a built network, with functionally unsafe features.
Definition: NvInferRuntime.h:3401

nvinfer1::ICudaEngine::getTensorBytesPerComponent
int32_t getTensorBytesPerComponent(char const *tensorName) const noexcept
Return the number of bytes per component of an element, or -1 if the tensor is not vectorized or prov...
Definition: NvInferRuntime.h:3634

nvinfer1::ICudaEngine::createSerializationConfig
ISerializationConfig * createSerializationConfig() noexcept
Create a serialization configuration object.
Definition: NvInferRuntime.h:4008

nvinfer1::ICudaEngine::getIOTensorName
char const * getIOTensorName(int32_t index) const noexcept
Return name of an IO tensor.
Definition: NvInferRuntime.h:3972

nvinfer1::ICudaEngine::getWeightStreamingBudgetV2
int64_t getWeightStreamingBudgetV2() const noexcept
Returns the current weight streaming device memory budget in bytes.
Definition: NvInferRuntime.h:4104

nvinfer1::ICudaEngine::getEngineCapability
EngineCapability getEngineCapability() const noexcept
Determine what execution capability this engine has.
Definition: NvInferRuntime.h:3861

nvinfer1::ICudaEngine::getErrorRecorder
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:3895

nvinfer1::ICudaEngine::getTensorFormat
TensorFormat getTensorFormat(char const *tensorName, int32_t profileIndex) const noexcept
Return the tensor format of given profile, or TensorFormat::kLINEAR if the provided name does not map...
Definition: NvInferRuntime.h:3720

nvinfer1::ICudaEngine::getProfileTensorValuesV2
int64_t const * getProfileTensorValuesV2(char const *tensorName, int32_t profileIndex, OptProfileSelector select) const noexcept
Get the minimum / optimum / maximum values (not dimensions) for an input tensor given its name under ...
Definition: NvInferRuntime.h:4195

nvinfer1::ICudaEngine::hasImplicitBatchDimension
TRT_DEPRECATED bool hasImplicitBatchDimension() const noexcept
Query whether the engine was built with an implicit batch dimension.
Definition: NvInferRuntime.h:3909

nvinfer1::ICudaEngine::mImpl
apiv::VCudaEngine * mImpl
Definition: NvInferRuntime.h:4230

nvinfer1::ICudaEngine::createExecutionContext
IExecutionContext * createExecutionContext(ExecutionContextAllocationStrategy strategy=ExecutionContextAllocationStrategy::kSTATIC) noexcept
Create an execution context and specify the strategy for allocating internal activation memory.
Definition: NvInferRuntime.h:3475

nvinfer1::ICudaEngine::getTensorFormatDesc
char const * getTensorFormatDesc(char const *tensorName) const noexcept
Return the human readable description of the tensor format, or empty string if the provided name does...
Definition: NvInferRuntime.h:3744

nvinfer1::ICudaEngine::getProfileShape
Dims getProfileShape(char const *tensorName, int32_t profileIndex, OptProfileSelector select) const noexcept
Get the minimum / optimum / maximum dimensions for an input tensor given its name under an optimizati...
Definition: NvInferRuntime.h:3846

nvinfer1::ICudaEngine::setWeightStreamingBudgetV2
bool setWeightStreamingBudgetV2(int64_t gpuMemoryBudget) noexcept
Limit the maximum amount of GPU memory usable for network weights in bytes.
Definition: NvInferRuntime.h:4086

nvinfer1::ICudaEngine::createExecutionContext
IExecutionContext * createExecutionContext(IRuntimeConfig *runtimeConfig) noexcept
Create an execution context with TensorRT JIT runtime config.
Definition: NvInferRuntime.h:3558

nvinfer1::ICudaEngine::getNbAuxStreams
int32_t getNbAuxStreams() const noexcept
Return the number of auxiliary streams used by this engine.
Definition: NvInferRuntime.h:3998

nvinfer1::ICudaEngine::getStreamableWeightsSize
int64_t getStreamableWeightsSize() const noexcept
Get the total size in bytes of all streamable weights.
Definition: NvInferRuntime.h:4044

nvinfer1::ICudaEngine::getTensorDataType
DataType getTensorDataType(char const *tensorName) const noexcept
Determine the required data type for a buffer from its tensor name.
Definition: NvInferRuntime.h:3430

nvinfer1::ICudaEngine::setErrorRecorder
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:3880

nvinfer1::ICudaEngine::getTacticSources
TacticSources getTacticSources() const noexcept
return the tactic sources required by this engine.
Definition: NvInferRuntime.h:3925

nvinfer1::ICudaEngine::getAliasedInputTensor
TRT_NODISCARD char const * getAliasedInputTensor(char const *tensorName) const noexcept
Get the input tensor name that an output tensor should alias with.
Definition: NvInferRuntime.h:3546

nvinfer1::ICudaEngine::serializeWithConfig
IHostMemory * serializeWithConfig(ISerializationConfig &config) const noexcept
Serialize the network to a stream with the provided SerializationConfig.
Definition: NvInferRuntime.h:4028

nvinfer1::ICudaEngine::~ICudaEngine
virtual ~ICudaEngine() noexcept=default

nvinfer1::ICudaEngine::getWeightStreamingAutomaticBudget
int64_t getWeightStreamingAutomaticBudget() const noexcept
TensorRT automatically determines a device memory budget for the model to run. The budget is close to...
Definition: NvInferRuntime.h:4129

nvinfer1::ICudaEngine::isDebugTensor
bool isDebugTensor(char const *name) const noexcept
Check if a tensor is marked as a debug tensor.
Definition: NvInferRuntime.h:4171

nvinfer1::ICudaEngine::getTensorVectorizedDim
int32_t getTensorVectorizedDim(char const *tensorName, int32_t profileIndex) const noexcept
Return the dimension index that the buffer is vectorized of given profile, or -1 if the provided name...
Definition: NvInferRuntime.h:3800

nvinfer1::ICudaEngine::getName
char const * getName() const noexcept
Returns the name of the network associated with the engine.
Definition: NvInferRuntime.h:3815

nvinfer1::ICudaEngine::getProfilingVerbosity
ProfilingVerbosity getProfilingVerbosity() const noexcept
Return the ProfilingVerbosity the builder config was set to when the engine was built.
Definition: NvInferRuntime.h:3937

nvinfer1::ICudaEngine::isShapeInferenceIO
bool isShapeInferenceIO(char const *tensorName) const noexcept
True if tensor is required as input for shape calculations or is output from shape calculations.
Definition: NvInferRuntime.h:3513

nvinfer1::ICudaEngine::getWeightStreamingScratchMemorySize
int64_t getWeightStreamingScratchMemorySize() const noexcept
Returns the size of the scratch memory required by the current weight streaming budget.
Definition: NvInferRuntime.h:4157

nvinfer1::ICudaEngine::getDeviceMemorySizeV2
int64_t getDeviceMemorySizeV2() const noexcept
Return the maximum device memory required by the context over all profiles.
Definition: NvInferRuntime.h:3587

nvinfer1::ICudaEngine::getTensorVectorizedDim
int32_t getTensorVectorizedDim(char const *tensorName) const noexcept
Return the dimension index that the buffer is vectorized, or -1 if the provided name does not map to ...
Definition: NvInferRuntime.h:3784

nvinfer1::ICudaEngine::getTensorComponentsPerElement
int32_t getTensorComponentsPerElement(char const *tensorName, int32_t profileIndex) const noexcept
Return the number of components included in one element of given profile, or -1 if tensor is not vect...
Definition: NvInferRuntime.h:3691

nvinfer1::ICudaEngine::getDeviceMemorySizeForProfileV2
int64_t getDeviceMemorySizeForProfileV2(int32_t profileIndex) const noexcept
Return the maximum device memory required by the context for a profile.
Definition: NvInferRuntime.h:3603

nvinfer1::ICudaEngine::createRuntimeConfig
IRuntimeConfig * createRuntimeConfig() noexcept
Create a runtime config for TensorRT JIT. The caller is responsible for ownership of the returned IRu...
Definition: NvInferRuntime.h:3571

nvinfer1::ICudaEngine::getTensorFormat
TensorFormat getTensorFormat(char const *tensorName) const noexcept
Return the tensor format, or TensorFormat::kLINEAR if the provided name does not map to an input or o...
Definition: NvInferRuntime.h:3706

nvinfer1::ICudaEngine::serialize
IHostMemory * serialize() const noexcept
Serialize the network to a stream.
Definition: NvInferRuntime.h:3458

nvinfer1::ICudaEngine::getEngineStat
int64_t getEngineStat(EngineStat stat) const noexcept
Get engine statistics according to the given enum value.
Definition: NvInferRuntime.h:4224

nvinfer1::ICudaEngine::getTensorLocation
TensorLocation getTensorLocation(char const *tensorName) const noexcept
Get whether an input or output tensor must be on GPU or CPU.
Definition: NvInferRuntime.h:3493

nvinfer1::ICudaEngine::createEngineInspector
IEngineInspector * createEngineInspector() const noexcept
Create a new engine inspector which prints the layer information in an engine or an execution context...
Definition: NvInferRuntime.h:3947

nvinfer1::ICudaEngine::getTensorBytesPerComponent
int32_t getTensorBytesPerComponent(char const *tensorName, int32_t profileIndex) const noexcept
Return the number of bytes per component of an element given of given profile, or -1 if the tensor is...
Definition: NvInferRuntime.h:3652

nvinfer1::ICudaEngine::getHardwareCompatibilityLevel
HardwareCompatibilityLevel getHardwareCompatibilityLevel() const noexcept
Return the hardware compatibility level of this engine.
Definition: NvInferRuntime.h:3983

nvinfer1::ICudaEngine::getNbOptimizationProfiles
int32_t getNbOptimizationProfiles() const noexcept
Get the number of optimization profiles defined for this engine.
Definition: NvInferRuntime.h:3826

nvinfer1::ICudaEngine::getTensorFormatDesc
char const * getTensorFormatDesc(char const *tensorName, int32_t profileIndex) const noexcept
Return the human readable description of the tensor format of given profile, or empty string if the p...
Definition: NvInferRuntime.h:3767

nvinfer1::ICudaEngine::getTensorIOMode
TensorIOMode getTensorIOMode(char const *tensorName) const noexcept
Determine whether a tensor is an input or output tensor.
Definition: NvInferRuntime.h:3527

nvinfer1::ICudaEngine::getNbLayers
int32_t getNbLayers() const noexcept
Get the number of layers in the network.
Definition: NvInferRuntime.h:3444

nvinfer1::ICudaEngine::getNbIOTensors
int32_t getNbIOTensors() const noexcept
Return number of IO tensors.
Definition: NvInferRuntime.h:3960

nvinfer1::ICudaEngine::getTensorComponentsPerElement
int32_t getTensorComponentsPerElement(char const *tensorName) const noexcept
Return the number of components included in one element, or -1 if tensor is not vectorized or if the ...
Definition: NvInferRuntime.h:3673

nvinfer1::ICudaEngine::isRefittable
bool isRefittable() const noexcept
Return true if an engine can be refit.
Definition: NvInferRuntime.h:3613

nvinfer1::IDimensionExpr
An IDimensionExpr represents an integer expression constructed from constants, input dimensions,...
Definition: NvInferRuntime.h:232

nvinfer1::IDimensionExpr::isConstant
bool isConstant() const noexcept
Return true if expression is a build-time constant.
Definition: NvInferRuntime.h:237

nvinfer1::IDimensionExpr::isSizeTensor
bool isSizeTensor() const noexcept
Return true if this denotes the value of a size tensor.
Definition: NvInferRuntime.h:263

nvinfer1::IDimensionExpr::~IDimensionExpr
virtual ~IDimensionExpr() noexcept=default

nvinfer1::IDimensionExpr::mImpl
apiv::VDimensionExpr * mImpl
Definition: NvInferRuntime.h:254

nvinfer1::IDimensionExpr::getConstantValue
int64_t getConstantValue() const noexcept
Get the value of the constant.
Definition: NvInferRuntime.h:248

nvinfer1::IEngineInspector
An engine inspector which prints out the layer information of an engine or an execution context.
Definition: NvInferRuntime.h:5302

nvinfer1::IEngineInspector::getLayerInformation
char const * getLayerInformation(int32_t layerIndex, LayerInformationFormat format) const noexcept
Get a string describing the information about a specific layer in the current engine or the execution...
Definition: NvInferRuntime.h:5355

nvinfer1::IEngineInspector::getErrorRecorder
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:5412

nvinfer1::IEngineInspector::setErrorRecorder
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:5397

nvinfer1::IEngineInspector::getExecutionContext
IExecutionContext const * getExecutionContext() const noexcept
Get the context currently being inspected.
Definition: NvInferRuntime.h:5330

nvinfer1::IEngineInspector::mImpl
apiv::VEngineInspector * mImpl
Definition: NvInferRuntime.h:5418

nvinfer1::IEngineInspector::~IEngineInspector
virtual ~IEngineInspector() noexcept=default

nvinfer1::IEngineInspector::getEngineInformation
char const * getEngineInformation(LayerInformationFormat format) const noexcept
Get a string describing the information about all the layers in the current engine or the execution c...
Definition: NvInferRuntime.h:5378

nvinfer1::IExecutionContext
Context for executing inference using an engine, with functionally unsafe features.
Definition: NvInferRuntime.h:4347

nvinfer1::IExecutionContext::getOutputAllocator
IOutputAllocator * getOutputAllocator(char const *tensorName) const noexcept
Get output allocator associated with output tensor of given name, or nullptr if the provided name doe...
Definition: NvInferRuntime.h:4965

nvinfer1::IExecutionContext::getErrorRecorder
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:4613

nvinfer1::IExecutionContext::reportToProfiler
bool reportToProfiler() const noexcept
Calculate layer timing info for the current optimization profile in IExecutionContext and update the ...
Definition: NvInferRuntime.h:4732

nvinfer1::IExecutionContext::~IExecutionContext
virtual ~IExecutionContext() noexcept=default

nvinfer1::IExecutionContext::setDeviceMemory
void setDeviceMemory(void *memory) noexcept
Set the device memory for use by this execution context.
Definition: NvInferRuntime.h:4450

nvinfer1::IExecutionContext::setTensorDebugState
bool setTensorDebugState(char const *name, bool flag) noexcept
Set debug state of tensor given the tensor name.
Definition: NvInferRuntime.h:5172

nvinfer1::IExecutionContext::getName
char const * getName() const noexcept
Return the name of the execution context.
Definition: NvInferRuntime.h:4423

nvinfer1::IExecutionContext::getTemporaryStorageAllocator
IGpuAllocator * getTemporaryStorageAllocator() const noexcept
Get allocator set by setTemporaryStorageAllocator.
Definition: NvInferRuntime.h:5013

nvinfer1::IExecutionContext::setEnqueueEmitsProfile
void setEnqueueEmitsProfile(bool enqueueEmitsProfile) noexcept
Set whether enqueue emits layer timing to the profiler.
Definition: NvInferRuntime.h:4690

nvinfer1::IExecutionContext::setUnfusedTensorsDebugState
bool setUnfusedTensorsDebugState(bool flag) noexcept
Turn the debug state of unfused tensors on or off.
Definition: NvInferRuntime.h:5223

nvinfer1::IExecutionContext::getTensorShape
Dims getTensorShape(char const *tensorName) const noexcept
Return the shape of the given input or output.
Definition: NvInferRuntime.h:4563

nvinfer1::IExecutionContext::getDebugState
bool getDebugState(char const *name) const noexcept
Get the debug state.
Definition: NvInferRuntime.h:5184

nvinfer1::IExecutionContext::setInputShape
bool setInputShape(char const *tensorName, Dims const &dims) noexcept
Set shape of given input.
Definition: NvInferRuntime.h:4526

nvinfer1::IExecutionContext::executeV2
bool executeV2(void *const *bindings) noexcept
Synchronously execute a network.
Definition: NvInferRuntime.h:4630

nvinfer1::IExecutionContext::getEnqueueEmitsProfile
bool getEnqueueEmitsProfile() const noexcept
Get the enqueueEmitsProfile state.
Definition: NvInferRuntime.h:4702

nvinfer1::IExecutionContext::getTensorAddress
void const * getTensorAddress(char const *tensorName) const noexcept
Get memory address bound to given input or output tensor, or nullptr if the provided name does not ma...
Definition: NvInferRuntime.h:4793

nvinfer1::IExecutionContext::setOutputAllocator
bool setOutputAllocator(char const *tensorName, IOutputAllocator *outputAllocator) noexcept
Set output allocator to use for output tensor of given name. Pass nullptr to outputAllocator to unset...
Definition: NvInferRuntime.h:4952

nvinfer1::IExecutionContext::setOptimizationProfileAsync
bool setOptimizationProfileAsync(int32_t profileIndex, cudaStream_t stream) noexcept
Select an optimization profile for the current context with async semantics.
Definition: NvInferRuntime.h:4674

nvinfer1::IExecutionContext::mImpl
apiv::VExecutionContext * mImpl
Definition: NvInferRuntime.h:5262

nvinfer1::IExecutionContext::setOutputTensorAddress
bool setOutputTensorAddress(char const *tensorName, void *data) noexcept
Set the memory address for a given output tensor.
Definition: NvInferRuntime.h:4816

nvinfer1::IExecutionContext::setPersistentCacheLimit
void setPersistentCacheLimit(size_t size) noexcept
Set the maximum size for persistent cache usage.
Definition: NvInferRuntime.h:5053

nvinfer1::IExecutionContext::getPersistentCacheLimit
size_t getPersistentCacheLimit() const noexcept
Get the maximum size for persistent cache usage.
Definition: NvInferRuntime.h:5064

nvinfer1::IExecutionContext::setAllTensorsDebugState
bool setAllTensorsDebugState(bool flag) noexcept
Turn the debug state of all debug tensors on or off.
Definition: NvInferRuntime.h:5207

nvinfer1::IExecutionContext::getEngine
ICudaEngine const & getEngine() const noexcept
Get the associated engine.
Definition: NvInferRuntime.h:4399

nvinfer1::IExecutionContext::getNvtxVerbosity
ProfilingVerbosity getNvtxVerbosity() const noexcept
Get the NVTX verbosity of the execution context.
Definition: NvInferRuntime.h:5100

nvinfer1::IExecutionContext::updateDeviceMemorySizeForShapes
size_t updateDeviceMemorySizeForShapes() noexcept
Recompute the internal activation buffer sizes based on the current input shapes, and return the tota...
Definition: NvInferRuntime.h:4907

nvinfer1::IExecutionContext::setAuxStreams
void setAuxStreams(cudaStream_t *auxStreams, int32_t nbStreams) noexcept
Set the auxiliary streams that TensorRT should launch kernels on in the next enqueueV3() call.
Definition: NvInferRuntime.h:5131

nvinfer1::IExecutionContext::getMaxOutputSize
int64_t getMaxOutputSize(char const *tensorName) const noexcept
Get upper bound on an output tensor's size, in bytes, based on the current optimization profile and i...
Definition: NvInferRuntime.h:4983

nvinfer1::IExecutionContext::inferShapes
int32_t inferShapes(int32_t nbMaxNames, char const **tensorNames) noexcept
Run shape calculations.
Definition: NvInferRuntime.h:4890

nvinfer1::IExecutionContext::setDebugListener
bool setDebugListener(IDebugListener *listener) noexcept
Set DebugListener for this execution context.
Definition: NvInferRuntime.h:5143

nvinfer1::IExecutionContext::setTensorAddress
bool setTensorAddress(char const *tensorName, void *data) noexcept
Set memory address for given input or output tensor.
Definition: NvInferRuntime.h:4776

nvinfer1::IExecutionContext::setTemporaryStorageAllocator
bool setTemporaryStorageAllocator(IGpuAllocator *allocator) noexcept
Specify allocator to use for internal temporary storage.
Definition: NvInferRuntime.h:5003

nvinfer1::IExecutionContext::getOutputTensorAddress
void * getOutputTensorAddress(char const *tensorName) const noexcept
Get memory address for given output.
Definition: NvInferRuntime.h:4857

nvinfer1::IExecutionContext::enqueueV3
bool enqueueV3(cudaStream_t stream) noexcept
Enqueue inference on a stream.
Definition: NvInferRuntime.h:5037

nvinfer1::IExecutionContext::getDebugListener
IDebugListener * getDebugListener() noexcept
Get the DebugListener of this execution context.
Definition: NvInferRuntime.h:5153

nvinfer1::IExecutionContext::getOptimizationProfile
int32_t getOptimizationProfile() const noexcept
Get the index of the currently selected optimization profile.
Definition: NvInferRuntime.h:4508

nvinfer1::IExecutionContext::setInputTensorAddress
bool setInputTensorAddress(char const *tensorName, void const *data) noexcept
Set memory address for given input.
Definition: NvInferRuntime.h:4838

nvinfer1::IExecutionContext::getDebugSync
bool getDebugSync() const noexcept
Get the debug sync flag.
Definition: NvInferRuntime.h:4369

nvinfer1::IExecutionContext::setInputConsumedEvent
bool setInputConsumedEvent(cudaEvent_t event) noexcept
Mark input as consumed.
Definition: NvInferRuntime.h:4923

nvinfer1::IExecutionContext::getTensorStrides
Dims getTensorStrides(char const *tensorName) const noexcept
Return the strides of the buffer for the given tensor name.
Definition: NvInferRuntime.h:4493

nvinfer1::IExecutionContext::setNvtxVerbosity
bool setNvtxVerbosity(ProfilingVerbosity verbosity) noexcept
Set the verbosity of the NVTX markers in the execution context.
Definition: NvInferRuntime.h:5088

nvinfer1::IExecutionContext::getProfiler
IProfiler * getProfiler() const noexcept
Get the profiler.
Definition: NvInferRuntime.h:4389

nvinfer1::IExecutionContext::setErrorRecorder
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:4598

nvinfer1::IExecutionContext::setDeviceMemoryV2
void setDeviceMemoryV2(void *memory, int64_t size) noexcept
Set the device memory and its corresponding size for use by this execution context.
Definition: NvInferRuntime.h:4472

nvinfer1::IExecutionContext::allInputDimensionsSpecified
bool allInputDimensionsSpecified() const noexcept
Whether all dynamic dimensions of input tensors have been specified.
Definition: NvInferRuntime.h:4579

nvinfer1::IExecutionContext::getUnfusedTensorsDebugState
bool getUnfusedTensorsDebugState() const noexcept
Get the debug state of unfused tensors.
Definition: NvInferRuntime.h:5233

nvinfer1::IExecutionContext::setProfiler
void setProfiler(IProfiler *profiler) noexcept
Set the profiler.
Definition: NvInferRuntime.h:4379

nvinfer1::IExecutionContext::setName
void setName(char const *name) noexcept
Set the name of the execution context.
Definition: NvInferRuntime.h:4413

nvinfer1::IExecutionContext::getInputConsumedEvent
cudaEvent_t getInputConsumedEvent() const noexcept
The event associated with consuming the input.
Definition: NvInferRuntime.h:4933

nvinfer1::IExecutionContext::getRuntimeConfig
IRuntimeConfig * getRuntimeConfig() const noexcept
Get the runtime config object used during execution context creation.
Definition: NvInferRuntime.h:5194

nvinfer1::IExprBuilder
Object for constructing IDimensionExpr.
Definition: NvInferRuntime.h:287

nvinfer1::IExprBuilder::operation
IDimensionExpr const * operation(DimensionOperation op, IDimensionExpr const &first, IDimensionExpr const &second) noexcept
Get the operation.
Definition: NvInferRuntime.h:303

nvinfer1::IExprBuilder::~IExprBuilder
virtual ~IExprBuilder() noexcept=default

nvinfer1::IExprBuilder::constant
IDimensionExpr const * constant(int64_t value) noexcept
Return pointer to IDimensionExpr for given value.
Definition: NvInferRuntime.h:292

nvinfer1::IExprBuilder::mImpl
apiv::VExprBuilder * mImpl
Definition: NvInferRuntime.h:310

nvinfer1::IExprBuilder::declareSizeTensor
IDimensionExpr const * declareSizeTensor(int32_t outputIndex, IDimensionExpr const &opt, IDimensionExpr const &upper)
Declare a size tensor at the given output index, with the specified auto-tuning formula and upper bou...
Definition: NvInferRuntime.h:338

nvinfer1::IHostMemory
Class to handle library allocated memory that is accessible to the user.
Definition: NvInferRuntime.h:142

nvinfer1::IHostMemory::data
void * data() const noexcept
A pointer to the raw data that is owned by the library.
Definition: NvInferRuntime.h:147

nvinfer1::IHostMemory::type
DataType type() const noexcept
The type of the memory that was allocated.
Definition: NvInferRuntime.h:159

nvinfer1::IHostMemory::size
std::size_t size() const noexcept
The size in bytes of the data that was allocated.
Definition: NvInferRuntime.h:153

nvinfer1::IHostMemory::mImpl
apiv::VHostMemory * mImpl
Definition: NvInferRuntime.h:165

nvinfer1::IHostMemory::~IHostMemory
virtual ~IHostMemory() noexcept=default

nvinfer1::ILoggerFinder
A virtual base class to find a logger. Allows a plugin to find an instance of a logger if it needs to...
Definition: NvInferRuntime.h:5516

nvinfer1::ILoggerFinder::findLogger
virtual ILogger * findLogger()=0
Get the logger used by the engine or execution context which called the plugin method.

nvinfer1::ILoggerFinder::~ILoggerFinder
virtual ~ILoggerFinder()=default

nvinfer1::ILogger
Application-implemented logging interface for the builder, refitter and runtime.
Definition: NvInferRuntime.h:1588

nvinfer1::ILogger::ILogger
ILogger()=default

nvinfer1::ILogger::~ILogger
virtual ~ILogger()=default

nvinfer1::ILogger::Severity
Severity
The severity corresponding to a log message.
Definition: NvInferRuntime.h:1596

nvinfer1::ILogger::log
virtual void log(Severity severity, AsciiChar const *msg) noexcept=0
A callback implemented by the application to handle logging messages;.

nvinfer1::INoCopy
Forward declaration of IEngineInspector for use by other interfaces.
Definition: NvInferRuntime.h:51

nvinfer1::INoCopy::operator=
INoCopy & operator=(INoCopy &&other)=delete

nvinfer1::INoCopy::INoCopy
INoCopy(INoCopy const &other)=delete

nvinfer1::INoCopy::INoCopy
INoCopy(INoCopy &&other)=delete

nvinfer1::INoCopy::INoCopy
INoCopy()=default

nvinfer1::INoCopy::~INoCopy
virtual ~INoCopy()=default

nvinfer1::INoCopy::operator=
INoCopy & operator=(INoCopy const &other)=delete

nvinfer1::IOptimizationProfile
Optimization profile for dynamic input dimensions and shape tensors.
Definition: NvInferRuntime.h:2672

nvinfer1::IOptimizationProfile::getShapeValues
TRT_DEPRECATED int32_t const * getShapeValues(char const *inputName, OptProfileSelector select) const noexcept
Get the minimum / optimum / maximum values for an input shape tensor.
Definition: NvInferRuntime.h:2793

nvinfer1::IOptimizationProfile::mImpl
apiv::VOptimizationProfile * mImpl
Definition: NvInferRuntime.h:2909

nvinfer1::IOptimizationProfile::getDimensions
Dims getDimensions(char const *inputName, OptProfileSelector select) const noexcept
Get the minimum / optimum / maximum dimensions for a dynamic input tensor.
Definition: NvInferRuntime.h:2713

nvinfer1::IOptimizationProfile::setShapeValues
TRT_DEPRECATED bool setShapeValues(char const *inputName, OptProfileSelector select, int32_t const *values, int32_t nbValues) noexcept
Set the minimum / optimum / maximum values for an input shape tensor.
Definition: NvInferRuntime.h:2765

nvinfer1::IOptimizationProfile::~IOptimizationProfile
virtual ~IOptimizationProfile() noexcept=default

nvinfer1::IOptimizationProfile::getExtraMemoryTarget
float getExtraMemoryTarget() const noexcept
Get the extra memory target that has been defined for this profile.
Definition: NvInferRuntime.h:2823

nvinfer1::IOptimizationProfile::setExtraMemoryTarget
bool setExtraMemoryTarget(float target) noexcept
Set a target for extra GPU memory that may be used by this profile.
Definition: NvInferRuntime.h:2811

nvinfer1::IOptimizationProfile::setDimensions
bool setDimensions(char const *inputName, OptProfileSelector select, Dims const &dims) noexcept
Set the minimum / optimum / maximum dimensions for a dynamic input tensor.
Definition: NvInferRuntime.h:2701

nvinfer1::IOptimizationProfile::isValid
bool isValid() const noexcept
Check whether the optimization profile can be passed to an IBuilderConfig object.
Definition: NvInferRuntime.h:2840

nvinfer1::IOptimizationProfile::getShapeValuesV2
int64_t const * getShapeValuesV2(char const *inputName, OptProfileSelector select) const noexcept
Get the minimum / optimum / maximum values for an input shape tensor.
Definition: NvInferRuntime.h:2903

nvinfer1::IOptimizationProfile::setShapeValuesV2
bool setShapeValuesV2(char const *inputName, OptProfileSelector select, int64_t const *values, int32_t nbValues) noexcept
Set the minimum / optimum / maximum values for an input shape tensor.
Definition: NvInferRuntime.h:2890

nvinfer1::IOptimizationProfile::getNbShapeValues
int32_t getNbShapeValues(char const *inputName) const noexcept
Get the number of values for an input shape tensor.
Definition: NvInferRuntime.h:2779

nvinfer1::IPluginRegistry
Single registration point for all plugins in an application. It is used to find plugin implementation...
Definition: NvInferRuntimeCommon.h:56

nvinfer1::IPluginRegistry::registerCreator
virtual TRT_DEPRECATED bool registerCreator(IPluginCreator &creator, AsciiChar const *const pluginNamespace) noexcept=0
Register a plugin creator implementing IPluginCreator. Returns false if any plugin creator with the s...

nvinfer1::IPluginResourceContext
Interface for plugins to access per context resources provided by TensorRT.
Definition: NvInferRuntime.h:813

nvinfer1::IPluginResourceContext::getErrorRecorder
virtual IErrorRecorder * getErrorRecorder() const noexcept=0
Get the error recorder associated with the resource context.

nvinfer1::IPluginResourceContext::operator=
IPluginResourceContext & operator=(IPluginResourceContext const &) &=default

nvinfer1::IPluginResourceContext::getGpuAllocator
virtual IGpuAllocator * getGpuAllocator() const noexcept=0
Get the GPU allocator associated with the resource context.

nvinfer1::IPluginV2DynamicExt
Similar to IPluginV2Ext, but with support for dynamic shapes.
Definition: NvInferRuntime.h:407

nvinfer1::IPluginV2DynamicExt::clone
IPluginV2DynamicExt * clone() const noexcept override=0
Clone the plugin object. This copies over internal plugin parameters as well and returns a new plugin...

nvinfer1::IPluginV2DynamicExt::~IPluginV2DynamicExt
virtual ~IPluginV2DynamicExt() noexcept
Definition: NvInferRuntime.h:558

nvinfer1::IPluginV2Ext
Plugin class for user-implemented layers.
Definition: NvInferRuntimePlugin.h:474

nvinfer1::IRefitter
Updates weights in an engine.
Definition: NvInferRuntime.h:2264

nvinfer1::IRefitter::refitCudaEngineAsync
bool refitCudaEngineAsync(cudaStream_t stream) noexcept
Enqueue weights refitting of the associated engine on the given stream.
Definition: NvInferRuntime.h:2594

nvinfer1::IRefitter::getMaxThreads
int32_t getMaxThreads() const noexcept
get the maximum number of threads that can be used by the refitter.
Definition: NvInferRuntime.h:2473

nvinfer1::IRefitter::getWeightsLocation
TensorLocation getWeightsLocation(char const *weightsName) const noexcept
Get location for the weights associated with the given name.
Definition: NvInferRuntime.h:2532

nvinfer1::IRefitter::setNamedWeights
bool setNamedWeights(char const *name, Weights weights) noexcept
Specify new weights of given name.
Definition: NvInferRuntime.h:2397

nvinfer1::IRefitter::getAllWeights
int32_t getAllWeights(int32_t size, char const **weightsNames) noexcept
Get names of all weights that could be refit.
Definition: NvInferRuntime.h:2433

nvinfer1::IRefitter::getLogger
ILogger * getLogger() const noexcept
get the logger with which the refitter was created
Definition: NvInferRuntime.h:2443

nvinfer1::IRefitter::refitCudaEngine
bool refitCudaEngine() noexcept
Refits associated engine.
Definition: NvInferRuntime.h:2300

nvinfer1::IRefitter::getMissingWeights
int32_t getMissingWeights(int32_t size, char const **weightsNames) noexcept
Get names of missing weights.
Definition: NvInferRuntime.h:2417

nvinfer1::IRefitter::getMissing
int32_t getMissing(int32_t size, char const **layerNames, WeightsRole *roles) noexcept
Get description of missing weights.
Definition: NvInferRuntime.h:2321

nvinfer1::IRefitter::getNamedWeights
Weights getNamedWeights(char const *weightsName) const noexcept
Get weights associated with the given name.
Definition: NvInferRuntime.h:2516

nvinfer1::IRefitter::unsetNamedWeights
bool unsetNamedWeights(char const *weightsName) noexcept
Unset weights associated with the given name.
Definition: NvInferRuntime.h:2548

nvinfer1::IRefitter::getWeightsPrototype
Weights getWeightsPrototype(char const *weightsName) const noexcept
Get the Weights prototype associated with the given name.
Definition: NvInferRuntime.h:2612

nvinfer1::IRefitter::setMaxThreads
bool setMaxThreads(int32_t maxThreads) noexcept
Set the maximum number of threads.
Definition: NvInferRuntime.h:2459

nvinfer1::IRefitter::setNamedWeights
bool setNamedWeights(char const *name, Weights weights, TensorLocation location) noexcept
Specify new weights on a specified device of given name.
Definition: NvInferRuntime.h:2500

nvinfer1::IRefitter::setWeightsValidation
void setWeightsValidation(bool weightsValidation) noexcept
Set whether to validate weights during refitting.
Definition: NvInferRuntime.h:2564

nvinfer1::IRefitter::mImpl
apiv::VRefitter * mImpl
Definition: NvInferRuntime.h:2618

nvinfer1::IRefitter::getAll
int32_t getAll(int32_t size, char const **layerNames, WeightsRole *roles) noexcept
Get description of all weights that could be refit.
Definition: NvInferRuntime.h:2338

nvinfer1::IRefitter::~IRefitter
virtual ~IRefitter() noexcept=default

nvinfer1::IRefitter::getWeightsValidation
bool getWeightsValidation() const noexcept
Get whether to validate weights values during refitting.
Definition: NvInferRuntime.h:2572

nvinfer1::IRefitter::setErrorRecorder
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:2357

nvinfer1::IRefitter::getErrorRecorder
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:2372

nvinfer1::IRuntimeCache
A class for Runtime cache currently used for TensorRT JIT compilation. This cache can be serialized a...
Definition: NvInferRuntime.h:3129

nvinfer1::IRuntimeCache::~IRuntimeCache
virtual ~IRuntimeCache() noexcept=default

nvinfer1::IRuntimeCache::deserialize
bool deserialize(void const *blob, size_t size) noexcept
Deserialize the Runtime cache from a stream that contains serialized Runtime cache.
Definition: NvInferRuntime.h:3149

nvinfer1::IRuntimeCache::reset
bool reset() noexcept
Reset the Runtime cache. Clears all content within the cache.
Definition: NvInferRuntime.h:3157

nvinfer1::IRuntimeCache::mImpl
apiv::VRuntimeCache * mImpl
Definition: NvInferRuntime.h:3163

nvinfer1::IRuntimeConfig
A class for runtime configuration. This class is used during execution context creation.
Definition: NvInferRuntime.h:3252

nvinfer1::IRuntimeConfig::setCudaGraphStrategy
bool setCudaGraphStrategy(CudaGraphStrategy strategy) noexcept
Set the strategy used for CUDA graphs for JIT (Just-In-Time) inference. Default is kDISABLED.
Definition: NvInferRuntime.h:3346

nvinfer1::IRuntimeConfig::getDynamicShapesKernelSpecializationStrategy
DynamicShapesKernelSpecializationStrategy getDynamicShapesKernelSpecializationStrategy() const noexcept
Return the dynamic shape specialization strategy of this config.
Definition: NvInferRuntime.h:3322

nvinfer1::IRuntimeConfig::~IRuntimeConfig
virtual ~IRuntimeConfig() noexcept=default

nvinfer1::IRuntimeConfig::mImpl
apiv::VRuntimeConfig * mImpl
Definition: NvInferRuntime.h:3362

nvinfer1::IRuntimeConfig::createRuntimeCache
IRuntimeCache * createRuntimeCache() const noexcept
Create an empty Runtime cache.
Definition: NvInferRuntime.h:3281

nvinfer1::IRuntimeConfig::getExecutionContextAllocationStrategy
ExecutionContextAllocationStrategy getExecutionContextAllocationStrategy() const noexcept
Get the execution context allocation strategy.
Definition: NvInferRuntime.h:3271

nvinfer1::IRuntimeConfig::setRuntimeCache
bool setRuntimeCache(IRuntimeCache const &cache) noexcept
Set Runtime cache to the runtime config. Enables Runtime caching.
Definition: NvInferRuntime.h:3291

nvinfer1::IRuntimeConfig::setDynamicShapesKernelSpecializationStrategy
void setDynamicShapesKernelSpecializationStrategy(DynamicShapesKernelSpecializationStrategy dynamicShapesKernelSpecializationStrategy) noexcept
Set the dynamic shape kernel specialization strategy for this config.
Definition: NvInferRuntime.h:3311

nvinfer1::IRuntimeConfig::getRuntimeCache
IRuntimeCache * getRuntimeCache() const noexcept
Get the Runtime cache from the runtime config.
Definition: NvInferRuntime.h:3301

nvinfer1::IRuntimeConfig::getCudaGraphStrategy
CudaGraphStrategy getCudaGraphStrategy() const noexcept
Return the strategy used for CUDA graphs for JIT (Just-In-Time) inference.
Definition: NvInferRuntime.h:3356

nvinfer1::IRuntime
Allows a serialized functionally unsafe engine to be deserialized.
Definition: NvInferRuntime.h:1921

nvinfer1::IRuntime::setMaxThreads
bool setMaxThreads(int32_t maxThreads) noexcept
Set the maximum number of threads.
Definition: NvInferRuntime.h:2070

nvinfer1::IRuntime::loadRuntime
IRuntime * loadRuntime(char const *path) noexcept
Load IRuntime from the file.
Definition: NvInferRuntime.h:2186

nvinfer1::IRuntime::getEngineHostCodeAllowed
bool getEngineHostCodeAllowed() const noexcept
Get whether the runtime is allowed to deserialize engines with host executable code.
Definition: NvInferRuntime.h:2208

nvinfer1::IRuntime::getEngineHeaderSize
int64_t getEngineHeaderSize() const noexcept
Get size of engine header in bytes.
Definition: NvInferRuntime.h:2220

nvinfer1::IRuntime::getTempfileControlFlags
TempfileControlFlags getTempfileControlFlags() const noexcept
Get the tempfile control flags for this runtime.
Definition: NvInferRuntime.h:2158

nvinfer1::IRuntime::setEngineHostCodeAllowed
void setEngineHostCodeAllowed(bool allowed) noexcept
Set whether the runtime is allowed to deserialize engines with host executable code.
Definition: NvInferRuntime.h:2198

nvinfer1::IRuntime::~IRuntime
virtual ~IRuntime() noexcept=default

nvinfer1::IRuntime::setTemporaryDirectory
void setTemporaryDirectory(char const *path) noexcept
Set the directory that will be used by this runtime for temporary files.
Definition: NvInferRuntime.h:2119

nvinfer1::IRuntime::getPluginRegistry
IPluginRegistry & getPluginRegistry() noexcept
Get the local plugin registry that can be used by the runtime.
Definition: NvInferRuntime.h:2168

nvinfer1::IRuntime::mImpl
apiv::VRuntime * mImpl
Definition: NvInferRuntime.h:2253

nvinfer1::IRuntime::getNbDLACores
int32_t getNbDLACores() const noexcept
Returns number of DLA hardware cores accessible or 0 if DLA is unavailable.
Definition: NvInferRuntime.h:1954

nvinfer1::IRuntime::getEngineValidity
EngineValidity getEngineValidity(void const *blob, int64_t blobSize, uint64_t *diagnostics) const noexcept
Check for engine validity by inspecting the serialized engine header.
Definition: NvInferRuntime.h:2247

nvinfer1::IRuntime::deserializeCudaEngine
ICudaEngine * deserializeCudaEngine(void const *blob, std::size_t size) noexcept
Deserialize an engine from host memory.
Definition: NvInferRuntime.h:2022

nvinfer1::IRuntime::setTempfileControlFlags
void setTempfileControlFlags(TempfileControlFlags flags) noexcept
Set the tempfile control flags for this runtime.
Definition: NvInferRuntime.h:2146

nvinfer1::IRuntime::getDLACore
int32_t getDLACore() const noexcept
Get the DLA core that the engine executes on.
Definition: NvInferRuntime.h:1946

nvinfer1::IRuntime::setGpuAllocator
void setGpuAllocator(IGpuAllocator *allocator) noexcept
Set the GPU allocator.
Definition: NvInferRuntime.h:1970

nvinfer1::IRuntime::getErrorRecorder
IErrorRecorder * getErrorRecorder() const noexcept
get the ErrorRecorder assigned to this interface.
Definition: NvInferRuntime.h:2004

nvinfer1::IRuntime::deserializeCudaEngine
ICudaEngine * deserializeCudaEngine(IStreamReaderV2 &streamReader)
Deserialize an engine from a stream. IStreamReaderV2 is expected to support reading to both host and ...
Definition: NvInferRuntime.h:2045

nvinfer1::IRuntime::getLogger
ILogger * getLogger() const noexcept
get the logger with which the runtime was created
Definition: NvInferRuntime.h:2055

nvinfer1::IRuntime::getMaxThreads
int32_t getMaxThreads() const noexcept
Get the maximum number of threads that can be used by the runtime.
Definition: NvInferRuntime.h:2084

nvinfer1::IRuntime::getTemporaryDirectory
char const * getTemporaryDirectory() const noexcept
Get the directory that will be used by this runtime for temporary files.
Definition: NvInferRuntime.h:2130

nvinfer1::IRuntime::setErrorRecorder
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInferRuntime.h:1989

nvinfer1::ISerializationConfig
Holds properties for configuring an engine to serialize the binary.
Definition: NvInferRuntime.h:3020

nvinfer1::ISerializationConfig::~ISerializationConfig
virtual ~ISerializationConfig() noexcept=default

nvinfer1::ISerializationConfig::clearFlag
bool clearFlag(SerializationFlag serializationFlag) noexcept
clear a serialization flag.
Definition: NvInferRuntime.h:3059

nvinfer1::ISerializationConfig::setFlag
bool setFlag(SerializationFlag serializationFlag) noexcept
Set a serialization flag.
Definition: NvInferRuntime.h:3071

nvinfer1::ISerializationConfig::getFlags
SerializationFlags getFlags() const noexcept
Get the serialization flags for this config.
Definition: NvInferRuntime.h:3047

nvinfer1::ISerializationConfig::getFlag
bool getFlag(SerializationFlag serializationFlag) const noexcept
Returns true if the serialization flag is set.
Definition: NvInferRuntime.h:3083

nvinfer1::ISerializationConfig::mImpl
apiv::VSerializationConfig * mImpl
Definition: NvInferRuntime.h:3089

nvinfer1::IVersionedInterface
An Interface class for version control.
Definition: NvInferRuntimeBase.h:278

nvinfer1::InterfaceInfo
Version information associated with a TRT interface.
Definition: NvInferRuntimeBase.h:243

nvinfer1::PluginRegistrar
Register the plugin creator to the registry The static registry object will be instantiated when the ...
Definition: NvInferRuntime.h:5488

nvinfer1::PluginRegistrar::PluginRegistrar
PluginRegistrar()
Definition: NvInferRuntime.h:5490

nvinfer1::Weights
An array of weights used as a layer parameter.
Definition: NvInferRuntime.h:124

nvinfer1::Weights::type
DataType type
The type of the weights.
Definition: NvInferRuntime.h:126

nvinfer1::Weights::count
int64_t count
The number of weights in the array.
Definition: NvInferRuntime.h:128

nvinfer1::Weights::values
void const  * values
The weight values, in a contiguous array.
Definition: NvInferRuntime.h:127

nvinfer1::v_1_0::IDebugListener
Definition: NvInferRuntime.h:4298

nvinfer1::v_1_0::IDebugListener::processDebugTensor
virtual bool processDebugTensor(void const *addr, TensorLocation location, DataType type, Dims const &shape, char const *name, cudaStream_t stream)=0
Callback function that is called when a debug tensor’s value is updated and the debug state of the te...

nvinfer1::v_1_0::IDebugListener::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:4303

nvinfer1::v_1_0::IDebugListener::~IDebugListener
~IDebugListener() override=default

nvinfer1::v_1_0::IErrorRecorder
Definition: NvInferRuntimeBase.h:415

nvinfer1::v_1_0::IGpuAllocator
Definition: NvInferRuntime.h:1656

nvinfer1::v_1_0::IGpuAllocator::allocateAsync
virtual void * allocateAsync(uint64_t const size, uint64_t const alignment, AllocatorFlags const flags, cudaStream_t) noexcept
A thread-safe callback implemented by the application to handle stream-ordered acquisition of GPU mem...
Definition: NvInferRuntime.h:1778

nvinfer1::v_1_0::IGpuAllocator::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:1819

nvinfer1::v_1_0::IGpuAllocator::deallocate
virtual TRT_DEPRECATED bool deallocate(void *const memory) noexcept=0
A thread-safe callback implemented by the application to handle release of GPU memory.

nvinfer1::v_1_0::IGpuAllocator::~IGpuAllocator
~IGpuAllocator() override=default

nvinfer1::v_1_0::IGpuAllocator::IGpuAllocator
IGpuAllocator()=default

nvinfer1::v_1_0::IGpuAllocator::reallocate
virtual void * reallocate(void *const, uint64_t, uint64_t) noexcept
A thread-safe callback implemented by the application to resize an existing allocation.
Definition: NvInferRuntime.h:1725

nvinfer1::v_1_0::IGpuAllocator::allocate
virtual TRT_DEPRECATED void * allocate(uint64_t const size, uint64_t const alignment, AllocatorFlags const flags) noexcept=0
A thread-safe callback implemented by the application to handle acquisition of GPU memory.

nvinfer1::v_1_0::IGpuAllocator::deallocateAsync
virtual bool deallocateAsync(void *const memory, cudaStream_t) noexcept
A thread-safe callback implemented by the application to handle stream-ordered release of GPU memory.
Definition: NvInferRuntime.h:1811

nvinfer1::v_1_0::IGpuAsyncAllocator
Definition: NvInferRuntime.h:5537

nvinfer1::v_1_0::IGpuAsyncAllocator::deallocateAsync
bool deallocateAsync(void *const memory, cudaStream_t) noexcept override=0
A thread-safe callback implemented by the application to handle stream-ordered asynchronous release o...

nvinfer1::v_1_0::IGpuAsyncAllocator::IGpuAsyncAllocator
IGpuAsyncAllocator()=default

nvinfer1::v_1_0::IGpuAsyncAllocator::allocateAsync
void * allocateAsync(uint64_t const size, uint64_t const alignment, AllocatorFlags const flags, cudaStream_t) noexcept override=0
A thread-safe callback implemented by the application to handle stream-ordered asynchronous acquisiti...

nvinfer1::v_1_0::IGpuAsyncAllocator::allocate
TRT_DEPRECATED void * allocate(uint64_t const size, uint64_t const alignment, AllocatorFlags const flags) noexcept override
A thread-safe callback implemented by the application to handle acquisition of GPU memory.
Definition: NvInferRuntime.h:5624

nvinfer1::v_1_0::IGpuAsyncAllocator::deallocate
TRT_DEPRECATED bool deallocate(void *const memory) noexcept override
A thread-safe callback implemented by the application to handle release of GPU memory.
Definition: NvInferRuntime.h:5648

nvinfer1::v_1_0::IGpuAsyncAllocator::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:5656

nvinfer1::v_1_0::IGpuAsyncAllocator::~IGpuAsyncAllocator
~IGpuAsyncAllocator() override=default

nvinfer1::v_1_0::IOutputAllocator
Definition: NvInferRuntime.h:4236

nvinfer1::v_1_0::IOutputAllocator::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:4241

nvinfer1::v_1_0::IOutputAllocator::reallocateOutputAsync
virtual void * reallocateOutputAsync(char const *tensorName, void *currentMemory, uint64_t size, uint64_t alignment, cudaStream_t)
Return a pointer to memory for an output tensor, or nullptr if memory cannot be allocated....
Definition: NvInferRuntime.h:4268

nvinfer1::v_1_0::IOutputAllocator::notifyShape
virtual void notifyShape(char const *tensorName, Dims const &dims) noexcept=0
Called by TensorRT when the shape of the output tensor is known.

nvinfer1::v_1_0::IPluginCapability
Definition: NvInferPluginBase.h:141

nvinfer1::v_1_0::IPluginCreatorInterface
Definition: NvInferPluginBase.h:193

nvinfer1::v_1_0::IPluginCreatorV3One
Definition: NvInferRuntime.h:5663

nvinfer1::v_1_0::IPluginCreatorV3One::getFieldNames
virtual PluginFieldCollection const * getFieldNames() noexcept=0
Return a list of fields that need to be passed to createPlugin() when creating a plugin for use in th...

nvinfer1::v_1_0::IPluginCreatorV3One::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:5668

nvinfer1::v_1_0::IPluginCreatorV3One::createPlugin
virtual IPluginV3 * createPlugin(AsciiChar const *name, PluginFieldCollection const *fc, TensorRTPhase phase) noexcept=0
Return a plugin object. Return nullptr in case of error.

nvinfer1::v_1_0::IPluginV3
Definition: NvInferPluginBase.h:206

nvinfer1::v_1_0::IPluginV3OneBuild
Definition: NvInferRuntime.h:882

nvinfer1::v_1_0::IPluginV3OneBuild::getFormatCombinationLimit
virtual int32_t getFormatCombinationLimit() noexcept
Return the maximum number of format combinations that will be timed by TensorRT during the build phas...
Definition: NvInferRuntime.h:1086

nvinfer1::v_1_0::IPluginV3OneBuild::getNbOutputs
virtual int32_t getNbOutputs() const noexcept=0
Get the number of outputs from the plugin.

nvinfer1::v_1_0::IPluginV3OneBuild::configurePlugin
virtual int32_t configurePlugin(DynamicPluginTensorDesc const *in, int32_t nbInputs, DynamicPluginTensorDesc const *out, int32_t nbOutputs) noexcept=0
Configure the plugin.

nvinfer1::v_1_0::IPluginV3OneBuild::getNbTactics
virtual int32_t getNbTactics() noexcept
Query for the number of custom tactics the plugin intends to use.
Definition: NvInferRuntime.h:1062

nvinfer1::v_1_0::IPluginV3OneBuild::getMetadataString
virtual char const * getMetadataString() noexcept
Query for a string representing the configuration of the plugin. May be called anytime after plugin c...
Definition: NvInferRuntime.h:1097

nvinfer1::v_1_0::IPluginV3OneBuild::getTimingCacheID
virtual char const * getTimingCacheID() noexcept
Called to query the suffix to use for the timing cache ID. May be called anytime after plugin creatio...
Definition: NvInferRuntime.h:1078

nvinfer1::v_1_0::IPluginV3OneBuild::supportsFormatCombination
virtual bool supportsFormatCombination(int32_t pos, DynamicPluginTensorDesc const *inOut, int32_t nbInputs, int32_t nbOutputs) noexcept=0
Return true if plugin supports the format and datatype for the input/output indexed by pos.

nvinfer1::v_1_0::IPluginV3OneBuild::getOutputDataTypes
virtual int32_t getOutputDataTypes(DataType *outputTypes, int32_t nbOutputs, const DataType *inputTypes, int32_t nbInputs) const noexcept=0
Provide the data types of the plugin outputs if the input tensors have the data types provided.

nvinfer1::v_1_0::IPluginV3OneBuild::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:894

nvinfer1::v_1_0::IPluginV3OneBuild::getOutputShapes
virtual int32_t getOutputShapes(DimsExprs const *inputs, int32_t nbInputs, DimsExprs const *shapeInputs, int32_t nbShapeInputs, DimsExprs *outputs, int32_t nbOutputs, IExprBuilder &exprBuilder) noexcept=0
Provide expressions for computing dimensions of the output tensors from dimensions of the input tenso...

nvinfer1::v_1_0::IPluginV3OneBuild::getValidTactics
virtual int32_t getValidTactics(int32_t *tactics, int32_t nbTactics) noexcept
Query for any custom tactics that the plugin intends to use.
Definition: NvInferRuntime.h:1054

nvinfer1::v_1_0::IPluginV3OneCore
Definition: NvInferRuntime.h:839

nvinfer1::v_1_0::IPluginV3OneCore::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:844

nvinfer1::v_1_0::IPluginV3OneCore::getPluginName
virtual AsciiChar const * getPluginName() const noexcept=0
Return the plugin name. Should match the plugin name returned by the corresponding plugin creator.

nvinfer1::v_1_0::IPluginV3OneRuntime
Definition: NvInferRuntime.h:1104

nvinfer1::v_1_0::IPluginV3OneRuntime::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:1109

nvinfer1::v_1_0::IPluginV3OneRuntime::onShapeChange
virtual int32_t onShapeChange(PluginTensorDesc const *in, int32_t nbInputs, PluginTensorDesc const *out, int32_t nbOutputs) noexcept=0
Called when a plugin is being prepared for execution for specific dimensions. This could happen multi...

nvinfer1::v_1_0::IPluginV3OneRuntime::getFieldsToSerialize
virtual PluginFieldCollection const * getFieldsToSerialize() noexcept=0
Get the plugin fields which should be serialized.

nvinfer1::v_1_0::IPluginV3OneRuntime::setTactic
virtual int32_t setTactic(int32_t tactic) noexcept
Set the tactic to be used in the subsequent call to enqueue(). If no custom tactics were advertised,...
Definition: NvInferRuntime.h:1121

nvinfer1::v_1_0::IPluginV3OneRuntime::enqueue
virtual int32_t enqueue(PluginTensorDesc const *inputDesc, PluginTensorDesc const *outputDesc, void const *const *inputs, void *const *outputs, void *workspace, cudaStream_t stream) noexcept=0
Execute the layer.

nvinfer1::v_1_0::IPluginV3OneRuntime::attachToContext
virtual IPluginV3 * attachToContext(IPluginResourceContext *context) noexcept=0
Clone the plugin, attach the cloned plugin object to a execution context and grant the cloned plugin ...

nvinfer1::v_1_0::IProfiler
Definition: NvInferRuntime.h:1292

nvinfer1::v_1_0::IProfiler::~IProfiler
virtual ~IProfiler() noexcept
Definition: NvInferRuntime.h:1303

nvinfer1::v_1_0::IProfiler::reportLayerTime
virtual void reportLayerTime(char const *layerName, float ms) noexcept=0
Layer time reporting callback.

nvinfer1::v_1_0::IStreamReader
Definition: NvInferRuntime.h:631

nvinfer1::v_1_0::IStreamReader::~IStreamReader
~IStreamReader() override=default

nvinfer1::v_1_0::IStreamReader::operator=
IStreamReader & operator=(IStreamReader const &) &=default

nvinfer1::v_1_0::IStreamReader::operator=
IStreamReader & operator=(IStreamReader &&) &=default

nvinfer1::v_1_0::IStreamReader::read
virtual int64_t read(void *destination, int64_t nbBytes)=0
Read the next number of bytes in the stream.

nvinfer1::v_1_0::IStreamReader::IStreamReader
IStreamReader(IStreamReader &&)=default

nvinfer1::v_1_0::IStreamReader::IStreamReader
IStreamReader(IStreamReader const &)=default

nvinfer1::v_1_0::IStreamReader::IStreamReader
IStreamReader()=default

nvinfer1::v_1_0::IStreamReader::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:643

nvinfer1::v_1_0::IStreamReaderV2
Definition: NvInferRuntime.h:741

nvinfer1::v_1_0::IStreamReaderV2::operator=
IStreamReaderV2 & operator=(IStreamReaderV2 const &) &=default

nvinfer1::v_1_0::IStreamReaderV2::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:753

nvinfer1::v_1_0::IStreamReaderV2::IStreamReaderV2
IStreamReaderV2(IStreamReaderV2 &&)=default

nvinfer1::v_1_0::IStreamReaderV2::~IStreamReaderV2
~IStreamReaderV2() override=default

nvinfer1::v_1_0::IStreamReaderV2::read
virtual int64_t read(void *destination, int64_t nbBytes, cudaStream_t stream) noexcept=0
Read the next number of bytes in the stream asynchronously.

nvinfer1::v_1_0::IStreamReaderV2::IStreamReaderV2
IStreamReaderV2()=default

nvinfer1::v_1_0::IStreamReaderV2::IStreamReaderV2
IStreamReaderV2(IStreamReaderV2 const &)=default

nvinfer1::v_1_0::IStreamReaderV2::seek
virtual bool seek(int64_t offset, SeekPosition where) noexcept=0
Sets the position of the stream to the given offset.

nvinfer1::v_1_0::IStreamReaderV2::operator=
IStreamReaderV2 & operator=(IStreamReaderV2 &&) &=default

nvinfer1::v_1_0::IStreamWriter
Definition: NvInferRuntime.h:666

nvinfer1::v_1_0::IStreamWriter::operator=
IStreamWriter & operator=(IStreamWriter const &) &=default

nvinfer1::v_1_0::IStreamWriter::IStreamWriter
IStreamWriter(IStreamWriter &&)=default

nvinfer1::v_1_0::IStreamWriter::write
virtual int64_t write(void const *data, int64_t nbBytes)=0
write nbBytes of data into the stream.

nvinfer1::v_1_0::IStreamWriter::IStreamWriter
IStreamWriter(IStreamWriter const &)=default

nvinfer1::v_1_0::IStreamWriter::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept final
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:678

nvinfer1::v_1_0::IStreamWriter::IStreamWriter
IStreamWriter()=default

nvinfer1::v_1_0::IStreamWriter::operator=
IStreamWriter & operator=(IStreamWriter &&) &=default

nvinfer1::v_1_0::IStreamWriter::~IStreamWriter
~IStreamWriter() override=default

nvinfer1::v_2_0::IPluginV3OneBuild
Definition: NvInferRuntime.h:1201

nvinfer1::v_2_0::IPluginV3OneBuild::getAliasedInput
virtual int32_t getAliasedInput(int32_t outputIndex) noexcept
Communicates to TensorRT that the output at the specified output index is aliased to the input at the...
Definition: NvInferRuntime.h:1237

nvinfer1::v_2_0::IPluginV3OneBuild::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInferRuntime.h:1203

nvinfer1::anonymous_namespace{NvInferRuntime.h}::createInferRefitter
IRefitter * createInferRefitter(ICudaEngine &engine, ILogger &logger) noexcept
Create an instance of an IRefitter class.
Definition: NvInferRuntime.h:5468

nvinfer1::anonymous_namespace{NvInferRuntime.h}::createInferRuntime
IRuntime * createInferRuntime(ILogger &logger) noexcept
Create an instance of an IRuntime class.
Definition: NvInferRuntime.h:5457

nvinfer1
The TensorRT API version 1 namespace.
Definition: NvInferPluginBase.h:29

nvinfer1::ErrorCode::kINTERNAL_ERROR
@ kINTERNAL_ERROR

nvinfer1::TacticSources
uint32_t TacticSources
Represents a collection of one or more TacticSource values combine using bitwise-OR operations.
Definition: NvInferRuntime.h:2958

nvinfer1::IOutputAllocator
v_1_0::IOutputAllocator IOutputAllocator
Definition: NvInferRuntime.h:4293

nvinfer1::EngineCapability
EngineCapability
List of supported engine capability flows.
Definition: NvInferRuntime.h:76

nvinfer1::EngineCapability::kSAFETY
@ kSAFETY

nvinfer1::EngineCapability::kSTANDARD
@ kSTANDARD

nvinfer1::EngineCapability::kDLA_STANDALONE
@ kDLA_STANDALONE

nvinfer1::DimensionOperation
DimensionOperation
An operation on two IDimensionExpr, which represent integer expressions used in dimension computation...
Definition: NvInferRuntime.h:179

nvinfer1::DimensionOperation::kSUB
@ kSUB
Substract the second element from the first.

nvinfer1::DimensionOperation::kSUM
@ kSUM
Sum of the two operands.

nvinfer1::DimensionOperation::kPROD
@ kPROD
Product of the two operands.

nvinfer1::DimensionOperation::kFLOOR_DIV
@ kFLOOR_DIV
Floor division of the first element by the second.

nvinfer1::DimensionOperation::kEQUAL
@ kEQUAL
1 if operands are equal, 0 otherwise.

nvinfer1::DimensionOperation::kMIN
@ kMIN
Minimum of the two operands.

nvinfer1::DimensionOperation::kLESS
@ kLESS
1 if first operand is less than second operand, 0 otherwise.

nvinfer1::DimensionOperation::kMAX
@ kMAX
Maximum of the two operands.

nvinfer1::DimensionOperation::kCEIL_DIV
@ kCEIL_DIV
Division rounding up.

nvinfer1::IPluginV3OneCore
v_1_0::IPluginV3OneCore IPluginV3OneCore
Definition: NvInferRuntime.h:1254

nvinfer1::EngineInvalidityDiagnostics
EngineInvalidityDiagnostics
Bitmask indicating the reason(s) why an engine is invalid.
Definition: NvInferRuntime.h:1889

nvinfer1::EngineInvalidityDiagnostics::kUNSUPPORTED_CC
@ kUNSUPPORTED_CC
Unsupported compute capability on current system.

nvinfer1::EngineInvalidityDiagnostics::kMALFORMED_ENGINE
@ kMALFORMED_ENGINE
Serialized engine does not conform to the expected format.

nvinfer1::EngineInvalidityDiagnostics::kINSUFFICIENT_GPU_MEMORY
@ kINSUFFICIENT_GPU_MEMORY
Insufficient GPU memory to hold all engine weights.

nvinfer1::EngineInvalidityDiagnostics::kCUDA_ERROR
@ kCUDA_ERROR
Incorrect installation of the CUDA driver or runtime.

nvinfer1::EngineInvalidityDiagnostics::kOLD_CUDA_DRIVER
@ kOLD_CUDA_DRIVER
CUDA driver too old (driver downgrade compared to when engine was built).

nvinfer1::EngineInvalidityDiagnostics::kOLD_CUDA_RUNTIME
@ kOLD_CUDA_RUNTIME
CUDA runtime too old (runtime downgrade compared to when engine was built).

nvinfer1::EngineInvalidityDiagnostics::kVERSION_MISMATCH
@ kVERSION_MISMATCH
TensorRT-RTX version mismatch to when engine was built.

nvinfer1::TensorIOMode
TensorIOMode
Definition of tensor IO Mode.
Definition: NvInferRuntimeBase.h:658

nvinfer1::TensorIOMode::kNONE
@ kNONE
Tensor is not an input or output.

nvinfer1::HardwareCompatibilityLevel
HardwareCompatibilityLevel
Describes requirements of compatibility with GPU architectures other than that of the GPU on which th...
Definition: NvInfer.h:9499

nvinfer1::SerializationFlag
SerializationFlag
List of valid flags that the engine can enable when serializing the bytes.
Definition: NvInferRuntime.h:2999

nvinfer1::SerializationFlag::kEXCLUDE_WEIGHTS
@ kEXCLUDE_WEIGHTS
Exclude the weights that can be refitted.

nvinfer1::SerializationFlag::kINCLUDE_REFIT
@ kINCLUDE_REFIT
Remain refittable if originally so.

nvinfer1::EnumMax< DynamicShapesKernelSpecializationStrategy >
constexpr int32_t EnumMax< DynamicShapesKernelSpecializationStrategy >() noexcept
Maximum number of dynamic shape specialization strategies in DynamicShapesKernelSpecializationStrateg...
Definition: NvInferRuntime.h:3204

nvinfer1::IStreamWriter
v_1_0::IStreamWriter IStreamWriter
Definition: NvInferRuntime.h:720

nvinfer1::IProfiler
v_1_0::IProfiler IProfiler
Definition: NvInferRuntime.h:1318

nvinfer1::DynamicShapesKernelSpecializationStrategy
DynamicShapesKernelSpecializationStrategy
Different kernel specialization strategies for dynamic shapes.
Definition: NvInferRuntime.h:3178

nvinfer1::DynamicShapesKernelSpecializationStrategy::kEAGER
@ kEAGER

nvinfer1::DynamicShapesKernelSpecializationStrategy::kLAZY
@ kLAZY

nvinfer1::SeekPosition
SeekPosition
Controls the seek mode of IStreamReaderV2.
Definition: NvInferRuntime.h:727

nvinfer1::SeekPosition::kSET
@ kSET
From the beginning of the file.

nvinfer1::SeekPosition::kCUR
@ kCUR
From the current position of the file.

nvinfer1::SeekPosition::kEND
@ kEND
From the tail of the file.

nvinfer1::IStreamReaderV2
v_1_0::IStreamReaderV2 IStreamReaderV2
Definition: NvInferRuntime.h:797

nvinfer1::TempfileControlFlags
uint32_t TempfileControlFlags
Represents a collection of one or more TempfileControlFlag values combined using bitwise-OR operation...
Definition: NvInferRuntime.h:1396

nvinfer1::EngineStat
EngineStat
The kind of engine statistics that queried from the ICudaEngine.
Definition: NvInferRuntime.h:3374

nvinfer1::EngineStat::kTOTAL_WEIGHTS_SIZE
@ kTOTAL_WEIGHTS_SIZE
Return the total weight size in bytes.

nvinfer1::EngineStat::kSTRIPPED_WEIGHTS_SIZE
@ kSTRIPPED_WEIGHTS_SIZE
Return the stripped weight size in bytes for engines built with BuilderFlag::kSTRIP_PLAN.

nvinfer1::CudaGraphStrategy
CudaGraphStrategy
Strategies available for CUDA graphs optimizations for JIT (Just-In-Time) inference.
Definition: NvInferRuntime.h:3217

nvinfer1::CudaGraphStrategy::kDISABLED
@ kDISABLED

nvinfer1::CudaGraphStrategy::kWHOLE_GRAPH_CAPTURE
@ kWHOLE_GRAPH_CAPTURE

nvinfer1::IGpuAllocator
v_1_0::IGpuAllocator IGpuAllocator
Definition: NvInferRuntime.h:1855

nvinfer1::EngineValidity
EngineValidity
Whether a TensorRT-RTX engine is likely to be valid on the current system.
Definition: NvInferRuntime.h:1863

nvinfer1::EngineValidity::kINVALID
@ kINVALID
Engine is invalid on the current system.

nvinfer1::EngineValidity::kSUBOPTIMAL
@ kSUBOPTIMAL
Engine is likely to be valid on the current system, but may show reduced performance.

nvinfer1::EngineValidity::kVALID
@ kVALID
Engine is likely to be valid on the current system, based on the information in the header.

nvinfer1::EnumMax< WeightsRole >
constexpr int32_t EnumMax< WeightsRole >() noexcept
Maximum number of elements in WeightsRole enum.
Definition: NvInferRuntime.h:1339

nvinfer1::AsciiChar
char_t AsciiChar
Definition: NvInferRuntimeBase.h:115

nvinfer1::TensorRTPhase
TensorRTPhase
Indicates a phase of operation of TensorRT.
Definition: NvInferPluginBase.h:116

nvinfer1::PluginVersion::kV2_DYNAMICEXT
@ kV2_DYNAMICEXT
IPluginV2DynamicExt.

nvinfer1::EnumMax< EngineStat >
constexpr int32_t EnumMax< EngineStat >() noexcept
Maximum number of engine statistic kinds in EngineStat enum.
Definition: NvInferRuntime.h:3388

nvinfer1::EnumMax< LayerInformationFormat >
constexpr int32_t EnumMax< LayerInformationFormat >() noexcept
Definition: NvInferRuntime.h:5281

nvinfer1::DataType
DataType
The type of weights and tensors. The datatypes other than kBOOL, kINT32, and kINT64 are "activation d...
Definition: NvInferRuntimeBase.h:145

nvinfer1::DeviceType
DeviceType
The device that this layer/network will execute on.
Definition: NvInferRuntime.h:1350

nvinfer1::DeviceType::kGPU
@ kGPU
GPU Device.

nvinfer1::DeviceType::kDLA
@ kDLA
DLA Core.

nvinfer1::LayerType::kSCALE
@ kSCALE
Scale layer.

nvinfer1::LayerType::kCONSTANT
@ kCONSTANT
Constant layer.

nvinfer1::IDebugListener
v_1_0::IDebugListener IDebugListener
Definition: NvInferRuntime.h:4334

nvinfer1::TempfileControlFlag
TempfileControlFlag
Flags used to control TensorRT's behavior when creating executable temporary files.
Definition: NvInferRuntime.h:1373

nvinfer1::TempfileControlFlag::kALLOW_TEMPORARY_FILES
@ kALLOW_TEMPORARY_FILES

nvinfer1::TempfileControlFlag::kALLOW_IN_MEMORY_FILES
@ kALLOW_IN_MEMORY_FILES
Allow creating and loading files in-memory (or unnamed files).

nvinfer1::EnumMax< OptProfileSelector >
constexpr int32_t EnumMax< OptProfileSelector >() noexcept
Number of different values of OptProfileSelector enum.
Definition: NvInferRuntime.h:2644

nvinfer1::WeightsRole
WeightsRole
How a layer uses particular Weights.
Definition: NvInferRuntime.h:1328

nvinfer1::WeightsRole::kSHIFT
@ kSHIFT
shift part of IScaleLayer

nvinfer1::WeightsRole::kANY
@ kANY
Any other weights role.

nvinfer1::WeightsRole::kBIAS
@ kBIAS
bias for IConvolutionLayer or IDeconvolutionLayer

nvinfer1::WeightsRole::kKERNEL
@ kKERNEL
kernel for IConvolutionLayer or IDeconvolutionLayer

nvinfer1::EnumMax< ProfilingVerbosity >
constexpr int32_t EnumMax< ProfilingVerbosity >() noexcept
Maximum number of profile verbosity levels in ProfilingVerbosity enum.
Definition: NvInferRuntime.h:2978

nvinfer1::ProfilingVerbosity
ProfilingVerbosity
List of verbosity levels of layer information exposed in NVTX annotations and in IEngineInspector.
Definition: NvInferRuntime.h:2970

nvinfer1::ProfilingVerbosity::kLAYER_NAMES_ONLY
@ kLAYER_NAMES_ONLY
Print only the layer names. This is the default setting.

nvinfer1::ProfilingVerbosity::kDETAILED
@ kDETAILED
Print detailed layer information including layer names and layer parameters.

nvinfer1::TacticSource
TacticSource
List of tactic sources for TensorRT.
Definition: NvInferRuntime.h:2921

nvinfer1::TacticSource::kCUBLAS_LT
@ kCUBLAS_LT

nvinfer1::TacticSource::kEDGE_MASK_CONVOLUTIONS
@ kEDGE_MASK_CONVOLUTIONS

nvinfer1::TacticSource::kCUDNN
@ kCUDNN

nvinfer1::TacticSource::kJIT_CONVOLUTIONS
@ kJIT_CONVOLUTIONS

nvinfer1::TacticSource::kCUBLAS
@ kCUBLAS

nvinfer1::PluginFormat
TensorFormat PluginFormat
PluginFormat is reserved for backward compatibility.
Definition: NvInferRuntimePlugin.h:54

nvinfer1::IPluginV3OneRuntime
v_1_0::IPluginV3OneRuntime IPluginV3OneRuntime
Definition: NvInferRuntime.h:1278

nvinfer1::ElementWiseOperation::kMIN
@ kMIN
Minimum of the two elements.

nvinfer1::EnumMax< TempfileControlFlag >
constexpr int32_t EnumMax< TempfileControlFlag >() noexcept
Maximum number of elements in TempfileControlFlag enum.
Definition: NvInferRuntime.h:1385

nvinfer1::SerializationFlags
uint32_t SerializationFlags
Represents one or more SerializationFlag values using binary OR operations, e.g., 1U << Serialization...
Definition: NvInferRuntime.h:2989

nvinfer1::InterpolationMode::kLINEAR
@ kLINEAR
Supports linear (1D), bilinear (2D), and trilinear (3D) interpolation.

nvinfer1::IPluginV3OneBuild
v_1_0::IPluginV3OneBuild IPluginV3OneBuild
Definition: NvInferRuntime.h:1266

nvinfer1::BuilderFlag::kEXCLUDE_LEAN_RUNTIME
@ kEXCLUDE_LEAN_RUNTIME

nvinfer1::TensorFormat
TensorFormat
Format of the input/output tensors.
Definition: NvInferRuntime.h:1430

nvinfer1::TensorFormat::kCHW4
@ kCHW4

nvinfer1::TensorFormat::kDHWC
@ kDHWC

nvinfer1::TensorFormat::kHWC16
@ kHWC16

nvinfer1::TensorFormat::kDHWC8
@ kDHWC8

nvinfer1::TensorFormat::kDLA_LINEAR
@ kDLA_LINEAR

nvinfer1::TensorFormat::kCDHW32
@ kCDHW32

nvinfer1::TensorFormat::kDLA_HWC4
@ kDLA_HWC4

nvinfer1::TensorFormat::kCHW16
@ kCHW16

nvinfer1::TensorFormat::kHWC
@ kHWC

nvinfer1::TensorFormat::kCHW2
@ kCHW2

nvinfer1::TensorFormat::kHWC8
@ kHWC8

nvinfer1::TensorFormat::kCHW32
@ kCHW32

nvinfer1::ExecutionContextAllocationStrategy
ExecutionContextAllocationStrategy
Different memory allocation behaviors for IExecutionContext.
Definition: NvInferRuntime.h:3104

nvinfer1::ExecutionContextAllocationStrategy::kSTATIC
@ kSTATIC
Default static allocation with the maximum size across all profiles.

nvinfer1::ExecutionContextAllocationStrategy::kUSER_MANAGED
@ kUSER_MANAGED
The user supplies custom allocation to the execution context.

nvinfer1::ExecutionContextAllocationStrategy::kON_PROFILE_CHANGE
@ kON_PROFILE_CHANGE
Reallocate for a profile when it's selected.

nvinfer1::EnumMax< CudaGraphStrategy >
constexpr int32_t EnumMax< CudaGraphStrategy >() noexcept
Maximum number of CUDA graph strategies in CudaGraphStrategy enum.
Definition: NvInferRuntime.h:3239

nvinfer1::EnumMax< TacticSource >
constexpr int32_t EnumMax< TacticSource >() noexcept
Maximum number of tactic sources in TacticSource enum.
Definition: NvInferRuntime.h:2947

nvinfer1::LayerInformationFormat
LayerInformationFormat
The format in which the IEngineInspector prints the layer information.
Definition: NvInferRuntime.h:5273

nvinfer1::LayerInformationFormat::kJSON
@ kJSON
Print layer information in JSON format.

nvinfer1::LayerInformationFormat::kONELINE
@ kONELINE
Print layer information in one line per layer.

nvinfer1::IStreamReader
v_1_0::IStreamReader IStreamReader
Definition: NvInferRuntime.h:710

nvinfer1::AllocatorFlag
AllocatorFlag
Allowed type of memory allocation.
Definition: NvInferRuntime.h:1554

nvinfer1::AllocatorFlag::kRESIZABLE
@ kRESIZABLE
TensorRT may call realloc() on this allocation.

nvinfer1::PoolingType::kMAX
@ kMAX
Maximum over elements.

nvinfer1::EnumMax< DeviceType >
constexpr int32_t EnumMax< DeviceType >() noexcept
Maximum number of elements in DeviceType enum.
Definition: NvInferRuntime.h:1357

nvinfer1::EnumMax< DimensionOperation >
constexpr int32_t EnumMax< DimensionOperation >() noexcept
Maximum number of elements in DimensionOperation enum.
Definition: NvInferRuntime.h:193

nvinfer1::EnumMax< ExecutionContextAllocationStrategy >
constexpr int32_t EnumMax< ExecutionContextAllocationStrategy >() noexcept
Maximum number of memory allocation strategies in ExecutionContextAllocationStrategy enum.
Definition: NvInferRuntime.h:3116

nvinfer1::EnumMax< SerializationFlag >
constexpr int32_t EnumMax< SerializationFlag >() noexcept
Maximum number of serialization flags in SerializationFlag enum.
Definition: NvInferRuntime.h:3007

nvinfer1::TensorLocation
TensorLocation
The location for tensor data storage, device or host.
Definition: NvInferRuntime.h:204

nvinfer1::TensorLocation::kHOST
@ kHOST
Data stored on host.

nvinfer1::TensorLocation::kDEVICE
@ kDEVICE
Data stored on device.

nvinfer1::OptProfileSelector
OptProfileSelector
When setting or querying optimization profile parameters (such as shape tensor inputs or dynamic dime...
Definition: NvInferRuntime.h:2632

nvinfer1::OptProfileSelector::kOPT
@ kOPT
This is used to set or get the value that is used in the optimization (kernel selection).

nvinfer1::AllocatorFlags
uint32_t AllocatorFlags
Definition: NvInferRuntime.h:1570

nvinfer1::DynamicPluginTensorDesc
Summarizes tensors that a plugin might see for an input or output.
Definition: NvInferRuntime.h:362

nvinfer1::DynamicPluginTensorDesc::min
Dims min
Lower bounds on tensor’s dimensions.
Definition: NvInferRuntime.h:367

nvinfer1::DynamicPluginTensorDesc::max
Dims max
Upper bounds on tensor’s dimensions.
Definition: NvInferRuntime.h:370

nvinfer1::DynamicPluginTensorDesc::opt
Dims opt
Optimum value of tensor’s dimensions specified for auto-tuning.
Definition: NvInferRuntime.h:373

nvinfer1::DynamicPluginTensorDesc::desc
PluginTensorDesc desc
Information required to interpret a pointer to tensor data, except that desc.dims has -1 in place of ...
Definition: NvInferRuntime.h:364

nvinfer1::PluginFieldCollection
Plugin field collection struct.
Definition: NvInferPluginBase.h:103

nvinfer1::PluginTensorDesc
Fields that a plugin might see for an input or output.
Definition: NvInferRuntimePlugin.h:73

nvinfer1::impl::EnumMaxImpl
Declaration of EnumMaxImpl struct to store maximum number of elements in an enumeration type.
Definition: NvInferRuntimeBase.h:128