TensorRT 10.16.0
NvInfer.h — source listing of the TensorRT network-definition (builder) API header.
/*
 * SPDX-FileCopyrightText: Copyright (c) 1993-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
 * SPDX-License-Identifier: Apache-2.0
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
17
18#ifndef NV_INFER_H
19#define NV_INFER_H
20
21#include "NvInferLegacyDims.h"
22#include "NvInferRuntime.h" // IWYU pragma: export
23
35
41
47namespace nvinfer1
48{
49
57enum class LayerType : int32_t
58{
59 kCONVOLUTION = 0,
60 kCAST = 1,
61 kACTIVATION = 2,
62 kPOOLING = 3,
63 kLRN = 4,
64 kSCALE = 5,
65 kSOFTMAX = 6,
66 kDECONVOLUTION = 7,
67 kCONCATENATION = 8,
68 kELEMENTWISE = 9,
69 kPLUGIN = 10,
70 kUNARY = 11,
71 kPADDING = 12,
72 kSHUFFLE = 13,
73 kREDUCE = 14,
74 kTOPK = 15,
75 kGATHER = 16,
76 kMATRIX_MULTIPLY = 17,
77 kRAGGED_SOFTMAX = 18,
78 kCONSTANT = 19,
79 kIDENTITY = 20,
80 kPLUGIN_V2 = 21,
81 kSLICE = 22,
82 kSHAPE = 23,
83 kPARAMETRIC_RELU = 24,
84 kRESIZE = 25,
85 kTRIP_LIMIT = 26,
86 kRECURRENCE = 27,
87 kITERATOR = 28,
88 kLOOP_OUTPUT = 29,
89 kSELECT = 30,
90 kFILL = 31,
91 kQUANTIZE = 32,
92 kDEQUANTIZE = 33,
93 kCONDITION = 34,
96 kSCATTER = 37,
97 kEINSUM = 38,
98 kASSERTION = 39,
99 kONE_HOT = 40,
100 kNON_ZERO = 41,
101 kGRID_SAMPLE = 42,
102 kNMS = 43,
103 kREVERSE_SEQUENCE = 44,
104 kNORMALIZATION = 45,
105 kPLUGIN_V3 = 46,
106 kSQUEEZE = 47,
107 kUNSQUEEZE = 48,
108 kCUMULATIVE = 49,
109 kDYNAMIC_QUANTIZE = 50,
110 kATTENTION_INPUT = 51,
111 kATTENTION_OUTPUT = 52,
112 kROTARY_EMBEDDING = 53,
113 kKVCACHE_UPDATE = 54,
114 kMOE = 55,
115 kDIST_COLLECTIVE = 56,
116};
117
123template <>
124constexpr inline int32_t EnumMax<LayerType>() noexcept
125{
126 return 57;
127}
128
135using TensorFormats = uint32_t;
136
142enum class ActivationType : int32_t
143{
144 kRELU = 0,
145 kSIGMOID = 1,
146 kTANH = 2,
147 kLEAKY_RELU = 3,
148 kELU = 4,
149 kSELU = 5,
150 kSOFTSIGN = 6,
151 kSOFTPLUS = 7,
152 kCLIP = 8,
153 kHARD_SIGMOID = 9,
154 kSCALED_TANH = 10,
155 kTHRESHOLDED_RELU = 11,
156 kGELU_ERF = 12,
157 kGELU_TANH = 13
158};
159
160namespace impl
161{
167template <>
169{
170 static constexpr int32_t kVALUE = 14;
171};
172} // namespace impl
173
188class ITensor : public INoCopy
189{
190public:
206 void setName(char const* name) noexcept
207 {
208 mImpl->setName(name);
209 }
210
218 char const* getName() const noexcept
219 {
220 return mImpl->getName();
221 }
222
237 void setDimensions(Dims const& dimensions) noexcept
238 {
239 mImpl->setDimensions(dimensions);
240 }
241
251 Dims getDimensions() const noexcept
252 {
253 return mImpl->getDimensions();
254 }
255
287 TRT_DEPRECATED void setType(DataType type) noexcept
288 {
289 mImpl->setType(type);
290 }
291
302 DataType getType() const noexcept
303 {
304 return mImpl->getType();
305 }
306
319 TRT_DEPRECATED bool setDynamicRange(float min, float max) noexcept
320 {
321 return mImpl->setDynamicRange(min, max);
322 }
323
327 bool isNetworkInput() const noexcept
328 {
329 return mImpl->isNetworkInput();
330 }
331
335 bool isNetworkOutput() const noexcept
336 {
337 return mImpl->isNetworkOutput();
338 }
339
352 TRT_DEPRECATED void setBroadcastAcrossBatch(bool broadcastAcrossBatch) noexcept
353 {
354 mImpl->setBroadcastAcrossBatch(broadcastAcrossBatch);
355 }
356
367 {
368 return mImpl->getBroadcastAcrossBatch();
369 }
370
379 {
380 return mImpl->getLocation();
381 }
382
398 {
399 mImpl->setLocation(location);
400 }
401
409 TRT_DEPRECATED bool dynamicRangeIsSet() const noexcept
410 {
411 return mImpl->dynamicRangeIsSet();
412 }
413
417 void resetDynamicRange() noexcept
418 {
419 mImpl->resetDynamicRange();
420 }
421
427 float getDynamicRangeMin() const noexcept
428 {
429 return mImpl->getDynamicRangeMin();
430 }
431
437 float getDynamicRangeMax() const noexcept
438 {
439 return mImpl->getDynamicRangeMax();
440 }
441
459 void setAllowedFormats(TensorFormats formats) noexcept
460 {
461 mImpl->setAllowedFormats(formats);
462 }
463
473 {
474 return mImpl->getAllowedFormats();
475 }
476
503 bool isShapeTensor() const noexcept
504 {
505 return mImpl->isShapeTensor();
506 }
507
524 bool isExecutionTensor() const noexcept
525 {
526 return mImpl->isExecutionTensor();
527 }
528
550 void setDimensionName(int32_t index, char const* name) noexcept
551 {
552 mImpl->setDimensionName(index, name);
553 }
554
565 char const* getDimensionName(int32_t index) const noexcept
566 {
567 return mImpl->getDimensionName(index);
568 }
569
570protected:
571 apiv::VTensor* mImpl;
572 virtual ~ITensor() noexcept = default;
573};
574
582class ILayer : public INoCopy
583{
584public:
590 LayerType getType() const noexcept
591 {
592 return mLayer->getType();
593 }
594
604 void setName(char const* name) noexcept
605 {
606 mLayer->setName(name);
607 }
608
614 char const* getName() const noexcept
615 {
616 return mLayer->getName();
617 }
618
622 int32_t getNbInputs() const noexcept
623 {
624 return mLayer->getNbInputs();
625 }
626
635 ITensor* getInput(int32_t index) const noexcept
636 {
637 return mLayer->getInput(index);
638 }
639
643 int32_t getNbOutputs() const noexcept
644 {
645 return mLayer->getNbOutputs();
646 }
647
653 ITensor* getOutput(int32_t index) const noexcept
654 {
655 return mLayer->getOutput(index);
656 }
657
670 void setInput(int32_t index, ITensor& tensor) noexcept
671 {
672 return mLayer->setInput(index, tensor);
673 }
674
703 TRT_DEPRECATED void setPrecision(DataType dataType) noexcept
704 {
705 mLayer->setPrecision(dataType);
706 }
707
715 DataType getPrecision() const noexcept
716 {
717 return mLayer->getPrecision();
718 }
719
729 TRT_DEPRECATED bool precisionIsSet() const noexcept
730 {
731 return mLayer->precisionIsSet();
732 }
733
742 {
743 mLayer->resetPrecision();
744 }
745
791 TRT_DEPRECATED void setOutputType(int32_t index, DataType dataType) noexcept
792 {
793 mLayer->setOutputType(index, dataType);
794 }
795
806 DataType getOutputType(int32_t index) const noexcept
807 {
808 return mLayer->getOutputType(index);
809 }
810
822 TRT_DEPRECATED bool outputTypeIsSet(int32_t index) const noexcept
823 {
824 return mLayer->outputTypeIsSet(index);
825 }
826
836 TRT_DEPRECATED void resetOutputType(int32_t index) noexcept
837 {
838 return mLayer->resetOutputType(index);
839 }
840
854 void setMetadata(char const* metadata) noexcept
855 {
856 mLayer->setMetadata(metadata);
857 }
858
867 char const* getMetadata() const noexcept
868 {
869 return mLayer->getMetadata();
870 }
871
888 bool setNbRanks(int32_t nbRanks) noexcept
889 {
890 return mLayer->setNbRanks(nbRanks);
891 }
892
900 int32_t getNbRanks() const noexcept
901 {
902 return mLayer->getNbRanks();
903 }
904
905protected:
906 virtual ~ILayer() noexcept = default;
907 apiv::VLayer* mLayer;
908};
909
1066enum class PaddingMode : int32_t
1067{
1069 kEXPLICIT_ROUND_UP = 1,
1070 kSAME_UPPER = 2,
1071 kSAME_LOWER = 3,
1072};
1073
1074namespace impl
1075{
1081template <>
1083{
1084 static constexpr int32_t kVALUE = 4;
1085};
1086} // namespace impl
1087
1101{
1102public:
1110 void setNbOutputMaps(int64_t nbOutputMaps) noexcept
1111 {
1112 mImpl->setNbOutputMaps(nbOutputMaps);
1113 }
1114
1120 int64_t getNbOutputMaps() const noexcept
1121 {
1122 return mImpl->getNbOutputMaps();
1123 }
1124
1140 void setNbGroups(int64_t nbGroups) noexcept
1141 {
1142 mImpl->setNbGroups(nbGroups);
1143 }
1144
1150 int64_t getNbGroups() const noexcept
1151 {
1152 return mImpl->getNbGroups();
1153 }
1154
1164 void setKernelWeights(Weights weights) noexcept
1165 {
1166 mImpl->setKernelWeights(weights);
1167 }
1168
1174 Weights getKernelWeights() const noexcept
1175 {
1176 return mImpl->getKernelWeights();
1177 }
1178
1189 void setBiasWeights(Weights weights) noexcept
1190 {
1191 mImpl->setBiasWeights(weights);
1192 }
1193
1199 Weights getBiasWeights() const noexcept
1200 {
1201 return mImpl->getBiasWeights();
1202 }
1203
1216 void setPrePadding(Dims const& padding) noexcept
1217 {
1218 mImpl->setPrePadding(padding);
1219 }
1220
1226 Dims getPrePadding() const noexcept
1227 {
1228 return mImpl->getPrePadding();
1229 }
1230
1243 void setPostPadding(Dims const& padding) noexcept
1244 {
1245 mImpl->setPostPadding(padding);
1246 }
1247
1253 Dims getPostPadding() const noexcept
1254 {
1255 return mImpl->getPostPadding();
1256 }
1257
1267 void setPaddingMode(PaddingMode paddingMode) noexcept
1268 {
1269 mImpl->setPaddingMode(paddingMode);
1270 }
1271
1280 {
1281 return mImpl->getPaddingMode();
1282 }
1283
1292 void setKernelSizeNd(Dims const& kernelSize) noexcept
1293 {
1294 mImpl->setKernelSizeNd(kernelSize);
1295 }
1296
1302 Dims getKernelSizeNd() const noexcept
1303 {
1304 return mImpl->getKernelSizeNd();
1305 }
1306
1317 void setStrideNd(Dims const& stride) noexcept
1318 {
1319 mImpl->setStrideNd(stride);
1320 }
1321
1327 Dims getStrideNd() const noexcept
1328 {
1329 return mImpl->getStrideNd();
1330 }
1331
1345 void setPaddingNd(Dims const& padding) noexcept
1346 {
1347 mImpl->setPaddingNd(padding);
1348 }
1349
1357 Dims getPaddingNd() const noexcept
1358 {
1359 return mImpl->getPaddingNd();
1360 }
1361
1371 void setDilationNd(Dims const& dilation) noexcept
1372 {
1373 mImpl->setDilationNd(dilation);
1374 }
1375
1381 Dims getDilationNd() const noexcept
1382 {
1383 return mImpl->getDilationNd();
1384 }
1385
1400 using ILayer::setInput;
1401
1402protected:
1403 virtual ~IConvolutionLayer() noexcept = default;
1404 apiv::VConvolutionLayer* mImpl;
1405};
1406
1421{
1422public:
1431 {
1432 mImpl->setActivationType(type);
1433 }
1434
1441 {
1442 return mImpl->getActivationType();
1443 }
1444
1455 void setAlpha(float alpha) noexcept
1456 {
1457 mImpl->setAlpha(alpha);
1458 }
1459
1469 void setBeta(float beta) noexcept
1470 {
1471 mImpl->setBeta(beta);
1472 }
1473
1478 float getAlpha() const noexcept
1479 {
1480 return mImpl->getAlpha();
1481 }
1482
1487 float getBeta() const noexcept
1488 {
1489 return mImpl->getBeta();
1490 }
1491
1492protected:
1493 virtual ~IActivationLayer() noexcept = default;
1494 apiv::VActivationLayer* mImpl;
1495};
1496
1502enum class PoolingType : int32_t
1503{
1504 kMAX = 0,
1505 kAVERAGE = 1,
1507};
1508
1509namespace impl
1510{
1516template <>
1518{
1519 static constexpr int32_t kVALUE = 3;
1520};
1521} // namespace impl
1522
1534class IPoolingLayer : public ILayer
1535{
1536public:
1544 void setPoolingType(PoolingType type) noexcept
1545 {
1546 mImpl->setPoolingType(type);
1547 }
1548
1555 {
1556 return mImpl->getPoolingType();
1557 }
1558
1569 void setBlendFactor(float blendFactor) noexcept
1570 {
1571 mImpl->setBlendFactor(blendFactor);
1572 }
1573
1582 float getBlendFactor() const noexcept
1583 {
1584 return mImpl->getBlendFactor();
1585 }
1586
1596 void setAverageCountExcludesPadding(bool exclusive) noexcept
1597 {
1598 mImpl->setAverageCountExcludesPadding(exclusive);
1599 }
1600
1608 {
1609 return mImpl->getAverageCountExcludesPadding();
1610 }
1611
1625 void setPrePadding(Dims const& padding) noexcept
1626 {
1627 mImpl->setPrePadding(padding);
1628 }
1629
1635 Dims getPrePadding() const noexcept
1636 {
1637 return mImpl->getPrePadding();
1638 }
1639
1653 void setPostPadding(Dims const& padding) noexcept
1654 {
1655 mImpl->setPostPadding(padding);
1656 }
1657
1663 Dims getPostPadding() const noexcept
1664 {
1665 return mImpl->getPostPadding();
1666 }
1667
1676 void setPaddingMode(PaddingMode paddingMode) noexcept
1677 {
1678 mImpl->setPaddingMode(paddingMode);
1679 }
1680
1688 {
1689 return mImpl->getPaddingMode();
1690 }
1691
1700 void setWindowSizeNd(Dims const& windowSize) noexcept
1701 {
1702 mImpl->setWindowSizeNd(windowSize);
1703 }
1704
1710 Dims getWindowSizeNd() const noexcept
1711 {
1712 return mImpl->getWindowSizeNd();
1713 }
1714
1725 void setStrideNd(Dims const& stride) noexcept
1726 {
1727 mImpl->setStrideNd(stride);
1728 }
1729
1735 Dims getStrideNd() const noexcept
1736 {
1737 return mImpl->getStrideNd();
1738 }
1739
1754 void setPaddingNd(Dims const& padding) noexcept
1755 {
1756 mImpl->setPaddingNd(padding);
1757 }
1758
1766 Dims getPaddingNd() const noexcept
1767 {
1768 return mImpl->getPaddingNd();
1769 }
1770
1771protected:
1772 virtual ~IPoolingLayer() noexcept = default;
1773 apiv::VPoolingLayer* mImpl;
1774};
1775
1785class ILRNLayer : public ILayer
1786{
1787public:
1797 void setWindowSize(int64_t windowSize) noexcept
1798 {
1799 mImpl->setWindowSize(windowSize);
1800 }
1801
1807 int64_t getWindowSize() const noexcept
1808 {
1809 return mImpl->getWindowSize();
1810 }
1811
1819 void setAlpha(float alpha) noexcept
1820 {
1821 mImpl->setAlpha(alpha);
1822 }
1823
1829 float getAlpha() const noexcept
1830 {
1831 return mImpl->getAlpha();
1832 }
1833
1841 void setBeta(float beta) noexcept
1842 {
1843 mImpl->setBeta(beta);
1844 }
1845
1851 float getBeta() const noexcept
1852 {
1853 return mImpl->getBeta();
1854 }
1855
1863 void setK(float k) noexcept
1864 {
1865 mImpl->setK(k);
1866 }
1867
1873 float getK() const noexcept
1874 {
1875 return mImpl->getK();
1876 }
1877
1878protected:
1879 virtual ~ILRNLayer() noexcept = default;
1880 apiv::VLRNLayer* mImpl;
1881};
1882
1888enum class ScaleMode : int32_t
1889{
1890 kUNIFORM = 0,
1891 kCHANNEL = 1,
1892 kELEMENTWISE = 2
1893};
1894
1900template <>
1901constexpr inline int32_t EnumMax<ScaleMode>() noexcept
1902{
1903 return 3;
1904}
1905
1931class IScaleLayer : public ILayer
1932{
1933public:
1939 void setMode(ScaleMode mode) noexcept
1940 {
1941 mImpl->setMode(mode);
1942 }
1943
1949 ScaleMode getMode() const noexcept
1950 {
1951 return mImpl->getMode();
1952 }
1953
1959 void setShift(Weights shift) noexcept
1960 {
1961 mImpl->setShift(shift);
1962 }
1963
1969 Weights getShift() const noexcept
1970 {
1971 return mImpl->getShift();
1972 }
1973
1979 void setScale(Weights scale) noexcept
1980 {
1981 mImpl->setScale(scale);
1982 }
1983
1989 Weights getScale() const noexcept
1990 {
1991 return mImpl->getScale();
1992 }
1993
1999 void setPower(Weights power) noexcept
2000 {
2001 mImpl->setPower(power);
2002 }
2003
2009 Weights getPower() const noexcept
2010 {
2011 return mImpl->getPower();
2012 }
2013
2024 int32_t getChannelAxis() const noexcept
2025 {
2026 return mImpl->getChannelAxis();
2027 }
2028
2045 void setChannelAxis(int32_t channelAxis) noexcept
2046 {
2047 mImpl->setChannelAxis(channelAxis);
2048 }
2049
2050protected:
2051 virtual ~IScaleLayer() noexcept = default;
2052 apiv::VScaleLayer* mImpl;
2053};
2054
2075class ISoftMaxLayer : public ILayer
2076{
2077public:
2098 void setAxes(uint32_t axes) noexcept
2099 {
2100 mImpl->setAxes(axes);
2101 }
2102
2108 uint32_t getAxes() const noexcept
2109 {
2110 return mImpl->getAxes();
2111 }
2112
2113protected:
2114 virtual ~ISoftMaxLayer() noexcept = default;
2115 apiv::VSoftMaxLayer* mImpl;
2116};
2117
2131{
2132public:
2144 void setAxis(int32_t axis) noexcept
2145 {
2146 mImpl->setAxis(axis);
2147 }
2148
2154 int32_t getAxis() const noexcept
2155 {
2156 return mImpl->getAxis();
2157 }
2158
2159protected:
2160 virtual ~IConcatenationLayer() noexcept = default;
2161 apiv::VConcatenationLayer* mImpl;
2162};
2163
2172{
2173public:
2181 void setNbOutputMaps(int64_t nbOutputMaps) noexcept
2182 {
2183 mImpl->setNbOutputMaps(nbOutputMaps);
2184 }
2185
2191 int64_t getNbOutputMaps() const noexcept
2192 {
2193 return mImpl->getNbOutputMaps();
2194 }
2195
2211 void setNbGroups(int64_t nbGroups) noexcept
2212 {
2213 mImpl->setNbGroups(nbGroups);
2214 }
2215
2221 int64_t getNbGroups() const noexcept
2222 {
2223 return mImpl->getNbGroups();
2224 }
2225
2235 void setKernelWeights(Weights weights) noexcept
2236 {
2237 mImpl->setKernelWeights(weights);
2238 }
2239
2245 Weights getKernelWeights() const noexcept
2246 {
2247 return mImpl->getKernelWeights();
2248 }
2249
2260 void setBiasWeights(Weights weights) noexcept
2261 {
2262 mImpl->setBiasWeights(weights);
2263 }
2264
2270 Weights getBiasWeights() const noexcept
2271 {
2272 return mImpl->getBiasWeights();
2273 }
2274
2287 void setPrePadding(Dims const& padding) noexcept
2288 {
2289 mImpl->setPrePadding(padding);
2290 }
2291
2297 Dims getPrePadding() const noexcept
2298 {
2299 return mImpl->getPrePadding();
2300 }
2301
2314 void setPostPadding(Dims const& padding) noexcept
2315 {
2316 mImpl->setPostPadding(padding);
2317 }
2318
2324 Dims getPostPadding() const noexcept
2325 {
2326 return mImpl->getPostPadding();
2327 }
2328
2338 void setPaddingMode(PaddingMode paddingMode) noexcept
2339 {
2340 mImpl->setPaddingMode(paddingMode);
2341 }
2342
2351 {
2352 return mImpl->getPaddingMode();
2353 }
2354
2365 void setKernelSizeNd(Dims const& kernelSize) noexcept
2366 {
2367 mImpl->setKernelSizeNd(kernelSize);
2368 }
2369
2375 Dims getKernelSizeNd() const noexcept
2376 {
2377 return mImpl->getKernelSizeNd();
2378 }
2379
2392 void setStrideNd(Dims const& stride) noexcept
2393 {
2394 mImpl->setStrideNd(stride);
2395 }
2396
2402 Dims getStrideNd() const noexcept
2403 {
2404 return mImpl->getStrideNd();
2405 }
2406
2420 void setPaddingNd(Dims const& padding) noexcept
2421 {
2422 mImpl->setPaddingNd(padding);
2423 }
2424
2432 Dims getPaddingNd() const noexcept
2433 {
2434 return mImpl->getPaddingNd();
2435 }
2436
2449 using ILayer::setInput;
2450
2458 void setDilationNd(Dims const& dilation) noexcept
2459 {
2460 mImpl->setDilationNd(dilation);
2461 }
2462
2468 Dims getDilationNd() const noexcept
2469 {
2470 return mImpl->getDilationNd();
2471 }
2472
2473protected:
2474 virtual ~IDeconvolutionLayer() noexcept = default;
2475 apiv::VDeconvolutionLayer* mImpl;
2476};
2477
2490enum class ElementWiseOperation : int32_t
2491{
2492 kSUM = 0,
2493 kPROD = 1,
2494 kMAX = 2,
2495 kMIN = 3,
2496 kSUB = 4,
2497 kDIV = 5,
2498 kPOW = 6,
2499 kFLOOR_DIV = 7,
2500 kAND = 8,
2501 kOR = 9,
2502 kXOR = 10,
2503 kEQUAL = 11,
2504 kGREATER = 12,
2505 kLESS = 13
2506};
2507
2508namespace impl
2509{
2515template <>
2517{
2518 static constexpr int32_t kVALUE = 14;
2519};
2520} // namespace impl
2521
2542{
2543public:
2554 {
2555 return mImpl->setOperation(op);
2556 }
2557
2566 {
2567 return mImpl->getOperation();
2568 }
2569
2570protected:
2571 apiv::VElementWiseLayer* mImpl;
2572 virtual ~IElementWiseLayer() noexcept = default;
2573};
2574
2580enum class GatherMode : int32_t
2581{
2582 kDEFAULT = 0,
2583 kELEMENT = 1,
2584 kND = 2
2585};
2586
2592template <>
2593constexpr inline int32_t EnumMax<GatherMode>() noexcept
2594{
2595 return 3;
2596}
2597
2674class IGatherLayer : public ILayer
2675{
2676public:
2686 void setGatherAxis(int32_t axis) noexcept
2687 {
2688 mImpl->setGatherAxis(axis);
2689 }
2690
2698 int32_t getGatherAxis() const noexcept
2699 {
2700 return mImpl->getGatherAxis();
2701 }
2702
2721 void setNbElementWiseDims(int32_t elementWiseDims) noexcept
2722 {
2723 mImpl->setNbElementWiseDims(elementWiseDims);
2724 }
2725
2731 int32_t getNbElementWiseDims() const noexcept
2732 {
2733 return mImpl->getNbElementWiseDims();
2734 }
2735
2741 void setMode(GatherMode mode) noexcept
2742 {
2743 mImpl->setMode(mode);
2744 }
2745
2751 GatherMode getMode() const noexcept
2752 {
2753 return mImpl->getMode();
2754 }
2755
2756protected:
2757 apiv::VGatherLayer* mImpl;
2758 virtual ~IGatherLayer() noexcept = default;
2759};
2760
2773{
2774public:
2781 {
2782 return mImpl->getPlugin();
2783 }
2784
2785protected:
2786 apiv::VPluginV2Layer* mImpl;
2787 virtual ~IPluginV2Layer() noexcept = default;
2788};
2789
2800{
2801public:
2808 {
2809 return mImpl->getPlugin();
2810 }
2811
2812protected:
2813 apiv::VPluginV3Layer* mImpl;
2814 virtual ~IPluginV3Layer() noexcept = default;
2815};
2816
2833enum class UnaryOperation : int32_t
2834{
2835 kEXP = 0,
2836 kLOG = 1,
2837 kSQRT = 2,
2838 kRECIP = 3,
2839 kABS = 4,
2840 kNEG = 5,
2841 kSIN = 6,
2842 kCOS = 7,
2843 kTAN = 8,
2844 kSINH = 9,
2845 kCOSH = 10,
2846 kASIN = 11,
2847 kACOS = 12,
2848 kATAN = 13,
2849 kASINH = 14,
2850 kACOSH = 15,
2851 kATANH = 16,
2852 kCEIL = 17,
2853 kFLOOR = 18,
2854 kERF = 19,
2855 kNOT = 20,
2856 kSIGN = 21,
2857 kROUND = 22,
2858 kISINF = 23,
2859 kISNAN = 24,
2860};
2861
2867template <>
2868constexpr inline int32_t EnumMax<UnaryOperation>() noexcept
2869{
2870 return 25;
2871}
2872
2880class IUnaryLayer : public ILayer
2881{
2882public:
2891 {
2892 mImpl->setOperation(op);
2893 }
2894
2901 {
2902 return mImpl->getOperation();
2903 }
2904
2905protected:
2906 apiv::VUnaryLayer* mImpl;
2907 virtual ~IUnaryLayer() noexcept = default;
2908};
2909
2933enum class ReduceOperation : int32_t
2934{
2935 kSUM = 0,
2936 kPROD = 1,
2937 kMAX = 2,
2938 kMIN = 3,
2939 kAVG = 4,
2940 kNONE = 5,
2941};
2942
2948template <>
2949constexpr inline int32_t EnumMax<ReduceOperation>() noexcept
2950{
2951 return 6;
2952}
2953
2961enum class CollectiveOperation : int32_t
2962{
2963 kALL_REDUCE = 0,
2964 kALL_GATHER = 1,
2965 kBROADCAST = 2,
2966 kREDUCE = 3,
2967 kREDUCE_SCATTER = 4,
2968};
2969
2975template <>
2977{
2978 static constexpr int32_t kVALUE = 5;
2979};
2980
2988class IReduceLayer : public ILayer
2989{
2990public:
2997 {
2998 mImpl->setOperation(op);
2999 }
3000
3007 {
3008 return mImpl->getOperation();
3009 }
3010
3016 void setReduceAxes(uint32_t reduceAxes) noexcept
3017 {
3018 mImpl->setReduceAxes(reduceAxes);
3019 }
3020
3026 uint32_t getReduceAxes() const noexcept
3027 {
3028 return mImpl->getReduceAxes();
3029 }
3030
3036 void setKeepDimensions(bool keepDimensions) noexcept
3037 {
3038 mImpl->setKeepDimensions(keepDimensions);
3039 }
3040
3046 bool getKeepDimensions() const noexcept
3047 {
3048 return mImpl->getKeepDimensions();
3049 }
3050
3051protected:
3052 apiv::VReduceLayer* mImpl;
3053 virtual ~IReduceLayer() noexcept = default;
3054};
3055
3068class IPaddingLayer : public ILayer
3069{
3070public:
3080 void setPrePaddingNd(Dims const& padding) noexcept
3081 {
3082 mImpl->setPrePaddingNd(padding);
3083 }
3084
3092 Dims getPrePaddingNd() const noexcept
3093 {
3094 return mImpl->getPrePaddingNd();
3095 }
3096
3106 void setPostPaddingNd(Dims const& padding) noexcept
3107 {
3108 mImpl->setPostPaddingNd(padding);
3109 }
3110
3118 Dims getPostPaddingNd() const noexcept
3119 {
3120 return mImpl->getPostPaddingNd();
3121 }
3122
3123protected:
3124 apiv::VPaddingLayer* mImpl;
3125 virtual ~IPaddingLayer() noexcept = default;
3126};
3127
3134{
3141 int32_t order[Dims::MAX_DIMS];
3142};
3143
3156class IShuffleLayer : public ILayer
3157{
3158public:
3168 void setFirstTranspose(Permutation permutation) noexcept
3169 {
3170 mImpl->setFirstTranspose(permutation);
3171 }
3172
3181 {
3182 return mImpl->getFirstTranspose();
3183 }
3184
3208 void setReshapeDimensions(Dims const& dimensions) noexcept
3209 {
3210 mImpl->setReshapeDimensions(dimensions);
3211 }
3212
3222 {
3223 return mImpl->getReshapeDimensions();
3224 }
3225
3231 //
3254 using ILayer::setInput;
3255
3268 void setSecondTranspose(Permutation permutation) noexcept
3269 {
3270 mImpl->setSecondTranspose(permutation);
3271 }
3272
3281 {
3282 return mImpl->getSecondTranspose();
3283 }
3284
3296 void setZeroIsPlaceholder(bool zeroIsPlaceholder) noexcept
3297 {
3298 return mImpl->setZeroIsPlaceholder(zeroIsPlaceholder);
3299 }
3300
3309 bool getZeroIsPlaceholder() const noexcept
3310 {
3311 return mImpl->getZeroIsPlaceholder();
3312 }
3313
3314protected:
3315 apiv::VShuffleLayer* mImpl;
3316 virtual ~IShuffleLayer() noexcept = default;
3317};
3318
3324enum class SampleMode : int32_t
3325{
3326 kSTRICT_BOUNDS = 0,
3327 kWRAP = 1,
3328 kCLAMP = 2,
3329 kFILL = 3,
3330 kREFLECT = 4,
3333};
3334
3340template <>
3341constexpr inline int32_t EnumMax<SampleMode>() noexcept
3342{
3343 return 5;
3344}
3345
3408class ISliceLayer : public ILayer
3409{
3410public:
3420 void setStart(Dims const& start) noexcept
3421 {
3422 mImpl->setStart(start);
3423 }
3424
3435 Dims getStart() const noexcept
3436 {
3437 return mImpl->getStart();
3438 }
3439
3449 void setSize(Dims const& size) noexcept
3450 {
3451 return mImpl->setSize(size);
3452 }
3453
3464 Dims getSize() const noexcept
3465 {
3466 return mImpl->getSize();
3467 }
3468
3478 void setStride(Dims const& stride) noexcept
3479 {
3480 mImpl->setStride(stride);
3481 }
3482
3493 Dims getStride() const noexcept
3494 {
3495 return mImpl->getStride();
3496 }
3497
3503 void setMode(SampleMode mode) noexcept
3504 {
3505 mImpl->setMode(mode);
3506 }
3507
3513 SampleMode getMode() const noexcept
3514 {
3515 return mImpl->getMode();
3516 }
3517
3545 using ILayer::setInput;
3546
3556 void setAxes(Dims const& axes) noexcept
3557 {
3558 mImpl->setAxes(axes);
3559 }
3560
3571 Dims getAxes() const noexcept
3572 {
3573 return mImpl->getAxes();
3574 }
3575
3576protected:
3577 apiv::VSliceLayer* mImpl;
3578 virtual ~ISliceLayer() noexcept = default;
3579};
3580
3593class IShapeLayer : public ILayer
3594{
3595protected:
3596 apiv::VShapeLayer* mImpl;
3597 virtual ~IShapeLayer() noexcept = default;
3598};
3599
3605enum class TopKOperation : int32_t
3606{
3607 kMAX = 0,
3608 kMIN = 1,
3609};
3610
3616template <>
3617constexpr inline int32_t EnumMax<TopKOperation>() noexcept
3618{
3619 return 2;
3620}
3621
3633class ITopKLayer : public ILayer
3634{
3635public:
3641 void setOperation(TopKOperation op) noexcept
3642 {
3643 mImpl->setOperation(op);
3644 }
3645
3652 {
3653 return mImpl->getOperation();
3654 }
3655
3665 void setK(int32_t k) noexcept
3666 {
3667 mImpl->setK(k);
3668 }
3669
3679 int32_t getK() const noexcept
3680 {
3681 return mImpl->getK();
3682 }
3683
3689 void setReduceAxes(uint32_t reduceAxes) noexcept
3690 {
3691 mImpl->setReduceAxes(reduceAxes);
3692 }
3693
3699 uint32_t getReduceAxes() const noexcept
3700 {
3701 return mImpl->getReduceAxes();
3702 }
3703
3718 using ILayer::setInput;
3719
3730 bool setIndicesType(DataType type) noexcept
3731 {
3732 return mImpl->setIndicesType(type);
3733 }
3734
3742 DataType getIndicesType() const noexcept
3743 {
3744 return mImpl->getIndicesType();
3745 }
3746
3747protected:
3748 apiv::VTopKLayer* mImpl;
3749 virtual ~ITopKLayer() noexcept = default;
3750};
3751
3758enum class MatrixOperation : int32_t
3759{
3763 kNONE = 0,
3764
3766 kTRANSPOSE = 1,
3767
3778 kVECTOR = 2,
3779};
3780
3786template <>
3787constexpr inline int32_t EnumMax<MatrixOperation>() noexcept
3788{
3789 return 3;
3790}
3791
3818{
3819public:
3828 void setOperation(int32_t index, MatrixOperation op) noexcept
3829 {
3830 mImpl->setOperation(index, op);
3831 }
3832
3840 MatrixOperation getOperation(int32_t index) const noexcept
3841 {
3842 return mImpl->getOperation(index);
3843 }
3844
3845protected:
3846 apiv::VMatrixMultiplyLayer* mImpl;
3847 virtual ~IMatrixMultiplyLayer() noexcept = default;
3848};
3849
3871class INonZeroLayer : public ILayer
3872{
3873public:
3884 bool setIndicesType(DataType type) noexcept
3885 {
3886 return mImpl->setIndicesType(type);
3887 }
3888
3896 DataType getIndicesType() const noexcept
3897 {
3898 return mImpl->getIndicesType();
3899 }
3900
3901protected:
3902 virtual ~INonZeroLayer() noexcept = default;
3903 apiv::VNonZeroLayer* mImpl;
3904};
3905
3921{
3922protected:
3923 apiv::VRaggedSoftMaxLayer* mImpl;
3924 virtual ~IRaggedSoftMaxLayer() noexcept = default;
3925};
3926
3971{
3972protected:
3973 apiv::VIdentityLayer* mImpl;
3974 virtual ~IIdentityLayer() noexcept = default;
3975};
3976
3983class ICastLayer : public ILayer
3984{
3985public:
3993 void setToType(DataType toType) noexcept
3994 {
3995 mImpl->setToType(toType);
3996 }
3997
4004 DataType getToType() const noexcept
4005 {
4006 return mImpl->getToType();
4007 }
4008
4009protected:
4010 apiv::VCastLayer* mImpl;
4011 virtual ~ICastLayer() noexcept = default;
4012};
4013
4023{
4024public:
4033 void setWeights(Weights weights) noexcept
4034 {
4035 mImpl->setWeights(weights);
4036 }
4037
4043 Weights getWeights() const noexcept
4044 {
4045 return mImpl->getWeights();
4046 }
4047
4055 void setDimensions(Dims const& dimensions) noexcept
4056 {
4057 mImpl->setDimensions(dimensions);
4058 }
4059
4067 Dims getDimensions() const noexcept
4068 {
4069 return mImpl->getDimensions();
4070 }
4071
4072protected:
4073 apiv::VConstantLayer* mImpl;
4074 virtual ~IConstantLayer() noexcept = default;
4075};
4076
4087{
4088protected:
4089 apiv::VParametricReLULayer* mImpl;
4090 virtual ~IParametricReLULayer() noexcept = default;
4091};
4092
4098enum class InterpolationMode : int32_t
4099{
4100 kNEAREST = 0,
4101 kLINEAR = 1,
4102 kCUBIC = 2
4103};
4104
4105namespace impl
4106{
4112template <>
4114{
4115 static constexpr int32_t kVALUE = 3;
4116};
4117} // namespace impl
4118
4127{
4140 kALIGN_CORNERS = 0,
4141
4148 kASYMMETRIC = 1,
4149
4156 kHALF_PIXEL = 2,
4157};
4158
4159namespace impl
4160{
4166template <>
4168{
4169 static constexpr int32_t kVALUE = 3;
4170};
4171} // namespace impl
4172
4180enum class ResizeSelector : int32_t
4181{
4183 kFORMULA = 0,
4184
4186 kUPPER = 1,
4187};
4188
4189namespace impl
4190{
4196template <>
4198{
4199 static constexpr int32_t kVALUE = 2;
4200};
4201} // namespace impl
4202
4210enum class ResizeRoundMode : int32_t
4211{
4213 kHALF_UP = 0,
4214
4216 kHALF_DOWN = 1,
4217
4219 kFLOOR = 2,
4220
4222 kCEIL = 3,
4223};
4224
4225namespace impl
4226{
4232template <>
4234{
4235 static constexpr int32_t kVALUE = 4;
4236};
4237} // namespace impl
4238
4275class IResizeLayer : public ILayer
4276{
4277public:
4296 void setOutputDimensions(Dims const& dimensions) noexcept
4297 {
4298 return mImpl->setOutputDimensions(dimensions);
4299 }
4300
4306 Dims getOutputDimensions() const noexcept
4307 {
4308 return mImpl->getOutputDimensions();
4309 }
4310
4336 void setScales(float const* scales, int32_t nbScales) noexcept
4337 {
4338 mImpl->setScales(scales, nbScales);
4339 }
4340
4355 int32_t getScales(int32_t size, float* scales) const noexcept
4356 {
4357 return mImpl->getScales(size, scales);
4358 }
4359
4367 void setResizeMode(InterpolationMode interpolationMode) noexcept
4368 {
4369 mImpl->setResizeMode(interpolationMode);
4370 }
4371
4378 {
4379 return mImpl->getResizeMode();
4380 }
4381
4401 using ILayer::setInput;
4402
4413 {
4414 mImpl->setCoordinateTransformation(coordTransform);
4415 }
4416
4423 {
4424 return mImpl->getCoordinateTransformation();
4425 }
4426
4438 {
4439 mImpl->setSelectorForSinglePixel(selector);
4440 }
4441
4448 {
4449 return mImpl->getSelectorForSinglePixel();
4450 }
4451
4462 {
4463 mImpl->setNearestRounding(value);
4464 }
4465
4472 {
4473 return mImpl->getNearestRounding();
4474 }
4475
4493 void setCubicCoeff(float A) noexcept
4494 {
4495 mImpl->setCubicCoeff(A);
4496 }
4497
4503 float getCubicCoeff() const noexcept
4504 {
4505 return mImpl->getCubicCoeff();
4506 }
4507
4516 void setExcludeOutside(bool excludeFlag) noexcept
4517 {
4518 mImpl->setExcludeOutside(excludeFlag);
4519 }
4520
4526 bool getExcludeOutside() const noexcept
4527 {
4528 return mImpl->getExcludeOutside();
4529 }
4530
4531protected:
4532 virtual ~IResizeLayer() noexcept = default;
4533 apiv::VResizeLayer* mImpl;
4534};
4535
4541enum class LoopOutput : int32_t
4542{
4544 kLAST_VALUE = 0,
4545
4547 kCONCATENATE = 1,
4548
4550 kREVERSE = 2
4551};
4552
4558template <>
4559constexpr inline int32_t EnumMax<LoopOutput>() noexcept
4560{
4561 return 3;
4562}
4563
4569enum class TripLimit : int32_t
4570{
4571
4572 kCOUNT = 0,
4573 kWHILE = 1
4574};
4575
4581template <>
4582constexpr inline int32_t EnumMax<TripLimit>() noexcept
4583{
4584 return 2;
4585}
4586
4587class ILoop;
4588
4603{
4604public:
4608 ILoop* getLoop() const noexcept
4609 {
4610 return mBoundary->getLoop();
4611 }
4612
4613protected:
4614 virtual ~ILoopBoundaryLayer() noexcept = default;
4615 apiv::VLoopBoundaryLayer* mBoundary;
4616};
4617
4626{
4627public:
4632 {
4633 return mBoundary->getConditional();
4634 }
4635
4636protected:
4637 virtual ~IIfConditionalBoundaryLayer() noexcept = default;
4638 apiv::VConditionalBoundaryLayer* mBoundary;
4639};
4640
4647{
4648public:
4649protected:
4650 virtual ~IConditionLayer() noexcept = default;
4651 apiv::VConditionLayer* mImpl;
4652};
4653
4664{
4665public:
4666protected:
4667 virtual ~IIfConditionalOutputLayer() noexcept = default;
4668 apiv::VConditionalOutputLayer* mImpl;
4669};
4670
4677{
4678public:
4679protected:
4680 virtual ~IIfConditionalInputLayer() noexcept = default;
4681 apiv::VConditionalInputLayer* mImpl;
4682};
4683
4709{
4710public:
4721 {
4722 return mImpl->setCondition(condition);
4723 }
4724
4738 IIfConditionalOutputLayer* addOutput(ITensor& trueSubgraphOutput, ITensor& falseSubgraphOutput) noexcept
4739 {
4740 return mImpl->addOutput(trueSubgraphOutput, falseSubgraphOutput);
4741 }
4742
4751 {
4752 return mImpl->addInput(input);
4753 }
4754
4765 void setName(char const* name) noexcept
4766 {
4767 mImpl->setName(name);
4768 }
4769
4775 char const* getName() const noexcept
4776 {
4777 return mImpl->getName();
4778 }
4779
4780protected:
4781 virtual ~IIfConditional() noexcept = default;
4782 apiv::VIfConditional* mImpl;
4783};
4784
4793{
4794public:
4800 //
4813 using ILayer::setInput;
4814
4815protected:
4816 virtual ~IRecurrenceLayer() noexcept = default;
4817 apiv::VRecurrenceLayer* mImpl;
4818};
4819
4840{
4841public:
4845 LoopOutput getLoopOutput() const noexcept
4846 {
4847 return mImpl->getLoopOutput();
4848 }
4849
4862 void setAxis(int32_t axis) noexcept
4863 {
4864 mImpl->setAxis(axis);
4865 }
4866
4870 int32_t getAxis() const noexcept
4871 {
4872 return mImpl->getAxis();
4873 }
4874
4880 //
4895 using ILayer::setInput;
4896
4897protected:
4898 virtual ~ILoopOutputLayer() noexcept = default;
4899 apiv::VLoopOutputLayer* mImpl;
4900};
4901
4914{
4915public:
4919 TripLimit getTripLimit() const noexcept
4920 {
4921 return mImpl->getTripLimit();
4922 }
4923
4924protected:
4925 virtual ~ITripLimitLayer() noexcept = default;
4926 apiv::VTripLimitLayer* mImpl;
4927};
4928
4940{
4941public:
4945 void setAxis(int32_t axis) noexcept
4946 {
4947 mImpl->setAxis(axis);
4948 }
4949
4953 int32_t getAxis() const noexcept
4954 {
4955 return mImpl->getAxis();
4956 }
4957
4967 void setReverse(bool reverse) noexcept
4968 {
4969 mImpl->setReverse(reverse);
4970 }
4971
4977 bool getReverse() const noexcept
4978 {
4979 return mImpl->getReverse();
4980 }
4981
4982protected:
4983 virtual ~IIteratorLayer() noexcept = default;
4984 apiv::VIteratorLayer* mImpl;
4985};
4986
4997class ILoop : public INoCopy
4998{
4999public:
5006 IRecurrenceLayer* addRecurrence(ITensor& initialValue) noexcept
5007 {
5008 return mImpl->addRecurrence(initialValue);
5009 }
5010
5028 {
5029 return mImpl->addTripLimit(tensor, limit);
5030 }
5031
5040 IIteratorLayer* addIterator(ITensor& tensor, int32_t axis = 0, bool reverse = false) noexcept
5041 {
5042 return mImpl->addIterator(tensor, axis, reverse);
5043 }
5044
5053 ILoopOutputLayer* addLoopOutput(ITensor& tensor, LoopOutput outputKind, int32_t axis = 0) noexcept
5054 {
5055 return mImpl->addLoopOutput(tensor, outputKind, axis);
5056 }
5057
5068 void setName(char const* name) noexcept
5069 {
5070 mImpl->setName(name);
5071 }
5072
5078 char const* getName() const noexcept
5079 {
5080 return mImpl->getName();
5081 }
5082
5083protected:
5084 virtual ~ILoop() noexcept = default;
5085 apiv::VLoop* mImpl;
5086};
5087
//!
//! \class ISelectLayer
//!
//! \brief Elementwise select between two tensors based on a condition tensor;
//! configuration is entirely via the layer inputs, so no extra members.
//!
class ISelectLayer : public ILayer
{
protected:
    virtual ~ISelectLayer() noexcept = default;
    apiv::VSelectLayer* mImpl; //!< Opaque implementation.
};
5106
5123{
5124public:
5133 void setMessage(char const* message) noexcept
5134 {
5135 mImpl->setMessage(message);
5136 }
5137
5143 char const* getMessage() const noexcept
5144 {
5145 return mImpl->getMessage();
5146 }
5147
5148protected:
5149 virtual ~IAssertionLayer() noexcept = default;
5150
5151 apiv::VAssertionLayer* mImpl;
5152};
5153
//!
//! \enum FillOperation
//!
//! \brief Generation modes supported by IFillLayer.
//!
enum class FillOperation : int32_t
{
    //! Linearly-spaced values defined by a start and deltas.
    kLINSPACE = 0,

    //! Values drawn from a uniform random distribution.
    kRANDOM_UNIFORM = 1,

    //! Values drawn from a normal random distribution.
    kRANDOM_NORMAL = 2
};

//!
//! \brief Number of elements in FillOperation.
//!
template <>
constexpr inline int32_t EnumMax<FillOperation>() noexcept
{
    return 3;
}
5200
5236class IFillLayer : public ILayer
5237{
5238public:
5247 //
5248 void setDimensions(Dims const& dimensions) noexcept
5249 {
5250 mImpl->setDimensions(dimensions);
5251 }
5252
5263 Dims getDimensions() const noexcept
5264 {
5265 return mImpl->getDimensions();
5266 }
5267
5273 void setOperation(FillOperation op) noexcept
5274 {
5275 mImpl->setOperation(op);
5276 }
5277
5284 {
5285 return mImpl->getOperation();
5286 }
5287
5301 //
5302 void setAlpha(double alpha) noexcept
5303 {
5304 mImpl->setAlpha(alpha);
5305 }
5306
5317 double getAlpha() const noexcept
5318 {
5319 return mImpl->getAlpha();
5320 }
5321
5336 void setBeta(double beta) noexcept
5337 {
5338 mImpl->setBeta(beta);
5339 }
5340
5351 double getBeta() const noexcept
5352 {
5353 return mImpl->getBeta();
5354 }
5355
5396 using ILayer::setInput;
5397
5411 //
5412 void setAlphaInt64(int64_t alpha) noexcept
5413 {
5414 mImpl->setAlphaInt64(alpha);
5415 }
5416
5427 int64_t getAlphaInt64() const noexcept
5428 {
5429 return mImpl->getAlphaInt64();
5430 }
5431
5446 void setBetaInt64(int64_t beta) noexcept
5447 {
5448 mImpl->setBetaInt64(beta);
5449 }
5450
5461 int64_t getBetaInt64() const noexcept
5462 {
5463 return mImpl->getBetaInt64();
5464 }
5465
5469 bool isAlphaBetaInt64() const noexcept
5470 {
5471 return mImpl->isAlphaBetaInt64();
5472 }
5473
5487 void setToType(DataType toType) noexcept
5488 {
5489 mImpl->setToType(toType);
5490 }
5491
5499 DataType getToType() const noexcept
5500 {
5501 return mImpl->getToType();
5502 }
5503
5504protected:
5505 virtual ~IFillLayer() noexcept = default;
5506 apiv::VFillLayer* mImpl;
5507};
5508
5584{
5585public:
5594 int32_t getAxis() const noexcept
5595 {
5596 return mImpl->getAxis();
5597 }
5605 void setAxis(int32_t axis) noexcept
5606 {
5607 mImpl->setAxis(axis);
5608 }
5609
5618 bool setBlockShape(Dims const& blockShape) noexcept
5619 {
5620 return mImpl->setBlockShape(blockShape);
5621 }
5622
5630 {
5631 return mImpl->getBlockShape();
5632 }
5633
5645 void setToType(DataType toType) noexcept
5646 {
5647 mImpl->setToType(toType);
5648 }
5649
5657 DataType getToType() const noexcept
5658 {
5659 return mImpl->getToType();
5660 }
5661
5662protected:
5663 virtual ~IQuantizeLayer() noexcept = default;
5664 apiv::VQuantizeLayer* mImpl;
5665};
5666
5736{
5737public:
5746 int32_t getAxis() const noexcept
5747 {
5748 return mImpl->getAxis();
5749 }
5757 void setAxis(int32_t axis) noexcept
5758 {
5759 mImpl->setAxis(axis);
5760 }
5761
5774 bool setBlockShape(Dims const& blockShape) noexcept
5775 {
5776 return mImpl->setBlockShape(blockShape);
5777 }
5778
5786 {
5787 return mImpl->getBlockShape();
5788 }
5789
5801 void setToType(DataType toType) noexcept
5802 {
5803 mImpl->setToType(toType);
5804 }
5805
5813 DataType getToType() const noexcept
5814 {
5815 return mImpl->getToType();
5816 }
5817
5818protected:
5819 virtual ~IDequantizeLayer() noexcept = default;
5820 apiv::VDequantizeLayer* mImpl;
5821};
5822
5841{
5842public:
5854 using ILayer::setInput;
5855
5868 void setToType(DataType toType) noexcept
5869 {
5870 mImpl->setToType(toType);
5871 }
5872
5881 DataType getToType() const noexcept
5882 {
5883 return mImpl->getToType();
5884 }
5885
5894 void setScaleType(DataType scaleType) noexcept
5895 {
5896 mImpl->setScaleType(scaleType);
5897 }
5898
5907 DataType getScaleType() const noexcept
5908 {
5909 return mImpl->getScaleType();
5910 }
5911
5920 TRT_DEPRECATED void setAxis(int32_t axis) noexcept
5921 {
5922 mImpl->setAxis(axis);
5923 }
5924
5930 TRT_DEPRECATED int32_t getAxis() const noexcept
5931 {
5932 return mImpl->getAxis();
5933 }
5934
5943 TRT_DEPRECATED void setBlockSize(int32_t size) noexcept
5944 {
5945 mImpl->setBlockSize(size);
5946 }
5947
5953 TRT_DEPRECATED int32_t getBlockSize() const noexcept
5954 {
5955 return mImpl->getBlockSize();
5956 }
5957
5966 void setBlockShape(Dims const& blockShape) noexcept
5967 {
5968 mImpl->setBlockShape(blockShape);
5969 }
5970
5978 Dims getBlockShape() const noexcept
5979 {
5980 return mImpl->getBlockShape();
5981 }
5982
5983protected:
5984 virtual ~IDynamicQuantizeLayer() noexcept = default;
5985 apiv::VDynamicQuantizeLayer* mImpl;
5986};
5987
//!
//! \class IEinsumLayer
//!
//! \brief Implements an Einstein-summation contraction described by an equation string.
//!
class IEinsumLayer : public ILayer
{
public:
    //!
    //! \brief Set the einsum equation string.
    //!
    //! \return Forwarded from the implementation; presumably true on success
    //!         (e.g. a parseable equation) - confirm against the API reference.
    //!
    bool setEquation(char const* equation) noexcept
    {
        return mImpl->setEquation(equation);
    }

    //!
    //! \brief Get the einsum equation string.
    //!
    char const* getEquation() const noexcept
    {
        return mImpl->getEquation();
    }

protected:
    virtual ~IEinsumLayer() noexcept = default;
    apiv::VEinsumLayer* mImpl; //!< Opaque implementation.
};
6053
//!
//! \enum ScatterMode
//!
//! \brief Addressing modes for IScatterLayer.
//!
enum class ScatterMode : int32_t
{
    kELEMENT = 0, //!< Scatter individual elements along an axis.
    kND = 1,      //!< Scatter slices addressed by multi-dimensional indices.
};

//!
//! \brief Number of elements in ScatterMode.
//!
template <>
constexpr inline int32_t EnumMax<ScatterMode>() noexcept
{
    return 2;
}
6077
//!
//! \class IScatterLayer
//!
//! \brief Writes updates into a copy of the data tensor at positions given by indices.
//!
class IScatterLayer : public ILayer
{
public:
    //!
    //! \brief Set the scatter mode (element or ND).
    //!
    void setMode(ScatterMode mode) noexcept
    {
        mImpl->setMode(mode);
    }

    //!
    //! \brief Get the scatter mode.
    //!
    ScatterMode getMode() const noexcept
    {
        return mImpl->getMode();
    }

    //!
    //! \brief Set the axis used by kELEMENT mode.
    //!
    void setAxis(int32_t axis) noexcept
    {
        mImpl->setAxis(axis);
    }

    //!
    //! \brief Get the axis used by kELEMENT mode.
    //!
    int32_t getAxis() const noexcept
    {
        return mImpl->getAxis();
    }

protected:
    apiv::VScatterLayer* mImpl; //!< Opaque implementation.
    virtual ~IScatterLayer() noexcept = default;
}; // class IScatterLayer
6180
//!
//! \class IOneHotLayer
//!
//! \brief Produces a one-hot encoding of its indices input along a chosen axis.
//!
class IOneHotLayer : public ILayer
{
public:
    //!
    //! \brief Set the axis along which the one-hot dimension is inserted.
    //!
    void setAxis(int32_t axis) noexcept
    {
        mImpl->setAxis(axis);
    }

    //!
    //! \brief Get the one-hot axis.
    //!
    int32_t getAxis() const noexcept
    {
        return mImpl->getAxis();
    }

protected:
    apiv::VOneHotLayer* mImpl; //!< Opaque implementation.
    virtual ~IOneHotLayer() noexcept = default;
};
6232
6245{
6246public:
6253 {
6254 mImpl->setInterpolationMode(mode);
6255 }
6256
6265 {
6266 return mImpl->getInterpolationMode();
6267 }
6268
6274 void setAlignCorners(bool alignCorners) noexcept
6275 {
6276 mImpl->setAlignCorners(alignCorners);
6277 }
6278
6286 bool getAlignCorners() const noexcept
6287 {
6288 return mImpl->getAlignCorners();
6289 }
6290
6298 bool setSampleMode(SampleMode mode) noexcept
6299 {
6300 return mImpl->setSampleMode(mode);
6301 }
6302
6310 SampleMode getSampleMode() const noexcept
6311 {
6312 return mImpl->getSampleMode();
6313 }
6314
6315protected:
6316 apiv::VGridSampleLayer* mImpl;
6317 virtual ~IGridSampleLayer() noexcept = default;
6318}; // class IGridSampleLayer
6319
//!
//! \enum BoundingBoxFormat
//!
//! \brief Box-coordinate layouts accepted by INMSLayer.
//!
enum class BoundingBoxFormat : int32_t
{
    //! Boxes given as pairs of opposite corners.
    kCORNER_PAIRS = 0,
    //! Boxes given as center coordinates plus sizes.
    kCENTER_SIZES = 1
};

//!
//! \brief Number of elements in BoundingBoxFormat.
//!
template <>
constexpr inline int32_t EnumMax<BoundingBoxFormat>() noexcept
{
    return 2;
}
6345
6396class INMSLayer : public ILayer
6397{
6398public:
6409 {
6410 mImpl->setBoundingBoxFormat(fmt);
6411 }
6412
6421 {
6422 return mImpl->getBoundingBoxFormat();
6423 }
6424
6434 void setTopKBoxLimit(int32_t limit) noexcept
6435 {
6436 mImpl->setTopKBoxLimit(limit);
6437 }
6438
6444 int32_t getTopKBoxLimit() const noexcept
6445 {
6446 return mImpl->getTopKBoxLimit();
6447 }
6448
6467 using ILayer::setInput;
6468
6479 bool setIndicesType(DataType type) noexcept
6480 {
6481 return mImpl->setIndicesType(type);
6482 }
6483
6491 DataType getIndicesType() const noexcept
6492 {
6493 return mImpl->getIndicesType();
6494 }
6495
6496protected:
6497 apiv::VNMSLayer* mImpl;
6498 virtual ~INMSLayer() noexcept = default;
6499}; // class INMSLayer
6500
6514{
6515public:
6524 void setBatchAxis(int32_t batchAxis) noexcept
6525 {
6526 mImpl->setBatchAxis(batchAxis);
6527 }
6528
6534 int32_t getBatchAxis() const noexcept
6535 {
6536 return mImpl->getBatchAxis();
6537 }
6538
6547 void setSequenceAxis(int32_t sequenceAxis) noexcept
6548 {
6549 mImpl->setSequenceAxis(sequenceAxis);
6550 }
6551
6557 int32_t getSequenceAxis() const noexcept
6558 {
6559 return mImpl->getSequenceAxis();
6560 }
6561
6562protected:
6563 apiv::VReverseSequenceLayer* mImpl;
6564 virtual ~IReverseSequenceLayer() noexcept = default;
6565}; // class IReverseSequenceLayer
6566
6586{
6587public:
6595 void setEpsilon(float eps) noexcept
6596 {
6597 return mImpl->setEpsilon(eps);
6598 }
6599
6605 float getEpsilon() const noexcept
6606 {
6607 return mImpl->getEpsilon();
6608 }
6609
6615 void setAxes(uint32_t axesMask) noexcept
6616 {
6617 return mImpl->setAxes(axesMask);
6618 }
6619
6625 uint32_t getAxes() const noexcept
6626 {
6627 return mImpl->getAxes();
6628 }
6629
6646 void setNbGroups(int64_t nbGroups) noexcept
6647 {
6648 return mImpl->setNbGroups(nbGroups);
6649 }
6650
6656 int64_t getNbGroups() const noexcept
6657 {
6658 return mImpl->getNbGroups();
6659 }
6660
6685 {
6686 return mImpl->setComputePrecision(type);
6687 }
6688
6697 {
6698 return mImpl->getComputePrecision();
6699 }
6700
6706 TRT_NODISCARD bool isV2() const noexcept
6707 {
6708 return mImpl->isV2();
6709 }
6710
6711protected:
6712 apiv::VNormalizationLayer* mImpl;
6713 virtual ~INormalizationLayer() noexcept = default;
6714};
6715
6716
//!
//! \class ISqueezeLayer
//!
//! \brief Removes size-1 dimensions given by an axes tensor; configured via inputs only.
//!
class ISqueezeLayer : public ILayer
{
public:
    //! Use setInput to supply/replace the data and axes tensors.
    using ILayer::setInput;

protected:
    apiv::VSqueezeLayer* mImpl; //!< Opaque implementation.
    virtual ~ISqueezeLayer() noexcept = default;
};
6746
6756{
6757public:
6771 using ILayer::setInput;
6772
6773protected:
6774 apiv::VUnsqueezeLayer* mImpl;
6775 virtual ~IUnsqueezeLayer() noexcept = default;
6776};
6777
6789enum class CumulativeOperation : int32_t
6790{
6791 kSUM = 0,
6792};
6793
6794namespace impl
6795{
6796
6802template <>
6804{
6805 static constexpr int32_t kVALUE = 1;
6806};
6807
6808} // namespace impl
6809
6838{
6839public:
6850 {
6851 return mImpl->setOperation(op);
6852 }
6853
6862 {
6863 return mImpl->getOperation();
6864 }
6865
6873 void setExclusive(bool exclusive) noexcept
6874 {
6875 mImpl->setExclusive(exclusive);
6876 }
6877
6885 bool getExclusive() const noexcept
6886 {
6887 return mImpl->getExclusive();
6888 }
6889
6897 void setReverse(bool reverse) noexcept
6898 {
6899 mImpl->setReverse(reverse);
6900 }
6901
6909 bool getReverse() const noexcept
6910 {
6911 return mImpl->getReverse();
6912 }
6913
6914protected:
6915 apiv::VCumulativeLayer* mImpl;
6916 virtual ~ICumulativeLayer() noexcept = default;
6917};
6918
6924enum class AttentionNormalizationOp : int32_t
6925{
6926 kNONE
6927 = 0,
6928 kSOFTMAX = 1,
6929};
6930
6931namespace impl
6932{
6938template <>
6940{
6941 static constexpr int32_t kVALUE = 2;
6942};
6943
6944} // namespace impl
6945
6956{
6957public:
6961 IAttention* getAttention() const noexcept
6962 {
6963 return mBoundary->getAttention();
6964 }
6965
6966protected:
6967 virtual ~IAttentionBoundaryLayer() noexcept = default;
6968 apiv::VAttentionBoundaryLayer* mBoundary;
6969};
6970
6982{
6983public:
6999 using ILayer::setInput;
7000
7001protected:
7002 virtual ~IAttentionInputLayer() noexcept = default;
7003 apiv::VAttentionInputLayer* mImpl;
7004};
7005
7017{
7018public:
7019protected:
7020 virtual ~IAttentionOutputLayer() noexcept = default;
7021 apiv::VAttentionOutputLayer* mImpl;
7022};
7023
7073class IAttention : public INoCopy
7074{
7075public:
7084 {
7085 return mImpl->setNormalizationOperation(op);
7086 }
7087
7096 {
7097 return mImpl->getNormalizationOperation();
7098 }
7099
7112 bool setMask(ITensor& mask) noexcept
7113 {
7114 return mImpl->setMask(mask);
7115 }
7116
7124 ITensor* getMask() noexcept
7125 {
7126 return mImpl->getMask();
7127 }
7128
7137 bool setCausal(bool isCausal) noexcept
7138 {
7139 return mImpl->setCausal(isCausal);
7140 }
7141
7149 bool getCausal() const noexcept
7150 {
7151 return mImpl->getCausal();
7152 }
7153
7161 bool setDecomposable(bool decomposable) noexcept
7162 {
7163 return mImpl->setDecomposable(decomposable);
7164 }
7165
7174 bool getDecomposable() const noexcept
7175 {
7176 return mImpl->getDecomposable();
7177 }
7178
7193 bool setInput(int32_t index, ITensor& input) noexcept
7194 {
7195 return mImpl->setInput(index, input);
7196 }
7197
7202 int32_t getNbInputs() const noexcept
7203 {
7204 return mImpl->getNbInputs();
7205 }
7206
7214 ITensor* getInput(int32_t index) const noexcept
7215 {
7216 return mImpl->getInput(index);
7217 }
7218
7222 int32_t getNbOutputs() const noexcept
7223 {
7224 return mImpl->getNbOutputs();
7225 }
7226
7234 ITensor* getOutput(int32_t index) const noexcept
7235 {
7236 return mImpl->getOutput(index);
7237 }
7238
7251 bool setName(char const* name) noexcept
7252 {
7253 return mImpl->setName(name);
7254 }
7255
7263 char const* getName() const noexcept
7264 {
7265 return mImpl->getName();
7266 }
7267
7280 {
7281 return mImpl->setNormalizationQuantizeScale(tensor);
7282 }
7283
7291 {
7292 return mImpl->getNormalizationQuantizeScale();
7293 }
7294
7304 {
7305 return mImpl->setNormalizationQuantizeToType(type);
7306 }
7307
7316 {
7317 return mImpl->getNormalizationQuantizeToType();
7318 }
7319
7335 bool setMetadata(char const* metadata) noexcept
7336 {
7337 return mImpl->setMetadata(metadata);
7338 }
7339
7348 char const* getMetadata() const noexcept
7349 {
7350 return mImpl->getMetadata();
7351 }
7352
7364 bool setNbRanks(int32_t nbRanks) noexcept
7365 {
7366 return mImpl->setNbRanks(nbRanks);
7367 }
7368
7376 int32_t getNbRanks() const noexcept
7377 {
7378 return mImpl->getNbRanks();
7379 }
7380
7381protected:
7382 apiv::VAttention* mImpl;
7383 virtual ~IAttention() noexcept = default;
7384};
7385
7393{
7394public:
7400 void setInterleaved(bool interleaved) noexcept
7401 {
7402 mImpl->setInterleaved(interleaved);
7403 }
7404
7405
7411 TRT_NODISCARD bool getInterleaved() const noexcept
7412 {
7413 return mImpl->getInterleaved();
7414 }
7415
7416
7422 TRT_NODISCARD bool setRotaryEmbeddingDim(int32_t rotaryEmbeddingDim) noexcept
7423 {
7424 return mImpl->setRotaryEmbeddingDim(rotaryEmbeddingDim);
7425 }
7426
7427
7433 TRT_NODISCARD int32_t getRotaryEmbeddingDim() const noexcept
7434 {
7435 return mImpl->getRotaryEmbeddingDim();
7436 }
7437
7438
7452 using ILayer::setInput;
7453
7454
7455protected:
7456 apiv::VRotaryEmbeddingLayer* mImpl;
7457 virtual ~IRotaryEmbeddingLayer() noexcept = default;
7458};
7459
7465enum class KVCacheMode : int32_t
7466{
7467 kLINEAR = 0,
7468};
7469
7470namespace impl
7471{
7477template <>
7479{
7480 static constexpr int32_t kVALUE = 1;
7481};
7482
7483} // namespace impl
7484
7505{
7506public:
7519 using ILayer::setInput;
7520
7528 bool setCacheMode(KVCacheMode cacheMode) noexcept
7529 {
7530 return mImpl->setCacheMode(cacheMode);
7531 }
7532
7538 KVCacheMode getCacheMode() const noexcept
7539 {
7540 return mImpl->getCacheMode();
7541 }
7542
7543protected:
7544 apiv::VKVCacheUpdateLayer* mImpl;
7545 virtual ~IKVCacheUpdateLayer() noexcept = default;
7546};
7547
7553enum class MoEActType : int32_t
7554{
7555 kNONE = 0,
7556 kSILU = 1,
7557};
7558
7559namespace impl
7560{
7561
7567template <>
7569{
7570 static constexpr int32_t kVALUE = 2;
7571};
7572
7573} // namespace impl
7574
7686class IMoELayer : public ILayer
7687{
7688public:
7700 void setGatedWeights(ITensor& fcGateWeights, ITensor& fcUpWeights, ITensor& fcDownWeights, MoEActType activationType) noexcept
7701 {
7702 mImpl->setGatedWeights(fcGateWeights, fcUpWeights, fcDownWeights, activationType);
7703 }
7704
7712 void setGatedBiases(ITensor& fcGateBiases, ITensor& fcUpBiases, ITensor& fcDownBiases) noexcept
7713 {
7714 mImpl->setGatedBiases(fcGateBiases, fcUpBiases, fcDownBiases);
7715 }
7716
7724 void setActivationType(MoEActType activationType) noexcept
7725 {
7726 mImpl->setActivationType(activationType);
7727 }
7728
7737 {
7738 return mImpl->getActivationType();
7739 }
7740
7759 void setQuantizationStatic(ITensor& fcDownActivationScale, DataType dataType) noexcept
7760 {
7761 mImpl->setQuantizationStatic(fcDownActivationScale, dataType);
7762 }
7763
7788 void setQuantizationDynamicDblQ(ITensor& fcDownActivationDblQScale, DataType dataType, Dims const& blockShape, DataType dynQOutputScaleType) noexcept
7789 {
7790 mImpl->setQuantizationDynamicDblQ(fcDownActivationDblQScale, dataType, blockShape, dynQOutputScaleType);
7791 }
7792
7804 {
7805 mImpl->setQuantizationToType(type);
7806 }
7807
7816 {
7817 return mImpl->getQuantizationToType();
7818 }
7819
7831 void setQuantizationBlockShape(Dims const& blockShape) noexcept
7832 {
7833 mImpl->setQuantizationBlockShape(blockShape);
7834 }
7835
7844 {
7845 return mImpl->getQuantizationBlockShape();
7846 }
7847
7856 {
7857 mImpl->setDynQOutputScaleType(type);
7858 }
7859
7868 {
7869 return mImpl->getDynQOutputScaleType();
7870 }
7871
7888 void setSwigluParams(float limit, float alpha, float beta) noexcept
7889 {
7890 mImpl->setSwigluParams(limit, alpha, beta);
7891 }
7892
7902 void setSwigluParamLimit(float limit) noexcept
7903 {
7904 mImpl->setSwigluParamLimit(limit);
7905 }
7906
7914 float getSwigluParamLimit() const noexcept
7915 {
7916 return mImpl->getSwigluParamLimit();
7917 }
7918
7928 void setSwigluParamAlpha(float alpha) noexcept
7929 {
7930 mImpl->setSwigluParamAlpha(alpha);
7931 }
7932
7940 float getSwigluParamAlpha() const noexcept
7941 {
7942 return mImpl->getSwigluParamAlpha();
7943 }
7944
7954 void setSwigluParamBeta(float beta) noexcept
7955 {
7956 mImpl->setSwigluParamBeta(beta);
7957 }
7958
7966 float getSwigluParamBeta() const noexcept
7967 {
7968 return mImpl->getSwigluParamBeta();
7969 }
7970
7983 void setInput(int32_t index, ITensor& tensor) noexcept
7984 {
7985 mImpl->setInput(index, tensor);
7986 }
7987
7988 using ILayer::setInput;
7989
7990protected:
7991 virtual ~IMoELayer() noexcept = default;
7992 apiv::VMoELayer* mImpl;
7993};
7994
8003{
8004protected:
8005 virtual ~IDistCollectiveLayer() noexcept = default;
8006 apiv::VDistCollectiveLayer* mImpl;
8007}; // class IDistCollectiveLayer
8008
8027{
8028public:
8029 virtual ~INetworkDefinition() noexcept = default;
8030
8066 ITensor* addInput(char const* name, DataType type, Dims const& dimensions) noexcept
8067 {
8068 return mImpl->addInput(name, type, dimensions);
8069 }
8070
8080 void markOutput(ITensor& tensor) noexcept
8081 {
8082 mImpl->markOutput(tensor);
8083 }
8084
8098 bool markDebug(ITensor& tensor) noexcept
8099 {
8100 return mImpl->markDebug(tensor);
8101 }
8102
8114 bool unmarkDebug(ITensor& tensor) noexcept
8115 {
8116 return mImpl->unmarkDebug(tensor);
8117 }
8118
8124 bool isDebugTensor(ITensor const& tensor) const noexcept
8125 {
8126 return mImpl->isDebugTensor(tensor);
8127 }
8128
8147 {
8148 return mImpl->markUnfusedTensorsAsDebugTensors();
8149 }
8150
8161 {
8162 return mImpl->unmarkUnfusedTensorsAsDebugTensors();
8163 }
8164
8181 {
8182 return mImpl->addActivation(input, type);
8183 }
8184
8199 ILRNLayer* addLRN(ITensor& input, int64_t window, float alpha, float beta, float k) noexcept
8200 {
8201 return mImpl->addLRN(input, window, alpha, beta, k);
8202 }
8203
8225 IScaleLayer* addScale(ITensor& input, ScaleMode mode, Weights shift, Weights scale, Weights power) noexcept
8226 {
8227 return mImpl->addScale(input, mode, shift, scale, power);
8228 }
8229
8239 {
8240 return mImpl->addSoftMax(input);
8241 }
8242
8255 IConcatenationLayer* addConcatenation(ITensor* const* inputs, int32_t nbInputs) noexcept
8256 {
8257 return mImpl->addConcatenation(inputs, nbInputs);
8258 }
8259
8283 {
8284 return mImpl->addElementWise(input1, input2, op);
8285 }
8286
8304 IUnaryLayer* addUnary(ITensor& input, UnaryOperation operation) noexcept
8305 {
8306 return mImpl->addUnary(input, operation);
8307 }
8308
8319 {
8320 return mImpl->addShuffle(input);
8321 }
8322
8335 IOneHotLayer* addOneHot(ITensor& indices, ITensor& values, ITensor& depth, int32_t axis) noexcept
8336 {
8337 return mImpl->addOneHot(indices, values, depth, axis);
8338 }
8339
8347 int32_t getNbLayers() const noexcept
8348 {
8349 return mImpl->getNbLayers();
8350 }
8351
8361 ILayer* getLayer(int32_t index) const noexcept
8362 {
8363 return mImpl->getLayer(index);
8364 }
8365
8373 int32_t getNbInputs() const noexcept
8374 {
8375 return mImpl->getNbInputs();
8376 }
8377
8389 ITensor* getInput(int32_t index) const noexcept
8390 {
8391 return mImpl->getInput(index);
8392 }
8393
8403 int32_t getNbOutputs() const noexcept
8404 {
8405 return mImpl->getNbOutputs();
8406 }
8407
8419 ITensor* getOutput(int32_t index) const noexcept
8420 {
8421 return mImpl->getOutput(index);
8422 }
8423
8446 ITensor& input, ReduceOperation operation, uint32_t reduceAxes, bool keepDimensions) noexcept
8447 {
8448 return mImpl->addReduce(input, operation, reduceAxes, keepDimensions);
8449 }
8450
8481 TRT_DEPRECATED ITopKLayer* addTopK(ITensor& input, TopKOperation op, int32_t k, uint32_t reduceAxes) noexcept
8482 {
8483 return mImpl->addTopK(input, op, k, reduceAxes);
8484 }
8485
8514 ITopKLayer* addTopK(ITensor& input, TopKOperation op, int32_t k, uint32_t reduceAxes, DataType indicesType) noexcept
8515 {
8516 return mImpl->addTopKV2(input, op, k, reduceAxes, indicesType);
8517 }
8518
8530 IGatherLayer* addGather(ITensor& data, ITensor& indices, int32_t axis) noexcept
8531 {
8532 return mImpl->addGather(data, indices, axis);
8533 }
8534
8546 IGatherLayer* addGatherV2(ITensor& data, ITensor& indices, GatherMode mode) noexcept
8547 {
8548 return mImpl->addGatherV2(data, indices, mode);
8549 }
8550
8566 {
8567 return mImpl->addRaggedSoftMax(input, bounds);
8568 }
8569
8587 ITensor& input0, MatrixOperation op0, ITensor& input1, MatrixOperation op1) noexcept
8588 {
8589 return mImpl->addMatrixMultiply(input0, op0, input1, op1);
8590 }
8591
8606 {
8607 return mImpl->addNonZero(input);
8608 }
8609
8621 INonZeroLayer* addNonZero(ITensor& input, DataType indicesType) noexcept
8622 {
8623 return mImpl->addNonZeroV2(input, indicesType);
8624 }
8625
8645 IConstantLayer* addConstant(Dims const& dimensions, Weights weights) noexcept
8646 {
8647 return mImpl->addConstant(dimensions, weights);
8648 }
8649
8660 {
8661 return mImpl->addIdentity(input);
8662 }
8663
8674 ICastLayer* addCast(ITensor& input, DataType toType) noexcept
8675 {
8676 return mImpl->addCast(input, toType);
8677 }
8678
8689 void removeTensor(ITensor& tensor) noexcept
8690 {
8691 mImpl->removeTensor(tensor);
8692 }
8693
8701 void unmarkOutput(ITensor& tensor) noexcept
8702 {
8703 mImpl->unmarkOutput(tensor);
8704 }
8705
8722 TRT_DEPRECATED IPluginV2Layer* addPluginV2(ITensor* const* inputs, int32_t nbInputs, IPluginV2& plugin) noexcept
8723 {
8724 return mImpl->addPluginV2(inputs, nbInputs, plugin);
8725 }
8726
8740 IPluginV3Layer* addPluginV3(ITensor* const* inputs, int32_t nbInputs, ITensor* const* shapeInputs,
8741 int32_t nbShapeInputs, IPluginV3& plugin) noexcept
8742 {
8743 return mImpl->addPluginV3(inputs, nbInputs, shapeInputs, nbShapeInputs, plugin);
8744 }
8745
8760 ISliceLayer* addSlice(ITensor& input, Dims const& start, Dims const& size, Dims const& stride) noexcept
8761 {
8762 return mImpl->addSlice(input, start, size, stride);
8763 }
8764
8784 void setName(char const* name) noexcept
8785 {
8786 mImpl->setName(name);
8787 }
8788
8798 char const* getName() const noexcept
8799 {
8800 return mImpl->getName();
8801 }
8802
8814 IShapeLayer* addShape(ITensor& input) noexcept
8815 {
8816 return mImpl->addShape(input);
8817 }
8818
8829 {
8830 return mImpl->hasImplicitBatchDimension();
8831 }
8832
8839 {
8840 return mImpl->getFlags();
8841 }
8842
8850 bool getFlag(NetworkDefinitionCreationFlag networkDefinitionCreationFlag) const noexcept
8851 {
8852 return mImpl->getFlag(networkDefinitionCreationFlag);
8853 }
8854
8867 bool markOutputForShapes(ITensor& tensor) noexcept
8868 {
8869 return mImpl->markOutputForShapes(tensor);
8870 }
8871
8879 bool unmarkOutputForShapes(ITensor& tensor) noexcept
8880 {
8881 return mImpl->unmarkOutputForShapes(tensor);
8882 }
8883
8898 {
8899 return mImpl->addParametricReLU(input, slope);
8900 }
8901
8920 ITensor& input, int64_t nbOutputMaps, Dims const& kernelSize, Weights kernelWeights, Weights biasWeights) noexcept
8921 {
8922 return mImpl->addConvolutionNd(input, nbOutputMaps, kernelSize, kernelWeights, biasWeights);
8923 }
8924
8939 IPoolingLayer* addPoolingNd(ITensor& input, PoolingType type, Dims const& windowSize) noexcept
8940 {
8941 return mImpl->addPoolingNd(input, type, windowSize);
8942 }
8943
8958 //
8962 ITensor& input, int64_t nbOutputMaps, Dims kernelSize, Weights kernelWeights, Weights biasWeights) noexcept
8963 {
8964 return mImpl->addDeconvolutionNd(input, nbOutputMaps, kernelSize, kernelWeights, biasWeights);
8965 }
8966
8999 ITensor& input, ScaleMode mode, Weights shift, Weights scale, Weights power, int32_t channelAxis) noexcept
9000 {
9001 return mImpl->addScaleNd(input, mode, shift, scale, power, channelAxis);
9002 }
9003
9016 {
9017 return mImpl->addResize(input);
9018 }
9019
9029 ILoop* addLoop() noexcept
9030 {
9031 return mImpl->addLoop();
9032 }
9033
9045 {
9046 return mImpl->addIfConditional();
9047 }
9048
9083 ISelectLayer* addSelect(ITensor& condition, ITensor& thenInput, ITensor& elseInput) noexcept
9084 {
9085 return mImpl->addSelect(condition, thenInput, elseInput);
9086 }
9087
9100 IAssertionLayer* addAssertion(ITensor& condition, char const* message) noexcept
9101 {
9102 return mImpl->addAssertion(condition, message);
9103 }
9104
9125 TRT_DEPRECATED IFillLayer* addFill(Dims const& dimensions, FillOperation op) noexcept
9126 {
9127 return mImpl->addFill(dimensions, op);
9128 }
9129
9151 IFillLayer* addFill(Dims const& dimensions, FillOperation op, DataType outputType) noexcept
9152 {
9153 return mImpl->addFillV2(dimensions, op, outputType);
9154 }
9155
9167 IPaddingLayer* addPaddingNd(ITensor& input, Dims const& prePadding, Dims const& postPadding) noexcept
9168 {
9169 return mImpl->addPaddingNd(input, prePadding, postPadding);
9170 }
9171
9191 bool setWeightsName(Weights weights, char const* name) noexcept
9192 {
9193 return mImpl->setWeightsName(weights, name);
9194 }
9195
9207 //
9210 void setErrorRecorder(IErrorRecorder* recorder) noexcept
9211 {
9212 mImpl->setErrorRecorder(recorder);
9213 }
9214
9226 {
9227 return mImpl->getErrorRecorder();
9228 }
9229
9247 {
9248 return mImpl->addDequantize(input, scale);
9249 }
9250
9269 IDequantizeLayer* addDequantize(ITensor& input, ITensor& scale, DataType outputType) noexcept
9270 {
9271 return mImpl->addDequantizeV2(input, scale, outputType);
9272 }
9273
9289 IScatterLayer* addScatter(ITensor& data, ITensor& indices, ITensor& updates, ScatterMode mode) noexcept
9290 {
9291 return mImpl->addScatter(data, indices, updates, mode);
9292 }
9293
9311 {
9312 return mImpl->addQuantize(input, scale);
9313 }
9314
9334 IQuantizeLayer* addQuantize(ITensor& input, ITensor& scale, DataType outputType) noexcept
9335 {
9336 return mImpl->addQuantizeV2(input, scale, outputType);
9337 }
9338
9362 ITensor& input, int32_t axis, int32_t blockSize, DataType outputType, DataType scaleType) noexcept
9363 {
9364 return mImpl->addDynamicQuantize(input, axis, blockSize, outputType, scaleType);
9365 }
9366
9386 ITensor& input, Dims const& blockShape, DataType outputType, DataType scaleType) noexcept
9387 {
9388 return mImpl->addDynamicQuantizeV2(input, blockShape, outputType, scaleType);
9389 }
9390
9401 IEinsumLayer* addEinsum(ITensor* const* inputs, int32_t nbInputs, char const* equation) noexcept
9402 {
9403 return mImpl->addEinsum(inputs, nbInputs, equation);
9404 }
9405
9420 {
9421 return mImpl->addGridSample(input, grid);
9422 }
9423
9441 TRT_DEPRECATED INMSLayer* addNMS(ITensor& boxes, ITensor& scores, ITensor& maxOutputBoxesPerClass) noexcept
9442 {
9443 return mImpl->addNMS(boxes, scores, maxOutputBoxesPerClass);
9444 }
9445
9461 INMSLayer* addNMS(ITensor& boxes, ITensor& scores, ITensor& maxOutputBoxesPerClass, DataType indicesType) noexcept
9462 {
9463 return mImpl->addNMSV2(boxes, scores, maxOutputBoxesPerClass, indicesType);
9464 }
9465
9479 {
9480 return mImpl->addReverseSequence(input, sequenceLens);
9481 }
9482
9510 TRT_DEPRECATED INormalizationLayer* addNormalization(ITensor& input, ITensor& scale, ITensor& bias, uint32_t axesMask) noexcept
9511 {
9512 return mImpl->addNormalization(input, scale, bias, axesMask);
9513 }
9514
9532 ICumulativeLayer* addCumulative(ITensor& input, ITensor& axis, CumulativeOperation operation, bool exclusive, bool reverse) noexcept
9533 {
9534 return mImpl->addCumulative(input, axis, operation, exclusive, reverse);
9535 }
9536
9560 ITensor& query, ITensor& key, ITensor& value, AttentionNormalizationOp normOp, bool causal) noexcept
9561 {
9562 return mImpl->addAttention(query, key, value, normOp, causal);
9563 }
9564
9584 IRotaryEmbeddingLayer* addRotaryEmbedding(ITensor& input, ITensor& cosCache, ITensor& sinCache, bool interleaved, int32_t rotaryEmbeddingDim) noexcept
9585 {
9586 return mImpl->addRotaryEmbedding(input, cosCache, sinCache, interleaved, rotaryEmbeddingDim);
9587 }
9588
9619 ITensor& cache, ITensor& update, ITensor& writeIndices, KVCacheMode cacheMode) noexcept
9620 {
9621 return mImpl->addKVCacheUpdate(cache, update, writeIndices, cacheMode);
9622 }
9623
9638 IMoELayer* addMoE(ITensor& hiddenStates, ITensor& selectedExpertsForTokens, ITensor& scoresForSelectedExperts) noexcept
9639 {
9640 return mImpl->addMoE(hiddenStates, selectedExpertsForTokens, scoresForSelectedExperts);
9641 }
9642
9667 ReduceOperation reduceOp, int64_t root, int64_t* groups, int64_t groupSize) noexcept
9668 {
9669 return mImpl->addDistCollective(input, distCollectiveOp, reduceOp, root, groups, groupSize);
9670 }
9671
9678 virtual IBuilder& getBuilder() const noexcept
9679 {
9680 return mImpl->getBuilder();
9681 }
9682
9691 bool markWeightsRefittable(char const* name) noexcept
9692 {
9693 return mImpl->markWeightsRefittable(name);
9694 }
9695
9703 bool unmarkWeightsRefittable(char const* name) noexcept
9704 {
9705 return mImpl->unmarkWeightsRefittable(name);
9706 }
9707
9716 bool areWeightsMarkedRefittable(char const* name) const noexcept
9717 {
9718 return mImpl->areWeightsMarkedRefittable(name);
9719 }
9720
9735 ISqueezeLayer* addSqueeze(ITensor& input, ITensor& axes) noexcept
9736 {
9737 return mImpl->addSqueeze(input, axes);
9738 }
9739
9757 {
9758 return mImpl->addUnsqueeze(input, axes);
9759 }
9760
9782 TRT_NODISCARD INormalizationLayer* addNormalizationV2(ITensor& input, ITensor& scale, ITensor& bias, uint32_t axesMask) noexcept
9783 {
9784 return mImpl->addNormalizationV2(input, scale, bias, axesMask);
9785 }
9786
9787protected:
9788 apiv::VNetworkDefinition* mImpl;
9789};
9790
9798enum class CalibrationAlgoType : int32_t
9799{
9804};
9805
9811template <>
9812constexpr inline int32_t EnumMax<CalibrationAlgoType>() noexcept
9813{
9814 return 4;
9815}
9816
9831{
9832public:
9840 TRT_DEPRECATED virtual int32_t getBatchSize() const noexcept = 0;
9841
9856 virtual bool getBatch(void* bindings[], char const* names[], int32_t nbBindings) noexcept = 0;
9857
9872 virtual void const* readCalibrationCache(std::size_t& length) noexcept = 0;
9873
9882 virtual void writeCalibrationCache(void const* ptr, std::size_t length) noexcept = 0;
9883
9889 virtual CalibrationAlgoType getAlgorithm() noexcept = 0;
9890
9891 ~IInt8Calibrator() noexcept override = default;
9892};
9893
9894namespace v_1_0
9895{
9897{
9898public:
9902 InterfaceInfo getInterfaceInfo() const noexcept override
9903 {
9904 return InterfaceInfo{"IInt8EntropyCalibrator", 1, 0};
9905 }
9906
9911 {
9913 }
9914
9915 ~IInt8EntropyCalibrator() noexcept override = default;
9916};
9917} // namespace v_1_0
9918
9933
9934namespace v_1_0
9935{
9937{
9938public:
9942 InterfaceInfo getInterfaceInfo() const noexcept override
9943 {
9944 return InterfaceInfo{"IInt8EntropyCalibrator2", 1, 0};
9945 }
9946
9951 {
9953 }
9954
9955 ~IInt8EntropyCalibrator2() noexcept override = default;
9956};
9957} // namespace v_1_0
9958
9973
9974namespace v_1_0
9975{
9977{
9978public:
9982 InterfaceInfo getInterfaceInfo() const noexcept override
9983 {
9984 return InterfaceInfo{"IInt8MinMaxCalibrator", 1, 0};
9985 }
9986
9991 {
9993 }
9994
9995 ~IInt8MinMaxCalibrator() noexcept override = default;
9996};
9997} // namespace v_1_0
9998
10012
10013namespace v_1_0
10014{
10016{
10017public:
10021 InterfaceInfo getInterfaceInfo() const noexcept override
10022 {
10023 return InterfaceInfo{"IInt8Calibrator", 1, 0};
10024 }
10025
10030 {
10032 }
10033
10040 virtual double getQuantile() const noexcept = 0;
10041
10048 virtual double getRegressionCutoff() const noexcept = 0;
10049
10062 virtual void const* readHistogramCache(std::size_t& length) noexcept = 0;
10063
10072 virtual void writeHistogramCache(void const* ptr, std::size_t length) noexcept = 0;
10073
10074 ~IInt8LegacyCalibrator() noexcept override = default;
10075};
10076} // namespace v_1_0
10077
10092
10106{
10107public:
10113 DataType getDataType() const noexcept
10114 {
10115 return mImpl->getDataType();
10116 }
10117
10124 Dims getStrides() const noexcept
10125 {
10126 return mImpl->getStrides();
10127 }
10128
10134 int64_t getVectorizedDim() const noexcept
10135 {
10136 return mImpl->getVectorizedDim();
10137 }
10138
10145 int64_t getComponentsPerElement() const noexcept
10146 {
10147 return mImpl->getComponentsPerElement();
10148 }
10149
10150protected:
10151 virtual ~IAlgorithmIOInfo() noexcept = default;
10152 apiv::VAlgorithmIOInfo* mImpl;
10153};
10154
10169{
10170public:
10174 int64_t getImplementation() const noexcept
10175 {
10176 return mImpl->getImplementation();
10177 }
10178
10182 int64_t getTactic() const noexcept
10183 {
10184 return mImpl->getTactic();
10185 }
10186
10187protected:
10188 virtual ~IAlgorithmVariant() noexcept = default;
10189 apiv::VAlgorithmVariant* mImpl;
10190};
10191
10203{
10204public:
10210 char const* getName() const noexcept
10211 {
10212 return mImpl->getName();
10213 }
10214
10222 Dims getDimensions(int32_t index, OptProfileSelector select) const noexcept
10223 {
10224 return mImpl->getDimensions(index, select);
10225 }
10226
10230 int32_t getNbInputs() const noexcept
10231 {
10232 return mImpl->getNbInputs();
10233 }
10234
10238 int32_t getNbOutputs() const noexcept
10239 {
10240 return mImpl->getNbOutputs();
10241 }
10242
10243protected:
10244 virtual ~IAlgorithmContext() noexcept = default;
10245 apiv::VAlgorithmContext* mImpl;
10246};
10247
10262{
10263public:
10268 {
10269 return mImpl->getAlgorithmVariant();
10270 }
10271
10275 float getTimingMSec() const noexcept
10276 {
10277 return mImpl->getTimingMSec();
10278 }
10279
10283 std::size_t getWorkspaceSize() const noexcept
10284 {
10285 return mImpl->getWorkspaceSize();
10286 }
10287
10297 IAlgorithmIOInfo const* getAlgorithmIOInfoByIndex(int32_t index) const noexcept
10298 {
10299 return mImpl->getAlgorithmIOInfoByIndex(index);
10300 }
10301
10302protected:
10303 virtual ~IAlgorithm() noexcept = default;
10304 apiv::VAlgorithm* mImpl;
10305}; // IAlgorithm
10306
10307namespace v_1_0
10308{
10310{
10311public:
10315 InterfaceInfo getInterfaceInfo() const noexcept override
10316 {
10317 return InterfaceInfo{"IAlgorithmSelector", 1, 0};
10318 }
10333 virtual int32_t selectAlgorithms(IAlgorithmContext const& context, IAlgorithm const* const* choices,
10334 int32_t nbChoices, int32_t* selection) noexcept = 0;
10335
10346 virtual void reportAlgorithms(IAlgorithmContext const* const* algoContexts, IAlgorithm const* const* algoChoices,
10347 int32_t nbAlgorithms) noexcept = 0;
10348
10349 virtual ~IAlgorithmSelector() noexcept = default;
10350};
10351} // namespace v_1_0
10352
10366
10373using QuantizationFlags = uint32_t;
10374
10384enum class QuantizationFlag : int32_t
10385{
10390};
10391
10397template <>
10398constexpr inline int32_t EnumMax<QuantizationFlag>() noexcept
10399{
10400 return 1;
10401}
10402
10420enum class RuntimePlatform : int32_t
10421{
10424 kSAME_AS_BUILD = 0,
10425
10428 kWINDOWS_AMD64 = 1,
10429
10430
10431};
10432
10433namespace impl
10434{
10440template <>
10442{
10443 static constexpr int32_t kVALUE = 2;
10444};
10445} // namespace impl
10446
10453using BuilderFlags = uint32_t;
10454
10462enum class BuilderFlag : int32_t
10463{
10467
10471
10473 kDEBUG = 2,
10474
10476 kGPU_FALLBACK = 3,
10477
10479 kREFIT = 4,
10480
10483
10487 kTF32 = 6,
10488
10490 kSPARSE_WEIGHTS = 7,
10491
10504
10508
10513
10519
10523
10530
10536
10542
10546
10551
10557
10559 kSTRIP_PLAN = 19,
10560
10563
10570 kREFIT_IDENTICAL = 20,
10571
10597 kWEIGHT_STREAMING = 21,
10598
10602
10607 kREFIT_INDIVIDUAL = 23,
10608
10617 kSTRICT_NANS = 24,
10618
10620 kMONITOR_MEMORY = 25,
10621
10625
10628
10640
10641#if ENABLE_FEATURE_DISABLE_RUNTIME_ALLOCATION
10648 kREQUIRE_USER_ALLOCATION = 29,
10649#endif // ENABLE_FEATURE_DISABLE_RUNTIME_ALLOCATION
10650
10651};
10652
10658template <>
10659constexpr inline int32_t EnumMax<BuilderFlag>() noexcept
10660{
10661#if ENABLE_FEATURE_DISABLE_RUNTIME_ALLOCATION
10662 return 30;
10663#else
10664 return 29;
10665#endif // ENABLE_FEATURE_DISABLE_RUNTIME_ALLOCATION
10666}
10667
10668namespace v_1_0
10669{
10683{
10684 uint8_t data[16];
10685};
10686
10695{
10697 uint64_t tacticHash;
10701 static constexpr uint64_t kINVALID_TACTIC_HASH = UINT64_MAX;
10702};
10703} // namespace v_1_0
10704
10718class ITimingCache : public INoCopy
10719{
10720public:
10721 virtual ~ITimingCache() noexcept = default;
10722
10732 nvinfer1::IHostMemory* serialize() const noexcept
10733 {
10734 return mImpl->serialize();
10735 }
10736
10756 bool combine(ITimingCache const& inputCache, bool ignoreMismatch) noexcept
10757 {
10758 return mImpl->combine(inputCache, ignoreMismatch);
10759 }
10760
10766 bool reset() noexcept
10767 {
10768 return mImpl->reset();
10769 }
10770
10785 int64_t queryKeys(TimingCacheKey* keyBuffer, int64_t capacity) const noexcept
10786 {
10787 return mImpl->queryKeys(keyBuffer, capacity);
10788 }
10789
10802 TimingCacheValue query(TimingCacheKey const& key) const noexcept
10803 {
10804 return mImpl->query(key);
10805 }
10806
10824 bool update(TimingCacheKey const& key, TimingCacheValue const& value) noexcept
10825 {
10826 return mImpl->update(key, value);
10827 }
10828
10829protected:
10830 apiv::VTimingCache* mImpl;
10831};
10832
10840enum class MemoryPoolType : int32_t
10841{
10848 kWORKSPACE = 0,
10849
10857
10863 kDLA_LOCAL_DRAM = 2,
10864
10870 kDLA_GLOBAL_DRAM = 3,
10871
10879 kTACTIC_DRAM = 4,
10880
10894};
10895
10901template <>
10902constexpr inline int32_t EnumMax<MemoryPoolType>() noexcept
10903{
10904 return 6;
10905}
10906
10915enum class PreviewFeature : int32_t
10916{
10923
10928
10935
10944};
10945
10946namespace impl
10947{
10953template <>
10955{
10956 static constexpr int32_t kVALUE = 4;
10957};
10958} // namespace impl
10959
10968enum class HardwareCompatibilityLevel : int32_t
10969{
10972 kNONE = 0,
10973
10985 kAMPERE_PLUS = 1,
10986
10996};
10997
10998namespace impl
10999{
11005template <>
11007{
11008 static constexpr int32_t kVALUE = 3;
11009};
11010} // namespace impl
11011
11012
//!
//! \enum TilingOptimizationLevel
//!
//! \brief Level of effort the builder may spend on tiling optimization,
//! from none (kNONE) up to the most thorough search (kFULL).
//!
enum class TilingOptimizationLevel : int32_t
{
    kNONE = 0,     //!< Do not apply any tiling strategy.

    kFAST = 1,     //!< Fast tiling level.

    kMODERATE = 2, //!< Moderate tiling level.

    kFULL = 3      //!< Full tiling level.
};
11037
11038namespace impl
11039{
11045template <>
11047{
11048 static constexpr int32_t kVALUE = 4;
11049};
11050} // namespace impl
11051
11052namespace v_1_0
11053{
11055{
11056public:
11057 IProgressMonitor() = default;
11058 virtual ~IProgressMonitor() noexcept = default;
11059
11063 InterfaceInfo getInterfaceInfo() const noexcept override
11064 {
11065 return InterfaceInfo{"IProgressMonitor", 1, 0};
11066 }
11067
11087 virtual void phaseStart(char const* phaseName, char const* parentPhase, int32_t nbSteps) noexcept = 0;
11088
11101 virtual bool stepComplete(char const* phaseName, int32_t step) noexcept = 0;
11102
11114 virtual void phaseFinish(char const* phaseName) noexcept = 0;
11115
11116}; // class IProgressMonitor
11117} // namespace v_1_0
11118
11139
11148{
11149public:
11150 virtual ~IBuilderConfig() noexcept = default;
11151
11160 virtual void setAvgTimingIterations(int32_t avgTiming) noexcept
11161 {
11162 mImpl->setAvgTimingIterations(avgTiming);
11163 }
11164
11172 int32_t getAvgTimingIterations() const noexcept
11173 {
11174 return mImpl->getAvgTimingIterations();
11175 }
11176
11185 void setEngineCapability(EngineCapability capability) noexcept
11186 {
11187 mImpl->setEngineCapability(capability);
11188 }
11189
11198 {
11199 return mImpl->getEngineCapability();
11200 }
11201
11210 {
11211 mImpl->setInt8Calibrator(calibrator);
11212 }
11213
11220 {
11221 return mImpl->getInt8Calibrator();
11222 }
11223
11236 void setFlags(BuilderFlags builderFlags) noexcept
11237 {
11238 mImpl->setFlags(builderFlags);
11239 }
11240
11248 BuilderFlags getFlags() const noexcept
11249 {
11250 return mImpl->getFlags();
11251 }
11252
11260 void clearFlag(BuilderFlag builderFlag) noexcept
11261 {
11262 mImpl->clearFlag(builderFlag);
11263 }
11264
11272 void setFlag(BuilderFlag builderFlag) noexcept
11273 {
11274 mImpl->setFlag(builderFlag);
11275 }
11276
11284 bool getFlag(BuilderFlag builderFlag) const noexcept
11285 {
11286 return mImpl->getFlag(builderFlag);
11287 }
11288
11301 void setDeviceType(ILayer const* layer, DeviceType deviceType) noexcept
11302 {
11303 mImpl->setDeviceType(layer, deviceType);
11304 }
11305
11311 DeviceType getDeviceType(ILayer const* layer) const noexcept
11312 {
11313 return mImpl->getDeviceType(layer);
11314 }
11315
11323 bool isDeviceTypeSet(ILayer const* layer) const noexcept
11324 {
11325 return mImpl->isDeviceTypeSet(layer);
11326 }
11327
11333 void resetDeviceType(ILayer const* layer) noexcept
11334 {
11335 mImpl->resetDeviceType(layer);
11336 }
11337
11343 bool canRunOnDLA(ILayer const* layer) const noexcept
11344 {
11345 return mImpl->canRunOnDLA(layer);
11346 }
11347
11359 void setDLACore(int32_t dlaCore) noexcept
11360 {
11361 mImpl->setDLACore(dlaCore);
11362 }
11363
11369 int32_t getDLACore() const noexcept
11370 {
11371 return mImpl->getDLACore();
11372 }
11373
11380 void setDefaultDeviceType(DeviceType deviceType) noexcept
11381 {
11382 mImpl->setDefaultDeviceType(deviceType);
11383 }
11384
11391 {
11392 return mImpl->getDefaultDeviceType();
11393 }
11394
11400 void reset() noexcept
11401 {
11402 mImpl->reset();
11403 }
11404
11412 void setProfileStream(const cudaStream_t stream) noexcept
11413 {
11414 return mImpl->setProfileStream(stream);
11415 }
11416
11424 cudaStream_t getProfileStream() const noexcept
11425 {
11426 return mImpl->getProfileStream();
11427 }
11428
11441 int32_t addOptimizationProfile(IOptimizationProfile const* profile) noexcept
11442 {
11443 return mImpl->addOptimizationProfile(profile);
11444 }
11445
11454 int32_t getNbOptimizationProfiles() const noexcept
11455 {
11456 return mImpl->getNbOptimizationProfiles();
11457 }
11458
11467 {
11468 mImpl->setProfilingVerbosity(verbosity);
11469 }
11470
11480 {
11481 return mImpl->getProfilingVerbosity();
11482 }
11483
11492 {
11493 mImpl->setAlgorithmSelector(selector);
11494 }
11495
11502 {
11503 return mImpl->getAlgorithmSelector();
11504 }
11505
11520 {
11521 return mImpl->setCalibrationProfile(profile);
11522 }
11523
11532 {
11533 return mImpl->getCalibrationProfile();
11534 }
11535
11551 {
11552 mImpl->setQuantizationFlags(flags);
11553 }
11554
11565 {
11566 return mImpl->getQuantizationFlags();
11567 }
11568
11579 {
11580 mImpl->clearQuantizationFlag(flag);
11581 }
11582
11593 {
11594 mImpl->setQuantizationFlag(flag);
11595 }
11596
11607 {
11608 return mImpl->getQuantizationFlag(flag);
11609 }
11610
11628 bool setTacticSources(TacticSources tacticSources) noexcept
11629 {
11630 return mImpl->setTacticSources(tacticSources);
11631 }
11632
11644 {
11645 return mImpl->getTacticSources();
11646 }
11647
11663 nvinfer1::ITimingCache* createTimingCache(void const* blob, std::size_t size) const noexcept
11664 {
11665 return mImpl->createTimingCache(blob, size);
11666 }
11667
11686 bool setTimingCache(ITimingCache const& cache, bool ignoreMismatch) noexcept
11687 {
11688 return mImpl->setTimingCache(cache, ignoreMismatch);
11689 }
11690
11697 {
11698 return mImpl->getTimingCache();
11699 }
11700
11728 void setMemoryPoolLimit(MemoryPoolType pool, std::size_t poolSize) noexcept
11729 {
11730 mImpl->setMemoryPoolLimit(pool, poolSize);
11731 }
11732
11747 std::size_t getMemoryPoolLimit(MemoryPoolType pool) const noexcept
11748 {
11749 return mImpl->getMemoryPoolLimit(pool);
11750 }
11751
11765 void setPreviewFeature(PreviewFeature feature, bool enable) noexcept
11766 {
11767 mImpl->setPreviewFeature(feature, enable);
11768 }
11769
11779 bool getPreviewFeature(PreviewFeature feature) const noexcept
11780 {
11781 return mImpl->getPreviewFeature(feature);
11782 }
11783
11812 void setBuilderOptimizationLevel(int32_t level) noexcept
11813 {
11814 mImpl->setBuilderOptimizationLevel(level);
11815 }
11816
11825 {
11826 return mImpl->getBuilderOptimizationLevel();
11827 }
11828
11841 void setHardwareCompatibilityLevel(HardwareCompatibilityLevel hardwareCompatibilityLevel) noexcept
11842 {
11843 mImpl->setHardwareCompatibilityLevel(hardwareCompatibilityLevel);
11844 }
11845
11855 {
11856 return mImpl->getHardwareCompatibilityLevel();
11857 }
11858
11867 void setPluginsToSerialize(char const* const* paths, int32_t nbPaths) noexcept
11868 {
11869 mImpl->setPluginsToSerialize(paths, nbPaths);
11870 }
11871
11880 char const* getPluginToSerialize(int32_t index) const noexcept
11881 {
11882 return mImpl->getPluginToSerialize(index);
11883 }
11884
11890 int32_t getNbPluginsToSerialize() const noexcept
11891 {
11892 return mImpl->getNbPluginsToSerialize();
11893 }
11894
11919 void setMaxAuxStreams(int32_t nbStreams) noexcept
11920 {
11921 mImpl->setMaxAuxStreams(nbStreams);
11922 }
11923
11929 int32_t getMaxAuxStreams() const noexcept
11930 {
11931 return mImpl->getMaxAuxStreams();
11932 }
11933
11945 void setProgressMonitor(IProgressMonitor* monitor) noexcept
11946 {
11947 return mImpl->setProgressMonitor(monitor);
11948 }
11949
11956 {
11957 return mImpl->getProgressMonitor();
11958 }
11959
11971 void setRuntimePlatform(RuntimePlatform runtimePlatform) noexcept
11972 {
11973 mImpl->setRuntimePlatform(runtimePlatform);
11974 }
11975
11984 {
11985 return mImpl->getRuntimePlatform();
11986 }
11987
11995 void setMaxNbTactics(int32_t maxNbTactics) noexcept
11996 {
11997 mImpl->setMaxNbTactics(maxNbTactics);
11998 }
11999
12007 int32_t getMaxNbTactics() const noexcept
12008 {
12009 return mImpl->getMaxNbTactics();
12010 }
12011
12024 {
12025 return mImpl->setTilingOptimizationLevel(level);
12026 }
12027
12036 {
12037 return mImpl->getTilingOptimizationLevel();
12038 }
12039
12051 bool setL2LimitForTiling(int64_t size) noexcept
12052 {
12053 return mImpl->setL2LimitForTiling(size);
12054 }
12055
12063 int64_t getL2LimitForTiling() const noexcept
12064 {
12065 return mImpl->getL2LimitForTiling();
12066 }
12067
12077 bool setRemoteAutoTuningConfig(char const* config) noexcept
12078 {
12079 return mImpl->setRemoteAutoTuningConfig(config);
12080 }
12081
12087 char const* getRemoteAutoTuningConfig() const noexcept
12088 {
12089 return mImpl->getRemoteAutoTuningConfig();
12090 }
12091
12092protected:
12093 apiv::VBuilderConfig* mImpl;
12094};
12095
12104
12114{
12119
12124 kSTRONGLY_TYPED = 1,
12129
12134};
12135
12141template <>
12142constexpr inline int32_t EnumMax<NetworkDefinitionCreationFlag>() noexcept
12143{
12144 return 4;
12145}
12146
12154class IBuilder : public INoCopy
12155{
12156public:
12157 virtual ~IBuilder() noexcept = default;
12158
12164 TRT_DEPRECATED bool platformHasFastFp16() const noexcept
12165 {
12166 return mImpl->platformHasFastFp16();
12167 }
12168
12175 {
12176 return mImpl->platformHasFastInt8();
12177 }
12178
12186 int32_t getMaxDLABatchSize() const noexcept
12187 {
12188 return mImpl->getMaxDLABatchSize();
12189 }
12190
12194 int32_t getNbDLACores() const noexcept
12195 {
12196 return mImpl->getNbDLACores();
12197 }
12198
12212 void setGpuAllocator(IGpuAllocator* allocator) noexcept
12213 {
12214 mImpl->setGpuAllocator(allocator);
12215 }
12216
12227 {
12228 return mImpl->createBuilderConfig();
12229 }
12230
12253 {
12254 return mImpl->createNetworkV2(flags);
12255 }
12256
12268 {
12269 return mImpl->createOptimizationProfile();
12270 }
12271
12286 void setErrorRecorder(IErrorRecorder* recorder) noexcept
12287 {
12288 mImpl->setErrorRecorder(recorder);
12289 }
12290
12302 {
12303 return mImpl->getErrorRecorder();
12304 }
12305
12309 void reset() noexcept
12310 {
12311 mImpl->reset();
12312 }
12313
12319 TRT_DEPRECATED bool platformHasTf32() const noexcept
12320 {
12321 return mImpl->platformHasTf32();
12322 }
12323
12339 {
12340 return mImpl->buildSerializedNetwork(network, config);
12341 }
12342
12360 INetworkDefinition& network, IBuilderConfig& config, IStreamWriter& writer) noexcept
12361 {
12362 return mImpl->buildSerializedNetworkToStream(network, config, writer);
12363 }
12364
12384 INetworkDefinition& network, IBuilderConfig& config, IHostMemory*& kernelText) noexcept
12385 {
12386 return mImpl->buildSerializedNetworkWithKernelText(network, config, kernelText);
12387 }
12388
12405 {
12406 return mImpl->buildEngineWithConfig(network, config);
12407 }
12408
12430 bool isNetworkSupported(INetworkDefinition const& network, IBuilderConfig const& config) const noexcept
12431 {
12432 return mImpl->isNetworkSupported(network, config);
12433 }
12434
12440 ILogger* getLogger() const noexcept
12441 {
12442 return mImpl->getLogger();
12443 }
12444
12456 bool setMaxThreads(int32_t maxThreads) noexcept
12457 {
12458 return mImpl->setMaxThreads(maxThreads);
12459 }
12460
12470 int32_t getMaxThreads() const noexcept
12471 {
12472 return mImpl->getMaxThreads();
12473 }
12474
12481 {
12482 return mImpl->getPluginRegistry();
12483 }
12484
12485protected:
12486 apiv::VBuilder* mImpl;
12487};
12488
12489} // namespace nvinfer1
12490
12495extern "C" TENSORRTAPI void* createInferBuilder_INTERNAL(void* logger, int32_t version) noexcept;
12496
12497namespace nvinfer1
12498{
12499namespace
12500{
12501
12509inline IBuilder* createInferBuilder(ILogger& logger) noexcept
12510{
12511 return static_cast<IBuilder*>(createInferBuilder_INTERNAL(&logger, NV_TENSORRT_VERSION));
12512}
12513
12514} // namespace
12515
12528 nvinfer1::EngineCapability capability) noexcept;
12529
12539extern "C" TENSORRTAPI bool setInternalLibraryPath(AsciiChar const* path) noexcept;
12540
12541namespace safe
12542{
12544class IPluginRegistry;
12545} // namespace safe
12546
12554extern "C" TRT_DEPRECATED_API nvinfer1::safe::IPluginRegistry* getBuilderSafePluginRegistry(
12555 nvinfer1::EngineCapability capability) noexcept;
12556
12557} // namespace nvinfer1
12558
12559#endif // NV_INFER_H
#define TRT_DEPRECATED_API
Definition: NvInferRuntimeBase.h:44
#define TENSORRTAPI
Definition: NvInferRuntimeBase.h:70
#define NV_TENSORRT_VERSION
Definition: NvInferRuntimeBase.h:102
#define TRT_NODISCARD
A stand-in for [[nodiscard]] and [[nodiscard(REASON)]] that works with older compilers.
Definition: NvInferRuntimeBase.h:57
#define TRT_DEPRECATED
Definition: NvInferRuntimeBase.h:42
#define TRT_DEPRECATED_ENUM
Definition: NvInferRuntimeBase.h:43
Definition: NvInferRuntimeBase.h:219
static constexpr int32_t MAX_DIMS
The maximum rank (number of dimensions) supported for a tensor.
Definition: NvInferRuntimeBase.h:222
An Activation layer in a network definition.
Definition: NvInfer.h:1421
void setBeta(float beta) noexcept
Set the beta parameter (must be finite).
Definition: NvInfer.h:1469
void setActivationType(ActivationType type) noexcept
Set the type of activation to be performed.
Definition: NvInfer.h:1430
ActivationType getActivationType() const noexcept
Get the type of activation to be performed.
Definition: NvInfer.h:1440
float getAlpha() const noexcept
Get the alpha parameter.
Definition: NvInfer.h:1478
virtual ~IActivationLayer() noexcept=default
float getBeta() const noexcept
Get the beta parameter.
Definition: NvInfer.h:1487
void setAlpha(float alpha) noexcept
Set the alpha parameter (must be finite).
Definition: NvInfer.h:1455
Describes the context and requirements that could be fulfilled by one or more instances of IAlgorith...
Definition: NvInfer.h:10203
int32_t getNbOutputs() const noexcept
Return number of outputs of the algorithm.
Definition: NvInfer.h:10238
int32_t getNbInputs() const noexcept
Return number of inputs of the algorithm.
Definition: NvInfer.h:10230
char const * getName() const noexcept
Return name of the algorithm node.
Definition: NvInfer.h:10210
virtual ~IAlgorithmContext() noexcept=default
Dims getDimensions(int32_t index, OptProfileSelector select) const noexcept
Get the minimum / optimum / maximum dimensions for input or output tensor.
Definition: NvInfer.h:10222
Describes a variation of execution of a layer. An algorithm is represented by IAlgorithmVariant and t...
Definition: NvInfer.h:10262
std::size_t getWorkspaceSize() const noexcept
The size of the GPU temporary memory in bytes which the algorithm uses at execution time.
Definition: NvInfer.h:10283
float getTimingMSec() const noexcept
The time in milliseconds to execute the algorithm.
Definition: NvInfer.h:10275
IAlgorithmIOInfo const * getAlgorithmIOInfoByIndex(int32_t index) const noexcept
Returns the format of an Algorithm input or output. Algorithm inputs are incrementally numbered first...
Definition: NvInfer.h:10297
virtual ~IAlgorithm() noexcept=default
IAlgorithmVariant const & getAlgorithmVariant() const noexcept
Returns the algorithm variant.
Definition: NvInfer.h:10267
Carries information about input or output of the algorithm. IAlgorithmIOInfo for all the input and ou...
Definition: NvInfer.h:10106
virtual ~IAlgorithmIOInfo() noexcept=default
int64_t getVectorizedDim() const noexcept
Return the index of the vectorized dimension or -1 for non-vectorized formats.
Definition: NvInfer.h:10134
Dims getStrides() const noexcept
Return strides of the input/output tensor of algorithm. For vectorized formats, strides are given in ...
Definition: NvInfer.h:10124
DataType getDataType() const noexcept
Return DataType of the input/output of algorithm.
Definition: NvInfer.h:10113
int64_t getComponentsPerElement() const noexcept
Return the number of components per element. This is always 1 for non-vectorized formats.
Definition: NvInfer.h:10145
Provides a unique 128-bit identifier, which along with the input and output information denotes the v...
Definition: NvInfer.h:10169
virtual ~IAlgorithmVariant() noexcept=default
int64_t getTactic() const noexcept
Return tactic of the algorithm.
Definition: NvInfer.h:10182
int64_t getImplementation() const noexcept
Return implementation of the algorithm.
Definition: NvInfer.h:10174
An assertion layer in a network.
Definition: NvInfer.h:5123
void setMessage(char const *message) noexcept
Set the message to print if the assertion fails.
Definition: NvInfer.h:5133
char const * getMessage() const noexcept
Return the assertion message.
Definition: NvInfer.h:5143
virtual ~IAssertionLayer() noexcept=default
This is a base class for Attention boundary layers.
Definition: NvInfer.h:6956
IAttention * getAttention() const noexcept
Get a pointer to the IAttention associated with this boundary layer.
Definition: NvInfer.h:6961
virtual ~IAttentionBoundaryLayer() noexcept=default
Helper for constructing an attention that consumes query, key and value tensors.
Definition: NvInfer.h:7074
ITensor * getMask() noexcept
Get the optional mask in attention.
Definition: NvInfer.h:7124
bool setMetadata(char const *metadata) noexcept
Set the metadata for IAttention.
Definition: NvInfer.h:7335
bool setDecomposable(bool decomposable) noexcept
Set whether the attention can be decomposed to use multiple kernels if no fused kernel support found.
Definition: NvInfer.h:7161
bool setName(char const *name) noexcept
Set the name of the attention.
Definition: NvInfer.h:7251
bool getDecomposable() const noexcept
Get whether the attention can be decomposed to use multiple kernels if no fused kernel support found.
Definition: NvInfer.h:7174
ITensor * getInput(int32_t index) const noexcept
Get the IAttention input corresponding to the given index.
Definition: NvInfer.h:7214
ITensor * getOutput(int32_t index) const noexcept
Get the IAttention output corresponding to the given index. IAttention has only one output.
Definition: NvInfer.h:7234
int32_t getNbOutputs() const noexcept
Get the number of outputs of a layer. IAttention has one output.
Definition: NvInfer.h:7222
bool setNbRanks(int32_t nbRanks) noexcept
Set the number of ranks for multi-device attention execution.
Definition: NvInfer.h:7364
int32_t getNbInputs() const noexcept
Get the number of inputs of IAttention. IAttention has three inputs.
Definition: NvInfer.h:7202
bool setCausal(bool isCausal) noexcept
Set whether the attention will run a causal inference. Cannot be used together with setMask().
Definition: NvInfer.h:7137
bool setNormalizationOperation(AttentionNormalizationOp op) noexcept
Set the normalization operation for the attention.
Definition: NvInfer.h:7083
char const * getName() const noexcept
Return the name of the attention.
Definition: NvInfer.h:7263
bool setNormalizationQuantizeToType(DataType type) noexcept
Set the datatype the attention normalization is quantized to.
Definition: NvInfer.h:7303
int32_t getNbRanks() const noexcept
Get the number of ranks for multi-device execution.
Definition: NvInfer.h:7376
AttentionNormalizationOp getNormalizationOperation() const noexcept
Get the normalization operation for the attention.
Definition: NvInfer.h:7095
bool setNormalizationQuantizeScale(ITensor &tensor) noexcept
Set the quantization scale for the attention normalization output.
Definition: NvInfer.h:7279
char const * getMetadata() const noexcept
Get the metadata of IAttention.
Definition: NvInfer.h:7348
DataType getNormalizationQuantizeToType() const noexcept
Get the datatype the attention normalization is quantized to.
Definition: NvInfer.h:7315
ITensor * getNormalizationQuantizeScale() const noexcept
Get the quantization scale for the attention normalization output.
Definition: NvInfer.h:7290
bool setInput(int32_t index, ITensor &input) noexcept
Append or replace an input of this layer with a specific tensor.
Definition: NvInfer.h:7193
bool setMask(ITensor &mask) noexcept
Set whether a mask will be used for the normalization operation.
Definition: NvInfer.h:7112
bool getCausal() const noexcept
Get whether the attention will run a causal inference.
Definition: NvInfer.h:7149
apiv::VAttention * mImpl
Definition: NvInfer.h:7382
virtual ~IAttention() noexcept=default
This layer represents an input to an attention subgraph.
Definition: NvInfer.h:6982
virtual ~IAttentionInputLayer() noexcept=default
This layer represents an output of an IAttention.
Definition: NvInfer.h:7017
virtual ~IAttentionOutputLayer() noexcept=default
Holds properties for configuring a builder to produce an engine.
Definition: NvInfer.h:11148
void setMemoryPoolLimit(MemoryPoolType pool, std::size_t poolSize) noexcept
Set the memory size for the memory pool.
Definition: NvInfer.h:11728
TRT_DEPRECATED void setQuantizationFlags(QuantizationFlags flags) noexcept
Set the quantization flags.
Definition: NvInfer.h:11550
nvinfer1::ITimingCache * createTimingCache(void const *blob, std::size_t size) const noexcept
Create timing cache.
Definition: NvInfer.h:11663
void setPreviewFeature(PreviewFeature feature, bool enable) noexcept
Enable or disable a specific preview feature.
Definition: NvInfer.h:11765
TRT_DEPRECATED void setAlgorithmSelector(IAlgorithmSelector *selector) noexcept
Set Algorithm Selector.
Definition: NvInfer.h:11491
TRT_DEPRECATED void setInt8Calibrator(IInt8Calibrator *calibrator) noexcept
Set Int8 Calibration interface.
Definition: NvInfer.h:11209
bool getPreviewFeature(PreviewFeature feature) const noexcept
Get status of preview feature.
Definition: NvInfer.h:11779
int32_t getBuilderOptimizationLevel() noexcept
Get builder optimization level.
Definition: NvInfer.h:11824
bool setTacticSources(TacticSources tacticSources) noexcept
Set tactic sources.
Definition: NvInfer.h:11628
void setPluginsToSerialize(char const *const *paths, int32_t nbPaths) noexcept
Set the plugin libraries to be serialized with version-compatible engines.
Definition: NvInfer.h:11867
bool setTilingOptimizationLevel(TilingOptimizationLevel level) noexcept
Set the Tiling optimization level.
Definition: NvInfer.h:12023
bool setL2LimitForTiling(int64_t size) noexcept
Set the L2 cache usage limit for Tiling optimization.
Definition: NvInfer.h:12051
TRT_DEPRECATED IInt8Calibrator * getInt8Calibrator() const noexcept
Get Int8 Calibration interface.
Definition: NvInfer.h:11219
std::size_t getMemoryPoolLimit(MemoryPoolType pool) const noexcept
Get the memory size limit of the memory pool.
Definition: NvInfer.h:11747
int32_t getDLACore() const noexcept
Get the DLA core that the engine executes on.
Definition: NvInfer.h:11369
int32_t getNbPluginsToSerialize() const noexcept
Get the number of plugin library paths to be serialized with version-compatible engines.
Definition: NvInfer.h:11890
void setDeviceType(ILayer const *layer, DeviceType deviceType) noexcept
Set the device that this layer must execute on.
Definition: NvInfer.h:11301
void setEngineCapability(EngineCapability capability) noexcept
Configure the builder to target specified EngineCapability flow.
Definition: NvInfer.h:11185
int32_t getMaxAuxStreams() const noexcept
Get the maximum number of auxiliary streams that TRT is allowed to use.
Definition: NvInfer.h:11929
bool getFlag(BuilderFlag builderFlag) const noexcept
Returns true if the build mode flag is set.
Definition: NvInfer.h:11284
void setMaxNbTactics(int32_t maxNbTactics) noexcept
Set the maximum number of tactics to time when there is a choice of tactics.
Definition: NvInfer.h:11995
TRT_DEPRECATED void clearQuantizationFlag(QuantizationFlag flag) noexcept
clear a quantization flag.
Definition: NvInfer.h:11578
int64_t getL2LimitForTiling() const noexcept
Get the L2 cache usage limit for tiling optimization.
Definition: NvInfer.h:12063
bool setRemoteAutoTuningConfig(char const *config) noexcept
Set a config string for remote auto tuning.
Definition: NvInfer.h:12077
void setProgressMonitor(IProgressMonitor *monitor) noexcept
Sets the progress monitor for building a network.
Definition: NvInfer.h:11945
void setProfilingVerbosity(ProfilingVerbosity verbosity) noexcept
Set verbosity level of layer information exposed in NVTX annotations and IEngineInspector.
Definition: NvInfer.h:11466
int32_t getNbOptimizationProfiles() const noexcept
Get number of optimization profiles.
Definition: NvInfer.h:11454
nvinfer1::ITimingCache const * getTimingCache() const noexcept
Get the pointer to the timing cache from current IBuilderConfig.
Definition: NvInfer.h:11696
void reset() noexcept
Resets the builder configuration to defaults.
Definition: NvInfer.h:11400
bool setTimingCache(ITimingCache const &cache, bool ignoreMismatch) noexcept
Attach a timing cache to IBuilderConfig.
Definition: NvInfer.h:11686
char const * getPluginToSerialize(int32_t index) const noexcept
Get the plugin library path to be serialized with version-compatible engines.
Definition: NvInfer.h:11880
EngineCapability getEngineCapability() const noexcept
Query EngineCapability flow configured for the builder.
Definition: NvInfer.h:11197
RuntimePlatform getRuntimePlatform() const noexcept
Get the target platform for runtime execution.
Definition: NvInfer.h:11983
DeviceType getDefaultDeviceType() const noexcept
Get the default DeviceType which was set by setDefaultDeviceType.
Definition: NvInfer.h:11390
void setRuntimePlatform(RuntimePlatform runtimePlatform) noexcept
Set the target platform for runtime execution.
Definition: NvInfer.h:11971
int32_t getMaxNbTactics() const noexcept
Query the maximum number of tactics timed when there is a choice.
Definition: NvInfer.h:12007
BuilderFlags getFlags() const noexcept
Get the build mode flags for this builder config. Defaults to 0.
Definition: NvInfer.h:11248
void setFlags(BuilderFlags builderFlags) noexcept
Set the build mode flags to turn on builder options for this network.
Definition: NvInfer.h:11236
TacticSources getTacticSources() const noexcept
Get tactic sources.
Definition: NvInfer.h:11643
void resetDeviceType(ILayer const *layer) noexcept
reset the DeviceType for this layer
Definition: NvInfer.h:11333
void setDLACore(int32_t dlaCore) noexcept
Sets the DLA core used by the network. Defaults to -1.
Definition: NvInfer.h:11359
HardwareCompatibilityLevel getHardwareCompatibilityLevel() const noexcept
Get the hardware compatibility level.
Definition: NvInfer.h:11854
char const * getRemoteAutoTuningConfig() const noexcept
Get a config string for remote auto tuning.
Definition: NvInfer.h:12087
TRT_DEPRECATED QuantizationFlags getQuantizationFlags() const noexcept
Get the quantization flags.
Definition: NvInfer.h:11564
void clearFlag(BuilderFlag builderFlag) noexcept
clear a single build mode flag.
Definition: NvInfer.h:11260
int32_t addOptimizationProfile(IOptimizationProfile const *profile) noexcept
Add an optimization profile.
Definition: NvInfer.h:11441
IProgressMonitor * getProgressMonitor() const noexcept
Definition: NvInfer.h:11955
apiv::VBuilderConfig * mImpl
Definition: NvInfer.h:12093
TRT_DEPRECATED IOptimizationProfile const * getCalibrationProfile() noexcept
Get the current calibration profile.
Definition: NvInfer.h:11531
int32_t getAvgTimingIterations() const noexcept
Query the number of averaging iterations.
Definition: NvInfer.h:11172
void setDefaultDeviceType(DeviceType deviceType) noexcept
Sets the default DeviceType to be used by the builder. It ensures that all the layers that can run on...
Definition: NvInfer.h:11380
void setFlag(BuilderFlag builderFlag) noexcept
Set a single build mode flag.
Definition: NvInfer.h:11272
TRT_DEPRECATED bool setCalibrationProfile(IOptimizationProfile const *profile) noexcept
Add a calibration profile.
Definition: NvInfer.h:11519
virtual ~IBuilderConfig() noexcept=default
DeviceType getDeviceType(ILayer const *layer) const noexcept
Get the device that this layer executes on.
Definition: NvInfer.h:11311
bool canRunOnDLA(ILayer const *layer) const noexcept
Checks if a layer can run on DLA.
Definition: NvInfer.h:11343
TRT_DEPRECATED bool getQuantizationFlag(QuantizationFlag flag) const noexcept
Returns true if the quantization flag is set.
Definition: NvInfer.h:11606
cudaStream_t getProfileStream() const noexcept
Get the CUDA stream that is used to profile this network.
Definition: NvInfer.h:11424
void setHardwareCompatibilityLevel(HardwareCompatibilityLevel hardwareCompatibilityLevel) noexcept
Set the hardware compatibility level.
Definition: NvInfer.h:11841
TilingOptimizationLevel getTilingOptimizationLevel() const noexcept
Get the Tiling optimization level.
Definition: NvInfer.h:12035
TRT_DEPRECATED void setQuantizationFlag(QuantizationFlag flag) noexcept
Set a single quantization flag.
Definition: NvInfer.h:11592
void setMaxAuxStreams(int32_t nbStreams) noexcept
Set the maximum number of auxiliary streams that TRT is allowed to use.
Definition: NvInfer.h:11919
ProfilingVerbosity getProfilingVerbosity() const noexcept
Get verbosity level of layer information exposed in NVTX annotations and IEngineInspector.
Definition: NvInfer.h:11479
bool isDeviceTypeSet(ILayer const *layer) const noexcept
whether the DeviceType has been explicitly set for this layer
Definition: NvInfer.h:11323
void setBuilderOptimizationLevel(int32_t level) noexcept
Set builder optimization level.
Definition: NvInfer.h:11812
void setProfileStream(const cudaStream_t stream) noexcept
Set the CUDA stream that is used to profile this network.
Definition: NvInfer.h:11412
TRT_DEPRECATED IAlgorithmSelector * getAlgorithmSelector() const noexcept
Get Algorithm Selector.
Definition: NvInfer.h:11501
Builds an engine from a network definition.
Definition: NvInfer.h:12155
int32_t getMaxDLABatchSize() const noexcept
Get the maximum batch size DLA can support. For any tensor the total volume of index dimensions combi...
Definition: NvInfer.h:12186
int32_t getNbDLACores() const noexcept
Return the number of DLA engines available to this builder.
Definition: NvInfer.h:12194
IErrorRecorder * getErrorRecorder() const noexcept
get the ErrorRecorder assigned to this interface.
Definition: NvInfer.h:12301
apiv::VBuilder * mImpl
Definition: NvInfer.h:12486
ILogger * getLogger() const noexcept
get the logger with which the builder was created
Definition: NvInfer.h:12440
bool isNetworkSupported(INetworkDefinition const &network, IBuilderConfig const &config) const noexcept
Checks that a network is within the scope of the IBuilderConfig settings.
Definition: NvInfer.h:12430
int32_t getMaxThreads() const noexcept
get the maximum number of threads that can be used by the builder.
Definition: NvInfer.h:12470
IPluginRegistry & getPluginRegistry() noexcept
get the local plugin registry that can be used by the builder.
Definition: NvInfer.h:12480
TRT_DEPRECATED bool platformHasFastInt8() const noexcept
Determine whether the platform has fast native int8.
Definition: NvInfer.h:12174
nvinfer1::IOptimizationProfile * createOptimizationProfile() noexcept
Create a new optimization profile.
Definition: NvInfer.h:12267
void setGpuAllocator(IGpuAllocator *allocator) noexcept
Set the GPU allocator.
Definition: NvInfer.h:12212
nvinfer1::INetworkDefinition * createNetworkV2(NetworkDefinitionCreationFlags flags) noexcept
Create a network definition object.
Definition: NvInfer.h:12252
nvinfer1::IBuilderConfig * createBuilderConfig() noexcept
Create a builder configuration object.
Definition: NvInfer.h:12226
void reset() noexcept
Resets the builder state to default values.
Definition: NvInfer.h:12309
bool setMaxThreads(int32_t maxThreads) noexcept
Set the maximum number of threads.
Definition: NvInfer.h:12456
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInfer.h:12286
nvinfer1::IHostMemory * buildSerializedNetwork(INetworkDefinition &network, IBuilderConfig &config) noexcept
Builds and serializes a network for the given INetworkDefinition and IBuilderConfig.
Definition: NvInfer.h:12338
virtual ~IBuilder() noexcept=default
TRT_DEPRECATED bool platformHasTf32() const noexcept
Determine whether the platform has TF32 support.
Definition: NvInfer.h:12319
bool buildSerializedNetworkToStream(INetworkDefinition &network, IBuilderConfig &config, IStreamWriter &writer) noexcept
Builds and serializes a network into stream for the given INetworkDefinition and IBuilderConfig.
Definition: NvInfer.h:12359
nvinfer1::ICudaEngine * buildEngineWithConfig(INetworkDefinition &network, IBuilderConfig &config) noexcept
Builds a network for the given INetworkDefinition and IBuilderConfig.
Definition: NvInfer.h:12404
nvinfer1::IHostMemory * buildSerializedNetwork(INetworkDefinition &network, IBuilderConfig &config, IHostMemory *&kernelText) noexcept
Extended form of buildSerializedNetwork that optionally permits getting the kernelText.
Definition: NvInfer.h:12383
A cast layer in a network.
Definition: NvInfer.h:3984
virtual ~ICastLayer() noexcept=default
apiv::VCastLayer * mImpl
Definition: NvInfer.h:4010
DataType getToType() const noexcept
Return cast layer output type.
Definition: NvInfer.h:4004
void setToType(DataType toType) noexcept
Set cast layer output type.
Definition: NvInfer.h:3993
A concatenation layer in a network definition.
Definition: NvInfer.h:2131
void setAxis(int32_t axis) noexcept
Set the axis along which concatenation occurs.
Definition: NvInfer.h:2144
int32_t getAxis() const noexcept
Get the axis along which concatenation occurs.
Definition: NvInfer.h:2154
virtual ~IConcatenationLayer() noexcept=default
This layer represents a condition input to an IIfConditional.
Definition: NvInfer.h:4647
virtual ~IConditionLayer() noexcept=default
Layer that represents a constant value.
Definition: NvInfer.h:4023
void setWeights(Weights weights) noexcept
Set the weights for the layer.
Definition: NvInfer.h:4033
Weights getWeights() const noexcept
Get the weights for the layer.
Definition: NvInfer.h:4043
void setDimensions(Dims const &dimensions) noexcept
Set the dimensions for the layer.
Definition: NvInfer.h:4055
apiv::VConstantLayer * mImpl
Definition: NvInfer.h:4073
virtual ~IConstantLayer() noexcept=default
Dims getDimensions() const noexcept
Get the dimensions for the layer.
Definition: NvInfer.h:4067
A convolution layer in a network definition.
Definition: NvInfer.h:1101
Dims getPrePadding() const noexcept
Get the pre-padding.
Definition: NvInfer.h:1226
Weights getBiasWeights() const noexcept
Get the bias weights for the convolution.
Definition: NvInfer.h:1199
void setPaddingMode(PaddingMode paddingMode) noexcept
Set the padding mode.
Definition: NvInfer.h:1267
void setDilationNd(Dims const &dilation) noexcept
Set the multi-dimension dilation of the convolution.
Definition: NvInfer.h:1371
Dims getPaddingNd() const noexcept
Get the multi-dimension padding of the convolution.
Definition: NvInfer.h:1357
Dims getStrideNd() const noexcept
Get the multi-dimension stride of the convolution.
Definition: NvInfer.h:1327
Weights getKernelWeights() const noexcept
Get the kernel weights of the convolution.
Definition: NvInfer.h:1174
void setStrideNd(Dims const &stride) noexcept
Set the multi-dimension stride of the convolution.
Definition: NvInfer.h:1317
Dims getDilationNd() const noexcept
Get the multi-dimension dilation of the convolution.
Definition: NvInfer.h:1381
int64_t getNbOutputMaps() const noexcept
Get the number of output maps for the convolution.
Definition: NvInfer.h:1120
void setKernelWeights(Weights weights) noexcept
Set the kernel weights for the convolution.
Definition: NvInfer.h:1164
Dims getPostPadding() const noexcept
Get the post-padding.
Definition: NvInfer.h:1253
int64_t getNbGroups() const noexcept
Get the number of groups of the convolution.
Definition: NvInfer.h:1150
PaddingMode getPaddingMode() const noexcept
Get the padding mode.
Definition: NvInfer.h:1279
virtual ~IConvolutionLayer() noexcept=default
void setNbGroups(int64_t nbGroups) noexcept
Set the number of groups for a convolution.
Definition: NvInfer.h:1140
void setNbOutputMaps(int64_t nbOutputMaps) noexcept
Set the number of output maps for the convolution.
Definition: NvInfer.h:1110
void setBiasWeights(Weights weights) noexcept
Set the bias weights for the convolution.
Definition: NvInfer.h:1189
Dims getKernelSizeNd() const noexcept
Get the multi-dimension kernel size of the convolution.
Definition: NvInfer.h:1302
void setPaddingNd(Dims const &padding) noexcept
Set the multi-dimension padding of the convolution.
Definition: NvInfer.h:1345
void setPrePadding(Dims const &padding) noexcept
Set the multi-dimension pre-padding of the convolution.
Definition: NvInfer.h:1216
void setPostPadding(Dims const &padding) noexcept
Set the multi-dimension post-padding of the convolution.
Definition: NvInfer.h:1243
void setKernelSizeNd(Dims const &kernelSize) noexcept
Set the multi-dimension kernel size of the convolution.
Definition: NvInfer.h:1292
An engine for executing inference on a built network, with functionally unsafe features.
Definition: NvInferRuntime.h:3197
Layer that represents a cumulative operation across a tensor.
Definition: NvInfer.h:6838
bool setOperation(CumulativeOperation op) noexcept
Set the cumulative operation for the layer.
Definition: NvInfer.h:6849
void setReverse(bool reverse) noexcept
Specify whether the cumulative operation should be applied backward.
Definition: NvInfer.h:6897
apiv::VCumulativeLayer * mImpl
Definition: NvInfer.h:6915
bool getExclusive() const noexcept
Get whether it is exclusive accumulation or inclusive accumulation.
Definition: NvInfer.h:6885
virtual ~ICumulativeLayer() noexcept=default
bool getReverse() const noexcept
Get the boolean that specifies whether the cumulative operation should be applied backward.
Definition: NvInfer.h:6909
void setExclusive(bool exclusive) noexcept
Set whether it is an exclusive accumulation or inclusive accumulation.
Definition: NvInfer.h:6873
CumulativeOperation getOperation() const noexcept
Get the cumulative operation for the layer.
Definition: NvInfer.h:6861
A deconvolution layer in a network definition.
Definition: NvInfer.h:2172
void setBiasWeights(Weights weights) noexcept
Set the bias weights for the deconvolution.
Definition: NvInfer.h:2260
int64_t getNbGroups() const noexcept
Get the number of groups for a deconvolution.
Definition: NvInfer.h:2221
Weights getKernelWeights() const noexcept
Get the kernel weights for the deconvolution.
Definition: NvInfer.h:2245
void setPrePadding(Dims const &padding) noexcept
Set the multi-dimension pre-padding of the deconvolution.
Definition: NvInfer.h:2287
Dims getStrideNd() const noexcept
Get the multi-dimension stride of the deconvolution.
Definition: NvInfer.h:2402
Dims getDilationNd() const noexcept
Get the multi-dimension dilation of the deconvolution.
Definition: NvInfer.h:2468
Weights getBiasWeights() const noexcept
Get the bias weights for the deconvolution.
Definition: NvInfer.h:2270
void setKernelWeights(Weights weights) noexcept
Set the kernel weights for the deconvolution.
Definition: NvInfer.h:2235
int64_t getNbOutputMaps() const noexcept
Get the number of output feature maps for the deconvolution.
Definition: NvInfer.h:2191
void setStrideNd(Dims const &stride) noexcept
Set the multi-dimension stride of the deconvolution.
Definition: NvInfer.h:2392
Dims getPostPadding() const noexcept
Get the padding.
Definition: NvInfer.h:2324
Dims getKernelSizeNd() const noexcept
Get the multi-dimension kernel size of the deconvolution.
Definition: NvInfer.h:2375
void setPostPadding(Dims const &padding) noexcept
Set the multi-dimension post-padding of the deconvolution.
Definition: NvInfer.h:2314
void setKernelSizeNd(Dims const &kernelSize) noexcept
Set the multi-dimension kernel size of the deconvolution.
Definition: NvInfer.h:2365
virtual ~IDeconvolutionLayer() noexcept=default
void setPaddingNd(Dims const &padding) noexcept
Set the multi-dimension padding of the deconvolution.
Definition: NvInfer.h:2420
void setNbOutputMaps(int64_t nbOutputMaps) noexcept
Set the number of output feature maps for the deconvolution.
Definition: NvInfer.h:2181
Dims getPaddingNd() const noexcept
Get the multi-dimension padding of the deconvolution.
Definition: NvInfer.h:2432
void setDilationNd(Dims const &dilation) noexcept
Set the multi-dimension dilation of the deconvolution.
Definition: NvInfer.h:2458
void setPaddingMode(PaddingMode paddingMode) noexcept
Set the padding mode.
Definition: NvInfer.h:2338
void setNbGroups(int64_t nbGroups) noexcept
Set the number of groups for a deconvolution.
Definition: NvInfer.h:2211
Dims getPrePadding() const noexcept
Get the pre-padding.
Definition: NvInfer.h:2297
PaddingMode getPaddingMode() const noexcept
Get the padding mode.
Definition: NvInfer.h:2350
A Dequantize layer in a network definition.
Definition: NvInfer.h:5736
TRT_NODISCARD Dims getBlockShape() const noexcept
Get the shape of the quantization block.
Definition: NvInfer.h:5785
void setToType(DataType toType) noexcept
Set the Dequantize layer output type.
Definition: NvInfer.h:5801
virtual ~IDequantizeLayer() noexcept=default
int32_t getAxis() const noexcept
Get the quantization axis.
Definition: NvInfer.h:5746
bool setBlockShape(Dims const &blockShape) noexcept
Set the shape of the quantization block.
Definition: NvInfer.h:5774
DataType getToType() const noexcept
Return the Dequantize layer output type.
Definition: NvInfer.h:5813
void setAxis(int32_t axis) noexcept
Set the quantization axis.
Definition: NvInfer.h:5757
Definition: NvInfer.h:8003
virtual ~IDistCollectiveLayer() noexcept=default
A network layer to perform dynamic quantization.
Definition: NvInfer.h:5841
DataType getScaleType() const noexcept
Return the scale factors data type.
Definition: NvInfer.h:5907
TRT_DEPRECATED void setAxis(int32_t axis) noexcept
Set the axis along which block quantization occurs.
Definition: NvInfer.h:5920
TRT_DEPRECATED void setBlockSize(int32_t size) noexcept
Set the size of the quantization block.
Definition: NvInfer.h:5943
Dims getBlockShape() const noexcept
Get the shape of the quantization block.
Definition: NvInfer.h:5978
void setScaleType(DataType scaleType) noexcept
Set the data type of the scale factors used to quantize the data.
Definition: NvInfer.h:5894
DataType getToType() const noexcept
Return DynamicQuantizeLayer's quantized output type.
Definition: NvInfer.h:5881
TRT_DEPRECATED int32_t getAxis() const noexcept
Get the axis along which blocking occurs.
Definition: NvInfer.h:5930
virtual ~IDynamicQuantizeLayer() noexcept=default
void setToType(DataType toType) noexcept
Set DynamicQuantizeLayer's quantized output type.
Definition: NvInfer.h:5868
void setBlockShape(Dims const &blockShape) noexcept
Set the shape of the quantization block.
Definition: NvInfer.h:5966
TRT_DEPRECATED int32_t getBlockSize() const noexcept
Get the size of the quantization block.
Definition: NvInfer.h:5953
An Einsum layer in a network.
Definition: NvInfer.h:6023
bool setEquation(char const *equation) noexcept
Set the equation. The equation is a comma-separated list of subscript labels, where each label refers...
Definition: NvInfer.h:6034
virtual ~IEinsumLayer() noexcept=default
char const * getEquation() const noexcept
Return the equation.
Definition: NvInfer.h:6044
An elementwise layer in a network definition.
Definition: NvInfer.h:2542
virtual ~IElementWiseLayer() noexcept=default
apiv::VElementWiseLayer * mImpl
Definition: NvInfer.h:2571
ElementWiseOperation getOperation() const noexcept
Get the binary operation for the layer.
Definition: NvInfer.h:2565
void setOperation(ElementWiseOperation op) noexcept
Set the binary operation for the layer.
Definition: NvInfer.h:2553
Generate a tensor according to a specified mode.
Definition: NvInfer.h:5237
bool isAlphaBetaInt64() const noexcept
Return true if alpha/beta have type int64, false if they have type double.
Definition: NvInfer.h:5469
FillOperation getOperation() const noexcept
Get the fill operation for the layer.
Definition: NvInfer.h:5283
void setOperation(FillOperation op) noexcept
Set the fill operation for the layer.
Definition: NvInfer.h:5273
DataType getToType() const noexcept
Get the fill layer output type.
Definition: NvInfer.h:5499
void setAlphaInt64(int64_t alpha) noexcept
Set the alpha parameter with int64 datatype.
Definition: NvInfer.h:5412
void setBetaInt64(int64_t beta) noexcept
Set the beta parameter with int64 datatype.
Definition: NvInfer.h:5446
void setBeta(double beta) noexcept
Set the beta parameter.
Definition: NvInfer.h:5336
int64_t getAlphaInt64() const noexcept
Get the value of alpha parameter with int64 datatype.
Definition: NvInfer.h:5427
int64_t getBetaInt64() const noexcept
Get the value of beta parameter with int64 datatype.
Definition: NvInfer.h:5461
double getAlpha() const noexcept
Get the value of alpha parameter.
Definition: NvInfer.h:5317
void setDimensions(Dims const &dimensions) noexcept
Set the output tensor's dimensions.
Definition: NvInfer.h:5248
void setAlpha(double alpha) noexcept
Set the alpha parameter.
Definition: NvInfer.h:5302
void setToType(DataType toType) noexcept
Set the fill layer output type.
Definition: NvInfer.h:5487
Dims getDimensions() const noexcept
Get the output tensor's dimensions.
Definition: NvInfer.h:5263
double getBeta() const noexcept
Get the value of beta parameter.
Definition: NvInfer.h:5351
virtual ~IFillLayer() noexcept=default
A Gather layer in a network definition. Supports several kinds of gathering.
Definition: NvInfer.h:2675
void setGatherAxis(int32_t axis) noexcept
Set the axis used by GatherMode::kELEMENTS and GatherMode::kDEFAULT The axis must be less than the nu...
Definition: NvInfer.h:2686
void setNbElementWiseDims(int32_t elementWiseDims) noexcept
Set the number of leading dimensions of indices tensor to be handled elementwise.
Definition: NvInfer.h:2721
apiv::VGatherLayer * mImpl
Definition: NvInfer.h:2757
int32_t getNbElementWiseDims() const noexcept
Get the number of leading dimensions of indices tensor to be handled elementwise.
Definition: NvInfer.h:2731
void setMode(GatherMode mode) noexcept
Set the gather mode.
Definition: NvInfer.h:2741
int32_t getGatherAxis() const noexcept
Get the axis to gather on.
Definition: NvInfer.h:2698
GatherMode getMode() const noexcept
Get the gather mode.
Definition: NvInfer.h:2751
virtual ~IGatherLayer() noexcept=default
A GridSample layer in a network definition.
Definition: NvInfer.h:6245
void setInterpolationMode(InterpolationMode mode) noexcept
Set the grid sample interpolation mode.
Definition: NvInfer.h:6252
bool setSampleMode(SampleMode mode) noexcept
Set the sample mode.
Definition: NvInfer.h:6298
void setAlignCorners(bool alignCorners) noexcept
Set the align corners mode.
Definition: NvInfer.h:6274
apiv::VGridSampleLayer * mImpl
Definition: NvInfer.h:6316
SampleMode getSampleMode() const noexcept
Get the sample mode.
Definition: NvInfer.h:6310
InterpolationMode getInterpolationMode() const noexcept
Get the grid sample interpolation mode.
Definition: NvInfer.h:6264
bool getAlignCorners() const noexcept
Get the align corners mode.
Definition: NvInfer.h:6286
virtual ~IGridSampleLayer() noexcept=default
Class to handle library allocated memory that is accessible to the user.
Definition: NvInferRuntime.h:142
A layer that represents the identity function.
Definition: NvInfer.h:3971
apiv::VIdentityLayer * mImpl
Definition: NvInfer.h:3973
virtual ~IIdentityLayer() noexcept=default
This is a base class for Conditional boundary layers.
Definition: NvInfer.h:4626
IIfConditional * getConditional() const noexcept
Get a pointer to the IIfConditional associated with this boundary layer.
Definition: NvInfer.h:4631
virtual ~IIfConditionalBoundaryLayer() noexcept=default
Helper for constructing conditionally-executed subgraphs.
Definition: NvInfer.h:4709
IIfConditionalInputLayer * addInput(ITensor &input) noexcept
Add an If-conditional input.
Definition: NvInfer.h:4750
char const * getName() const noexcept
Return the name of the conditional.
Definition: NvInfer.h:4775
virtual ~IIfConditional() noexcept=default
IConditionLayer * setCondition(ITensor &condition) noexcept
Set the condition tensor for this If-Conditional construct.
Definition: NvInfer.h:4720
IIfConditionalOutputLayer * addOutput(ITensor &trueSubgraphOutput, ITensor &falseSubgraphOutput) noexcept
Add an If-conditional output.
Definition: NvInfer.h:4738
void setName(char const *name) noexcept
Set the name of the conditional.
Definition: NvInfer.h:4765
This layer represents an input to an IIfConditional.
Definition: NvInfer.h:4677
virtual ~IIfConditionalInputLayer() noexcept=default
This layer represents an output of an IIfConditional.
Definition: NvInfer.h:4664
virtual ~IIfConditionalOutputLayer() noexcept=default
Application-implemented interface for calibration.
Definition: NvInfer.h:9831
virtual TRT_DEPRECATED int32_t getBatchSize() const noexcept=0
Get the batch size used for calibration batches.
A layer to do iterations.
Definition: NvInfer.h:4940
virtual ~IIteratorLayer() noexcept=default
void setReverse(bool reverse) noexcept
Set iteration order to be reverse.
Definition: NvInfer.h:4967
bool getReverse() const noexcept
Check if the iteration order is reverse.
Definition: NvInfer.h:4977
int32_t getAxis() const noexcept
Get axis being iterated over.
Definition: NvInfer.h:4953
void setAxis(int32_t axis) noexcept
Set axis to iterate over.
Definition: NvInfer.h:4945
Layer that represents a KVCacheUpdate operation.
Definition: NvInfer.h:7505
bool setCacheMode(KVCacheMode cacheMode) noexcept
Set the mode of the KVCacheUpdate layer.
Definition: NvInfer.h:7528
virtual ~IKVCacheUpdateLayer() noexcept=default
KVCacheMode getCacheMode() const noexcept
Get the mode of the KVCacheUpdate layer.
Definition: NvInfer.h:7538
apiv::VKVCacheUpdateLayer * mImpl
Definition: NvInfer.h:7544
A LRN layer in a network definition.
Definition: NvInfer.h:1786
int64_t getWindowSize() const noexcept
Get the LRN window size.
Definition: NvInfer.h:1807
float getAlpha() const noexcept
Get the LRN alpha value.
Definition: NvInfer.h:1829
void setWindowSize(int64_t windowSize) noexcept
Set the LRN window size.
Definition: NvInfer.h:1797
void setK(float k) noexcept
Set the LRN K value.
Definition: NvInfer.h:1863
void setAlpha(float alpha) noexcept
Set the LRN alpha value.
Definition: NvInfer.h:1819
void setBeta(float beta) noexcept
Set the LRN beta value.
Definition: NvInfer.h:1841
virtual ~ILRNLayer() noexcept=default
float getBeta() const noexcept
Get the LRN beta value.
Definition: NvInfer.h:1851
float getK() const noexcept
Get the LRN K value.
Definition: NvInfer.h:1873
Base class for all layer classes in a network definition.
Definition: NvInfer.h:583
TRT_DEPRECATED void setPrecision(DataType dataType) noexcept
Set the preferred or required computational precision of this layer in a weakly-typed network.
Definition: NvInfer.h:703
TRT_DEPRECATED void setOutputType(int32_t index, DataType dataType) noexcept
Set the output type of this layer in a weakly-typed network.
Definition: NvInfer.h:791
TRT_DEPRECATED bool precisionIsSet() const noexcept
whether the computational precision has been set for this layer
Definition: NvInfer.h:729
void setMetadata(char const *metadata) noexcept
Set the metadata for this layer.
Definition: NvInfer.h:854
TRT_DEPRECATED void resetOutputType(int32_t index) noexcept
reset the output type for this layer
Definition: NvInfer.h:836
void setName(char const *name) noexcept
Set the name of a layer.
Definition: NvInfer.h:604
int32_t getNbInputs() const noexcept
Get the number of inputs of a layer.
Definition: NvInfer.h:622
int32_t getNbRanks() const noexcept
Get the number of ranks for multi-device execution.
Definition: NvInfer.h:900
char const * getMetadata() const noexcept
Get the metadata of the layer.
Definition: NvInfer.h:867
DataType getOutputType(int32_t index) const noexcept
get the output type of this layer
Definition: NvInfer.h:806
DataType getPrecision() const noexcept
get the computational precision of this layer
Definition: NvInfer.h:715
TRT_DEPRECATED bool outputTypeIsSet(int32_t index) const noexcept
whether the output type has been set for this layer
Definition: NvInfer.h:822
char const * getName() const noexcept
Return the name of a layer.
Definition: NvInfer.h:614
int32_t getNbOutputs() const noexcept
Get the number of outputs of a layer.
Definition: NvInfer.h:643
ITensor * getOutput(int32_t index) const noexcept
Get the layer output corresponding to the given index.
Definition: NvInfer.h:653
void setInput(int32_t index, ITensor &tensor) noexcept
Replace an input of this layer with a specific tensor.
Definition: NvInfer.h:670
ITensor * getInput(int32_t index) const noexcept
Get the layer input corresponding to the given index.
Definition: NvInfer.h:635
bool setNbRanks(int32_t nbRanks) noexcept
Set the number of ranks for multi-device execution.
Definition: NvInfer.h:888
LayerType getType() const noexcept
Return the type of a layer.
Definition: NvInfer.h:590
TRT_DEPRECATED void resetPrecision() noexcept
reset the computational precision for this layer
Definition: NvInfer.h:741
virtual ~ILayer() noexcept=default
Application-implemented logging interface for the builder, refitter and runtime.
Definition: NvInferRuntime.h:1588
This is a base class for Loop boundary layers.
Definition: NvInfer.h:4603
virtual ~ILoopBoundaryLayer() noexcept=default
ILoop * getLoop() const noexcept
Get a pointer to ILoop associated with this boundary layer.
Definition: NvInfer.h:4608
Helper for creating a recurrent subgraph.
Definition: NvInfer.h:4998
void setName(char const *name) noexcept
Set the name of the loop.
Definition: NvInfer.h:5068
ITripLimitLayer * addTripLimit(ITensor &tensor, TripLimit limit) noexcept
Add a trip-count limiter, based on the given tensor.
Definition: NvInfer.h:5027
IIteratorLayer * addIterator(ITensor &tensor, int32_t axis=0, bool reverse=false) noexcept
Return layer that subscripts tensor by loop iteration.
Definition: NvInfer.h:5040
ILoopOutputLayer * addLoopOutput(ITensor &tensor, LoopOutput outputKind, int32_t axis=0) noexcept
Make an output for this loop, based on the given tensor.
Definition: NvInfer.h:5053
virtual ~ILoop() noexcept=default
char const * getName() const noexcept
Return the name of the loop.
Definition: NvInfer.h:5078
IRecurrenceLayer * addRecurrence(ITensor &initialValue) noexcept
Create a recurrence layer for this loop with initialValue as its first input.
Definition: NvInfer.h:5006
An ILoopOutputLayer is the sole way to get output from a loop.
Definition: NvInfer.h:4840
virtual ~ILoopOutputLayer() noexcept=default
int32_t getAxis() const noexcept
Get axis being concatenated over.
Definition: NvInfer.h:4870
LoopOutput getLoopOutput() const noexcept
Get which kind a loop output has.
Definition: NvInfer.h:4845
void setAxis(int32_t axis) noexcept
Set where to insert the concatenation axis. Ignored if getLoopOutput() is kLAST_VALUE.
Definition: NvInfer.h:4862
Layer that represents a Matrix Multiplication.
Definition: NvInfer.h:3818
apiv::VMatrixMultiplyLayer * mImpl
Definition: NvInfer.h:3846
virtual ~IMatrixMultiplyLayer() noexcept=default
MatrixOperation getOperation(int32_t index) const noexcept
Get the operation for an input tensor.
Definition: NvInfer.h:3840
void setOperation(int32_t index, MatrixOperation op) noexcept
Set the operation for an input tensor.
Definition: NvInfer.h:3828
A MoE layer in a network definition. Mixture of Experts (MoE) is a collection of experts with each ex...
Definition: NvInfer.h:7687
void setSwigluParamLimit(float limit) noexcept
Set the SwiGLU parameter limit.
Definition: NvInfer.h:7902
void setDynQOutputScaleType(DataType type) noexcept
Set the dynamic quantization output scale type.
Definition: NvInfer.h:7855
MoEActType getActivationType() const noexcept
Get the activation type for the MoE layer.
Definition: NvInfer.h:7736
void setQuantizationToType(DataType type) noexcept
Set the data type the mul output is quantized to.
Definition: NvInfer.h:7803
void setQuantizationDynamicDblQ(ITensor &fcDownActivationDblQScale, DataType dataType, Dims const &blockShape, DataType dynQOutputScaleType) noexcept
Configure dynamic quantization (with double quantization) after the mul op. ┌── fcGate ── activation ...
Definition: NvInfer.h:7788
void setQuantizationStatic(ITensor &fcDownActivationScale, DataType dataType) noexcept
Configure static quantization after the mul op. ┌── fcGate ── activation ───┐ │ │ hiddenStates ───┤ ├...
Definition: NvInfer.h:7759
virtual ~IMoELayer() noexcept=default
float getSwigluParamLimit() const noexcept
Get the SwiGLU parameter limit.
Definition: NvInfer.h:7914
DataType getQuantizationToType() const noexcept
Get the data type the mul in MoE layer is quantized to.
Definition: NvInfer.h:7815
DataType getDynQOutputScaleType() const noexcept
Get the dynamic quantization output scale type.
Definition: NvInfer.h:7867
void setActivationType(MoEActType activationType) noexcept
Set the activation type for the MoE layer.
Definition: NvInfer.h:7724
Dims getQuantizationBlockShape() const noexcept
Get the block shape for the quantization of the Mul output.
Definition: NvInfer.h:7843
void setGatedWeights(ITensor &fcGateWeights, ITensor &fcUpWeights, ITensor &fcDownWeights, MoEActType activationType) noexcept
Set the weights of the experts when each expert is a GLU (gated linear unit). In each GLU,...
Definition: NvInfer.h:7700
float getSwigluParamBeta() const noexcept
Get the SwiGLU parameter beta.
Definition: NvInfer.h:7966
void setSwigluParamBeta(float beta) noexcept
Set the SwiGLU parameter beta.
Definition: NvInfer.h:7954
void setGatedBiases(ITensor &fcGateBiases, ITensor &fcUpBiases, ITensor &fcDownBiases) noexcept
Set the biases of the experts when each expert is a GLU (gated linear unit). In each GLU,...
Definition: NvInfer.h:7712
void setSwigluParams(float limit, float alpha, float beta) noexcept
Set the SwiGLU parameters.
Definition: NvInfer.h:7888
void setQuantizationBlockShape(Dims const &blockShape) noexcept
Set the block shape for the quantization of the Mul output.
Definition: NvInfer.h:7831
void setInput(int32_t index, ITensor &tensor) noexcept
Set the input of the MoE layer.
Definition: NvInfer.h:7983
float getSwigluParamAlpha() const noexcept
Get the SwiGLU parameter alpha.
Definition: NvInfer.h:7940
void setSwigluParamAlpha(float alpha) noexcept
Set the SwiGLU parameter alpha.
Definition: NvInfer.h:7928
A non-maximum suppression layer in a network definition.
Definition: NvInfer.h:6397
virtual ~INMSLayer() noexcept=default
void setTopKBoxLimit(int32_t limit) noexcept
Set the TopK box limit parameter for the layer.
Definition: NvInfer.h:6434
void setBoundingBoxFormat(BoundingBoxFormat fmt) noexcept
Set the bounding box format parameter for the layer.
Definition: NvInfer.h:6408
BoundingBoxFormat getBoundingBoxFormat() const noexcept
Get the bounding box format parameter for the layer.
Definition: NvInfer.h:6420
bool setIndicesType(DataType type) noexcept
Set the indices type for the layer.
Definition: NvInfer.h:6479
apiv::VNMSLayer * mImpl
Definition: NvInfer.h:6497
int32_t getTopKBoxLimit() const noexcept
Get the TopK box limit parameter for the layer.
Definition: NvInfer.h:6444
DataType getIndicesType() const noexcept
Return the NMS layer indices type.
Definition: NvInfer.h:6491
A network definition for input to the builder.
Definition: NvInfer.h:8027
IConcatenationLayer * addConcatenation(ITensor *const *inputs, int32_t nbInputs) noexcept
Add a concatenation layer to the network.
Definition: NvInfer.h:8255
IShuffleLayer * addShuffle(ITensor &input) noexcept
Add a shuffle layer to the network.
Definition: NvInfer.h:8318
void setName(char const *name) noexcept
Sets the name of the network.
Definition: NvInfer.h:8784
ITopKLayer * addTopK(ITensor &input, TopKOperation op, int32_t k, uint32_t reduceAxes, DataType indicesType) noexcept
Add a TopK layer to the network.
Definition: NvInfer.h:8514
bool markDebug(ITensor &tensor) noexcept
Mark a tensor as a debug tensor.
Definition: NvInfer.h:8098
ILRNLayer * addLRN(ITensor &input, int64_t window, float alpha, float beta, float k) noexcept
Add a LRN layer to the network.
Definition: NvInfer.h:8199
ICumulativeLayer * addCumulative(ITensor &input, ITensor &axis, CumulativeOperation operation, bool exclusive, bool reverse) noexcept
Add a cumulative layer to the network.
Definition: NvInfer.h:9532
IAssertionLayer * addAssertion(ITensor &condition, char const *message) noexcept
Add an assertion layer to the network.
Definition: NvInfer.h:9100
TRT_DEPRECATED INonZeroLayer * addNonZero(ITensor &input) noexcept
Add a nonzero layer to the network.
Definition: NvInfer.h:8605
IConvolutionLayer * addConvolutionNd(ITensor &input, int64_t nbOutputMaps, Dims const &kernelSize, Weights kernelWeights, Weights biasWeights) noexcept
Add a multi-dimension convolution layer to the network.
Definition: NvInfer.h:8919
ICastLayer * addCast(ITensor &input, DataType toType) noexcept
Add a cast layer.
Definition: NvInfer.h:8674
IScaleLayer * addScaleNd(ITensor &input, ScaleMode mode, Weights shift, Weights scale, Weights power, int32_t channelAxis) noexcept
Add a multi-dimension scale layer to the network.
Definition: NvInfer.h:8998
char const * getName() const noexcept
Returns the name associated with the network.
Definition: NvInfer.h:8798
IParametricReLULayer * addParametricReLU(ITensor &input, ITensor &slope) noexcept
Add a parametric ReLU layer to the network.
Definition: NvInfer.h:8897
ITensor * getOutput(int32_t index) const noexcept
Get the output tensor specified by the given index.
Definition: NvInfer.h:8419
ITensor * getInput(int32_t index) const noexcept
Get the input tensor specified by the given index.
Definition: NvInfer.h:8389
TRT_DEPRECATED ITopKLayer * addTopK(ITensor &input, TopKOperation op, int32_t k, uint32_t reduceAxes) noexcept
Add a TopK layer to the network.
Definition: NvInfer.h:8481
IDequantizeLayer * addDequantize(ITensor &input, ITensor &scale, DataType outputType) noexcept
Add a dequantization layer to the network.
Definition: NvInfer.h:9269
bool unmarkOutputForShapes(ITensor &tensor) noexcept
Undo markOutputForShapes.
Definition: NvInfer.h:8879
IFillLayer * addFill(Dims const &dimensions, FillOperation op, DataType outputType) noexcept
Add a fill layer to the network.
Definition: NvInfer.h:9151
ILoop * addLoop() noexcept
Add a loop to the network.
Definition: NvInfer.h:9029
bool markUnfusedTensorsAsDebugTensors() noexcept
Mark unfused tensors as debug tensors.
Definition: NvInfer.h:8146
TRT_NODISCARD INormalizationLayer * addNormalizationV2(ITensor &input, ITensor &scale, ITensor &bias, uint32_t axesMask) noexcept
Add a normalization layer to the network.
Definition: NvInfer.h:9782
IActivationLayer * addActivation(ITensor &input, ActivationType type) noexcept
Add an activation layer to the network.
Definition: NvInfer.h:8180
TRT_DEPRECATED IFillLayer * addFill(Dims const &dimensions, FillOperation op) noexcept
Add a fill layer to the network.
Definition: NvInfer.h:9125
ISliceLayer * addSlice(ITensor &input, Dims const &start, Dims const &size, Dims const &stride) noexcept
Add a slice layer to the network.
Definition: NvInfer.h:8760
virtual ~INetworkDefinition() noexcept=default
TRT_DEPRECATED IQuantizeLayer * addQuantize(ITensor &input, ITensor &scale) noexcept
Add a quantization layer to the network.
Definition: NvInfer.h:9310
virtual IBuilder & getBuilder() const noexcept
Return the builder from which this INetworkDefinition was created.
Definition: NvInfer.h:9678
ILayer * getLayer(int32_t index) const noexcept
Get the layer specified by the given index.
Definition: NvInfer.h:8361
bool isDebugTensor(ITensor const &tensor) const noexcept
Check if a tensor is marked as debug tensor.
Definition: NvInfer.h:8124
bool getFlag(NetworkDefinitionCreationFlag networkDefinitionCreationFlag) const noexcept
Returns true if the network definition creation flag is set.
Definition: NvInfer.h:8850
IIfConditional * addIfConditional() noexcept
Add an if-then-else to the network.
Definition: NvInfer.h:9044
IErrorRecorder * getErrorRecorder() const noexcept
Get the ErrorRecorder assigned to this interface.
Definition: NvInfer.h:9225
ISqueezeLayer * addSqueeze(ITensor &input, ITensor &axes) noexcept
Add a squeeze layer to the network.
Definition: NvInfer.h:9735
TRT_DEPRECATED INMSLayer * addNMS(ITensor &boxes, ITensor &scores, ITensor &maxOutputBoxesPerClass) noexcept
Add a non-maximum suppression layer to the network.
Definition: NvInfer.h:9441
IReverseSequenceLayer * addReverseSequence(ITensor &input, ITensor &sequenceLens) noexcept
Add a ReverseSequence layer to the network.
Definition: NvInfer.h:9478
TRT_DEPRECATED IDynamicQuantizeLayer * addDynamicQuantize(ITensor &input, int32_t axis, int32_t blockSize, DataType outputType, DataType scaleType) noexcept
Add a dynamic quantization layer to the network.
Definition: NvInfer.h:9361
int32_t getNbInputs() const noexcept
Get the number of inputs in the network.
Definition: NvInfer.h:8373
NetworkDefinitionCreationFlags getFlags() const noexcept
Get the network definition creation flags for this network definition object. Defaults to 0.
Definition: NvInfer.h:8838
IQuantizeLayer * addQuantize(ITensor &input, ITensor &scale, DataType outputType) noexcept
Add a quantization layer to the network.
Definition: NvInfer.h:9334
IDynamicQuantizeLayer * addDynamicQuantizeV2(ITensor &input, Dims const &blockShape, DataType outputType, DataType scaleType) noexcept
Add a dynamic quantization layer to the network.
Definition: NvInfer.h:9385
IReduceLayer * addReduce(ITensor &input, ReduceOperation operation, uint32_t reduceAxes, bool keepDimensions) noexcept
Add a reduce layer to the network.
Definition: NvInfer.h:8445
IUnaryLayer * addUnary(ITensor &input, UnaryOperation operation) noexcept
Add a unary layer to the network.
Definition: NvInfer.h:8304
IGridSampleLayer * addGridSample(ITensor &input, ITensor &grid) noexcept
Add a GridSample layer to the network.
Definition: NvInfer.h:9419
void removeTensor(ITensor &tensor) noexcept
Remove a tensor from the network definition.
Definition: NvInfer.h:8689
bool areWeightsMarkedRefittable(char const *name) const noexcept
Whether the weight has been marked as refittable.
Definition: NvInfer.h:9716
ISelectLayer * addSelect(ITensor &condition, ITensor &thenInput, ITensor &elseInput) noexcept
Add a select layer to the network.
Definition: NvInfer.h:9083
IScatterLayer * addScatter(ITensor &data, ITensor &indices, ITensor &updates, ScatterMode mode) noexcept
Add a Scatter layer to the network with specified mode and axis=0.
Definition: NvInfer.h:9289
TRT_DEPRECATED INormalizationLayer * addNormalization(ITensor &input, ITensor &scale, ITensor &bias, uint32_t axesMask) noexcept
Add a normalization layer to the network.
Definition: NvInfer.h:9510
int32_t getNbLayers() const noexcept
Get the number of layers in the network.
Definition: NvInfer.h:8347
TRT_DEPRECATED bool hasImplicitBatchDimension() const noexcept
Query whether the network was created with an implicit batch dimension.
Definition: NvInfer.h:8828
apiv::VNetworkDefinition * mImpl
Definition: NvInfer.h:9788
IKVCacheUpdateLayer * addKVCacheUpdate(ITensor &cache, ITensor &update, ITensor &writeIndices, KVCacheMode cacheMode) noexcept
Add a KVCacheUpdate layer to the network.
Definition: NvInfer.h:9618
bool markOutputForShapes(ITensor &tensor) noexcept
Enable tensor's value to be computed by IExecutionContext::getShapeBinding.
Definition: NvInfer.h:8867
IOneHotLayer * addOneHot(ITensor &indices, ITensor &values, ITensor &depth, int32_t axis) noexcept
Add a OneHot layer to the network.
Definition: NvInfer.h:8335
IScaleLayer * addScale(ITensor &input, ScaleMode mode, Weights shift, Weights scale, Weights power) noexcept
Add a Scale layer to the network.
Definition: NvInfer.h:8225
IPluginV3Layer * addPluginV3(ITensor *const *inputs, int32_t nbInputs, ITensor *const *shapeInputs, int32_t nbShapeInputs, IPluginV3 &plugin) noexcept
Add a plugin layer implementing the IPluginV3 interface to the network.
Definition: NvInfer.h:8740
void unmarkOutput(ITensor &tensor) noexcept
Unmark a tensor as a network output.
Definition: NvInfer.h:8701
IIdentityLayer * addIdentity(ITensor &input) noexcept
Add an identity layer.
Definition: NvInfer.h:8659
IGatherLayer * addGatherV2(ITensor &data, ITensor &indices, GatherMode mode) noexcept
Add gather with specified mode, axis=0 and nbElementWiseDims=0.
Definition: NvInfer.h:8546
INonZeroLayer * addNonZero(ITensor &input, DataType indicesType) noexcept
Add a nonzero layer to the network.
Definition: NvInfer.h:8621
IElementWiseLayer * addElementWise(ITensor &input1, ITensor &input2, ElementWiseOperation op) noexcept
Add an elementwise layer to the network.
Definition: NvInfer.h:8282
IConstantLayer * addConstant(Dims const &dimensions, Weights weights) noexcept
Add a constant layer to the network.
Definition: NvInfer.h:8645
void setErrorRecorder(IErrorRecorder *recorder) noexcept
Set the ErrorRecorder for this interface.
Definition: NvInfer.h:9210
IPoolingLayer * addPoolingNd(ITensor &input, PoolingType type, Dims const &windowSize) noexcept
Add a multi-dimension pooling layer to the network.
Definition: NvInfer.h:8939
INMSLayer * addNMS(ITensor &boxes, ITensor &scores, ITensor &maxOutputBoxesPerClass, DataType indicesType) noexcept
Add a non-maximum suppression layer to the network.
Definition: NvInfer.h:9461
IRaggedSoftMaxLayer * addRaggedSoftMax(ITensor &input, ITensor &bounds) noexcept
Add a RaggedSoftMax layer to the network.
Definition: NvInfer.h:8565
IShapeLayer * addShape(ITensor &input) noexcept
Add a shape layer to the network.
Definition: NvInfer.h:8814
IGatherLayer * addGather(ITensor &data, ITensor &indices, int32_t axis) noexcept
Add gather with mode GatherMode::kDEFAULT and specified axis and nbElementWiseDims=0.
Definition: NvInfer.h:8530
IAttention * addAttention(ITensor &query, ITensor &key, ITensor &value, AttentionNormalizationOp normOp, bool causal) noexcept
Add an attention to the network.
Definition: NvInfer.h:9559
bool unmarkWeightsRefittable(char const *name) noexcept
Unmark weights as refittable when the builder flag kREFIT_INDIVIDUAL is set.
Definition: NvInfer.h:9703
bool markWeightsRefittable(char const *name) noexcept
Mark weights as refittable when the builder flag kREFIT_INDIVIDUAL is set.
Definition: NvInfer.h:9691
IRotaryEmbeddingLayer * addRotaryEmbedding(ITensor &input, ITensor &cosCache, ITensor &sinCache, bool interleaved, int32_t rotaryEmbeddingDim) noexcept
Add a Rotary Position Embedding (RoPE) layer to the network.
Definition: NvInfer.h:9584
IDeconvolutionLayer * addDeconvolutionNd(ITensor &input, int64_t nbOutputMaps, Dims kernelSize, Weights kernelWeights, Weights biasWeights) noexcept
Add a multi-dimension deconvolution layer to the network.
Definition: NvInfer.h:8961
IResizeLayer * addResize(ITensor &input) noexcept
Add a resize layer to the network.
Definition: NvInfer.h:9015
IUnsqueezeLayer * addUnsqueeze(ITensor &input, ITensor &axes) noexcept
Add an unsqueeze layer to the network.
Definition: NvInfer.h:9756
IMatrixMultiplyLayer * addMatrixMultiply(ITensor &input0, MatrixOperation op0, ITensor &input1, MatrixOperation op1) noexcept
Add a MatrixMultiply layer to the network.
Definition: NvInfer.h:8586
ISoftMaxLayer * addSoftMax(ITensor &input) noexcept
Add a SoftMax layer to the network.
Definition: NvInfer.h:8238
bool unmarkDebug(ITensor &tensor) noexcept
Unmark a tensor as a debug tensor.
Definition: NvInfer.h:8114
IEinsumLayer * addEinsum(ITensor *const *inputs, int32_t nbInputs, char const *equation) noexcept
Add an Einsum layer to the network.
Definition: NvInfer.h:9401
void markOutput(ITensor &tensor) noexcept
Mark a tensor as a network output.
Definition: NvInfer.h:8080
TRT_DEPRECATED IPluginV2Layer * addPluginV2(ITensor *const *inputs, int32_t nbInputs, IPluginV2 &plugin) noexcept
Add a plugin layer to the network using the IPluginV2 interface.
Definition: NvInfer.h:8722
IPaddingLayer * addPaddingNd(ITensor &input, Dims const &prePadding, Dims const &postPadding) noexcept
Add a padding layer to the network. Only 2D padding is currently supported.
Definition: NvInfer.h:9167
TRT_DEPRECATED IDequantizeLayer * addDequantize(ITensor &input, ITensor &scale) noexcept
Add a dequantization layer to the network.
Definition: NvInfer.h:9246
int32_t getNbOutputs() const noexcept
Get the number of outputs in the network.
Definition: NvInfer.h:8403
bool setWeightsName(Weights weights, char const *name) noexcept
Associate a name with all current uses of the given weights.
Definition: NvInfer.h:9191
TRT_NODISCARD IDistCollectiveLayer * addDistCollective(ITensor &input, CollectiveOperation distCollectiveOp, ReduceOperation reduceOp, int64_t root, int64_t *groups, int64_t groupSize) noexcept
Add a DistCollective layer to the network.
Definition: NvInfer.h:9666
IMoELayer * addMoE(ITensor &hiddenStates, ITensor &selectedExpertsForTokens, ITensor &scoresForSelectedExperts) noexcept
Add a MoE (Mixture of Experts) layer to the network.
Definition: NvInfer.h:9638
bool unmarkUnfusedTensorsAsDebugTensors() noexcept
Undo the marking of unfused tensors as debug tensors.
Definition: NvInfer.h:8160
Forward declaration of IEngineInspector for use by other interfaces.
Definition: NvInferRuntime.h:51
Definition: NvInfer.h:3872
DataType getIndicesType() const noexcept
Return the NonZero layer indices type.
Definition: NvInfer.h:3896
bool setIndicesType(DataType type) noexcept
Set the indices type for the layer.
Definition: NvInfer.h:3884
virtual ~INonZeroLayer() noexcept=default
A normalization layer in a network definition.
Definition: NvInfer.h:6586
float getEpsilon() const noexcept
Get the epsilon value used for the normalization calculation.
Definition: NvInfer.h:6605
TRT_DEPRECATED void setComputePrecision(DataType type) noexcept
Set the compute precision of this layer.
Definition: NvInfer.h:6684
uint32_t getAxes() const noexcept
Get the axes value used for the normalization calculation.
Definition: NvInfer.h:6625
virtual ~INormalizationLayer() noexcept=default
void setEpsilon(float eps) noexcept
Set the epsilon value used for the normalization calculation.
Definition: NvInfer.h:6595
TRT_NODISCARD bool isV2() const noexcept
Returns true if this layer was created through addNormalizationV2().
Definition: NvInfer.h:6706
apiv::VNormalizationLayer * mImpl
Definition: NvInfer.h:6712
int64_t getNbGroups() const noexcept
Get the number of groups used to split the channels for the normalization calculation.
Definition: NvInfer.h:6656
void setAxes(uint32_t axesMask) noexcept
Set the reduction axes for the normalization calculation.
Definition: NvInfer.h:6615
void setNbGroups(int64_t nbGroups) noexcept
Set the number of groups used to split the channels in the normalization calculation.
Definition: NvInfer.h:6646
TRT_DEPRECATED DataType getComputePrecision() const noexcept
Get the compute precision of this layer.
Definition: NvInfer.h:6696
A OneHot layer in a network definition.
Definition: NvInfer.h:6208
virtual ~IOneHotLayer() noexcept=default
apiv::VOneHotLayer * mImpl
Definition: NvInfer.h:6229
void setAxis(int32_t axis) noexcept
Set the axis parameter.
Definition: NvInfer.h:6215
int32_t getAxis() const noexcept
Get the value of the axis parameter.
Definition: NvInfer.h:6223
Optimization profile for dynamic input dimensions and shape tensors.
Definition: NvInferRuntime.h:2675
Layer that represents a padding operation.
Definition: NvInfer.h:3069
Dims getPostPaddingNd() const noexcept
Get the padding that is applied at the end of the tensor.
Definition: NvInfer.h:3118
void setPrePaddingNd(Dims const &padding) noexcept
Set the padding that is applied at the start of the tensor.
Definition: NvInfer.h:3080
virtual ~IPaddingLayer() noexcept=default
void setPostPaddingNd(Dims const &padding) noexcept
Set the padding that is applied at the end of the tensor.
Definition: NvInfer.h:3106
Dims getPrePaddingNd() const noexcept
Get the padding that is applied at the start of the tensor.
Definition: NvInfer.h:3092
apiv::VPaddingLayer * mImpl
Definition: NvInfer.h:3124
Layer that represents a parametric ReLU operation.
Definition: NvInfer.h:4087
apiv::VParametricReLULayer * mImpl
Definition: NvInfer.h:4089
virtual ~IParametricReLULayer() noexcept=default
Single registration point for all plugins in an application. It is used to find plugin implementation...
Definition: NvInferRuntimeCommon.h:56
Plugin class for user-implemented layers.
Definition: NvInferRuntimePlugin.h:139
Layer type for pluginV2.
Definition: NvInfer.h:2773
virtual ~IPluginV2Layer() noexcept=default
apiv::VPluginV2Layer * mImpl
Definition: NvInfer.h:2786
IPluginV2 & getPlugin() noexcept
Get the plugin for the layer.
Definition: NvInfer.h:2780
Layer type for V3 plugins.
Definition: NvInfer.h:2800
virtual ~IPluginV3Layer() noexcept=default
IPluginV3 & getPlugin() noexcept
Get the plugin for the layer.
Definition: NvInfer.h:2807
apiv::VPluginV3Layer * mImpl
Definition: NvInfer.h:2813
A Pooling layer in a network definition.
Definition: NvInfer.h:1535
PoolingType getPoolingType() const noexcept
Get the type of pooling to be performed.
Definition: NvInfer.h:1554
PaddingMode getPaddingMode() const noexcept
Get the padding mode.
Definition: NvInfer.h:1687
Dims getPostPadding() const noexcept
Get the padding.
Definition: NvInfer.h:1663
bool getAverageCountExcludesPadding() const noexcept
Get whether average pooling uses as a denominator the overlap area between the window and the unpadde...
Definition: NvInfer.h:1607
Dims getPrePadding() const noexcept
Get the pre-padding.
Definition: NvInfer.h:1635
void setPoolingType(PoolingType type) noexcept
Set the type of pooling to be performed.
Definition: NvInfer.h:1544
void setWindowSizeNd(Dims const &windowSize) noexcept
Set the multi-dimension window size for pooling.
Definition: NvInfer.h:1700
void setPaddingMode(PaddingMode paddingMode) noexcept
Set the padding mode.
Definition: NvInfer.h:1676
Dims getWindowSizeNd() const noexcept
Get the multi-dimension window size for pooling.
Definition: NvInfer.h:1710
void setAverageCountExcludesPadding(bool exclusive) noexcept
Set whether average pooling uses as a denominator the overlap area between the window and the unpadde...
Definition: NvInfer.h:1596
void setPaddingNd(Dims const &padding) noexcept
Set the multi-dimension padding for pooling.
Definition: NvInfer.h:1754
float getBlendFactor() const noexcept
Get the blending factor for the max_average_blend mode: max_average_blendPool = (1-blendFactor)*maxPo...
Definition: NvInfer.h:1582
void setStrideNd(Dims const &stride) noexcept
Set the multi-dimension stride for pooling.
Definition: NvInfer.h:1725
Dims getStrideNd() const noexcept
Get the multi-dimension stride for pooling.
Definition: NvInfer.h:1735
virtual ~IPoolingLayer() noexcept=default
Dims getPaddingNd() const noexcept
Get the multi-dimension padding for pooling.
Definition: NvInfer.h:1766
void setPostPadding(Dims const &padding) noexcept
Set the multi-dimension post-padding for pooling.
Definition: NvInfer.h:1653
void setPrePadding(Dims const &padding) noexcept
Set the multi-dimension pre-padding for pooling.
Definition: NvInfer.h:1625
void setBlendFactor(float blendFactor) noexcept
Set the blending factor for the max_average_blend mode: max_average_blendPool = (1-blendFactor)*maxPo...
Definition: NvInfer.h:1569
A Quantize layer in a network definition.
Definition: NvInfer.h:5584
void setToType(DataType toType) noexcept
Set the Quantize layer output type.
Definition: NvInfer.h:5645
bool setBlockShape(Dims const &blockShape) noexcept
Set the shape of the quantization block.
Definition: NvInfer.h:5618
void setAxis(int32_t axis) noexcept
Set the quantization axis.
Definition: NvInfer.h:5605
TRT_NODISCARD Dims getBlockShape() const noexcept
Get the shape of the quantization block.
Definition: NvInfer.h:5629
int32_t getAxis() const noexcept
Get the quantization axis.
Definition: NvInfer.h:5594
virtual ~IQuantizeLayer() noexcept=default
DataType getToType() const noexcept
Return the Quantize layer output type.
Definition: NvInfer.h:5657
A RaggedSoftmax layer in a network definition.
Definition: NvInfer.h:3921
apiv::VRaggedSoftMaxLayer * mImpl
Definition: NvInfer.h:3923
virtual ~IRaggedSoftMaxLayer() noexcept=default
A recurrence layer in a network definition.
Definition: NvInfer.h:4793
virtual ~IRecurrenceLayer() noexcept=default
Layer that represents a reduction across a non-bool tensor.
Definition: NvInfer.h:2989
void setKeepDimensions(bool keepDimensions) noexcept
Set the boolean that specifies whether or not to keep the reduced dimensions for the layer.
Definition: NvInfer.h:3036
void setOperation(ReduceOperation op) noexcept
Set the reduce operation for the layer.
Definition: NvInfer.h:2996
ReduceOperation getOperation() const noexcept
Get the reduce operation for the layer.
Definition: NvInfer.h:3006
virtual ~IReduceLayer() noexcept=default
uint32_t getReduceAxes() const noexcept
Get the axes over which to reduce for the layer.
Definition: NvInfer.h:3026
void setReduceAxes(uint32_t reduceAxes) noexcept
Set the axes over which to reduce.
Definition: NvInfer.h:3016
apiv::VReduceLayer * mImpl
Definition: NvInfer.h:3052
bool getKeepDimensions() const noexcept
Get the boolean that specifies whether or not to keep the reduced dimensions for the layer.
Definition: NvInfer.h:3046
A resize layer in a network definition.
Definition: NvInfer.h:4276
void setSelectorForSinglePixel(ResizeSelector selector) noexcept
Set coordinate selector function when resized to single pixel.
Definition: NvInfer.h:4437
void setNearestRounding(ResizeRoundMode value) noexcept
Set rounding mode for nearest neighbor resize.
Definition: NvInfer.h:4461
virtual ~IResizeLayer() noexcept=default
int32_t getScales(int32_t size, float *scales) const noexcept
Copies resize scales to scales[0, ..., nbScales-1], where nbScales is the number of scales that were ...
Definition: NvInfer.h:4355
void setOutputDimensions(Dims const &dimensions) noexcept
Set the output dimensions.
Definition: NvInfer.h:4296
void setCubicCoeff(float A) noexcept
Set the coefficient 'A' used in cubic interpolation.
Definition: NvInfer.h:4493
void setScales(float const *scales, int32_t nbScales) noexcept
Set the resize scales.
Definition: NvInfer.h:4336
float getCubicCoeff() const noexcept
Get the coefficient 'A' used in cubic interpolation.
Definition: NvInfer.h:4503
ResizeSelector getSelectorForSinglePixel() const noexcept
Get the coordinate selector function when resized to single pixel.
Definition: NvInfer.h:4447
InterpolationMode getResizeMode() const noexcept
Get resize mode for an input tensor.
Definition: NvInfer.h:4377
void setCoordinateTransformation(ResizeCoordinateTransformation coordTransform) noexcept
Set coordinate transformation function.
Definition: NvInfer.h:4412
void setExcludeOutside(bool excludeFlag) noexcept
Set the state for excluding outside pixels.
Definition: NvInfer.h:4516
void setResizeMode(InterpolationMode interpolationMode) noexcept
Set resize mode for an input tensor.
Definition: NvInfer.h:4367
Dims getOutputDimensions() const noexcept
Get the output dimensions.
Definition: NvInfer.h:4306
ResizeRoundMode getNearestRounding() const noexcept
Get rounding mode for nearest neighbor resize.
Definition: NvInfer.h:4471
bool getExcludeOutside() const noexcept
Get the state for excluding outside pixels.
Definition: NvInfer.h:4526
ResizeCoordinateTransformation getCoordinateTransformation() const noexcept
Get coordinate transformation function.
Definition: NvInfer.h:4422
A ReverseSequence layer in a network definition.
Definition: NvInfer.h:6514
void setSequenceAxis(int32_t sequenceAxis) noexcept
Set the sequence axis. Default is 0.
Definition: NvInfer.h:6547
int32_t getBatchAxis() const noexcept
Return the batch axis. Return 1 if no batch axis was set.
Definition: NvInfer.h:6534
apiv::VReverseSequenceLayer * mImpl
Definition: NvInfer.h:6563
int32_t getSequenceAxis() const noexcept
Return the sequence axis. Return 0 if no sequence axis was set.
Definition: NvInfer.h:6557
void setBatchAxis(int32_t batchAxis) noexcept
Set the batch axis. Default is 1.
Definition: NvInfer.h:6524
virtual ~IReverseSequenceLayer() noexcept=default
Layer that implements Rotary Position Embedding (RoPE) (https://arxiv.org/abs/2104....
Definition: NvInfer.h:7393
TRT_NODISCARD int32_t getRotaryEmbeddingDim() const noexcept
Get the number of hidden dimensions participating in RoPE. The default value is 0,...
Definition: NvInfer.h:7433
virtual ~IRotaryEmbeddingLayer() noexcept=default
void setInterleaved(bool interleaved) noexcept
Set whether the input is in interleaved format, i.e., whether the 2-d vectors rotated are taken from ...
Definition: NvInfer.h:7400
TRT_NODISCARD bool setRotaryEmbeddingDim(int32_t rotaryEmbeddingDim) noexcept
Set the number of hidden dimensions participating in RoPE. The default value is 0,...
Definition: NvInfer.h:7422
apiv::VRotaryEmbeddingLayer * mImpl
Definition: NvInfer.h:7456
TRT_NODISCARD bool getInterleaved() const noexcept
Get whether the input is in interleaved format. The default value is false.
Definition: NvInfer.h:7411
A Scale layer in a network definition.
Definition: NvInfer.h:1932
Weights getScale() const noexcept
Get the scale value.
Definition: NvInfer.h:1989
Weights getPower() const noexcept
Get the power value.
Definition: NvInfer.h:2009
void setScale(Weights scale) noexcept
Set the scale value.
Definition: NvInfer.h:1979
void setPower(Weights power) noexcept
Set the power value.
Definition: NvInfer.h:1999
ScaleMode getMode() const noexcept
Get the scale mode.
Definition: NvInfer.h:1949
void setShift(Weights shift) noexcept
Set the shift value.
Definition: NvInfer.h:1959
void setChannelAxis(int32_t channelAxis) noexcept
Set the channel axis.
Definition: NvInfer.h:2045
Weights getShift() const noexcept
Get the shift value.
Definition: NvInfer.h:1969
virtual ~IScaleLayer() noexcept=default
void setMode(ScaleMode mode) noexcept
Set the scale mode.
Definition: NvInfer.h:1939
int32_t getChannelAxis() const noexcept
Get the channel axis.
Definition: NvInfer.h:2024
A scatter layer in a network definition. Supports several kinds of scattering.
Definition: NvInfer.h:6136
void setMode(ScatterMode mode) noexcept
Set the scatter mode.
Definition: NvInfer.h:6143
apiv::VScatterLayer * mImpl
Definition: NvInfer.h:6177
void setAxis(int32_t axis) noexcept
Set the axis used by ScatterMode::kELEMENTS.
Definition: NvInfer.h:6163
int32_t getAxis() const noexcept
Get the axis.
Definition: NvInfer.h:6171
ScatterMode getMode() const noexcept
Get the scatter mode.
Definition: NvInfer.h:6153
virtual ~IScatterLayer() noexcept=default
Select elements from two data tensors based on a condition tensor.
Definition: NvInfer.h:5101
virtual ~ISelectLayer() noexcept=default
Layer type for getting shape of a tensor.
Definition: NvInfer.h:3594
virtual ~IShapeLayer() noexcept=default
apiv::VShapeLayer * mImpl
Definition: NvInfer.h:3596
Layer type for shuffling data.
Definition: NvInfer.h:3157
apiv::VShuffleLayer * mImpl
Definition: NvInfer.h:3315
void setFirstTranspose(Permutation permutation) noexcept
Set the permutation applied by the first transpose operation.
Definition: NvInfer.h:3168
void setSecondTranspose(Permutation permutation) noexcept
Set the permutation applied by the second transpose operation.
Definition: NvInfer.h:3268
Dims getReshapeDimensions() const noexcept
Get the reshaped dimensions.
Definition: NvInfer.h:3221
void setReshapeDimensions(Dims const &dimensions) noexcept
Set the reshaped dimensions.
Definition: NvInfer.h:3208
Permutation getFirstTranspose() const noexcept
Get the permutation applied by the first transpose operation.
Definition: NvInfer.h:3180
virtual ~IShuffleLayer() noexcept=default
Permutation getSecondTranspose() const noexcept
Get the permutation applied by the second transpose operation.
Definition: NvInfer.h:3280
bool getZeroIsPlaceholder() const noexcept
Get meaning of 0 in reshape dimensions.
Definition: NvInfer.h:3309
void setZeroIsPlaceholder(bool zeroIsPlaceholder) noexcept
Set meaning of 0 in reshape dimensions.
Definition: NvInfer.h:3296
Slices an input tensor into an output tensor based on the offset and strides.
Definition: NvInfer.h:3409
void setStride(Dims const &stride) noexcept
Set the stride for computing the output slice data.
Definition: NvInfer.h:3478
apiv::VSliceLayer * mImpl
Definition: NvInfer.h:3577
virtual ~ISliceLayer() noexcept=default
void setSize(Dims const &size) noexcept
Set the dimensions of the output slice.
Definition: NvInfer.h:3449
void setAxes(Dims const &axes) noexcept
Set the axes for this ISliceLayer.
Definition: NvInfer.h:3556
void setStart(Dims const &start) noexcept
Set the start offset that the slice layer uses to create the output slice.
Definition: NvInfer.h:3420
Dims getStart() const noexcept
Get the start offset for the slice layer.
Definition: NvInfer.h:3435
void setMode(SampleMode mode) noexcept
Set the slice mode.
Definition: NvInfer.h:3503
Dims getSize() const noexcept
Get dimensions of the output slice.
Definition: NvInfer.h:3464
SampleMode getMode() const noexcept
Get the slice mode.
Definition: NvInfer.h:3513
Dims getStride() const noexcept
Get the stride for the output slice.
Definition: NvInfer.h:3493
Dims getAxes() const noexcept
Get the axes for this ISliceLayer.
Definition: NvInfer.h:3571
A Softmax layer in a network definition.
Definition: NvInfer.h:2076
void setAxes(uint32_t axes) noexcept
Set the axis along which softmax is computed. Currently, only one axis can be set.
Definition: NvInfer.h:2098
uint32_t getAxes() const noexcept
Get the axis along which softmax occurs.
Definition: NvInfer.h:2108
virtual ~ISoftMaxLayer() noexcept=default
Layer that represents a squeeze operation, removing unit dimensions of the first input tensor on a se...
Definition: NvInfer.h:6726
virtual ~ISqueezeLayer() noexcept=default
apiv::VSqueezeLayer * mImpl
Definition: NvInfer.h:6743
A tensor in a network definition.
Definition: NvInfer.h:189
void setAllowedFormats(TensorFormats formats) noexcept
Set allowed formats for an input or output tensor. By default all formats are allowed....
Definition: NvInfer.h:459
TensorLocation getLocation() const noexcept
Get the storage location of a tensor.
Definition: NvInfer.h:378
void setDimensions(Dims const &dimensions) noexcept
Set the dimensions of a tensor.
Definition: NvInfer.h:237
void resetDynamicRange() noexcept
Undo effect of setDynamicRange.
Definition: NvInfer.h:417
void setName(char const *name) noexcept
Set the tensor name.
Definition: NvInfer.h:206
bool isExecutionTensor() const noexcept
Whether the tensor is an execution tensor.
Definition: NvInfer.h:524
TRT_DEPRECATED bool dynamicRangeIsSet() const noexcept
Query whether dynamic range is set.
Definition: NvInfer.h:409
char const * getName() const noexcept
Get the tensor name.
Definition: NvInfer.h:218
bool isShapeTensor() const noexcept
Whether the tensor is a shape tensor.
Definition: NvInfer.h:503
float getDynamicRangeMax() const noexcept
Get maximum of dynamic range.
Definition: NvInfer.h:437
bool isNetworkInput() const noexcept
Whether the tensor is a network input.
Definition: NvInfer.h:327
TRT_DEPRECATED void setBroadcastAcrossBatch(bool broadcastAcrossBatch) noexcept
Set whether to enable broadcast of tensor across the implicit batch dimension.
Definition: NvInfer.h:352
TRT_DEPRECATED bool setDynamicRange(float min, float max) noexcept
Set dynamic range for the tensor.
Definition: NvInfer.h:319
TRT_DEPRECATED void setType(DataType type) noexcept
Set the data type of a tensor.
Definition: NvInfer.h:287
TRT_DEPRECATED bool getBroadcastAcrossBatch() const noexcept
Check if tensor is broadcast across the implicit batch dimension.
Definition: NvInfer.h:366
bool isNetworkOutput() const noexcept
Whether the tensor is a network output.
Definition: NvInfer.h:335
DataType getType() const noexcept
Get the data type of a tensor.
Definition: NvInfer.h:302
apiv::VTensor * mImpl
Definition: NvInfer.h:571
float getDynamicRangeMin() const noexcept
Get minimum of dynamic range.
Definition: NvInfer.h:427
virtual ~ITensor() noexcept=default
void setDimensionName(int32_t index, char const *name) noexcept
Name a dimension of an input tensor.
Definition: NvInfer.h:550
char const * getDimensionName(int32_t index) const noexcept
Get the name of an input dimension.
Definition: NvInfer.h:565
TRT_DEPRECATED void setLocation(TensorLocation location) noexcept
Set the storage location of a tensor.
Definition: NvInfer.h:397
Dims getDimensions() const noexcept
Get the dimensions of a tensor.
Definition: NvInfer.h:251
TensorFormats getAllowedFormats() const noexcept
Get a bitmask of TensorFormat values that the tensor supports. For a shape tensor,...
Definition: NvInfer.h:472
Class to handle tactic timing info collected from builder.
Definition: NvInfer.h:10719
int64_t queryKeys(TimingCacheKey *keyBuffer, int64_t capacity) const noexcept
Query cache keys from Timing Cache.
Definition: NvInfer.h:10785
bool combine(ITimingCache const &inputCache, bool ignoreMismatch) noexcept
Combine input timing cache into local instance.
Definition: NvInfer.h:10756
TimingCacheValue query(TimingCacheKey const &key) const noexcept
Query value in a cache entry.
Definition: NvInfer.h:10802
virtual ~ITimingCache() noexcept=default
bool update(TimingCacheKey const &key, TimingCacheValue const &value) noexcept
Update values in a cache entry.
Definition: NvInfer.h:10824
apiv::VTimingCache * mImpl
Definition: NvInfer.h:10830
bool reset() noexcept
Empty the timing cache.
Definition: NvInfer.h:10766
Layer that represents a TopK reduction.
Definition: NvInfer.h:3634
void setK(int32_t k) noexcept
Set the static k value for the layer.
Definition: NvInfer.h:3665
void setReduceAxes(uint32_t reduceAxes) noexcept
Set which axes to reduce for the layer.
Definition: NvInfer.h:3689
TopKOperation getOperation() const noexcept
Get the operation for the layer.
Definition: NvInfer.h:3651
apiv::VTopKLayer * mImpl
Definition: NvInfer.h:3748
void setOperation(TopKOperation op) noexcept
Set the operation for the layer.
Definition: NvInfer.h:3641
bool setIndicesType(DataType type) noexcept
Set the indices type for the layer.
Definition: NvInfer.h:3730
int32_t getK() const noexcept
Get the k value for the layer.
Definition: NvInfer.h:3679
uint32_t getReduceAxes() const noexcept
Get the axes to reduce for the layer.
Definition: NvInfer.h:3699
virtual ~ITopKLayer() noexcept=default
DataType getIndicesType() const noexcept
Return the TopK layer indices type.
Definition: NvInfer.h:3742
A layer that represents a trip-count limiter.
Definition: NvInfer.h:4914
TripLimit getTripLimit() const noexcept
Get a trip limiter type.
Definition: NvInfer.h:4919
virtual ~ITripLimitLayer() noexcept=default
Layer that represents an unary operation.
Definition: NvInfer.h:2881
void setOperation(UnaryOperation op) noexcept
Set the unary operation for the layer.
Definition: NvInfer.h:2890
apiv::VUnaryLayer * mImpl
Definition: NvInfer.h:2906
UnaryOperation getOperation() const noexcept
Get the unary operation for the layer.
Definition: NvInfer.h:2900
virtual ~IUnaryLayer() noexcept=default
Layer that represents an unsqueeze operation, which reshapes the first input tensor by inserting unit...
Definition: NvInfer.h:6756
virtual ~IUnsqueezeLayer() noexcept=default
apiv::VUnsqueezeLayer * mImpl
Definition: NvInfer.h:6774
An Interface class for version control.
Definition: NvInferRuntimeBase.h:279
Version information associated with a TRT interface.
Definition: NvInferRuntimeBase.h:244
An array of weights used as a layer parameter.
Definition: NvInferRuntime.h:124
Definition: NvInfer.h:10310
virtual int32_t selectAlgorithms(IAlgorithmContext const &context, IAlgorithm const *const *choices, int32_t nbChoices, int32_t *selection) noexcept=0
Select Algorithms for a layer from the given list of algorithm choices.
virtual void reportAlgorithms(IAlgorithmContext const *const *algoContexts, IAlgorithm const *const *algoChoices, int32_t nbAlgorithms) noexcept=0
Called by TensorRT to report choices it made.
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInfer.h:10315
virtual ~IAlgorithmSelector() noexcept=default
Definition: NvInferRuntimeBase.h:416
Definition: NvInferRuntime.h:1656
~IInt8EntropyCalibrator2() noexcept override=default
CalibrationAlgoType getAlgorithm() noexcept override
Definition: NvInfer.h:9950
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInfer.h:9942
Definition: NvInfer.h:9897
CalibrationAlgoType getAlgorithm() noexcept override
Definition: NvInfer.h:9910
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInfer.h:9902
~IInt8EntropyCalibrator() noexcept override=default
Definition: NvInfer.h:10016
CalibrationAlgoType getAlgorithm() noexcept override
Definition: NvInfer.h:10029
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInfer.h:10021
virtual double getQuantile() const noexcept=0
The quantile (between 0 and 1) that will be used to select the region maximum when the quantile metho...
Definition: NvInfer.h:9977
~IInt8MinMaxCalibrator() noexcept override=default
CalibrationAlgoType getAlgorithm() noexcept override
Definition: NvInfer.h:9990
InterfaceInfo getInterfaceInfo() const noexcept override
Return version information associated with this interface. Applications must not override this method...
Definition: NvInfer.h:9982
Definition: NvInferPluginBase.h:206
Definition: NvInfer.h:11055
virtual bool stepComplete(char const *phaseName, int32_t step) noexcept=0
Signal that a step of an optimizer phase has finished.
virtual ~IProgressMonitor() noexcept=default
virtual void phaseFinish(char const *phaseName) noexcept=0
Signal that a phase of the optimizer has finished.
virtual void phaseStart(char const *phaseName, char const *parentPhase, int32_t nbSteps) noexcept=0
Signal that a phase of the optimizer has started.
Definition: NvInferRuntime.h:666
IBuilder * createInferBuilder(ILogger &logger) noexcept
Create an instance of an IBuilder class.
Definition: NvInfer.h:12509
The TensorRT API version 1 namespace.
Definition: NvInferSafePlugin.h:33
uint32_t TacticSources
Represents a collection of one or more TacticSource values combined using bitwise-OR operations.
Definition: NvInferRuntime.h:2961
ResizeSelector
The coordinate selector when resizing to a single-pixel output.
Definition: NvInfer.h:4181
@ kFORMULA
Use formula to map the original index.
@ kUPPER
Select the upper left pixel.
EngineCapability
List of supported engine capability flows.
Definition: NvInferRuntime.h:76
MemoryPoolType
The type for memory pools used by TensorRT.
Definition: NvInfer.h:10841
TENSORRTAPI bool setInternalLibraryPath(AsciiChar const *path) noexcept
Set a custom directory path for loading internal TensorRT libraries when building engines.
ScaleMode
Controls how shift, scale and power are applied in a Scale layer.
Definition: NvInfer.h:1889
@ kUNIFORM
Identical coefficients across all elements of the tensor.
@ kCHANNEL
Per-channel coefficients.
RuntimePlatform
Describes the intended runtime platform (operating system and CPU architecture) for the execution of ...
Definition: NvInfer.h:10421
uint32_t QuantizationFlags
Represents one or more QuantizationFlag values using binary OR operations.
Definition: NvInfer.h:10373
HardwareCompatibilityLevel
Describes requirements of compatibility with GPU architectures other than that of the GPU on which th...
Definition: NvInfer.h:10969
CumulativeOperation
Enumerates the cumulative operations that may be performed by a Cumulative layer.
Definition: NvInfer.h:6790
BoundingBoxFormat
Representation of bounding box data used for the Boxes input tensor in INMSLayer.
Definition: NvInfer.h:6328
@ kCENTER_SIZES
(x_center, y_center, width, height) where (x_center, y_center) is the center point of the box
@ kCORNER_PAIRS
(x1, y1, x2, y2) where (x1, y1) and (x2, y2) are any pair of diagonal corners
constexpr int32_t EnumMax< BuilderFlag >() noexcept
Definition: NvInfer.h:10659
constexpr int32_t EnumMax< LayerType >() noexcept
Definition: NvInfer.h:124
@ kFP4
FP4 field type.
@ kINT8
INT8 field type.
@ kFP8
FP8 field type.
@ kBF16
BF16 field type.
@ kINT4
INT4 field type.
constexpr int32_t EnumMax< CalibrationAlgoType >() noexcept
Definition: NvInfer.h:9812
UnaryOperation
Enumerates the unary operations that may be performed by a Unary layer.
Definition: NvInfer.h:2834
@ kISINF
Return true if input value equals +/- infinity for floating-point data type.
@ kCOSH
Hyperbolic cosine.
@ kACOSH
Inverse hyperbolic cosine.
@ kERF
Gauss error function.
@ kISNAN
Return true if input value is a NaN for floating-point data type.
@ kACOS
Inverse cosine.
@ kABS
Absolute value.
@ kSINH
Hyperbolic sine.
@ kROUND
Round to nearest even for floating-point data type.
@ kATANH
Inverse hyperbolic tangent.
@ kASINH
Inverse hyperbolic sine.
@ kSIGN
Sign: if input > 0, output 1; if input < 0, output -1; if input == 0, output 0.
@ kEXP
Exponentiation.
@ kATAN
Inverse tangent.
constexpr int32_t EnumMax< ReduceOperation >() noexcept
Definition: NvInfer.h:2949
constexpr int32_t EnumMax< TripLimit >() noexcept
Definition: NvInfer.h:4582
ActivationType
Enumerates the types of activation to perform in an activation layer.
Definition: NvInfer.h:143
@ kSELU
Selu activation: x>0 ? beta * x : beta * (alpha*exp(x) - alpha)
@ kTANH
TanH activation.
@ kSCALED_TANH
Scaled tanh activation: alpha*tanh(beta*x)
@ kRELU
Rectified linear activation.
@ kELU
Elu activation: x>=0 ? x : alpha * (exp(x) - 1).
@ kLEAKY_RELU
LeakyRelu activation: x>=0 ? x : alpha * x.
@ kSOFTSIGN
Softsign activation: x / (1+|x|)
@ kHARD_SIGMOID
Hard sigmoid activation: max(0, min(1, alpha*x+beta))
@ kTHRESHOLDED_RELU
Thresholded ReLU activation: x>alpha ? x : 0.
@ kSIGMOID
Sigmoid activation.
@ kCLIP
Clip activation: max(alpha, min(beta, x))
@ kGELU_TANH
GELU tanh activation: 0.5 * x * (1 + tanh(sqrt(2/pi) * (0.044715F * pow(x, 3) + x)))
@ kGELU_ERF
GELU erf activation: 0.5 * x * (1 + erf(sqrt(0.5) * x))
@ kSOFTPLUS
Parametric softplus activation: alpha*log(exp(beta*x)+1)
FillOperation
Enumerates the tensor fill operations that may be performed by a fill layer.
Definition: NvInfer.h:5162
ResizeRoundMode
The rounding mode for nearest neighbor resize.
Definition: NvInfer.h:4211
@ kHALF_UP
Round half up.
@ kHALF_DOWN
Round half down.
char_t AsciiChar
Definition: NvInferRuntimeBase.h:116
PaddingMode
Enumerates the modes of padding to perform in convolution, deconvolution and pooling layer,...
Definition: NvInfer.h:1067
@ kSAME_LOWER
Use SAME padding, with prePadding >= postPadding.
@ kEXPLICIT_ROUND_DOWN
Use explicit padding, rounding output size down.
@ kEXPLICIT_ROUND_UP
Use explicit padding, rounding output size up.
@ kSAME_UPPER
Use SAME padding, with prePadding <= postPadding.
TripLimit
Enum that describes kinds of trip limits.
Definition: NvInfer.h:4570
@ kWHILE
Tensor is a scalar of type kBOOL. Loop terminates when value is false.
@ kCOUNT
Tensor is a scalar of type kINT32 or kINT64 that contains the trip count.
uint32_t NetworkDefinitionCreationFlags
Represents one or more NetworkDefinitionCreationFlag flags using binary OR operations....
Definition: NvInfer.h:12103
PreviewFeature
Define preview features.
Definition: NvInfer.h:10916
TilingOptimizationLevel
Define the optimization levels for Tiling.
Definition: NvInfer.h:11022
@ kFAST
Use a fast algorithm and heuristic based strategy. Slightly increases engine build time.
@ kFULL
Increase search space even wider. Significantly increases engine build time.
constexpr int32_t EnumMax< GatherMode >() noexcept
Definition: NvInfer.h:2593
DataType
The type of weights and tensors. The datatypes other than kBOOL, kINT32, and kINT64 are "activation d...
Definition: NvInferRuntimeBase.h:146
uint32_t BuilderFlags
Represents one or more BuilderFlag values using binary OR operations, e.g., 1U << BuilderFlag::kFP16 ...
Definition: NvInfer.h:10453
DeviceType
The device that this layer/network will execute on.
Definition: NvInferRuntime.h:1350
constexpr int32_t EnumMax< ScaleMode >() noexcept
Definition: NvInfer.h:1901
CalibrationAlgoType
Version of calibration algorithm to use.
Definition: NvInfer.h:9799
@ kENTROPY_CALIBRATION_2
Entropy calibration.
@ kLEGACY_CALIBRATION
Legacy calibration.
@ kENTROPY_CALIBRATION
Legacy entropy calibration.
@ kMINMAX_CALIBRATION
Minmax calibration.
LayerType
The type values of layer classes.
Definition: NvInfer.h:58
@ kGRID_SAMPLE
Grid sample layer.
@ kRAGGED_SOFTMAX
Ragged softmax layer.
@ kDECONVOLUTION
Deconvolution layer.
@ kREDUCE
Reduce layer.
@ kASSERTION
Assertion layer.
@ kTOPK
TopK layer.
@ kRESIZE
Resize Layer.
@ kCAST
Cast layer.
@ kPADDING
Padding layer.
@ kSQUEEZE
Squeeze Layer.
@ kATTENTION_INPUT
Attention Input.
@ kMATRIX_MULTIPLY
Matrix multiply layer.
@ kCONDITION
Condition layer.
@ kCUMULATIVE
Cumulative layer.
@ kCONDITIONAL_INPUT
Conditional Input layer.
@ kIDENTITY
Identity layer.
@ kNORMALIZATION
Normalization layer.
@ kQUANTIZE
Quantize layer.
@ kSCATTER
Scatter layer.
@ kCONVOLUTION
Convolution layer.
@ kPARAMETRIC_RELU
Parametric ReLU layer.
@ kATTENTION_OUTPUT
Attention Output.
@ kUNSQUEEZE
Unsqueeze Layer.
@ kCONCATENATION
Concatenation layer.
@ kONE_HOT
OneHot layer.
@ kREVERSE_SEQUENCE
Reverse sequence layer.
@ kSLICE
Slice layer.
@ kEINSUM
Einsum layer.
@ kSOFTMAX
SoftMax layer.
@ kSHAPE
Shape layer.
@ kROTARY_EMBEDDING
Rotary Embedding layer.
@ kRECURRENCE
Loop Recurrence layer.
@ kDEQUANTIZE
Dequantize layer.
@ kSHUFFLE
Shuffle layer.
@ kPLUGIN_V3
PluginV3 layer.
@ kITERATOR
Loop Iterator layer.
@ kPOOLING
Pooling layer.
@ kTRIP_LIMIT
Loop Trip limit layer.
@ kSCALE
Scale layer.
@ kDYNAMIC_QUANTIZE
Dynamic Quantize layer.
@ kGATHER
Gather layer.
@ kUNARY
UnaryOp operation Layer.
@ kACTIVATION
Activation layer.
@ kELEMENTWISE
Elementwise layer.
@ kSELECT
Select layer.
@ kPLUGIN_V2
PluginV2 layer.
@ kLOOP_OUTPUT
Loop output layer.
@ kCONDITIONAL_OUTPUT
Conditional Output layer.
@ kCONSTANT
Constant layer.
@ kNON_ZERO
NonZero layer.
@ kFILL
Fill layer.
@ kKVCACHE_UPDATE
KV Cache Update layer.
@ kPLUGIN
Plugin layer.
@ kDIST_COLLECTIVE
DistCollective layer.
constexpr int32_t EnumMax< QuantizationFlag >() noexcept
Definition: NvInfer.h:10398
SampleMode
Controls how ISliceLayer and IGridSample handle out-of-bounds coordinates.
Definition: NvInfer.h:3325
@ kCLAMP
Out of bounds indices are clamped to bounds.
@ kSTRICT_BOUNDS
Fail with error when the coordinates are out of bounds.
@ kWRAP
Coordinates wrap around periodically.
GatherMode
Control form of IGatherLayer.
Definition: NvInfer.h:2581
@ kDEFAULT
Similar to ONNX Gather.
@ kELEMENT
Similar to ONNX GatherElements.
@ kND
Similar to ONNX GatherND.
MoEActType
Enumerates the activation type for the MoE layer.
Definition: NvInfer.h:7554
uint32_t TensorFormats
It is capable of representing one or more TensorFormat by binary OR operations, e....
Definition: NvInfer.h:135
ProfilingVerbosity
List of verbosity levels of layer information exposed in NVTX annotations and in IEngineInspector.
Definition: NvInferRuntime.h:2973
NetworkDefinitionCreationFlag
List of immutable network properties expressed at network creation time. NetworkDefinitionCreationFla...
Definition: NvInfer.h:12114
ElementWiseOperation
Enumerates the binary operations that may be performed by an ElementWise layer.
Definition: NvInfer.h:2491
@ kSUB
Subtract the second element from the first.
@ kSUM
Sum of the two elements.
@ kPROD
Product of the two elements.
@ kFLOOR_DIV
Floor division of the first element by the second.
@ kEQUAL
Check if two elements are equal.
@ kAND
Logical AND of two elements.
@ kOR
Logical OR of two elements.
@ kMIN
Minimum of the two elements.
@ kPOW
The first element to the power of the second element.
@ kLESS
Check if element in first tensor is less than corresponding element in second tensor.
@ kGREATER
Check if element in first tensor is greater than corresponding element in second tensor.
@ kXOR
Logical XOR of two elements.
@ kDIV
Divide the first element by the second.
QuantizationFlag
List of valid flags for quantizing the network to int8.
Definition: NvInfer.h:10385
CollectiveOperation
Enumerates the collective operations that may be performed by a DistCollective layer.
Definition: NvInfer.h:2962
@ kREDUCE_SCATTER
Reduce scatter.
constexpr int32_t EnumMax< SampleMode >() noexcept
Definition: NvInfer.h:3341
InterpolationMode
Enumerates various modes of interpolation.
Definition: NvInfer.h:4099
@ kNEAREST
ND (0 < N <= 8) nearest neighbor resizing.
@ kCUBIC
Supports bicubic (2D) interpolation.
@ kLINEAR
Supports linear (1D), bilinear (2D), and trilinear (3D) interpolation.
BuilderFlag
List of valid modes that the builder can enable when creating an engine from a network definition.
Definition: NvInfer.h:10463
@ kWEIGHT_STREAMING
Enable weight streaming for the current engine.
@ kGPU_FALLBACK
Enable layers marked to execute on GPU if layer cannot execute on DLA.
@ kSPARSE_WEIGHTS
Allow the builder to examine weights and use optimized functions when weights have suitable sparsity.
@ kEDITABLE_TIMING_CACHE
Enable editable timing cache.
@ kSTRIP_PLAN
Strip the refittable weights from the engine plan file.
@ kMONITOR_MEMORY
Enable memory monitor during build time.
@ kDISABLE_TIMING_CACHE
Disable reuse of timing information across identical layers.
@ kREFIT
Enable building a refittable engine.
constexpr int32_t EnumMax< TopKOperation >() noexcept
Definition: NvInfer.h:3617
TENSORRTAPI nvinfer1::IPluginRegistry * getBuilderPluginRegistry(nvinfer1::EngineCapability capability) noexcept
Return the plugin registry for building a Standard engine, or nullptr if no registry exists.
constexpr int32_t EnumMax< MemoryPoolType >() noexcept
Definition: NvInfer.h:10902
TopKOperation
Enumerates the operations that may be performed by a TopK layer.
Definition: NvInfer.h:3606
ReduceOperation
Enumerates the reduce operations that may be performed by a Reduce layer.
Definition: NvInfer.h:2934
@ kAVG
Average of the elements.
constexpr int32_t EnumMax< LoopOutput >() noexcept
Definition: NvInfer.h:4559
constexpr int32_t EnumMax< NetworkDefinitionCreationFlag >() noexcept
Definition: NvInfer.h:12142
TRT_DEPRECATED_API nvinfer1::safe::IPluginRegistry * getBuilderSafePluginRegistry(nvinfer1::EngineCapability capability) noexcept
Return the plugin registry for building a Safety engine, or nullptr if no registry exists.
ScatterMode
Control form of IScatterLayer.
Definition: NvInfer.h:6062
MatrixOperation
Enumerates the operations that may be performed on a tensor by IMatrixMultiplyLayer before multiplica...
Definition: NvInfer.h:3759
@ kTRANSPOSE
Like kNONE, but transpose the matrix dimensions.
ResizeCoordinateTransformation
The resize coordinate transformation function.
Definition: NvInfer.h:4127
constexpr int32_t EnumMax< UnaryOperation >() noexcept
Definition: NvInfer.h:2868
LoopOutput
Enum that describes kinds of loop outputs.
Definition: NvInfer.h:4542
@ kLAST_VALUE
Output value is value of tensor for last iteration.
@ kCONCATENATE
Output value is concatenation of values of tensor for each iteration, in forward order.
@ kREVERSE
Output value is concatenation of values of tensor for each iteration, in reverse order.
constexpr int32_t EnumMax< BoundingBoxFormat >() noexcept
Definition: NvInfer.h:6341
constexpr int32_t EnumMax< MatrixOperation >() noexcept
Definition: NvInfer.h:3787
KVCacheMode
Enumerates the KVCache modes that may be performed by a KVCacheUpdate layer.
Definition: NvInfer.h:7466
PoolingType
The type of pooling to perform in a pooling layer.
Definition: NvInfer.h:1503
@ kAVERAGE
Average over elements. If the tensor is padded, the count includes the padding.
@ kMAX
Maximum over elements.
@ kMAX_AVERAGE_BLEND
Blending between max and average pooling: (1-blendFactor)*maxPool + blendFactor*avgPool.
v_1_0::IProgressMonitor IProgressMonitor
Definition: NvInfer.h:11138
constexpr int32_t EnumMax< FillOperation >() noexcept
Definition: NvInfer.h:5196
TensorLocation
The location for tensor data storage, device or host.
Definition: NvInferRuntime.h:204
OptProfileSelector
When setting or querying optimization profile parameters (such as shape tensor inputs or dynamic dime...
Definition: NvInferRuntime.h:2635
AttentionNormalizationOp
Enumerates the operations that may be performed by the normalization in the attention subgraph.
Definition: NvInfer.h:6925
constexpr int32_t EnumMax< ScatterMode >() noexcept
Definition: NvInfer.h:6073
Represents a permutation of dimensions.
Definition: NvInfer.h:3134
Declaration of EnumMaxImpl struct to store maximum number of elements in an enumeration type.
Definition: NvInferRuntimeBase.h:129
The key to retrieve timing cache entries.
Definition: NvInfer.h:10683
Definition: NvInfer.h:10695
uint64_t tacticHash
Hash of the selected tactic.
Definition: NvInfer.h:10697
float timingMSec
Timing of this tactic in milliseconds. Negative numbers and NaN are invalid values.
Definition: NvInfer.h:10699

  Copyright © 2024 NVIDIA Corporation
  Privacy Policy | Manage My Privacy | Do Not Sell or Share My Data | Terms of Service | Accessibility | Corporate Policies | Product Security | Contact