nsight-dl-designer/NvNeuralSDK/_base_prototype_layer_8h_source.html

 /*

 * SPDX-FileCopyrightText: Copyright (c) 2020-2021 NVIDIA CORPORATION & AFFILIATES. All rights reserved.

 * SPDX-License-Identifier: MIT

 *

 * Permission is hereby granted, free of charge, to any person obtaining a

 * copy of this software and associated documentation files (the "Software"),

 * to deal in the Software without restriction, including without limitation

 * the rights to use, copy, modify, merge, publish, distribute, sublicense,

 * and/or sell copies of the Software, and to permit persons to whom the

 * Software is furnished to do so, subject to the following conditions:

 *

 * The above copyright notice and this permission notice shall be included in

 * all copies or substantial portions of the Software.

 *

 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR

 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,

 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL

 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER

 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING

 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER

 * DEALINGS IN THE SOFTWARE.

 */


 #ifndef NVNEURAL_BASEPROTOTYPELAYER_H

 #define NVNEURAL_BASEPROTOTYPELAYER_H


 #include <nvneural/CodeGenTypes.h>

 #include <nvneural/CoreTypes.h>

 #include <nvneural/LayerTypes.h>

 #include <nvneural/RefObject.h>

 #include <nvneural/layers/IPrototypeLayer.h>

 #include "ScriptEngine.h"

 #include <Pugixml/pugixml.hpp>


 #include <map>

 #include <string>

 #include <vector>


 namespace nvneural {


 /// Base class for the CUDA prototype layers shipped with NvNeural.
 ///
 /// Exposes the ILayer, IPrototypeLayer, and ICppCodeGenerationLayer interfaces
 /// through refobj::RefObjectBase. It also derives from
 /// detail::ScriptInterpretInterface<detail::AnyOperand>; no access specifier is
 /// given for that base, so the inheritance is private. Concrete layers derive
 /// from this class and supply implementationReshape() and implementationForward().
 class BasePrototypeLayer

     : public refobj::RefObjectBase<

                   refobj::Implements<ILayer>

                 , refobj::Implements<IPrototypeLayer>

                 , refobj::Implements<ICppCodeGenerationLayer>>

            , detail::ScriptInterpretInterface<detail::AnyOperand>

 {

 public:

     /// Virtual destructor; defined out of line.
     virtual ~BasePrototypeLayer();


     /// Retrieves the layer type.
     const char* serializedType() const noexcept override;


     /// Sets the layer name.
     NeuralResult setName(const char* pName) noexcept override;

     /// Retrieves the layer name.
     const char* name() const noexcept override;


     /// Informs the layer it has been attached to a new network.
     NeuralResult setNetworkRuntime(INetworkRuntime* pNetworkRuntime) noexcept override;


     /// Returns the backend ID associated with this layer implementation.
     NetworkBackendId backendId() const noexcept override;

     /// Returns the tensor format consumed by this layer implementation.
     TensorFormat tensorFormat() const noexcept override;

     /// Returns the internal storage stride consumed by this layer implementation.
     TensorDimension stepping() const noexcept override;


     /// Retrieves the dimensions of the layer's output tensor.
     TensorDimension dimensions() const noexcept override;

     /// Retrieves the dimensions of the layer's output tensor as allocated internally.
     TensorDimension internalDimensions() const noexcept override;

     /// Retrieves the size of the layer's output tensor buffer in bytes.
     size_t tensorBufferSize() const noexcept override;

     /// Retrieves the size of the layer's output tensor buffer as allocated internally.
     /// NOTE(review): presumably in bytes, matching tensorBufferSize() -- confirm against ILayer.
     size_t tensorInternalBufferSize() const noexcept override;


     /// Loads layer parameters from a serialized key-value representation.
     NeuralResult loadFromParameters(const IParameterNode* pParameters) noexcept override;


     /// Retrieves the inputs for this layer.
     NeuralResult getInputLayers(ILayerList** ppInputLayers) const noexcept override;

     /// Sets an input layer by index.
     NeuralResult setInputLayer(size_t index, ILayer* pLayer) noexcept override;


     /// Sets or clears the "permanent" flag on a layer's output tensor.
     NeuralResult setPermanent(bool permanent) noexcept override;

     /// Returns the current status of the "permanent" flag.
     bool isPermanent() const noexcept override;


     /// Sets or clears the "affected" flag on a layer's output tensor.
     NeuralResult setAffected(bool affected) noexcept override;

     /// Returns the current status of the "affected" flag.
     bool isAffected() const noexcept override;


     /// Sets the activation function attached to the layer.
     NeuralResult setActivationFunction(ActivationFunctionId activationFunction) noexcept override;

     /// Retrieves the activation function attached to this layer.
     ActivationFunctionId activationFunction() const noexcept override;


     /// Sets an activation coefficient.
     NeuralResult setActivationCoefficient(std::size_t coefficientIndex, float value) noexcept override;

     /// Retrieves the activation coefficient for the specified index.
     float activationCoefficient(std::size_t coefficientIndex) const noexcept override;


     /// Retrieves the name used to identify this layer's weights.
     const char* weightsName() const noexcept override;

     /// Sets the name used to identify this layer's weights.
     NeuralResult setWeightsName(const char* pWeightsName) noexcept override;


     /// Retrieves the tensor dimension of a layer's named weight input.
     TensorDimension weightsDimensions(const char* pWeightsName, WeightsQuery queryType) const noexcept override;


     /// Initializes (or reinitializes) the layer implementation with the current set of parameters.
     NeuralResult reshape() noexcept override;

     /// Performs forward evaluation for this layer.
     NeuralResult evaluateForward() noexcept override;


     /// Retrieves device-side memory for the layer's output.
     NeuralResult getData(void** ppOut, TensorFormat format, const ILayer* pRequestingLayer) noexcept override;

     /// Retrieves read-only device-side memory for the layer's output.
     NeuralResult getConstData(const void** ppOut, TensorFormat format, const ILayer* pRequestingLayer) const noexcept override;

     /// Retrieves read-only CPU-side memory for the layer's output.
     NeuralResult getCpuConstData(void* pOutBuffer, size_t bufferByteCount, size_t* pBytesCopied, TensorFormat format) const noexcept override;


     /// Adds a kernel definition for a particular tensor format and backend.
     /// Declared final: derived layers cannot override it.
     NeuralResult addPrototypeCode(const char* pName, const char* pCode) noexcept override final;

     /// Adds a call script for a particular tensor format and backend.
     /// Declared final: derived layers cannot override it.
     NeuralResult addForwardEvalCall(const char* pName, const char* pCall) noexcept override final;

     /// Adds a named parameter to the layer.
     /// Declared final: derived layers cannot override it.
     NeuralResult addParameterKey(const char* pKey) noexcept override final;


     /// Generates C++ code to configure the layer.
     /// Declared final: derived layers cannot override it.
     NeuralResult generateLayerCpp(ICppCodeGenerationLayerHost* pHost) noexcept override final;

     /// Indicates the entire network has been generated.
     /// Declared final: derived layers cannot override it.
     NeuralResult networkGenerationComplete() noexcept override final;


 protected:

     /// Creates a new BasePrototypeLayer object.
     /// Protected, so only derived classes can construct one.
     BasePrototypeLayer();


     /// Implementation-specific logic for ILayer::reshape.
     virtual NeuralResult implementationReshape() noexcept = 0;


     /// Implementation-specific logic for ILayer::evaluateForward.
     virtual NeuralResult implementationForward() noexcept = 0;


     /// Loads prototype information from a parameter node.
     /// Unlike most members of this class, this function is not declared noexcept.
     NeuralResult loadBasePrototypeInfo(NetworkBackendId      backendId,

                                        const TensorFormat&   format,

                                        CompilationLevel      compilationLevel,

                                        const std::string&    currentImpl,

                                        const IParameterNode* pParameters);


     /// Stores implementation-agnostic details of the prototype layer.
     NeuralResult setBasePrototypeInfo(std::size_t         inputsCount,

                                       const std::string&  type,

                                       NetworkBackendId    backend,

                                       const TensorFormat& format,

                                       const std::string&  dim,

                                       const std::string&  impl) noexcept;


     /// Pointer to owning network.
     /// NOTE(review): no in-class initializer; confirm the constructor sets it.
     INetworkRuntime* m_pNetwork;

     /// Preferred block size in threads.
     detail::SizeValue m_block;

     /// Preferred grid size in blocks.
     detail::SizeValue m_grid;


     /// Arguments to pass to the compiled entry point.
     std::vector<detail::AnyOperand> m_ops;

     /// Source code for the currently selected implementation.
     std::string m_selected_code;

     /// Name of compiled entry point (e.g., CUDA function name).
     std::string m_entry;


 private:

     /// Aggregated description of the prototype layer (type, backend, format,
     /// code, and call scripts).
     struct BasePrototypeLayerParameters

     {

         std::string type; // layer type to use once prototyping is finished

         NetworkBackendId backendId;

         TensorFormat tensorFormat;

         std::map<std::string, std::string> code; // keyed by tensor type

         // dim example: 1,in[0].c+in[1].c,in.h,in.w;... (omitting the index means in[0].h == in[1].h == in[2].h ...)

         std::string dimNCHWCalculation;

         // fwd example: calling_kernel_name(in[0],in[1],out.w,out.h,in[0].c,in[1].c,out,1+5*4,act,act.alpha,@option,parameter)

         std::map<std::string, std::string> fwdEvalCall;

         std::vector<std::string> parametersKey;

         std::string currentImpl;

     };


     // Script interpreter callbacks. All are marked override; presumably they
     // implement detail::ScriptInterpretInterface<detail::AnyOperand> -- confirm
     // against ScriptEngine.h. Each one receives the operand `v` by non-const reference.
     void setReal(detail::AnyOperand& v, const std::string& str) override;

     void setInteger(detail::AnyOperand& v, const std::string& str) override;

     void setBufferPointer(detail::AnyOperand& v, const std::string& str, int arg_index) override;

     void neg(detail::AnyOperand& v) override;

     void add(detail::AnyOperand& v, detail::AnyOperand& op) override;

     void sub(detail::AnyOperand& v, detail::AnyOperand& op) override;

     void mul(detail::AnyOperand& v, detail::AnyOperand& op) override;

     void div(detail::AnyOperand& v, detail::AnyOperand& op) override;

     void setRealOption(detail::AnyOperand& v, const std::string& str) override;

     void setIntegerOption(detail::AnyOperand& v, const std::string& str) override;

     void transform(detail::AnyOperand& v, const std::string& str) override;

     void setActType(detail::AnyOperand& v) override;

     // "Alhpa" (sic): the spelling must match the overridden base declaration,
     // so it cannot be corrected in this class alone.
     void setActAlhpaLeft(detail::AnyOperand& v) override;

     void setActAlhpaRight(detail::AnyOperand& v) override;

     void setWeightsPointer(detail::AnyOperand& v, const std::string& str) override;

     void setInputPointer(detail::AnyOperand& v, int index) override;

     void setInputDimValue(detail::AnyOperand& v, int index, const std::string& str) override;

     void setOutputPointer(detail::AnyOperand& v, const std::string& name) override;

     void setOutputDimValue(detail::AnyOperand& v, const std::string& name, const std::string& str) override;


     // Presumably creates the object stored in m_pEngine -- confirm in BasePrototypeLayer.cpp.
     void createScriptEngine();

     // Interprets a parsed script node and returns the resulting operands.
     // onReshape defaults to false; its exact effect is defined in the .cpp -- TODO confirm.
     std::vector<detail::AnyOperand> interpretFinalize(const detail::SynParser::Node& node, bool onReshape = false);


     BasePrototypeLayerParameters m_basePrototypeParameters;

     std::string m_name;

     // NOTE(review): m_pBackend, m_permanent, m_affected, and m_activationFunction
     // have no in-class initializers; confirm the constructor initializes them.
     INetworkBackend* m_pBackend;

     TensorDimension m_dim;

     std::map<std::string, std::string> m_parameters;

     std::vector<ILayer*> m_inputLayers;

     bool m_permanent;

     bool m_affected;

     ActivationFunctionId m_activationFunction;

     std::vector<float> m_activationCoefficients;


     // Raw pointer, null until assigned.
     // NOTE(review): ownership/lifetime is not visible in this header -- confirm in the .cpp.
     detail::ScriptEngine* m_pEngine = nullptr;


     std::vector<ILayer*> m_skip;


     // Parsed syntax tree; presumably for the forward-evaluation call script -- TODO confirm.
     detail::SynParser::Node m_fwdSyntree;

     size_t m_smemSize = 0;

     std::string m_type;


     // Defaults to a stepping of 1 in every dimension.
     TensorDimension m_steppingValue = TensorDimension(1, 1, 1, 1);

     std::size_t m_expectedInputCount = 0;


     // Starts out true.
     // NOTE(review): presumably cleared by a successful reshape() -- confirm.
     bool m_reshapeFailed = true;

 };


 } // namespace nvneural


 #endif // !NVNEURAL_BASEPROTOTYPELAYER_H

CodeGenTypes.h
Definitions of C++ code generation interfaces exported by tools and plugins.

CoreTypes.h
Fundamental NvNeural data types are declared here.

nvneural::NetworkBackendId
NetworkBackendId
Enumeration describing common network backends.
Definition: CoreTypes.h:239

nvneural::CompilationLevel
CompilationLevel
This enum represents the kernel type contained by a prototype layer.
Definition: CoreTypes.h:1688

nvneural::ActivationFunctionId
ActivationFunctionId
Enumeration describing common activation functions.
Definition: CoreTypes.h:259

nvneural::NeuralResult
NeuralResult
NeuralResult is a generic success/failure result type similar to COM HRESULT.
Definition: CoreTypes.h:275

IPrototypeLayer.h
Common interfaces for prototype layers.

LayerTypes.h
Interface types needed by layer objects.

nvneural::WeightsQuery
WeightsQuery
WeightsQuery describes the different types of queries for weights data.
Definition: LayerTypes.h:39

RefObject.h
Standard implementation for IRefObject-derived objects.

ScriptEngine.h
Internal helper classes for working with prototype layer scripts.

nvneural::BasePrototypeLayer
Base class for the CUDA prototype layers shipped with NvNeural.
Definition: BasePrototypeLayer.h:49

nvneural::BasePrototypeLayer::getInputLayers
NeuralResult getInputLayers(ILayerList **ppInputLayers) const noexcept
Retrieves the inputs for this layer.
Definition: BasePrototypeLayer.cpp:467

nvneural::BasePrototypeLayer::m_grid
detail::SizeValue m_grid
Preferred grid size in blocks.
Definition: BasePrototypeLayer.h:211

nvneural::BasePrototypeLayer::setWeightsName
NeuralResult setWeightsName(const char *pWeightsName) noexcept
Sets the name used to identify this layer's weights.
Definition: BasePrototypeLayer.cpp:576

nvneural::BasePrototypeLayer::m_pNetwork
INetworkRuntime * m_pNetwork
Pointer to owning network.
Definition: BasePrototypeLayer.h:209

nvneural::BasePrototypeLayer::activationCoefficient
float activationCoefficient(std::size_t coefficientIndex) const noexcept
Retrieves the activation coefficient for the specified index.
Definition: BasePrototypeLayer.cpp:555

nvneural::BasePrototypeLayer::setNetworkRuntime
NeuralResult setNetworkRuntime(INetworkRuntime *pNetworkRuntime) noexcept
Informs the layer it has been attached to a new network.
Definition: BasePrototypeLayer.cpp:385

nvneural::BasePrototypeLayer::setBasePrototypeInfo
NeuralResult setBasePrototypeInfo(std::size_t inputsCount, const std::string &type, NetworkBackendId backend, const TensorFormat &format, const std::string &dim, const std::string &impl) noexcept
Stores implementation-agnostic details of the prototype layer.
Definition: BasePrototypeLayer.cpp:188

nvneural::BasePrototypeLayer::setActivationFunction
NeuralResult setActivationFunction(ActivationFunctionId activationFunction) noexcept
Sets the activation function attached to the layer.
Definition: BasePrototypeLayer.cpp:525

nvneural::BasePrototypeLayer::backendId
NetworkBackendId backendId() const noexcept
Returns the backend ID associated with this layer implementation.
Definition: BasePrototypeLayer.cpp:410

nvneural::BasePrototypeLayer::addPrototypeCode
NeuralResult addPrototypeCode(const char *pName, const char *pCode) noexcept final
Adds a kernel definition for a particular tensor format and backend.
Definition: BasePrototypeLayer.cpp:207

nvneural::BasePrototypeLayer::stepping
TensorDimension stepping() const noexcept
Returns the internal storage stride consumed by this layer implementation.
Definition: BasePrototypeLayer.cpp:405

nvneural::BasePrototypeLayer::weightsName
const char * weightsName() const noexcept
Retrieves the name used to identify this layer's weights.
Definition: BasePrototypeLayer.cpp:569

nvneural::BasePrototypeLayer::getCpuConstData
NeuralResult getCpuConstData(void *pOutBuffer, size_t bufferByteCount, size_t *pBytesCopied, TensorFormat format) const noexcept
Retrieves read-only CPU-side memory for the layer's output.
Definition: BasePrototypeLayer.cpp:615

nvneural::BasePrototypeLayer::tensorBufferSize
size_t tensorBufferSize() const noexcept
Retrieve the size of the layer's output tensor buffer in bytes.
Definition: BasePrototypeLayer.cpp:432

nvneural::BasePrototypeLayer::generateLayerCpp
NeuralResult generateLayerCpp(ICppCodeGenerationLayerHost *pHost) noexcept final
Generates C++ code to configure the layer.
Definition: BasePrototypeLayer.cpp:241

nvneural::BasePrototypeLayer::loadBasePrototypeInfo
NeuralResult loadBasePrototypeInfo(NetworkBackendId backendId, const TensorFormat &format, CompilationLevel compilationLevel, const std::string &currentImpl, const IParameterNode *pParameters)
Loads prototype information from a parameter node.
Definition: BasePrototypeLayer.cpp:68

nvneural::BasePrototypeLayer::weightsDimensions
TensorDimension weightsDimensions(const char *pWeightsName, WeightsQuery queryType) const noexcept
Retrieves the tensor dimension of a layer's named weight input.
Definition: BasePrototypeLayer.cpp:583

nvneural::BasePrototypeLayer::implementationForward
virtual NeuralResult implementationForward() noexcept=0
Implementation-specific logic for ILayer::evaluateForward.

nvneural::BasePrototypeLayer::m_block
detail::SizeValue m_block
Preferred block size in threads.
Definition: BasePrototypeLayer.h:210

nvneural::BasePrototypeLayer::tensorInternalBufferSize
size_t tensorInternalBufferSize() const noexcept
Retrieves the size of the layer's output tensor buffer in bytes as allocated internally.
Definition: BasePrototypeLayer.cpp:440

nvneural::BasePrototypeLayer::setAffected
NeuralResult setAffected(bool affected) noexcept
Sets or clears the "affected" flag on a layer's output tensor.
Definition: BasePrototypeLayer.cpp:514

nvneural::BasePrototypeLayer::addForwardEvalCall
NeuralResult addForwardEvalCall(const char *pName, const char *pCall) noexcept final
Adds a call script for a particular tensor format and backend.
Definition: BasePrototypeLayer.cpp:218

nvneural::BasePrototypeLayer::setPermanent
NeuralResult setPermanent(bool permanent) noexcept
Sets or clears the "permanent" flag on a layer's output tensor.
Definition: BasePrototypeLayer.cpp:503

nvneural::BasePrototypeLayer::getData
NeuralResult getData(void **ppOut, TensorFormat format, const ILayer *pRequestingLayer) noexcept
Retrieves device-side memory for the layer's output.
Definition: BasePrototypeLayer.cpp:590

nvneural::BasePrototypeLayer::serializedType
const char * serializedType() const noexcept
Retrieves the layer type.
Definition: BasePrototypeLayer.cpp:337

nvneural::BasePrototypeLayer::setInputLayer
NeuralResult setInputLayer(size_t index, ILayer *pLayer) noexcept
Sets an input layer by index.
Definition: BasePrototypeLayer.cpp:477

nvneural::BasePrototypeLayer::tensorFormat
TensorFormat tensorFormat() const noexcept
Returns the tensor format consumed by this layer implementation.
Definition: BasePrototypeLayer.cpp:415

nvneural::BasePrototypeLayer::internalDimensions
TensorDimension internalDimensions() const noexcept
Retrieves the dimensions of the layer's output tensor as allocated internally.
Definition: BasePrototypeLayer.cpp:425

nvneural::BasePrototypeLayer::m_ops
std::vector< detail::AnyOperand > m_ops
Arguments to pass to the compiled entry point.
Definition: BasePrototypeLayer.h:213

nvneural::BasePrototypeLayer::isAffected
bool isAffected() const noexcept
Returns the current status of the "affected" flag.
Definition: BasePrototypeLayer.cpp:520

nvneural::BasePrototypeLayer::reshape
NeuralResult reshape() noexcept
Initializes (or reinitializes) the layer implementation with the current set of parameters.
Definition: BasePrototypeLayer.cpp:655

nvneural::BasePrototypeLayer::isPermanent
bool isPermanent() const noexcept
Returns the current status of the "permanent" flag.
Definition: BasePrototypeLayer.cpp:509

nvneural::BasePrototypeLayer::activationFunction
ActivationFunctionId activationFunction() const noexcept
Retrieves the activation function attached to this layer.
Definition: BasePrototypeLayer.cpp:531

nvneural::BasePrototypeLayer::loadFromParameters
NeuralResult loadFromParameters(const IParameterNode *pParameters) noexcept
Loads layer parameters from a serialized key-value representation.
Definition: BasePrototypeLayer.cpp:448

nvneural::BasePrototypeLayer::evaluateForward
NeuralResult evaluateForward() noexcept
Performs forward evaluation for this layer.
Definition: BasePrototypeLayer.cpp:758

nvneural::BasePrototypeLayer::addParameterKey
NeuralResult addParameterKey(const char *pKey) noexcept final
Adds a named parameter to the layer.
Definition: BasePrototypeLayer.cpp:229

nvneural::BasePrototypeLayer::m_selected_code
std::string m_selected_code
Source code for the currently selected implementation.
Definition: BasePrototypeLayer.h:214

nvneural::BasePrototypeLayer::setName
NeuralResult setName(const char *pName) noexcept
Sets the layer name.
Definition: BasePrototypeLayer.cpp:368

nvneural::BasePrototypeLayer::implementationReshape
virtual NeuralResult implementationReshape() noexcept=0
Implementation-specific logic for ILayer::reshape.

nvneural::BasePrototypeLayer::m_entry
std::string m_entry
Name of compiled entry point (e.g., CUDA function name)
Definition: BasePrototypeLayer.h:215

nvneural::BasePrototypeLayer::name
const char * name() const noexcept
Retrieves the layer name.
Definition: BasePrototypeLayer.cpp:380

nvneural::BasePrototypeLayer::getConstData
NeuralResult getConstData(const void **ppOut, TensorFormat format, const ILayer *pRequestingLayer) const noexcept
Retrieves read-only device-side memory for the layer's output.
Definition: BasePrototypeLayer.cpp:599

nvneural::BasePrototypeLayer::networkGenerationComplete
NeuralResult networkGenerationComplete() noexcept final
Indicates the entire network has been generated.
Definition: BasePrototypeLayer.cpp:332

nvneural::BasePrototypeLayer::dimensions
TensorDimension dimensions() const noexcept
Retrieves the dimensions of the layer's output tensor.
Definition: BasePrototypeLayer.cpp:420

nvneural::BasePrototypeLayer::setActivationCoefficient
NeuralResult setActivationCoefficient(std::size_t coefficientIndex, float value) noexcept
Sets an activation coefficient.
Definition: BasePrototypeLayer.cpp:536

nvneural::BasePrototypeLayer::BasePrototypeLayer
BasePrototypeLayer()
Creates a new BasePrototypeLayer object.
Definition: BasePrototypeLayer.cpp:53

nvneural::ICppCodeGenerationLayerHost
Tool-supplied interface for C++ code generation.
Definition: CodeGenTypes.h:130

nvneural::ILayer
ILayer is the base class for neural network layers.
Definition: LayerTypes.h:59

nvneural::ILayerList
ILayerList represents an immutable collection of ILayer pointers.
Definition: CoreTypes.h:1060

nvneural::INetworkBackend
INetworkBackend is a runtime-specific interface for CUDA, DirectX, or other system-specific operations.
Definition: CoreTypes.h:643

nvneural::INetworkRuntime
INetworkRuntime is a subset of the basic network interface that is accessible from layer classes duri...
Definition: CoreTypes.h:1129

nvneural::IParameterNode
Represents a serialized parameter block in a model definition.
Definition: CoreTypes.h:1889

nvneural::TensorDimension
TensorDimension describes the dimensions of a four-dimensional image tensor.
Definition: CoreTypes.h:136

nvneural::TensorFormat
TensorFormat describes a specific tensor shape (element type and layout).
Definition: CoreTypes.h:88

nvneural::refobj::RefObjectBase
Parameterized base class implementing common IRefObject operations.
Definition: RefObject.h:336