2022.2/NvNeuralSDK/_base_layer_8h_source.html

 /*

 * SPDX-FileCopyrightText: Copyright (c) 2020-2021 NVIDIA CORPORATION & AFFILIATES. All rights reserved.

 * SPDX-License-Identifier: MIT

 *

 * Permission is hereby granted, free of charge, to any person obtaining a

 * copy of this software and associated documentation files (the "Software"),

 * to deal in the Software without restriction, including without limitation

 * the rights to use, copy, modify, merge, publish, distribute, sublicense,

 * and/or sell copies of the Software, and to permit persons to whom the

 * Software is furnished to do so, subject to the following conditions:

 *

 * The above copyright notice and this permission notice shall be included in

 * all copies or substantial portions of the Software.

 *

 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR

 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,

 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL

 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER

 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING

 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER

 * DEALINGS IN THE SOFTWARE.

 */


 #ifndef NVNEURAL_BASELAYER_H

 #define NVNEURAL_BASELAYER_H


 #include <nvneural/CoreTypes.h>
 #include <nvneural/CoreHelpers.h>
 #include <nvneural/LayerTypes.h>

 #include <array>
 #include <cctype>
 #include <cstddef>
 #include <cstdint>
 #include <exception>
 #include <sstream>
 #include <string>
 #include <vector>


 namespace nvneural {


     class BaseLayer : public ILayer

     {

     public:

         /// Sets the layer name.
         NeuralResult setName(const char* pName) noexcept override;

         /// Retrieves the layer name.
         const char* name() const noexcept override;


         /// Informs the layer it has been attached to a new network.
         NeuralResult setNetworkRuntime(INetworkRuntime* pNetworkRuntime) noexcept override;


         /// Returns the backend ID associated with this layer implementation.
         NetworkBackendId backendId() const noexcept override;

         /// Returns the tensor format consumed by this layer implementation.
         TensorFormat tensorFormat() const noexcept override;

         /// Returns the internal storage stride consumed by this layer implementation.
         TensorDimension stepping() const noexcept override;

         // Derived: TensorDimension dimensions() const noexcept override;

         /// Retrieves the dimensions of the layer's output tensor as allocated internally.
         TensorDimension internalDimensions() const noexcept override;

         /// Retrieves the size of the layer's output tensor buffer in bytes.
         size_t tensorBufferSize() const noexcept override;

         /// Retrieves the size of the layer's output tensor buffer as allocated internally.
         /// NOTE(review): presumably in bytes, like tensorBufferSize() - confirm in BaseLayer.cpp.
         size_t tensorInternalBufferSize() const noexcept override;


         /// Loads layer parameters from a serialized key-value representation.
         NeuralResult loadFromParameters(const IParameterNode* pParameters) noexcept override;


         /// Sets the activation function attached to the layer.
         NeuralResult setActivationFunction(ActivationFunctionId activationFunction) noexcept override;

         /// Retrieves the activation function attached to this layer.
         ActivationFunctionId activationFunction() const noexcept override;


         /// Sets an activation coefficient.
         NeuralResult setActivationCoefficient(std::size_t coefficientIndex, float value) noexcept override;

         /// Retrieves the activation coefficient for the specified index.
         float activationCoefficient(std::size_t coefficientIndex) const noexcept override;


         /// Sets or clears the "permanent" flag on a layer's output tensor.
         NeuralResult setPermanent(bool permanent) noexcept override;

         /// Returns the current status of the "permanent" flag.
         bool isPermanent() const noexcept override;


         /// Sets or clears the "affected" flag on a layer's output tensor.
         NeuralResult setAffected(bool affected) noexcept override;

         /// Returns the current status of the "affected" flag.
         bool isAffected() const noexcept override;


         /// Retrieves the inputs for this layer.
         NeuralResult getInputLayers(ILayerList** ppInputLayers) const noexcept override;

         /// Sets an input layer by index.
         NeuralResult setInputLayer(std::size_t index, ILayer* pLayer) noexcept override;


         // Derived: NeuralResult reshape() noexcept override;

         // Derived: NeuralResult evaluateForward() noexcept override;


         /// Retrieves the name used to identify this layer's weights.
         const char* weightsName() const noexcept override;

         /// Sets the name used to identify this layer's weights.
         NeuralResult setWeightsName(const char* pWeightsName) noexcept override;


         /// Retrieves the tensor dimension of a layer's named weight input.
         TensorDimension weightsDimensions(const char* pWeightsName, WeightsQuery queryType) const noexcept override;


         /// Retrieves device-side memory for the layer's output.
         NeuralResult getData(void** ppOut, TensorFormat format, const ILayer* pRequestingLayer) noexcept override;

         /// Retrieves read-only device-side memory for the layer's output.
         NeuralResult getConstData(const void** ppOut, TensorFormat format, const ILayer* pRequestingLayer) const noexcept override;

         /// Retrieves read-only CPU-side memory for the layer's output.
         NeuralResult getCpuConstData(void* pOutBuffer, size_t bufferByteCount, size_t* pBytesCopied, TensorFormat format) const noexcept override;


     protected:

         /// Protected constructor: BaseLayer is only constructible from derived classes.
         BaseLayer();

         /// Returns the INetworkRuntime object most recently set with setNetworkRuntime.
         INetworkRuntime* networkRuntime() const;

         /// Returns the INetworkBackend object associated with the most closely matching
         /// implementation (the matching rule is defined in BaseLayer.cpp).
         RefPtr<INetworkBackend> networkBackend() const;


         /// Allocates a memory block of the requested size.
         NeuralResult allocateMemoryBlock(MemoryHandle* pHandle, size_t byteCount) noexcept;


         /// Overload of allocateMemoryBlock that additionally takes a pTrackingKey string.
         /// NOTE(review): presumably the key labels the allocation for tracking - confirm in BaseLayer.cpp.
         NeuralResult allocateMemoryBlock(MemoryHandle* pHandle, size_t byteCount, const char* pTrackingKey) noexcept;


         /// Returns a pointer to the output tensor memory in the provided format.
         void* data(TensorFormat format);


         /// Returns the Nth input layer attached to this layer.
         /// verifyInputConnected() treats a null return value as "not connected".
         const ILayer* inputLayer(size_t index) const;


         /// Non-const overload of inputLayer().
         ILayer* inputLayer(size_t index);


         /// Returns the number of input layers assigned to this object.
         size_t inputLayerCount() const;


         /// Registers an implementation for multi-format layers.
         void registerImplementation(NetworkBackendId backendId, TensorDataType elementType, TensorDataLayout layout, int penalty);


         /// Callback for derived classes to know that the "preferred implementation" has changed.
         virtual void onImplementationChanged() const;


         /// Returns a pointer to device-side memory containing the indicated weights data.
         const void* weightsData(const char* pWeightsName) const;


         /// Returns the size of already-loaded weights data, whether using a layer or IWeightsLoader.
         TensorDimension loadedWeightsSize(const ILayer* pWeightsLayer, const char* pWeightsName) const;


         /// Test if inputs represented by indices are connected, and log errors if not.
         ///
         /// An input counts as connected when inputLayer(index) returns a non-null pointer.
         /// When at least one requested input is missing, a single error line listing every
         /// missing index is sent to the default logger.
         ///
         /// @param indices Input indices that must be connected; each is converted to size_t.
         /// @return true if every listed input is connected (or no indices were given), false otherwise.
         template<typename... Indices>
         bool verifyInputConnected(Indices... indices) const noexcept
         {
             constexpr std::size_t requiredCount = sizeof...(Indices);
             const std::array<size_t, requiredCount> required = { static_cast<size_t>(indices)... };

             // Advance to the first required input that is not connected.
             std::size_t cursor = 0;
             while (cursor < requiredCount && inputLayer(required[cursor]))
             {
                 ++cursor;
             }

             if (cursor == requiredCount)
             {
                 // Nothing is missing.
                 return true;
             }

             // Build the report lazily: the stream is only created on the failure path.
             std::stringstream report;
             report << name() << ": These mandatory inputs are not connected: " << required[cursor];

             // Append any further missing inputs after the first one.
             for (++cursor; cursor < requiredCount; ++cursor)
             {
                 const std::size_t candidate = required[cursor];
                 if (!inputLayer(candidate))
                 {
                     report << ", " << candidate;
                 }
             }

             DefaultLogger()->logError(0, "%s", report.str().c_str());
             return false;
         }


         /// Marks this layer as in need of reshape.
         void requestReshape() noexcept;


         /// This enum describes a result from the load2ElementParameter function.
         enum class LoadResult : std::uint16_t
         {
             Success             = 0, ///< Parsing succeeded.
             Failure             = 1, ///< Parsing failed; the output references were not written.
             NonNumericInput     = 2, ///< An input component contained a nondigit.
             CouldNotTranslate   = 3, ///< An input component could not be parsed as a number.
         };

         /// Helper function that takes a vector of strings and loads 2 size_t elements.
         ///
         /// The first two entries of inArray are parsed with std::stoul. A component is only
         /// parsed when its first character is an ASCII digit; characters following a valid
         /// numeric prefix are ignored by std::stoul. A component that is absent or cannot be
         /// parsed is replaced by the fill value.
         ///
         /// @param inArray            String components; only the first two are examined.
         /// @param outElementX        Receives the first element (or the fill value).
         /// @param outElementY        Receives the second element (or the fill value).
         /// @param inFill             Fill value used for missing or unparsable components.
         /// @param inFillFirstElement When true, the parsed first element is used as the fill
         ///                           value instead of inFill; the first element must then parse.
         ///
         /// @return LoadResult::Success when every examined component parsed.
         ///         LoadResult::Failure when inArray is empty, or when inFillFirstElement is set
         ///         and the first component did not parse; the outputs are NOT written.
         ///         LoadResult::NonNumericInput / LoadResult::CouldNotTranslate when a component
         ///         was rejected; the outputs ARE still written, with the fill value substituted
         ///         for each rejected component. If both components are rejected, the status of
         ///         the second one is reported.
         static LoadResult load2ElementParameter(const std::vector<std::string>& inArray, size_t& outElementX, size_t& outElementY, size_t inFill, bool inFillFirstElement = false)
         {
             // Sanity check the input array
             if (inArray.empty())
             {
                 return LoadResult::Failure;
             }

             // Parses one component into outValue. outValue is left untouched unless parsing succeeds.
             const auto parseElement = [](const std::string& text, size_t& outValue) -> LoadResult
             {
                 // Compare against the digit range directly instead of calling isdigit():
                 // passing a negative char (any byte >= 0x80 where char is signed) to isdigit()
                 // is undefined behavior, and the range test is also locale-independent.
                 const char leading = text.empty() ? '\0' : text.front();
                 if (leading < '0' || leading > '9')
                 {
                     return LoadResult::NonNumericInput;
                 }

                 try
                 {
                     outValue = static_cast<size_t>(std::stoul(text));
                 }
                 catch (const std::exception&)
                 {
                     // With a leading digit this is the out-of-range case.
                     return LoadResult::CouldNotTranslate;
                 }
                 return LoadResult::Success;
             };

             // The first element falls back to inFill when it cannot be parsed.
             size_t firstElement = inFill;
             LoadResult status = parseElement(inArray[0], firstElement);

             // The fill for the second element is either inFill or the parsed first element.
             size_t calcFill = inFill;
             if (inFillFirstElement)
             {
                 if (status != LoadResult::Success)
                 {
                     // There is no usable first element to fill with; outputs stay untouched.
                     return LoadResult::Failure;
                 }
                 calcFill = firstElement;
             }

             // The second element is optional; a rejected one keeps the fill and updates the status.
             size_t secondElement = calcFill;
             if (inArray.size() >= 2)
             {
                 const LoadResult secondStatus = parseElement(inArray[1], secondElement);
                 if (secondStatus != LoadResult::Success)
                 {
                     status = secondStatus;
                 }
             }

             // Finalize output
             outElementX = firstElement;
             outElementY = secondElement;

             return status;
         }


     private:

         // NOTE(review): the member functions that read and write these fields are defined in
         // BaseLayer.cpp, so the pairings suggested below are inferred from names - confirm there.

         // Activation function ID; presumably backs setActivationFunction()/activationFunction().
         ActivationFunctionId m_activationFunction;

         // Activation coefficients; presumably indexed by the coefficientIndex accessor argument.
         std::vector<float> m_activationCoefficients;

         // Layer name; presumably backs setName()/name().
         std::string m_name;

         // Presumably the "permanent" flag exposed through setPermanent()/isPermanent().
         bool m_permanent;

         // Presumably the "affected" flag exposed through setAffected()/isAffected().
         bool m_affected;

         // Presumably backs setWeightsName()/weightsName().
         std::string m_weightsName;


         // Raw pointer to the network runtime; presumably the value handed to setNetworkRuntime().
         INetworkRuntime* m_pNetwork;

         // Raw pointer to a network backend; ownership is not visible from this header.
         INetworkBackend* m_pBackend;

         // Raw pointers to input layers; presumably indexed by the setInputLayer() index.
         std::vector<ILayer*> m_inputLayers;


         // One implementation entry: a backend ID, a tensor format, and an integer penalty.
         struct InternalImplementation
         {

             NetworkBackendId backendId;

             TensorFormat format;

             int penalty;

         };

         // List of implementation entries; presumably appended to by registerImplementation().
         std::vector<InternalImplementation> m_implementations;

         // Pointer to one implementation entry. Declared mutable so that const member
         // functions can reassign it; presumably updateImplementation() does - confirm.
         mutable const InternalImplementation* m_pCurrentImplementation;


         // Const helper declared here and defined in BaseLayer.cpp.
         void updateImplementation() const;

     };


 } // namespace nvneural


 #endif // NVNEURAL_BASELAYER_H

CoreHelpers.h
Common helper classes and template function implementations.

nvneural::DefaultLogger
ILogger * DefaultLogger()
Returns a pointer to the default logger for this module.
Definition: Logging.cpp:38

CoreTypes.h
Fundamental NvNeural data types are declared here.

nvneural::TensorDataType
TensorDataType
Enumeration describing common tensor element types.
Definition: CoreTypes.h:60

nvneural::TensorDataLayout
TensorDataLayout
Enumeration describing common tensor data layouts.
Definition: CoreTypes.h:77

nvneural::MemoryHandle
MemoryHandle__type * MemoryHandle
Opaque typedef used to represent INetworkBackend memory handles.
Definition: CoreTypes.h:626

nvneural::NetworkBackendId
NetworkBackendId
Enumeration describing common network backends.
Definition: CoreTypes.h:239

nvneural::ActivationFunctionId
ActivationFunctionId
Enumeration describing common activation functions.
Definition: CoreTypes.h:259

nvneural::NeuralResult
NeuralResult
NeuralResult is a generic success/failure result type similar to COM HRESULT.
Definition: CoreTypes.h:275

nvneural::NeuralResult::Success
@ Success
Operation succeeded. Generic result.

nvneural::NeuralResult::Failure
@ Failure
Operation failed. Generic result.

LayerTypes.h
Interface types needed by layer objects.

nvneural::WeightsQuery
WeightsQuery
WeightsQuery describes the different types of queries for weights data.
Definition: LayerTypes.h:39

nvneural::BaseLayer
BaseLayer provides common implementations for most of ILayer.
Definition: BaseLayer.h:74

nvneural::BaseLayer::data
void * data(TensorFormat format)
Returns a pointer to the output tensor memory in the provided format.
Definition: BaseLayer.cpp:310

nvneural::BaseLayer::setWeightsName
NeuralResult setWeightsName(const char *pWeightsName) noexcept
Sets the name used to identify this layer's weights.
Definition: BaseLayer.cpp:340

nvneural::BaseLayer::loadFromParameters
NeuralResult loadFromParameters(const IParameterNode *pParameters) noexcept
Loads layer parameters from a serialized key-value representation.
Definition: BaseLayer.cpp:147

nvneural::BaseLayer::weightsName
const char * weightsName() const noexcept
Retrieves the name used to identify this layer's weights.
Definition: BaseLayer.cpp:335

nvneural::BaseLayer::setActivationCoefficient
NeuralResult setActivationCoefficient(std::size_t coefficientIndex, float value) noexcept
Sets an activation coefficient.
Definition: BaseLayer.cpp:163

nvneural::BaseLayer::networkRuntime
INetworkRuntime * networkRuntime() const
Returns the INetworkRuntime object most recently set with setNetworkRuntime.
Definition: BaseLayer.cpp:88

nvneural::BaseLayer::setName
NeuralResult setName(const char *pName) noexcept
Sets the layer name.
Definition: BaseLayer.cpp:46

nvneural::BaseLayer::stepping
TensorDimension stepping() const noexcept
Returns the internal storage stride consumed by this layer implementation.
Definition: BaseLayer.cpp:119

nvneural::BaseLayer::setActivationFunction
NeuralResult setActivationFunction(ActivationFunctionId activationFunction) noexcept
Sets the activation function attached to the layer.
Definition: BaseLayer.cpp:152

nvneural::BaseLayer::internalDimensions
TensorDimension internalDimensions() const noexcept
Retrieves the dimensions of the layer's output tensor as allocated internally.
Definition: BaseLayer.cpp:124

nvneural::BaseLayer::tensorInternalBufferSize
size_t tensorInternalBufferSize() const noexcept
Retrieves the size of the layer's output tensor buffer in bytes, as allocated internally.
Definition: BaseLayer.cpp:139

nvneural::BaseLayer::allocateMemoryBlock
NeuralResult allocateMemoryBlock(MemoryHandle *pHandle, size_t byteCount) noexcept
Allocates a memory block of the requested size.
Definition: BaseLayer.cpp:98

nvneural::BaseLayer::isPermanent
bool isPermanent() const noexcept
Returns the current status of the "permanent" flag.
Definition: BaseLayer.cpp:204

nvneural::BaseLayer::backendId
NetworkBackendId backendId() const noexcept
Returns the backend ID associated with this layer implementation.
Definition: BaseLayer.cpp:458

nvneural::BaseLayer::onImplementationChanged
virtual void onImplementationChanged() const
Callback for derived classes to know that the "preferred implementation" has changed.
Definition: BaseLayer.cpp:387

nvneural::BaseLayer::weightsData
const void * weightsData(const char *pWeightsName) const
Returns a pointer to device-side memory containing the indicated weights data.
Definition: BaseLayer.cpp:355

nvneural::BaseLayer::getCpuConstData
NeuralResult getCpuConstData(void *pOutBuffer, size_t bufferByteCount, size_t *pBytesCopied, TensorFormat format) const noexcept
Retrieves read-only CPU-side memory for the layer's output.
Definition: BaseLayer.cpp:270

nvneural::BaseLayer::activationFunction
ActivationFunctionId activationFunction() const noexcept
Retrieves the activation function attached to this layer.
Definition: BaseLayer.cpp:158

nvneural::BaseLayer::setNetworkRuntime
NeuralResult setNetworkRuntime(INetworkRuntime *pNetworkRuntime) noexcept
Informs the layer it has been attached to a new network.
Definition: BaseLayer.cpp:67

nvneural::BaseLayer::tensorBufferSize
size_t tensorBufferSize() const noexcept
Retrieve the size of the layer's output tensor buffer in bytes.
Definition: BaseLayer.cpp:131

nvneural::BaseLayer::name
const char * name() const noexcept
Retrieves the layer name.
Definition: BaseLayer.cpp:62

nvneural::BaseLayer::getConstData
NeuralResult getConstData(const void **ppOut, TensorFormat format, const ILayer *pRequestingLayer) const noexcept
Retrieves read-only device-side memory for the layer's output.
Definition: BaseLayer.cpp:245

nvneural::BaseLayer::load2ElementParameter
static LoadResult load2ElementParameter(const std::vector< std::string > &inArray, size_t &outElementX, size_t &outElementY, size_t inFill, bool inFillFirstElement=false)
Helper function that takes a vector of strings and loads 2 size_t elements.
Definition: BaseLayer.h:278

nvneural::BaseLayer::activationCoefficient
float activationCoefficient(std::size_t coefficientIndex) const noexcept
Retrieves the activation coefficient for the specified index.
Definition: BaseLayer.cpp:183

nvneural::BaseLayer::tensorFormat
TensorFormat tensorFormat() const noexcept
Returns the tensor format consumed by this layer implementation.
Definition: BaseLayer.cpp:471

nvneural::BaseLayer::getInputLayers
NeuralResult getInputLayers(ILayerList **ppInputLayers) const noexcept
Retrieves the inputs for this layer.
Definition: BaseLayer.cpp:220

nvneural::BaseLayer::LoadResult
LoadResult
This enum describes a result from the load2ElementParameter function.
Definition: BaseLayer.h:262

nvneural::BaseLayer::LoadResult::NonNumericInput
@ NonNumericInput
An input component contained a nondigit.

nvneural::BaseLayer::LoadResult::Success
@ Success
Parsing succeeded.

nvneural::BaseLayer::LoadResult::CouldNotTranslate
@ CouldNotTranslate
An input component could not be parsed as a number.

nvneural::BaseLayer::LoadResult::Failure
@ Failure
Parsing failed.

nvneural::BaseLayer::setAffected
NeuralResult setAffected(bool affected) noexcept
Sets or clears the "affected" flag on a layer's output tensor.
Definition: BaseLayer.cpp:209

nvneural::BaseLayer::setInputLayer
NeuralResult setInputLayer(std::size_t index, ILayer *pLayer) noexcept
Sets an input layer by index.
Definition: BaseLayer.cpp:230

nvneural::BaseLayer::inputLayer
const ILayer * inputLayer(size_t index) const
Returns the Nth input layer attached to this layer.
Definition: BaseLayer.cpp:315

nvneural::BaseLayer::verifyInputConnected
bool verifyInputConnected(Indices... indices) const noexcept
Test if inputs represented by indices are connected, and log errors if not.
Definition: BaseLayer.h:214

nvneural::BaseLayer::setPermanent
NeuralResult setPermanent(bool permanent) noexcept
Sets or clears the "permanent" flag on a layer's output tensor.
Definition: BaseLayer.cpp:198

nvneural::BaseLayer::loadedWeightsSize
TensorDimension loadedWeightsSize(const ILayer *pWeightsLayer, const char *pWeightsName) const
Returns the size of already-loaded weights data, whether using a layer or IWeightsLoader.
Definition: BaseLayer.cpp:364

nvneural::BaseLayer::inputLayerCount
size_t inputLayerCount() const
Returns the number of input layers assigned to this object.
Definition: BaseLayer.cpp:330

nvneural::BaseLayer::registerImplementation
void registerImplementation(NetworkBackendId backendId, TensorDataType elementType, TensorDataLayout layout, int penalty)
Registers an implementation for multi-format layers.
Definition: BaseLayer.cpp:380

nvneural::BaseLayer::networkBackend
RefPtr< INetworkBackend > networkBackend() const
Returns the INetworkBackend object associated with the implementation that most closely matches the c...
Definition: BaseLayer.cpp:93

nvneural::BaseLayer::requestReshape
void requestReshape() noexcept
Marks this layer as in need of reshape.
Definition: BaseLayer.cpp:484

nvneural::BaseLayer::getData
NeuralResult getData(void **ppOut, TensorFormat format, const ILayer *pRequestingLayer) noexcept
Retrieves device-side memory for the layer's output.
Definition: BaseLayer.cpp:261

nvneural::BaseLayer::weightsDimensions
TensorDimension weightsDimensions(const char *pWeightsName, WeightsQuery queryType) const noexcept
Retrieves the tensor dimension of a layer's named weight input.
Definition: BaseLayer.cpp:350

nvneural::BaseLayer::isAffected
bool isAffected() const noexcept
Returns the current status of the "affected" flag.
Definition: BaseLayer.cpp:215

nvneural::ILayer
ILayer is the base class for neural network layers.
Definition: LayerTypes.h:59

nvneural::ILayerList
ILayerList represents an immutable collection of ILayer pointers.
Definition: CoreTypes.h:1060

nvneural::ILogger::logError
virtual NeuralResult logError(VerbosityLevel verbosity, const char *format,...) noexcept=0
Logs an error message.

nvneural::INetworkBackend
INetworkBackend is a runtime-specific interface for CUDA, DirectX, or other system-specific operatio...
Definition: CoreTypes.h:643

nvneural::INetworkRuntime
INetworkRuntime is a subset of the basic network interface that is accessible from layer classes duri...
Definition: CoreTypes.h:1129

nvneural::IParameterNode
Represents a serialized parameter block in a model definition.
Definition: CoreTypes.h:1889

nvneural::RefPtr
Intrusive pointer using IRefObject's reference counting system.
Definition: RefPtr.h:46

nvneural::TensorDimension
TensorDimension describes the dimensions of a four-dimensional image tensor.
Definition: CoreTypes.h:136

nvneural::TensorFormat
TensorFormat describes a specific tensor shape (element type and layout).
Definition: CoreTypes.h:88