_static/c-api/_nv_infer_safe_mem_allocator_8h_source.html

/*

 * SPDX-FileCopyrightText: Copyright (c) 1993-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.

 * SPDX-License-Identifier: Apache-2.0

 *

 * Licensed under the Apache License, Version 2.0 (the "License");

 * you may not use this file except in compliance with the License.

 * You may obtain a copy of the License at

 *

 * http://www.apache.org/licenses/LICENSE-2.0

 *

 * Unless required by applicable law or agreed to in writing, software

 * distributed under the License is distributed on an "AS IS" BASIS,

 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

 * See the License for the specific language governing permissions and

 * limitations under the License.

 */


// Header file for the NVIDIA Safe Runtime Memory Allocator interface.

// This file provides the user-implementable interface for the Memory Allocator feature in the NVIDIA Safe Runtime API.

// It includes the necessary classes, functions, and definitions for creating and managing safe memory allocators,

// including the ISafeMemAllocator interface.

// Users should implement this interface to provide a custom memory allocator that will be used by the Safe Runtime

// to allocate memory for both CPU and GPU resources. The allocator should handle memory allocation and deallocation

// requests from the Safe Runtime, and ensure thread safety and proper memory management.

// The implemented allocator will be responsible for allocating memory for various components of the Safe Runtime,

// including tensors, plugins, and other internal data structures.


#ifndef NV_INFER_SAFE_MEM_ALLOCATOR_H

#define NV_INFER_SAFE_MEM_ALLOCATOR_H

#include "NvInferSafeRecorder.h"

#include <cstdint>


namespace nvinfer2

{

namespace safe

{

// Forward declaration of the recorder interface that is passed by reference to the
// allocator callbacks declared in this header. This header also includes
// "NvInferSafeRecorder.h", so this declaration only makes the dependency explicit.
class ISafeRecorder;


//! Legacy constant equal to 16 GiB (16 * 2^30 = 17179869184 bytes), kept for
//! TensorRT excessiveMemoryDetection test build compatibility.
constexpr uint64_t kMAXIMUM_ALLOC_SIZE{static_cast<uint64_t>(16U) << 30U};


//! Describes the placement of a memory region.
//! The numeric values are part of the interface and must not be changed.
enum class MemoryPlacement : uint32_t
{
    //! Invalid or unspecified placement (used for error checking).
    kNONE = 0x00U,
    //! CUDA managed memory (not used for safety).
    kMANAGED = 0x01U,
    //! Device memory allocated via cudaMalloc.
    kGPU = 0x02U,
    //! Regular host memory allocated via malloc or aligned_alloc.
    kCPU = 0x04U,
    //! Page-locked host memory allocated via cudaHostAlloc, mappable to device (for zero-copy).
    kCPU_PINNED = 0x80U
};


//! Describes how a memory region is used.
//! The numeric values are part of the interface and must not be changed.
enum class MemoryUsage : uint32_t
{
    //! Uncommitted memory usage.
    kGENERIC = 0x0U,
    //! Memory (network weights) that is initialized once and can be shared across different graphs.
    kIMMUTABLE = 0x3U,
    //! Scratchpad memory per context used for intermediate tensors.
    kSCRATCH = 0x5U,
    //! Memory used for IO tensors.
    kIOTENSOR = 0x6U
};


//! \brief Application-implemented class for controlling memory allocation on the GPU/CPU.
//!
//! The interface consists of two pure virtual callbacks, allocate() and deallocate(),
//! both declared noexcept. Copy and move operations are protected, so they are only
//! accessible to derived classes.
//!
//! NOTE(review): the declaration order of the virtual members determines the vtable
//! layout on common ABIs; do not reorder them without confirming binary compatibility.
class ISafeMemAllocator

{

public:

    //! \brief A thread-safe callback implemented by the application to handle
    //!        acquisition of GPU/CPU memory.
    //!
    //! \param size       Requested size. Presumably in bytes - TODO confirm.
    //! \param alignment  Requested alignment. Presumably in bytes - TODO confirm.
    //! \param flags      Placement of the requested memory (see MemoryPlacement).
    //! \param usage      Intended usage of the requested memory (see MemoryUsage).
    //! \param recorder   Recorder passed to the callback. Presumably used by the
    //!                   implementation to report diagnostics - TODO confirm.
    //!
    //! \return Pointer to the acquired memory. NOTE(review): the failure convention
    //!         (presumably nullptr) is not stated in this header - confirm.
    virtual void* allocate(uint64_t const size, uint64_t const alignment, MemoryPlacement const flags,

        MemoryUsage const usage, ISafeRecorder& recorder) noexcept = 0;


    //! \brief Destructor for ISafeMemAllocator. Virtual, so implementations can be
    //!        destroyed through a pointer to this interface.
    virtual ~ISafeMemAllocator() = default;

    //! \brief Default constructor for ISafeMemAllocator.
    ISafeMemAllocator() = default;


    //! \brief A thread-safe callback implemented by the application to handle
    //!        release of GPU/CPU memory.
    //!
    //! \param memory    Pointer to the memory to release. Presumably a pointer
    //!                  previously returned by allocate() - TODO confirm.
    //! \param flags     Placement of the memory being released (see MemoryPlacement).
    //! \param recorder  Recorder passed to the callback. Presumably used by the
    //!                  implementation to report diagnostics - TODO confirm.
    //!
    //! \return Status of the release. NOTE(review): presumably true on success;
    //!         the exact meaning is not stated in this header - confirm.
    virtual bool deallocate(void* const memory, MemoryPlacement const flags, ISafeRecorder& recorder) noexcept = 0;


protected:

    //! \brief Copy constructor (defaulted). Protected: accessible to derived classes only.
    ISafeMemAllocator(ISafeMemAllocator const&) = default;

    //! \brief Move constructor (defaulted). Protected: accessible to derived classes only.
    ISafeMemAllocator(ISafeMemAllocator&&) = default;

    //! \brief Copy assignment operator (defaulted). The trailing '&' ref-qualifier
    //!        restricts assignment to lvalue objects.
    ISafeMemAllocator& operator=(ISafeMemAllocator const&) & = default;

    //! \brief Move assignment operator (defaulted). The trailing '&' ref-qualifier
    //!        restricts assignment to lvalue objects.
    ISafeMemAllocator& operator=(ISafeMemAllocator&&) & = default;

};

} // namespace safe

} // namespace nvinfer2


#endif /* NV_INFER_SAFE_MEM_ALLOCATOR_H */

NvInferSafeRecorder.h

nvinfer2::safe::ISafeMemAllocator
Application-implemented class for controlling memory allocation on the GPU/CPU.
Definition: NvInferSafeMemAllocator.h:86

nvinfer2::safe::ISafeMemAllocator::ISafeMemAllocator
ISafeMemAllocator(ISafeMemAllocator const &)=default
Copy constructor (defaulted).

nvinfer2::safe::ISafeMemAllocator::deallocate
virtual bool deallocate(void *const memory, MemoryPlacement const flags, ISafeRecorder &recorder) noexcept=0
A thread-safe callback implemented by the application to handle release of GPU/CPU memory.

nvinfer2::safe::ISafeMemAllocator::operator=
ISafeMemAllocator & operator=(ISafeMemAllocator &&) &=default
Move assignment operator (defaulted).

nvinfer2::safe::ISafeMemAllocator::ISafeMemAllocator
ISafeMemAllocator(ISafeMemAllocator &&)=default
Move constructor (defaulted).

nvinfer2::safe::ISafeMemAllocator::operator=
ISafeMemAllocator & operator=(ISafeMemAllocator const &) &=default
Copy assignment operator (defaulted).

nvinfer2::safe::ISafeMemAllocator::~ISafeMemAllocator
virtual ~ISafeMemAllocator()=default
Destructor for ISafeMemAllocator.

nvinfer2::safe::ISafeMemAllocator::allocate
virtual void * allocate(uint64_t const size, uint64_t const alignment, MemoryPlacement const flags, MemoryUsage const usage, ISafeRecorder &recorder) noexcept=0
A thread-safe callback implemented by the application to handle acquisition of GPU/CPU memory.

nvinfer2::safe::ISafeMemAllocator::ISafeMemAllocator
ISafeMemAllocator()=default
Default constructor for ISafeMemAllocator.

nvinfer2::safe::ISafeRecorder
Interface for extended recorder which allows error, warn, debug, or info messages to be recorded.
Definition: NvInferSafeRecorder.h:77

nvinfer2::safe::MemoryUsage
MemoryUsage
Enum to describe the usage of a memory region.
Definition: NvInferSafeMemAllocator.h:67

nvinfer2::safe::MemoryUsage::kSCRATCH
@ kSCRATCH
Scratchpad memory per context used for intermediate tensors.

nvinfer2::safe::MemoryUsage::kIMMUTABLE
@ kIMMUTABLE
Memory (network weights) that is initialized once and can be shared across different graphs.

nvinfer2::safe::MemoryUsage::kIOTENSOR
@ kIOTENSOR
Memory used for IO Tensors.

nvinfer2::safe::MemoryUsage::kGENERIC
@ kGENERIC
Uncommitted memory usage.

nvinfer2::safe::MemoryPlacement
MemoryPlacement
Enum to describe the placement of the memory region.
Definition: NvInferSafeMemAllocator.h:49

nvinfer2::safe::MemoryPlacement::kMANAGED
@ kMANAGED
CUDA managed memory (not used for safety)

nvinfer2::safe::MemoryPlacement::kCPU
@ kCPU
Regular (pageable) host memory allocated via malloc or aligned_alloc.

nvinfer2::safe::MemoryPlacement::kGPU
@ kGPU
Device memory allocated via cudaMalloc.

nvinfer2::safe::MemoryPlacement::kCPU_PINNED
@ kCPU_PINNED
Page-locked host memory allocated via cudaHostAlloc, mappable to device (for zero-copy)

nvinfer2::safe::MemoryPlacement::kNONE
@ kNONE
Invalid or unspecified placement (used for error checking)

nvinfer2::safe::kMAXIMUM_ALLOC_SIZE
constexpr uint64_t kMAXIMUM_ALLOC_SIZE
Legacy constant (16 GiB) kept for TensorRT excessiveMemoryDetection test build compatibility.
Definition: NvInferSafeMemAllocator.h:42

nvinfer2
Definition: NvInferConsistency.h:30