NVIDIA DeepStream SDK API Reference

9.0 Release
9.0/sources/gst-plugins/gst-nvdsvisionencoder-c/trt_encoder.h File Reference

Go to the source code of this file.

Functions

void * nvds_triton_client_create (const char *url, const char *model_name, int batch_size, const char *onnx_model)
 Create TensorRT encoder client. More...
 
void nvds_triton_client_destroy (void *client)
 Destroy TensorRT encoder client. More...
 
int nvds_triton_client_get_input_size (void *client, unsigned int *width, unsigned int *height)
 Get input dimensions from encoder. More...
 
int nvds_triton_client_get_embedding_dim (void *client)
 Get embedding dimension from encoder. More...
 
unsigned int nvds_triton_client_get_input_width (void *client)
 Get input width. More...
 
unsigned int nvds_triton_client_get_input_height (void *client)
 Get input height. More...
 
int nvds_triton_client_infer (void *client, float *input_data, int num_images, float *output_embeddings)
 Run inference on host input data. More...
 
int nvds_triton_client_infer_device (void *client, float *d_input_data, int num_images, float *output_embeddings)
 Run inference on device input data (GPU path) More...
 

Function Documentation

◆ nvds_triton_client_create()

void* nvds_triton_client_create ( const char *  url,
const char *  model_name,
int  batch_size,
const char *  onnx_model 
)

Create TensorRT encoder client.

Parameters
urlEngine path (if contains .plan/.engine) or Triton URL (fallback)
model_nameModel name for path construction
batch_sizeBatch size for engine building
onnx_modelPath to ONNX model for building engine if not found
Returns
Opaque handle to encoder, or NULL on failure

◆ nvds_triton_client_destroy()

void nvds_triton_client_destroy ( void *  client)

Destroy TensorRT encoder client.

Parameters
clientOpaque handle from nvds_triton_client_create

◆ nvds_triton_client_get_embedding_dim()

int nvds_triton_client_get_embedding_dim ( void *  client)

Get embedding dimension from encoder.

Parameters
clientOpaque handle
Returns
Embedding dimension, or 0 on failure

◆ nvds_triton_client_get_input_height()

unsigned int nvds_triton_client_get_input_height ( void *  client)

Get input height.

Parameters
clientOpaque handle
Returns
Input height, or 0 on failure

◆ nvds_triton_client_get_input_size()

int nvds_triton_client_get_input_size ( void *  client,
unsigned int *  width,
unsigned int *  height 
)

Get input dimensions from encoder.

Parameters
clientOpaque handle
widthOutput: input width
heightOutput: input height
Returns
0 on success, -1 on failure

◆ nvds_triton_client_get_input_width()

unsigned int nvds_triton_client_get_input_width ( void *  client)

Get input width.

Parameters
clientOpaque handle
Returns
Input width, or 0 on failure

◆ nvds_triton_client_infer()

int nvds_triton_client_infer ( void *  client,
float *  input_data,
int  num_images,
float *  output_embeddings 
)

Run inference on host input data.

Parameters
clientOpaque handle
input_dataHost pointer to input tensor [N, C, H, W]
num_imagesNumber of images in batch
output_embeddingsHost pointer for output [N, embedding_dim]
Returns
0 on success, -1 on failure

◆ nvds_triton_client_infer_device()

int nvds_triton_client_infer_device ( void *  client,
float *  d_input_data,
int  num_images,
float *  output_embeddings 
)

Run inference on device input data (GPU path)

Parameters
clientOpaque handle
d_input_dataDevice pointer to input tensor [N, C, H, W]
num_imagesNumber of images in batch
output_embeddingsHost pointer for output [N, embedding_dim]
Returns
0 on success, -1 on failure