Go to the source code of this file.
|
| void * | nvds_triton_client_create (const char *url, const char *model_name, int batch_size, const char *onnx_model) |
| | Create TensorRT encoder client. More...
|
| |
| void | nvds_triton_client_destroy (void *client) |
| | Destroy TensorRT encoder client. More...
|
| |
| int | nvds_triton_client_get_input_size (void *client, unsigned int *width, unsigned int *height) |
| | Get input dimensions from encoder. More...
|
| |
| int | nvds_triton_client_get_embedding_dim (void *client) |
| | Get embedding dimension from encoder. More...
|
| |
| unsigned int | nvds_triton_client_get_input_width (void *client) |
| | Get input width. More...
|
| |
| unsigned int | nvds_triton_client_get_input_height (void *client) |
| | Get input height. More...
|
| |
| int | nvds_triton_client_infer (void *client, float *input_data, int num_images, float *output_embeddings) |
| | Run inference on host input data. More...
|
| |
| int | nvds_triton_client_infer_device (void *client, float *d_input_data, int num_images, float *output_embeddings) |
| | Run inference on device input data (GPU path) More...
|
| |
◆ nvds_triton_client_create()
| void* nvds_triton_client_create |
( |
const char * |
url, |
|
|
const char * |
model_name, |
|
|
int |
batch_size, |
|
|
const char * |
onnx_model |
|
) |
| |
Create TensorRT encoder client.
- Parameters
-
| url | Engine path (if contains .plan/.engine) or Triton URL (fallback) |
| model_name | Model name for path construction |
| batch_size | Batch size for engine building |
| onnx_model | Path to ONNX model for building engine if not found |
- Returns
- Opaque handle to encoder, or NULL on failure
◆ nvds_triton_client_destroy()
| void nvds_triton_client_destroy |
( |
void * |
client | ) |
|
Destroy TensorRT encoder client.
- Parameters
-
| client | Opaque handle from nvds_triton_client_create |
◆ nvds_triton_client_get_embedding_dim()
| int nvds_triton_client_get_embedding_dim |
( |
void * |
client | ) |
|
Get embedding dimension from encoder.
- Parameters
-
- Returns
- Embedding dimension, or 0 on failure
◆ nvds_triton_client_get_input_height()
| unsigned int nvds_triton_client_get_input_height |
( |
void * |
client | ) |
|
Get input height.
- Parameters
-
- Returns
- Input height, or 0 on failure
◆ nvds_triton_client_get_input_size()
| int nvds_triton_client_get_input_size |
( |
void * |
client, |
|
|
unsigned int * |
width, |
|
|
unsigned int * |
height |
|
) |
| |
Get input dimensions from encoder.
- Parameters
-
| client | Opaque handle |
| width | Output: input width |
| height | Output: input height |
- Returns
- 0 on success, -1 on failure
◆ nvds_triton_client_get_input_width()
| unsigned int nvds_triton_client_get_input_width |
( |
void * |
client | ) |
|
Get input width.
- Parameters
-
- Returns
- Input width, or 0 on failure
◆ nvds_triton_client_infer()
| int nvds_triton_client_infer |
( |
void * |
client, |
|
|
float * |
input_data, |
|
|
int |
num_images, |
|
|
float * |
output_embeddings |
|
) |
| |
Run inference on host input data.
- Parameters
-
| client | Opaque handle |
| input_data | Host pointer to input tensor [N, C, H, W] |
| num_images | Number of images in batch |
| output_embeddings | Host pointer for output [N, embedding_dim] |
- Returns
- 0 on success, -1 on failure
◆ nvds_triton_client_infer_device()
| int nvds_triton_client_infer_device |
( |
void * |
client, |
|
|
float * |
d_input_data, |
|
|
int |
num_images, |
|
|
float * |
output_embeddings |
|
) |
| |
Run inference on device input data (GPU path)
- Parameters
-
| client | Opaque handle |
| d_input_data | Device pointer to input tensor [N, C, H, W] |
| num_images | Number of images in batch |
| output_embeddings | Host pointer for output [N, embedding_dim] |
- Returns
- 0 on success, -1 on failure