NVIDIA DeepStream SDK API Reference

7.0 Release
tritonserver.h
Go to the documentation of this file.
1 // Copyright 2020-2024, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2 //
3 // Redistribution and use in source and binary forms, with or without
4 // modification, are permitted provided that the following conditions
5 // are met:
6 // * Redistributions of source code must retain the above copyright
7 // notice, this list of conditions and the following disclaimer.
8 // * Redistributions in binary form must reproduce the above copyright
9 // notice, this list of conditions and the following disclaimer in the
10 // documentation and/or other materials provided with the distribution.
11 // * Neither the name of NVIDIA CORPORATION nor the names of its
12 // contributors may be used to endorse or promote products derived
13 // from this software without specific prior written permission.
14 //
15 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS ``AS IS'' AND ANY
16 // EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
17 // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
18 // PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
19 // CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
20 // EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
21 // PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
22 // PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
23 // OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
24 // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
25 // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
26 #pragma once
27 
29 
30 #include <stdbool.h>
31 #include <stddef.h>
32 #include <stdint.h>
33 
34 #ifdef __cplusplus
35 extern "C" {
36 #endif
37 
38 #ifdef _COMPILING_TRITONSERVER
39 #if defined(_MSC_VER)
40 #define TRITONSERVER_DECLSPEC __declspec(dllexport)
41 #elif defined(__GNUC__)
42 #define TRITONSERVER_DECLSPEC __attribute__((__visibility__("default")))
43 #else
44 #define TRITONSERVER_DECLSPEC
45 #endif
46 #else
47 #if defined(_MSC_VER)
48 #define TRITONSERVER_DECLSPEC __declspec(dllimport)
49 #else
50 #define TRITONSERVER_DECLSPEC
51 #endif
52 #endif
53 
54 struct TRITONSERVER_BufferAttributes;
55 struct TRITONSERVER_Error;
56 struct TRITONSERVER_InferenceRequest;
57 struct TRITONSERVER_InferenceResponse;
58 struct TRITONSERVER_InferenceTrace;
59 struct TRITONSERVER_Message;
60 struct TRITONSERVER_Metrics;
61 struct TRITONSERVER_Parameter;
62 struct TRITONSERVER_ResponseAllocator;
63 struct TRITONSERVER_Server;
64 struct TRITONSERVER_ServerOptions;
65 struct TRITONSERVER_Metric;
66 struct TRITONSERVER_MetricFamily;
67 
93 #define TRITONSERVER_API_VERSION_MAJOR 1
94 #ifdef IS_TEGRA
95 #define TRITONSERVER_API_VERSION_MINOR 29
96 #else
97 #define TRITONSERVER_API_VERSION_MINOR 25
98 #endif
99 
111 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ApiVersion(
112  uint32_t* major, uint32_t* minor);
113 
135 
142  TRITONSERVER_DataType datatype);
143 
151 TRITONSERVER_StringToDataType(const char* dtype);
152 
159 TRITONSERVER_DECLSPEC uint32_t
161 
171 
179  TRITONSERVER_MemoryType memtype);
180 
189 #ifdef IS_TEGRA
190  TRITONSERVER_PARAMETER_DOUBLE,
191 #endif
194 
202  TRITONSERVER_ParameterType paramtype);
203 
214 TRITONSERVER_DECLSPEC struct TRITONSERVER_Parameter* TRITONSERVER_ParameterNew(
215  const char* name, const TRITONSERVER_ParameterType type, const void* value);
216 
227 TRITONSERVER_DECLSPEC struct TRITONSERVER_Parameter*
229  const char* name, const void* byte_ptr, const uint64_t size);
230 
235  struct TRITONSERVER_Parameter* parameter);
236 
247 
256 
267 
280 
286  TRITONSERVER_LogLevel level);
287 
295 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_LogMessage(
296  TRITONSERVER_LogLevel level, const char* filename, const int line,
297  const char* msg);
298 
309 
321 
329 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ErrorNew(
330  TRITONSERVER_Error_Code code, const char* msg);
331 
336  struct TRITONSERVER_Error* error);
337 
343 TRITONSERVER_ErrorCode(struct TRITONSERVER_Error* error);
344 
353  struct TRITONSERVER_Error* error);
354 
363  struct TRITONSERVER_Error* error);
364 
370 
401 typedef struct TRITONSERVER_Error* (*TRITONSERVER_ResponseAllocatorAllocFn_t)(
402  struct TRITONSERVER_ResponseAllocator* allocator, const char* tensor_name,
403  size_t byte_size, TRITONSERVER_MemoryType memory_type,
404  int64_t memory_type_id, void* userp, void** buffer, void** buffer_userp,
405  TRITONSERVER_MemoryType* actual_memory_type,
406  int64_t* actual_memory_type_id);
407 
430 typedef struct TRITONSERVER_Error* (
432  struct TRITONSERVER_ResponseAllocator* allocator, const char* tensor_name,
433  struct TRITONSERVER_BufferAttributes* buffer_attributes, void* userp,
434  void* buffer_userp);
435 
460 typedef struct TRITONSERVER_Error* (*TRITONSERVER_ResponseAllocatorQueryFn_t)(
461  struct TRITONSERVER_ResponseAllocator* allocator, void* userp,
462  const char* tensor_name, size_t* byte_size,
463  TRITONSERVER_MemoryType* memory_type, int64_t* memory_type_id);
464 
482 typedef struct TRITONSERVER_Error* (*TRITONSERVER_ResponseAllocatorReleaseFn_t)(
483  struct TRITONSERVER_ResponseAllocator* allocator, void* buffer,
484  void* buffer_userp, size_t byte_size, TRITONSERVER_MemoryType memory_type,
485  int64_t memory_type_id);
486 
496 typedef struct TRITONSERVER_Error* (*TRITONSERVER_ResponseAllocatorStartFn_t)(
497  struct TRITONSERVER_ResponseAllocator* allocator, void* userp);
498 
548 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
550  struct TRITONSERVER_ResponseAllocator** allocator,
554 
566 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
568  struct TRITONSERVER_ResponseAllocator* allocator,
570 
583 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
585  struct TRITONSERVER_ResponseAllocator* allocator,
587 
592 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
594  struct TRITONSERVER_ResponseAllocator* allocator);
595 
600 
607 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
609  struct TRITONSERVER_Message** message, const char* base, size_t byte_size);
610 
615 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_MessageDelete(
616  struct TRITONSERVER_Message* message);
617 
629 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
631  struct TRITONSERVER_Message* message, const char** base, size_t* byte_size);
632 
637 
642 
647 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_MetricsDelete(
648  struct TRITONSERVER_Metrics* metrics);
649 
670 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_MetricsFormatted(
671  struct TRITONSERVER_Metrics* metrics, TRITONSERVER_MetricFormat format,
672  const char** base, size_t* byte_size);
673 
678 
702 
711 
725 
734 
742  struct TRITONSERVER_InferenceTrace* trace,
743  TRITONSERVER_InferenceTraceActivity activity, uint64_t timestamp_ns,
744  void* userp);
745 
753  struct TRITONSERVER_InferenceTrace* trace,
754  TRITONSERVER_InferenceTraceActivity activity, const char* name,
755  TRITONSERVER_DataType datatype, const void* base, size_t byte_size,
756  const int64_t* shape, uint64_t dim_count,
757  TRITONSERVER_MemoryType memory_type, int64_t memory_type_id, void* userp);
758 
765  struct TRITONSERVER_InferenceTrace* trace, void* userp);
766 
790 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_InferenceTraceNew(
791  struct TRITONSERVER_InferenceTrace** trace,
792  TRITONSERVER_InferenceTraceLevel level, uint64_t parent_id,
794  TRITONSERVER_InferenceTraceReleaseFn_t release_fn, void* trace_userp);
795 
821 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
823  struct TRITONSERVER_InferenceTrace** trace,
824  TRITONSERVER_InferenceTraceLevel level, uint64_t parent_id,
827  TRITONSERVER_InferenceTraceReleaseFn_t release_fn, void* trace_userp);
828 
833 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
834 TRITONSERVER_InferenceTraceDelete(struct TRITONSERVER_InferenceTrace* trace);
835 
842 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_InferenceTraceId(
843  struct TRITONSERVER_InferenceTrace* trace, uint64_t* id);
844 
852 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
854  struct TRITONSERVER_InferenceTrace* trace, uint64_t* parent_id);
855 
864 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
866  struct TRITONSERVER_InferenceTrace* trace, const char** model_name);
867 
874 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
876  struct TRITONSERVER_InferenceTrace* trace, int64_t* model_version);
877 
886 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
888  struct TRITONSERVER_InferenceTrace* trace, const char** request_id);
889 
898 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
900  struct TRITONSERVER_InferenceTrace* trace,
901  struct TRITONSERVER_InferenceTrace** child_trace);
902 
903 #ifdef IS_TEGRA
904 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
910 TRITONSERVER_InferenceTraceSetContext(
911  struct TRITONSERVER_InferenceTrace* trace, const char* trace_context);
912 
913 
919 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
920 TRITONSERVER_InferenceTraceContext(
921  struct TRITONSERVER_InferenceTrace* trace, const char** trace_context);
922 #endif
923 
932 
938 
943 #ifdef IS_TEGRA
944  ,TRITONSERVER_REQUEST_RELEASE_RESCHEDULE = 2
945 #endif
947 
953 
984  struct TRITONSERVER_InferenceRequest* request, const uint32_t flags,
985  void* userp);
986 
1005  struct TRITONSERVER_InferenceResponse* response, const uint32_t flags,
1006  void* userp);
1007 
1017 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1019  struct TRITONSERVER_InferenceRequest** inference_request,
1020  struct TRITONSERVER_Server* server, const char* model_name,
1021  const int64_t model_version);
1022 
1027 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1029  struct TRITONSERVER_InferenceRequest* inference_request);
1030 
1038 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1040  struct TRITONSERVER_InferenceRequest* inference_request, const char** id);
1041 
1047 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1049  struct TRITONSERVER_InferenceRequest* inference_request, const char* id);
1050 
1058 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1060  struct TRITONSERVER_InferenceRequest* inference_request, uint32_t* flags);
1061 
1069 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1071  struct TRITONSERVER_InferenceRequest* inference_request, uint32_t flags);
1072 
1084 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1086  struct TRITONSERVER_InferenceRequest* inference_request,
1087  uint64_t* correlation_id);
1088 
1100 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1102  struct TRITONSERVER_InferenceRequest* inference_request,
1103  const char** correlation_id);
1104 
1114 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1116  struct TRITONSERVER_InferenceRequest* inference_request,
1117  uint64_t correlation_id);
1118 
1128 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1130  struct TRITONSERVER_InferenceRequest* inference_request,
1131  const char* correlation_id);
1132 
1143 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1145  struct TRITONSERVER_InferenceRequest* inference_request);
1146 
1156 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1158  struct TRITONSERVER_InferenceRequest* inference_request,
1159  bool* is_cancelled);
1160 
1170 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1172  struct TRITONSERVER_InferenceRequest* inference_request,
1173  uint32_t* priority);
1174 
1182 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1184  struct TRITONSERVER_InferenceRequest* inference_request,
1185  uint64_t* priority);
1186 
1196 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1198  struct TRITONSERVER_InferenceRequest* inference_request, uint32_t priority);
1199 
1207 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1209  struct TRITONSERVER_InferenceRequest* inference_request, uint64_t priority);
1210 
1217 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1219  struct TRITONSERVER_InferenceRequest* inference_request,
1220  uint64_t* timeout_us);
1221 
1228 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1230  struct TRITONSERVER_InferenceRequest* inference_request,
1231  uint64_t timeout_us);
1232 
1243 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1245  struct TRITONSERVER_InferenceRequest* inference_request, const char* name,
1246  const TRITONSERVER_DataType datatype, const int64_t* shape,
1247  uint64_t dim_count);
1248 
1259 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1261  struct TRITONSERVER_InferenceRequest* inference_request, const char* name);
1262 
1268 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1270  struct TRITONSERVER_InferenceRequest* inference_request, const char* name);
1271 
1276 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1278  struct TRITONSERVER_InferenceRequest* inference_request);
1279 
1294 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1296  struct TRITONSERVER_InferenceRequest* inference_request, const char* name,
1297  const void* base, size_t byte_size, TRITONSERVER_MemoryType memory_type,
1298  int64_t memory_type_id);
1299 
1319 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1321  struct TRITONSERVER_InferenceRequest* inference_request, const char* name,
1322  const void* base, size_t byte_size, TRITONSERVER_MemoryType memory_type,
1323  int64_t memory_type_id, const char* host_policy_name);
1324 
1337 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1339  struct TRITONSERVER_InferenceRequest* inference_request, const char* name,
1340  const void* base, struct TRITONSERVER_BufferAttributes* buffer_attributes);
1341 
1348 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1350  struct TRITONSERVER_InferenceRequest* inference_request, const char* name);
1351 
1357 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1359  struct TRITONSERVER_InferenceRequest* inference_request, const char* name);
1360 
1366 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1368  struct TRITONSERVER_InferenceRequest* inference_request, const char* name);
1369 
1374 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1376  struct TRITONSERVER_InferenceRequest* inference_request);
1377 
1388 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1390  struct TRITONSERVER_InferenceRequest* inference_request,
1391  TRITONSERVER_InferenceRequestReleaseFn_t request_release_fn,
1392  void* request_release_userp);
1393 
1414 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1416  struct TRITONSERVER_InferenceRequest* inference_request,
1417  struct TRITONSERVER_ResponseAllocator* response_allocator,
1418  void* response_allocator_userp,
1420  void* response_userp);
1421 
1428 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1430  struct TRITONSERVER_InferenceRequest* request, const char* key,
1431  const char* value);
1432 
1439 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1441  struct TRITONSERVER_InferenceRequest* request, const char* key,
1442  const int64_t value);
1443 
1450 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1452  struct TRITONSERVER_InferenceRequest* request, const char* key,
1453  const bool value);
1454 
1455 #ifdef IS_TEGRA
1456 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1463 TRITONSERVER_InferenceRequestSetDoubleParameter(
1464  struct TRITONSERVER_InferenceRequest* request, const char* key,
1465  const double value);
1466 #endif
1467 
1474 
1479 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1481  struct TRITONSERVER_InferenceResponse* inference_response);
1482 
1491 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1493  struct TRITONSERVER_InferenceResponse* inference_response);
1494 
1505 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1507  struct TRITONSERVER_InferenceResponse* inference_response,
1508  const char** model_name, int64_t* model_version);
1509 
1519 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1521  struct TRITONSERVER_InferenceResponse* inference_response,
1522  const char** request_id);
1523 
1529 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1531  struct TRITONSERVER_InferenceResponse* inference_response, uint32_t* count);
1532 
1564 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1566  struct TRITONSERVER_InferenceResponse* inference_response,
1567  const uint32_t index, const char** name, TRITONSERVER_ParameterType* type,
1568  const void** vvalue);
1569 
1575 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1577  struct TRITONSERVER_InferenceResponse* inference_response, uint32_t* count);
1578 
1601 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1603  struct TRITONSERVER_InferenceResponse* inference_response,
1604  const uint32_t index, const char** name, TRITONSERVER_DataType* datatype,
1605  const int64_t** shape, uint64_t* dim_count, const void** base,
1606  size_t* byte_size, TRITONSERVER_MemoryType* memory_type,
1607  int64_t* memory_type_id, void** userp);
1608 
1622 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1624  struct TRITONSERVER_InferenceResponse* inference_response,
1625  const uint32_t index, const size_t class_index, const char** label);
1626 
1631 
1638 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1640  struct TRITONSERVER_BufferAttributes** buffer_attributes);
1641 
1646 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1648  struct TRITONSERVER_BufferAttributes* buffer_attributes);
1649 
1656 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1658  struct TRITONSERVER_BufferAttributes* buffer_attributes,
1659  int64_t memory_type_id);
1660 
1666 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1668  struct TRITONSERVER_BufferAttributes* buffer_attributes,
1669  TRITONSERVER_MemoryType memory_type);
1670 
1677 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1679  struct TRITONSERVER_BufferAttributes* buffer_attributes,
1680  void* cuda_ipc_handle);
1681 
1687 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1689  struct TRITONSERVER_BufferAttributes* buffer_attributes, size_t byte_size);
1690 
1697 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1699  struct TRITONSERVER_BufferAttributes* buffer_attributes,
1700  int64_t* memory_type_id);
1701 
1708 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1710  struct TRITONSERVER_BufferAttributes* buffer_attributes,
1711  TRITONSERVER_MemoryType* memory_type);
1712 
1720 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1722  struct TRITONSERVER_BufferAttributes* buffer_attributes,
1723  void** cuda_ipc_handle);
1724 
1731 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1733  struct TRITONSERVER_BufferAttributes* buffer_attributes, size_t* byte_size);
1734 
1735 
1740 
1747 
1753 
1760 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ServerOptionsNew(
1761  struct TRITONSERVER_ServerOptions** options);
1762 
1767 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1768 TRITONSERVER_ServerOptionsDelete(struct TRITONSERVER_ServerOptions* options);
1769 
1776 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1778  struct TRITONSERVER_ServerOptions* options, const char* server_id);
1779 
1789 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1791  struct TRITONSERVER_ServerOptions* options,
1792  const char* model_repository_path);
1793 
1814 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1816  struct TRITONSERVER_ServerOptions* options,
1818 
1828 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1830  struct TRITONSERVER_ServerOptions* options, const char* model_name);
1831 
1839 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1841  struct TRITONSERVER_ServerOptions* options, bool strict);
1842 
1857 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1859  struct TRITONSERVER_ServerOptions* options,
1861 
1875 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1877  struct TRITONSERVER_ServerOptions* options, const char* resource_name,
1878  const size_t resource_count, const int device);
1879 
1888 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1890  struct TRITONSERVER_ServerOptions* options, uint64_t size);
1891 
1901 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1903  struct TRITONSERVER_ServerOptions* options, int gpu_device, uint64_t size);
1904 
1905 #ifdef IS_TEGRA
1906 TRITONSERVER_DECLSPEC TRITONSERVER_Error*
1914 TRITONSERVER_ServerOptionsSetCudaVirtualAddressSize(
1915  TRITONSERVER_ServerOptions* options, int gpu_device,
1916  size_t cuda_virtual_address_size);
1917 #endif
1918 
1928 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1930  struct TRITONSERVER_ServerOptions* options, uint64_t size);
1931 
1953 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1955  struct TRITONSERVER_ServerOptions* options, const char* cache_name,
1956  const char* config_json);
1957 
1964 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1966  struct TRITONSERVER_ServerOptions* options, const char* cache_dir);
1967 
1974 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1976  struct TRITONSERVER_ServerOptions* options, double cc);
1977 
1984 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1986  struct TRITONSERVER_ServerOptions* options, bool exit);
1987 
1994 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1996  struct TRITONSERVER_ServerOptions* options, bool strict);
1997 
2004 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2006  struct TRITONSERVER_ServerOptions* options, unsigned int timeout);
2007 
2013 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2015  struct TRITONSERVER_ServerOptions* options, unsigned int thread_count);
2016 
2022 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2024  struct TRITONSERVER_ServerOptions* options, unsigned int thread_count);
2025 
2026 #ifdef IS_TEGRA
2027 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2033 TRITONSERVER_ServerOptionsSetModelLoadRetryCount(
2034  struct TRITONSERVER_ServerOptions* options, unsigned int retry_count);
2035 #endif
2036 
2043 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2045  struct TRITONSERVER_ServerOptions* options, bool enable_namespace);
2046 
2054 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2056  struct TRITONSERVER_ServerOptions* options, const char* file);
2057 
2063 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2065  struct TRITONSERVER_ServerOptions* options, bool log);
2066 
2072 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2074  struct TRITONSERVER_ServerOptions* options, bool log);
2075 
2081 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2083  struct TRITONSERVER_ServerOptions* options, bool log);
2084 
2090 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2092  struct TRITONSERVER_ServerOptions* options,
2093  const TRITONSERVER_LogFormat format);
2094 
2100 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2102  struct TRITONSERVER_ServerOptions* options, int level);
2103 
2109 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2111  struct TRITONSERVER_ServerOptions* options, bool metrics);
2112 
2120 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2122  struct TRITONSERVER_ServerOptions* options, bool gpu_metrics);
2123 
2131 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2133  struct TRITONSERVER_ServerOptions* options, bool cpu_metrics);
2134 
2142 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2144  struct TRITONSERVER_ServerOptions* options, uint64_t metrics_interval_ms);
2145 
2155 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2157  struct TRITONSERVER_ServerOptions* options, const char* backend_dir);
2158 
2167 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2169  struct TRITONSERVER_ServerOptions* options, const char* repoagent_dir);
2170 
2183 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2185  struct TRITONSERVER_ServerOptions* options,
2186  const TRITONSERVER_InstanceGroupKind kind, const int device_id,
2187  const double fraction);
2188 
2197 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2199  struct TRITONSERVER_ServerOptions* options, const char* backend_name,
2200  const char* setting, const char* value);
2201 
2209 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2211  struct TRITONSERVER_ServerOptions* options, const char* policy_name,
2212  const char* setting, const char* value);
2213 
2222 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2224  struct TRITONSERVER_ServerOptions* options, const char* name,
2225  const char* setting, const char* value);
2226 
2231 
2237 
2242 
2249 
2257 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ServerNew(
2258  struct TRITONSERVER_Server** server,
2259  struct TRITONSERVER_ServerOptions* options);
2260 
2266 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ServerDelete(
2267  struct TRITONSERVER_Server* server);
2268 
2274 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ServerStop(
2275  struct TRITONSERVER_Server* server);
2276 
2285 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2287  struct TRITONSERVER_Server* server, const char* repository_path,
2288  const struct TRITONSERVER_Parameter** name_mapping,
2289  const uint32_t mapping_count);
2290 
2296 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2298  struct TRITONSERVER_Server* server, const char* repository_path);
2299 
2305 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2306 TRITONSERVER_ServerPollModelRepository(struct TRITONSERVER_Server* server);
2307 
2313 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ServerIsLive(
2314  struct TRITONSERVER_Server* server, bool* live);
2315 
2321 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ServerIsReady(
2322  struct TRITONSERVER_Server* server, bool* ready);
2323 
2333 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2335  struct TRITONSERVER_Server* server, const char* model_name,
2336  const int64_t model_version, bool* ready);
2337 
2362 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2364  struct TRITONSERVER_Server* server, const char* model_name,
2365  const int64_t model_version, uint32_t* flags, void** voidp);
2366 
2384 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2386  struct TRITONSERVER_Server* server, const char* model_name,
2387  const int64_t model_version, uint32_t* txn_flags, void** voidp);
2388 
2396 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ServerMetadata(
2397  struct TRITONSERVER_Server* server,
2398  struct TRITONSERVER_Message** server_metadata);
2399 
2411 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2413  struct TRITONSERVER_Server* server, const char* model_name,
2414  const int64_t model_version, struct TRITONSERVER_Message** model_metadata);
2415 
2428 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2430  struct TRITONSERVER_Server* server, const char* model_name,
2431  const int64_t model_version, struct TRITONSERVER_Message** model_stats);
2432 
2447 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ServerModelConfig(
2448  struct TRITONSERVER_Server* server, const char* model_name,
2449  const int64_t model_version, const uint32_t config_version,
2450  struct TRITONSERVER_Message** model_config);
2451 
2467 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ServerModelIndex(
2468  struct TRITONSERVER_Server* server, uint32_t flags,
2469  struct TRITONSERVER_Message** model_index);
2470 
2479 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ServerLoadModel(
2480  struct TRITONSERVER_Server* server, const char* model_name);
2481 
2496 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2498  struct TRITONSERVER_Server* server, const char* model_name,
2499  const struct TRITONSERVER_Parameter** parameters,
2500  const uint64_t parameter_count);
2501 
2511 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ServerUnloadModel(
2512  struct TRITONSERVER_Server* server, const char* model_name);
2513 
2525 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2527  struct TRITONSERVER_Server* server, const char* model_name);
2528 
2536 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ServerMetrics(
2537  struct TRITONSERVER_Server* server, struct TRITONSERVER_Metrics** metrics);
2538 
2560 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ServerInferAsync(
2561  struct TRITONSERVER_Server* server,
2562  struct TRITONSERVER_InferenceRequest* inference_request,
2563  struct TRITONSERVER_InferenceTrace* trace);
2564 
2573 
2585 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_MetricFamilyNew(
2586  struct TRITONSERVER_MetricFamily** family,
2587  const TRITONSERVER_MetricKind kind, const char* name,
2588  const char* description);
2589 
2597 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2598 TRITONSERVER_MetricFamilyDelete(struct TRITONSERVER_MetricFamily* family);
2599 
2612 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_MetricNew(
2613  struct TRITONSERVER_Metric** metric,
2614  struct TRITONSERVER_MetricFamily* family,
2615  const struct TRITONSERVER_Parameter** labels, const uint64_t label_count);
2616 
2624 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_MetricDelete(
2625  struct TRITONSERVER_Metric* metric);
2626 
2635 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_MetricValue(
2636  struct TRITONSERVER_Metric* metric, double* value);
2637 
2648 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_MetricIncrement(
2649  struct TRITONSERVER_Metric* metric, double value);
2650 
2658 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_MetricSet(
2659  struct TRITONSERVER_Metric* metric, double value);
2660 
2666 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_GetMetricKind(
2667  struct TRITONSERVER_Metric* metric, TRITONSERVER_MetricKind* kind);
2668 
2669 #ifdef __cplusplus
2670 }
2671 #endif
TRITONSERVER_InferenceTraceReleaseFn_t
void(* TRITONSERVER_InferenceTraceReleaseFn_t)(struct TRITONSERVER_InferenceTrace *trace, void *userp)
Type for trace release callback function.
Definition: tritonserver.h:764
TRITONSERVER_InferenceRequestSetTimeoutMicroseconds
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestSetTimeoutMicroseconds(struct TRITONSERVER_InferenceRequest *inference_request, uint64_t timeout_us)
Set the timeout for a request, in microseconds.
TRITONSERVER_TYPE_INT64
@ TRITONSERVER_TYPE_INT64
Definition: tritonserver.h:128
tritonserver_traceactivity_enum
tritonserver_traceactivity_enum
Trace activities.
Definition: tritonserver.h:713
TRITONSERVER_ResponseAllocatorReleaseFn_t
struct TRITONSERVER_Error *(* TRITONSERVER_ResponseAllocatorReleaseFn_t)(struct TRITONSERVER_ResponseAllocator *allocator, void *buffer, void *buffer_userp, size_t byte_size, TRITONSERVER_MemoryType memory_type, int64_t memory_type_id)
Type for function that is called when the server no longer holds any reference to a buffer allocated ...
Definition: tritonserver.h:482
TRITONSERVER_InferenceTraceLevelString
const TRITONSERVER_DECLSPEC char * TRITONSERVER_InferenceTraceLevelString(TRITONSERVER_InferenceTraceLevel level)
Get the string representation of a trace level.
TRITONSERVER_TYPE_BF16
@ TRITONSERVER_TYPE_BF16
Definition: tritonserver.h:133
TRITONSERVER_ServerOptionsSetModelLoadDeviceLimit
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetModelLoadDeviceLimit(struct TRITONSERVER_ServerOptions *options, const TRITONSERVER_InstanceGroupKind kind, const int device_id, const double fraction)
Specify the limit on memory usage as a fraction on the device identified by 'kind' and 'device_id'.
TRITONSERVER_InferenceTraceLevel
enum tritonserver_tracelevel_enum TRITONSERVER_InferenceTraceLevel
TRITONSERVER_InferenceTrace: trace levels that can be selected for an inference trace.
TRITONSERVER_TRACE_LEVEL_DISABLED
@ TRITONSERVER_TRACE_LEVEL_DISABLED
Tracing disabled. No trace activities are reported.
Definition: tritonserver.h:692
TRITONSERVER_logformat_enum
TRITONSERVER_logformat_enum
Format of logging.
Definition: tritonserver.h:276
TRITONSERVER_InferenceTraceSpawnChildTrace
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceTraceSpawnChildTrace(struct TRITONSERVER_InferenceTrace *trace, struct TRITONSERVER_InferenceTrace **child_trace)
Get the child trace, spawned from the parent trace.
tritonserver_responsecompleteflag_enum
tritonserver_responsecompleteflag_enum
Inference response complete flags.
Definition: tritonserver.h:950
TRITONSERVER_ErrorMessage
const TRITONSERVER_DECLSPEC char * TRITONSERVER_ErrorMessage(struct TRITONSERVER_Error *error)
Get the error message.
TRITONSERVER_ResponseAllocatorAllocFn_t
struct TRITONSERVER_Error *(* TRITONSERVER_ResponseAllocatorAllocFn_t)(struct TRITONSERVER_ResponseAllocator *allocator, const char *tensor_name, size_t byte_size, TRITONSERVER_MemoryType memory_type, int64_t memory_type_id, void *userp, void **buffer, void **buffer_userp, TRITONSERVER_MemoryType *actual_memory_type, int64_t *actual_memory_type_id)
TRITONSERVER_ResponseAllocator.
Definition: tritonserver.h:401
TRITONSERVER_BufferAttributesSetMemoryType
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_BufferAttributesSetMemoryType(struct TRITONSERVER_BufferAttributes *buffer_attributes, TRITONSERVER_MemoryType memory_type)
Set the memory type field of the buffer attributes.
TRITONSERVER_ServerOptionsSetCpuMetrics
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetCpuMetrics(struct TRITONSERVER_ServerOptions *options, bool cpu_metrics)
Enable or disable CPU metrics collection in a server options.
TRITONSERVER_MEMORY_CPU
@ TRITONSERVER_MEMORY_CPU
Definition: tritonserver.h:167
TRITONSERVER_PARAMETER_BYTES
@ TRITONSERVER_PARAMETER_BYTES
Definition: tritonserver.h:192
TRITONSERVER_LOG_ISO8601
@ TRITONSERVER_LOG_ISO8601
Definition: tritonserver.h:278
TRITONSERVER_InferenceTraceModelVersion
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceTraceModelVersion(struct TRITONSERVER_InferenceTrace *trace, int64_t *model_version)
Get the version of the model associated with a trace.
TRITONSERVER_ApiVersion
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ApiVersion(uint32_t *major, uint32_t *minor)
Get the TRITONSERVER API version supported by the Triton shared library.
TRITONSERVER_InferenceRequestRemoveInput
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestRemoveInput(struct TRITONSERVER_InferenceRequest *inference_request, const char *name)
Remove an input from a request.
TRITONSERVER_LOG_DEFAULT
@ TRITONSERVER_LOG_DEFAULT
Definition: tritonserver.h:277
TRITONSERVER_TYPE_UINT16
@ TRITONSERVER_TYPE_UINT16
Definition: tritonserver.h:122
TRITONSERVER_InferenceResponseParameter
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceResponseParameter(struct TRITONSERVER_InferenceResponse *inference_response, const uint32_t index, const char **name, TRITONSERVER_ParameterType *type, const void **vvalue)
Get all information about a parameter.
TRITONSERVER_TYPE_INT16
@ TRITONSERVER_TYPE_INT16
Definition: tritonserver.h:126
TRITONSERVER_ResponseAllocatorStartFn_t
struct TRITONSERVER_Error *(* TRITONSERVER_ResponseAllocatorStartFn_t)(struct TRITONSERVER_ResponseAllocator *allocator, void *userp)
Type for function that is called to indicate that subsequent allocation requests will refer to a new ...
Definition: tritonserver.h:496
TRITONSERVER_TRACE_QUEUE_START
@ TRITONSERVER_TRACE_QUEUE_START
Definition: tritonserver.h:715
TRITONSERVER_TYPE_UINT64
@ TRITONSERVER_TYPE_UINT64
Definition: tritonserver.h:124
TRITONSERVER_MetricNew
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MetricNew(struct TRITONSERVER_Metric **metric, struct TRITONSERVER_MetricFamily *family, const struct TRITONSERVER_Parameter **labels, const uint64_t label_count)
Create a new metric object.
TRITONSERVER_ServerOptionsSetStrictReadiness
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetStrictReadiness(struct TRITONSERVER_ServerOptions *options, bool strict)
Enable or disable strict readiness handling in a server options.
TRITONSERVER_metrickind_enum
TRITONSERVER_metrickind_enum
TRITONSERVER_MetricKind.
Definition: tritonserver.h:2569
TRITONSERVER_ERROR_CANCELLED
@ TRITONSERVER_ERROR_CANCELLED
Definition: tritonserver.h:319
TRITONSERVER_ModelControlMode
enum tritonserver_modelcontrolmode_enum TRITONSERVER_ModelControlMode
TRITONSERVER_ServerOptions.
TRITONSERVER_RATE_LIMIT_OFF
@ TRITONSERVER_RATE_LIMIT_OFF
Definition: tritonserver.h:1750
TRITONSERVER_InferenceResponseId
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceResponseId(struct TRITONSERVER_InferenceResponse *inference_response, const char **request_id)
Get the ID of the request corresponding to a response.
TRITONSERVER_ERROR_NOT_FOUND
@ TRITONSERVER_ERROR_NOT_FOUND
Definition: tritonserver.h:314
TRITONSERVER_ResponseAllocatorDelete
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ResponseAllocatorDelete(struct TRITONSERVER_ResponseAllocator *allocator)
Delete a response allocator.
TRITONSERVER_InferenceRequestCorrelationIdString
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestCorrelationIdString(struct TRITONSERVER_InferenceRequest *inference_request, const char **correlation_id)
Get the correlation ID of the inference request as a string.
TRITONSERVER_ServerOptionsSetHostPolicy
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetHostPolicy(struct TRITONSERVER_ServerOptions *options, const char *policy_name, const char *setting, const char *value)
Set a host policy setting for a given policy name in a server options.
TRITONSERVER_InferenceResponseError
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceResponseError(struct TRITONSERVER_InferenceResponse *inference_response)
Return the error status of an inference response.
TRITONSERVER_InferenceRequestSetIntParameter
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestSetIntParameter(struct TRITONSERVER_InferenceRequest *request, const char *key, const int64_t value)
Set an integer parameter in the request.
TRITONSERVER_ServerOptionsNew
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsNew(struct TRITONSERVER_ServerOptions **options)
Create a new server options object.
TRITONSERVER_MetricFamilyDelete
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MetricFamilyDelete(struct TRITONSERVER_MetricFamily *family)
Delete a metric family object.
TRITONSERVER_TRACE_COMPUTE_END
@ TRITONSERVER_TRACE_COMPUTE_END
Definition: tritonserver.h:719
TRITONSERVER_MetricsDelete
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MetricsDelete(struct TRITONSERVER_Metrics *metrics)
Delete a metrics object.
TRITONSERVER_LOG_VERBOSE
@ TRITONSERVER_LOG_VERBOSE
Definition: tritonserver.h:265
TRITONSERVER_InferenceTraceModelName
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceTraceModelName(struct TRITONSERVER_InferenceTrace *trace, const char **model_name)
Get the name of the model associated with a trace.
TRITONSERVER_ServerModelIsReady
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerModelIsReady(struct TRITONSERVER_Server *server, const char *model_name, const int64_t model_version, bool *ready)
Is the model ready?
TRITONSERVER_MemoryType
enum TRITONSERVER_memorytype_enum TRITONSERVER_MemoryType
TRITONSERVER_MemoryType.
TRITONSERVER_TRACE_TENSOR_QUEUE_INPUT
@ TRITONSERVER_TRACE_TENSOR_QUEUE_INPUT
Definition: tritonserver.h:721
TRITONSERVER_DataTypeByteSize
TRITONSERVER_DECLSPEC uint32_t TRITONSERVER_DataTypeByteSize(TRITONSERVER_DataType datatype)
Get the size of a Triton datatype in bytes.
TRITONSERVER_BATCH_UNKNOWN
@ TRITONSERVER_BATCH_UNKNOWN
Definition: tritonserver.h:2234
TRITONSERVER_BufferAttributesSetMemoryTypeId
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_BufferAttributesSetMemoryTypeId(struct TRITONSERVER_BufferAttributes *buffer_attributes, int64_t memory_type_id)
Set the memory type id field of the buffer attributes.
TRITONSERVER_InferenceRequestTimeoutMicroseconds
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestTimeoutMicroseconds(struct TRITONSERVER_InferenceRequest *inference_request, uint64_t *timeout_us)
Get the timeout for a request, in microseconds.
TRITONSERVER_ServerOptionsSetPinnedMemoryPoolByteSize
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetPinnedMemoryPoolByteSize(struct TRITONSERVER_ServerOptions *options, uint64_t size)
Set the total pinned memory byte size that the server can allocate in a server options.
TRITONSERVER_METRIC_PROMETHEUS
@ TRITONSERVER_METRIC_PROMETHEUS
Definition: tritonserver.h:640
TRITONSERVER_REQUEST_FLAG_SEQUENCE_END
@ TRITONSERVER_REQUEST_FLAG_SEQUENCE_END
Definition: tritonserver.h:936
TRITONSERVER_ServerOptionsAddRateLimiterResource
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsAddRateLimiterResource(struct TRITONSERVER_ServerOptions *options, const char *resource_name, const size_t resource_count, const int device)
Add resource count for rate limiting.
TRITONSERVER_ServerIsLive
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerIsLive(struct TRITONSERVER_Server *server, bool *live)
Is the server live?
TRITONSERVER_MODEL_CONTROL_POLL
@ TRITONSERVER_MODEL_CONTROL_POLL
Definition: tritonserver.h:1744
TRITONSERVER_TRACE_COMPUTE_INPUT_END
@ TRITONSERVER_TRACE_COMPUTE_INPUT_END
Definition: tritonserver.h:717
TRITONSERVER_InferenceRequestRemoveRequestedOutput
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestRemoveRequestedOutput(struct TRITONSERVER_InferenceRequest *inference_request, const char *name)
Remove an output request from an inference request.
TRITONSERVER_TXN_DECOUPLED
@ TRITONSERVER_TXN_DECOUPLED
Definition: tritonserver.h:2247
TRITONSERVER_ServerOptionsSetGpuMetrics
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetGpuMetrics(struct TRITONSERVER_ServerOptions *options, bool gpu_metrics)
Enable or disable GPU metrics collection in a server options.
TRITONSERVER_ERROR_UNKNOWN
@ TRITONSERVER_ERROR_UNKNOWN
Definition: tritonserver.h:312
TRITONSERVER_ErrorNew
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ErrorNew(TRITONSERVER_Error_Code code, const char *msg)
Create a new error object.
TRITONSERVER_InferenceTraceActivityString
const TRITONSERVER_DECLSPEC char * TRITONSERVER_InferenceTraceActivityString(TRITONSERVER_InferenceTraceActivity activity)
Get the string representation of a trace activity.
TRITONSERVER_MetricKind
enum TRITONSERVER_metrickind_enum TRITONSERVER_MetricKind
TRITONSERVER_MetricKind.
TRITONSERVER_TRACE_LEVEL_TIMESTAMPS
@ TRITONSERVER_TRACE_LEVEL_TIMESTAMPS
Record timestamps for the inference request.
Definition: tritonserver.h:698
TRITONSERVER_ServerModelBatchProperties
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerModelBatchProperties(struct TRITONSERVER_Server *server, const char *model_name, const int64_t model_version, uint32_t *flags, void **voidp)
Get the batch properties of the model.
TRITONSERVER_InferenceRequestAddRawInput
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestAddRawInput(struct TRITONSERVER_InferenceRequest *inference_request, const char *name)
Add a raw input to a request.
TRITONSERVER_InferenceResponseDelete
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceResponseDelete(struct TRITONSERVER_InferenceResponse *inference_response)
TRITONSERVER_InferenceResponse.
TRITONSERVER_InferenceTraceNew
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceTraceNew(struct TRITONSERVER_InferenceTrace **trace, TRITONSERVER_InferenceTraceLevel level, uint64_t parent_id, TRITONSERVER_InferenceTraceActivityFn_t activity_fn, TRITONSERVER_InferenceTraceReleaseFn_t release_fn, void *trace_userp)
Create a new inference trace object.
TRITONSERVER_ServerModelStatistics
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerModelStatistics(struct TRITONSERVER_Server *server, const char *model_name, const int64_t model_version, struct TRITONSERVER_Message **model_stats)
Get the statistics of a model as a TRITONSERVER_Message object.
TRITONSERVER_PARAMETER_INT
@ TRITONSERVER_PARAMETER_INT
Definition: tritonserver.h:187
TRITONSERVER_BufferAttributesByteSize
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_BufferAttributesByteSize(struct TRITONSERVER_BufferAttributes *buffer_attributes, size_t *byte_size)
Get the byte size field of the buffer attributes.
TRITONSERVER_MemoryTypeString
const TRITONSERVER_DECLSPEC char * TRITONSERVER_MemoryTypeString(TRITONSERVER_MemoryType memtype)
Get the string representation of a memory type.
TRITONSERVER_ServerOptionsSetBackendConfig
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetBackendConfig(struct TRITONSERVER_ServerOptions *options, const char *backend_name, const char *setting, const char *value)
Set a configuration setting for a named backend in a server options.
TRITONSERVER_ERROR_ALREADY_EXISTS
@ TRITONSERVER_ERROR_ALREADY_EXISTS
Definition: tritonserver.h:318
TRITONSERVER_ResponseAllocatorBufferAttributesFn_t
struct TRITONSERVER_Error *(* TRITONSERVER_ResponseAllocatorBufferAttributesFn_t)(struct TRITONSERVER_ResponseAllocator *allocator, const char *tensor_name, struct TRITONSERVER_BufferAttributes *buffer_attributes, void *userp, void *buffer_userp)
Type for allocation function that allocates a buffer to hold an output tensor with buffer attributes.
Definition: tritonserver.h:431
tritonserver_modelindexflag_enum
tritonserver_modelindexflag_enum
Model index flags. The enum values must be power-of-2 values.
Definition: tritonserver.h:2239
TRITONSERVER_REQUEST_FLAG_SEQUENCE_START
@ TRITONSERVER_REQUEST_FLAG_SEQUENCE_START
Definition: tritonserver.h:935
TRITONSERVER_DECLSPEC
#define TRITONSERVER_DECLSPEC
Definition: tritonserver.h:50
TRITONSERVER_InferenceRequestSetCorrelationId
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestSetCorrelationId(struct TRITONSERVER_InferenceRequest *inference_request, uint64_t correlation_id)
Set the correlation ID of the inference request to be an unsigned integer.
TRITONSERVER_ParameterDelete
TRITONSERVER_DECLSPEC void TRITONSERVER_ParameterDelete(struct TRITONSERVER_Parameter *parameter)
Delete a parameter object.
TRITONSERVER_TRACE_LEVEL_TENSORS
@ TRITONSERVER_TRACE_LEVEL_TENSORS
Record input and output tensor values for the inference request.
Definition: tritonserver.h:700
TRITONSERVER_RequestReleaseFlag
enum tritonserver_requestreleaseflag_enum TRITONSERVER_RequestReleaseFlag
Inference request release flags.
TRITONSERVER_METRIC_KIND_GAUGE
@ TRITONSERVER_METRIC_KIND_GAUGE
Definition: tritonserver.h:2571
TRITONSERVER_LOG_INFO
@ TRITONSERVER_LOG_INFO
Definition: tritonserver.h:262
TRITONSERVER_TYPE_INT8
@ TRITONSERVER_TYPE_INT8
Definition: tritonserver.h:125
TRITONSERVER_InferenceTraceTensorActivityFn_t
void(* TRITONSERVER_InferenceTraceTensorActivityFn_t)(struct TRITONSERVER_InferenceTrace *trace, TRITONSERVER_InferenceTraceActivity activity, const char *name, TRITONSERVER_DataType datatype, const void *base, size_t byte_size, const int64_t *shape, uint64_t dim_count, TRITONSERVER_MemoryType memory_type, int64_t memory_type_id, void *userp)
Type for trace tensor activity callback function.
Definition: tritonserver.h:752
TRITONSERVER_ServerIsReady
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerIsReady(struct TRITONSERVER_Server *server, bool *ready)
Is the server ready?
TRITONSERVER_ServerOptionsSetMetrics
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetMetrics(struct TRITONSERVER_ServerOptions *options, bool metrics)
Enable or disable metrics collection in a server options.
TRITONSERVER_BufferAttributesSetByteSize
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_BufferAttributesSetByteSize(struct TRITONSERVER_BufferAttributes *buffer_attributes, size_t byte_size)
Set the byte size field of the buffer attributes.
TRITONSERVER_ServerOptionsSetLogError
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetLogError(struct TRITONSERVER_ServerOptions *options, bool log)
Enable or disable error level logging.
TRITONSERVER_TYPE_BYTES
@ TRITONSERVER_TYPE_BYTES
Definition: tritonserver.h:132
TRITONSERVER_BufferAttributesMemoryTypeId
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_BufferAttributesMemoryTypeId(struct TRITONSERVER_BufferAttributes *buffer_attributes, int64_t *memory_type_id)
Get the memory type id field of the buffer attributes.
TRITONSERVER_ResponseAllocatorSetQueryFunction
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ResponseAllocatorSetQueryFunction(struct TRITONSERVER_ResponseAllocator *allocator, TRITONSERVER_ResponseAllocatorQueryFn_t query_fn)
Set the query function to a response allocator object.
TRITONSERVER_InferenceRequestAppendInputData
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestAppendInputData(struct TRITONSERVER_InferenceRequest *inference_request, const char *name, const void *base, size_t byte_size, TRITONSERVER_MemoryType memory_type, int64_t memory_type_id)
Assign a buffer of data to an input.
TRITONSERVER_ServerOptionsSetLogInfo
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetLogInfo(struct TRITONSERVER_ServerOptions *options, bool log)
Enable or disable info level logging.
TRITONSERVER_MetricSet
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MetricSet(struct TRITONSERVER_Metric *metric, double value)
Set the current value of metric to value.
TRITONSERVER_ServerUnloadModel
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerUnloadModel(struct TRITONSERVER_Server *server, const char *model_name)
Unload the requested model.
TRITONSERVER_INSTANCEGROUPKIND_MODEL
@ TRITONSERVER_INSTANCEGROUPKIND_MODEL
Definition: tritonserver.h:245
TRITONSERVER_InferenceRequestDelete
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestDelete(struct TRITONSERVER_InferenceRequest *inference_request)
Delete an inference request object.
TRITONSERVER_BufferAttributesNew
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_BufferAttributesNew(struct TRITONSERVER_BufferAttributes **buffer_attributes)
TRITONSERVER_BufferAttributes.
TRITONSERVER_InferenceRequestSetPriority
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestSetPriority(struct TRITONSERVER_InferenceRequest *inference_request, uint32_t priority)
Deprecated.
TRITONSERVER_MetricDelete
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MetricDelete(struct TRITONSERVER_Metric *metric)
Delete a metric object.
TRITONSERVER_Error_Code
enum TRITONSERVER_errorcode_enum TRITONSERVER_Error_Code
TRITONSERVER_Error.
TRITONSERVER_StringToDataType
TRITONSERVER_DECLSPEC TRITONSERVER_DataType TRITONSERVER_StringToDataType(const char *dtype)
Get the Triton datatype corresponding to a string representation of a datatype.
TRITONSERVER_LogFormat
enum TRITONSERVER_logformat_enum TRITONSERVER_LogFormat
Format of logging.
TRITONSERVER_ErrorCodeString
const TRITONSERVER_DECLSPEC char * TRITONSERVER_ErrorCodeString(struct TRITONSERVER_Error *error)
Get the string representation of an error code.
TRITONSERVER_REQUEST_RELEASE_ALL
@ TRITONSERVER_REQUEST_RELEASE_ALL
Definition: tritonserver.h:942
TRITONSERVER_ServerOptionsSetCudaMemoryPoolByteSize
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetCudaMemoryPoolByteSize(struct TRITONSERVER_ServerOptions *options, int gpu_device, uint64_t size)
Set the total CUDA memory byte size that the server can allocate on given GPU device in a server opti...
TRITONSERVER_ServerOptionsSetModelControlMode
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetModelControlMode(struct TRITONSERVER_ServerOptions *options, TRITONSERVER_ModelControlMode mode)
Set the model control mode in a server options.
TRITONSERVER_DataTypeString
const TRITONSERVER_DECLSPEC char * TRITONSERVER_DataTypeString(TRITONSERVER_DataType datatype)
Get the string representation of a data type.
TRITONSERVER_METRIC_KIND_COUNTER
@ TRITONSERVER_METRIC_KIND_COUNTER
Definition: tritonserver.h:2570
TRITONSERVER_ServerOptionsDelete
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsDelete(struct TRITONSERVER_ServerOptions *options)
Delete a server options object.
TRITONSERVER_TXN_ONE_TO_ONE
@ TRITONSERVER_TXN_ONE_TO_ONE
Definition: tritonserver.h:2246
TRITONSERVER_errorcode_enum
TRITONSERVER_errorcode_enum
TRITONSERVER_Error.
Definition: tritonserver.h:311
TRITONSERVER_RATE_LIMIT_EXEC_COUNT
@ TRITONSERVER_RATE_LIMIT_EXEC_COUNT
Definition: tritonserver.h:1751
TRITONSERVER_BufferAttributesMemoryType
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_BufferAttributesMemoryType(struct TRITONSERVER_BufferAttributes *buffer_attributes, TRITONSERVER_MemoryType *memory_type)
Get the memory type field of the buffer attributes.
TRITONSERVER_ServerStop
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerStop(struct TRITONSERVER_Server *server)
Stop a server object.
TRITONSERVER_InferenceResponseCompleteFn_t
void(* TRITONSERVER_InferenceResponseCompleteFn_t)(struct TRITONSERVER_InferenceResponse *response, const uint32_t flags, void *userp)
Type for callback function indicating that an inference response has completed.
Definition: tritonserver.h:1004
TRITONSERVER_MetricIncrement
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MetricIncrement(struct TRITONSERVER_Metric *metric, double value)
Increment the current value of metric by value.
TRITONSERVER_INDEX_FLAG_READY
@ TRITONSERVER_INDEX_FLAG_READY
Definition: tritonserver.h:2240
TRITONSERVER_ModelTxnPropertyFlag
enum tritonserver_txn_property_flag_enum TRITONSERVER_ModelTxnPropertyFlag
Model transaction policy flags.
TRITONSERVER_ParameterTypeString
const TRITONSERVER_DECLSPEC char * TRITONSERVER_ParameterTypeString(TRITONSERVER_ParameterType paramtype)
Get the string representation of a parameter type.
TRITONSERVER_InferenceRequestSetBoolParameter
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestSetBoolParameter(struct TRITONSERVER_InferenceRequest *request, const char *key, const bool value)
Set a boolean parameter in the request.
TRITONSERVER_ServerOptionsSetMetricsConfig
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetMetricsConfig(struct TRITONSERVER_ServerOptions *options, const char *name, const char *setting, const char *value)
Set a configuration setting for metrics in server options.
TRITONSERVER_InferenceRequestAppendInputDataWithBufferAttributes
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestAppendInputDataWithBufferAttributes(struct TRITONSERVER_InferenceRequest *inference_request, const char *name, const void *base, struct TRITONSERVER_BufferAttributes *buffer_attributes)
Assign a buffer of data to an input.
TRITONSERVER_memorytype_enum
TRITONSERVER_memorytype_enum
TRITONSERVER_MemoryType.
Definition: tritonserver.h:166
TRITONSERVER_TYPE_FP16
@ TRITONSERVER_TYPE_FP16
Definition: tritonserver.h:129
TRITONSERVER_TRACE_REQUEST_END
@ TRITONSERVER_TRACE_REQUEST_END
Definition: tritonserver.h:720
TRITONSERVER_ServerRegisterModelRepository
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerRegisterModelRepository(struct TRITONSERVER_Server *server, const char *repository_path, const struct TRITONSERVER_Parameter **name_mapping, const uint32_t mapping_count)
Register a new model repository.
TRITONSERVER_RequestFlag
enum tritonserver_requestflag_enum TRITONSERVER_RequestFlag
TRITONSERVER_InferenceRequest.
TRITONSERVER_InferenceTraceActivity
enum tritonserver_traceactivity_enum TRITONSERVER_InferenceTraceActivity
Trace activities.
TRITONSERVER_MessageSerializeToJson
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MessageSerializeToJson(struct TRITONSERVER_Message *message, const char **base, size_t *byte_size)
Get the base and size of the buffer containing the serialized message in JSON format.
TRITONSERVER_ServerModelMetadata
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerModelMetadata(struct TRITONSERVER_Server *server, const char *model_name, const int64_t model_version, struct TRITONSERVER_Message **model_metadata)
Get the metadata of a model as a TRITONSERVER_Message object.
TRITONSERVER_ServerOptionsSetBackendDirectory
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetBackendDirectory(struct TRITONSERVER_ServerOptions *options, const char *backend_dir)
Set the directory containing backend shared libraries.
TRITONSERVER_ERROR_INTERNAL
@ TRITONSERVER_ERROR_INTERNAL
Definition: tritonserver.h:313
TRITONSERVER_MODEL_CONTROL_NONE
@ TRITONSERVER_MODEL_CONTROL_NONE
Definition: tritonserver.h:1743
TRITONSERVER_InferenceRequestCancel
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestCancel(struct TRITONSERVER_InferenceRequest *inference_request)
Cancel an inference request.
TRITONSERVER_MODEL_CONTROL_EXPLICIT
@ TRITONSERVER_MODEL_CONTROL_EXPLICIT
Definition: tritonserver.h:1745
TRITONSERVER_ServerOptionsSetLogWarn
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetLogWarn(struct TRITONSERVER_ServerOptions *options, bool log)
Enable or disable warning level logging.
TRITONSERVER_ResponseAllocatorQueryFn_t
struct TRITONSERVER_Error *(* TRITONSERVER_ResponseAllocatorQueryFn_t)(struct TRITONSERVER_ResponseAllocator *allocator, void *userp, const char *tensor_name, size_t *byte_size, TRITONSERVER_MemoryType *memory_type, int64_t *memory_type_id)
Type for function that is called to query the allocator's preferred memory type and memory type ID.
Definition: tritonserver.h:460
TRITONSERVER_ParameterType
enum TRITONSERVER_parametertype_enum TRITONSERVER_ParameterType
TRITONSERVER_ParameterType.
TRITONSERVER_GetMetricKind
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_GetMetricKind(struct TRITONSERVER_Metric *metric, TRITONSERVER_MetricKind *kind)
Get the TRITONSERVER_MetricKind of metric and its corresponding family.
TRITONSERVER_InferenceRequestRemoveAllInputData
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestRemoveAllInputData(struct TRITONSERVER_InferenceRequest *inference_request, const char *name)
Clear all input data from an input, releasing ownership of the buffer(s) that were appended to the in...
tritonserver_tracelevel_enum
tritonserver_tracelevel_enum
TRITONSERVER_InferenceTrace.
Definition: tritonserver.h:690
TRITONSERVER_parametertype_enum
TRITONSERVER_parametertype_enum
TRITONSERVER_ParameterType.
Definition: tritonserver.h:185
TRITONSERVER_TYPE_INVALID
@ TRITONSERVER_TYPE_INVALID
Definition: tritonserver.h:119
TRITONSERVER_PARAMETER_STRING
@ TRITONSERVER_PARAMETER_STRING
Definition: tritonserver.h:186
TRITONSERVER_TYPE_FP64
@ TRITONSERVER_TYPE_FP64
Definition: tritonserver.h:131
TRITONSERVER_ServerMetadata
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerMetadata(struct TRITONSERVER_Server *server, struct TRITONSERVER_Message **server_metadata)
Get the metadata of the server as a TRITONSERVER_Message object.
TRITONSERVER_ServerNew
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerNew(struct TRITONSERVER_Server **server, struct TRITONSERVER_ServerOptions *options)
Create a new server object.
TRITONSERVER_MetricValue
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MetricValue(struct TRITONSERVER_Metric *metric, double *value)
Get the current value of a metric object.
TRITONSERVER_InferenceResponseModel
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceResponseModel(struct TRITONSERVER_InferenceResponse *inference_response, const char **model_name, int64_t *model_version)
Get model used to produce a response.
TRITONSERVER_InferenceTraceActivityFn_t
void(* TRITONSERVER_InferenceTraceActivityFn_t)(struct TRITONSERVER_InferenceTrace *trace, TRITONSERVER_InferenceTraceActivity activity, uint64_t timestamp_ns, void *userp)
Type for trace timeline activity callback function.
Definition: tritonserver.h:741
TRITONSERVER_LogLevel
enum TRITONSERVER_loglevel_enum TRITONSERVER_LogLevel
TRITONSERVER_Logging.
tritonserver_txn_property_flag_enum
tritonserver_txn_property_flag_enum
Model transaction policy flags.
Definition: tritonserver.h:2245
TRITONSERVER_InferenceRequestSetFlags
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestSetFlags(struct TRITONSERVER_InferenceRequest *inference_request, uint32_t flags)
Set the flag(s) associated with a request.
TRITONSERVER_MessageNewFromSerializedJson
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MessageNewFromSerializedJson(struct TRITONSERVER_Message **message, const char *base, size_t byte_size)
TRITONSERVER_Message.
TRITONSERVER_MessageDelete
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MessageDelete(struct TRITONSERVER_Message *message)
Delete a message object.
TRITONSERVER_InferenceRequestSetId
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestSetId(struct TRITONSERVER_InferenceRequest *inference_request, const char *id)
Set the ID for a request.
TRITONSERVER_DataType
enum TRITONSERVER_datatype_enum TRITONSERVER_DataType
TRITONSERVER_DataType.
TRITONSERVER_BufferAttributesDelete
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_BufferAttributesDelete(struct TRITONSERVER_BufferAttributes *buffer_attributes)
Delete a buffer attributes object.
TRITONSERVER_ResponseAllocatorSetBufferAttributesFunction
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ResponseAllocatorSetBufferAttributesFunction(struct TRITONSERVER_ResponseAllocator *allocator, TRITONSERVER_ResponseAllocatorBufferAttributesFn_t buffer_attributes_fn)
Set the buffer attributes function for a response allocator object.
TRITONSERVER_TRACE_COMPUTE_START
@ TRITONSERVER_TRACE_COMPUTE_START
Definition: tritonserver.h:716
tritonserver_batchflag_enum
tritonserver_batchflag_enum
TRITONSERVER_Server.
Definition: tritonserver.h:2233
TRITONSERVER_ERROR_INVALID_ARG
@ TRITONSERVER_ERROR_INVALID_ARG
Definition: tritonserver.h:315
TRITONSERVER_TYPE_BOOL
@ TRITONSERVER_TYPE_BOOL
Definition: tritonserver.h:120
TRITONSERVER_ServerPollModelRepository
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerPollModelRepository(struct TRITONSERVER_Server *server)
Check the model repository for changes and update server state based on those changes.
TRITONSERVER_MEMORY_CPU_PINNED
@ TRITONSERVER_MEMORY_CPU_PINNED
Definition: tritonserver.h:168
TRITONSERVER_ResponseCompleteFlag
enum tritonserver_responsecompleteflag_enum TRITONSERVER_ResponseCompleteFlag
Inference response complete flags.
TRITONSERVER_ServerUnloadModelAndDependents
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerUnloadModelAndDependents(struct TRITONSERVER_Server *server, const char *model_name)
Unload the requested model, and also unload any dependent model that was loaded along with the reques...
TRITONSERVER_InferenceRequestSetStringParameter
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestSetStringParameter(struct TRITONSERVER_InferenceRequest *request, const char *key, const char *value)
Set a string parameter in the request.
TRITONSERVER_TRACE_TENSOR_BACKEND_OUTPUT
@ TRITONSERVER_TRACE_TENSOR_BACKEND_OUTPUT
Definition: tritonserver.h:723
TRITONSERVER_MetricsFormatted
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MetricsFormatted(struct TRITONSERVER_Metrics *metrics, TRITONSERVER_MetricFormat format, const char **base, size_t *byte_size)
Get a buffer containing the metrics in the specified format.
TRITONSERVER_ErrorDelete
TRITONSERVER_DECLSPEC void TRITONSERVER_ErrorDelete(struct TRITONSERVER_Error *error)
Delete an error object.
TRITONSERVER_ServerLoadModel
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerLoadModel(struct TRITONSERVER_Server *server, const char *model_name)
Load the requested model or reload the model if it is already loaded.
TRITONSERVER_TYPE_UINT8
@ TRITONSERVER_TYPE_UINT8
Definition: tritonserver.h:121
TRITONSERVER_ServerOptionsSetMinSupportedComputeCapability
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetMinSupportedComputeCapability(struct TRITONSERVER_ServerOptions *options, double cc)
Set the minimum supported CUDA compute capability in a server options.
TRITONSERVER_ServerOptionsSetModelRepositoryPath
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetModelRepositoryPath(struct TRITONSERVER_ServerOptions *options, const char *model_repository_path)
Set the model repository path in a server options.
TRITONSERVER_TYPE_INT32
@ TRITONSERVER_TYPE_INT32
Definition: tritonserver.h:127
TRITONSERVER_ServerOptionsSetStrictModelConfig
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetStrictModelConfig(struct TRITONSERVER_ServerOptions *options, bool strict)
Enable or disable strict model configuration handling in a server options.
TRITONSERVER_ParameterBytesNew
TRITONSERVER_DECLSPEC struct TRITONSERVER_Parameter * TRITONSERVER_ParameterBytesNew(const char *name, const void *byte_ptr, const uint64_t size)
Create a new parameter object with type TRITONSERVER_PARAMETER_BYTES.
eMode::strict
@ strict
TRITONSERVER_LogMessage
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_LogMessage(TRITONSERVER_LogLevel level, const char *filename, const int line, const char *msg)
Log a message at a given log level if that level is enabled.
TRITONSERVER_ServerOptionsSetExitOnError
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetExitOnError(struct TRITONSERVER_ServerOptions *options, bool exit)
Enable or disable exit-on-error in a server options.
TRITONSERVER_ServerUnregisterModelRepository
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerUnregisterModelRepository(struct TRITONSERVER_Server *server, const char *repository_path)
Unregister a model repository.
TRITONSERVER_InferenceRequestId
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestId(struct TRITONSERVER_InferenceRequest *inference_request, const char **id)
Get the ID for a request.
TRITONSERVER_InferenceRequestAppendInputDataWithHostPolicy
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestAppendInputDataWithHostPolicy(struct TRITONSERVER_InferenceRequest *inference_request, const char *name, const void *base, size_t byte_size, TRITONSERVER_MemoryType memory_type, int64_t memory_type_id, const char *host_policy_name)
Assign a buffer of data to an input for execution on all model instances with the specified host policy.
TRITONSERVER_InferenceResponseOutputClassificationLabel
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceResponseOutputClassificationLabel(struct TRITONSERVER_InferenceResponse *inference_response, const uint32_t index, const size_t class_index, const char **label)
Get a classification label associated with an output for a given index.
TRITONSERVER_TRACE_LEVEL_MIN
@ TRITONSERVER_TRACE_LEVEL_MIN
Deprecated. Use TRITONSERVER_TRACE_LEVEL_TIMESTAMPS.
Definition: tritonserver.h:694
TRITONSERVER_ServerOptionsSetBufferManagerThreadCount
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetBufferManagerThreadCount(struct TRITONSERVER_ServerOptions *options, unsigned int thread_count)
Set the number of threads used in buffer manager in a server options.
TRITONSERVER_InferenceTraceTensorNew
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceTraceTensorNew(struct TRITONSERVER_InferenceTrace **trace, TRITONSERVER_InferenceTraceLevel level, uint64_t parent_id, TRITONSERVER_InferenceTraceActivityFn_t activity_fn, TRITONSERVER_InferenceTraceTensorActivityFn_t tensor_activity_fn, TRITONSERVER_InferenceTraceReleaseFn_t release_fn, void *trace_userp)
Create a new inference trace object.
TRITONSERVER_InferenceRequestPriorityUInt64
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestPriorityUInt64(struct TRITONSERVER_InferenceRequest *inference_request, uint64_t *priority)
Get the priority for a request.
TRITONSERVER_InferenceRequestSetPriorityUInt64
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestSetPriorityUInt64(struct TRITONSERVER_InferenceRequest *inference_request, uint64_t priority)
Set the priority for a request.
TRITONSERVER_ServerModelTransactionProperties
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerModelTransactionProperties(struct TRITONSERVER_Server *server, const char *model_name, const int64_t model_version, uint32_t *txn_flags, void **voidp)
Get the transaction policy of the model.
TRITONSERVER_ServerModelIndex
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerModelIndex(struct TRITONSERVER_Server *server, uint32_t flags, struct TRITONSERVER_Message **model_index)
Get the index of all unique models in the model repositories as a TRITONSERVER_Message object.
TRITONSERVER_ResponseAllocatorNew
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ResponseAllocatorNew(struct TRITONSERVER_ResponseAllocator **allocator, TRITONSERVER_ResponseAllocatorAllocFn_t alloc_fn, TRITONSERVER_ResponseAllocatorReleaseFn_t release_fn, TRITONSERVER_ResponseAllocatorStartFn_t start_fn)
Create a new response allocator object.
TRITONSERVER_ERROR_UNAVAILABLE
@ TRITONSERVER_ERROR_UNAVAILABLE
Definition: tritonserver.h:316
TRITONSERVER_INSTANCEGROUPKIND_AUTO
@ TRITONSERVER_INSTANCEGROUPKIND_AUTO
Definition: tritonserver.h:242
TRITONSERVER_ServerLoadModelWithParameters
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerLoadModelWithParameters(struct TRITONSERVER_Server *server, const char *model_name, const struct TRITONSERVER_Parameter **parameters, const uint64_t parameter_count)
Load the requested model or reload the model if it is already loaded, with load parameters provided.
TRITONSERVER_InferenceResponseOutputCount
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceResponseOutputCount(struct TRITONSERVER_InferenceResponse *inference_response, uint32_t *count)
Get the number of outputs available in the response.
TRITONSERVER_InferenceResponseOutput
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceResponseOutput(struct TRITONSERVER_InferenceResponse *inference_response, const uint32_t index, const char **name, TRITONSERVER_DataType *datatype, const int64_t **shape, uint64_t *dim_count, const void **base, size_t *byte_size, TRITONSERVER_MemoryType *memory_type, int64_t *memory_type_id, void **userp)
Get all information about an output tensor.
TRITONSERVER_ServerInferAsync
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerInferAsync(struct TRITONSERVER_Server *server, struct TRITONSERVER_InferenceRequest *inference_request, struct TRITONSERVER_InferenceTrace *trace)
Perform inference using the meta-data and inputs supplied by the 'inference_request'.
TRITONSERVER_TYPE_FP32
@ TRITONSERVER_TYPE_FP32
Definition: tritonserver.h:130
TRITONSERVER_ServerOptionsSetCacheDirectory
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetCacheDirectory(struct TRITONSERVER_ServerOptions *options, const char *cache_dir)
Set the directory containing cache shared libraries.
TRITONSERVER_instancegroupkind_enum
TRITONSERVER_instancegroupkind_enum
TRITONSERVER_InstanceGroupKind.
Definition: tritonserver.h:241
tritonserver_modelcontrolmode_enum
tritonserver_modelcontrolmode_enum
TRITONSERVER_ServerOptions.
Definition: tritonserver.h:1742
TRITONSERVER_TRACE_TENSOR_BACKEND_INPUT
@ TRITONSERVER_TRACE_TENSOR_BACKEND_INPUT
Definition: tritonserver.h:722
TRITONSERVER_ServerOptionsSetExitTimeout
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetExitTimeout(struct TRITONSERVER_ServerOptions *options, unsigned int timeout)
Set the exit timeout, in seconds, for the server in a server options.
TRITONSERVER_loglevel_enum
TRITONSERVER_loglevel_enum
TRITONSERVER_Logging.
Definition: tritonserver.h:261
TRITONSERVER_InferenceRequestSetReleaseCallback
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestSetReleaseCallback(struct TRITONSERVER_InferenceRequest *inference_request, TRITONSERVER_InferenceRequestReleaseFn_t request_release_fn, void *request_release_userp)
Set the release callback for an inference request.
TRITONSERVER_ERROR_UNSUPPORTED
@ TRITONSERVER_ERROR_UNSUPPORTED
Definition: tritonserver.h:317
TRITONSERVER_ServerOptionsSetResponseCacheByteSize
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetResponseCacheByteSize(struct TRITONSERVER_ServerOptions *options, uint64_t size)
Deprecated.
TRITONSERVER_InstanceGroupKindString
const TRITONSERVER_DECLSPEC char * TRITONSERVER_InstanceGroupKindString(TRITONSERVER_InstanceGroupKind kind)
Get the string representation of an instance-group kind.
TRITONSERVER_RateLimitMode
enum tritonserver_ratelimitmode_enum TRITONSERVER_RateLimitMode
Rate limit modes.
TRITONSERVER_InferenceTraceId
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceTraceId(struct TRITONSERVER_InferenceTrace *trace, uint64_t *id)
Get the id associated with a trace.
TRITONSERVER_LOG_ERROR
@ TRITONSERVER_LOG_ERROR
Definition: tritonserver.h:264
TRITONSERVER_InferenceRequestAddRequestedOutput
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestAddRequestedOutput(struct TRITONSERVER_InferenceRequest *inference_request, const char *name)
Add an output request to an inference request.
TRITONSERVER_MetricFormat
enum tritonserver_metricformat_enum TRITONSERVER_MetricFormat
TRITONSERVER_Metrics.
TRITONSERVER_TRACE_COMPUTE_OUTPUT_START
@ TRITONSERVER_TRACE_COMPUTE_OUTPUT_START
Definition: tritonserver.h:718
TRITONSERVER_InferenceRequestIsCancelled
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestIsCancelled(struct TRITONSERVER_InferenceRequest *inference_request, bool *is_cancelled)
Query whether the request is cancelled or not.
TRITONSERVER_InferenceRequestPriority
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestPriority(struct TRITONSERVER_InferenceRequest *inference_request, uint32_t *priority)
Deprecated.
TRITONSERVER_RESPONSE_COMPLETE_FINAL
@ TRITONSERVER_RESPONSE_COMPLETE_FINAL
Definition: tritonserver.h:951
TRITONSERVER_InferenceTraceDelete
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceTraceDelete(struct TRITONSERVER_InferenceTrace *trace)
Delete a trace object.
TRITONSERVER_InferenceRequestReleaseFn_t
void(* TRITONSERVER_InferenceRequestReleaseFn_t)(struct TRITONSERVER_InferenceRequest *request, const uint32_t flags, void *userp)
Type for inference request release callback function.
Definition: tritonserver.h:983
TRITONSERVER_LOG_WARN
@ TRITONSERVER_LOG_WARN
Definition: tritonserver.h:263
TRITONSERVER_datatype_enum
TRITONSERVER_datatype_enum
TRITONSERVER_DataType.
Definition: tritonserver.h:118
tritonserver_metricformat_enum
tritonserver_metricformat_enum
TRITONSERVER_Metrics.
Definition: tritonserver.h:639
TRITONSERVER_ParameterNew
TRITONSERVER_DECLSPEC struct TRITONSERVER_Parameter * TRITONSERVER_ParameterNew(const char *name, const TRITONSERVER_ParameterType type, const void *value)
Create a new parameter object.
TRITONSERVER_INSTANCEGROUPKIND_GPU
@ TRITONSERVER_INSTANCEGROUPKIND_GPU
Definition: tritonserver.h:244
TRITONSERVER_InstanceGroupKind
enum TRITONSERVER_instancegroupkind_enum TRITONSERVER_InstanceGroupKind
TRITONSERVER_InstanceGroupKind.
TRITONSERVER_LogIsEnabled
TRITONSERVER_DECLSPEC bool TRITONSERVER_LogIsEnabled(TRITONSERVER_LogLevel level)
Is a log level enabled?
tritonserver_requestflag_enum
tritonserver_requestflag_enum
TRITONSERVER_InferenceRequest.
Definition: tritonserver.h:934
TRITONSERVER_ServerOptionsSetRateLimiterMode
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetRateLimiterMode(struct TRITONSERVER_ServerOptions *options, TRITONSERVER_RateLimitMode mode)
Set the rate limit mode in a server options.
TRITONSERVER_ServerOptionsSetRepoAgentDirectory
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetRepoAgentDirectory(struct TRITONSERVER_ServerOptions *options, const char *repoagent_dir)
Set the directory containing repository agent shared libraries.
TRITONSERVER_TYPE_UINT32
@ TRITONSERVER_TYPE_UINT32
Definition: tritonserver.h:123
TRITONSERVER_InferenceRequestFlags
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestFlags(struct TRITONSERVER_InferenceRequest *inference_request, uint32_t *flags)
Get the flag(s) associated with a request.
TRITONSERVER_ServerModelConfig
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerModelConfig(struct TRITONSERVER_Server *server, const char *model_name, const int64_t model_version, const uint32_t config_version, struct TRITONSERVER_Message **model_config)
Get the configuration of a model as a TRITONSERVER_Message object.
TRITONSERVER_InferenceRequestNew
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestNew(struct TRITONSERVER_InferenceRequest **inference_request, struct TRITONSERVER_Server *server, const char *model_name, const int64_t model_version)
Create a new inference request object.
TRITONSERVER_MetricFamilyNew
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MetricFamilyNew(struct TRITONSERVER_MetricFamily **family, const TRITONSERVER_MetricKind kind, const char *name, const char *description)
Create a new metric family object.
TRITONSERVER_ServerMetrics
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerMetrics(struct TRITONSERVER_Server *server, struct TRITONSERVER_Metrics **metrics)
Get the current metrics for the server.
TRITONSERVER_InferenceRequestAddInput
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestAddInput(struct TRITONSERVER_InferenceRequest *inference_request, const char *name, const TRITONSERVER_DataType datatype, const int64_t *shape, uint64_t dim_count)
Add an input to a request.
TRITONSERVER_ServerOptionsSetServerId
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetServerId(struct TRITONSERVER_ServerOptions *options, const char *server_id)
Set the textual ID for the server in a server options.
TRITONSERVER_ServerDelete
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerDelete(struct TRITONSERVER_Server *server)
Delete a server object.
TRITONSERVER_ModelIndexFlag
enum tritonserver_modelindexflag_enum TRITONSERVER_ModelIndexFlag
Model index flags. The enum values must be power-of-2 values.
TRITONSERVER_TRACE_LEVEL_MAX
@ TRITONSERVER_TRACE_LEVEL_MAX
Deprecated. Use TRITONSERVER_TRACE_LEVEL_TIMESTAMPS.
Definition: tritonserver.h:696
TRITONSERVER_BufferAttributesSetCudaIpcHandle
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_BufferAttributesSetCudaIpcHandle(struct TRITONSERVER_BufferAttributes *buffer_attributes, void *cuda_ipc_handle)
Set the CudaIpcHandle field of the buffer attributes.
TRITONSERVER_TRACE_REQUEST_START
@ TRITONSERVER_TRACE_REQUEST_START
Definition: tritonserver.h:714
TRITONSERVER_ServerOptionsSetLogFile
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetLogFile(struct TRITONSERVER_ServerOptions *options, const char *file)
Provide a log output file.
TRITONSERVER_ServerOptionsSetStartupModel
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetStartupModel(struct TRITONSERVER_ServerOptions *options, const char *model_name)
Set the model to be loaded at startup in a server options.
TRITONSERVER_PARAMETER_BOOL
@ TRITONSERVER_PARAMETER_BOOL
Definition: tritonserver.h:188
TRITONSERVER_InferenceResponseParameterCount
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceResponseParameterCount(struct TRITONSERVER_InferenceResponse *inference_response, uint32_t *count)
Get the number of parameters available in the response.
TRITONSERVER_ServerOptionsSetMetricsInterval
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetMetricsInterval(struct TRITONSERVER_ServerOptions *options, uint64_t metrics_interval_ms)
Set the interval for metrics collection in a server options.
TRITONSERVER_BufferAttributesCudaIpcHandle
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_BufferAttributesCudaIpcHandle(struct TRITONSERVER_BufferAttributes *buffer_attributes, void **cuda_ipc_handle)
Get the CudaIpcHandle field of the buffer attributes object.
TRITONSERVER_InferenceRequestRemoveAllRequestedOutputs
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestRemoveAllRequestedOutputs(struct TRITONSERVER_InferenceRequest *inference_request)
Remove all output requests from an inference request.
TRITONSERVER_ModelBatchFlag
enum tritonserver_batchflag_enum TRITONSERVER_ModelBatchFlag
TRITONSERVER_Server.
TRITONSERVER_ErrorCode
TRITONSERVER_DECLSPEC TRITONSERVER_Error_Code TRITONSERVER_ErrorCode(struct TRITONSERVER_Error *error)
Get the error code.
TRITONSERVER_InferenceRequestCorrelationId
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestCorrelationId(struct TRITONSERVER_InferenceRequest *inference_request, uint64_t *correlation_id)
Get the correlation ID of the inference request as an unsigned integer.
TRITONSERVER_MEMORY_GPU
@ TRITONSERVER_MEMORY_GPU
Definition: tritonserver.h:169
TRITONSERVER_ServerOptionsSetLogVerbose
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetLogVerbose(struct TRITONSERVER_ServerOptions *options, int level)
Set verbose logging level.
tritonserver_requestreleaseflag_enum
tritonserver_requestreleaseflag_enum
Inference request release flags.
Definition: tritonserver.h:941
TRITONSERVER_InferenceTraceRequestId
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceTraceRequestId(struct TRITONSERVER_InferenceTrace *trace, const char **request_id)
Get the request id associated with a trace.
TRITONSERVER_InferenceTraceParentId
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceTraceParentId(struct TRITONSERVER_InferenceTrace *trace, uint64_t *parent_id)
Get the parent id associated with a trace.
TRITONSERVER_ServerOptionsSetCacheConfig
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetCacheConfig(struct TRITONSERVER_ServerOptions *options, const char *cache_name, const char *config_json)
Set the cache config that will be used to initialize the cache implementation for "cache_name".
TRITONSERVER_InferenceRequestSetCorrelationIdString
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestSetCorrelationIdString(struct TRITONSERVER_InferenceRequest *inference_request, const char *correlation_id)
Set the correlation ID of the inference request to be a string.
tritonserver_ratelimitmode_enum
tritonserver_ratelimitmode_enum
Rate limit modes.
Definition: tritonserver.h:1749
TRITONSERVER_BATCH_FIRST_DIM
@ TRITONSERVER_BATCH_FIRST_DIM
Definition: tritonserver.h:2235
TRITONSERVER_ServerOptionsSetLogFormat
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetLogFormat(struct TRITONSERVER_ServerOptions *options, const TRITONSERVER_LogFormat format)
Set the logging format.
TRITONSERVER_InferenceRequestSetResponseCallback
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestSetResponseCallback(struct TRITONSERVER_InferenceRequest *inference_request, struct TRITONSERVER_ResponseAllocator *response_allocator, void *response_allocator_userp, TRITONSERVER_InferenceResponseCompleteFn_t response_fn, void *response_userp)
Set the allocator and response callback for an inference request.
TRITONSERVER_INSTANCEGROUPKIND_CPU
@ TRITONSERVER_INSTANCEGROUPKIND_CPU
Definition: tritonserver.h:243
TRITONSERVER_ServerOptionsSetModelNamespacing
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetModelNamespacing(struct TRITONSERVER_ServerOptions *options, bool enable_namespace)
Enable model namespacing to allow serving models with the same name if they are in different namespaces.
TRITONSERVER_InferenceRequestRemoveAllInputs
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestRemoveAllInputs(struct TRITONSERVER_InferenceRequest *inference_request)
Remove all inputs from a request.
TRITONSERVER_ServerOptionsSetModelLoadThreadCount
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetModelLoadThreadCount(struct TRITONSERVER_ServerOptions *options, unsigned int thread_count)
Set the number of threads to concurrently load models in a server options.