NVIDIA DeepStream SDK API Reference

7.1 Release
tritonserver.h
Go to the documentation of this file.
1 // Copyright 2020-2024, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2 //
3 // Redistribution and use in source and binary forms, with or without
4 // modification, are permitted provided that the following conditions
5 // are met:
6 // * Redistributions of source code must retain the above copyright
7 // notice, this list of conditions and the following disclaimer.
8 // * Redistributions in binary form must reproduce the above copyright
9 // notice, this list of conditions and the following disclaimer in the
10 // documentation and/or other materials provided with the distribution.
11 // * Neither the name of NVIDIA CORPORATION nor the names of its
12 // contributors may be used to endorse or promote products derived
13 // from this software without specific prior written permission.
14 //
15 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS ``AS IS'' AND ANY
16 // EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
17 // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
18 // PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
19 // CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
20 // EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
21 // PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
22 // PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
23 // OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
24 // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
25 // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
26 #pragma once
27 
29 
30 #include <stdbool.h>
31 #include <stddef.h>
32 #include <stdint.h>
33 
34 #ifdef __cplusplus
35 extern "C" {
36 #endif
37 
38 #ifdef _COMPILING_TRITONSERVER
39 #if defined(_MSC_VER)
40 #define TRITONSERVER_DECLSPEC __declspec(dllexport)
41 #elif defined(__GNUC__)
42 #define TRITONSERVER_DECLSPEC __attribute__((__visibility__("default")))
43 #else
44 #define TRITONSERVER_DECLSPEC
45 #endif
46 #else
47 #if defined(_MSC_VER)
48 #define TRITONSERVER_DECLSPEC __declspec(dllimport)
49 #else
50 #define TRITONSERVER_DECLSPEC
51 #endif
52 #endif
53 
54 struct TRITONSERVER_BufferAttributes;
55 struct TRITONSERVER_Error;
56 struct TRITONSERVER_InferenceRequest;
57 struct TRITONSERVER_InferenceResponse;
58 struct TRITONSERVER_InferenceTrace;
59 struct TRITONSERVER_Message;
60 struct TRITONSERVER_Metrics;
61 struct TRITONSERVER_Parameter;
62 struct TRITONSERVER_ResponseAllocator;
63 struct TRITONSERVER_Server;
64 struct TRITONSERVER_ServerOptions;
65 struct TRITONSERVER_Metric;
66 struct TRITONSERVER_MetricFamily;
67 struct TRITONSERVER_MetricArgs;
68 
94 #define TRITONSERVER_API_VERSION_MAJOR 1
95 #define TRITONSERVER_API_VERSION_MINOR 34
96 
108 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ApiVersion(
109  uint32_t* major, uint32_t* minor);
110 
132 
139  TRITONSERVER_DataType datatype);
140 
148 TRITONSERVER_StringToDataType(const char* dtype);
149 
156 TRITONSERVER_DECLSPEC uint32_t
158 
168 
176  TRITONSERVER_MemoryType memtype);
177 
189 
197  TRITONSERVER_ParameterType paramtype);
198 
209 TRITONSERVER_DECLSPEC struct TRITONSERVER_Parameter* TRITONSERVER_ParameterNew(
210  const char* name, const TRITONSERVER_ParameterType type, const void* value);
211 
222 TRITONSERVER_DECLSPEC struct TRITONSERVER_Parameter*
224  const char* name, const void* byte_ptr, const uint64_t size);
225 
230  struct TRITONSERVER_Parameter* parameter);
231 
242 
251 
262 
293 
299  TRITONSERVER_LogLevel level);
300 
308 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_LogMessage(
309  TRITONSERVER_LogLevel level, const char* filename, const int line,
310  const char* msg);
311 
322 
334 
342 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ErrorNew(
343  TRITONSERVER_Error_Code code, const char* msg);
344 
349  struct TRITONSERVER_Error* error);
350 
356 TRITONSERVER_ErrorCode(struct TRITONSERVER_Error* error);
357 
366  struct TRITONSERVER_Error* error);
367 
376  struct TRITONSERVER_Error* error);
377 
383 
414 typedef struct TRITONSERVER_Error* (*TRITONSERVER_ResponseAllocatorAllocFn_t)(
415  struct TRITONSERVER_ResponseAllocator* allocator, const char* tensor_name,
416  size_t byte_size, TRITONSERVER_MemoryType memory_type,
417  int64_t memory_type_id, void* userp, void** buffer, void** buffer_userp,
418  TRITONSERVER_MemoryType* actual_memory_type,
419  int64_t* actual_memory_type_id);
420 
443 typedef struct TRITONSERVER_Error* (
445  struct TRITONSERVER_ResponseAllocator* allocator, const char* tensor_name,
446  struct TRITONSERVER_BufferAttributes* buffer_attributes, void* userp,
447  void* buffer_userp);
448 
473 typedef struct TRITONSERVER_Error* (*TRITONSERVER_ResponseAllocatorQueryFn_t)(
474  struct TRITONSERVER_ResponseAllocator* allocator, void* userp,
475  const char* tensor_name, size_t* byte_size,
476  TRITONSERVER_MemoryType* memory_type, int64_t* memory_type_id);
477 
495 typedef struct TRITONSERVER_Error* (*TRITONSERVER_ResponseAllocatorReleaseFn_t)(
496  struct TRITONSERVER_ResponseAllocator* allocator, void* buffer,
497  void* buffer_userp, size_t byte_size, TRITONSERVER_MemoryType memory_type,
498  int64_t memory_type_id);
499 
509 typedef struct TRITONSERVER_Error* (*TRITONSERVER_ResponseAllocatorStartFn_t)(
510  struct TRITONSERVER_ResponseAllocator* allocator, void* userp);
511 
561 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
563  struct TRITONSERVER_ResponseAllocator** allocator,
567 
579 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
581  struct TRITONSERVER_ResponseAllocator* allocator,
583 
596 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
598  struct TRITONSERVER_ResponseAllocator* allocator,
600 
605 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
607  struct TRITONSERVER_ResponseAllocator* allocator);
608 
613 
620 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
622  struct TRITONSERVER_Message** message, const char* base, size_t byte_size);
623 
628 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_MessageDelete(
629  struct TRITONSERVER_Message* message);
630 
642 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
644  struct TRITONSERVER_Message* message, const char** base, size_t* byte_size);
645 
650 
655 
660 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_MetricsDelete(
661  struct TRITONSERVER_Metrics* metrics);
662 
683 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_MetricsFormatted(
684  struct TRITONSERVER_Metrics* metrics, TRITONSERVER_MetricFormat format,
685  const char** base, size_t* byte_size);
686 
691 
715 
724 
739 
748 
756  struct TRITONSERVER_InferenceTrace* trace,
757  TRITONSERVER_InferenceTraceActivity activity, uint64_t timestamp_ns,
758  void* userp);
759 
767  struct TRITONSERVER_InferenceTrace* trace,
768  TRITONSERVER_InferenceTraceActivity activity, const char* name,
769  TRITONSERVER_DataType datatype, const void* base, size_t byte_size,
770  const int64_t* shape, uint64_t dim_count,
771  TRITONSERVER_MemoryType memory_type, int64_t memory_type_id, void* userp);
772 
778 typedef void (*TRITONSERVER_InferenceTraceReleaseFn_t)(
779  struct TRITONSERVER_InferenceTrace* trace, void* userp);
780 
804 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_InferenceTraceNew(
805  struct TRITONSERVER_InferenceTrace** trace,
806  TRITONSERVER_InferenceTraceLevel level, uint64_t parent_id,
808  TRITONSERVER_InferenceTraceReleaseFn_t release_fn, void* trace_userp);
809 
835 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
837  struct TRITONSERVER_InferenceTrace** trace,
838  TRITONSERVER_InferenceTraceLevel level, uint64_t parent_id,
841  TRITONSERVER_InferenceTraceReleaseFn_t release_fn, void* trace_userp);
842 
850 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
852  struct TRITONSERVER_InferenceTrace* trace, uint64_t timestamp,
853  const char* activity_name);
854 
859 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
860 TRITONSERVER_InferenceTraceDelete(struct TRITONSERVER_InferenceTrace* trace);
861 
868 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_InferenceTraceId(
869  struct TRITONSERVER_InferenceTrace* trace, uint64_t* id);
870 
878 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
880  struct TRITONSERVER_InferenceTrace* trace, uint64_t* parent_id);
881 
890 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
892  struct TRITONSERVER_InferenceTrace* trace, const char** model_name);
893 
900 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
902  struct TRITONSERVER_InferenceTrace* trace, int64_t* model_version);
903 
912 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
914  struct TRITONSERVER_InferenceTrace* trace, const char** request_id);
915 
924 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
925 TRITONSERVER_InferenceTraceSpawnChildTrace(
926  struct TRITONSERVER_InferenceTrace* trace,
927  struct TRITONSERVER_InferenceTrace** child_trace);
928 
934 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
936  struct TRITONSERVER_InferenceTrace* trace, const char* trace_context);
937 
943 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
945  struct TRITONSERVER_InferenceTrace* trace, const char** trace_context);
946 
955 
961 
968 
974 
1005  struct TRITONSERVER_InferenceRequest* request, const uint32_t flags,
1006  void* userp);
1007 
1026  struct TRITONSERVER_InferenceResponse* response, const uint32_t flags,
1027  void* userp);
1028 
1038 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1040  struct TRITONSERVER_InferenceRequest** inference_request,
1041  struct TRITONSERVER_Server* server, const char* model_name,
1042  const int64_t model_version);
1043 
1048 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1050  struct TRITONSERVER_InferenceRequest* inference_request);
1051 
1059 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1061  struct TRITONSERVER_InferenceRequest* inference_request, const char** id);
1062 
1068 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1070  struct TRITONSERVER_InferenceRequest* inference_request, const char* id);
1071 
1079 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1081  struct TRITONSERVER_InferenceRequest* inference_request, uint32_t* flags);
1082 
1090 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1092  struct TRITONSERVER_InferenceRequest* inference_request, uint32_t flags);
1093 
1105 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1107  struct TRITONSERVER_InferenceRequest* inference_request,
1108  uint64_t* correlation_id);
1109 
1121 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1123  struct TRITONSERVER_InferenceRequest* inference_request,
1124  const char** correlation_id);
1125 
1135 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1137  struct TRITONSERVER_InferenceRequest* inference_request,
1138  uint64_t correlation_id);
1139 
1149 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1151  struct TRITONSERVER_InferenceRequest* inference_request,
1152  const char* correlation_id);
1153 
1164 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1166  struct TRITONSERVER_InferenceRequest* inference_request);
1167 
1177 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1179  struct TRITONSERVER_InferenceRequest* inference_request,
1180  bool* is_cancelled);
1181 
1191 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1193  struct TRITONSERVER_InferenceRequest* inference_request,
1194  uint32_t* priority);
1195 
1203 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1205  struct TRITONSERVER_InferenceRequest* inference_request,
1206  uint64_t* priority);
1207 
1217 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1219  struct TRITONSERVER_InferenceRequest* inference_request, uint32_t priority);
1220 
1228 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1230  struct TRITONSERVER_InferenceRequest* inference_request, uint64_t priority);
1231 
1238 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1240  struct TRITONSERVER_InferenceRequest* inference_request,
1241  uint64_t* timeout_us);
1242 
1249 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1250 TRITONSERVER_InferenceRequestSetTimeoutMicroseconds(
1251  struct TRITONSERVER_InferenceRequest* inference_request,
1252  uint64_t timeout_us);
1253 
1264 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1266  struct TRITONSERVER_InferenceRequest* inference_request, const char* name,
1267  const TRITONSERVER_DataType datatype, const int64_t* shape,
1268  uint64_t dim_count);
1269 
1280 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1282  struct TRITONSERVER_InferenceRequest* inference_request, const char* name);
1283 
1289 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1291  struct TRITONSERVER_InferenceRequest* inference_request, const char* name);
1292 
1297 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1299  struct TRITONSERVER_InferenceRequest* inference_request);
1300 
1315 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1317  struct TRITONSERVER_InferenceRequest* inference_request, const char* name,
1318  const void* base, size_t byte_size, TRITONSERVER_MemoryType memory_type,
1319  int64_t memory_type_id);
1320 
1340 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1342  struct TRITONSERVER_InferenceRequest* inference_request, const char* name,
1343  const void* base, size_t byte_size, TRITONSERVER_MemoryType memory_type,
1344  int64_t memory_type_id, const char* host_policy_name);
1345 
1358 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1360  struct TRITONSERVER_InferenceRequest* inference_request, const char* name,
1361  const void* base, struct TRITONSERVER_BufferAttributes* buffer_attributes);
1362 
1369 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1371  struct TRITONSERVER_InferenceRequest* inference_request, const char* name);
1372 
1378 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1380  struct TRITONSERVER_InferenceRequest* inference_request, const char* name);
1381 
1387 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1389  struct TRITONSERVER_InferenceRequest* inference_request, const char* name);
1390 
1395 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1397  struct TRITONSERVER_InferenceRequest* inference_request);
1398 
1409 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1411  struct TRITONSERVER_InferenceRequest* inference_request,
1412  TRITONSERVER_InferenceRequestReleaseFn_t request_release_fn,
1413  void* request_release_userp);
1414 
1435 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1437  struct TRITONSERVER_InferenceRequest* inference_request,
1438  struct TRITONSERVER_ResponseAllocator* response_allocator,
1439  void* response_allocator_userp,
1441  void* response_userp);
1442 
1449 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1451  struct TRITONSERVER_InferenceRequest* request, const char* key,
1452  const char* value);
1453 
1460 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1462  struct TRITONSERVER_InferenceRequest* request, const char* key,
1463  const int64_t value);
1464 
1471 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1473  struct TRITONSERVER_InferenceRequest* request, const char* key,
1474  const bool value);
1475 
1482 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1484  struct TRITONSERVER_InferenceRequest* request, const char* key,
1485  const double value);
1486 
1493 
1498 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1500  struct TRITONSERVER_InferenceResponse* inference_response);
1501 
1510 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1512  struct TRITONSERVER_InferenceResponse* inference_response);
1513 
1524 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1526  struct TRITONSERVER_InferenceResponse* inference_response,
1527  const char** model_name, int64_t* model_version);
1528 
1538 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1540  struct TRITONSERVER_InferenceResponse* inference_response,
1541  const char** request_id);
1542 
1548 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1550  struct TRITONSERVER_InferenceResponse* inference_response, uint32_t* count);
1551 
1583 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1585  struct TRITONSERVER_InferenceResponse* inference_response,
1586  const uint32_t index, const char** name, TRITONSERVER_ParameterType* type,
1587  const void** vvalue);
1588 
1594 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1596  struct TRITONSERVER_InferenceResponse* inference_response, uint32_t* count);
1597 
1620 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1622  struct TRITONSERVER_InferenceResponse* inference_response,
1623  const uint32_t index, const char** name, TRITONSERVER_DataType* datatype,
1624  const int64_t** shape, uint64_t* dim_count, const void** base,
1625  size_t* byte_size, TRITONSERVER_MemoryType* memory_type,
1626  int64_t* memory_type_id, void** userp);
1627 
1641 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1643  struct TRITONSERVER_InferenceResponse* inference_response,
1644  const uint32_t index, const size_t class_index, const char** label);
1645 
1650 
1657 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1659  struct TRITONSERVER_BufferAttributes** buffer_attributes);
1660 
1665 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1667  struct TRITONSERVER_BufferAttributes* buffer_attributes);
1668 
1675 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1677  struct TRITONSERVER_BufferAttributes* buffer_attributes,
1678  int64_t memory_type_id);
1679 
1685 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1686 TRITONSERVER_BufferAttributesSetMemoryType(
1687  struct TRITONSERVER_BufferAttributes* buffer_attributes,
1688  TRITONSERVER_MemoryType memory_type);
1689 
1696 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1698  struct TRITONSERVER_BufferAttributes* buffer_attributes,
1699  void* cuda_ipc_handle);
1700 
1706 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1708  struct TRITONSERVER_BufferAttributes* buffer_attributes, size_t byte_size);
1709 
1716 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1718  struct TRITONSERVER_BufferAttributes* buffer_attributes,
1719  int64_t* memory_type_id);
1720 
1727 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1729  struct TRITONSERVER_BufferAttributes* buffer_attributes,
1730  TRITONSERVER_MemoryType* memory_type);
1731 
1739 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1741  struct TRITONSERVER_BufferAttributes* buffer_attributes,
1742  void** cuda_ipc_handle);
1743 
1750 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1752  struct TRITONSERVER_BufferAttributes* buffer_attributes, size_t* byte_size);
1753 
1754 
1759 
1766 
1772 
1779 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ServerOptionsNew(
1780  struct TRITONSERVER_ServerOptions** options);
1781 
1786 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1787 TRITONSERVER_ServerOptionsDelete(struct TRITONSERVER_ServerOptions* options);
1788 
1795 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1797  struct TRITONSERVER_ServerOptions* options, const char* server_id);
1798 
1808 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1810  struct TRITONSERVER_ServerOptions* options,
1811  const char* model_repository_path);
1812 
1833 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1835  struct TRITONSERVER_ServerOptions* options,
1837 
1847 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1849  struct TRITONSERVER_ServerOptions* options, const char* model_name);
1850 
1858 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1860  struct TRITONSERVER_ServerOptions* options, bool strict);
1861 
1868 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1870  struct TRITONSERVER_ServerOptions* options, const char* model_config_name);
1871 
1886 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1888  struct TRITONSERVER_ServerOptions* options,
1890 
1904 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1906  struct TRITONSERVER_ServerOptions* options, const char* resource_name,
1907  const size_t resource_count, const int device);
1908 
1917 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1919  struct TRITONSERVER_ServerOptions* options, uint64_t size);
1920 
1930 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1932  struct TRITONSERVER_ServerOptions* options, int gpu_device, uint64_t size);
1933 
1941 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1943  struct TRITONSERVER_ServerOptions* options, int gpu_device,
1944  size_t cuda_virtual_address_size);
1945 
1955 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1957  struct TRITONSERVER_ServerOptions* options, uint64_t size);
1958 
1980 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1982  struct TRITONSERVER_ServerOptions* options, const char* cache_name,
1983  const char* config_json);
1984 
1991 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
1993  struct TRITONSERVER_ServerOptions* options, const char* cache_dir);
1994 
2001 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2003  struct TRITONSERVER_ServerOptions* options, double cc);
2004 
2011 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2013  struct TRITONSERVER_ServerOptions* options, bool exit);
2014 
2021 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2023  struct TRITONSERVER_ServerOptions* options, bool strict);
2024 
2031 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2033  struct TRITONSERVER_ServerOptions* options, unsigned int timeout);
2034 
2040 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2042  struct TRITONSERVER_ServerOptions* options, unsigned int thread_count);
2043 
2049 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2051  struct TRITONSERVER_ServerOptions* options, unsigned int thread_count);
2052 
2058 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2060  struct TRITONSERVER_ServerOptions* options, unsigned int retry_count);
2061 
2068 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2070  struct TRITONSERVER_ServerOptions* options, bool enable_namespace);
2071 
2080 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2082  struct TRITONSERVER_ServerOptions* options, bool enable_peer_access);
2083 
2091 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2093  struct TRITONSERVER_ServerOptions* options, const char* file);
2094 
2100 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2102  struct TRITONSERVER_ServerOptions* options, bool log);
2103 
2109 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2111  struct TRITONSERVER_ServerOptions* options, bool log);
2112 
2118 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2120  struct TRITONSERVER_ServerOptions* options, bool log);
2121 
2127 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2129  struct TRITONSERVER_ServerOptions* options,
2130  const TRITONSERVER_LogFormat format);
2131 
2137 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2139  struct TRITONSERVER_ServerOptions* options, int level);
2140 
2146 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2148  struct TRITONSERVER_ServerOptions* options, bool metrics);
2149 
2157 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2159  struct TRITONSERVER_ServerOptions* options, bool gpu_metrics);
2160 
2168 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2170  struct TRITONSERVER_ServerOptions* options, bool cpu_metrics);
2171 
2179 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2181  struct TRITONSERVER_ServerOptions* options, uint64_t metrics_interval_ms);
2182 
2192 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2194  struct TRITONSERVER_ServerOptions* options, const char* backend_dir);
2195 
2204 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2206  struct TRITONSERVER_ServerOptions* options, const char* repoagent_dir);
2207 
2220 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2221 TRITONSERVER_ServerOptionsSetModelLoadDeviceLimit(
2222  struct TRITONSERVER_ServerOptions* options,
2223  const TRITONSERVER_InstanceGroupKind kind, const int device_id,
2224  const double fraction);
2225 
2234 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2236  struct TRITONSERVER_ServerOptions* options, const char* backend_name,
2237  const char* setting, const char* value);
2238 
2246 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2248  struct TRITONSERVER_ServerOptions* options, const char* policy_name,
2249  const char* setting, const char* value);
2250 
2259 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2261  struct TRITONSERVER_ServerOptions* options, const char* name,
2262  const char* setting, const char* value);
2263 
2268 
2274 
2279 
2286 
2294 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ServerNew(
2295  struct TRITONSERVER_Server** server,
2296  struct TRITONSERVER_ServerOptions* options);
2297 
2303 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ServerDelete(
2304  struct TRITONSERVER_Server* server);
2305 
2311 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ServerStop(
2312  struct TRITONSERVER_Server* server);
2313 
2321 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2323  struct TRITONSERVER_Server* server, unsigned int timeout);
2324 
2333 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2335  struct TRITONSERVER_Server* server, const char* repository_path,
2336  const struct TRITONSERVER_Parameter** name_mapping,
2337  const uint32_t mapping_count);
2338 
2344 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2346  struct TRITONSERVER_Server* server, const char* repository_path);
2347 
2353 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2354 TRITONSERVER_ServerPollModelRepository(struct TRITONSERVER_Server* server);
2355 
2361 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ServerIsLive(
2362  struct TRITONSERVER_Server* server, bool* live);
2363 
2369 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ServerIsReady(
2370  struct TRITONSERVER_Server* server, bool* ready);
2371 
2381 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2383  struct TRITONSERVER_Server* server, const char* model_name,
2384  const int64_t model_version, bool* ready);
2385 
2410 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2412  struct TRITONSERVER_Server* server, const char* model_name,
2413  const int64_t model_version, uint32_t* flags, void** voidp);
2414 
2432 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2434  struct TRITONSERVER_Server* server, const char* model_name,
2435  const int64_t model_version, uint32_t* txn_flags, void** voidp);
2436 
2444 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ServerMetadata(
2445  struct TRITONSERVER_Server* server,
2446  struct TRITONSERVER_Message** server_metadata);
2447 
2459 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2461  struct TRITONSERVER_Server* server, const char* model_name,
2462  const int64_t model_version, struct TRITONSERVER_Message** model_metadata);
2463 
2476 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2478  struct TRITONSERVER_Server* server, const char* model_name,
2479  const int64_t model_version, struct TRITONSERVER_Message** model_stats);
2480 
2495 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ServerModelConfig(
2496  struct TRITONSERVER_Server* server, const char* model_name,
2497  const int64_t model_version, const uint32_t config_version,
2498  struct TRITONSERVER_Message** model_config);
2499 
2515 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ServerModelIndex(
2516  struct TRITONSERVER_Server* server, uint32_t flags,
2517  struct TRITONSERVER_Message** model_index);
2518 
2527 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ServerLoadModel(
2528  struct TRITONSERVER_Server* server, const char* model_name);
2529 
2544 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2546  struct TRITONSERVER_Server* server, const char* model_name,
2547  const struct TRITONSERVER_Parameter** parameters,
2548  const uint64_t parameter_count);
2549 
2559 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ServerUnloadModel(
2560  struct TRITONSERVER_Server* server, const char* model_name);
2561 
2573 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2575  struct TRITONSERVER_Server* server, const char* model_name);
2576 
2584 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ServerMetrics(
2585  struct TRITONSERVER_Server* server, struct TRITONSERVER_Metrics** metrics);
2586 
2608 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_ServerInferAsync(
2609  struct TRITONSERVER_Server* server,
2610  struct TRITONSERVER_InferenceRequest* inference_request,
2611  struct TRITONSERVER_InferenceTrace* trace);
2612 
2622 
2634 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_MetricFamilyNew(
2635  struct TRITONSERVER_MetricFamily** family,
2636  const TRITONSERVER_MetricKind kind, const char* name,
2637  const char* description);
2638 
2646 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2647 TRITONSERVER_MetricFamilyDelete(struct TRITONSERVER_MetricFamily* family);
2648 
2654 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2656  struct TRITONSERVER_MetricFamily* family, TRITONSERVER_MetricKind* kind);
2657 
2664 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_MetricArgsNew(
2665  struct TRITONSERVER_MetricArgs** args);
2666 
2675 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error*
2677  struct TRITONSERVER_MetricArgs* args, const double* buckets,
2678  const uint64_t buckets_count);
2679 
2684 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_MetricArgsDelete(
2685  struct TRITONSERVER_MetricArgs* args);
2686 
2699 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_MetricNew(
2700  struct TRITONSERVER_Metric** metric,
2701  struct TRITONSERVER_MetricFamily* family,
2702  const struct TRITONSERVER_Parameter** labels, const uint64_t label_count);
2703 
2720 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_MetricNewWithArgs(
2721  struct TRITONSERVER_Metric** metric,
2722  struct TRITONSERVER_MetricFamily* family,
2723  const struct TRITONSERVER_Parameter** labels, const uint64_t label_count,
2724  const struct TRITONSERVER_MetricArgs* args);
2725 
2733 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_MetricDelete(
2734  struct TRITONSERVER_Metric* metric);
2735 
2744 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_MetricValue(
2745  struct TRITONSERVER_Metric* metric, double* value);
2746 
2757 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_MetricIncrement(
2758  struct TRITONSERVER_Metric* metric, double value);
2759 
2767 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_MetricSet(
2768  struct TRITONSERVER_Metric* metric, double value);
2769 
2777 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_MetricObserve(
2778  struct TRITONSERVER_Metric* metric, double value);
2779 
2785 TRITONSERVER_DECLSPEC struct TRITONSERVER_Error* TRITONSERVER_GetMetricKind(
2786  struct TRITONSERVER_Metric* metric, TRITONSERVER_MetricKind* kind);
2787 
2788 #ifdef __cplusplus
2789 }
2790 #endif
TRITONSERVER_InferenceTraceReleaseFn_t
void(* TRITONSERVER_InferenceTraceReleaseFn_t)(struct TRITONSERVER_InferenceTrace *trace, void *userp)
Type for trace release callback function.
Definition: tritonserver.h:778
TRITONSERVER_InferenceRequestSetTimeoutMicroseconds
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestSetTimeoutMicroseconds(struct TRITONSERVER_InferenceRequest *inference_request, uint64_t timeout_us)
Set the timeout for a request, in microseconds.
TRITONSERVER_TYPE_INT64
@ TRITONSERVER_TYPE_INT64
Definition: tritonserver.h:125
tritonserver_traceactivity_enum
tritonserver_traceactivity_enum
Trace activities.
Definition: tritonserver.h:726
TRITONSERVER_ResponseAllocatorReleaseFn_t
struct TRITONSERVER_Error *(* TRITONSERVER_ResponseAllocatorReleaseFn_t)(struct TRITONSERVER_ResponseAllocator *allocator, void *buffer, void *buffer_userp, size_t byte_size, TRITONSERVER_MemoryType memory_type, int64_t memory_type_id)
Type for function that is called when the server no longer holds any reference to a buffer allocated ...
Definition: tritonserver.h:495
TRITONSERVER_InferenceTraceLevelString
const TRITONSERVER_DECLSPEC char * TRITONSERVER_InferenceTraceLevelString(TRITONSERVER_InferenceTraceLevel level)
Get the string representation of a trace level.
TRITONSERVER_TYPE_BF16
@ TRITONSERVER_TYPE_BF16
Definition: tritonserver.h:130
TRITONSERVER_ServerOptionsSetModelLoadDeviceLimit
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetModelLoadDeviceLimit(struct TRITONSERVER_ServerOptions *options, const TRITONSERVER_InstanceGroupKind kind, const int device_id, const double fraction)
Specify the limit on memory usage as a fraction on the device identified by 'kind' and 'device_id'.
TRITONSERVER_InferenceTraceLevel
enum tritonserver_tracelevel_enum TRITONSERVER_InferenceTraceLevel
TRITONSERVER_InferenceTrace.
TRITONSERVER_TRACE_LEVEL_DISABLED
@ TRITONSERVER_TRACE_LEVEL_DISABLED
Tracing disabled. No trace activities are reported.
Definition: tritonserver.h:705
TRITONSERVER_logformat_enum
TRITONSERVER_logformat_enum
Logging Formats.
Definition: tritonserver.h:289
TRITONSERVER_InferenceTraceSpawnChildTrace
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceTraceSpawnChildTrace(struct TRITONSERVER_InferenceTrace *trace, struct TRITONSERVER_InferenceTrace **child_trace)
Get the child trace, spawned from the parent trace.
tritonserver_responsecompleteflag_enum
tritonserver_responsecompleteflag_enum
Inference response complete flags.
Definition: tritonserver.h:971
TRITONSERVER_ErrorMessage
const TRITONSERVER_DECLSPEC char * TRITONSERVER_ErrorMessage(struct TRITONSERVER_Error *error)
Get the error message.
TRITONSERVER_ResponseAllocatorAllocFn_t
struct TRITONSERVER_Error *(* TRITONSERVER_ResponseAllocatorAllocFn_t)(struct TRITONSERVER_ResponseAllocator *allocator, const char *tensor_name, size_t byte_size, TRITONSERVER_MemoryType memory_type, int64_t memory_type_id, void *userp, void **buffer, void **buffer_userp, TRITONSERVER_MemoryType *actual_memory_type, int64_t *actual_memory_type_id)
TRITONSERVER_ResponseAllocator.
Definition: tritonserver.h:414
TRITONSERVER_BufferAttributesSetMemoryType
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_BufferAttributesSetMemoryType(struct TRITONSERVER_BufferAttributes *buffer_attributes, TRITONSERVER_MemoryType memory_type)
Set the memory type field of the buffer attributes.
TRITONSERVER_ServerOptionsSetCpuMetrics
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetCpuMetrics(struct TRITONSERVER_ServerOptions *options, bool cpu_metrics)
Enable or disable CPU metrics collection in a server options.
TRITONSERVER_MEMORY_CPU
@ TRITONSERVER_MEMORY_CPU
Definition: tritonserver.h:164
TRITONSERVER_PARAMETER_BYTES
@ TRITONSERVER_PARAMETER_BYTES
Definition: tritonserver.h:187
TRITONSERVER_LOG_ISO8601
@ TRITONSERVER_LOG_ISO8601
Definition: tritonserver.h:291
TRITONSERVER_InferenceTraceModelVersion
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceTraceModelVersion(struct TRITONSERVER_InferenceTrace *trace, int64_t *model_version)
Get the version of the model associated with a trace.
TRITONSERVER_ApiVersion
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ApiVersion(uint32_t *major, uint32_t *minor)
Get the TRITONSERVER API version supported by the Triton shared library.
TRITONSERVER_InferenceRequestRemoveInput
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestRemoveInput(struct TRITONSERVER_InferenceRequest *inference_request, const char *name)
Remove an input from a request.
TRITONSERVER_LOG_DEFAULT
@ TRITONSERVER_LOG_DEFAULT
Definition: tritonserver.h:290
TRITONSERVER_TYPE_UINT16
@ TRITONSERVER_TYPE_UINT16
Definition: tritonserver.h:119
TRITONSERVER_InferenceResponseParameter
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceResponseParameter(struct TRITONSERVER_InferenceResponse *inference_response, const uint32_t index, const char **name, TRITONSERVER_ParameterType *type, const void **vvalue)
Get all information about a parameter.
TRITONSERVER_TYPE_INT16
@ TRITONSERVER_TYPE_INT16
Definition: tritonserver.h:123
TRITONSERVER_ResponseAllocatorStartFn_t
struct TRITONSERVER_Error *(* TRITONSERVER_ResponseAllocatorStartFn_t)(struct TRITONSERVER_ResponseAllocator *allocator, void *userp)
Type for function that is called to indicate that subsequent allocation requests will refer to a new ...
Definition: tritonserver.h:509
TRITONSERVER_TRACE_QUEUE_START
@ TRITONSERVER_TRACE_QUEUE_START
Definition: tritonserver.h:728
TRITONSERVER_TYPE_UINT64
@ TRITONSERVER_TYPE_UINT64
Definition: tritonserver.h:121
TRITONSERVER_MetricNew
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MetricNew(struct TRITONSERVER_Metric **metric, struct TRITONSERVER_MetricFamily *family, const struct TRITONSERVER_Parameter **labels, const uint64_t label_count)
Create a new metric object.
TRITONSERVER_ServerOptionsSetStrictReadiness
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetStrictReadiness(struct TRITONSERVER_ServerOptions *options, bool strict)
Enable or disable strict readiness handling in a server options.
TRITONSERVER_metrickind_enum
TRITONSERVER_metrickind_enum
TRITONSERVER_MetricKind.
Definition: tritonserver.h:2617
TRITONSERVER_InferenceTraceSetContext
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceTraceSetContext(struct TRITONSERVER_InferenceTrace *trace, const char *trace_context)
Set TRITONSERVER_InferenceTrace context.
TRITONSERVER_ERROR_CANCELLED
@ TRITONSERVER_ERROR_CANCELLED
Definition: tritonserver.h:332
TRITONSERVER_ModelControlMode
enum tritonserver_modelcontrolmode_enum TRITONSERVER_ModelControlMode
TRITONSERVER_ServerOptions.
TRITONSERVER_RATE_LIMIT_OFF
@ TRITONSERVER_RATE_LIMIT_OFF
Definition: tritonserver.h:1769
TRITONSERVER_InferenceResponseId
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceResponseId(struct TRITONSERVER_InferenceResponse *inference_response, const char **request_id)
Get the ID of the request corresponding to a response.
TRITONSERVER_ERROR_NOT_FOUND
@ TRITONSERVER_ERROR_NOT_FOUND
Definition: tritonserver.h:327
TRITONSERVER_ResponseAllocatorDelete
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ResponseAllocatorDelete(struct TRITONSERVER_ResponseAllocator *allocator)
Delete a response allocator.
TRITONSERVER_MetricNewWithArgs
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MetricNewWithArgs(struct TRITONSERVER_Metric **metric, struct TRITONSERVER_MetricFamily *family, const struct TRITONSERVER_Parameter **labels, const uint64_t label_count, const struct TRITONSERVER_MetricArgs *args)
Create a new metric object.
TRITONSERVER_InferenceRequestCorrelationIdString
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestCorrelationIdString(struct TRITONSERVER_InferenceRequest *inference_request, const char **correlation_id)
Get the correlation ID of the inference request as a string.
TRITONSERVER_ServerOptionsSetHostPolicy
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetHostPolicy(struct TRITONSERVER_ServerOptions *options, const char *policy_name, const char *setting, const char *value)
Set a host policy setting for a given policy name in a server options.
TRITONSERVER_InferenceResponseError
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceResponseError(struct TRITONSERVER_InferenceResponse *inference_response)
Return the error status of an inference response.
TRITONSERVER_InferenceRequestSetIntParameter
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestSetIntParameter(struct TRITONSERVER_InferenceRequest *request, const char *key, const int64_t value)
Set an integer parameter in the request.
TRITONSERVER_ServerOptionsNew
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsNew(struct TRITONSERVER_ServerOptions **options)
Create a new server options object.
TRITONSERVER_MetricFamilyDelete
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MetricFamilyDelete(struct TRITONSERVER_MetricFamily *family)
Delete a metric family object.
TRITONSERVER_TRACE_COMPUTE_END
@ TRITONSERVER_TRACE_COMPUTE_END
Definition: tritonserver.h:732
TRITONSERVER_MetricsDelete
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MetricsDelete(struct TRITONSERVER_Metrics *metrics)
Delete a metrics object.
TRITONSERVER_LOG_VERBOSE
@ TRITONSERVER_LOG_VERBOSE
Definition: tritonserver.h:260
TRITONSERVER_InferenceTraceModelName
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceTraceModelName(struct TRITONSERVER_InferenceTrace *trace, const char **model_name)
Get the name of the model associated with a trace.
TRITONSERVER_ServerModelIsReady
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerModelIsReady(struct TRITONSERVER_Server *server, const char *model_name, const int64_t model_version, bool *ready)
Is the model ready?
TRITONSERVER_MemoryType
enum TRITONSERVER_memorytype_enum TRITONSERVER_MemoryType
TRITONSERVER_MemoryType.
TRITONSERVER_TRACE_TENSOR_QUEUE_INPUT
@ TRITONSERVER_TRACE_TENSOR_QUEUE_INPUT
Definition: tritonserver.h:734
TRITONSERVER_DataTypeByteSize
TRITONSERVER_DECLSPEC uint32_t TRITONSERVER_DataTypeByteSize(TRITONSERVER_DataType datatype)
Get the size of a Triton datatype in bytes.
TRITONSERVER_BATCH_UNKNOWN
@ TRITONSERVER_BATCH_UNKNOWN
Definition: tritonserver.h:2271
TRITONSERVER_BufferAttributesSetMemoryTypeId
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_BufferAttributesSetMemoryTypeId(struct TRITONSERVER_BufferAttributes *buffer_attributes, int64_t memory_type_id)
Set the memory type id field of the buffer attributes.
TRITONSERVER_PARAMETER_DOUBLE
@ TRITONSERVER_PARAMETER_DOUBLE
Definition: tritonserver.h:186
TRITONSERVER_InferenceRequestTimeoutMicroseconds
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestTimeoutMicroseconds(struct TRITONSERVER_InferenceRequest *inference_request, uint64_t *timeout_us)
Get the timeout for a request, in microseconds.
TRITONSERVER_ServerOptionsSetPinnedMemoryPoolByteSize
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetPinnedMemoryPoolByteSize(struct TRITONSERVER_ServerOptions *options, uint64_t size)
Set the total pinned memory byte size that the server can allocate in a server options.
TRITONSERVER_METRIC_PROMETHEUS
@ TRITONSERVER_METRIC_PROMETHEUS
Definition: tritonserver.h:653
TRITONSERVER_REQUEST_FLAG_SEQUENCE_END
@ TRITONSERVER_REQUEST_FLAG_SEQUENCE_END
Definition: tritonserver.h:959
TRITONSERVER_ServerOptionsAddRateLimiterResource
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsAddRateLimiterResource(struct TRITONSERVER_ServerOptions *options, const char *resource_name, const size_t resource_count, const int device)
Add resource count for rate limiting.
TRITONSERVER_InferenceTraceContext
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceTraceContext(struct TRITONSERVER_InferenceTrace *trace, const char **trace_context)
Get TRITONSERVER_InferenceTrace context.
TRITONSERVER_ServerOptionsSetCudaVirtualAddressSize
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetCudaVirtualAddressSize(struct TRITONSERVER_ServerOptions *options, int gpu_device, size_t cuda_virtual_address_size)
Set the size of the virtual address space that will be used for growable memory in implicit state.
TRITONSERVER_ServerIsLive
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerIsLive(struct TRITONSERVER_Server *server, bool *live)
Is the server live?
TRITONSERVER_MODEL_CONTROL_POLL
@ TRITONSERVER_MODEL_CONTROL_POLL
Definition: tritonserver.h:1763
TRITONSERVER_TRACE_COMPUTE_INPUT_END
@ TRITONSERVER_TRACE_COMPUTE_INPUT_END
Definition: tritonserver.h:730
TRITONSERVER_InferenceRequestRemoveRequestedOutput
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestRemoveRequestedOutput(struct TRITONSERVER_InferenceRequest *inference_request, const char *name)
Remove an output request from an inference request.
TRITONSERVER_TXN_DECOUPLED
@ TRITONSERVER_TXN_DECOUPLED
Definition: tritonserver.h:2284
TRITONSERVER_ServerOptionsSetGpuMetrics
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetGpuMetrics(struct TRITONSERVER_ServerOptions *options, bool gpu_metrics)
Enable or disable GPU metrics collection in a server options.
TRITONSERVER_ERROR_UNKNOWN
@ TRITONSERVER_ERROR_UNKNOWN
Definition: tritonserver.h:325
TRITONSERVER_ErrorNew
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ErrorNew(TRITONSERVER_Error_Code code, const char *msg)
Create a new error object.
TRITONSERVER_InferenceTraceActivityString
const TRITONSERVER_DECLSPEC char * TRITONSERVER_InferenceTraceActivityString(TRITONSERVER_InferenceTraceActivity activity)
Get the string representation of a trace activity.
TRITONSERVER_MetricKind
enum TRITONSERVER_metrickind_enum TRITONSERVER_MetricKind
TRITONSERVER_MetricKind.
TRITONSERVER_TRACE_LEVEL_TIMESTAMPS
@ TRITONSERVER_TRACE_LEVEL_TIMESTAMPS
Record timestamps for the inference request.
Definition: tritonserver.h:711
TRITONSERVER_ServerModelBatchProperties
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerModelBatchProperties(struct TRITONSERVER_Server *server, const char *model_name, const int64_t model_version, uint32_t *flags, void **voidp)
Get the batch properties of the model.
TRITONSERVER_InferenceRequestAddRawInput
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestAddRawInput(struct TRITONSERVER_InferenceRequest *inference_request, const char *name)
Add a raw input to a request.
TRITONSERVER_InferenceResponseDelete
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceResponseDelete(struct TRITONSERVER_InferenceResponse *inference_response)
TRITONSERVER_InferenceResponse.
TRITONSERVER_InferenceTraceNew
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceTraceNew(struct TRITONSERVER_InferenceTrace **trace, TRITONSERVER_InferenceTraceLevel level, uint64_t parent_id, TRITONSERVER_InferenceTraceActivityFn_t activity_fn, TRITONSERVER_InferenceTraceReleaseFn_t release_fn, void *trace_userp)
Create a new inference trace object.
TRITONSERVER_ServerModelStatistics
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerModelStatistics(struct TRITONSERVER_Server *server, const char *model_name, const int64_t model_version, struct TRITONSERVER_Message **model_stats)
Get the statistics of a model as a TRITONSERVER_Message object.
TRITONSERVER_PARAMETER_INT
@ TRITONSERVER_PARAMETER_INT
Definition: tritonserver.h:184
TRITONSERVER_BufferAttributesByteSize
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_BufferAttributesByteSize(struct TRITONSERVER_BufferAttributes *buffer_attributes, size_t *byte_size)
Get the byte size field of the buffer attributes.
TRITONSERVER_MemoryTypeString
const TRITONSERVER_DECLSPEC char * TRITONSERVER_MemoryTypeString(TRITONSERVER_MemoryType memtype)
Get the string representation of a memory type.
TRITONSERVER_ServerOptionsSetBackendConfig
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetBackendConfig(struct TRITONSERVER_ServerOptions *options, const char *backend_name, const char *setting, const char *value)
Set a configuration setting for a named backend in a server options.
TRITONSERVER_ERROR_ALREADY_EXISTS
@ TRITONSERVER_ERROR_ALREADY_EXISTS
Definition: tritonserver.h:331
TRITONSERVER_ResponseAllocatorBufferAttributesFn_t
struct TRITONSERVER_Error *(* TRITONSERVER_ResponseAllocatorBufferAttributesFn_t)(struct TRITONSERVER_ResponseAllocator *allocator, const char *tensor_name, struct TRITONSERVER_BufferAttributes *buffer_attributes, void *userp, void *buffer_userp)
Type for allocation function that allocates a buffer to hold an output tensor with buffer attributes.
Definition: tritonserver.h:444
tritonserver_modelindexflag_enum
tritonserver_modelindexflag_enum
Model index flags. The enum values must be power-of-2 values.
Definition: tritonserver.h:2276
TRITONSERVER_REQUEST_FLAG_SEQUENCE_START
@ TRITONSERVER_REQUEST_FLAG_SEQUENCE_START
Definition: tritonserver.h:958
TRITONSERVER_DECLSPEC
#define TRITONSERVER_DECLSPEC
Definition: tritonserver.h:50
TRITONSERVER_InferenceRequestSetCorrelationId
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestSetCorrelationId(struct TRITONSERVER_InferenceRequest *inference_request, uint64_t correlation_id)
Set the correlation ID of the inference request to be an unsigned integer.
TRITONSERVER_ParameterDelete
TRITONSERVER_DECLSPEC void TRITONSERVER_ParameterDelete(struct TRITONSERVER_Parameter *parameter)
Delete a parameter object.
TRITONSERVER_TRACE_LEVEL_TENSORS
@ TRITONSERVER_TRACE_LEVEL_TENSORS
Record input and output tensor values for the inference request.
Definition: tritonserver.h:713
TRITONSERVER_RequestReleaseFlag
enum tritonserver_requestreleaseflag_enum TRITONSERVER_RequestReleaseFlag
Inference request release flags.
TRITONSERVER_METRIC_KIND_GAUGE
@ TRITONSERVER_METRIC_KIND_GAUGE
Definition: tritonserver.h:2619
TRITONSERVER_LOG_INFO
@ TRITONSERVER_LOG_INFO
Definition: tritonserver.h:257
TRITONSERVER_TYPE_INT8
@ TRITONSERVER_TYPE_INT8
Definition: tritonserver.h:122
TRITONSERVER_InferenceTraceTensorActivityFn_t
void(* TRITONSERVER_InferenceTraceTensorActivityFn_t)(struct TRITONSERVER_InferenceTrace *trace, TRITONSERVER_InferenceTraceActivity activity, const char *name, TRITONSERVER_DataType datatype, const void *base, size_t byte_size, const int64_t *shape, uint64_t dim_count, TRITONSERVER_MemoryType memory_type, int64_t memory_type_id, void *userp)
Type for trace tensor activity callback function.
Definition: tritonserver.h:766
TRITONSERVER_ServerIsReady
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerIsReady(struct TRITONSERVER_Server *server, bool *ready)
Is the server ready?
TRITONSERVER_ServerOptionsSetMetrics
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetMetrics(struct TRITONSERVER_ServerOptions *options, bool metrics)
Enable or disable metrics collection in a server options.
TRITONSERVER_BufferAttributesSetByteSize
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_BufferAttributesSetByteSize(struct TRITONSERVER_BufferAttributes *buffer_attributes, size_t byte_size)
Set the byte size field of the buffer attributes.
TRITONSERVER_ServerOptionsSetLogError
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetLogError(struct TRITONSERVER_ServerOptions *options, bool log)
Enable or disable error level logging.
TRITONSERVER_TYPE_BYTES
@ TRITONSERVER_TYPE_BYTES
Definition: tritonserver.h:129
TRITONSERVER_BufferAttributesMemoryTypeId
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_BufferAttributesMemoryTypeId(struct TRITONSERVER_BufferAttributes *buffer_attributes, int64_t *memory_type_id)
Get the memory type id field of the buffer attributes.
TRITONSERVER_ResponseAllocatorSetQueryFunction
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ResponseAllocatorSetQueryFunction(struct TRITONSERVER_ResponseAllocator *allocator, TRITONSERVER_ResponseAllocatorQueryFn_t query_fn)
Set the query function to a response allocator object.
TRITONSERVER_InferenceRequestAppendInputData
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestAppendInputData(struct TRITONSERVER_InferenceRequest *inference_request, const char *name, const void *base, size_t byte_size, TRITONSERVER_MemoryType memory_type, int64_t memory_type_id)
Assign a buffer of data to an input.
TRITONSERVER_ServerOptionsSetLogInfo
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetLogInfo(struct TRITONSERVER_ServerOptions *options, bool log)
Enable or disable info level logging.
TRITONSERVER_ServerOptionsSetModelConfigName
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetModelConfigName(struct TRITONSERVER_ServerOptions *options, const char *model_config_name)
Set the custom model configuration name to load for all models.
TRITONSERVER_ServerOptionsSetEnablePeerAccess
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetEnablePeerAccess(struct TRITONSERVER_ServerOptions *options, bool enable_peer_access)
Enable peer access to allow a GPU device to directly access the memory of another GPU device.
TRITONSERVER_MetricSet
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MetricSet(struct TRITONSERVER_Metric *metric, double value)
Set the current value of metric to value.
TRITONSERVER_ServerUnloadModel
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerUnloadModel(struct TRITONSERVER_Server *server, const char *model_name)
Unload the requested model.
TRITONSERVER_INSTANCEGROUPKIND_MODEL
@ TRITONSERVER_INSTANCEGROUPKIND_MODEL
Definition: tritonserver.h:240
TRITONSERVER_InferenceRequestDelete
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestDelete(struct TRITONSERVER_InferenceRequest *inference_request)
Delete an inference request object.
TRITONSERVER_BufferAttributesNew
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_BufferAttributesNew(struct TRITONSERVER_BufferAttributes **buffer_attributes)
TRITONSERVER_BufferAttributes.
TRITONSERVER_InferenceRequestSetPriority
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestSetPriority(struct TRITONSERVER_InferenceRequest *inference_request, uint32_t priority)
Deprecated.
TRITONSERVER_MetricDelete
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MetricDelete(struct TRITONSERVER_Metric *metric)
Delete a metric object.
TRITONSERVER_Error_Code
enum TRITONSERVER_errorcode_enum TRITONSERVER_Error_Code
TRITONSERVER_Error.
TRITONSERVER_StringToDataType
TRITONSERVER_DECLSPEC TRITONSERVER_DataType TRITONSERVER_StringToDataType(const char *dtype)
Get the Triton datatype corresponding to a string representation of a datatype.
TRITONSERVER_LogFormat
enum TRITONSERVER_logformat_enum TRITONSERVER_LogFormat
Logging Formats.
TRITONSERVER_ErrorCodeString
const TRITONSERVER_DECLSPEC char * TRITONSERVER_ErrorCodeString(struct TRITONSERVER_Error *error)
Get the string representation of an error code.
TRITONSERVER_REQUEST_RELEASE_ALL
@ TRITONSERVER_REQUEST_RELEASE_ALL
Definition: tritonserver.h:965
TRITONSERVER_ServerOptionsSetCudaMemoryPoolByteSize
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetCudaMemoryPoolByteSize(struct TRITONSERVER_ServerOptions *options, int gpu_device, uint64_t size)
Set the total CUDA memory byte size that the server can allocate on given GPU device in a server opti...
TRITONSERVER_ServerOptionsSetModelControlMode
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetModelControlMode(struct TRITONSERVER_ServerOptions *options, TRITONSERVER_ModelControlMode mode)
Set the model control mode in a server options.
TRITONSERVER_DataTypeString
const TRITONSERVER_DECLSPEC char * TRITONSERVER_DataTypeString(TRITONSERVER_DataType datatype)
Get the string representation of a data type.
TRITONSERVER_METRIC_KIND_COUNTER
@ TRITONSERVER_METRIC_KIND_COUNTER
Definition: tritonserver.h:2618
TRITONSERVER_ServerOptionsDelete
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsDelete(struct TRITONSERVER_ServerOptions *options)
Delete a server options object.
TRITONSERVER_TXN_ONE_TO_ONE
@ TRITONSERVER_TXN_ONE_TO_ONE
Definition: tritonserver.h:2283
TRITONSERVER_errorcode_enum
TRITONSERVER_errorcode_enum
TRITONSERVER_Error.
Definition: tritonserver.h:324
TRITONSERVER_RATE_LIMIT_EXEC_COUNT
@ TRITONSERVER_RATE_LIMIT_EXEC_COUNT
Definition: tritonserver.h:1770
TRITONSERVER_BufferAttributesMemoryType
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_BufferAttributesMemoryType(struct TRITONSERVER_BufferAttributes *buffer_attributes, TRITONSERVER_MemoryType *memory_type)
Get the memory type field of the buffer attributes.
TRITONSERVER_MetricObserve
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MetricObserve(struct TRITONSERVER_Metric *metric, double value)
Sample an observation and count it to the appropriate bucket of a metric.
TRITONSERVER_ServerStop
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerStop(struct TRITONSERVER_Server *server)
Stop a server object.
TRITONSERVER_MetricArgsNew
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MetricArgsNew(struct TRITONSERVER_MetricArgs **args)
Create a new metric args object.
TRITONSERVER_InferenceResponseCompleteFn_t
void(* TRITONSERVER_InferenceResponseCompleteFn_t)(struct TRITONSERVER_InferenceResponse *response, const uint32_t flags, void *userp)
Type for callback function indicating that an inference response has completed.
Definition: tritonserver.h:1025
TRITONSERVER_MetricIncrement
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MetricIncrement(struct TRITONSERVER_Metric *metric, double value)
Increment the current value of metric by value.
TRITONSERVER_INDEX_FLAG_READY
@ TRITONSERVER_INDEX_FLAG_READY
Definition: tritonserver.h:2277
TRITONSERVER_ModelTxnPropertyFlag
enum tritonserver_txn_property_flag_enum TRITONSERVER_ModelTxnPropertyFlag
Model transaction policy flags.
TRITONSERVER_ParameterTypeString
const TRITONSERVER_DECLSPEC char * TRITONSERVER_ParameterTypeString(TRITONSERVER_ParameterType paramtype)
Get the string representation of a parameter type.
TRITONSERVER_InferenceRequestSetBoolParameter
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestSetBoolParameter(struct TRITONSERVER_InferenceRequest *request, const char *key, const bool value)
Set a boolean parameter in the request.
TRITONSERVER_ServerOptionsSetMetricsConfig
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetMetricsConfig(struct TRITONSERVER_ServerOptions *options, const char *name, const char *setting, const char *value)
Set a configuration setting for metrics in server options.
TRITONSERVER_InferenceRequestAppendInputDataWithBufferAttributes
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestAppendInputDataWithBufferAttributes(struct TRITONSERVER_InferenceRequest *inference_request, const char *name, const void *base, struct TRITONSERVER_BufferAttributes *buffer_attributes)
Assign a buffer of data to an input.
TRITONSERVER_memorytype_enum
TRITONSERVER_memorytype_enum
TRITONSERVER_MemoryType.
Definition: tritonserver.h:163
TRITONSERVER_TYPE_FP16
@ TRITONSERVER_TYPE_FP16
Definition: tritonserver.h:126
TRITONSERVER_TRACE_REQUEST_END
@ TRITONSERVER_TRACE_REQUEST_END
Definition: tritonserver.h:733
TRITONSERVER_ServerRegisterModelRepository
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerRegisterModelRepository(struct TRITONSERVER_Server *server, const char *repository_path, const struct TRITONSERVER_Parameter **name_mapping, const uint32_t mapping_count)
Register a new model repository.
TRITONSERVER_RequestFlag
enum tritonserver_requestflag_enum TRITONSERVER_RequestFlag
TRITONSERVER_InferenceRequest.
TRITONSERVER_InferenceTraceActivity
enum tritonserver_traceactivity_enum TRITONSERVER_InferenceTraceActivity
Trace activities.
TRITONSERVER_MessageSerializeToJson
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MessageSerializeToJson(struct TRITONSERVER_Message *message, const char **base, size_t *byte_size)
Get the base and size of the buffer containing the serialized message in JSON format.
TRITONSERVER_ServerModelMetadata
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerModelMetadata(struct TRITONSERVER_Server *server, const char *model_name, const int64_t model_version, struct TRITONSERVER_Message **model_metadata)
Get the metadata of a model as a TRITONSERVER_Message object.
TRITONSERVER_ServerOptionsSetBackendDirectory
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetBackendDirectory(struct TRITONSERVER_ServerOptions *options, const char *backend_dir)
Set the directory containing backend shared libraries.
TRITONSERVER_ERROR_INTERNAL
@ TRITONSERVER_ERROR_INTERNAL
Definition: tritonserver.h:326
TRITONSERVER_MODEL_CONTROL_NONE
@ TRITONSERVER_MODEL_CONTROL_NONE
Definition: tritonserver.h:1762
TRITONSERVER_InferenceRequestCancel
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestCancel(struct TRITONSERVER_InferenceRequest *inference_request)
Cancel an inference request.
TRITONSERVER_MODEL_CONTROL_EXPLICIT
@ TRITONSERVER_MODEL_CONTROL_EXPLICIT
Definition: tritonserver.h:1764
TRITONSERVER_ServerOptionsSetLogWarn
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetLogWarn(struct TRITONSERVER_ServerOptions *options, bool log)
Enable or disable warning level logging.
TRITONSERVER_ResponseAllocatorQueryFn_t
struct TRITONSERVER_Error *(* TRITONSERVER_ResponseAllocatorQueryFn_t)(struct TRITONSERVER_ResponseAllocator *allocator, void *userp, const char *tensor_name, size_t *byte_size, TRITONSERVER_MemoryType *memory_type, int64_t *memory_type_id)
Type for function that is called to query the allocator's preferred memory type and memory type ID.
Definition: tritonserver.h:473
TRITONSERVER_ParameterType
enum TRITONSERVER_parametertype_enum TRITONSERVER_ParameterType
TRITONSERVER_ParameterType.
TRITONSERVER_GetMetricKind
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_GetMetricKind(struct TRITONSERVER_Metric *metric, TRITONSERVER_MetricKind *kind)
Get the TRITONSERVER_MetricKind of the metric and its corresponding family.
TRITONSERVER_InferenceRequestRemoveAllInputData
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestRemoveAllInputData(struct TRITONSERVER_InferenceRequest *inference_request, const char *name)
Clear all input data from an input, releasing ownership of the buffer(s) that were appended to the in...
tritonserver_tracelevel_enum
tritonserver_tracelevel_enum
TRITONSERVER_InferenceTrace.
Definition: tritonserver.h:703
TRITONSERVER_parametertype_enum
TRITONSERVER_parametertype_enum
TRITONSERVER_ParameterType.
Definition: tritonserver.h:182
TRITONSERVER_TYPE_INVALID
@ TRITONSERVER_TYPE_INVALID
Definition: tritonserver.h:116
TRITONSERVER_PARAMETER_STRING
@ TRITONSERVER_PARAMETER_STRING
Definition: tritonserver.h:183
TRITONSERVER_TYPE_FP64
@ TRITONSERVER_TYPE_FP64
Definition: tritonserver.h:128
TRITONSERVER_ServerMetadata
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerMetadata(struct TRITONSERVER_Server *server, struct TRITONSERVER_Message **server_metadata)
Get the metadata of the server as a TRITONSERVER_Message object.
TRITONSERVER_ServerNew
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerNew(struct TRITONSERVER_Server **server, struct TRITONSERVER_ServerOptions *options)
Create a new server object.
TRITONSERVER_MetricValue
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MetricValue(struct TRITONSERVER_Metric *metric, double *value)
Get the current value of a metric object.
TRITONSERVER_InferenceResponseModel
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceResponseModel(struct TRITONSERVER_InferenceResponse *inference_response, const char **model_name, int64_t *model_version)
Get model used to produce a response.
TRITONSERVER_InferenceTraceActivityFn_t
void(* TRITONSERVER_InferenceTraceActivityFn_t)(struct TRITONSERVER_InferenceTrace *trace, TRITONSERVER_InferenceTraceActivity activity, uint64_t timestamp_ns, void *userp)
Type for trace timeline activity callback function.
Definition: tritonserver.h:755
TRITONSERVER_LogLevel
enum TRITONSERVER_loglevel_enum TRITONSERVER_LogLevel
TRITONSERVER_Logging.
tritonserver_txn_property_flag_enum
tritonserver_txn_property_flag_enum
Model transaction policy flags.
Definition: tritonserver.h:2282
TRITONSERVER_REQUEST_RELEASE_RESCHEDULE
@ TRITONSERVER_REQUEST_RELEASE_RESCHEDULE
Definition: tritonserver.h:966
TRITONSERVER_InferenceRequestSetFlags
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestSetFlags(struct TRITONSERVER_InferenceRequest *inference_request, uint32_t flags)
Set the flag(s) associated with a request.
TRITONSERVER_MetricArgsDelete
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MetricArgsDelete(struct TRITONSERVER_MetricArgs *args)
Delete a metric args object.
TRITONSERVER_MessageNewFromSerializedJson
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MessageNewFromSerializedJson(struct TRITONSERVER_Message **message, const char *base, size_t byte_size)
Create a new message object from a serialized JSON string.
TRITONSERVER_MessageDelete
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MessageDelete(struct TRITONSERVER_Message *message)
Delete a message object.
TRITONSERVER_InferenceRequestSetId
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestSetId(struct TRITONSERVER_InferenceRequest *inference_request, const char *id)
Set the ID for a request.
TRITONSERVER_DataType
enum TRITONSERVER_datatype_enum TRITONSERVER_DataType
TRITONSERVER_DataType.
TRITONSERVER_BufferAttributesDelete
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_BufferAttributesDelete(struct TRITONSERVER_BufferAttributes *buffer_attributes)
Delete a buffer attributes object.
TRITONSERVER_ResponseAllocatorSetBufferAttributesFunction
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ResponseAllocatorSetBufferAttributesFunction(struct TRITONSERVER_ResponseAllocator *allocator, TRITONSERVER_ResponseAllocatorBufferAttributesFn_t buffer_attributes_fn)
Set the buffer attributes function for a response allocator object.
TRITONSERVER_TRACE_COMPUTE_START
@ TRITONSERVER_TRACE_COMPUTE_START
Definition: tritonserver.h:729
tritonserver_batchflag_enum
tritonserver_batchflag_enum
TRITONSERVER_Server.
Definition: tritonserver.h:2270
TRITONSERVER_ERROR_INVALID_ARG
@ TRITONSERVER_ERROR_INVALID_ARG
Definition: tritonserver.h:328
TRITONSERVER_TYPE_BOOL
@ TRITONSERVER_TYPE_BOOL
Definition: tritonserver.h:117
TRITONSERVER_ServerPollModelRepository
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerPollModelRepository(struct TRITONSERVER_Server *server)
Check the model repository for changes and update server state based on those changes.
TRITONSERVER_MEMORY_CPU_PINNED
@ TRITONSERVER_MEMORY_CPU_PINNED
Definition: tritonserver.h:165
TRITONSERVER_ResponseCompleteFlag
enum tritonserver_responsecompleteflag_enum TRITONSERVER_ResponseCompleteFlag
Inference response complete flags.
TRITONSERVER_ServerUnloadModelAndDependents
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerUnloadModelAndDependents(struct TRITONSERVER_Server *server, const char *model_name)
Unload the requested model, and also unload any dependent model that was loaded along with the reques...
TRITONSERVER_InferenceRequestSetStringParameter
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestSetStringParameter(struct TRITONSERVER_InferenceRequest *request, const char *key, const char *value)
Set a string parameter in the request.
TRITONSERVER_TRACE_TENSOR_BACKEND_OUTPUT
@ TRITONSERVER_TRACE_TENSOR_BACKEND_OUTPUT
Definition: tritonserver.h:736
TRITONSERVER_MetricArgsSetHistogram
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MetricArgsSetHistogram(struct TRITONSERVER_MetricArgs *args, const double *buckets, const uint64_t buckets_count)
Set metric args with histogram metric parameter.
TRITONSERVER_MetricsFormatted
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MetricsFormatted(struct TRITONSERVER_Metrics *metrics, TRITONSERVER_MetricFormat format, const char **base, size_t *byte_size)
Get a buffer containing the metrics in the specified format.
TRITONSERVER_ErrorDelete
TRITONSERVER_DECLSPEC void TRITONSERVER_ErrorDelete(struct TRITONSERVER_Error *error)
Delete an error object.
TRITONSERVER_ServerLoadModel
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerLoadModel(struct TRITONSERVER_Server *server, const char *model_name)
Load the requested model or reload the model if it is already loaded.
TRITONSERVER_TYPE_UINT8
@ TRITONSERVER_TYPE_UINT8
Definition: tritonserver.h:118
TRITONSERVER_ServerOptionsSetMinSupportedComputeCapability
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetMinSupportedComputeCapability(struct TRITONSERVER_ServerOptions *options, double cc)
Set the minimum supported CUDA compute capability in a server options.
TRITONSERVER_ServerOptionsSetModelRepositoryPath
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetModelRepositoryPath(struct TRITONSERVER_ServerOptions *options, const char *model_repository_path)
Set the model repository path in a server options.
TRITONSERVER_TYPE_INT32
@ TRITONSERVER_TYPE_INT32
Definition: tritonserver.h:124
TRITONSERVER_ServerOptionsSetStrictModelConfig
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetStrictModelConfig(struct TRITONSERVER_ServerOptions *options, bool strict)
Enable or disable strict model configuration handling in a server options.
TRITONSERVER_ParameterBytesNew
TRITONSERVER_DECLSPEC struct TRITONSERVER_Parameter * TRITONSERVER_ParameterBytesNew(const char *name, const void *byte_ptr, const uint64_t size)
Create a new parameter object with type TRITONSERVER_PARAMETER_BYTES.
eMode::strict
@ strict
TRITONSERVER_LogMessage
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_LogMessage(TRITONSERVER_LogLevel level, const char *filename, const int line, const char *msg)
Log a message at a given log level if that level is enabled.
TRITONSERVER_ServerOptionsSetExitOnError
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetExitOnError(struct TRITONSERVER_ServerOptions *options, bool exit)
Enable or disable exit-on-error in a server options.
TRITONSERVER_ServerUnregisterModelRepository
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerUnregisterModelRepository(struct TRITONSERVER_Server *server, const char *repository_path)
Unregister a model repository.
TRITONSERVER_InferenceRequestId
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestId(struct TRITONSERVER_InferenceRequest *inference_request, const char **id)
Get the ID for a request.
TRITONSERVER_InferenceRequestAppendInputDataWithHostPolicy
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestAppendInputDataWithHostPolicy(struct TRITONSERVER_InferenceRequest *inference_request, const char *name, const void *base, size_t byte_size, TRITONSERVER_MemoryType memory_type, int64_t memory_type_id, const char *host_policy_name)
Assign a buffer of data to an input for execution on all model instances with the specified host poli...
TRITONSERVER_InferenceResponseOutputClassificationLabel
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceResponseOutputClassificationLabel(struct TRITONSERVER_InferenceResponse *inference_response, const uint32_t index, const size_t class_index, const char **label)
Get a classification label associated with an output for a given index.
TRITONSERVER_TRACE_LEVEL_MIN
@ TRITONSERVER_TRACE_LEVEL_MIN
Deprecated. Use TRITONSERVER_TRACE_LEVEL_TIMESTAMPS.
Definition: tritonserver.h:707
TRITONSERVER_ServerOptionsSetBufferManagerThreadCount
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetBufferManagerThreadCount(struct TRITONSERVER_ServerOptions *options, unsigned int thread_count)
Set the number of threads used in the buffer manager in a server options.
TRITONSERVER_InferenceTraceTensorNew
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceTraceTensorNew(struct TRITONSERVER_InferenceTrace **trace, TRITONSERVER_InferenceTraceLevel level, uint64_t parent_id, TRITONSERVER_InferenceTraceActivityFn_t activity_fn, TRITONSERVER_InferenceTraceTensorActivityFn_t tensor_activity_fn, TRITONSERVER_InferenceTraceReleaseFn_t release_fn, void *trace_userp)
Create a new inference trace object.
TRITONSERVER_InferenceRequestPriorityUInt64
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestPriorityUInt64(struct TRITONSERVER_InferenceRequest *inference_request, uint64_t *priority)
Get the priority for a request.
TRITONSERVER_InferenceRequestSetPriorityUInt64
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestSetPriorityUInt64(struct TRITONSERVER_InferenceRequest *inference_request, uint64_t priority)
Set the priority for a request.
TRITONSERVER_ServerModelTransactionProperties
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerModelTransactionProperties(struct TRITONSERVER_Server *server, const char *model_name, const int64_t model_version, uint32_t *txn_flags, void **voidp)
Get the transaction policy of the model.
TRITONSERVER_ServerModelIndex
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerModelIndex(struct TRITONSERVER_Server *server, uint32_t flags, struct TRITONSERVER_Message **model_index)
Get the index of all unique models in the model repositories as a TRITONSERVER_Message object.
TRITONSERVER_ResponseAllocatorNew
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ResponseAllocatorNew(struct TRITONSERVER_ResponseAllocator **allocator, TRITONSERVER_ResponseAllocatorAllocFn_t alloc_fn, TRITONSERVER_ResponseAllocatorReleaseFn_t release_fn, TRITONSERVER_ResponseAllocatorStartFn_t start_fn)
Create a new response allocator object.
TRITONSERVER_ERROR_UNAVAILABLE
@ TRITONSERVER_ERROR_UNAVAILABLE
Definition: tritonserver.h:329
TRITONSERVER_INSTANCEGROUPKIND_AUTO
@ TRITONSERVER_INSTANCEGROUPKIND_AUTO
Definition: tritonserver.h:237
TRITONSERVER_ServerLoadModelWithParameters
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerLoadModelWithParameters(struct TRITONSERVER_Server *server, const char *model_name, const struct TRITONSERVER_Parameter **parameters, const uint64_t parameter_count)
Load the requested model or reload the model if it is already loaded, with load parameters provided.
TRITONSERVER_InferenceResponseOutputCount
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceResponseOutputCount(struct TRITONSERVER_InferenceResponse *inference_response, uint32_t *count)
Get the number of outputs available in the response.
TRITONSERVER_InferenceResponseOutput
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceResponseOutput(struct TRITONSERVER_InferenceResponse *inference_response, const uint32_t index, const char **name, TRITONSERVER_DataType *datatype, const int64_t **shape, uint64_t *dim_count, const void **base, size_t *byte_size, TRITONSERVER_MemoryType *memory_type, int64_t *memory_type_id, void **userp)
Get all information about an output tensor.
TRITONSERVER_ServerInferAsync
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerInferAsync(struct TRITONSERVER_Server *server, struct TRITONSERVER_InferenceRequest *inference_request, struct TRITONSERVER_InferenceTrace *trace)
Perform inference using the meta-data and inputs supplied by the 'inference_request'.
TRITONSERVER_TYPE_FP32
@ TRITONSERVER_TYPE_FP32
Definition: tritonserver.h:127
TRITONSERVER_ServerOptionsSetCacheDirectory
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetCacheDirectory(struct TRITONSERVER_ServerOptions *options, const char *cache_dir)
Set the directory containing cache shared libraries.
TRITONSERVER_METRIC_KIND_HISTOGRAM
@ TRITONSERVER_METRIC_KIND_HISTOGRAM
Definition: tritonserver.h:2620
TRITONSERVER_instancegroupkind_enum
TRITONSERVER_instancegroupkind_enum
TRITONSERVER_InstanceGroupKind.
Definition: tritonserver.h:236
TRITONSERVER_ServerOptionsSetModelLoadRetryCount
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetModelLoadRetryCount(struct TRITONSERVER_ServerOptions *options, unsigned int retry_count)
Set the number of retries to load a model in a server options.
tritonserver_modelcontrolmode_enum
tritonserver_modelcontrolmode_enum
TRITONSERVER_ServerOptions.
Definition: tritonserver.h:1761
TRITONSERVER_TRACE_TENSOR_BACKEND_INPUT
@ TRITONSERVER_TRACE_TENSOR_BACKEND_INPUT
Definition: tritonserver.h:735
TRITONSERVER_ServerOptionsSetExitTimeout
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetExitTimeout(struct TRITONSERVER_ServerOptions *options, unsigned int timeout)
Set the exit timeout, in seconds, for the server in a server options.
TRITONSERVER_loglevel_enum
TRITONSERVER_loglevel_enum
TRITONSERVER_Logging.
Definition: tritonserver.h:256
TRITONSERVER_InferenceRequestSetDoubleParameter
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestSetDoubleParameter(struct TRITONSERVER_InferenceRequest *request, const char *key, const double value)
Set a double parameter in the request.
TRITONSERVER_InferenceRequestSetReleaseCallback
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestSetReleaseCallback(struct TRITONSERVER_InferenceRequest *inference_request, TRITONSERVER_InferenceRequestReleaseFn_t request_release_fn, void *request_release_userp)
Set the release callback for an inference request.
TRITONSERVER_ERROR_UNSUPPORTED
@ TRITONSERVER_ERROR_UNSUPPORTED
Definition: tritonserver.h:330
TRITONSERVER_ServerOptionsSetResponseCacheByteSize
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetResponseCacheByteSize(struct TRITONSERVER_ServerOptions *options, uint64_t size)
Deprecated.
TRITONSERVER_GetMetricFamilyKind
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_GetMetricFamilyKind(struct TRITONSERVER_MetricFamily *family, TRITONSERVER_MetricKind *kind)
Get the TRITONSERVER_MetricKind of the metric family.
TRITONSERVER_InstanceGroupKindString
const TRITONSERVER_DECLSPEC char * TRITONSERVER_InstanceGroupKindString(TRITONSERVER_InstanceGroupKind kind)
Get the string representation of an instance-group kind.
TRITONSERVER_RateLimitMode
enum tritonserver_ratelimitmode_enum TRITONSERVER_RateLimitMode
Rate limit modes.
TRITONSERVER_TRACE_CUSTOM_ACTIVITY
@ TRITONSERVER_TRACE_CUSTOM_ACTIVITY
Definition: tritonserver.h:737
TRITONSERVER_InferenceTraceId
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceTraceId(struct TRITONSERVER_InferenceTrace *trace, uint64_t *id)
Get the id associated with a trace.
TRITONSERVER_LOG_ERROR
@ TRITONSERVER_LOG_ERROR
Definition: tritonserver.h:259
TRITONSERVER_InferenceRequestAddRequestedOutput
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestAddRequestedOutput(struct TRITONSERVER_InferenceRequest *inference_request, const char *name)
Add an output request to an inference request.
TRITONSERVER_MetricFormat
enum tritonserver_metricformat_enum TRITONSERVER_MetricFormat
TRITONSERVER_Metrics.
TRITONSERVER_TRACE_COMPUTE_OUTPUT_START
@ TRITONSERVER_TRACE_COMPUTE_OUTPUT_START
Definition: tritonserver.h:731
TRITONSERVER_InferenceRequestIsCancelled
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestIsCancelled(struct TRITONSERVER_InferenceRequest *inference_request, bool *is_cancelled)
Query whether the request is cancelled or not.
TRITONSERVER_InferenceRequestPriority
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestPriority(struct TRITONSERVER_InferenceRequest *inference_request, uint32_t *priority)
Deprecated.
TRITONSERVER_RESPONSE_COMPLETE_FINAL
@ TRITONSERVER_RESPONSE_COMPLETE_FINAL
Definition: tritonserver.h:972
TRITONSERVER_InferenceTraceDelete
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceTraceDelete(struct TRITONSERVER_InferenceTrace *trace)
Delete a trace object.
TRITONSERVER_InferenceRequestReleaseFn_t
void(* TRITONSERVER_InferenceRequestReleaseFn_t)(struct TRITONSERVER_InferenceRequest *request, const uint32_t flags, void *userp)
Type for inference request release callback function.
Definition: tritonserver.h:1004
TRITONSERVER_LOG_WARN
@ TRITONSERVER_LOG_WARN
Definition: tritonserver.h:258
TRITONSERVER_datatype_enum
TRITONSERVER_datatype_enum
TRITONSERVER_DataType.
Definition: tritonserver.h:115
tritonserver_metricformat_enum
tritonserver_metricformat_enum
TRITONSERVER_Metrics.
Definition: tritonserver.h:652
TRITONSERVER_ParameterNew
TRITONSERVER_DECLSPEC struct TRITONSERVER_Parameter * TRITONSERVER_ParameterNew(const char *name, const TRITONSERVER_ParameterType type, const void *value)
Create a new parameter object.
TRITONSERVER_INSTANCEGROUPKIND_GPU
@ TRITONSERVER_INSTANCEGROUPKIND_GPU
Definition: tritonserver.h:239
TRITONSERVER_InstanceGroupKind
enum TRITONSERVER_instancegroupkind_enum TRITONSERVER_InstanceGroupKind
TRITONSERVER_InstanceGroupKind.
TRITONSERVER_LogIsEnabled
TRITONSERVER_DECLSPEC bool TRITONSERVER_LogIsEnabled(TRITONSERVER_LogLevel level)
Is a log level enabled?
tritonserver_requestflag_enum
tritonserver_requestflag_enum
TRITONSERVER_InferenceRequest.
Definition: tritonserver.h:957
TRITONSERVER_ServerOptionsSetRateLimiterMode
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetRateLimiterMode(struct TRITONSERVER_ServerOptions *options, TRITONSERVER_RateLimitMode mode)
Set the rate limit mode in a server options.
TRITONSERVER_ServerOptionsSetRepoAgentDirectory
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetRepoAgentDirectory(struct TRITONSERVER_ServerOptions *options, const char *repoagent_dir)
Set the directory containing repository agent shared libraries.
TRITONSERVER_TYPE_UINT32
@ TRITONSERVER_TYPE_UINT32
Definition: tritonserver.h:120
TRITONSERVER_InferenceRequestFlags
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestFlags(struct TRITONSERVER_InferenceRequest *inference_request, uint32_t *flags)
Get the flag(s) associated with a request.
TRITONSERVER_ServerModelConfig
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerModelConfig(struct TRITONSERVER_Server *server, const char *model_name, const int64_t model_version, const uint32_t config_version, struct TRITONSERVER_Message **model_config)
Get the configuration of a model as a TRITONSERVER_Message object.
TRITONSERVER_InferenceRequestNew
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestNew(struct TRITONSERVER_InferenceRequest **inference_request, struct TRITONSERVER_Server *server, const char *model_name, const int64_t model_version)
Create a new inference request object.
TRITONSERVER_MetricFamilyNew
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_MetricFamilyNew(struct TRITONSERVER_MetricFamily **family, const TRITONSERVER_MetricKind kind, const char *name, const char *description)
Create a new metric family object.
TRITONSERVER_ServerMetrics
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerMetrics(struct TRITONSERVER_Server *server, struct TRITONSERVER_Metrics **metrics)
Get the current metrics for the server.
TRITONSERVER_InferenceRequestAddInput
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestAddInput(struct TRITONSERVER_InferenceRequest *inference_request, const char *name, const TRITONSERVER_DataType datatype, const int64_t *shape, uint64_t dim_count)
Add an input to a request.
TRITONSERVER_ServerOptionsSetServerId
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetServerId(struct TRITONSERVER_ServerOptions *options, const char *server_id)
Set the textual ID for the server in a server options.
TRITONSERVER_ServerDelete
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerDelete(struct TRITONSERVER_Server *server)
Delete a server object.
TRITONSERVER_ModelIndexFlag
enum tritonserver_modelindexflag_enum TRITONSERVER_ModelIndexFlag
Model index flags. The enum values must be power-of-2 values.
TRITONSERVER_TRACE_LEVEL_MAX
@ TRITONSERVER_TRACE_LEVEL_MAX
Deprecated. Use TRITONSERVER_TRACE_LEVEL_TIMESTAMPS.
Definition: tritonserver.h:709
TRITONSERVER_BufferAttributesSetCudaIpcHandle
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_BufferAttributesSetCudaIpcHandle(struct TRITONSERVER_BufferAttributes *buffer_attributes, void *cuda_ipc_handle)
Set the CudaIpcHandle field of the buffer attributes.
TRITONSERVER_TRACE_REQUEST_START
@ TRITONSERVER_TRACE_REQUEST_START
Definition: tritonserver.h:727
TRITONSERVER_ServerOptionsSetLogFile
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetLogFile(struct TRITONSERVER_ServerOptions *options, const char *file)
Provide a log output file.
TRITONSERVER_ServerOptionsSetStartupModel
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetStartupModel(struct TRITONSERVER_ServerOptions *options, const char *model_name)
Set the model to be loaded at startup in a server options.
TRITONSERVER_PARAMETER_BOOL
@ TRITONSERVER_PARAMETER_BOOL
Definition: tritonserver.h:185
TRITONSERVER_InferenceResponseParameterCount
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceResponseParameterCount(struct TRITONSERVER_InferenceResponse *inference_response, uint32_t *count)
Get the number of parameters available in the response.
TRITONSERVER_ServerOptionsSetMetricsInterval
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetMetricsInterval(struct TRITONSERVER_ServerOptions *options, uint64_t metrics_interval_ms)
Set the interval for metrics collection in a server options.
TRITONSERVER_BufferAttributesCudaIpcHandle
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_BufferAttributesCudaIpcHandle(struct TRITONSERVER_BufferAttributes *buffer_attributes, void **cuda_ipc_handle)
Get the CudaIpcHandle field of the buffer attributes object.
TRITONSERVER_InferenceRequestRemoveAllRequestedOutputs
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestRemoveAllRequestedOutputs(struct TRITONSERVER_InferenceRequest *inference_request)
Remove all output requests from an inference request.
TRITONSERVER_ModelBatchFlag
enum tritonserver_batchflag_enum TRITONSERVER_ModelBatchFlag
TRITONSERVER_Server.
TRITONSERVER_ServerSetExitTimeout
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerSetExitTimeout(struct TRITONSERVER_Server *server, unsigned int timeout)
Set the exit timeout on the server object.
TRITONSERVER_ErrorCode
TRITONSERVER_DECLSPEC TRITONSERVER_Error_Code TRITONSERVER_ErrorCode(struct TRITONSERVER_Error *error)
Get the error code.
TRITONSERVER_InferenceRequestCorrelationId
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestCorrelationId(struct TRITONSERVER_InferenceRequest *inference_request, uint64_t *correlation_id)
Get the correlation ID of the inference request as an unsigned integer.
TRITONSERVER_MEMORY_GPU
@ TRITONSERVER_MEMORY_GPU
Definition: tritonserver.h:166
TRITONSERVER_ServerOptionsSetLogVerbose
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetLogVerbose(struct TRITONSERVER_ServerOptions *options, int level)
Set verbose logging level.
tritonserver_requestreleaseflag_enum
tritonserver_requestreleaseflag_enum
Inference request release flags.
Definition: tritonserver.h:964
TRITONSERVER_InferenceTraceRequestId
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceTraceRequestId(struct TRITONSERVER_InferenceTrace *trace, const char **request_id)
Get the request id associated with a trace.
TRITONSERVER_InferenceTraceParentId
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceTraceParentId(struct TRITONSERVER_InferenceTrace *trace, uint64_t *parent_id)
Get the parent id associated with a trace.
TRITONSERVER_ServerOptionsSetCacheConfig
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetCacheConfig(struct TRITONSERVER_ServerOptions *options, const char *cache_name, const char *config_json)
Set the cache config that will be used to initialize the cache implementation for "cache_name".
TRITONSERVER_InferenceRequestSetCorrelationIdString
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestSetCorrelationIdString(struct TRITONSERVER_InferenceRequest *inference_request, const char *correlation_id)
Set the correlation ID of the inference request to be a string.
tritonserver_ratelimitmode_enum
tritonserver_ratelimitmode_enum
Rate limit modes.
Definition: tritonserver.h:1768
TRITONSERVER_BATCH_FIRST_DIM
@ TRITONSERVER_BATCH_FIRST_DIM
Definition: tritonserver.h:2272
TRITONSERVER_ServerOptionsSetLogFormat
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetLogFormat(struct TRITONSERVER_ServerOptions *options, const TRITONSERVER_LogFormat format)
Set the logging format.
TRITONSERVER_InferenceTraceReportActivity
TRITONSERVER_DECLSPEC TRITONSERVER_Error * TRITONSERVER_InferenceTraceReportActivity(TRITONSERVER_InferenceTrace *trace, uint64_t timestamp, const char *activity_name)
Report a trace activity.
TRITONSERVER_InferenceRequestSetResponseCallback
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestSetResponseCallback(struct TRITONSERVER_InferenceRequest *inference_request, struct TRITONSERVER_ResponseAllocator *response_allocator, void *response_allocator_userp, TRITONSERVER_InferenceResponseCompleteFn_t response_fn, void *response_userp)
Set the allocator and response callback for an inference request.
TRITONSERVER_INSTANCEGROUPKIND_CPU
@ TRITONSERVER_INSTANCEGROUPKIND_CPU
Definition: tritonserver.h:238
TRITONSERVER_ServerOptionsSetModelNamespacing
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetModelNamespacing(struct TRITONSERVER_ServerOptions *options, bool enable_namespace)
Enable model namespacing to allow serving models with the same name if they are in different namespac...
TRITONSERVER_InferenceRequestRemoveAllInputs
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_InferenceRequestRemoveAllInputs(struct TRITONSERVER_InferenceRequest *inference_request)
Remove all inputs from a request.
TRITONSERVER_ServerOptionsSetModelLoadThreadCount
TRITONSERVER_DECLSPEC struct TRITONSERVER_Error * TRITONSERVER_ServerOptionsSetModelLoadThreadCount(struct TRITONSERVER_ServerOptions *options, unsigned int thread_count)
Set the number of threads to concurrently load models in a server options.