static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ApiVersion(int[] major,
int[] minor) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ApiVersion(IntBuffer major,
IntBuffer minor) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ApiVersion(IntPointer major,
IntPointer minor)
Get the TRITONBACKEND API version supported by Triton.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_BackendArtifacts(TRITONBACKEND_Backend backend,
int[] artifact_type,
byte[] location) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_BackendArtifacts(TRITONBACKEND_Backend backend,
IntBuffer artifact_type,
ByteBuffer location) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_BackendArtifacts(TRITONBACKEND_Backend backend,
IntPointer artifact_type,
BytePointer location) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_BackendArtifacts(TRITONBACKEND_Backend backend,
IntPointer artifact_type,
PointerPointer location)
Get the location of the files that make up the backend
implementation.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_BackendAttributeAddPreferredInstanceGroup(TRITONBACKEND_BackendAttribute backend_attributes,
int kind,
long count,
long[] device_ids,
long id_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_BackendAttributeAddPreferredInstanceGroup(TRITONBACKEND_BackendAttribute backend_attributes,
int kind,
long count,
LongBuffer device_ids,
long id_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_BackendAttributeAddPreferredInstanceGroup(TRITONBACKEND_BackendAttribute backend_attributes,
int kind,
long count,
LongPointer device_ids,
long id_count)
TRITONBACKEND_BackendAttribute
API to modify attributes associated with a backend.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_BackendAttributeSetParallelModelInstanceLoading(TRITONBACKEND_BackendAttribute backend_attributes,
boolean enabled)
Sets whether or not the backend supports concurrently loading multiple
TRITONBACKEND_ModelInstances in a thread-safe manner.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_BackendConfig(TRITONBACKEND_Backend backend,
PointerPointer backend_config)
Get the backend configuration.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_BackendConfig(TRITONBACKEND_Backend backend,
TRITONSERVER_Message backend_config) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_BackendExecutionPolicy(TRITONBACKEND_Backend backend,
int[] policy) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_BackendExecutionPolicy(TRITONBACKEND_Backend backend,
IntBuffer policy) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_BackendExecutionPolicy(TRITONBACKEND_Backend backend,
IntPointer policy)
Get the execution policy for this backend.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_BackendMemoryManager(TRITONBACKEND_Backend backend,
PointerPointer manager)
Get the memory manager associated with a backend.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_BackendMemoryManager(TRITONBACKEND_Backend backend,
TRITONBACKEND_MemoryManager manager) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_BackendName(TRITONBACKEND_Backend backend,
byte[] name) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_BackendName(TRITONBACKEND_Backend backend,
ByteBuffer name) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_BackendName(TRITONBACKEND_Backend backend,
BytePointer name) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_BackendName(TRITONBACKEND_Backend backend,
PointerPointer name)
Get the name of the backend.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_BackendSetExecutionPolicy(TRITONBACKEND_Backend backend,
int policy)
Set the execution policy for this backend.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_BackendSetState(TRITONBACKEND_Backend backend,
Pointer state)
Set the user-specified state associated with the backend.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_BackendState(TRITONBACKEND_Backend backend,
Pointer state) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_BackendState(TRITONBACKEND_Backend backend,
PointerPointer state)
Get the user-specified state associated with the backend.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_Finalize(TRITONBACKEND_Backend backend)
Finalize for a backend.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_GetBackendAttribute(TRITONBACKEND_Backend backend,
TRITONBACKEND_BackendAttribute backend_attributes)
Query the backend for different model attributes.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InferenceRequestTimeoutMicroseconds(TRITONBACKEND_Request request,
long[] timeout) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InferenceRequestTimeoutMicroseconds(TRITONBACKEND_Request request,
LongBuffer timeout) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InferenceRequestTimeoutMicroseconds(TRITONBACKEND_Request request,
LongPointer timeout)
Get the timeout of the request.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InferenceResponseOutput(TRITONBACKEND_Response response,
int index,
byte[] name,
int[] datatype,
long[] shape,
long[] dim_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InferenceResponseOutput(TRITONBACKEND_Response response,
int index,
ByteBuffer name,
IntBuffer datatype,
LongBuffer shape,
LongBuffer dim_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InferenceResponseOutput(TRITONBACKEND_Response response,
int index,
BytePointer name,
IntPointer datatype,
LongPointer shape,
LongPointer dim_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InferenceResponseOutput(TRITONBACKEND_Response response,
int index,
PointerPointer name,
IntPointer datatype,
PointerPointer shape,
LongPointer dim_count)
Get all information about an output tensor by its index.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InferenceResponseOutputByName(TRITONBACKEND_Response response,
BytePointer name,
int[] datatype,
long[] shape,
long[] dim_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InferenceResponseOutputByName(TRITONBACKEND_Response response,
BytePointer name,
IntBuffer datatype,
LongBuffer shape,
LongBuffer dim_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InferenceResponseOutputByName(TRITONBACKEND_Response response,
BytePointer name,
IntPointer datatype,
LongPointer shape,
LongPointer dim_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InferenceResponseOutputByName(TRITONBACKEND_Response response,
String name,
int[] datatype,
long[] shape,
long[] dim_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InferenceResponseOutputByName(TRITONBACKEND_Response response,
String name,
IntBuffer datatype,
LongBuffer shape,
LongBuffer dim_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InferenceResponseOutputByName(TRITONBACKEND_Response response,
String name,
IntPointer datatype,
LongPointer shape,
LongPointer dim_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InferenceResponseOutputByName(TRITONBACKEND_Response response,
String name,
IntPointer datatype,
PointerPointer shape,
LongPointer dim_count)
Get all information about an output tensor by its name.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_Initialize(TRITONBACKEND_Backend backend)
The following functions can be implemented by a backend.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InputBuffer(TRITONBACKEND_Input input,
int index,
Pointer buffer,
long[] buffer_byte_size,
int[] memory_type,
long[] memory_type_id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InputBuffer(TRITONBACKEND_Input input,
int index,
Pointer buffer,
LongBuffer buffer_byte_size,
IntBuffer memory_type,
LongBuffer memory_type_id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InputBuffer(TRITONBACKEND_Input input,
int index,
Pointer buffer,
LongPointer buffer_byte_size,
IntPointer memory_type,
LongPointer memory_type_id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InputBuffer(TRITONBACKEND_Input input,
int index,
PointerPointer buffer,
LongPointer buffer_byte_size,
IntPointer memory_type,
LongPointer memory_type_id)
Get a buffer holding (part of) the tensor data for an input.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InputBufferAttributes(TRITONBACKEND_Input input,
int index,
PointerPointer buffer,
PointerPointer buffer_attributes)
Get the buffer attributes associated with the given input buffer.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InputBufferAttributes(TRITONBACKEND_Input input,
int index,
Pointer buffer,
TRITONSERVER_BufferAttributes buffer_attributes) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InputBufferForHostPolicy(TRITONBACKEND_Input input,
BytePointer host_policy_name,
int index,
Pointer buffer,
long[] buffer_byte_size,
int[] memory_type,
long[] memory_type_id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InputBufferForHostPolicy(TRITONBACKEND_Input input,
BytePointer host_policy_name,
int index,
Pointer buffer,
LongBuffer buffer_byte_size,
IntBuffer memory_type,
LongBuffer memory_type_id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InputBufferForHostPolicy(TRITONBACKEND_Input input,
BytePointer host_policy_name,
int index,
Pointer buffer,
LongPointer buffer_byte_size,
IntPointer memory_type,
LongPointer memory_type_id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InputBufferForHostPolicy(TRITONBACKEND_Input input,
String host_policy_name,
int index,
Pointer buffer,
long[] buffer_byte_size,
int[] memory_type,
long[] memory_type_id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InputBufferForHostPolicy(TRITONBACKEND_Input input,
String host_policy_name,
int index,
Pointer buffer,
LongBuffer buffer_byte_size,
IntBuffer memory_type,
LongBuffer memory_type_id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InputBufferForHostPolicy(TRITONBACKEND_Input input,
String host_policy_name,
int index,
Pointer buffer,
LongPointer buffer_byte_size,
IntPointer memory_type,
LongPointer memory_type_id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InputBufferForHostPolicy(TRITONBACKEND_Input input,
String host_policy_name,
int index,
PointerPointer buffer,
LongPointer buffer_byte_size,
IntPointer memory_type,
LongPointer memory_type_id)
Get a buffer holding (part of) the tensor data for an input for a specific
host policy.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InputProperties(TRITONBACKEND_Input input,
byte[] name,
int[] datatype,
long[] shape,
int[] dims_count,
long[] byte_size,
int[] buffer_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InputProperties(TRITONBACKEND_Input input,
ByteBuffer name,
IntBuffer datatype,
LongBuffer shape,
IntBuffer dims_count,
LongBuffer byte_size,
IntBuffer buffer_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InputProperties(TRITONBACKEND_Input input,
BytePointer name,
IntPointer datatype,
LongPointer shape,
IntPointer dims_count,
LongPointer byte_size,
IntPointer buffer_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InputProperties(TRITONBACKEND_Input input,
PointerPointer name,
IntPointer datatype,
PointerPointer shape,
IntPointer dims_count,
LongPointer byte_size,
IntPointer buffer_count)
TRITONBACKEND_Input
Object representing an input tensor.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InputPropertiesForHostPolicy(TRITONBACKEND_Input input,
BytePointer host_policy_name,
byte[] name,
int[] datatype,
long[] shape,
int[] dims_count,
long[] byte_size,
int[] buffer_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InputPropertiesForHostPolicy(TRITONBACKEND_Input input,
BytePointer host_policy_name,
ByteBuffer name,
IntBuffer datatype,
LongBuffer shape,
IntBuffer dims_count,
LongBuffer byte_size,
IntBuffer buffer_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InputPropertiesForHostPolicy(TRITONBACKEND_Input input,
BytePointer host_policy_name,
BytePointer name,
IntPointer datatype,
LongPointer shape,
IntPointer dims_count,
LongPointer byte_size,
IntPointer buffer_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InputPropertiesForHostPolicy(TRITONBACKEND_Input input,
String host_policy_name,
byte[] name,
int[] datatype,
long[] shape,
int[] dims_count,
long[] byte_size,
int[] buffer_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InputPropertiesForHostPolicy(TRITONBACKEND_Input input,
String host_policy_name,
ByteBuffer name,
IntBuffer datatype,
LongBuffer shape,
IntBuffer dims_count,
LongBuffer byte_size,
IntBuffer buffer_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InputPropertiesForHostPolicy(TRITONBACKEND_Input input,
String host_policy_name,
BytePointer name,
IntPointer datatype,
LongPointer shape,
IntPointer dims_count,
LongPointer byte_size,
IntPointer buffer_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_InputPropertiesForHostPolicy(TRITONBACKEND_Input input,
String host_policy_name,
PointerPointer name,
IntPointer datatype,
PointerPointer shape,
IntPointer dims_count,
LongPointer byte_size,
IntPointer buffer_count)
Get the name and properties of an input tensor associated with a given
host policy.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_MemoryManagerAllocate(TRITONBACKEND_MemoryManager manager,
Pointer buffer,
int memory_type,
long memory_type_id,
long byte_size) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_MemoryManagerAllocate(TRITONBACKEND_MemoryManager manager,
PointerPointer buffer,
int memory_type,
long memory_type_id,
long byte_size)
TRITONBACKEND_MemoryManager
Object representing a memory manager that is capable of
allocating and otherwise managing different memory types.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_MemoryManagerFree(TRITONBACKEND_MemoryManager manager,
Pointer buffer,
int memory_type,
long memory_type_id)
Free a buffer that was previously allocated with
TRITONBACKEND_MemoryManagerAllocate.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelAutoCompleteConfig(TRITONBACKEND_Model model,
boolean[] auto_complete_config)
Whether the backend should attempt to auto-complete the model configuration.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelAutoCompleteConfig(TRITONBACKEND_Model model,
BoolPointer auto_complete_config) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelBackend(TRITONBACKEND_Model model,
PointerPointer backend)
Get the backend used by the model.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelBackend(TRITONBACKEND_Model model,
TRITONBACKEND_Backend backend) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelBatcherFinalize(TRITONBACKEND_Batcher batcher)
Free memory associated with batcher.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelBatcherInitialize(PointerPointer batcher,
TRITONBACKEND_Model model)
TRITONBACKEND Batching
API to add custom batching strategy
The following functions can be implemented by a backend to add custom
batching conditionals on top of the existing Triton batching strategy.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelBatcherInitialize(TRITONBACKEND_Batcher batcher,
TRITONBACKEND_Model model) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelBatchFinalize(Pointer userp)
Callback to be invoked when Triton has finished forming a batch.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelBatchIncludeRequest(TRITONBACKEND_Request request,
Pointer userp,
boolean[] should_include)
Check whether a request should be added to the pending model batch.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelBatchIncludeRequest(TRITONBACKEND_Request request,
Pointer userp,
BoolPointer should_include) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelBatchInitialize(TRITONBACKEND_Batcher batcher,
Pointer userp) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelBatchInitialize(TRITONBACKEND_Batcher batcher,
PointerPointer userp) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelConfig(TRITONBACKEND_Model model,
int config_version,
PointerPointer model_config)
Get the model configuration.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelConfig(TRITONBACKEND_Model model,
int config_version,
TRITONSERVER_Message model_config) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelFinalize(TRITONBACKEND_Model model)
Finalize for a model.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInitialize(TRITONBACKEND_Model model)
Initialize for a model.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceDeviceId(TRITONBACKEND_ModelInstance instance,
int[] device_id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceDeviceId(TRITONBACKEND_ModelInstance instance,
IntBuffer device_id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceDeviceId(TRITONBACKEND_ModelInstance instance,
IntPointer device_id)
Get the device ID of the model instance.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceExecute(TRITONBACKEND_ModelInstance instance,
PointerPointer requests,
int request_count)
Execute a batch of one or more requests on a model instance.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceExecute(TRITONBACKEND_ModelInstance instance,
TRITONBACKEND_Request requests,
int request_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceFinalize(TRITONBACKEND_ModelInstance instance)
Finalize for a model instance.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceHostPolicy(TRITONBACKEND_ModelInstance instance,
PointerPointer host_policy)
Get the host policy setting.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceHostPolicy(TRITONBACKEND_ModelInstance instance,
TRITONSERVER_Message host_policy) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceInitialize(TRITONBACKEND_ModelInstance instance)
Initialize for a model instance.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceIsPassive(TRITONBACKEND_ModelInstance instance,
boolean[] is_passive)
Whether the model instance is passive.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceIsPassive(TRITONBACKEND_ModelInstance instance,
BoolPointer is_passive) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceKind(TRITONBACKEND_ModelInstance instance,
int[] kind) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceKind(TRITONBACKEND_ModelInstance instance,
IntBuffer kind) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceKind(TRITONBACKEND_ModelInstance instance,
IntPointer kind)
Get the kind of the model instance.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceModel(TRITONBACKEND_ModelInstance instance,
PointerPointer model)
Get the model associated with a model instance.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceModel(TRITONBACKEND_ModelInstance instance,
TRITONBACKEND_Model model) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceName(TRITONBACKEND_ModelInstance instance,
byte[] name) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceName(TRITONBACKEND_ModelInstance instance,
ByteBuffer name) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceName(TRITONBACKEND_ModelInstance instance,
BytePointer name) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceName(TRITONBACKEND_ModelInstance instance,
PointerPointer name)
TRITONBACKEND_ModelInstance
Object representing a model instance implemented using the
backend.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceProfileCount(TRITONBACKEND_ModelInstance instance,
int[] count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceProfileCount(TRITONBACKEND_ModelInstance instance,
IntBuffer count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceProfileCount(TRITONBACKEND_ModelInstance instance,
IntPointer count)
Get the number of optimization profiles to be loaded for the instance.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceProfileName(TRITONBACKEND_ModelInstance instance,
int index,
byte[] profile_name) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceProfileName(TRITONBACKEND_ModelInstance instance,
int index,
ByteBuffer profile_name) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceProfileName(TRITONBACKEND_ModelInstance instance,
int index,
BytePointer profile_name) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceProfileName(TRITONBACKEND_ModelInstance instance,
int index,
PointerPointer profile_name)
Get the name of an optimization profile.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceReportBatchStatistics(TRITONBACKEND_ModelInstance instance,
long batch_size,
long exec_start_ns,
long compute_start_ns,
long compute_end_ns,
long exec_end_ns)
Record statistics for the execution of an entire batch of
inference requests.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceReportMemoryUsage(TRITONBACKEND_ModelInstance instance,
PointerPointer usage,
int usage_size)
Report the memory usage of the model instance that will be released on
TRITONBACKEND_ModelInstanceFinalize.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceReportMemoryUsage(TRITONBACKEND_ModelInstance instance,
TRITONSERVER_BufferAttributes usage,
int usage_size) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceReportStatistics(TRITONBACKEND_ModelInstance instance,
TRITONBACKEND_Request request,
boolean success,
long exec_start_ns,
long compute_start_ns,
long compute_end_ns,
long exec_end_ns)
Record statistics for an inference request.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceSecondaryDeviceCount(TRITONBACKEND_ModelInstance instance,
int[] count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceSecondaryDeviceCount(TRITONBACKEND_ModelInstance instance,
IntBuffer count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceSecondaryDeviceCount(TRITONBACKEND_ModelInstance instance,
IntPointer count)
Get the number of secondary devices configured for the instance.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceSecondaryDeviceProperties(TRITONBACKEND_ModelInstance instance,
int index,
byte[] kind,
long[] id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceSecondaryDeviceProperties(TRITONBACKEND_ModelInstance instance,
int index,
ByteBuffer kind,
LongBuffer id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceSecondaryDeviceProperties(TRITONBACKEND_ModelInstance instance,
int index,
BytePointer kind,
LongPointer id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceSecondaryDeviceProperties(TRITONBACKEND_ModelInstance instance,
int index,
PointerPointer kind,
LongPointer id)
Get the properties of the indexed secondary device.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceSetState(TRITONBACKEND_ModelInstance instance,
Pointer state)
Set the user-specified state associated with the model
instance.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceState(TRITONBACKEND_ModelInstance instance,
Pointer state) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelInstanceState(TRITONBACKEND_ModelInstance instance,
PointerPointer state)
Get the user-specified state associated with the model
instance.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelName(TRITONBACKEND_Model model,
byte[] name) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelName(TRITONBACKEND_Model model,
ByteBuffer name) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelName(TRITONBACKEND_Model model,
BytePointer name) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelName(TRITONBACKEND_Model model,
PointerPointer name)
TRITONBACKEND_Model
Object representing a model implemented using the backend.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelReportMemoryUsage(TRITONBACKEND_Model model,
PointerPointer usage,
int usage_size)
Report the memory usage of the model that will be released on
TRITONBACKEND_ModelFinalize.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelReportMemoryUsage(TRITONBACKEND_Model model,
TRITONSERVER_BufferAttributes usage,
int usage_size) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelRepository(TRITONBACKEND_Model model,
int[] artifact_type,
byte[] location) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelRepository(TRITONBACKEND_Model model,
IntBuffer artifact_type,
ByteBuffer location) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelRepository(TRITONBACKEND_Model model,
IntPointer artifact_type,
BytePointer location) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelRepository(TRITONBACKEND_Model model,
IntPointer artifact_type,
PointerPointer location)
Get the location of the files that make up the model.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelServer(TRITONBACKEND_Model model,
PointerPointer server)
Get the TRITONSERVER_Server object that this model is being served
by.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelServer(TRITONBACKEND_Model model,
TRITONSERVER_Server server) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelSetConfig(TRITONBACKEND_Model model,
int config_version,
TRITONSERVER_Message model_config)
Set the model configuration in Triton server.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelSetState(TRITONBACKEND_Model model,
Pointer state)
Set the user-specified state associated with the model.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelState(TRITONBACKEND_Model model,
Pointer state) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelState(TRITONBACKEND_Model model,
PointerPointer state)
Get the user-specified state associated with the model.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelVersion(TRITONBACKEND_Model model,
long[] version) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelVersion(TRITONBACKEND_Model model,
LongBuffer version) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ModelVersion(TRITONBACKEND_Model model,
LongPointer version)
Get the version of the model.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_OutputBuffer(TRITONBACKEND_Output output,
Pointer buffer,
long buffer_byte_size,
int[] memory_type,
long[] memory_type_id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_OutputBuffer(TRITONBACKEND_Output output,
Pointer buffer,
long buffer_byte_size,
IntBuffer memory_type,
LongBuffer memory_type_id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_OutputBuffer(TRITONBACKEND_Output output,
Pointer buffer,
long buffer_byte_size,
IntPointer memory_type,
LongPointer memory_type_id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_OutputBuffer(TRITONBACKEND_Output output,
PointerPointer buffer,
long buffer_byte_size,
IntPointer memory_type,
LongPointer memory_type_id)
TRITONBACKEND_Output
Object representing a response output tensor.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_OutputBufferAttributes(TRITONBACKEND_Output output,
PointerPointer buffer_attributes)
Get the buffer attributes associated with the given output buffer.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_OutputBufferAttributes(TRITONBACKEND_Output output,
TRITONSERVER_BufferAttributes buffer_attributes) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestCorrelationId(TRITONBACKEND_Request request,
long[] id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestCorrelationId(TRITONBACKEND_Request request,
LongBuffer id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestCorrelationId(TRITONBACKEND_Request request,
LongPointer id)
Get the correlation ID of the request if it is an unsigned integer.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestCorrelationIdString(TRITONBACKEND_Request request,
byte[] id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestCorrelationIdString(TRITONBACKEND_Request request,
ByteBuffer id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestCorrelationIdString(TRITONBACKEND_Request request,
BytePointer id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestCorrelationIdString(TRITONBACKEND_Request request,
PointerPointer id)
Get the correlation ID of the request if it is a string.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestFlags(TRITONBACKEND_Request request,
int[] flags) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestFlags(TRITONBACKEND_Request request,
IntBuffer flags) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestFlags(TRITONBACKEND_Request request,
IntPointer flags)
Get the flag(s) associated with a request.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestId(TRITONBACKEND_Request request,
byte[] id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestId(TRITONBACKEND_Request request,
ByteBuffer id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestId(TRITONBACKEND_Request request,
BytePointer id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestId(TRITONBACKEND_Request request,
PointerPointer id)
TRITONBACKEND_Request
Object representing an inference request.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestInput(TRITONBACKEND_Request request,
BytePointer name,
TRITONBACKEND_Input input) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestInput(TRITONBACKEND_Request request,
String name,
PointerPointer input)
Get a named request input.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestInput(TRITONBACKEND_Request request,
String name,
TRITONBACKEND_Input input) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestInputByIndex(TRITONBACKEND_Request request,
int index,
PointerPointer input)
Get a request input by index.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestInputByIndex(TRITONBACKEND_Request request,
int index,
TRITONBACKEND_Input input) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestInputCount(TRITONBACKEND_Request request,
int[] count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestInputCount(TRITONBACKEND_Request request,
IntBuffer count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestInputCount(TRITONBACKEND_Request request,
IntPointer count)
Get the number of input tensors specified in the request.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestInputName(TRITONBACKEND_Request request,
int index,
byte[] input_name) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestInputName(TRITONBACKEND_Request request,
int index,
ByteBuffer input_name) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestInputName(TRITONBACKEND_Request request,
int index,
BytePointer input_name) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestInputName(TRITONBACKEND_Request request,
int index,
PointerPointer input_name)
Get the name of an input tensor.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestIsCancelled(TRITONBACKEND_Request request,
boolean[] is_cancelled)
Query whether the request is cancelled or not.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestIsCancelled(TRITONBACKEND_Request request,
BoolPointer is_cancelled) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestOutputBufferProperties(TRITONBACKEND_Request request,
BytePointer name,
SizeTPointer byte_size,
int[] memory_type,
long[] memory_type_id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestOutputBufferProperties(TRITONBACKEND_Request request,
BytePointer name,
SizeTPointer byte_size,
IntBuffer memory_type,
LongBuffer memory_type_id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestOutputBufferProperties(TRITONBACKEND_Request request,
BytePointer name,
SizeTPointer byte_size,
IntPointer memory_type,
LongPointer memory_type_id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestOutputBufferProperties(TRITONBACKEND_Request request,
String name,
SizeTPointer byte_size,
int[] memory_type,
long[] memory_type_id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestOutputBufferProperties(TRITONBACKEND_Request request,
String name,
SizeTPointer byte_size,
IntBuffer memory_type,
LongBuffer memory_type_id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestOutputBufferProperties(TRITONBACKEND_Request request,
String name,
SizeTPointer byte_size,
IntPointer memory_type,
LongPointer memory_type_id)
Returns the preferred memory type and memory type ID of the output buffer
for the request.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestOutputCount(TRITONBACKEND_Request request,
int[] count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestOutputCount(TRITONBACKEND_Request request,
IntBuffer count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestOutputCount(TRITONBACKEND_Request request,
IntPointer count)
Get the number of output tensors requested to be returned in the
request.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestOutputName(TRITONBACKEND_Request request,
int index,
byte[] output_name) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestOutputName(TRITONBACKEND_Request request,
int index,
ByteBuffer output_name) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestOutputName(TRITONBACKEND_Request request,
int index,
BytePointer output_name) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestOutputName(TRITONBACKEND_Request request,
int index,
PointerPointer output_name)
Get the name of a requested output tensor.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestParameter(TRITONBACKEND_Request request,
int index,
byte[] key,
int[] type,
Pointer vvalue) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestParameter(TRITONBACKEND_Request request,
int index,
ByteBuffer key,
IntBuffer type,
Pointer vvalue) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestParameter(TRITONBACKEND_Request request,
int index,
BytePointer key,
IntPointer type,
Pointer vvalue) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestParameter(TRITONBACKEND_Request request,
int index,
PointerPointer key,
IntPointer type,
PointerPointer vvalue)
Get a request parameter by index.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestParameterCount(TRITONBACKEND_Request request,
int[] count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestParameterCount(TRITONBACKEND_Request request,
IntBuffer count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestParameterCount(TRITONBACKEND_Request request,
IntPointer count)
Get the number of parameters specified in the inference request.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestRelease(TRITONBACKEND_Request request,
int release_flags)
Release the request.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestTrace(TRITONBACKEND_Request request,
PointerPointer trace)
Get the trace associated with a request.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_RequestTrace(TRITONBACKEND_Request request,
TRITONSERVER_InferenceTrace trace) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ResponseDelete(TRITONBACKEND_Response response)
Destroy a response.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ResponseFactoryDelete(TRITONBACKEND_ResponseFactory factory)
Destroy a response factory.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ResponseFactoryIsCancelled(TRITONBACKEND_ResponseFactory factory,
boolean[] is_cancelled)
Query whether the response factory is cancelled or not.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ResponseFactoryIsCancelled(TRITONBACKEND_ResponseFactory factory,
BoolPointer is_cancelled) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ResponseFactoryNew(PointerPointer factory,
TRITONBACKEND_Request request)
TRITONBACKEND_ResponseFactory
Object representing an inference response factory.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ResponseFactoryNew(TRITONBACKEND_ResponseFactory factory,
TRITONBACKEND_Request request) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ResponseFactorySendFlags(TRITONBACKEND_ResponseFactory factory,
int send_flags)
Send response flags without a corresponding response.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ResponseNew(PointerPointer response,
TRITONBACKEND_Request request)
TRITONBACKEND_Response
Object representing an inference response.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ResponseNew(TRITONBACKEND_Response response,
TRITONBACKEND_Request request) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ResponseNewFromFactory(PointerPointer response,
TRITONBACKEND_ResponseFactory factory)
Create a response using a factory.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ResponseNewFromFactory(TRITONBACKEND_Response response,
TRITONBACKEND_ResponseFactory factory) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ResponseOutput(TRITONBACKEND_Response response,
PointerPointer output,
String name,
int datatype,
LongPointer shape,
int dims_count)
Create an output tensor in the response.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ResponseOutput(TRITONBACKEND_Response response,
TRITONBACKEND_Output output,
BytePointer name,
int datatype,
long[] shape,
int dims_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ResponseOutput(TRITONBACKEND_Response response,
TRITONBACKEND_Output output,
BytePointer name,
int datatype,
LongBuffer shape,
int dims_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ResponseOutput(TRITONBACKEND_Response response,
TRITONBACKEND_Output output,
BytePointer name,
int datatype,
LongPointer shape,
int dims_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ResponseOutput(TRITONBACKEND_Response response,
TRITONBACKEND_Output output,
String name,
int datatype,
long[] shape,
int dims_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ResponseOutput(TRITONBACKEND_Response response,
TRITONBACKEND_Output output,
String name,
int datatype,
LongBuffer shape,
int dims_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ResponseOutput(TRITONBACKEND_Response response,
TRITONBACKEND_Output output,
String name,
int datatype,
LongPointer shape,
int dims_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ResponseSend(TRITONBACKEND_Response response,
int send_flags,
TRITONSERVER_Error error)
Send a response.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ResponseSetBoolParameter(TRITONBACKEND_Response response,
BytePointer name,
boolean value) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ResponseSetBoolParameter(TRITONBACKEND_Response response,
String name,
boolean value)
Set a boolean parameter in the response.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ResponseSetIntParameter(TRITONBACKEND_Response response,
BytePointer name,
long value) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ResponseSetIntParameter(TRITONBACKEND_Response response,
String name,
long value)
Set an integer parameter in the response.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ResponseSetStringParameter(TRITONBACKEND_Response response,
BytePointer name,
BytePointer value) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_ResponseSetStringParameter(TRITONBACKEND_Response response,
String name,
String value)
Set a string parameter in the response.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_StateBuffer(TRITONBACKEND_State state,
Pointer buffer,
long buffer_byte_size,
int[] memory_type,
long[] memory_type_id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_StateBuffer(TRITONBACKEND_State state,
Pointer buffer,
long buffer_byte_size,
IntBuffer memory_type,
LongBuffer memory_type_id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_StateBuffer(TRITONBACKEND_State state,
Pointer buffer,
long buffer_byte_size,
IntPointer memory_type,
LongPointer memory_type_id) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_StateBuffer(TRITONBACKEND_State state,
PointerPointer buffer,
long buffer_byte_size,
IntPointer memory_type,
LongPointer memory_type_id)
Get a buffer to use to hold the tensor data for the state.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_StateBufferAttributes(TRITONBACKEND_State state,
PointerPointer buffer_attributes)
Get the buffer attributes associated with the given state buffer.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_StateBufferAttributes(TRITONBACKEND_State state,
TRITONSERVER_BufferAttributes buffer_attributes) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_StateNew(PointerPointer state,
TRITONBACKEND_Request request,
String name,
int datatype,
LongPointer shape,
int dims_count)
TRITONBACKEND_State
Object representing a state.
|
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_StateNew(TRITONBACKEND_State state,
TRITONBACKEND_Request request,
BytePointer name,
int datatype,
long[] shape,
int dims_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_StateNew(TRITONBACKEND_State state,
TRITONBACKEND_Request request,
BytePointer name,
int datatype,
LongBuffer shape,
int dims_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_StateNew(TRITONBACKEND_State state,
TRITONBACKEND_Request request,
BytePointer name,
int datatype,
LongPointer shape,
int dims_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_StateNew(TRITONBACKEND_State state,
TRITONBACKEND_Request request,
String name,
int datatype,
long[] shape,
int dims_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_StateNew(TRITONBACKEND_State state,
TRITONBACKEND_Request request,
String name,
int datatype,
LongBuffer shape,
int dims_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_StateNew(TRITONBACKEND_State state,
TRITONBACKEND_Request request,
String name,
int datatype,
LongPointer shape,
int dims_count) |
static TRITONSERVER_Error |
tritonserver.TRITONBACKEND_StateUpdate(TRITONBACKEND_State state)
Update the state for the sequence.
|
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ApiVersion(int[] major,
int[] minor) |
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ApiVersion(IntBuffer major,
IntBuffer minor) |
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ApiVersion(IntPointer major,
IntPointer minor)
Get the TRITONREPOAGENT API version supported by Triton.
|
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_Finalize(TRITONREPOAGENT_Agent agent)
Finalize for an agent.
|
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_Initialize(TRITONREPOAGENT_Agent agent)
The following functions can be implemented by an agent. Initialize an agent.
|
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ModelAction(TRITONREPOAGENT_Agent agent,
TRITONREPOAGENT_AgentModel model,
int action_type)
Handle an action for a specified model.
|
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ModelConfig(TRITONREPOAGENT_Agent agent,
TRITONREPOAGENT_AgentModel model,
int config_version,
PointerPointer model_config)
Get the model configuration.
|
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ModelConfig(TRITONREPOAGENT_Agent agent,
TRITONREPOAGENT_AgentModel model,
int config_version,
TRITONSERVER_Message model_config) |
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ModelFinalize(TRITONREPOAGENT_Agent agent,
TRITONREPOAGENT_AgentModel model)
Finalize for a model.
|
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ModelInitialize(TRITONREPOAGENT_Agent agent,
TRITONREPOAGENT_AgentModel model)
Initialize a model associated with an agent.
|
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ModelParameter(TRITONREPOAGENT_Agent agent,
TRITONREPOAGENT_AgentModel model,
int index,
byte[] parameter_name,
byte[] parameter_value) |
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ModelParameter(TRITONREPOAGENT_Agent agent,
TRITONREPOAGENT_AgentModel model,
int index,
ByteBuffer parameter_name,
ByteBuffer parameter_value) |
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ModelParameter(TRITONREPOAGENT_Agent agent,
TRITONREPOAGENT_AgentModel model,
int index,
BytePointer parameter_name,
BytePointer parameter_value) |
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ModelParameter(TRITONREPOAGENT_Agent agent,
TRITONREPOAGENT_AgentModel model,
int index,
PointerPointer parameter_name,
PointerPointer parameter_value)
Get a parameter name and value.
|
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ModelParameterCount(TRITONREPOAGENT_Agent agent,
TRITONREPOAGENT_AgentModel model,
int[] count) |
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ModelParameterCount(TRITONREPOAGENT_Agent agent,
TRITONREPOAGENT_AgentModel model,
IntBuffer count) |
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ModelParameterCount(TRITONREPOAGENT_Agent agent,
TRITONREPOAGENT_AgentModel model,
IntPointer count)
Get the number of agent parameters defined for a model.
|
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ModelRepositoryLocation(TRITONREPOAGENT_Agent agent,
TRITONREPOAGENT_AgentModel model,
int[] artifact_type,
byte[] location) |
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ModelRepositoryLocation(TRITONREPOAGENT_Agent agent,
TRITONREPOAGENT_AgentModel model,
IntBuffer artifact_type,
ByteBuffer location) |
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ModelRepositoryLocation(TRITONREPOAGENT_Agent agent,
TRITONREPOAGENT_AgentModel model,
IntPointer artifact_type,
BytePointer location) |
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ModelRepositoryLocation(TRITONREPOAGENT_Agent agent,
TRITONREPOAGENT_AgentModel model,
IntPointer artifact_type,
PointerPointer location)
Get the location of the files that make up the model.
|
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ModelRepositoryLocationAcquire(TRITONREPOAGENT_Agent agent,
TRITONREPOAGENT_AgentModel model,
int artifact_type,
byte[] location) |
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ModelRepositoryLocationAcquire(TRITONREPOAGENT_Agent agent,
TRITONREPOAGENT_AgentModel model,
int artifact_type,
ByteBuffer location) |
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ModelRepositoryLocationAcquire(TRITONREPOAGENT_Agent agent,
TRITONREPOAGENT_AgentModel model,
int artifact_type,
BytePointer location) |
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ModelRepositoryLocationAcquire(TRITONREPOAGENT_Agent agent,
TRITONREPOAGENT_AgentModel model,
int artifact_type,
PointerPointer location)
Acquire a location where the agent can produce a new version of
the model repository files.
|
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ModelRepositoryLocationRelease(TRITONREPOAGENT_Agent agent,
TRITONREPOAGENT_AgentModel model,
BytePointer location) |
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ModelRepositoryLocationRelease(TRITONREPOAGENT_Agent agent,
TRITONREPOAGENT_AgentModel model,
String location)
Discard and release ownership of a previously acquired location
and its contents.
|
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ModelRepositoryUpdate(TRITONREPOAGENT_Agent agent,
TRITONREPOAGENT_AgentModel model,
int artifact_type,
BytePointer location) |
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ModelRepositoryUpdate(TRITONREPOAGENT_Agent agent,
TRITONREPOAGENT_AgentModel model,
int artifact_type,
String location)
Inform Triton that the specified repository location should be used for
the model in place of the original model repository.
|
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ModelSetState(TRITONREPOAGENT_AgentModel model,
Pointer state)
Set the user-specified state associated with the model.
|
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ModelState(TRITONREPOAGENT_AgentModel model,
Pointer state) |
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_ModelState(TRITONREPOAGENT_AgentModel model,
PointerPointer state)
Get the user-specified state associated with the model.
|
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_SetState(TRITONREPOAGENT_Agent agent,
Pointer state)
Set the user-specified state associated with the agent.
|
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_State(TRITONREPOAGENT_Agent agent,
Pointer state) |
static TRITONSERVER_Error |
tritonserver.TRITONREPOAGENT_State(TRITONREPOAGENT_Agent agent,
PointerPointer state)
Get the user-specified state associated with the agent.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ApiVersion(int[] major,
int[] minor) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ApiVersion(IntBuffer major,
IntBuffer minor) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ApiVersion(IntPointer major,
IntPointer minor)
Get the TRITONSERVER API version supported by the Triton shared
library.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_BufferAttributesByteSize(TRITONSERVER_BufferAttributes buffer_attributes,
SizeTPointer byte_size)
Get the byte size field of the buffer attributes.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_BufferAttributesCudaIpcHandle(TRITONSERVER_BufferAttributes buffer_attributes,
Pointer cuda_ipc_handle) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_BufferAttributesCudaIpcHandle(TRITONSERVER_BufferAttributes buffer_attributes,
PointerPointer cuda_ipc_handle)
Get the CudaIpcHandle field of the buffer attributes object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_BufferAttributesDelete(TRITONSERVER_BufferAttributes buffer_attributes)
Delete a buffer attributes object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_BufferAttributesMemoryType(TRITONSERVER_BufferAttributes buffer_attributes,
int[] memory_type) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_BufferAttributesMemoryType(TRITONSERVER_BufferAttributes buffer_attributes,
IntBuffer memory_type) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_BufferAttributesMemoryType(TRITONSERVER_BufferAttributes buffer_attributes,
IntPointer memory_type)
Get the memory type field of the buffer attributes.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_BufferAttributesMemoryTypeId(TRITONSERVER_BufferAttributes buffer_attributes,
long[] memory_type_id) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_BufferAttributesMemoryTypeId(TRITONSERVER_BufferAttributes buffer_attributes,
LongBuffer memory_type_id) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_BufferAttributesMemoryTypeId(TRITONSERVER_BufferAttributes buffer_attributes,
LongPointer memory_type_id)
Get the memory type id field of the buffer attributes.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_BufferAttributesNew(PointerPointer buffer_attributes)
TRITONSERVER_BufferAttributes
API to create, modify, or retrieve attributes associated with a buffer.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_BufferAttributesNew(TRITONSERVER_BufferAttributes buffer_attributes) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_BufferAttributesSetByteSize(TRITONSERVER_BufferAttributes buffer_attributes,
long byte_size)
Set the byte size field of the buffer attributes.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_BufferAttributesSetCudaIpcHandle(TRITONSERVER_BufferAttributes buffer_attributes,
Pointer cuda_ipc_handle)
Set the CudaIpcHandle field of the buffer attributes.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_BufferAttributesSetMemoryType(TRITONSERVER_BufferAttributes buffer_attributes,
int memory_type)
Set the memory type field of the buffer attributes.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_BufferAttributesSetMemoryTypeId(TRITONSERVER_BufferAttributes buffer_attributes,
long memory_type_id)
Set the memory type id field of the buffer attributes.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ErrorNew(int code,
BytePointer msg) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ErrorNew(int code,
String msg)
Create a new error object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_GetMetricKind(TRITONSERVER_Metric metric,
int[] kind) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_GetMetricKind(TRITONSERVER_Metric metric,
IntBuffer kind) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_GetMetricKind(TRITONSERVER_Metric metric,
IntPointer kind)
Get the TRITONSERVER_MetricKind of metric and its corresponding family.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestAddInput(TRITONSERVER_InferenceRequest inference_request,
BytePointer name,
int datatype,
long[] shape,
long dim_count) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestAddInput(TRITONSERVER_InferenceRequest inference_request,
BytePointer name,
int datatype,
LongBuffer shape,
long dim_count) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestAddInput(TRITONSERVER_InferenceRequest inference_request,
BytePointer name,
int datatype,
LongPointer shape,
long dim_count) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestAddInput(TRITONSERVER_InferenceRequest inference_request,
String name,
int datatype,
long[] shape,
long dim_count) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestAddInput(TRITONSERVER_InferenceRequest inference_request,
String name,
int datatype,
LongBuffer shape,
long dim_count) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestAddInput(TRITONSERVER_InferenceRequest inference_request,
String name,
int datatype,
LongPointer shape,
long dim_count)
Add an input to a request.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestAddRawInput(TRITONSERVER_InferenceRequest inference_request,
BytePointer name) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestAddRawInput(TRITONSERVER_InferenceRequest inference_request,
String name)
Add a raw input to a request.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestAddRequestedOutput(TRITONSERVER_InferenceRequest inference_request,
BytePointer name) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestAddRequestedOutput(TRITONSERVER_InferenceRequest inference_request,
String name)
Add an output request to an inference request.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestAppendInputData(TRITONSERVER_InferenceRequest inference_request,
BytePointer name,
Pointer base,
long byte_size,
int memory_type,
long memory_type_id) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestAppendInputData(TRITONSERVER_InferenceRequest inference_request,
String name,
Pointer base,
long byte_size,
int memory_type,
long memory_type_id)
Assign a buffer of data to an input.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestAppendInputDataWithBufferAttributes(TRITONSERVER_InferenceRequest inference_request,
BytePointer name,
Pointer base,
TRITONSERVER_BufferAttributes buffer_attributes) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestAppendInputDataWithBufferAttributes(TRITONSERVER_InferenceRequest inference_request,
String name,
Pointer base,
TRITONSERVER_BufferAttributes buffer_attributes)
Assign a buffer of data to an input.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestAppendInputDataWithHostPolicy(TRITONSERVER_InferenceRequest inference_request,
BytePointer name,
Pointer base,
long byte_size,
int memory_type,
long memory_type_id,
BytePointer host_policy_name) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestAppendInputDataWithHostPolicy(TRITONSERVER_InferenceRequest inference_request,
String name,
Pointer base,
long byte_size,
int memory_type,
long memory_type_id,
String host_policy_name)
Assign a buffer of data to an input for execution on all model instances
with the specified host policy.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestCancel(TRITONSERVER_InferenceRequest inference_request)
Cancel an inference request.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestCorrelationId(TRITONSERVER_InferenceRequest inference_request,
long[] correlation_id) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestCorrelationId(TRITONSERVER_InferenceRequest inference_request,
LongBuffer correlation_id) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestCorrelationId(TRITONSERVER_InferenceRequest inference_request,
LongPointer correlation_id)
Get the correlation ID of the inference request as an unsigned integer.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestCorrelationIdString(TRITONSERVER_InferenceRequest inference_request,
byte[] correlation_id) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestCorrelationIdString(TRITONSERVER_InferenceRequest inference_request,
ByteBuffer correlation_id) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestCorrelationIdString(TRITONSERVER_InferenceRequest inference_request,
BytePointer correlation_id) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestCorrelationIdString(TRITONSERVER_InferenceRequest inference_request,
PointerPointer correlation_id)
Get the correlation ID of the inference request as a string.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestDelete(TRITONSERVER_InferenceRequest inference_request)
Delete an inference request object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestFlags(TRITONSERVER_InferenceRequest inference_request,
int[] flags) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestFlags(TRITONSERVER_InferenceRequest inference_request,
IntBuffer flags) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestFlags(TRITONSERVER_InferenceRequest inference_request,
IntPointer flags)
Get the flag(s) associated with a request.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestId(TRITONSERVER_InferenceRequest inference_request,
byte[] id) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestId(TRITONSERVER_InferenceRequest inference_request,
ByteBuffer id) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestId(TRITONSERVER_InferenceRequest inference_request,
BytePointer id) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestId(TRITONSERVER_InferenceRequest inference_request,
PointerPointer id)
Get the ID for a request.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestIsCancelled(TRITONSERVER_InferenceRequest inference_request,
boolean[] is_cancelled)
Query whether the request is cancelled or not.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestIsCancelled(TRITONSERVER_InferenceRequest inference_request,
BoolPointer is_cancelled) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestNew(PointerPointer inference_request,
TRITONSERVER_Server server,
String model_name,
long model_version)
Create a new inference request object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestNew(TRITONSERVER_InferenceRequest inference_request,
TRITONSERVER_Server server,
BytePointer model_name,
long model_version) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestNew(TRITONSERVER_InferenceRequest inference_request,
TRITONSERVER_Server server,
String model_name,
long model_version) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestPriority(TRITONSERVER_InferenceRequest inference_request,
int[] priority) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestPriority(TRITONSERVER_InferenceRequest inference_request,
IntBuffer priority) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestPriority(TRITONSERVER_InferenceRequest inference_request,
IntPointer priority)
Deprecated.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestPriorityUInt64(TRITONSERVER_InferenceRequest inference_request,
long[] priority) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestPriorityUInt64(TRITONSERVER_InferenceRequest inference_request,
LongBuffer priority) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestPriorityUInt64(TRITONSERVER_InferenceRequest inference_request,
LongPointer priority)
Get the priority for a request.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestRemoveAllInputData(TRITONSERVER_InferenceRequest inference_request,
BytePointer name) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestRemoveAllInputData(TRITONSERVER_InferenceRequest inference_request,
String name)
Clear all input data from an input, releasing ownership of the
buffer(s) that were appended to the input with
TRITONSERVER_InferenceRequestAppendInputData or
TRITONSERVER_InferenceRequestAppendInputDataWithHostPolicy.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestRemoveAllInputs(TRITONSERVER_InferenceRequest inference_request)
Remove all inputs from a request.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestRemoveAllRequestedOutputs(TRITONSERVER_InferenceRequest inference_request)
Remove all output requests from an inference request.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestRemoveInput(TRITONSERVER_InferenceRequest inference_request,
BytePointer name) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestRemoveInput(TRITONSERVER_InferenceRequest inference_request,
String name)
Remove an input from a request.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestRemoveRequestedOutput(TRITONSERVER_InferenceRequest inference_request,
BytePointer name) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestRemoveRequestedOutput(TRITONSERVER_InferenceRequest inference_request,
String name)
Remove an output request from an inference request.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestSetBoolParameter(TRITONSERVER_InferenceRequest request,
BytePointer key,
boolean value) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestSetBoolParameter(TRITONSERVER_InferenceRequest request,
String key,
boolean value)
Set a boolean parameter in the request.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestSetCorrelationId(TRITONSERVER_InferenceRequest inference_request,
long correlation_id)
Set the correlation ID of the inference request to be an unsigned integer.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestSetCorrelationIdString(TRITONSERVER_InferenceRequest inference_request,
BytePointer correlation_id) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestSetCorrelationIdString(TRITONSERVER_InferenceRequest inference_request,
String correlation_id)
Set the correlation ID of the inference request to be a string.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestSetFlags(TRITONSERVER_InferenceRequest inference_request,
int flags)
Set the flag(s) associated with a request.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestSetId(TRITONSERVER_InferenceRequest inference_request,
BytePointer id) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestSetId(TRITONSERVER_InferenceRequest inference_request,
String id)
Set the ID for a request.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestSetIntParameter(TRITONSERVER_InferenceRequest request,
BytePointer key,
long value) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestSetIntParameter(TRITONSERVER_InferenceRequest request,
String key,
long value)
Set an integer parameter in the request.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestSetPriority(TRITONSERVER_InferenceRequest inference_request,
int priority)
Deprecated.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestSetPriorityUInt64(TRITONSERVER_InferenceRequest inference_request,
long priority)
Set the priority for a request.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestSetReleaseCallback(TRITONSERVER_InferenceRequest inference_request,
TRITONSERVER_InferenceRequestReleaseFn_t request_release_fn,
Pointer request_release_userp)
Set the release callback for an inference request.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestSetResponseCallback(TRITONSERVER_InferenceRequest inference_request,
TRITONSERVER_ResponseAllocator response_allocator,
Pointer response_allocator_userp,
TRITONSERVER_InferenceResponseCompleteFn_t response_fn,
Pointer response_userp)
Set the allocator and response callback for an inference
request.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestSetStringParameter(TRITONSERVER_InferenceRequest request,
BytePointer key,
BytePointer value) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestSetStringParameter(TRITONSERVER_InferenceRequest request,
String key,
String value)
Set a string parameter in the request.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestSetTimeoutMicroseconds(TRITONSERVER_InferenceRequest inference_request,
long timeout_us)
Set the timeout for a request, in microseconds.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestTimeoutMicroseconds(TRITONSERVER_InferenceRequest inference_request,
long[] timeout_us) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestTimeoutMicroseconds(TRITONSERVER_InferenceRequest inference_request,
LongBuffer timeout_us) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceRequestTimeoutMicroseconds(TRITONSERVER_InferenceRequest inference_request,
LongPointer timeout_us)
Get the timeout for a request, in microseconds.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseDelete(TRITONSERVER_InferenceResponse inference_response)
Delete an inference response object.
(TRITONSERVER_InferenceResponse: object representing an inference response.)
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseError(TRITONSERVER_InferenceResponse inference_response)
Return the error status of an inference response.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseId(TRITONSERVER_InferenceResponse inference_response,
byte[] request_id) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseId(TRITONSERVER_InferenceResponse inference_response,
ByteBuffer request_id) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseId(TRITONSERVER_InferenceResponse inference_response,
BytePointer request_id) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseId(TRITONSERVER_InferenceResponse inference_response,
PointerPointer request_id)
Get the ID of the request corresponding to a response.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseModel(TRITONSERVER_InferenceResponse inference_response,
byte[] model_name,
long[] model_version) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseModel(TRITONSERVER_InferenceResponse inference_response,
ByteBuffer model_name,
LongBuffer model_version) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseModel(TRITONSERVER_InferenceResponse inference_response,
BytePointer model_name,
LongPointer model_version) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseModel(TRITONSERVER_InferenceResponse inference_response,
PointerPointer model_name,
LongPointer model_version)
Get model used to produce a response.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseOutput(TRITONSERVER_InferenceResponse inference_response,
int index,
byte[] name,
int[] datatype,
long[] shape,
long[] dim_count,
Pointer base,
SizeTPointer byte_size,
int[] memory_type,
long[] memory_type_id,
Pointer userp) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseOutput(TRITONSERVER_InferenceResponse inference_response,
int index,
ByteBuffer name,
IntBuffer datatype,
LongBuffer shape,
LongBuffer dim_count,
Pointer base,
SizeTPointer byte_size,
IntBuffer memory_type,
LongBuffer memory_type_id,
Pointer userp) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseOutput(TRITONSERVER_InferenceResponse inference_response,
int index,
BytePointer name,
IntPointer datatype,
LongPointer shape,
LongPointer dim_count,
Pointer base,
SizeTPointer byte_size,
IntPointer memory_type,
LongPointer memory_type_id,
Pointer userp) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseOutput(TRITONSERVER_InferenceResponse inference_response,
int index,
PointerPointer name,
IntPointer datatype,
PointerPointer shape,
LongPointer dim_count,
PointerPointer base,
SizeTPointer byte_size,
IntPointer memory_type,
LongPointer memory_type_id,
PointerPointer userp)
Get all information about an output tensor.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseOutputClassificationLabel(TRITONSERVER_InferenceResponse inference_response,
int index,
long class_index,
byte[] label) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseOutputClassificationLabel(TRITONSERVER_InferenceResponse inference_response,
int index,
long class_index,
ByteBuffer label) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseOutputClassificationLabel(TRITONSERVER_InferenceResponse inference_response,
int index,
long class_index,
BytePointer label) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseOutputClassificationLabel(TRITONSERVER_InferenceResponse inference_response,
int index,
long class_index,
PointerPointer label)
Get a classification label associated with an output for a given
index.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseOutputCount(TRITONSERVER_InferenceResponse inference_response,
int[] count) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseOutputCount(TRITONSERVER_InferenceResponse inference_response,
IntBuffer count) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseOutputCount(TRITONSERVER_InferenceResponse inference_response,
IntPointer count)
Get the number of outputs available in the response.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseParameter(TRITONSERVER_InferenceResponse inference_response,
int index,
byte[] name,
int[] type,
Pointer vvalue) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseParameter(TRITONSERVER_InferenceResponse inference_response,
int index,
ByteBuffer name,
IntBuffer type,
Pointer vvalue) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseParameter(TRITONSERVER_InferenceResponse inference_response,
int index,
BytePointer name,
IntPointer type,
Pointer vvalue) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseParameter(TRITONSERVER_InferenceResponse inference_response,
int index,
PointerPointer name,
IntPointer type,
PointerPointer vvalue)
Get all information about a parameter.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseParameterCount(TRITONSERVER_InferenceResponse inference_response,
int[] count) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseParameterCount(TRITONSERVER_InferenceResponse inference_response,
IntBuffer count) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceResponseParameterCount(TRITONSERVER_InferenceResponse inference_response,
IntPointer count)
Get the number of parameters available in the response.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceTraceDelete(TRITONSERVER_InferenceTrace trace)
Delete a trace object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceTraceId(TRITONSERVER_InferenceTrace trace,
long[] id) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceTraceId(TRITONSERVER_InferenceTrace trace,
LongBuffer id) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceTraceId(TRITONSERVER_InferenceTrace trace,
LongPointer id)
Get the id associated with a trace.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceTraceModelName(TRITONSERVER_InferenceTrace trace,
byte[] model_name) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceTraceModelName(TRITONSERVER_InferenceTrace trace,
ByteBuffer model_name) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceTraceModelName(TRITONSERVER_InferenceTrace trace,
BytePointer model_name) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceTraceModelName(TRITONSERVER_InferenceTrace trace,
PointerPointer model_name)
Get the name of the model associated with a trace.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceTraceModelVersion(TRITONSERVER_InferenceTrace trace,
long[] model_version) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceTraceModelVersion(TRITONSERVER_InferenceTrace trace,
LongBuffer model_version) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceTraceModelVersion(TRITONSERVER_InferenceTrace trace,
LongPointer model_version)
Get the version of the model associated with a trace.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceTraceNew(PointerPointer trace,
int level,
long parent_id,
TRITONSERVER_InferenceTraceActivityFn_t activity_fn,
TRITONSERVER_InferenceTraceReleaseFn_t release_fn,
Pointer trace_userp)
Create a new inference trace object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceTraceNew(TRITONSERVER_InferenceTrace trace,
int level,
long parent_id,
TRITONSERVER_InferenceTraceActivityFn_t activity_fn,
TRITONSERVER_InferenceTraceReleaseFn_t release_fn,
Pointer trace_userp) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceTraceParentId(TRITONSERVER_InferenceTrace trace,
long[] parent_id) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceTraceParentId(TRITONSERVER_InferenceTrace trace,
LongBuffer parent_id) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceTraceParentId(TRITONSERVER_InferenceTrace trace,
LongPointer parent_id)
Get the parent id associated with a trace.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceTraceRequestId(TRITONSERVER_InferenceTrace trace,
byte[] request_id) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceTraceRequestId(TRITONSERVER_InferenceTrace trace,
ByteBuffer request_id) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceTraceRequestId(TRITONSERVER_InferenceTrace trace,
BytePointer request_id) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceTraceRequestId(TRITONSERVER_InferenceTrace trace,
PointerPointer request_id)
Get the request id associated with a trace.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceTraceSpawnChildTrace(TRITONSERVER_InferenceTrace trace,
PointerPointer child_trace)
Get the child trace, spawned from the parent trace.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceTraceSpawnChildTrace(TRITONSERVER_InferenceTrace trace,
TRITONSERVER_InferenceTrace child_trace) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceTraceTensorNew(PointerPointer trace,
int level,
long parent_id,
TRITONSERVER_InferenceTraceActivityFn_t activity_fn,
TRITONSERVER_InferenceTraceTensorActivityFn_t tensor_activity_fn,
TRITONSERVER_InferenceTraceReleaseFn_t release_fn,
Pointer trace_userp)
Create a new inference trace object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_InferenceTraceTensorNew(TRITONSERVER_InferenceTrace trace,
int level,
long parent_id,
TRITONSERVER_InferenceTraceActivityFn_t activity_fn,
TRITONSERVER_InferenceTraceTensorActivityFn_t tensor_activity_fn,
TRITONSERVER_InferenceTraceReleaseFn_t release_fn,
Pointer trace_userp) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_LogMessage(int level,
BytePointer filename,
int line,
BytePointer msg) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_LogMessage(int level,
String filename,
int line,
String msg)
Log a message at a given log level if that level is enabled.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_MessageDelete(TRITONSERVER_Message message)
Delete a message object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_MessageNewFromSerializedJson(PointerPointer message,
String base,
long byte_size)
Create a new message object from a serialized JSON string.
(TRITONSERVER_Message: object representing a Triton Server message.)
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_MessageNewFromSerializedJson(TRITONSERVER_Message message,
BytePointer base,
long byte_size) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_MessageNewFromSerializedJson(TRITONSERVER_Message message,
String base,
long byte_size) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_MessageSerializeToJson(TRITONSERVER_Message message,
byte[] base,
SizeTPointer byte_size) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_MessageSerializeToJson(TRITONSERVER_Message message,
ByteBuffer base,
SizeTPointer byte_size) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_MessageSerializeToJson(TRITONSERVER_Message message,
BytePointer base,
SizeTPointer byte_size) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_MessageSerializeToJson(TRITONSERVER_Message message,
PointerPointer base,
SizeTPointer byte_size)
Get the base and size of the buffer containing the serialized
message in JSON format.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_MetricDelete(TRITONSERVER_Metric metric)
Delete a metric object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_MetricFamilyDelete(TRITONSERVER_MetricFamily family)
Delete a metric family object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_MetricFamilyNew(PointerPointer family,
int kind,
String name,
String description)
Create a new metric family object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_MetricFamilyNew(TRITONSERVER_MetricFamily family,
int kind,
BytePointer name,
BytePointer description) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_MetricFamilyNew(TRITONSERVER_MetricFamily family,
int kind,
String name,
String description) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_MetricIncrement(TRITONSERVER_Metric metric,
double value)
Increment the current value of metric by value.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_MetricNew(PointerPointer metric,
TRITONSERVER_MetricFamily family,
PointerPointer labels,
long label_count)
Create a new metric object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_MetricNew(TRITONSERVER_Metric metric,
TRITONSERVER_MetricFamily family,
TRITONSERVER_Parameter labels,
long label_count) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_MetricsDelete(TRITONSERVER_Metrics metrics)
Delete a metrics object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_MetricSet(TRITONSERVER_Metric metric,
double value)
Set the current value of metric to value.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_MetricsFormatted(TRITONSERVER_Metrics metrics,
int format,
byte[] base,
SizeTPointer byte_size) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_MetricsFormatted(TRITONSERVER_Metrics metrics,
int format,
ByteBuffer base,
SizeTPointer byte_size) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_MetricsFormatted(TRITONSERVER_Metrics metrics,
int format,
BytePointer base,
SizeTPointer byte_size) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_MetricsFormatted(TRITONSERVER_Metrics metrics,
int format,
PointerPointer base,
SizeTPointer byte_size)
Get a buffer containing the metrics in the specified format.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_MetricValue(TRITONSERVER_Metric metric,
double[] value) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_MetricValue(TRITONSERVER_Metric metric,
DoubleBuffer value) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_MetricValue(TRITONSERVER_Metric metric,
DoublePointer value)
Get the current value of a metric object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ResponseAllocatorDelete(TRITONSERVER_ResponseAllocator allocator)
Delete a response allocator.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ResponseAllocatorNew(PointerPointer allocator,
TRITONSERVER_ResponseAllocatorAllocFn_t alloc_fn,
TRITONSERVER_ResponseAllocatorReleaseFn_t release_fn,
TRITONSERVER_ResponseAllocatorStartFn_t start_fn)
Create a new response allocator object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ResponseAllocatorNew(TRITONSERVER_ResponseAllocator allocator,
TRITONSERVER_ResponseAllocatorAllocFn_t alloc_fn,
TRITONSERVER_ResponseAllocatorReleaseFn_t release_fn,
TRITONSERVER_ResponseAllocatorStartFn_t start_fn) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ResponseAllocatorSetBufferAttributesFunction(TRITONSERVER_ResponseAllocator allocator,
TRITONSERVER_ResponseAllocatorBufferAttributesFn_t buffer_attributes_fn)
Set the buffer attributes function for a response allocator object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ResponseAllocatorSetQueryFunction(TRITONSERVER_ResponseAllocator allocator,
TRITONSERVER_ResponseAllocatorQueryFn_t query_fn)
Set the query function for a response allocator object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerDelete(TRITONSERVER_Server server)
Delete a server object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerInferAsync(TRITONSERVER_Server server,
TRITONSERVER_InferenceRequest inference_request,
TRITONSERVER_InferenceTrace trace)
Perform inference using the meta-data and inputs supplied by the
'inference_request'.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerIsLive(TRITONSERVER_Server server,
boolean[] live)
Is the server live?
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerIsLive(TRITONSERVER_Server server,
BoolPointer live) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerIsReady(TRITONSERVER_Server server,
boolean[] ready)
Is the server ready?
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerIsReady(TRITONSERVER_Server server,
BoolPointer ready) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerLoadModel(TRITONSERVER_Server server,
BytePointer model_name) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerLoadModel(TRITONSERVER_Server server,
String model_name)
Load the requested model or reload the model if it is already
loaded.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerLoadModelWithParameters(TRITONSERVER_Server server,
BytePointer model_name,
TRITONSERVER_Parameter parameters,
long parameter_count) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerLoadModelWithParameters(TRITONSERVER_Server server,
String model_name,
PointerPointer parameters,
long parameter_count)
Load the requested model or reload the model if it is already
loaded, with load parameters provided.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerLoadModelWithParameters(TRITONSERVER_Server server,
String model_name,
TRITONSERVER_Parameter parameters,
long parameter_count) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerMetadata(TRITONSERVER_Server server,
PointerPointer server_metadata)
Get the metadata of the server as a TRITONSERVER_Message object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerMetadata(TRITONSERVER_Server server,
TRITONSERVER_Message server_metadata) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerMetrics(TRITONSERVER_Server server,
PointerPointer metrics)
Get the current metrics for the server.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerMetrics(TRITONSERVER_Server server,
TRITONSERVER_Metrics metrics) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerModelBatchProperties(TRITONSERVER_Server server,
BytePointer model_name,
long model_version,
int[] flags,
Pointer voidp) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerModelBatchProperties(TRITONSERVER_Server server,
BytePointer model_name,
long model_version,
IntBuffer flags,
Pointer voidp) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerModelBatchProperties(TRITONSERVER_Server server,
BytePointer model_name,
long model_version,
IntPointer flags,
Pointer voidp) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerModelBatchProperties(TRITONSERVER_Server server,
String model_name,
long model_version,
int[] flags,
Pointer voidp) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerModelBatchProperties(TRITONSERVER_Server server,
String model_name,
long model_version,
IntBuffer flags,
Pointer voidp) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerModelBatchProperties(TRITONSERVER_Server server,
String model_name,
long model_version,
IntPointer flags,
Pointer voidp) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerModelBatchProperties(TRITONSERVER_Server server,
String model_name,
long model_version,
IntPointer flags,
PointerPointer voidp)
Get the batch properties of the model.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerModelConfig(TRITONSERVER_Server server,
BytePointer model_name,
long model_version,
int config_version,
TRITONSERVER_Message model_config) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerModelConfig(TRITONSERVER_Server server,
String model_name,
long model_version,
int config_version,
PointerPointer model_config)
Get the configuration of a model as a TRITONSERVER_Message object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerModelConfig(TRITONSERVER_Server server,
String model_name,
long model_version,
int config_version,
TRITONSERVER_Message model_config) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerModelIndex(TRITONSERVER_Server server,
int flags,
PointerPointer model_index)
Get the index of all unique models in the model repositories as a
TRITONSERVER_Message object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerModelIndex(TRITONSERVER_Server server,
int flags,
TRITONSERVER_Message model_index) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerModelIsReady(TRITONSERVER_Server server,
BytePointer model_name,
long model_version,
BoolPointer ready) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerModelIsReady(TRITONSERVER_Server server,
String model_name,
long model_version,
boolean[] ready)
Is the model ready?
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerModelMetadata(TRITONSERVER_Server server,
BytePointer model_name,
long model_version,
TRITONSERVER_Message model_metadata) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerModelMetadata(TRITONSERVER_Server server,
String model_name,
long model_version,
PointerPointer model_metadata)
Get the metadata of a model as a TRITONSERVER_Message
object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerModelMetadata(TRITONSERVER_Server server,
String model_name,
long model_version,
TRITONSERVER_Message model_metadata) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerModelStatistics(TRITONSERVER_Server server,
BytePointer model_name,
long model_version,
TRITONSERVER_Message model_stats) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerModelStatistics(TRITONSERVER_Server server,
String model_name,
long model_version,
PointerPointer model_stats)
Get the statistics of a model as a TRITONSERVER_Message
object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerModelStatistics(TRITONSERVER_Server server,
String model_name,
long model_version,
TRITONSERVER_Message model_stats) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerModelTransactionProperties(TRITONSERVER_Server server,
BytePointer model_name,
long model_version,
int[] txn_flags,
Pointer voidp) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerModelTransactionProperties(TRITONSERVER_Server server,
BytePointer model_name,
long model_version,
IntBuffer txn_flags,
Pointer voidp) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerModelTransactionProperties(TRITONSERVER_Server server,
BytePointer model_name,
long model_version,
IntPointer txn_flags,
Pointer voidp) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerModelTransactionProperties(TRITONSERVER_Server server,
String model_name,
long model_version,
int[] txn_flags,
Pointer voidp) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerModelTransactionProperties(TRITONSERVER_Server server,
String model_name,
long model_version,
IntBuffer txn_flags,
Pointer voidp) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerModelTransactionProperties(TRITONSERVER_Server server,
String model_name,
long model_version,
IntPointer txn_flags,
Pointer voidp) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerModelTransactionProperties(TRITONSERVER_Server server,
String model_name,
long model_version,
IntPointer txn_flags,
PointerPointer voidp)
Get the transaction policy of the model.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerNew(PointerPointer server,
TRITONSERVER_ServerOptions options)
Create a new server object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerNew(TRITONSERVER_Server server,
TRITONSERVER_ServerOptions options) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsAddRateLimiterResource(TRITONSERVER_ServerOptions options,
BytePointer resource_name,
long resource_count,
int device) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsAddRateLimiterResource(TRITONSERVER_ServerOptions options,
String resource_name,
long resource_count,
int device)
Add resource count for rate limiting.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsDelete(TRITONSERVER_ServerOptions options)
Delete a server options object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsNew(PointerPointer options)
Create a new server options object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsNew(TRITONSERVER_ServerOptions options) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetBackendConfig(TRITONSERVER_ServerOptions options,
BytePointer backend_name,
BytePointer setting,
BytePointer value) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetBackendConfig(TRITONSERVER_ServerOptions options,
String backend_name,
String setting,
String value)
Set a configuration setting for a named backend in a server
options.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetBackendDirectory(TRITONSERVER_ServerOptions options,
BytePointer backend_dir) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetBackendDirectory(TRITONSERVER_ServerOptions options,
String backend_dir)
Set the directory containing backend shared libraries.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetBufferManagerThreadCount(TRITONSERVER_ServerOptions options,
int thread_count)
Set the number of threads used in the buffer manager in a server options.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetCacheConfig(TRITONSERVER_ServerOptions options,
BytePointer cache_name,
BytePointer config_json) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetCacheConfig(TRITONSERVER_ServerOptions options,
String cache_name,
String config_json)
Set the cache config that will be used to initialize the cache
implementation for "cache_name".
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetCacheDirectory(TRITONSERVER_ServerOptions options,
BytePointer cache_dir) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetCacheDirectory(TRITONSERVER_ServerOptions options,
String cache_dir)
Set the directory containing cache shared libraries.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetCpuMetrics(TRITONSERVER_ServerOptions options,
boolean cpu_metrics)
Enable or disable CPU metrics collection in a server options.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetCudaMemoryPoolByteSize(TRITONSERVER_ServerOptions options,
int gpu_device,
long size)
Set the total CUDA memory byte size that the server can allocate
on given GPU device in a server options.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetCudaVirtualAddressSize(TRITONSERVER_ServerOptions options,
int gpu_device,
long cuda_virtual_address_size)
Set the size of the virtual address space that will be used
for growable memory in implicit state.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetExitOnError(TRITONSERVER_ServerOptions options,
boolean exit)
Enable or disable exit-on-error in a server options.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetExitTimeout(TRITONSERVER_ServerOptions options,
int timeout)
Set the exit timeout, in seconds, for the server in a server
options.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetGpuMetrics(TRITONSERVER_ServerOptions options,
boolean gpu_metrics)
Enable or disable GPU metrics collection in a server options.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetHostPolicy(TRITONSERVER_ServerOptions options,
BytePointer policy_name,
BytePointer setting,
BytePointer value) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetHostPolicy(TRITONSERVER_ServerOptions options,
String policy_name,
String setting,
String value)
Set a host policy setting for a given policy name in a server options.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetLogError(TRITONSERVER_ServerOptions options,
boolean log)
Enable or disable error level logging.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetLogFile(TRITONSERVER_ServerOptions options,
BytePointer file) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetLogFile(TRITONSERVER_ServerOptions options,
String file)
Provide a log output file.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetLogFormat(TRITONSERVER_ServerOptions options,
int format)
Set the logging format.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetLogInfo(TRITONSERVER_ServerOptions options,
boolean log)
Enable or disable info level logging.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetLogVerbose(TRITONSERVER_ServerOptions options,
int level)
Set verbose logging level.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetLogWarn(TRITONSERVER_ServerOptions options,
boolean log)
Enable or disable warning level logging.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetMetrics(TRITONSERVER_ServerOptions options,
boolean metrics)
Enable or disable metrics collection in a server options.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetMetricsConfig(TRITONSERVER_ServerOptions options,
BytePointer name,
BytePointer setting,
BytePointer value) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetMetricsConfig(TRITONSERVER_ServerOptions options,
String name,
String setting,
String value)
Set a configuration setting for metrics in server options.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetMetricsInterval(TRITONSERVER_ServerOptions options,
long metrics_interval_ms)
Set the interval for metrics collection in a server options.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetMinSupportedComputeCapability(TRITONSERVER_ServerOptions options,
double cc)
Set the minimum supported CUDA compute capability in a server
options.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetModelControlMode(TRITONSERVER_ServerOptions options,
int mode)
Set the model control mode in a server options.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetModelLoadDeviceLimit(TRITONSERVER_ServerOptions options,
int kind,
int device_id,
double fraction)
Specify the limit on memory usage as a fraction on the device identified by
'kind' and 'device_id'.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetModelLoadThreadCount(TRITONSERVER_ServerOptions options,
int thread_count)
Set the number of threads to concurrently load models in a server options.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetModelNamespacing(TRITONSERVER_ServerOptions options,
boolean enable_namespace)
Enable model namespacing to allow serving models with the same name if
they are in different namespaces.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetModelRepositoryPath(TRITONSERVER_ServerOptions options,
BytePointer model_repository_path) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetModelRepositoryPath(TRITONSERVER_ServerOptions options,
String model_repository_path)
Set the model repository path in a server options.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetPinnedMemoryPoolByteSize(TRITONSERVER_ServerOptions options,
long size)
Set the total pinned memory byte size that the server can allocate
in a server options.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetRateLimiterMode(TRITONSERVER_ServerOptions options,
int mode)
Set the rate limit mode in a server options.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetRepoAgentDirectory(TRITONSERVER_ServerOptions options,
BytePointer repoagent_dir) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetRepoAgentDirectory(TRITONSERVER_ServerOptions options,
String repoagent_dir)
Set the directory containing repository agent shared libraries.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetResponseCacheByteSize(TRITONSERVER_ServerOptions options,
long size)
Deprecated.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetServerId(TRITONSERVER_ServerOptions options,
BytePointer server_id) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetServerId(TRITONSERVER_ServerOptions options,
String server_id)
Set the textual ID for the server in a server options.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetStartupModel(TRITONSERVER_ServerOptions options,
BytePointer model_name) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetStartupModel(TRITONSERVER_ServerOptions options,
String model_name)
Set the model to be loaded at startup in a server options.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetStrictModelConfig(TRITONSERVER_ServerOptions options,
boolean strict)
Enable or disable strict model configuration handling in a server
options.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerOptionsSetStrictReadiness(TRITONSERVER_ServerOptions options,
boolean strict)
Enable or disable strict readiness handling in a server options.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerPollModelRepository(TRITONSERVER_Server server)
Check the model repository for changes and update server state
based on those changes.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerRegisterModelRepository(TRITONSERVER_Server server,
BytePointer repository_path,
TRITONSERVER_Parameter name_mapping,
int mapping_count) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerRegisterModelRepository(TRITONSERVER_Server server,
String repository_path,
PointerPointer name_mapping,
int mapping_count)
Register a new model repository.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerRegisterModelRepository(TRITONSERVER_Server server,
String repository_path,
TRITONSERVER_Parameter name_mapping,
int mapping_count) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerStop(TRITONSERVER_Server server)
Stop a server object.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerUnloadModel(TRITONSERVER_Server server,
BytePointer model_name) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerUnloadModel(TRITONSERVER_Server server,
String model_name)
Unload the requested model.
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerUnloadModelAndDependents(TRITONSERVER_Server server,
BytePointer model_name) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerUnloadModelAndDependents(TRITONSERVER_Server server,
String model_name)
Unload the requested model, and also unload any dependent model that
was loaded along with the requested model (for example, the models composing
an ensemble).
|
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerUnregisterModelRepository(TRITONSERVER_Server server,
BytePointer repository_path) |
static TRITONSERVER_Error |
tritonserver.TRITONSERVER_ServerUnregisterModelRepository(TRITONSERVER_Server server,
String repository_path)
Unregister a model repository.
|