tritonclient 2.34.0__py3-none-any.whl → 2.36.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (43) hide show
  1. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/_client.py +20 -0
  2. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/_utils.py +1 -1
  3. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/aio/__init__.py +4 -1
  4. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/model_config_pb2.py +1 -1
  5. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/service_pb2.py +131 -121
  6. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/utils/__init__.py +1 -0
  7. tritonclient-2.36.0.data/purelib/tritonclient/utils/_dlpack.py +266 -0
  8. tritonclient-2.36.0.data/purelib/tritonclient/utils/_shared_memory_tensor.py +79 -0
  9. {tritonclient-2.34.0.dist-info → tritonclient-2.36.0.dist-info}/METADATA +1 -1
  10. tritonclient-2.36.0.dist-info/RECORD +42 -0
  11. tritonclient-2.34.0.dist-info/RECORD +0 -40
  12. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/data/LICENSE.txt +0 -0
  13. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/__init__.py +0 -0
  14. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/_auth.py +0 -0
  15. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/_client.py +0 -0
  16. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/_plugin.py +0 -0
  17. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/_request.py +0 -0
  18. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/__init__.py +0 -0
  19. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/_infer_input.py +0 -0
  20. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/_infer_result.py +0 -0
  21. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/_infer_stream.py +0 -0
  22. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/_requested_output.py +0 -0
  23. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/aio/auth/__init__.py +0 -0
  24. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/auth/__init__.py +0 -0
  25. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/service_pb2_grpc.py +0 -0
  26. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/http/__init__.py +0 -0
  27. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/http/_client.py +0 -0
  28. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/http/_infer_input.py +0 -0
  29. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/http/_infer_result.py +0 -0
  30. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/http/_requested_output.py +0 -0
  31. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/http/_utils.py +0 -0
  32. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/http/aio/__init__.py +0 -0
  33. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/http/aio/auth/__init__.py +0 -0
  34. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/http/auth/__init__.py +0 -0
  35. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclientutils/__init__.py +0 -0
  36. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritongrpcclient/__init__.py +0 -0
  37. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritongrpcclient/grpc_service_pb2.py +0 -0
  38. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritongrpcclient/grpc_service_pb2_grpc.py +0 -0
  39. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritongrpcclient/model_config_pb2.py +0 -0
  40. {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonhttpclient/__init__.py +0 -0
  41. {tritonclient-2.34.0.dist-info → tritonclient-2.36.0.dist-info}/LICENSE.txt +0 -0
  42. {tritonclient-2.34.0.dist-info → tritonclient-2.36.0.dist-info}/WHEEL +0 -0
  43. {tritonclient-2.34.0.dist-info → tritonclient-2.36.0.dist-info}/top_level.txt +0 -0
@@ -1532,6 +1532,7 @@ class InferenceServerClient(InferenceServerClientBase):
1532
1532
  sequence_id=0,
1533
1533
  sequence_start=False,
1534
1534
  sequence_end=False,
1535
+ enable_empty_final_response=False,
1535
1536
  priority=0,
1536
1537
  timeout=None,
1537
1538
  parameters=None):
@@ -1571,6 +1572,18 @@ class InferenceServerClient(InferenceServerClientBase):
1571
1572
  Indicates whether the request being added marks the end of the
1572
1573
  sequence. Default value is False. This argument is ignored if
1573
1574
  'sequence_id' is 0 or "".
1575
+ enable_empty_final_response: bool
1576
+ Indicates whether "empty" responses should be generated and sent
1577
+ back to the client from the server during streaming inference when
1578
+ they contain the TRITONSERVER_RESPONSE_COMPLETE_FINAL flag.
1579
+ This strictly relates to the case of models/backends that send
1580
+ flags-only responses (use TRITONBACKEND_ResponseFactorySendFlags(TRITONSERVER_RESPONSE_COMPLETE_FINAL)
1581
+ or InferenceResponseSender.send(flags=TRITONSERVER_RESPONSE_COMPLETE_FINAL))
1582
+ Currently, this only occurs for decoupled models, and can be
1583
+ used to communicate to the client when a request has received
1584
+ its final response from the model. If the backend sends the final
1585
+ flag along with a non-empty response, this arg is not needed.
1586
+ Default value is False.
1574
1587
  priority : int
1575
1588
  Indicates the priority of the request. Priority value zero
1576
1589
  indicates that the default priority level should be used
@@ -1616,6 +1629,13 @@ class InferenceServerClient(InferenceServerClientBase):
1616
1629
  priority=priority,
1617
1630
  timeout=timeout,
1618
1631
  parameters=parameters)
1632
+
1633
+ # Unique to streaming inference as it only pertains to decoupled models
1634
+ # Only attach the parameter if True, no need to send/parse when False.
1635
+ if enable_empty_final_response:
1636
+ request.parameters[
1637
+ 'triton_enable_empty_final_response'].bool_param = True
1638
+
1619
1639
  if self._verbose:
1620
1640
  print("async_stream_infer\n{}".format(request))
1621
1641
  # Enqueues the request to the stream
@@ -85,7 +85,7 @@ def _get_inference_request(model_name, inputs, model_version, request_id,
85
85
  request.parameters['sequence_start'].bool_param = sequence_start
86
86
  request.parameters['sequence_end'].bool_param = sequence_end
87
87
  if priority != 0:
88
- request.parameters['priority'].int64_param = priority
88
+ request.parameters['priority'].uint64_param = priority
89
89
  if timeout is not None:
90
90
  request.parameters['timeout'].int64_param = timeout
91
91
 
@@ -24,9 +24,12 @@
24
24
  # (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
25
25
  # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
26
26
 
27
+ import base64
28
+
29
+ import rapidjson as json
30
+ from google.protobuf.json_format import MessageToJson
27
31
  from tritonclient.grpc import *
28
32
  from .._utils import _get_inference_request, _grpc_compression_type
29
- import base64
30
33
  from ..._client import InferenceServerClientBase
31
34
  from ..._request import Request
32
35
  from ..._plugin import InferenceServerClientPlugin
@@ -15,7 +15,7 @@ _sym_db = _symbol_database.Default()
15
15
 
16
16
 
17
17
 
18
- DESCRIPTOR = _descriptor_pool.Default().AddSerializedFile(b'\n\x12model_config.proto\x12\tinference\"\x96\x01\n\x10ModelRateLimiter\x12\x37\n\tresources\x18\x01 \x03(\x0b\x32$.inference.ModelRateLimiter.Resource\x12\x10\n\x08priority\x18\x02 \x01(\r\x1a\x37\n\x08Resource\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0e\n\x06global\x18\x02 \x01(\x08\x12\r\n\x05\x63ount\x18\x03 \x01(\r\"\x87\x04\n\x12ModelInstanceGroup\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x30\n\x04kind\x18\x04 \x01(\x0e\x32\".inference.ModelInstanceGroup.Kind\x12\r\n\x05\x63ount\x18\x02 \x01(\x05\x12\x31\n\x0crate_limiter\x18\x06 \x01(\x0b\x32\x1b.inference.ModelRateLimiter\x12\x0c\n\x04gpus\x18\x03 \x03(\x05\x12H\n\x11secondary_devices\x18\x08 \x03(\x0b\x32-.inference.ModelInstanceGroup.SecondaryDevice\x12\x0f\n\x07profile\x18\x05 \x03(\t\x12\x0f\n\x07passive\x18\x07 \x01(\x08\x12\x13\n\x0bhost_policy\x18\t \x01(\t\x1a\x9c\x01\n\x0fSecondaryDevice\x12O\n\x04kind\x18\x01 \x01(\x0e\x32\x41.inference.ModelInstanceGroup.SecondaryDevice.SecondaryDeviceKind\x12\x11\n\tdevice_id\x18\x02 \x01(\x03\"%\n\x13SecondaryDeviceKind\x12\x0e\n\nKIND_NVDLA\x10\x00\"A\n\x04Kind\x12\r\n\tKIND_AUTO\x10\x00\x12\x0c\n\x08KIND_GPU\x10\x01\x12\x0c\n\x08KIND_CPU\x10\x02\x12\x0e\n\nKIND_MODEL\x10\x03\"#\n\x12ModelTensorReshape\x12\r\n\x05shape\x18\x01 \x03(\x03\"\xb2\x02\n\nModelInput\x12\x0c\n\x04name\x18\x01 \x01(\t\x12&\n\tdata_type\x18\x02 \x01(\x0e\x32\x13.inference.DataType\x12,\n\x06\x66ormat\x18\x03 \x01(\x0e\x32\x1c.inference.ModelInput.Format\x12\x0c\n\x04\x64ims\x18\x04 \x03(\x03\x12.\n\x07reshape\x18\x05 \x01(\x0b\x32\x1d.inference.ModelTensorReshape\x12\x17\n\x0fis_shape_tensor\x18\x06 \x01(\x08\x12\x1a\n\x12\x61llow_ragged_batch\x18\x07 \x01(\x08\x12\x10\n\x08optional\x18\x08 \x01(\x08\";\n\x06\x46ormat\x12\x0f\n\x0b\x46ORMAT_NONE\x10\x00\x12\x0f\n\x0b\x46ORMAT_NHWC\x10\x01\x12\x0f\n\x0b\x46ORMAT_NCHW\x10\x02\"\xb2\x01\n\x0bModelOutput\x12\x0c\n\x04name\x18\x01 \x01(\t\x12&\n\tdata_type\x18\x02 \x01(\x0e\x32\x13.inference.DataType\x12\x0c\n\x04\x64ims\x18\x03 \x03(\x03\x12.\n\x07reshape\x18\x05 \x01(\x0b\x32\x1d.inference.ModelTensorReshape\x12\x16\n\x0elabel_filename\x18\x04 \x01(\t\x12\x17\n\x0fis_shape_tensor\x18\x06 \x01(\x08\"\xd9\x02\n\nBatchInput\x12(\n\x04kind\x18\x01 \x01(\x0e\x32\x1a.inference.BatchInput.Kind\x12\x13\n\x0btarget_name\x18\x02 \x03(\t\x12&\n\tdata_type\x18\x03 \x01(\x0e\x32\x13.inference.DataType\x12\x14\n\x0csource_input\x18\x04 \x03(\t\"\xcd\x01\n\x04Kind\x12\x17\n\x13\x42\x41TCH_ELEMENT_COUNT\x10\x00\x12#\n\x1f\x42\x41TCH_ACCUMULATED_ELEMENT_COUNT\x10\x01\x12-\n)BATCH_ACCUMULATED_ELEMENT_COUNT_WITH_ZERO\x10\x02\x12$\n BATCH_MAX_ELEMENT_COUNT_AS_SHAPE\x10\x03\x12\x14\n\x10\x42\x41TCH_ITEM_SHAPE\x10\x04\x12\x1c\n\x18\x42\x41TCH_ITEM_SHAPE_FLATTEN\x10\x05\"\x8f\x01\n\x0b\x42\x61tchOutput\x12\x13\n\x0btarget_name\x18\x01 \x03(\t\x12)\n\x04kind\x18\x02 \x01(\x0e\x32\x1b.inference.BatchOutput.Kind\x12\x14\n\x0csource_input\x18\x03 \x03(\t\"*\n\x04Kind\x12\"\n\x1e\x42\x41TCH_SCATTER_WITH_INPUT_SHAPE\x10\x00\"\x90\x02\n\x12ModelVersionPolicy\x12\x36\n\x06latest\x18\x01 \x01(\x0b\x32$.inference.ModelVersionPolicy.LatestH\x00\x12\x30\n\x03\x61ll\x18\x02 \x01(\x0b\x32!.inference.ModelVersionPolicy.AllH\x00\x12:\n\x08specific\x18\x03 \x01(\x0b\x32&.inference.ModelVersionPolicy.SpecificH\x00\x1a\x1e\n\x06Latest\x12\x14\n\x0cnum_versions\x18\x01 \x01(\r\x1a\x05\n\x03\x41ll\x1a\x1c\n\x08Specific\x12\x10\n\x08versions\x18\x01 \x03(\x03\x42\x0f\n\rpolicy_choice\"\xfd\r\n\x17ModelOptimizationPolicy\x12\x37\n\x05graph\x18\x01 \x01(\x0b\x32(.inference.ModelOptimizationPolicy.Graph\x12\x42\n\x08priority\x18\x02 \x01(\x0e\x32\x30.inference.ModelOptimizationPolicy.ModelPriority\x12\x35\n\x04\x63uda\x18\x03 \x01(\x0b\x32\'.inference.ModelOptimizationPolicy.Cuda\x12X\n\x16\x65xecution_accelerators\x18\x04 \x01(\x0b\x32\x38.inference.ModelOptimizationPolicy.ExecutionAccelerators\x12R\n\x13input_pinned_memory\x18\x05 \x01(\x0b\x32\x35.inference.ModelOptimizationPolicy.PinnedMemoryBuffer\x12S\n\x14output_pinned_memory\x18\x06 \x01(\x0b\x32\x35.inference.ModelOptimizationPolicy.PinnedMemoryBuffer\x12&\n\x1egather_kernel_buffer_threshold\x18\x07 \x01(\r\x12\x16\n\x0e\x65\x61ger_batching\x18\x08 \x01(\x08\x1a\x16\n\x05Graph\x12\r\n\x05level\x18\x01 \x01(\x05\x1a\xba\x05\n\x04\x43uda\x12\x0e\n\x06graphs\x18\x01 \x01(\x08\x12\x18\n\x10\x62usy_wait_events\x18\x02 \x01(\x08\x12\x45\n\ngraph_spec\x18\x03 \x03(\x0b\x32\x31.inference.ModelOptimizationPolicy.Cuda.GraphSpec\x12\x1a\n\x12output_copy_stream\x18\x04 \x01(\x08\x1a\xa4\x04\n\tGraphSpec\x12\x12\n\nbatch_size\x18\x01 \x01(\x05\x12K\n\x05input\x18\x02 \x03(\x0b\x32<.inference.ModelOptimizationPolicy.Cuda.GraphSpec.InputEntry\x12W\n\x11graph_lower_bound\x18\x03 \x01(\x0b\x32<.inference.ModelOptimizationPolicy.Cuda.GraphSpec.LowerBound\x1a\x14\n\x05Shape\x12\x0b\n\x03\x64im\x18\x01 \x03(\x03\x1a\xdf\x01\n\nLowerBound\x12\x12\n\nbatch_size\x18\x01 \x01(\x05\x12V\n\x05input\x18\x02 \x03(\x0b\x32G.inference.ModelOptimizationPolicy.Cuda.GraphSpec.LowerBound.InputEntry\x1a\x65\n\nInputEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\x46\n\x05value\x18\x02 \x01(\x0b\x32\x37.inference.ModelOptimizationPolicy.Cuda.GraphSpec.Shape:\x02\x38\x01\x1a\x65\n\nInputEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\x46\n\x05value\x18\x02 \x01(\x0b\x32\x37.inference.ModelOptimizationPolicy.Cuda.GraphSpec.Shape:\x02\x38\x01\x1a\xa4\x03\n\x15\x45xecutionAccelerators\x12g\n\x19gpu_execution_accelerator\x18\x01 \x03(\x0b\x32\x44.inference.ModelOptimizationPolicy.ExecutionAccelerators.Accelerator\x12g\n\x19\x63pu_execution_accelerator\x18\x02 \x03(\x0b\x32\x44.inference.ModelOptimizationPolicy.ExecutionAccelerators.Accelerator\x1a\xb8\x01\n\x0b\x41\x63\x63\x65lerator\x12\x0c\n\x04name\x18\x01 \x01(\t\x12h\n\nparameters\x18\x02 \x03(\x0b\x32T.inference.ModelOptimizationPolicy.ExecutionAccelerators.Accelerator.ParametersEntry\x1a\x31\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\x1a$\n\x12PinnedMemoryBuffer\x12\x0e\n\x06\x65nable\x18\x01 \x01(\x08\"I\n\rModelPriority\x12\x14\n\x10PRIORITY_DEFAULT\x10\x00\x12\x10\n\x0cPRIORITY_MAX\x10\x01\x12\x10\n\x0cPRIORITY_MIN\x10\x02\"\xdb\x01\n\x10ModelQueuePolicy\x12\x41\n\x0etimeout_action\x18\x01 \x01(\x0e\x32).inference.ModelQueuePolicy.TimeoutAction\x12$\n\x1c\x64\x65\x66\x61ult_timeout_microseconds\x18\x02 \x01(\x04\x12\x1e\n\x16\x61llow_timeout_override\x18\x03 \x01(\x08\x12\x16\n\x0emax_queue_size\x18\x04 \x01(\r\"&\n\rTimeoutAction\x12\n\n\x06REJECT\x10\x00\x12\t\n\x05\x44\x45LAY\x10\x01\"\x9b\x03\n\x14ModelDynamicBatching\x12\x1c\n\x14preferred_batch_size\x18\x01 \x03(\x05\x12$\n\x1cmax_queue_delay_microseconds\x18\x02 \x01(\x04\x12\x19\n\x11preserve_ordering\x18\x03 \x01(\x08\x12\x17\n\x0fpriority_levels\x18\x04 \x01(\r\x12\x1e\n\x16\x64\x65\x66\x61ult_priority_level\x18\x05 \x01(\r\x12\x39\n\x14\x64\x65\x66\x61ult_queue_policy\x18\x06 \x01(\x0b\x32\x1b.inference.ModelQueuePolicy\x12W\n\x15priority_queue_policy\x18\x07 \x03(\x0b\x32\x38.inference.ModelDynamicBatching.PriorityQueuePolicyEntry\x1aW\n\x18PriorityQueuePolicyEntry\x12\x0b\n\x03key\x18\x01 \x01(\r\x12*\n\x05value\x18\x02 \x01(\x0b\x32\x1b.inference.ModelQueuePolicy:\x02\x38\x01\"\xef\t\n\x15ModelSequenceBatching\x12\x41\n\x06\x64irect\x18\x03 \x01(\x0b\x32/.inference.ModelSequenceBatching.StrategyDirectH\x00\x12\x41\n\x06oldest\x18\x04 \x01(\x0b\x32/.inference.ModelSequenceBatching.StrategyOldestH\x00\x12&\n\x1emax_sequence_idle_microseconds\x18\x01 \x01(\x04\x12\x44\n\rcontrol_input\x18\x02 \x03(\x0b\x32-.inference.ModelSequenceBatching.ControlInput\x12\x35\n\x05state\x18\x05 \x03(\x0b\x32&.inference.ModelSequenceBatching.State\x1a\xb1\x02\n\x07\x43ontrol\x12;\n\x04kind\x18\x01 \x01(\x0e\x32-.inference.ModelSequenceBatching.Control.Kind\x12\x18\n\x10int32_false_true\x18\x02 \x03(\x05\x12\x17\n\x0f\x66p32_false_true\x18\x03 \x03(\x02\x12\x17\n\x0f\x62ool_false_true\x18\x05 \x03(\x08\x12&\n\tdata_type\x18\x04 \x01(\x0e\x32\x13.inference.DataType\"u\n\x04Kind\x12\x1a\n\x16\x43ONTROL_SEQUENCE_START\x10\x00\x12\x1a\n\x16\x43ONTROL_SEQUENCE_READY\x10\x01\x12\x18\n\x14\x43ONTROL_SEQUENCE_END\x10\x02\x12\x1b\n\x17\x43ONTROL_SEQUENCE_CORRID\x10\x03\x1aW\n\x0c\x43ontrolInput\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x39\n\x07\x63ontrol\x18\x02 \x03(\x0b\x32(.inference.ModelSequenceBatching.Control\x1a\x8a\x01\n\x0cInitialState\x12&\n\tdata_type\x18\x01 \x01(\x0e\x32\x13.inference.DataType\x12\x0c\n\x04\x64ims\x18\x02 \x03(\x03\x12\x13\n\tzero_data\x18\x03 \x01(\x08H\x00\x12\x13\n\tdata_file\x18\x04 \x01(\tH\x00\x12\x0c\n\x04name\x18\x05 \x01(\tB\x0c\n\nstate_data\x1a\xac\x01\n\x05State\x12\x12\n\ninput_name\x18\x01 \x01(\t\x12\x13\n\x0boutput_name\x18\x02 \x01(\t\x12&\n\tdata_type\x18\x03 \x01(\x0e\x32\x13.inference.DataType\x12\x0c\n\x04\x64ims\x18\x04 \x03(\x03\x12\x44\n\rinitial_state\x18\x05 \x03(\x0b\x32-.inference.ModelSequenceBatching.InitialState\x1aX\n\x0eStrategyDirect\x12$\n\x1cmax_queue_delay_microseconds\x18\x01 \x01(\x04\x12 \n\x18minimum_slot_utilization\x18\x02 \x01(\x02\x1au\n\x0eStrategyOldest\x12\x1f\n\x17max_candidate_sequences\x18\x01 \x01(\x05\x12\x1c\n\x14preferred_batch_size\x18\x02 \x03(\x05\x12$\n\x1cmax_queue_delay_microseconds\x18\x03 \x01(\x04\x42\x11\n\x0fstrategy_choice\"\xf6\x02\n\x0fModelEnsembling\x12-\n\x04step\x18\x01 \x03(\x0b\x32\x1f.inference.ModelEnsembling.Step\x1a\xb3\x02\n\x04Step\x12\x12\n\nmodel_name\x18\x01 \x01(\t\x12\x15\n\rmodel_version\x18\x02 \x01(\x03\x12@\n\tinput_map\x18\x03 \x03(\x0b\x32-.inference.ModelEnsembling.Step.InputMapEntry\x12\x42\n\noutput_map\x18\x04 \x03(\x0b\x32..inference.ModelEnsembling.Step.OutputMapEntry\x12\x17\n\x0fmodel_namespace\x18\x05 \x01(\t\x1a/\n\rInputMapEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\x1a\x30\n\x0eOutputMapEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\"&\n\x0eModelParameter\x12\x14\n\x0cstring_value\x18\x01 \x01(\t\"\xd9\x02\n\x0bModelWarmup\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x12\n\nbatch_size\x18\x02 \x01(\r\x12\x32\n\x06inputs\x18\x03 \x03(\x0b\x32\".inference.ModelWarmup.InputsEntry\x12\r\n\x05\x63ount\x18\x04 \x01(\r\x1a\x97\x01\n\x05Input\x12&\n\tdata_type\x18\x01 \x01(\x0e\x32\x13.inference.DataType\x12\x0c\n\x04\x64ims\x18\x02 \x03(\x03\x12\x13\n\tzero_data\x18\x03 \x01(\x08H\x00\x12\x15\n\x0brandom_data\x18\x04 \x01(\x08H\x00\x12\x19\n\x0finput_data_file\x18\x05 \x01(\tH\x00\x42\x11\n\x0finput_data_type\x1aK\n\x0bInputsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12+\n\x05value\x18\x02 \x01(\x0b\x32\x1c.inference.ModelWarmup.Input:\x02\x38\x01\".\n\x0fModelOperations\x12\x1b\n\x13op_library_filename\x18\x01 \x03(\t\"+\n\x16ModelTransactionPolicy\x12\x11\n\tdecoupled\x18\x01 \x01(\x08\"\xe6\x01\n\x15ModelRepositoryAgents\x12\x36\n\x06\x61gents\x18\x01 \x03(\x0b\x32&.inference.ModelRepositoryAgents.Agent\x1a\x94\x01\n\x05\x41gent\x12\x0c\n\x04name\x18\x01 \x01(\t\x12J\n\nparameters\x18\x02 \x03(\x0b\x32\x36.inference.ModelRepositoryAgents.Agent.ParametersEntry\x1a\x31\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\"$\n\x12ModelResponseCache\x12\x0e\n\x06\x65nable\x18\x01 \x01(\x08\"\xb2\n\n\x0bModelConfig\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x10\n\x08platform\x18\x02 \x01(\t\x12\x0f\n\x07\x62\x61\x63kend\x18\x11 \x01(\t\x12\x35\n\x0eversion_policy\x18\x03 \x01(\x0b\x32\x1d.inference.ModelVersionPolicy\x12\x16\n\x0emax_batch_size\x18\x04 \x01(\x05\x12$\n\x05input\x18\x05 \x03(\x0b\x32\x15.inference.ModelInput\x12&\n\x06output\x18\x06 \x03(\x0b\x32\x16.inference.ModelOutput\x12*\n\x0b\x62\x61tch_input\x18\x14 \x03(\x0b\x32\x15.inference.BatchInput\x12,\n\x0c\x62\x61tch_output\x18\x15 \x03(\x0b\x32\x16.inference.BatchOutput\x12\x38\n\x0coptimization\x18\x0c \x01(\x0b\x32\".inference.ModelOptimizationPolicy\x12;\n\x10\x64ynamic_batching\x18\x0b \x01(\x0b\x32\x1f.inference.ModelDynamicBatchingH\x00\x12=\n\x11sequence_batching\x18\r \x01(\x0b\x32 .inference.ModelSequenceBatchingH\x00\x12\x39\n\x13\x65nsemble_scheduling\x18\x0f \x01(\x0b\x32\x1a.inference.ModelEnsemblingH\x00\x12\x35\n\x0einstance_group\x18\x07 \x03(\x0b\x32\x1d.inference.ModelInstanceGroup\x12\x1e\n\x16\x64\x65\x66\x61ult_model_filename\x18\x08 \x01(\t\x12H\n\x12\x63\x63_model_filenames\x18\t \x03(\x0b\x32,.inference.ModelConfig.CcModelFilenamesEntry\x12;\n\x0bmetric_tags\x18\n \x03(\x0b\x32&.inference.ModelConfig.MetricTagsEntry\x12:\n\nparameters\x18\x0e \x03(\x0b\x32&.inference.ModelConfig.ParametersEntry\x12,\n\x0cmodel_warmup\x18\x10 \x03(\x0b\x32\x16.inference.ModelWarmup\x12\x34\n\x10model_operations\x18\x12 \x01(\x0b\x32\x1a.inference.ModelOperations\x12\x43\n\x18model_transaction_policy\x18\x13 \x01(\x0b\x32!.inference.ModelTransactionPolicy\x12\x41\n\x17model_repository_agents\x18\x17 \x01(\x0b\x32 .inference.ModelRepositoryAgents\x12\x35\n\x0eresponse_cache\x18\x18 \x01(\x0b\x32\x1d.inference.ModelResponseCache\x1a\x37\n\x15\x43\x63ModelFilenamesEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\x1a\x31\n\x0fMetricTagsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\x1aL\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12(\n\x05value\x18\x02 \x01(\x0b\x32\x19.inference.ModelParameter:\x02\x38\x01\x42\x13\n\x11scheduling_choice*\xfa\x01\n\x08\x44\x61taType\x12\x10\n\x0cTYPE_INVALID\x10\x00\x12\r\n\tTYPE_BOOL\x10\x01\x12\x0e\n\nTYPE_UINT8\x10\x02\x12\x0f\n\x0bTYPE_UINT16\x10\x03\x12\x0f\n\x0bTYPE_UINT32\x10\x04\x12\x0f\n\x0bTYPE_UINT64\x10\x05\x12\r\n\tTYPE_INT8\x10\x06\x12\x0e\n\nTYPE_INT16\x10\x07\x12\x0e\n\nTYPE_INT32\x10\x08\x12\x0e\n\nTYPE_INT64\x10\t\x12\r\n\tTYPE_FP16\x10\n\x12\r\n\tTYPE_FP32\x10\x0b\x12\r\n\tTYPE_FP64\x10\x0c\x12\x0f\n\x0bTYPE_STRING\x10\r\x12\r\n\tTYPE_BF16\x10\x0e\x62\x06proto3')
18
+ DESCRIPTOR = _descriptor_pool.Default().AddSerializedFile(b'\n\x12model_config.proto\x12\tinference\"\x96\x01\n\x10ModelRateLimiter\x12\x37\n\tresources\x18\x01 \x03(\x0b\x32$.inference.ModelRateLimiter.Resource\x12\x10\n\x08priority\x18\x02 \x01(\r\x1a\x37\n\x08Resource\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0e\n\x06global\x18\x02 \x01(\x08\x12\r\n\x05\x63ount\x18\x03 \x01(\r\"\x87\x04\n\x12ModelInstanceGroup\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x30\n\x04kind\x18\x04 \x01(\x0e\x32\".inference.ModelInstanceGroup.Kind\x12\r\n\x05\x63ount\x18\x02 \x01(\x05\x12\x31\n\x0crate_limiter\x18\x06 \x01(\x0b\x32\x1b.inference.ModelRateLimiter\x12\x0c\n\x04gpus\x18\x03 \x03(\x05\x12H\n\x11secondary_devices\x18\x08 \x03(\x0b\x32-.inference.ModelInstanceGroup.SecondaryDevice\x12\x0f\n\x07profile\x18\x05 \x03(\t\x12\x0f\n\x07passive\x18\x07 \x01(\x08\x12\x13\n\x0bhost_policy\x18\t \x01(\t\x1a\x9c\x01\n\x0fSecondaryDevice\x12O\n\x04kind\x18\x01 \x01(\x0e\x32\x41.inference.ModelInstanceGroup.SecondaryDevice.SecondaryDeviceKind\x12\x11\n\tdevice_id\x18\x02 \x01(\x03\"%\n\x13SecondaryDeviceKind\x12\x0e\n\nKIND_NVDLA\x10\x00\"A\n\x04Kind\x12\r\n\tKIND_AUTO\x10\x00\x12\x0c\n\x08KIND_GPU\x10\x01\x12\x0c\n\x08KIND_CPU\x10\x02\x12\x0e\n\nKIND_MODEL\x10\x03\"#\n\x12ModelTensorReshape\x12\r\n\x05shape\x18\x01 \x03(\x03\"\xb2\x02\n\nModelInput\x12\x0c\n\x04name\x18\x01 \x01(\t\x12&\n\tdata_type\x18\x02 \x01(\x0e\x32\x13.inference.DataType\x12,\n\x06\x66ormat\x18\x03 \x01(\x0e\x32\x1c.inference.ModelInput.Format\x12\x0c\n\x04\x64ims\x18\x04 \x03(\x03\x12.\n\x07reshape\x18\x05 \x01(\x0b\x32\x1d.inference.ModelTensorReshape\x12\x17\n\x0fis_shape_tensor\x18\x06 \x01(\x08\x12\x1a\n\x12\x61llow_ragged_batch\x18\x07 \x01(\x08\x12\x10\n\x08optional\x18\x08 \x01(\x08\";\n\x06\x46ormat\x12\x0f\n\x0b\x46ORMAT_NONE\x10\x00\x12\x0f\n\x0b\x46ORMAT_NHWC\x10\x01\x12\x0f\n\x0b\x46ORMAT_NCHW\x10\x02\"\xb2\x01\n\x0bModelOutput\x12\x0c\n\x04name\x18\x01 \x01(\t\x12&\n\tdata_type\x18\x02 \x01(\x0e\x32\x13.inference.DataType\x12\x0c\n\x04\x64ims\x18\x03 \x03(\x03\x12.\n\x07reshape\x18\x05 \x01(\x0b\x32\x1d.inference.ModelTensorReshape\x12\x16\n\x0elabel_filename\x18\x04 \x01(\t\x12\x17\n\x0fis_shape_tensor\x18\x06 \x01(\x08\"\xd9\x02\n\nBatchInput\x12(\n\x04kind\x18\x01 \x01(\x0e\x32\x1a.inference.BatchInput.Kind\x12\x13\n\x0btarget_name\x18\x02 \x03(\t\x12&\n\tdata_type\x18\x03 \x01(\x0e\x32\x13.inference.DataType\x12\x14\n\x0csource_input\x18\x04 \x03(\t\"\xcd\x01\n\x04Kind\x12\x17\n\x13\x42\x41TCH_ELEMENT_COUNT\x10\x00\x12#\n\x1f\x42\x41TCH_ACCUMULATED_ELEMENT_COUNT\x10\x01\x12-\n)BATCH_ACCUMULATED_ELEMENT_COUNT_WITH_ZERO\x10\x02\x12$\n BATCH_MAX_ELEMENT_COUNT_AS_SHAPE\x10\x03\x12\x14\n\x10\x42\x41TCH_ITEM_SHAPE\x10\x04\x12\x1c\n\x18\x42\x41TCH_ITEM_SHAPE_FLATTEN\x10\x05\"\x8f\x01\n\x0b\x42\x61tchOutput\x12\x13\n\x0btarget_name\x18\x01 \x03(\t\x12)\n\x04kind\x18\x02 \x01(\x0e\x32\x1b.inference.BatchOutput.Kind\x12\x14\n\x0csource_input\x18\x03 \x03(\t\"*\n\x04Kind\x12\"\n\x1e\x42\x41TCH_SCATTER_WITH_INPUT_SHAPE\x10\x00\"\x90\x02\n\x12ModelVersionPolicy\x12\x36\n\x06latest\x18\x01 \x01(\x0b\x32$.inference.ModelVersionPolicy.LatestH\x00\x12\x30\n\x03\x61ll\x18\x02 \x01(\x0b\x32!.inference.ModelVersionPolicy.AllH\x00\x12:\n\x08specific\x18\x03 \x01(\x0b\x32&.inference.ModelVersionPolicy.SpecificH\x00\x1a\x1e\n\x06Latest\x12\x14\n\x0cnum_versions\x18\x01 \x01(\r\x1a\x05\n\x03\x41ll\x1a\x1c\n\x08Specific\x12\x10\n\x08versions\x18\x01 \x03(\x03\x42\x0f\n\rpolicy_choice\"\xfd\r\n\x17ModelOptimizationPolicy\x12\x37\n\x05graph\x18\x01 \x01(\x0b\x32(.inference.ModelOptimizationPolicy.Graph\x12\x42\n\x08priority\x18\x02 \x01(\x0e\x32\x30.inference.ModelOptimizationPolicy.ModelPriority\x12\x35\n\x04\x63uda\x18\x03 \x01(\x0b\x32\'.inference.ModelOptimizationPolicy.Cuda\x12X\n\x16\x65xecution_accelerators\x18\x04 \x01(\x0b\x32\x38.inference.ModelOptimizationPolicy.ExecutionAccelerators\x12R\n\x13input_pinned_memory\x18\x05 \x01(\x0b\x32\x35.inference.ModelOptimizationPolicy.PinnedMemoryBuffer\x12S\n\x14output_pinned_memory\x18\x06 \x01(\x0b\x32\x35.inference.ModelOptimizationPolicy.PinnedMemoryBuffer\x12&\n\x1egather_kernel_buffer_threshold\x18\x07 \x01(\r\x12\x16\n\x0e\x65\x61ger_batching\x18\x08 \x01(\x08\x1a\x16\n\x05Graph\x12\r\n\x05level\x18\x01 \x01(\x05\x1a\xba\x05\n\x04\x43uda\x12\x0e\n\x06graphs\x18\x01 \x01(\x08\x12\x18\n\x10\x62usy_wait_events\x18\x02 \x01(\x08\x12\x45\n\ngraph_spec\x18\x03 \x03(\x0b\x32\x31.inference.ModelOptimizationPolicy.Cuda.GraphSpec\x12\x1a\n\x12output_copy_stream\x18\x04 \x01(\x08\x1a\xa4\x04\n\tGraphSpec\x12\x12\n\nbatch_size\x18\x01 \x01(\x05\x12K\n\x05input\x18\x02 \x03(\x0b\x32<.inference.ModelOptimizationPolicy.Cuda.GraphSpec.InputEntry\x12W\n\x11graph_lower_bound\x18\x03 \x01(\x0b\x32<.inference.ModelOptimizationPolicy.Cuda.GraphSpec.LowerBound\x1a\x14\n\x05Shape\x12\x0b\n\x03\x64im\x18\x01 \x03(\x03\x1a\xdf\x01\n\nLowerBound\x12\x12\n\nbatch_size\x18\x01 \x01(\x05\x12V\n\x05input\x18\x02 \x03(\x0b\x32G.inference.ModelOptimizationPolicy.Cuda.GraphSpec.LowerBound.InputEntry\x1a\x65\n\nInputEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\x46\n\x05value\x18\x02 \x01(\x0b\x32\x37.inference.ModelOptimizationPolicy.Cuda.GraphSpec.Shape:\x02\x38\x01\x1a\x65\n\nInputEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\x46\n\x05value\x18\x02 \x01(\x0b\x32\x37.inference.ModelOptimizationPolicy.Cuda.GraphSpec.Shape:\x02\x38\x01\x1a\xa4\x03\n\x15\x45xecutionAccelerators\x12g\n\x19gpu_execution_accelerator\x18\x01 \x03(\x0b\x32\x44.inference.ModelOptimizationPolicy.ExecutionAccelerators.Accelerator\x12g\n\x19\x63pu_execution_accelerator\x18\x02 \x03(\x0b\x32\x44.inference.ModelOptimizationPolicy.ExecutionAccelerators.Accelerator\x1a\xb8\x01\n\x0b\x41\x63\x63\x65lerator\x12\x0c\n\x04name\x18\x01 \x01(\t\x12h\n\nparameters\x18\x02 \x03(\x0b\x32T.inference.ModelOptimizationPolicy.ExecutionAccelerators.Accelerator.ParametersEntry\x1a\x31\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\x1a$\n\x12PinnedMemoryBuffer\x12\x0e\n\x06\x65nable\x18\x01 \x01(\x08\"I\n\rModelPriority\x12\x14\n\x10PRIORITY_DEFAULT\x10\x00\x12\x10\n\x0cPRIORITY_MAX\x10\x01\x12\x10\n\x0cPRIORITY_MIN\x10\x02\"\xdb\x01\n\x10ModelQueuePolicy\x12\x41\n\x0etimeout_action\x18\x01 \x01(\x0e\x32).inference.ModelQueuePolicy.TimeoutAction\x12$\n\x1c\x64\x65\x66\x61ult_timeout_microseconds\x18\x02 \x01(\x04\x12\x1e\n\x16\x61llow_timeout_override\x18\x03 \x01(\x08\x12\x16\n\x0emax_queue_size\x18\x04 \x01(\r\"&\n\rTimeoutAction\x12\n\n\x06REJECT\x10\x00\x12\t\n\x05\x44\x45LAY\x10\x01\"\x9b\x03\n\x14ModelDynamicBatching\x12\x1c\n\x14preferred_batch_size\x18\x01 \x03(\x05\x12$\n\x1cmax_queue_delay_microseconds\x18\x02 \x01(\x04\x12\x19\n\x11preserve_ordering\x18\x03 \x01(\x08\x12\x17\n\x0fpriority_levels\x18\x04 \x01(\x04\x12\x1e\n\x16\x64\x65\x66\x61ult_priority_level\x18\x05 \x01(\x04\x12\x39\n\x14\x64\x65\x66\x61ult_queue_policy\x18\x06 \x01(\x0b\x32\x1b.inference.ModelQueuePolicy\x12W\n\x15priority_queue_policy\x18\x07 \x03(\x0b\x32\x38.inference.ModelDynamicBatching.PriorityQueuePolicyEntry\x1aW\n\x18PriorityQueuePolicyEntry\x12\x0b\n\x03key\x18\x01 \x01(\x04\x12*\n\x05value\x18\x02 \x01(\x0b\x32\x1b.inference.ModelQueuePolicy:\x02\x38\x01\"\xef\t\n\x15ModelSequenceBatching\x12\x41\n\x06\x64irect\x18\x03 \x01(\x0b\x32/.inference.ModelSequenceBatching.StrategyDirectH\x00\x12\x41\n\x06oldest\x18\x04 \x01(\x0b\x32/.inference.ModelSequenceBatching.StrategyOldestH\x00\x12&\n\x1emax_sequence_idle_microseconds\x18\x01 \x01(\x04\x12\x44\n\rcontrol_input\x18\x02 \x03(\x0b\x32-.inference.ModelSequenceBatching.ControlInput\x12\x35\n\x05state\x18\x05 \x03(\x0b\x32&.inference.ModelSequenceBatching.State\x1a\xb1\x02\n\x07\x43ontrol\x12;\n\x04kind\x18\x01 \x01(\x0e\x32-.inference.ModelSequenceBatching.Control.Kind\x12\x18\n\x10int32_false_true\x18\x02 \x03(\x05\x12\x17\n\x0f\x66p32_false_true\x18\x03 \x03(\x02\x12\x17\n\x0f\x62ool_false_true\x18\x05 \x03(\x08\x12&\n\tdata_type\x18\x04 \x01(\x0e\x32\x13.inference.DataType\"u\n\x04Kind\x12\x1a\n\x16\x43ONTROL_SEQUENCE_START\x10\x00\x12\x1a\n\x16\x43ONTROL_SEQUENCE_READY\x10\x01\x12\x18\n\x14\x43ONTROL_SEQUENCE_END\x10\x02\x12\x1b\n\x17\x43ONTROL_SEQUENCE_CORRID\x10\x03\x1aW\n\x0c\x43ontrolInput\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x39\n\x07\x63ontrol\x18\x02 \x03(\x0b\x32(.inference.ModelSequenceBatching.Control\x1a\x8a\x01\n\x0cInitialState\x12&\n\tdata_type\x18\x01 \x01(\x0e\x32\x13.inference.DataType\x12\x0c\n\x04\x64ims\x18\x02 \x03(\x03\x12\x13\n\tzero_data\x18\x03 \x01(\x08H\x00\x12\x13\n\tdata_file\x18\x04 \x01(\tH\x00\x12\x0c\n\x04name\x18\x05 \x01(\tB\x0c\n\nstate_data\x1a\xac\x01\n\x05State\x12\x12\n\ninput_name\x18\x01 \x01(\t\x12\x13\n\x0boutput_name\x18\x02 \x01(\t\x12&\n\tdata_type\x18\x03 \x01(\x0e\x32\x13.inference.DataType\x12\x0c\n\x04\x64ims\x18\x04 \x03(\x03\x12\x44\n\rinitial_state\x18\x05 \x03(\x0b\x32-.inference.ModelSequenceBatching.InitialState\x1aX\n\x0eStrategyDirect\x12$\n\x1cmax_queue_delay_microseconds\x18\x01 \x01(\x04\x12 \n\x18minimum_slot_utilization\x18\x02 \x01(\x02\x1au\n\x0eStrategyOldest\x12\x1f\n\x17max_candidate_sequences\x18\x01 \x01(\x05\x12\x1c\n\x14preferred_batch_size\x18\x02 \x03(\x05\x12$\n\x1cmax_queue_delay_microseconds\x18\x03 \x01(\x04\x42\x11\n\x0fstrategy_choice\"\xf6\x02\n\x0fModelEnsembling\x12-\n\x04step\x18\x01 \x03(\x0b\x32\x1f.inference.ModelEnsembling.Step\x1a\xb3\x02\n\x04Step\x12\x12\n\nmodel_name\x18\x01 \x01(\t\x12\x15\n\rmodel_version\x18\x02 \x01(\x03\x12@\n\tinput_map\x18\x03 \x03(\x0b\x32-.inference.ModelEnsembling.Step.InputMapEntry\x12\x42\n\noutput_map\x18\x04 \x03(\x0b\x32..inference.ModelEnsembling.Step.OutputMapEntry\x12\x17\n\x0fmodel_namespace\x18\x05 \x01(\t\x1a/\n\rInputMapEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\x1a\x30\n\x0eOutputMapEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\"&\n\x0eModelParameter\x12\x14\n\x0cstring_value\x18\x01 \x01(\t\"\xd9\x02\n\x0bModelWarmup\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x12\n\nbatch_size\x18\x02 \x01(\r\x12\x32\n\x06inputs\x18\x03 \x03(\x0b\x32\".inference.ModelWarmup.InputsEntry\x12\r\n\x05\x63ount\x18\x04 \x01(\r\x1a\x97\x01\n\x05Input\x12&\n\tdata_type\x18\x01 \x01(\x0e\x32\x13.inference.DataType\x12\x0c\n\x04\x64ims\x18\x02 \x03(\x03\x12\x13\n\tzero_data\x18\x03 \x01(\x08H\x00\x12\x15\n\x0brandom_data\x18\x04 \x01(\x08H\x00\x12\x19\n\x0finput_data_file\x18\x05 \x01(\tH\x00\x42\x11\n\x0finput_data_type\x1aK\n\x0bInputsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12+\n\x05value\x18\x02 \x01(\x0b\x32\x1c.inference.ModelWarmup.Input:\x02\x38\x01\".\n\x0fModelOperations\x12\x1b\n\x13op_library_filename\x18\x01 \x03(\t\"+\n\x16ModelTransactionPolicy\x12\x11\n\tdecoupled\x18\x01 \x01(\x08\"\xe6\x01\n\x15ModelRepositoryAgents\x12\x36\n\x06\x61gents\x18\x01 \x03(\x0b\x32&.inference.ModelRepositoryAgents.Agent\x1a\x94\x01\n\x05\x41gent\x12\x0c\n\x04name\x18\x01 \x01(\t\x12J\n\nparameters\x18\x02 \x03(\x0b\x32\x36.inference.ModelRepositoryAgents.Agent.ParametersEntry\x1a\x31\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\"$\n\x12ModelResponseCache\x12\x0e\n\x06\x65nable\x18\x01 \x01(\x08\"\xb2\n\n\x0bModelConfig\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x10\n\x08platform\x18\x02 \x01(\t\x12\x0f\n\x07\x62\x61\x63kend\x18\x11 \x01(\t\x12\x35\n\x0eversion_policy\x18\x03 \x01(\x0b\x32\x1d.inference.ModelVersionPolicy\x12\x16\n\x0emax_batch_size\x18\x04 \x01(\x05\x12$\n\x05input\x18\x05 \x03(\x0b\x32\x15.inference.ModelInput\x12&\n\x06output\x18\x06 \x03(\x0b\x32\x16.inference.ModelOutput\x12*\n\x0b\x62\x61tch_input\x18\x14 \x03(\x0b\x32\x15.inference.BatchInput\x12,\n\x0c\x62\x61tch_output\x18\x15 \x03(\x0b\x32\x16.inference.BatchOutput\x12\x38\n\x0coptimization\x18\x0c \x01(\x0b\x32\".inference.ModelOptimizationPolicy\x12;\n\x10\x64ynamic_batching\x18\x0b \x01(\x0b\x32\x1f.inference.ModelDynamicBatchingH\x00\x12=\n\x11sequence_batching\x18\r \x01(\x0b\x32 .inference.ModelSequenceBatchingH\x00\x12\x39\n\x13\x65nsemble_scheduling\x18\x0f \x01(\x0b\x32\x1a.inference.ModelEnsemblingH\x00\x12\x35\n\x0einstance_group\x18\x07 \x03(\x0b\x32\x1d.inference.ModelInstanceGroup\x12\x1e\n\x16\x64\x65\x66\x61ult_model_filename\x18\x08 \x01(\t\x12H\n\x12\x63\x63_model_filenames\x18\t \x03(\x0b\x32,.inference.ModelConfig.CcModelFilenamesEntry\x12;\n\x0bmetric_tags\x18\n \x03(\x0b\x32&.inference.ModelConfig.MetricTagsEntry\x12:\n\nparameters\x18\x0e \x03(\x0b\x32&.inference.ModelConfig.ParametersEntry\x12,\n\x0cmodel_warmup\x18\x10 \x03(\x0b\x32\x16.inference.ModelWarmup\x12\x34\n\x10model_operations\x18\x12 \x01(\x0b\x32\x1a.inference.ModelOperations\x12\x43\n\x18model_transaction_policy\x18\x13 \x01(\x0b\x32!.inference.ModelTransactionPolicy\x12\x41\n\x17model_repository_agents\x18\x17 \x01(\x0b\x32 .inference.ModelRepositoryAgents\x12\x35\n\x0eresponse_cache\x18\x18 \x01(\x0b\x32\x1d.inference.ModelResponseCache\x1a\x37\n\x15\x43\x63ModelFilenamesEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\x1a\x31\n\x0fMetricTagsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\x1aL\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12(\n\x05value\x18\x02 \x01(\x0b\x32\x19.inference.ModelParameter:\x02\x38\x01\x42\x13\n\x11scheduling_choice*\xfa\x01\n\x08\x44\x61taType\x12\x10\n\x0cTYPE_INVALID\x10\x00\x12\r\n\tTYPE_BOOL\x10\x01\x12\x0e\n\nTYPE_UINT8\x10\x02\x12\x0f\n\x0bTYPE_UINT16\x10\x03\x12\x0f\n\x0bTYPE_UINT32\x10\x04\x12\x0f\n\x0bTYPE_UINT64\x10\x05\x12\r\n\tTYPE_INT8\x10\x06\x12\x0e\n\nTYPE_INT16\x10\x07\x12\x0e\n\nTYPE_INT32\x10\x08\x12\x0e\n\nTYPE_INT64\x10\t\x12\r\n\tTYPE_FP16\x10\n\x12\r\n\tTYPE_FP32\x10\x0b\x12\r\n\tTYPE_FP64\x10\x0c\x12\x0f\n\x0bTYPE_STRING\x10\r\x12\r\n\tTYPE_BF16\x10\x0e\x62\x06proto3')
19
19
 
20
20
  _DATATYPE = DESCRIPTOR.enum_types_by_name['DataType']
21
21
  DataType = enum_type_wrapper.EnumTypeWrapper(_DATATYPE)
@@ -15,7 +15,7 @@ _sym_db = _symbol_database.Default()
15
15
  from tritonclient.grpc import model_config_pb2 as model__config__pb2
16
16
 
17
17
 
18
- DESCRIPTOR = _descriptor_pool.Default().AddSerializedFile(b'\n\x12grpc_service.proto\x12\tinference\x1a\x12model_config.proto\"\x13\n\x11ServerLiveRequest\"\"\n\x12ServerLiveResponse\x12\x0c\n\x04live\x18\x01 \x01(\x08\"\x14\n\x12ServerReadyRequest\"$\n\x13ServerReadyResponse\x12\r\n\x05ready\x18\x01 \x01(\x08\"2\n\x11ModelReadyRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\"#\n\x12ModelReadyResponse\x12\r\n\x05ready\x18\x01 \x01(\x08\"\x17\n\x15ServerMetadataRequest\"K\n\x16ServerMetadataResponse\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\x12\x12\n\nextensions\x18\x03 \x03(\t\"5\n\x14ModelMetadataRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\"\x8d\x02\n\x15ModelMetadataResponse\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x10\n\x08versions\x18\x02 \x03(\t\x12\x10\n\x08platform\x18\x03 \x01(\t\x12?\n\x06inputs\x18\x04 \x03(\x0b\x32/.inference.ModelMetadataResponse.TensorMetadata\x12@\n\x07outputs\x18\x05 \x03(\x0b\x32/.inference.ModelMetadataResponse.TensorMetadata\x1a?\n\x0eTensorMetadata\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x10\n\x08\x64\x61tatype\x18\x02 \x01(\t\x12\r\n\x05shape\x18\x03 \x03(\x03\"i\n\x0eInferParameter\x12\x14\n\nbool_param\x18\x01 \x01(\x08H\x00\x12\x15\n\x0bint64_param\x18\x02 \x01(\x03H\x00\x12\x16\n\x0cstring_param\x18\x03 \x01(\tH\x00\x42\x12\n\x10parameter_choice\"\xd0\x01\n\x13InferTensorContents\x12\x15\n\rbool_contents\x18\x01 \x03(\x08\x12\x14\n\x0cint_contents\x18\x02 \x03(\x05\x12\x16\n\x0eint64_contents\x18\x03 \x03(\x03\x12\x15\n\ruint_contents\x18\x04 \x03(\r\x12\x17\n\x0fuint64_contents\x18\x05 \x03(\x04\x12\x15\n\rfp32_contents\x18\x06 \x03(\x02\x12\x15\n\rfp64_contents\x18\x07 \x03(\x01\x12\x16\n\x0e\x62ytes_contents\x18\x08 \x03(\x0c\"\xee\x06\n\x11ModelInferRequest\x12\x12\n\nmodel_name\x18\x01 \x01(\t\x12\x15\n\rmodel_version\x18\x02 \x01(\t\x12\n\n\x02id\x18\x03 \x01(\t\x12@\n\nparameters\x18\x04 \x03(\x0b\x32,.inference.ModelInferRequest.ParametersEntry\x12=\n\x06inputs\x18\x05 \x03(\x0b\x32-.inference.ModelInferRequest.InferInputTensor\x12H\n\x07outputs\x18\x06 \x03(\x0b\x32\x37.inference.ModelInferRequest.InferRequestedOutputTensor\x12\x1a\n\x12raw_input_contents\x18\x07 \x03(\x0c\x1a\x94\x02\n\x10InferInputTensor\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x10\n\x08\x64\x61tatype\x18\x02 \x01(\t\x12\r\n\x05shape\x18\x03 \x03(\x03\x12Q\n\nparameters\x18\x04 \x03(\x0b\x32=.inference.ModelInferRequest.InferInputTensor.ParametersEntry\x12\x30\n\x08\x63ontents\x18\x05 \x01(\x0b\x32\x1e.inference.InferTensorContents\x1aL\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12(\n\x05value\x18\x02 \x01(\x0b\x32\x19.inference.InferParameter:\x02\x38\x01\x1a\xd5\x01\n\x1aInferRequestedOutputTensor\x12\x0c\n\x04name\x18\x01 \x01(\t\x12[\n\nparameters\x18\x02 \x03(\x0b\x32G.inference.ModelInferRequest.InferRequestedOutputTensor.ParametersEntry\x1aL\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12(\n\x05value\x18\x02 \x01(\x0b\x32\x19.inference.InferParameter:\x02\x38\x01\x1aL\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12(\n\x05value\x18\x02 \x01(\x0b\x32\x19.inference.InferParameter:\x02\x38\x01\"\xd5\x04\n\x12ModelInferResponse\x12\x12\n\nmodel_name\x18\x01 \x01(\t\x12\x15\n\rmodel_version\x18\x02 \x01(\t\x12\n\n\x02id\x18\x03 \x01(\t\x12\x41\n\nparameters\x18\x04 \x03(\x0b\x32-.inference.ModelInferResponse.ParametersEntry\x12@\n\x07outputs\x18\x05 \x03(\x0b\x32/.inference.ModelInferResponse.InferOutputTensor\x12\x1b\n\x13raw_output_contents\x18\x06 \x03(\x0c\x1a\x97\x02\n\x11InferOutputTensor\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x10\n\x08\x64\x61tatype\x18\x02 \x01(\t\x12\r\n\x05shape\x18\x03 \x03(\x03\x12S\n\nparameters\x18\x04 \x03(\x0b\x32?.inference.ModelInferResponse.InferOutputTensor.ParametersEntry\x12\x30\n\x08\x63ontents\x18\x05 \x01(\x0b\x32\x1e.inference.InferTensorContents\x1aL\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12(\n\x05value\x18\x02 \x01(\x0b\x32\x19.inference.InferParameter:\x02\x38\x01\x1aL\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12(\n\x05value\x18\x02 \x01(\x0b\x32\x19.inference.InferParameter:\x02\x38\x01\"h\n\x18ModelStreamInferResponse\x12\x15\n\rerror_message\x18\x01 \x01(\t\x12\x35\n\x0einfer_response\x18\x02 \x01(\x0b\x32\x1d.inference.ModelInferResponse\"3\n\x12ModelConfigRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\"=\n\x13ModelConfigResponse\x12&\n\x06\x63onfig\x18\x01 \x01(\x0b\x32\x16.inference.ModelConfig\"7\n\x16ModelStatisticsRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\".\n\x11StatisticDuration\x12\r\n\x05\x63ount\x18\x01 \x01(\x04\x12\n\n\x02ns\x18\x02 \x01(\x04\"\x9c\x03\n\x0fInferStatistics\x12-\n\x07success\x18\x01 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12*\n\x04\x66\x61il\x18\x02 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12+\n\x05queue\x18\x03 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12\x33\n\rcompute_input\x18\x04 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12\x33\n\rcompute_infer\x18\x05 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12\x34\n\x0e\x63ompute_output\x18\x06 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12/\n\tcache_hit\x18\x07 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12\x30\n\ncache_miss\x18\x08 \x01(\x0b\x32\x1c.inference.StatisticDuration\"\xca\x01\n\x14InferBatchStatistics\x12\x12\n\nbatch_size\x18\x01 \x01(\x04\x12\x33\n\rcompute_input\x18\x02 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12\x33\n\rcompute_infer\x18\x03 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12\x34\n\x0e\x63ompute_output\x18\x04 \x01(\x0b\x32\x1c.inference.StatisticDuration\"\xe5\x01\n\x0fModelStatistics\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\x12\x16\n\x0elast_inference\x18\x03 \x01(\x04\x12\x17\n\x0finference_count\x18\x04 \x01(\x04\x12\x17\n\x0f\x65xecution_count\x18\x05 \x01(\x04\x12\x33\n\x0finference_stats\x18\x06 \x01(\x0b\x32\x1a.inference.InferStatistics\x12\x34\n\x0b\x62\x61tch_stats\x18\x07 \x03(\x0b\x32\x1f.inference.InferBatchStatistics\"J\n\x17ModelStatisticsResponse\x12/\n\x0bmodel_stats\x18\x01 \x03(\x0b\x32\x1a.inference.ModelStatistics\"\x8a\x01\n\x18ModelRepositoryParameter\x12\x14\n\nbool_param\x18\x01 \x01(\x08H\x00\x12\x15\n\x0bint64_param\x18\x02 \x01(\x03H\x00\x12\x16\n\x0cstring_param\x18\x03 \x01(\tH\x00\x12\x15\n\x0b\x62ytes_param\x18\x04 \x01(\x0cH\x00\x42\x12\n\x10parameter_choice\"@\n\x16RepositoryIndexRequest\x12\x17\n\x0frepository_name\x18\x01 \x01(\t\x12\r\n\x05ready\x18\x02 \x01(\x08\"\xa4\x01\n\x17RepositoryIndexResponse\x12=\n\x06models\x18\x01 \x03(\x0b\x32-.inference.RepositoryIndexResponse.ModelIndex\x1aJ\n\nModelIndex\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\x12\r\n\x05state\x18\x03 \x01(\t\x12\x0e\n\x06reason\x18\x04 \x01(\t\"\xec\x01\n\x1aRepositoryModelLoadRequest\x12\x17\n\x0frepository_name\x18\x01 \x01(\t\x12\x12\n\nmodel_name\x18\x02 \x01(\t\x12I\n\nparameters\x18\x03 \x03(\x0b\x32\x35.inference.RepositoryModelLoadRequest.ParametersEntry\x1aV\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\x32\n\x05value\x18\x02 \x01(\x0b\x32#.inference.ModelRepositoryParameter:\x02\x38\x01\"\x1d\n\x1bRepositoryModelLoadResponse\"\xf0\x01\n\x1cRepositoryModelUnloadRequest\x12\x17\n\x0frepository_name\x18\x01 \x01(\t\x12\x12\n\nmodel_name\x18\x02 \x01(\t\x12K\n\nparameters\x18\x03 \x03(\x0b\x32\x37.inference.RepositoryModelUnloadRequest.ParametersEntry\x1aV\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\x32\n\x05value\x18\x02 \x01(\x0b\x32#.inference.ModelRepositoryParameter:\x02\x38\x01\"\x1f\n\x1dRepositoryModelUnloadResponse\"/\n\x1fSystemSharedMemoryStatusRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\"\xa5\x02\n SystemSharedMemoryStatusResponse\x12I\n\x07regions\x18\x01 \x03(\x0b\x32\x38.inference.SystemSharedMemoryStatusResponse.RegionsEntry\x1aL\n\x0cRegionStatus\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0b\n\x03key\x18\x02 \x01(\t\x12\x0e\n\x06offset\x18\x03 \x01(\x04\x12\x11\n\tbyte_size\x18\x04 \x01(\x04\x1ah\n\x0cRegionsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12G\n\x05value\x18\x02 \x01(\x0b\x32\x38.inference.SystemSharedMemoryStatusResponse.RegionStatus:\x02\x38\x01\"a\n!SystemSharedMemoryRegisterRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0b\n\x03key\x18\x02 \x01(\t\x12\x0e\n\x06offset\x18\x03 \x01(\x04\x12\x11\n\tbyte_size\x18\x04 \x01(\x04\"$\n\"SystemSharedMemoryRegisterResponse\"3\n#SystemSharedMemoryUnregisterRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\"&\n$SystemSharedMemoryUnregisterResponse\"-\n\x1d\x43udaSharedMemoryStatusRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\"\x95\x02\n\x1e\x43udaSharedMemoryStatusResponse\x12G\n\x07regions\x18\x01 \x03(\x0b\x32\x36.inference.CudaSharedMemoryStatusResponse.RegionsEntry\x1a\x42\n\x0cRegionStatus\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x11\n\tdevice_id\x18\x02 \x01(\x04\x12\x11\n\tbyte_size\x18\x03 \x01(\x04\x1a\x66\n\x0cRegionsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\x45\n\x05value\x18\x02 \x01(\x0b\x32\x36.inference.CudaSharedMemoryStatusResponse.RegionStatus:\x02\x38\x01\"i\n\x1f\x43udaSharedMemoryRegisterRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x12\n\nraw_handle\x18\x02 \x01(\x0c\x12\x11\n\tdevice_id\x18\x03 \x01(\x03\x12\x11\n\tbyte_size\x18\x04 \x01(\x04\"\"\n CudaSharedMemoryRegisterResponse\"1\n!CudaSharedMemoryUnregisterRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\"$\n\"CudaSharedMemoryUnregisterResponse\"\xe6\x01\n\x13TraceSettingRequest\x12>\n\x08settings\x18\x01 \x03(\x0b\x32,.inference.TraceSettingRequest.SettingsEntry\x12\x12\n\nmodel_name\x18\x02 \x01(\t\x1a\x1d\n\x0cSettingValue\x12\r\n\x05value\x18\x01 \x03(\t\x1a\\\n\rSettingsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12:\n\x05value\x18\x02 \x01(\x0b\x32+.inference.TraceSettingRequest.SettingValue:\x02\x38\x01\"\xd5\x01\n\x14TraceSettingResponse\x12?\n\x08settings\x18\x01 \x03(\x0b\x32-.inference.TraceSettingResponse.SettingsEntry\x1a\x1d\n\x0cSettingValue\x12\r\n\x05value\x18\x01 \x03(\t\x1a]\n\rSettingsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12;\n\x05value\x18\x02 \x01(\x0b\x32,.inference.TraceSettingResponse.SettingValue:\x02\x38\x01\"\x9a\x02\n\x12LogSettingsRequest\x12=\n\x08settings\x18\x01 \x03(\x0b\x32+.inference.LogSettingsRequest.SettingsEntry\x1ah\n\x0cSettingValue\x12\x14\n\nbool_param\x18\x01 \x01(\x08H\x00\x12\x16\n\x0cuint32_param\x18\x02 \x01(\rH\x00\x12\x16\n\x0cstring_param\x18\x03 \x01(\tH\x00\x42\x12\n\x10parameter_choice\x1a[\n\rSettingsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\x39\n\x05value\x18\x02 \x01(\x0b\x32*.inference.LogSettingsRequest.SettingValue:\x02\x38\x01\"\x9d\x02\n\x13LogSettingsResponse\x12>\n\x08settings\x18\x01 \x03(\x0b\x32,.inference.LogSettingsResponse.SettingsEntry\x1ah\n\x0cSettingValue\x12\x14\n\nbool_param\x18\x01 \x01(\x08H\x00\x12\x16\n\x0cuint32_param\x18\x02 \x01(\rH\x00\x12\x16\n\x0cstring_param\x18\x03 \x01(\tH\x00\x42\x12\n\x10parameter_choice\x1a\\\n\rSettingsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12:\n\x05value\x18\x02 \x01(\x0b\x32+.inference.LogSettingsResponse.SettingValue:\x02\x38\x01\x32\xb7\x0f\n\x14GRPCInferenceService\x12K\n\nServerLive\x12\x1c.inference.ServerLiveRequest\x1a\x1d.inference.ServerLiveResponse\"\x00\x12N\n\x0bServerReady\x12\x1d.inference.ServerReadyRequest\x1a\x1e.inference.ServerReadyResponse\"\x00\x12K\n\nModelReady\x12\x1c.inference.ModelReadyRequest\x1a\x1d.inference.ModelReadyResponse\"\x00\x12W\n\x0eServerMetadata\x12 .inference.ServerMetadataRequest\x1a!.inference.ServerMetadataResponse\"\x00\x12T\n\rModelMetadata\x12\x1f.inference.ModelMetadataRequest\x1a .inference.ModelMetadataResponse\"\x00\x12K\n\nModelInfer\x12\x1c.inference.ModelInferRequest\x1a\x1d.inference.ModelInferResponse\"\x00\x12[\n\x10ModelStreamInfer\x12\x1c.inference.ModelInferRequest\x1a#.inference.ModelStreamInferResponse\"\x00(\x01\x30\x01\x12N\n\x0bModelConfig\x12\x1d.inference.ModelConfigRequest\x1a\x1e.inference.ModelConfigResponse\"\x00\x12Z\n\x0fModelStatistics\x12!.inference.ModelStatisticsRequest\x1a\".inference.ModelStatisticsResponse\"\x00\x12Z\n\x0fRepositoryIndex\x12!.inference.RepositoryIndexRequest\x1a\".inference.RepositoryIndexResponse\"\x00\x12\x66\n\x13RepositoryModelLoad\x12%.inference.RepositoryModelLoadRequest\x1a&.inference.RepositoryModelLoadResponse\"\x00\x12l\n\x15RepositoryModelUnload\x12\'.inference.RepositoryModelUnloadRequest\x1a(.inference.RepositoryModelUnloadResponse\"\x00\x12u\n\x18SystemSharedMemoryStatus\x12*.inference.SystemSharedMemoryStatusRequest\x1a+.inference.SystemSharedMemoryStatusResponse\"\x00\x12{\n\x1aSystemSharedMemoryRegister\x12,.inference.SystemSharedMemoryRegisterRequest\x1a-.inference.SystemSharedMemoryRegisterResponse\"\x00\x12\x81\x01\n\x1cSystemSharedMemoryUnregister\x12..inference.SystemSharedMemoryUnregisterRequest\x1a/.inference.SystemSharedMemoryUnregisterResponse\"\x00\x12o\n\x16\x43udaSharedMemoryStatus\x12(.inference.CudaSharedMemoryStatusRequest\x1a).inference.CudaSharedMemoryStatusResponse\"\x00\x12u\n\x18\x43udaSharedMemoryRegister\x12*.inference.CudaSharedMemoryRegisterRequest\x1a+.inference.CudaSharedMemoryRegisterResponse\"\x00\x12{\n\x1a\x43udaSharedMemoryUnregister\x12,.inference.CudaSharedMemoryUnregisterRequest\x1a-.inference.CudaSharedMemoryUnregisterResponse\"\x00\x12Q\n\x0cTraceSetting\x12\x1e.inference.TraceSettingRequest\x1a\x1f.inference.TraceSettingResponse\"\x00\x12N\n\x0bLogSettings\x12\x1d.inference.LogSettingsRequest\x1a\x1e.inference.LogSettingsResponse\"\x00\x62\x06proto3')
18
+ DESCRIPTOR = _descriptor_pool.Default().AddSerializedFile(b'\n\x12grpc_service.proto\x12\tinference\x1a\x12model_config.proto\"\x13\n\x11ServerLiveRequest\"\"\n\x12ServerLiveResponse\x12\x0c\n\x04live\x18\x01 \x01(\x08\"\x14\n\x12ServerReadyRequest\"$\n\x13ServerReadyResponse\x12\r\n\x05ready\x18\x01 \x01(\x08\"2\n\x11ModelReadyRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\"#\n\x12ModelReadyResponse\x12\r\n\x05ready\x18\x01 \x01(\x08\"\x17\n\x15ServerMetadataRequest\"K\n\x16ServerMetadataResponse\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\x12\x12\n\nextensions\x18\x03 \x03(\t\"5\n\x14ModelMetadataRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\"\x8d\x02\n\x15ModelMetadataResponse\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x10\n\x08versions\x18\x02 \x03(\t\x12\x10\n\x08platform\x18\x03 \x01(\t\x12?\n\x06inputs\x18\x04 \x03(\x0b\x32/.inference.ModelMetadataResponse.TensorMetadata\x12@\n\x07outputs\x18\x05 \x03(\x0b\x32/.inference.ModelMetadataResponse.TensorMetadata\x1a?\n\x0eTensorMetadata\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x10\n\x08\x64\x61tatype\x18\x02 \x01(\t\x12\r\n\x05shape\x18\x03 \x03(\x03\"\x99\x01\n\x0eInferParameter\x12\x14\n\nbool_param\x18\x01 \x01(\x08H\x00\x12\x15\n\x0bint64_param\x18\x02 \x01(\x03H\x00\x12\x16\n\x0cstring_param\x18\x03 \x01(\tH\x00\x12\x16\n\x0c\x64ouble_param\x18\x04 \x01(\x01H\x00\x12\x16\n\x0cuint64_param\x18\x05 \x01(\x04H\x00\x42\x12\n\x10parameter_choice\"\xd0\x01\n\x13InferTensorContents\x12\x15\n\rbool_contents\x18\x01 \x03(\x08\x12\x14\n\x0cint_contents\x18\x02 \x03(\x05\x12\x16\n\x0eint64_contents\x18\x03 \x03(\x03\x12\x15\n\ruint_contents\x18\x04 \x03(\r\x12\x17\n\x0fuint64_contents\x18\x05 \x03(\x04\x12\x15\n\rfp32_contents\x18\x06 \x03(\x02\x12\x15\n\rfp64_contents\x18\x07 \x03(\x01\x12\x16\n\x0e\x62ytes_contents\x18\x08 \x03(\x0c\"\xee\x06\n\x11ModelInferRequest\x12\x12\n\nmodel_name\x18\x01 \x01(\t\x12\x15\n\rmodel_version\x18\x02 \x01(\t\x12\n\n\x02id\x18\x03 \x01(\t\x12@\n\nparameters\x18\x04 \x03(\x0b\x32,.inference.ModelInferRequest.ParametersEntry\x12=\n\x06inputs\x18\x05 \x03(\x0b\x32-.inference.ModelInferRequest.InferInputTensor\x12H\n\x07outputs\x18\x06 \x03(\x0b\x32\x37.inference.ModelInferRequest.InferRequestedOutputTensor\x12\x1a\n\x12raw_input_contents\x18\x07 \x03(\x0c\x1a\x94\x02\n\x10InferInputTensor\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x10\n\x08\x64\x61tatype\x18\x02 \x01(\t\x12\r\n\x05shape\x18\x03 \x03(\x03\x12Q\n\nparameters\x18\x04 \x03(\x0b\x32=.inference.ModelInferRequest.InferInputTensor.ParametersEntry\x12\x30\n\x08\x63ontents\x18\x05 \x01(\x0b\x32\x1e.inference.InferTensorContents\x1aL\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12(\n\x05value\x18\x02 \x01(\x0b\x32\x19.inference.InferParameter:\x02\x38\x01\x1a\xd5\x01\n\x1aInferRequestedOutputTensor\x12\x0c\n\x04name\x18\x01 \x01(\t\x12[\n\nparameters\x18\x02 \x03(\x0b\x32G.inference.ModelInferRequest.InferRequestedOutputTensor.ParametersEntry\x1aL\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12(\n\x05value\x18\x02 \x01(\x0b\x32\x19.inference.InferParameter:\x02\x38\x01\x1aL\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12(\n\x05value\x18\x02 \x01(\x0b\x32\x19.inference.InferParameter:\x02\x38\x01\"\xd5\x04\n\x12ModelInferResponse\x12\x12\n\nmodel_name\x18\x01 \x01(\t\x12\x15\n\rmodel_version\x18\x02 \x01(\t\x12\n\n\x02id\x18\x03 \x01(\t\x12\x41\n\nparameters\x18\x04 \x03(\x0b\x32-.inference.ModelInferResponse.ParametersEntry\x12@\n\x07outputs\x18\x05 \x03(\x0b\x32/.inference.ModelInferResponse.InferOutputTensor\x12\x1b\n\x13raw_output_contents\x18\x06 \x03(\x0c\x1a\x97\x02\n\x11InferOutputTensor\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x10\n\x08\x64\x61tatype\x18\x02 \x01(\t\x12\r\n\x05shape\x18\x03 \x03(\x03\x12S\n\nparameters\x18\x04 \x03(\x0b\x32?.inference.ModelInferResponse.InferOutputTensor.ParametersEntry\x12\x30\n\x08\x63ontents\x18\x05 \x01(\x0b\x32\x1e.inference.InferTensorContents\x1aL\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12(\n\x05value\x18\x02 \x01(\x0b\x32\x19.inference.InferParameter:\x02\x38\x01\x1aL\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12(\n\x05value\x18\x02 \x01(\x0b\x32\x19.inference.InferParameter:\x02\x38\x01\"h\n\x18ModelStreamInferResponse\x12\x15\n\rerror_message\x18\x01 \x01(\t\x12\x35\n\x0einfer_response\x18\x02 \x01(\x0b\x32\x1d.inference.ModelInferResponse\"3\n\x12ModelConfigRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\"=\n\x13ModelConfigResponse\x12&\n\x06\x63onfig\x18\x01 \x01(\x0b\x32\x16.inference.ModelConfig\"7\n\x16ModelStatisticsRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\".\n\x11StatisticDuration\x12\r\n\x05\x63ount\x18\x01 \x01(\x04\x12\n\n\x02ns\x18\x02 \x01(\x04\"\x9c\x03\n\x0fInferStatistics\x12-\n\x07success\x18\x01 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12*\n\x04\x66\x61il\x18\x02 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12+\n\x05queue\x18\x03 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12\x33\n\rcompute_input\x18\x04 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12\x33\n\rcompute_infer\x18\x05 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12\x34\n\x0e\x63ompute_output\x18\x06 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12/\n\tcache_hit\x18\x07 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12\x30\n\ncache_miss\x18\x08 \x01(\x0b\x32\x1c.inference.StatisticDuration\"\xca\x01\n\x14InferBatchStatistics\x12\x12\n\nbatch_size\x18\x01 \x01(\x04\x12\x33\n\rcompute_input\x18\x02 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12\x33\n\rcompute_infer\x18\x03 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12\x34\n\x0e\x63ompute_output\x18\x04 \x01(\x0b\x32\x1c.inference.StatisticDuration\":\n\x0bMemoryUsage\x12\x0c\n\x04type\x18\x01 \x01(\t\x12\n\n\x02id\x18\x02 \x01(\x03\x12\x11\n\tbyte_size\x18\x03 \x01(\x04\"\x93\x02\n\x0fModelStatistics\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\x12\x16\n\x0elast_inference\x18\x03 \x01(\x04\x12\x17\n\x0finference_count\x18\x04 \x01(\x04\x12\x17\n\x0f\x65xecution_count\x18\x05 \x01(\x04\x12\x33\n\x0finference_stats\x18\x06 \x01(\x0b\x32\x1a.inference.InferStatistics\x12\x34\n\x0b\x62\x61tch_stats\x18\x07 \x03(\x0b\x32\x1f.inference.InferBatchStatistics\x12,\n\x0cmemory_usage\x18\x08 \x03(\x0b\x32\x16.inference.MemoryUsage\"J\n\x17ModelStatisticsResponse\x12/\n\x0bmodel_stats\x18\x01 \x03(\x0b\x32\x1a.inference.ModelStatistics\"\x8a\x01\n\x18ModelRepositoryParameter\x12\x14\n\nbool_param\x18\x01 \x01(\x08H\x00\x12\x15\n\x0bint64_param\x18\x02 \x01(\x03H\x00\x12\x16\n\x0cstring_param\x18\x03 \x01(\tH\x00\x12\x15\n\x0b\x62ytes_param\x18\x04 \x01(\x0cH\x00\x42\x12\n\x10parameter_choice\"@\n\x16RepositoryIndexRequest\x12\x17\n\x0frepository_name\x18\x01 \x01(\t\x12\r\n\x05ready\x18\x02 \x01(\x08\"\xa4\x01\n\x17RepositoryIndexResponse\x12=\n\x06models\x18\x01 \x03(\x0b\x32-.inference.RepositoryIndexResponse.ModelIndex\x1aJ\n\nModelIndex\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\x12\r\n\x05state\x18\x03 \x01(\t\x12\x0e\n\x06reason\x18\x04 \x01(\t\"\xec\x01\n\x1aRepositoryModelLoadRequest\x12\x17\n\x0frepository_name\x18\x01 \x01(\t\x12\x12\n\nmodel_name\x18\x02 \x01(\t\x12I\n\nparameters\x18\x03 \x03(\x0b\x32\x35.inference.RepositoryModelLoadRequest.ParametersEntry\x1aV\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\x32\n\x05value\x18\x02 \x01(\x0b\x32#.inference.ModelRepositoryParameter:\x02\x38\x01\"\x1d\n\x1bRepositoryModelLoadResponse\"\xf0\x01\n\x1cRepositoryModelUnloadRequest\x12\x17\n\x0frepository_name\x18\x01 \x01(\t\x12\x12\n\nmodel_name\x18\x02 \x01(\t\x12K\n\nparameters\x18\x03 \x03(\x0b\x32\x37.inference.RepositoryModelUnloadRequest.ParametersEntry\x1aV\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\x32\n\x05value\x18\x02 \x01(\x0b\x32#.inference.ModelRepositoryParameter:\x02\x38\x01\"\x1f\n\x1dRepositoryModelUnloadResponse\"/\n\x1fSystemSharedMemoryStatusRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\"\xa5\x02\n SystemSharedMemoryStatusResponse\x12I\n\x07regions\x18\x01 \x03(\x0b\x32\x38.inference.SystemSharedMemoryStatusResponse.RegionsEntry\x1aL\n\x0cRegionStatus\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0b\n\x03key\x18\x02 \x01(\t\x12\x0e\n\x06offset\x18\x03 \x01(\x04\x12\x11\n\tbyte_size\x18\x04 \x01(\x04\x1ah\n\x0cRegionsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12G\n\x05value\x18\x02 \x01(\x0b\x32\x38.inference.SystemSharedMemoryStatusResponse.RegionStatus:\x02\x38\x01\"a\n!SystemSharedMemoryRegisterRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0b\n\x03key\x18\x02 \x01(\t\x12\x0e\n\x06offset\x18\x03 \x01(\x04\x12\x11\n\tbyte_size\x18\x04 \x01(\x04\"$\n\"SystemSharedMemoryRegisterResponse\"3\n#SystemSharedMemoryUnregisterRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\"&\n$SystemSharedMemoryUnregisterResponse\"-\n\x1d\x43udaSharedMemoryStatusRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\"\x95\x02\n\x1e\x43udaSharedMemoryStatusResponse\x12G\n\x07regions\x18\x01 \x03(\x0b\x32\x36.inference.CudaSharedMemoryStatusResponse.RegionsEntry\x1a\x42\n\x0cRegionStatus\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x11\n\tdevice_id\x18\x02 \x01(\x04\x12\x11\n\tbyte_size\x18\x03 \x01(\x04\x1a\x66\n\x0cRegionsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\x45\n\x05value\x18\x02 \x01(\x0b\x32\x36.inference.CudaSharedMemoryStatusResponse.RegionStatus:\x02\x38\x01\"i\n\x1f\x43udaSharedMemoryRegisterRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x12\n\nraw_handle\x18\x02 \x01(\x0c\x12\x11\n\tdevice_id\x18\x03 \x01(\x03\x12\x11\n\tbyte_size\x18\x04 \x01(\x04\"\"\n CudaSharedMemoryRegisterResponse\"1\n!CudaSharedMemoryUnregisterRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\"$\n\"CudaSharedMemoryUnregisterResponse\"\xe6\x01\n\x13TraceSettingRequest\x12>\n\x08settings\x18\x01 \x03(\x0b\x32,.inference.TraceSettingRequest.SettingsEntry\x12\x12\n\nmodel_name\x18\x02 \x01(\t\x1a\x1d\n\x0cSettingValue\x12\r\n\x05value\x18\x01 \x03(\t\x1a\\\n\rSettingsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12:\n\x05value\x18\x02 \x01(\x0b\x32+.inference.TraceSettingRequest.SettingValue:\x02\x38\x01\"\xd5\x01\n\x14TraceSettingResponse\x12?\n\x08settings\x18\x01 \x03(\x0b\x32-.inference.TraceSettingResponse.SettingsEntry\x1a\x1d\n\x0cSettingValue\x12\r\n\x05value\x18\x01 \x03(\t\x1a]\n\rSettingsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12;\n\x05value\x18\x02 \x01(\x0b\x32,.inference.TraceSettingResponse.SettingValue:\x02\x38\x01\"\x9a\x02\n\x12LogSettingsRequest\x12=\n\x08settings\x18\x01 \x03(\x0b\x32+.inference.LogSettingsRequest.SettingsEntry\x1ah\n\x0cSettingValue\x12\x14\n\nbool_param\x18\x01 \x01(\x08H\x00\x12\x16\n\x0cuint32_param\x18\x02 \x01(\rH\x00\x12\x16\n\x0cstring_param\x18\x03 \x01(\tH\x00\x42\x12\n\x10parameter_choice\x1a[\n\rSettingsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\x39\n\x05value\x18\x02 \x01(\x0b\x32*.inference.LogSettingsRequest.SettingValue:\x02\x38\x01\"\x9d\x02\n\x13LogSettingsResponse\x12>\n\x08settings\x18\x01 \x03(\x0b\x32,.inference.LogSettingsResponse.SettingsEntry\x1ah\n\x0cSettingValue\x12\x14\n\nbool_param\x18\x01 \x01(\x08H\x00\x12\x16\n\x0cuint32_param\x18\x02 \x01(\rH\x00\x12\x16\n\x0cstring_param\x18\x03 \x01(\tH\x00\x42\x12\n\x10parameter_choice\x1a\\\n\rSettingsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12:\n\x05value\x18\x02 \x01(\x0b\x32+.inference.LogSettingsResponse.SettingValue:\x02\x38\x01\x32\xb7\x0f\n\x14GRPCInferenceService\x12K\n\nServerLive\x12\x1c.inference.ServerLiveRequest\x1a\x1d.inference.ServerLiveResponse\"\x00\x12N\n\x0bServerReady\x12\x1d.inference.ServerReadyRequest\x1a\x1e.inference.ServerReadyResponse\"\x00\x12K\n\nModelReady\x12\x1c.inference.ModelReadyRequest\x1a\x1d.inference.ModelReadyResponse\"\x00\x12W\n\x0eServerMetadata\x12 .inference.ServerMetadataRequest\x1a!.inference.ServerMetadataResponse\"\x00\x12T\n\rModelMetadata\x12\x1f.inference.ModelMetadataRequest\x1a .inference.ModelMetadataResponse\"\x00\x12K\n\nModelInfer\x12\x1c.inference.ModelInferRequest\x1a\x1d.inference.ModelInferResponse\"\x00\x12[\n\x10ModelStreamInfer\x12\x1c.inference.ModelInferRequest\x1a#.inference.ModelStreamInferResponse\"\x00(\x01\x30\x01\x12N\n\x0bModelConfig\x12\x1d.inference.ModelConfigRequest\x1a\x1e.inference.ModelConfigResponse\"\x00\x12Z\n\x0fModelStatistics\x12!.inference.ModelStatisticsRequest\x1a\".inference.ModelStatisticsResponse\"\x00\x12Z\n\x0fRepositoryIndex\x12!.inference.RepositoryIndexRequest\x1a\".inference.RepositoryIndexResponse\"\x00\x12\x66\n\x13RepositoryModelLoad\x12%.inference.RepositoryModelLoadRequest\x1a&.inference.RepositoryModelLoadResponse\"\x00\x12l\n\x15RepositoryModelUnload\x12\'.inference.RepositoryModelUnloadRequest\x1a(.inference.RepositoryModelUnloadResponse\"\x00\x12u\n\x18SystemSharedMemoryStatus\x12*.inference.SystemSharedMemoryStatusRequest\x1a+.inference.SystemSharedMemoryStatusResponse\"\x00\x12{\n\x1aSystemSharedMemoryRegister\x12,.inference.SystemSharedMemoryRegisterRequest\x1a-.inference.SystemSharedMemoryRegisterResponse\"\x00\x12\x81\x01\n\x1cSystemSharedMemoryUnregister\x12..inference.SystemSharedMemoryUnregisterRequest\x1a/.inference.SystemSharedMemoryUnregisterResponse\"\x00\x12o\n\x16\x43udaSharedMemoryStatus\x12(.inference.CudaSharedMemoryStatusRequest\x1a).inference.CudaSharedMemoryStatusResponse\"\x00\x12u\n\x18\x43udaSharedMemoryRegister\x12*.inference.CudaSharedMemoryRegisterRequest\x1a+.inference.CudaSharedMemoryRegisterResponse\"\x00\x12{\n\x1a\x43udaSharedMemoryUnregister\x12,.inference.CudaSharedMemoryUnregisterRequest\x1a-.inference.CudaSharedMemoryUnregisterResponse\"\x00\x12Q\n\x0cTraceSetting\x12\x1e.inference.TraceSettingRequest\x1a\x1f.inference.TraceSettingResponse\"\x00\x12N\n\x0bLogSettings\x12\x1d.inference.LogSettingsRequest\x1a\x1e.inference.LogSettingsResponse\"\x00\x62\x06proto3')
19
19
 
20
20
 
21
21
 
@@ -49,6 +49,7 @@ _MODELSTATISTICSREQUEST = DESCRIPTOR.message_types_by_name['ModelStatisticsReque
49
49
  _STATISTICDURATION = DESCRIPTOR.message_types_by_name['StatisticDuration']
50
50
  _INFERSTATISTICS = DESCRIPTOR.message_types_by_name['InferStatistics']
51
51
  _INFERBATCHSTATISTICS = DESCRIPTOR.message_types_by_name['InferBatchStatistics']
52
+ _MEMORYUSAGE = DESCRIPTOR.message_types_by_name['MemoryUsage']
52
53
  _MODELSTATISTICS = DESCRIPTOR.message_types_by_name['ModelStatistics']
53
54
  _MODELSTATISTICSRESPONSE = DESCRIPTOR.message_types_by_name['ModelStatisticsResponse']
54
55
  _MODELREPOSITORYPARAMETER = DESCRIPTOR.message_types_by_name['ModelRepositoryParameter']
@@ -308,6 +309,13 @@ InferBatchStatistics = _reflection.GeneratedProtocolMessageType('InferBatchStati
308
309
  })
309
310
  _sym_db.RegisterMessage(InferBatchStatistics)
310
311
 
312
+ MemoryUsage = _reflection.GeneratedProtocolMessageType('MemoryUsage', (_message.Message,), {
313
+ 'DESCRIPTOR' : _MEMORYUSAGE,
314
+ '__module__' : 'grpc_service_pb2'
315
+ # @@protoc_insertion_point(class_scope:inference.MemoryUsage)
316
+ })
317
+ _sym_db.RegisterMessage(MemoryUsage)
318
+
311
319
  ModelStatistics = _reflection.GeneratedProtocolMessageType('ModelStatistics', (_message.Message,), {
312
320
  'DESCRIPTOR' : _MODELSTATISTICS,
313
321
  '__module__' : 'grpc_service_pb2'
@@ -655,124 +663,126 @@ if _descriptor._USE_C_DESCRIPTORS == False:
655
663
  _MODELMETADATARESPONSE._serialized_end=686
656
664
  _MODELMETADATARESPONSE_TENSORMETADATA._serialized_start=623
657
665
  _MODELMETADATARESPONSE_TENSORMETADATA._serialized_end=686
658
- _INFERPARAMETER._serialized_start=688
659
- _INFERPARAMETER._serialized_end=793
660
- _INFERTENSORCONTENTS._serialized_start=796
661
- _INFERTENSORCONTENTS._serialized_end=1004
662
- _MODELINFERREQUEST._serialized_start=1007
663
- _MODELINFERREQUEST._serialized_end=1885
664
- _MODELINFERREQUEST_INFERINPUTTENSOR._serialized_start=1315
665
- _MODELINFERREQUEST_INFERINPUTTENSOR._serialized_end=1591
666
- _MODELINFERREQUEST_INFERINPUTTENSOR_PARAMETERSENTRY._serialized_start=1515
667
- _MODELINFERREQUEST_INFERINPUTTENSOR_PARAMETERSENTRY._serialized_end=1591
668
- _MODELINFERREQUEST_INFERREQUESTEDOUTPUTTENSOR._serialized_start=1594
669
- _MODELINFERREQUEST_INFERREQUESTEDOUTPUTTENSOR._serialized_end=1807
670
- _MODELINFERREQUEST_INFERREQUESTEDOUTPUTTENSOR_PARAMETERSENTRY._serialized_start=1515
671
- _MODELINFERREQUEST_INFERREQUESTEDOUTPUTTENSOR_PARAMETERSENTRY._serialized_end=1591
672
- _MODELINFERREQUEST_PARAMETERSENTRY._serialized_start=1515
673
- _MODELINFERREQUEST_PARAMETERSENTRY._serialized_end=1591
674
- _MODELINFERRESPONSE._serialized_start=1888
675
- _MODELINFERRESPONSE._serialized_end=2485
676
- _MODELINFERRESPONSE_INFEROUTPUTTENSOR._serialized_start=2128
677
- _MODELINFERRESPONSE_INFEROUTPUTTENSOR._serialized_end=2407
678
- _MODELINFERRESPONSE_INFEROUTPUTTENSOR_PARAMETERSENTRY._serialized_start=1515
679
- _MODELINFERRESPONSE_INFEROUTPUTTENSOR_PARAMETERSENTRY._serialized_end=1591
680
- _MODELINFERRESPONSE_PARAMETERSENTRY._serialized_start=1515
681
- _MODELINFERRESPONSE_PARAMETERSENTRY._serialized_end=1591
682
- _MODELSTREAMINFERRESPONSE._serialized_start=2487
683
- _MODELSTREAMINFERRESPONSE._serialized_end=2591
684
- _MODELCONFIGREQUEST._serialized_start=2593
685
- _MODELCONFIGREQUEST._serialized_end=2644
686
- _MODELCONFIGRESPONSE._serialized_start=2646
687
- _MODELCONFIGRESPONSE._serialized_end=2707
688
- _MODELSTATISTICSREQUEST._serialized_start=2709
689
- _MODELSTATISTICSREQUEST._serialized_end=2764
690
- _STATISTICDURATION._serialized_start=2766
691
- _STATISTICDURATION._serialized_end=2812
692
- _INFERSTATISTICS._serialized_start=2815
693
- _INFERSTATISTICS._serialized_end=3227
694
- _INFERBATCHSTATISTICS._serialized_start=3230
695
- _INFERBATCHSTATISTICS._serialized_end=3432
696
- _MODELSTATISTICS._serialized_start=3435
697
- _MODELSTATISTICS._serialized_end=3664
698
- _MODELSTATISTICSRESPONSE._serialized_start=3666
699
- _MODELSTATISTICSRESPONSE._serialized_end=3740
700
- _MODELREPOSITORYPARAMETER._serialized_start=3743
701
- _MODELREPOSITORYPARAMETER._serialized_end=3881
702
- _REPOSITORYINDEXREQUEST._serialized_start=3883
703
- _REPOSITORYINDEXREQUEST._serialized_end=3947
704
- _REPOSITORYINDEXRESPONSE._serialized_start=3950
705
- _REPOSITORYINDEXRESPONSE._serialized_end=4114
706
- _REPOSITORYINDEXRESPONSE_MODELINDEX._serialized_start=4040
707
- _REPOSITORYINDEXRESPONSE_MODELINDEX._serialized_end=4114
708
- _REPOSITORYMODELLOADREQUEST._serialized_start=4117
709
- _REPOSITORYMODELLOADREQUEST._serialized_end=4353
710
- _REPOSITORYMODELLOADREQUEST_PARAMETERSENTRY._serialized_start=4267
711
- _REPOSITORYMODELLOADREQUEST_PARAMETERSENTRY._serialized_end=4353
712
- _REPOSITORYMODELLOADRESPONSE._serialized_start=4355
713
- _REPOSITORYMODELLOADRESPONSE._serialized_end=4384
714
- _REPOSITORYMODELUNLOADREQUEST._serialized_start=4387
715
- _REPOSITORYMODELUNLOADREQUEST._serialized_end=4627
716
- _REPOSITORYMODELUNLOADREQUEST_PARAMETERSENTRY._serialized_start=4267
717
- _REPOSITORYMODELUNLOADREQUEST_PARAMETERSENTRY._serialized_end=4353
718
- _REPOSITORYMODELUNLOADRESPONSE._serialized_start=4629
719
- _REPOSITORYMODELUNLOADRESPONSE._serialized_end=4660
720
- _SYSTEMSHAREDMEMORYSTATUSREQUEST._serialized_start=4662
721
- _SYSTEMSHAREDMEMORYSTATUSREQUEST._serialized_end=4709
722
- _SYSTEMSHAREDMEMORYSTATUSRESPONSE._serialized_start=4712
723
- _SYSTEMSHAREDMEMORYSTATUSRESPONSE._serialized_end=5005
724
- _SYSTEMSHAREDMEMORYSTATUSRESPONSE_REGIONSTATUS._serialized_start=4823
725
- _SYSTEMSHAREDMEMORYSTATUSRESPONSE_REGIONSTATUS._serialized_end=4899
726
- _SYSTEMSHAREDMEMORYSTATUSRESPONSE_REGIONSENTRY._serialized_start=4901
727
- _SYSTEMSHAREDMEMORYSTATUSRESPONSE_REGIONSENTRY._serialized_end=5005
728
- _SYSTEMSHAREDMEMORYREGISTERREQUEST._serialized_start=5007
729
- _SYSTEMSHAREDMEMORYREGISTERREQUEST._serialized_end=5104
730
- _SYSTEMSHAREDMEMORYREGISTERRESPONSE._serialized_start=5106
731
- _SYSTEMSHAREDMEMORYREGISTERRESPONSE._serialized_end=5142
732
- _SYSTEMSHAREDMEMORYUNREGISTERREQUEST._serialized_start=5144
733
- _SYSTEMSHAREDMEMORYUNREGISTERREQUEST._serialized_end=5195
734
- _SYSTEMSHAREDMEMORYUNREGISTERRESPONSE._serialized_start=5197
735
- _SYSTEMSHAREDMEMORYUNREGISTERRESPONSE._serialized_end=5235
736
- _CUDASHAREDMEMORYSTATUSREQUEST._serialized_start=5237
737
- _CUDASHAREDMEMORYSTATUSREQUEST._serialized_end=5282
738
- _CUDASHAREDMEMORYSTATUSRESPONSE._serialized_start=5285
739
- _CUDASHAREDMEMORYSTATUSRESPONSE._serialized_end=5562
740
- _CUDASHAREDMEMORYSTATUSRESPONSE_REGIONSTATUS._serialized_start=5392
741
- _CUDASHAREDMEMORYSTATUSRESPONSE_REGIONSTATUS._serialized_end=5458
742
- _CUDASHAREDMEMORYSTATUSRESPONSE_REGIONSENTRY._serialized_start=5460
743
- _CUDASHAREDMEMORYSTATUSRESPONSE_REGIONSENTRY._serialized_end=5562
744
- _CUDASHAREDMEMORYREGISTERREQUEST._serialized_start=5564
745
- _CUDASHAREDMEMORYREGISTERREQUEST._serialized_end=5669
746
- _CUDASHAREDMEMORYREGISTERRESPONSE._serialized_start=5671
747
- _CUDASHAREDMEMORYREGISTERRESPONSE._serialized_end=5705
748
- _CUDASHAREDMEMORYUNREGISTERREQUEST._serialized_start=5707
749
- _CUDASHAREDMEMORYUNREGISTERREQUEST._serialized_end=5756
750
- _CUDASHAREDMEMORYUNREGISTERRESPONSE._serialized_start=5758
751
- _CUDASHAREDMEMORYUNREGISTERRESPONSE._serialized_end=5794
752
- _TRACESETTINGREQUEST._serialized_start=5797
753
- _TRACESETTINGREQUEST._serialized_end=6027
754
- _TRACESETTINGREQUEST_SETTINGVALUE._serialized_start=5904
755
- _TRACESETTINGREQUEST_SETTINGVALUE._serialized_end=5933
756
- _TRACESETTINGREQUEST_SETTINGSENTRY._serialized_start=5935
757
- _TRACESETTINGREQUEST_SETTINGSENTRY._serialized_end=6027
758
- _TRACESETTINGRESPONSE._serialized_start=6030
759
- _TRACESETTINGRESPONSE._serialized_end=6243
760
- _TRACESETTINGRESPONSE_SETTINGVALUE._serialized_start=5904
761
- _TRACESETTINGRESPONSE_SETTINGVALUE._serialized_end=5933
762
- _TRACESETTINGRESPONSE_SETTINGSENTRY._serialized_start=6150
763
- _TRACESETTINGRESPONSE_SETTINGSENTRY._serialized_end=6243
764
- _LOGSETTINGSREQUEST._serialized_start=6246
765
- _LOGSETTINGSREQUEST._serialized_end=6528
766
- _LOGSETTINGSREQUEST_SETTINGVALUE._serialized_start=6331
767
- _LOGSETTINGSREQUEST_SETTINGVALUE._serialized_end=6435
768
- _LOGSETTINGSREQUEST_SETTINGSENTRY._serialized_start=6437
769
- _LOGSETTINGSREQUEST_SETTINGSENTRY._serialized_end=6528
770
- _LOGSETTINGSRESPONSE._serialized_start=6531
771
- _LOGSETTINGSRESPONSE._serialized_end=6816
772
- _LOGSETTINGSRESPONSE_SETTINGVALUE._serialized_start=6331
773
- _LOGSETTINGSRESPONSE_SETTINGVALUE._serialized_end=6435
774
- _LOGSETTINGSRESPONSE_SETTINGSENTRY._serialized_start=6724
775
- _LOGSETTINGSRESPONSE_SETTINGSENTRY._serialized_end=6816
776
- _GRPCINFERENCESERVICE._serialized_start=6819
777
- _GRPCINFERENCESERVICE._serialized_end=8794
666
+ _INFERPARAMETER._serialized_start=689
667
+ _INFERPARAMETER._serialized_end=842
668
+ _INFERTENSORCONTENTS._serialized_start=845
669
+ _INFERTENSORCONTENTS._serialized_end=1053
670
+ _MODELINFERREQUEST._serialized_start=1056
671
+ _MODELINFERREQUEST._serialized_end=1934
672
+ _MODELINFERREQUEST_INFERINPUTTENSOR._serialized_start=1364
673
+ _MODELINFERREQUEST_INFERINPUTTENSOR._serialized_end=1640
674
+ _MODELINFERREQUEST_INFERINPUTTENSOR_PARAMETERSENTRY._serialized_start=1564
675
+ _MODELINFERREQUEST_INFERINPUTTENSOR_PARAMETERSENTRY._serialized_end=1640
676
+ _MODELINFERREQUEST_INFERREQUESTEDOUTPUTTENSOR._serialized_start=1643
677
+ _MODELINFERREQUEST_INFERREQUESTEDOUTPUTTENSOR._serialized_end=1856
678
+ _MODELINFERREQUEST_INFERREQUESTEDOUTPUTTENSOR_PARAMETERSENTRY._serialized_start=1564
679
+ _MODELINFERREQUEST_INFERREQUESTEDOUTPUTTENSOR_PARAMETERSENTRY._serialized_end=1640
680
+ _MODELINFERREQUEST_PARAMETERSENTRY._serialized_start=1564
681
+ _MODELINFERREQUEST_PARAMETERSENTRY._serialized_end=1640
682
+ _MODELINFERRESPONSE._serialized_start=1937
683
+ _MODELINFERRESPONSE._serialized_end=2534
684
+ _MODELINFERRESPONSE_INFEROUTPUTTENSOR._serialized_start=2177
685
+ _MODELINFERRESPONSE_INFEROUTPUTTENSOR._serialized_end=2456
686
+ _MODELINFERRESPONSE_INFEROUTPUTTENSOR_PARAMETERSENTRY._serialized_start=1564
687
+ _MODELINFERRESPONSE_INFEROUTPUTTENSOR_PARAMETERSENTRY._serialized_end=1640
688
+ _MODELINFERRESPONSE_PARAMETERSENTRY._serialized_start=1564
689
+ _MODELINFERRESPONSE_PARAMETERSENTRY._serialized_end=1640
690
+ _MODELSTREAMINFERRESPONSE._serialized_start=2536
691
+ _MODELSTREAMINFERRESPONSE._serialized_end=2640
692
+ _MODELCONFIGREQUEST._serialized_start=2642
693
+ _MODELCONFIGREQUEST._serialized_end=2693
694
+ _MODELCONFIGRESPONSE._serialized_start=2695
695
+ _MODELCONFIGRESPONSE._serialized_end=2756
696
+ _MODELSTATISTICSREQUEST._serialized_start=2758
697
+ _MODELSTATISTICSREQUEST._serialized_end=2813
698
+ _STATISTICDURATION._serialized_start=2815
699
+ _STATISTICDURATION._serialized_end=2861
700
+ _INFERSTATISTICS._serialized_start=2864
701
+ _INFERSTATISTICS._serialized_end=3276
702
+ _INFERBATCHSTATISTICS._serialized_start=3279
703
+ _INFERBATCHSTATISTICS._serialized_end=3481
704
+ _MEMORYUSAGE._serialized_start=3483
705
+ _MEMORYUSAGE._serialized_end=3541
706
+ _MODELSTATISTICS._serialized_start=3544
707
+ _MODELSTATISTICS._serialized_end=3819
708
+ _MODELSTATISTICSRESPONSE._serialized_start=3821
709
+ _MODELSTATISTICSRESPONSE._serialized_end=3895
710
+ _MODELREPOSITORYPARAMETER._serialized_start=3898
711
+ _MODELREPOSITORYPARAMETER._serialized_end=4036
712
+ _REPOSITORYINDEXREQUEST._serialized_start=4038
713
+ _REPOSITORYINDEXREQUEST._serialized_end=4102
714
+ _REPOSITORYINDEXRESPONSE._serialized_start=4105
715
+ _REPOSITORYINDEXRESPONSE._serialized_end=4269
716
+ _REPOSITORYINDEXRESPONSE_MODELINDEX._serialized_start=4195
717
+ _REPOSITORYINDEXRESPONSE_MODELINDEX._serialized_end=4269
718
+ _REPOSITORYMODELLOADREQUEST._serialized_start=4272
719
+ _REPOSITORYMODELLOADREQUEST._serialized_end=4508
720
+ _REPOSITORYMODELLOADREQUEST_PARAMETERSENTRY._serialized_start=4422
721
+ _REPOSITORYMODELLOADREQUEST_PARAMETERSENTRY._serialized_end=4508
722
+ _REPOSITORYMODELLOADRESPONSE._serialized_start=4510
723
+ _REPOSITORYMODELLOADRESPONSE._serialized_end=4539
724
+ _REPOSITORYMODELUNLOADREQUEST._serialized_start=4542
725
+ _REPOSITORYMODELUNLOADREQUEST._serialized_end=4782
726
+ _REPOSITORYMODELUNLOADREQUEST_PARAMETERSENTRY._serialized_start=4422
727
+ _REPOSITORYMODELUNLOADREQUEST_PARAMETERSENTRY._serialized_end=4508
728
+ _REPOSITORYMODELUNLOADRESPONSE._serialized_start=4784
729
+ _REPOSITORYMODELUNLOADRESPONSE._serialized_end=4815
730
+ _SYSTEMSHAREDMEMORYSTATUSREQUEST._serialized_start=4817
731
+ _SYSTEMSHAREDMEMORYSTATUSREQUEST._serialized_end=4864
732
+ _SYSTEMSHAREDMEMORYSTATUSRESPONSE._serialized_start=4867
733
+ _SYSTEMSHAREDMEMORYSTATUSRESPONSE._serialized_end=5160
734
+ _SYSTEMSHAREDMEMORYSTATUSRESPONSE_REGIONSTATUS._serialized_start=4978
735
+ _SYSTEMSHAREDMEMORYSTATUSRESPONSE_REGIONSTATUS._serialized_end=5054
736
+ _SYSTEMSHAREDMEMORYSTATUSRESPONSE_REGIONSENTRY._serialized_start=5056
737
+ _SYSTEMSHAREDMEMORYSTATUSRESPONSE_REGIONSENTRY._serialized_end=5160
738
+ _SYSTEMSHAREDMEMORYREGISTERREQUEST._serialized_start=5162
739
+ _SYSTEMSHAREDMEMORYREGISTERREQUEST._serialized_end=5259
740
+ _SYSTEMSHAREDMEMORYREGISTERRESPONSE._serialized_start=5261
741
+ _SYSTEMSHAREDMEMORYREGISTERRESPONSE._serialized_end=5297
742
+ _SYSTEMSHAREDMEMORYUNREGISTERREQUEST._serialized_start=5299
743
+ _SYSTEMSHAREDMEMORYUNREGISTERREQUEST._serialized_end=5350
744
+ _SYSTEMSHAREDMEMORYUNREGISTERRESPONSE._serialized_start=5352
745
+ _SYSTEMSHAREDMEMORYUNREGISTERRESPONSE._serialized_end=5390
746
+ _CUDASHAREDMEMORYSTATUSREQUEST._serialized_start=5392
747
+ _CUDASHAREDMEMORYSTATUSREQUEST._serialized_end=5437
748
+ _CUDASHAREDMEMORYSTATUSRESPONSE._serialized_start=5440
749
+ _CUDASHAREDMEMORYSTATUSRESPONSE._serialized_end=5717
750
+ _CUDASHAREDMEMORYSTATUSRESPONSE_REGIONSTATUS._serialized_start=5547
751
+ _CUDASHAREDMEMORYSTATUSRESPONSE_REGIONSTATUS._serialized_end=5613
752
+ _CUDASHAREDMEMORYSTATUSRESPONSE_REGIONSENTRY._serialized_start=5615
753
+ _CUDASHAREDMEMORYSTATUSRESPONSE_REGIONSENTRY._serialized_end=5717
754
+ _CUDASHAREDMEMORYREGISTERREQUEST._serialized_start=5719
755
+ _CUDASHAREDMEMORYREGISTERREQUEST._serialized_end=5824
756
+ _CUDASHAREDMEMORYREGISTERRESPONSE._serialized_start=5826
757
+ _CUDASHAREDMEMORYREGISTERRESPONSE._serialized_end=5860
758
+ _CUDASHAREDMEMORYUNREGISTERREQUEST._serialized_start=5862
759
+ _CUDASHAREDMEMORYUNREGISTERREQUEST._serialized_end=5911
760
+ _CUDASHAREDMEMORYUNREGISTERRESPONSE._serialized_start=5913
761
+ _CUDASHAREDMEMORYUNREGISTERRESPONSE._serialized_end=5949
762
+ _TRACESETTINGREQUEST._serialized_start=5952
763
+ _TRACESETTINGREQUEST._serialized_end=6182
764
+ _TRACESETTINGREQUEST_SETTINGVALUE._serialized_start=6059
765
+ _TRACESETTINGREQUEST_SETTINGVALUE._serialized_end=6088
766
+ _TRACESETTINGREQUEST_SETTINGSENTRY._serialized_start=6090
767
+ _TRACESETTINGREQUEST_SETTINGSENTRY._serialized_end=6182
768
+ _TRACESETTINGRESPONSE._serialized_start=6185
769
+ _TRACESETTINGRESPONSE._serialized_end=6398
770
+ _TRACESETTINGRESPONSE_SETTINGVALUE._serialized_start=6059
771
+ _TRACESETTINGRESPONSE_SETTINGVALUE._serialized_end=6088
772
+ _TRACESETTINGRESPONSE_SETTINGSENTRY._serialized_start=6305
773
+ _TRACESETTINGRESPONSE_SETTINGSENTRY._serialized_end=6398
774
+ _LOGSETTINGSREQUEST._serialized_start=6401
775
+ _LOGSETTINGSREQUEST._serialized_end=6683
776
+ _LOGSETTINGSREQUEST_SETTINGVALUE._serialized_start=6486
777
+ _LOGSETTINGSREQUEST_SETTINGVALUE._serialized_end=6590
778
+ _LOGSETTINGSREQUEST_SETTINGSENTRY._serialized_start=6592
779
+ _LOGSETTINGSREQUEST_SETTINGSENTRY._serialized_end=6683
780
+ _LOGSETTINGSRESPONSE._serialized_start=6686
781
+ _LOGSETTINGSRESPONSE._serialized_end=6971
782
+ _LOGSETTINGSRESPONSE_SETTINGVALUE._serialized_start=6486
783
+ _LOGSETTINGSRESPONSE_SETTINGVALUE._serialized_end=6590
784
+ _LOGSETTINGSRESPONSE_SETTINGSENTRY._serialized_start=6879
785
+ _LOGSETTINGSRESPONSE_SETTINGSENTRY._serialized_end=6971
786
+ _GRPCINFERENCESERVICE._serialized_start=6974
787
+ _GRPCINFERENCESERVICE._serialized_end=8949
778
788
  # @@protoc_insertion_point(module_scope)
@@ -26,6 +26,7 @@
26
26
 
27
27
  import numpy as np
28
28
  import struct
29
+ from ._shared_memory_tensor import SharedMemoryTensor
29
30
 
30
31
 
31
32
  def raise_error(msg):
@@ -0,0 +1,266 @@
1
+ # Copyright 2023, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ #
3
+ # Redistribution and use in source and binary forms, with or without
4
+ # modification, are permitted provided that the following conditions
5
+ # are met:
6
+ # * Redistributions of source code must retain the above copyright
7
+ # notice, this list of conditions and the following disclaimer.
8
+ # * Redistributions in binary form must reproduce the above copyright
9
+ # notice, this list of conditions and the following disclaimer in the
10
+ # documentation and/or other materials provided with the distribution.
11
+ # * Neither the name of NVIDIA CORPORATION nor the names of its
12
+ # contributors may be used to endorse or promote products derived
13
+ # from this software without specific prior written permission.
14
+ #
15
+ # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS ``AS IS'' AND ANY
16
+ # EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
17
+ # IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
18
+ # PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
19
+ # CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
20
+ # EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
21
+ # PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
22
+ # PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
23
+ # OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
24
+ # (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
25
+ # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
26
+
27
+ ################################################################################
28
+ # This file contains the DLPack API wrapped in Python style (see
29
+ # 'dlpack.h' for detail) and the utilities for Triton client to interact
30
+ # with DLPack
31
+ #
32
+ # Ref:
33
+ # https://github.com/dmlc/dlpack/blob/main/include/dlpack/dlpack.h
34
+ # https://github.com/dmlc/dlpack/blob/main/apps/numpy_dlpack/dlpack/from_numpy.py
35
+ ################################################################################
36
+
37
+ import ctypes
38
+
39
+ # Need to explicit set the res / arg types for pythonapi functions to
40
+ # work properly
41
+ ctypes.pythonapi.PyMem_RawMalloc.restype = ctypes.c_void_p
42
+ ctypes.pythonapi.PyMem_RawFree.argtypes = [ctypes.c_void_p]
43
+
44
+ ctypes.pythonapi.PyCapsule_New.restype = ctypes.py_object
45
+ ctypes.pythonapi.PyCapsule_New.argtypes = [
46
+ ctypes.c_void_p, ctypes.c_char_p, ctypes.c_void_p
47
+ ]
48
+
49
+ ctypes.pythonapi.PyCapsule_GetPointer.restype = ctypes.c_void_p
50
+ ctypes.pythonapi.PyCapsule_GetPointer.argtypes = [
51
+ ctypes.py_object, ctypes.c_char_p
52
+ ]
53
+
54
+ c_str_dltensor = b"dltensor"
55
+
56
+
57
+ class DLDeviceType(ctypes.c_int):
58
+ kDLCPU = 1
59
+ kDLCUDA = 2
60
+ kDLCUDAHost = 3
61
+ kDLOpenCL = 4
62
+ kDLVulkan = 7
63
+ kDLMetal = 8
64
+ kDLVPI = 9
65
+ kDLROCM = 10
66
+ kDLROCMHost = 11
67
+ kDLExtDev = 12
68
+ kDLCUDAManaged = 13
69
+ kDLOneAPI = 14
70
+ kDLWebGPU = 15
71
+ kDLHexagon = 16
72
+
73
+
74
+ class DLDevice(ctypes.Structure):
75
+ _fields_ = [
76
+ ("device_type", DLDeviceType),
77
+ ("device_id", ctypes.c_int),
78
+ ]
79
+
80
+
81
+ class DLDataTypeCode(ctypes.c_uint8):
82
+ kDLInt = 0
83
+ kDLUInt = 1
84
+ kDLFloat = 2
85
+ kDLOpaquePointer = 3
86
+ kDLBfloat = 4
87
+ kDLComplex = 5
88
+ kDLBool = 6
89
+
90
+
91
+ class DLDataType(ctypes.Structure):
92
+ _fields_ = [
93
+ ("type_code", DLDataTypeCode),
94
+ ("bits", ctypes.c_uint8),
95
+ ("lanes", ctypes.c_uint16),
96
+ ]
97
+
98
+
99
+ class DLTensor(ctypes.Structure):
100
+ _fields_ = [
101
+ ("data", ctypes.c_void_p),
102
+ ("device", DLDevice),
103
+ ("ndim", ctypes.c_int),
104
+ ("dtype", DLDataType),
105
+ ("shape", ctypes.POINTER(ctypes.c_int64)),
106
+ ("strides", ctypes.POINTER(ctypes.c_int64)),
107
+ ("byte_offset", ctypes.c_uint64),
108
+ ]
109
+
110
+
111
+ class DLManagedTensor(ctypes.Structure):
112
+ _fields_ = [
113
+ ("dl_tensor", DLTensor),
114
+ ("manager_ctx", ctypes.c_void_p),
115
+ ("deleter", ctypes.CFUNCTYPE(None, ctypes.c_void_p)),
116
+ ]
117
+
118
+
119
+ # Utilities
120
+
121
+
122
+ def _raise_error(msg):
123
+ """
124
+ Raise error with the provided message
125
+ """
126
+ raise Exception(msg=msg) from None
127
+
128
+
129
+ # Use as managed context in DLPack that doesn't hold ownership of the
130
+ # data content.
131
+ class DataViewContext:
132
+
133
+ def __init__(self, shape) -> None:
134
+ # Convert the Python object to ctypes objects expected by
135
+ # DLPack
136
+ self._shape = (ctypes.c_int64 * len(shape))(*shape)
137
+ # No strides: compact and row-major
138
+ self._strides = ctypes.POINTER(ctypes.c_int64)()
139
+
140
+ def as_manager_ctx(self) -> ctypes.c_void_p:
141
+ py_obj = ctypes.py_object(self)
142
+ py_obj_ptr = ctypes.pointer(py_obj)
143
+ ctypes.pythonapi.Py_IncRef(py_obj)
144
+ ctypes.pythonapi.Py_IncRef(ctypes.py_object(py_obj_ptr))
145
+ return ctypes.cast(py_obj_ptr, ctypes.c_void_p)
146
+
147
+
148
+ @ctypes.CFUNCTYPE(None, ctypes.c_void_p)
149
+ def managed_tensor_deleter(handle: ctypes.c_void_p) -> None:
150
+ dl_managed_tensor = DLManagedTensor.from_address(handle)
151
+ py_obj_ptr = ctypes.cast(dl_managed_tensor.manager_ctx,
152
+ ctypes.POINTER(ctypes.py_object))
153
+ py_obj = py_obj_ptr.contents
154
+ ctypes.pythonapi.Py_DecRef(py_obj)
155
+ ctypes.pythonapi.Py_DecRef(ctypes.py_object(py_obj_ptr))
156
+ ctypes.pythonapi.PyMem_RawFree(handle)
157
+
158
+
159
+ @ctypes.CFUNCTYPE(None, ctypes.c_void_p)
160
+ def pycapsule_deleter(handle: ctypes.c_void_p) -> None:
161
+ pycapsule: ctypes.py_object = ctypes.cast(handle, ctypes.py_object)
162
+ if ctypes.pythonapi.PyCapsule_IsValid(pycapsule, c_str_dltensor):
163
+ dl_managed_tensor = ctypes.pythonapi.PyCapsule_GetPointer(
164
+ pycapsule, c_str_dltensor)
165
+ managed_tensor_deleter(dl_managed_tensor)
166
+ ctypes.pythonapi.PyCapsule_SetDestructor(pycapsule, None)
167
+
168
+
169
+ def triton_to_dlpack_dtype(dtype):
170
+ if dtype == "BOOL":
171
+ type_code = DLDataTypeCode.kDLBool
172
+ bits = 1
173
+ elif dtype == "INT8":
174
+ type_code = DLDataTypeCode.kDLInt
175
+ bits = 8
176
+ elif dtype == "INT16":
177
+ type_code = DLDataTypeCode.kDLInt
178
+ bits = 16
179
+ elif dtype == "INT32":
180
+ type_code = DLDataTypeCode.kDLInt
181
+ bits = 32
182
+ elif dtype == "INT64":
183
+ type_code = DLDataTypeCode.kDLInt
184
+ bits = 64
185
+ elif dtype == "UINT8":
186
+ type_code = DLDataTypeCode.kDLUInt
187
+ bits = 8
188
+ elif dtype == "UINT16":
189
+ type_code = DLDataTypeCode.kDLUInt
190
+ bits = 16
191
+ elif dtype == "UINT32":
192
+ type_code = DLDataTypeCode.kDLUInt
193
+ bits = 32
194
+ elif dtype == "UINT64":
195
+ type_code = DLDataTypeCode.kDLUInt
196
+ bits = 64
197
+ elif dtype == "FP16":
198
+ type_code = DLDataTypeCode.kDLFloat
199
+ bits = 16
200
+ elif dtype == "FP32":
201
+ type_code = DLDataTypeCode.kDLFloat
202
+ bits = 32
203
+ elif dtype == "FP64":
204
+ type_code = DLDataTypeCode.kDLFloat
205
+ bits = 64
206
+ elif dtype == "BF16":
207
+ type_code = DLDataTypeCode.kDLBfloat
208
+ bits = 16
209
+ elif dtype == "BYTES":
210
+ _raise_error("DLPack currently doesn't suppose BYTES type")
211
+ else:
212
+ _raise_error(
213
+ "Can not covert unknown data type '{}' to DLPack data type".format(
214
+ dtype))
215
+ return DLDataType(type_code, bits, 1)
216
+
217
+
218
+ def is_device_supported(device: DLDevice):
219
+ return device[0] in [
220
+ DLDeviceType.kDLCPU, DLDeviceType.kDLCUDA, DLDeviceType.kDLCUDAHost
221
+ ]
222
+
223
+
224
+ def is_contiguous_data(ndim: ctypes.c_int,
225
+ shape: ctypes.POINTER(ctypes.c_int64),
226
+ stride: ctypes.POINTER(ctypes.c_int64)):
227
+ # If 'stride' doesn't capture valid value
228
+ if (stride is None) or (not bool(stride)):
229
+ return True
230
+ calculated_stride = 1
231
+ # iterate stride in reverse order [ndim-1, -1)
232
+ for i in reversed(range(ndim)):
233
+ if stride[i] != calculated_stride:
234
+ return False
235
+ calculated_stride *= shape[i]
236
+ return True
237
+
238
+
239
+ def get_byte_size(dtype: DLDataType, ndim: ctypes.c_int,
240
+ shape: ctypes.POINTER(ctypes.c_int64)):
241
+ element_byte_size = dtype.bits * dtype.lanes // 8 # Assume 8 bits in a byte
242
+ for i in range(ndim):
243
+ element_byte_size *= shape[i]
244
+ return element_byte_size
245
+
246
+
247
+ def get_dlpack_capsule(dlpack_obj, stream=None):
248
+ # Extract PyCapsule of the DLPack object
249
+ if hasattr(dlpack_obj, '__dlpack__'):
250
+ if not hasattr(dlpack_obj, '__dlpack_device__'):
251
+ _raise_error(
252
+ "DLPack expects '__dlpack_device__' if '__dlpack__' has been defined"
253
+ )
254
+ device = dlpack_obj.__dlpack_device__()
255
+ if not is_device_supported(device):
256
+ _raise_error("DLPack device type {} is not supported".format(
257
+ device[0]))
258
+ # Have to condition on the device type as, using numpy as example,
259
+ # some DLPack implementation doesn't accept 'stream' as arguments
260
+ if device != DLDeviceType.kDLCUDA:
261
+ return dlpack_obj.__dlpack__()
262
+ else:
263
+ return dlpack_obj.__dlpack__(stream)
264
+ else:
265
+ # Old interface where PyCapsule object is passed directly
266
+ return dlpack_obj
@@ -0,0 +1,79 @@
1
+ # Copyright 2023, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ #
3
+ # Redistribution and use in source and binary forms, with or without
4
+ # modification, are permitted provided that the following conditions
5
+ # are met:
6
+ # * Redistributions of source code must retain the above copyright
7
+ # notice, this list of conditions and the following disclaimer.
8
+ # * Redistributions in binary form must reproduce the above copyright
9
+ # notice, this list of conditions and the following disclaimer in the
10
+ # documentation and/or other materials provided with the distribution.
11
+ # * Neither the name of NVIDIA CORPORATION nor the names of its
12
+ # contributors may be used to endorse or promote products derived
13
+ # from this software without specific prior written permission.
14
+ #
15
+ # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS ``AS IS'' AND ANY
16
+ # EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
17
+ # IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
18
+ # PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
19
+ # CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
20
+ # EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
21
+ # PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
22
+ # PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
23
+ # OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
24
+ # (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
25
+ # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
26
+
27
+ import ctypes
28
+ from . import _dlpack
29
+ import collections
30
+
31
+
32
+ class SharedMemoryTensor:
33
+ """An object of SharedMemoryTensor class is a view of the shared memory
34
+ region that follows DLPack specification. This object should be considered
35
+ invalidated if there is modification on the corresponding shared memory
36
+ region.
37
+
38
+ https://dmlc.github.io/dlpack/latest/python_spec.html
39
+
40
+ """
41
+
42
+ def __init__(self, dtype: str, shape: collections.abc.Iterable,
43
+ shm_addr: ctypes.c_void_p, offset: ctypes.c_uint64,
44
+ byte_size: ctypes.c_uint64, device_id: ctypes.c_int) -> None:
45
+ self._dtype = dtype
46
+ self._shape = shape
47
+ self._shm_addr = shm_addr
48
+ self._offset = offset
49
+ self._byte_size = byte_size
50
+ self._device_id = device_id
51
+ if device_id.value != -1:
52
+ self._dl_device = (_dlpack.DLDeviceType.kDLCUDA, device_id.value)
53
+ else:
54
+ self._dl_device = (_dlpack.DLDeviceType.kDLCPU, 0)
55
+
56
+ def __dlpack__(self, stream=None):
57
+ context = _dlpack.DataViewContext(self._shape)
58
+ size = ctypes.c_size_t(ctypes.sizeof(_dlpack.DLManagedTensor))
59
+ dl_managed_tensor = _dlpack.DLManagedTensor.from_address(
60
+ ctypes.pythonapi.PyMem_RawMalloc(size))
61
+ dl_managed_tensor.dl_tensor.data = self._shm_addr
62
+ dl_managed_tensor.dl_tensor.device = self._dl_device
63
+ dl_managed_tensor.dl_tensor.dtype = _dlpack.triton_to_dlpack_dtype(
64
+ self._dtype)
65
+ dl_managed_tensor.dl_tensor.ndim = len(self._shape)
66
+ dl_managed_tensor.dl_tensor.shape = context._shape
67
+ dl_managed_tensor.dl_tensor.strides = context._strides
68
+ dl_managed_tensor.dl_tensor.byte_offset = self._offset
69
+ dl_managed_tensor.manager_ctx = context.as_manager_ctx()
70
+ dl_managed_tensor.deleter = _dlpack.managed_tensor_deleter
71
+ pycapsule = ctypes.pythonapi.PyCapsule_New(
72
+ ctypes.byref(dl_managed_tensor),
73
+ _dlpack.c_str_dltensor,
74
+ _dlpack.pycapsule_deleter,
75
+ )
76
+ return pycapsule
77
+
78
+ def __dlpack_device__(self):
79
+ return self._dl_device
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: tritonclient
3
- Version: 2.34.0
3
+ Version: 2.36.0
4
4
  Summary: Python client library and utilities for communicating with Triton Inference Server
5
5
  Home-page: https://developer.nvidia.com/nvidia-triton-inference-server
6
6
  Author: NVIDIA Inc.
@@ -0,0 +1,42 @@
1
+ tritonclient-2.36.0.data/data/LICENSE.txt,sha256=NMqy92YzgvtkIas9IW34i27ARqi_sCunXDu-t-EqxL8,1533
2
+ tritonclient-2.36.0.data/purelib/tritonclient/__init__.py,sha256=erynU-5HRlcIz1tx1Ve0kdCnzAXfNFeUYB5bx2fnL4Y,1542
3
+ tritonclient-2.36.0.data/purelib/tritonclient/_auth.py,sha256=sXf16LlDoQj1qI3GSnFa1mgOv0zhwFmB0OHofkIwVh0,2047
4
+ tritonclient-2.36.0.data/purelib/tritonclient/_client.py,sha256=8-VaArNooS9zKRY0aYTW9xvphmNa5vgWy7PDbBnGVw4,2964
5
+ tritonclient-2.36.0.data/purelib/tritonclient/_plugin.py,sha256=hAaX9FakQBsbh5DZVAlcDujVwrV4EddcmPxMp3puxX0,2069
6
+ tritonclient-2.36.0.data/purelib/tritonclient/_request.py,sha256=RmGnJpiRxTi33mn8Nl7ivGFqeKjicj_HhShtgOTci8I,1789
7
+ tritonclient-2.36.0.data/purelib/tritonclient/grpc/__init__.py,sha256=MDsTzhwtE6603Ixkf6g_N3_5OCqhoDdCZT0KuZFtAmI,2959
8
+ tritonclient-2.36.0.data/purelib/tritonclient/grpc/_client.py,sha256=tGQzAF8ld7JKKgIHYmLvSItGQNHz7CuoTLcW_YyMbuk,69184
9
+ tritonclient-2.36.0.data/purelib/tritonclient/grpc/_infer_input.py,sha256=5cfHBc7lVxWq36HGG12xgnQlx_-3OG8L0fQ18AK3zjA,7213
10
+ tritonclient-2.36.0.data/purelib/tritonclient/grpc/_infer_result.py,sha256=gWA8LO7SiA7BsJnC8TGVh0kfE3hEmRrXNpXRSqMmOwY,6193
11
+ tritonclient-2.36.0.data/purelib/tritonclient/grpc/_infer_stream.py,sha256=AYGC7pD2jXkFQr0wq1moUE1MDgICMMTHVbCFvlujvl8,6618
12
+ tritonclient-2.36.0.data/purelib/tritonclient/grpc/_requested_output.py,sha256=SUHrwwH0RA2Uge6imndW5hNdzhcZtNhrV_0DRwFep8U,4409
13
+ tritonclient-2.36.0.data/purelib/tritonclient/grpc/_utils.py,sha256=aMF8Vi6TtZve7BJ8QlZ6FjQr1MLkPs0PIg7iV5DVxXo,4954
14
+ tritonclient-2.36.0.data/purelib/tritonclient/grpc/model_config_pb2.py,sha256=KL3whNLO69fTXi4RBrdMDQ1OPsOrPPpjYx1xZCsnA78,46321
15
+ tritonclient-2.36.0.data/purelib/tritonclient/grpc/service_pb2.py,sha256=4DTipBPPoTBFW8FwKCD1BMYYHSxhKizuyYW0vYhg1bg,55250
16
+ tritonclient-2.36.0.data/purelib/tritonclient/grpc/service_pb2_grpc.py,sha256=BRXBBgehQgx_LSLqiw_N0zqFl4NYDhstm6AJHP3uxBw,37795
17
+ tritonclient-2.36.0.data/purelib/tritonclient/grpc/aio/__init__.py,sha256=b4AFQnhd_ujj9eGAEGhpqKlfjDtx9AMLJgrdn77OSEI,33059
18
+ tritonclient-2.36.0.data/purelib/tritonclient/grpc/aio/auth/__init__.py,sha256=nOIwuyXvzV1Dha2ZFX5vRjFhgsDa-cBdP2wSWNA6g1w,1573
19
+ tritonclient-2.36.0.data/purelib/tritonclient/grpc/auth/__init__.py,sha256=1JifMIv8ipug7qUP4joArCyRsEXjxV-DIhvrJ2Kj5Rk,1574
20
+ tritonclient-2.36.0.data/purelib/tritonclient/http/__init__.py,sha256=tbJXG_x_NV7x9LbR2h7DAImiwM3a2uA7HBMKfDhpX1A,2128
21
+ tritonclient-2.36.0.data/purelib/tritonclient/http/_client.py,sha256=R8QDM_hFJACsvly0QheM7_ZRLkUrOEp6RMhPOLVUO1g,61716
22
+ tritonclient-2.36.0.data/purelib/tritonclient/http/_infer_input.py,sha256=eEYQEiK8AzAAW5zJq_c_thbxdHq0mAAjdWgeZYv5EoY,9506
23
+ tritonclient-2.36.0.data/purelib/tritonclient/http/_infer_result.py,sha256=vQIcWxxThgvFSnChZwZebKIJW-pSawXG1nVi6ncCYYE,9920
24
+ tritonclient-2.36.0.data/purelib/tritonclient/http/_requested_output.py,sha256=QU-07jLHbKh1S7hCoqvqjPxrHWeb0CsJ8Qd3077AU1U,4695
25
+ tritonclient-2.36.0.data/purelib/tritonclient/http/_utils.py,sha256=rMw1Ojz3UFsbPjrvU4nKVLH65TPJbujMJXhw7klZynk,5118
26
+ tritonclient-2.36.0.data/purelib/tritonclient/http/aio/__init__.py,sha256=edd6GlMqiAb2kJG2jWlBs2P0B6cjAIYig4hEcFs4U68,30390
27
+ tritonclient-2.36.0.data/purelib/tritonclient/http/aio/auth/__init__.py,sha256=2hd0vpFKURRLz9MjB6sf1Tnfq3bzLdhgG_VJBFwj6vA,1575
28
+ tritonclient-2.36.0.data/purelib/tritonclient/http/auth/__init__.py,sha256=1JifMIv8ipug7qUP4joArCyRsEXjxV-DIhvrJ2Kj5Rk,1574
29
+ tritonclient-2.36.0.data/purelib/tritonclient/utils/__init__.py,sha256=JVWOJ5YCglG1gJWgfJGsWrCK4PgzFA_2kz3bag3nZ8E,10557
30
+ tritonclient-2.36.0.data/purelib/tritonclient/utils/_dlpack.py,sha256=eEUc-F0pBO6p8vBtN7KC5bB29DdkYH4wS9YtQPn1oKw,8963
31
+ tritonclient-2.36.0.data/purelib/tritonclient/utils/_shared_memory_tensor.py,sha256=Ei9P4xecCckED_lQ7xXL98NJNNuE_89gIW54B4Sh0MY,3688
32
+ tritonclient-2.36.0.data/purelib/tritonclientutils/__init__.py,sha256=D9hxs7FZaDd50ql_jLvaDFOwH8gCOp2LeFTaW1purzo,1821
33
+ tritonclient-2.36.0.data/purelib/tritongrpcclient/__init__.py,sha256=hRAS-HadBCUVAzEFi2ZNW0Cbtd2-x09mmG0bXu-Q3iI,1818
34
+ tritonclient-2.36.0.data/purelib/tritongrpcclient/grpc_service_pb2.py,sha256=L8UJUpxXzI0AA8YbGActcCUiaYQodaZBRLlOEDcbtEU,1842
35
+ tritonclient-2.36.0.data/purelib/tritongrpcclient/grpc_service_pb2_grpc.py,sha256=YN64p5Y7HZ7eMLnM596As4WAQ2FKh828Rda7jVXF9TM,1852
36
+ tritonclient-2.36.0.data/purelib/tritongrpcclient/model_config_pb2.py,sha256=Mk94wHJMdtG4Ptj0QSTVz7uRDsfX-l4zmN0dPeqiIZE,1852
37
+ tritonclient-2.36.0.data/purelib/tritonhttpclient/__init__.py,sha256=IHIoNJAlBvjTut2ySmh9c0Iw1DyJzc4a5IcYbrzLw3Q,1818
38
+ tritonclient-2.36.0.dist-info/LICENSE.txt,sha256=NMqy92YzgvtkIas9IW34i27ARqi_sCunXDu-t-EqxL8,1533
39
+ tritonclient-2.36.0.dist-info/METADATA,sha256=8H9_Zw6bxz11Sptyuqm93tyy5CApNy8m_Mg4VLivr9k,2716
40
+ tritonclient-2.36.0.dist-info/WHEEL,sha256=HVOIUsWA--OEoo_LBcXUZ_J2MMLFJ69mOq_A9H3ARGY,93
41
+ tritonclient-2.36.0.dist-info/top_level.txt,sha256=J2zLu0JxoFexDB102feHPD6J3JXAUEYUInFJZM9yEkM,65
42
+ tritonclient-2.36.0.dist-info/RECORD,,
@@ -1,40 +0,0 @@
1
- tritonclient-2.34.0.data/data/LICENSE.txt,sha256=NMqy92YzgvtkIas9IW34i27ARqi_sCunXDu-t-EqxL8,1533
2
- tritonclient-2.34.0.data/purelib/tritonclient/__init__.py,sha256=erynU-5HRlcIz1tx1Ve0kdCnzAXfNFeUYB5bx2fnL4Y,1542
3
- tritonclient-2.34.0.data/purelib/tritonclient/_auth.py,sha256=sXf16LlDoQj1qI3GSnFa1mgOv0zhwFmB0OHofkIwVh0,2047
4
- tritonclient-2.34.0.data/purelib/tritonclient/_client.py,sha256=8-VaArNooS9zKRY0aYTW9xvphmNa5vgWy7PDbBnGVw4,2964
5
- tritonclient-2.34.0.data/purelib/tritonclient/_plugin.py,sha256=hAaX9FakQBsbh5DZVAlcDujVwrV4EddcmPxMp3puxX0,2069
6
- tritonclient-2.34.0.data/purelib/tritonclient/_request.py,sha256=RmGnJpiRxTi33mn8Nl7ivGFqeKjicj_HhShtgOTci8I,1789
7
- tritonclient-2.34.0.data/purelib/tritonclient/grpc/__init__.py,sha256=MDsTzhwtE6603Ixkf6g_N3_5OCqhoDdCZT0KuZFtAmI,2959
8
- tritonclient-2.34.0.data/purelib/tritonclient/grpc/_client.py,sha256=HT1E8nMsi5TYjeRRuhLIwT3gD17_223M2nN8spSdzi4,67932
9
- tritonclient-2.34.0.data/purelib/tritonclient/grpc/_infer_input.py,sha256=5cfHBc7lVxWq36HGG12xgnQlx_-3OG8L0fQ18AK3zjA,7213
10
- tritonclient-2.34.0.data/purelib/tritonclient/grpc/_infer_result.py,sha256=gWA8LO7SiA7BsJnC8TGVh0kfE3hEmRrXNpXRSqMmOwY,6193
11
- tritonclient-2.34.0.data/purelib/tritonclient/grpc/_infer_stream.py,sha256=AYGC7pD2jXkFQr0wq1moUE1MDgICMMTHVbCFvlujvl8,6618
12
- tritonclient-2.34.0.data/purelib/tritonclient/grpc/_requested_output.py,sha256=SUHrwwH0RA2Uge6imndW5hNdzhcZtNhrV_0DRwFep8U,4409
13
- tritonclient-2.34.0.data/purelib/tritonclient/grpc/_utils.py,sha256=JdmHVv7efZg_Wiuf4tW6Q5hyqK_v9k_9aw7C4Mh3U38,4953
14
- tritonclient-2.34.0.data/purelib/tritonclient/grpc/model_config_pb2.py,sha256=UI9ApQ47f5WzOtQX0KnNnXzwCA-Ady0VHimxLlKYi4M,46315
15
- tritonclient-2.34.0.data/purelib/tritonclient/grpc/service_pb2.py,sha256=q3bQJtgKaCFJlWSZxkZjOmCU0BRNG3S5_1QaiV-oG58,54542
16
- tritonclient-2.34.0.data/purelib/tritonclient/grpc/service_pb2_grpc.py,sha256=BRXBBgehQgx_LSLqiw_N0zqFl4NYDhstm6AJHP3uxBw,37795
17
- tritonclient-2.34.0.data/purelib/tritonclient/grpc/aio/__init__.py,sha256=8gEdEltJSzd3GF_xSrLG1gh3aGuvX7aQzigi1WPbw1I,32979
18
- tritonclient-2.34.0.data/purelib/tritonclient/grpc/aio/auth/__init__.py,sha256=nOIwuyXvzV1Dha2ZFX5vRjFhgsDa-cBdP2wSWNA6g1w,1573
19
- tritonclient-2.34.0.data/purelib/tritonclient/grpc/auth/__init__.py,sha256=1JifMIv8ipug7qUP4joArCyRsEXjxV-DIhvrJ2Kj5Rk,1574
20
- tritonclient-2.34.0.data/purelib/tritonclient/http/__init__.py,sha256=tbJXG_x_NV7x9LbR2h7DAImiwM3a2uA7HBMKfDhpX1A,2128
21
- tritonclient-2.34.0.data/purelib/tritonclient/http/_client.py,sha256=R8QDM_hFJACsvly0QheM7_ZRLkUrOEp6RMhPOLVUO1g,61716
22
- tritonclient-2.34.0.data/purelib/tritonclient/http/_infer_input.py,sha256=eEYQEiK8AzAAW5zJq_c_thbxdHq0mAAjdWgeZYv5EoY,9506
23
- tritonclient-2.34.0.data/purelib/tritonclient/http/_infer_result.py,sha256=vQIcWxxThgvFSnChZwZebKIJW-pSawXG1nVi6ncCYYE,9920
24
- tritonclient-2.34.0.data/purelib/tritonclient/http/_requested_output.py,sha256=QU-07jLHbKh1S7hCoqvqjPxrHWeb0CsJ8Qd3077AU1U,4695
25
- tritonclient-2.34.0.data/purelib/tritonclient/http/_utils.py,sha256=rMw1Ojz3UFsbPjrvU4nKVLH65TPJbujMJXhw7klZynk,5118
26
- tritonclient-2.34.0.data/purelib/tritonclient/http/aio/__init__.py,sha256=edd6GlMqiAb2kJG2jWlBs2P0B6cjAIYig4hEcFs4U68,30390
27
- tritonclient-2.34.0.data/purelib/tritonclient/http/aio/auth/__init__.py,sha256=2hd0vpFKURRLz9MjB6sf1Tnfq3bzLdhgG_VJBFwj6vA,1575
28
- tritonclient-2.34.0.data/purelib/tritonclient/http/auth/__init__.py,sha256=1JifMIv8ipug7qUP4joArCyRsEXjxV-DIhvrJ2Kj5Rk,1574
29
- tritonclient-2.34.0.data/purelib/tritonclient/utils/__init__.py,sha256=0aKf-KpxgWFqMIXT-5msg_Y4LNCDMe33VyuTcuyRNM4,10503
30
- tritonclient-2.34.0.data/purelib/tritonclientutils/__init__.py,sha256=D9hxs7FZaDd50ql_jLvaDFOwH8gCOp2LeFTaW1purzo,1821
31
- tritonclient-2.34.0.data/purelib/tritongrpcclient/__init__.py,sha256=hRAS-HadBCUVAzEFi2ZNW0Cbtd2-x09mmG0bXu-Q3iI,1818
32
- tritonclient-2.34.0.data/purelib/tritongrpcclient/grpc_service_pb2.py,sha256=L8UJUpxXzI0AA8YbGActcCUiaYQodaZBRLlOEDcbtEU,1842
33
- tritonclient-2.34.0.data/purelib/tritongrpcclient/grpc_service_pb2_grpc.py,sha256=YN64p5Y7HZ7eMLnM596As4WAQ2FKh828Rda7jVXF9TM,1852
34
- tritonclient-2.34.0.data/purelib/tritongrpcclient/model_config_pb2.py,sha256=Mk94wHJMdtG4Ptj0QSTVz7uRDsfX-l4zmN0dPeqiIZE,1852
35
- tritonclient-2.34.0.data/purelib/tritonhttpclient/__init__.py,sha256=IHIoNJAlBvjTut2ySmh9c0Iw1DyJzc4a5IcYbrzLw3Q,1818
36
- tritonclient-2.34.0.dist-info/LICENSE.txt,sha256=NMqy92YzgvtkIas9IW34i27ARqi_sCunXDu-t-EqxL8,1533
37
- tritonclient-2.34.0.dist-info/METADATA,sha256=F7faWwgsiTKETF7NL6g7-V_CFRR4JXHye0X3Oy4XyEI,2716
38
- tritonclient-2.34.0.dist-info/WHEEL,sha256=HVOIUsWA--OEoo_LBcXUZ_J2MMLFJ69mOq_A9H3ARGY,93
39
- tritonclient-2.34.0.dist-info/top_level.txt,sha256=J2zLu0JxoFexDB102feHPD6J3JXAUEYUInFJZM9yEkM,65
40
- tritonclient-2.34.0.dist-info/RECORD,,