tritonclient 2.34.0__py3-none-any.whl → 2.36.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/_client.py +20 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/_utils.py +1 -1
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/aio/__init__.py +4 -1
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/model_config_pb2.py +1 -1
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/service_pb2.py +131 -121
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/utils/__init__.py +1 -0
- tritonclient-2.36.0.data/purelib/tritonclient/utils/_dlpack.py +266 -0
- tritonclient-2.36.0.data/purelib/tritonclient/utils/_shared_memory_tensor.py +79 -0
- {tritonclient-2.34.0.dist-info → tritonclient-2.36.0.dist-info}/METADATA +1 -1
- tritonclient-2.36.0.dist-info/RECORD +42 -0
- tritonclient-2.34.0.dist-info/RECORD +0 -40
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/data/LICENSE.txt +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/__init__.py +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/_auth.py +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/_client.py +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/_plugin.py +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/_request.py +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/__init__.py +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/_infer_input.py +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/_infer_result.py +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/_infer_stream.py +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/_requested_output.py +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/aio/auth/__init__.py +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/auth/__init__.py +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/service_pb2_grpc.py +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/http/__init__.py +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/http/_client.py +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/http/_infer_input.py +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/http/_infer_result.py +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/http/_requested_output.py +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/http/_utils.py +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/http/aio/__init__.py +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/http/aio/auth/__init__.py +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/http/auth/__init__.py +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclientutils/__init__.py +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritongrpcclient/__init__.py +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritongrpcclient/grpc_service_pb2.py +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritongrpcclient/grpc_service_pb2_grpc.py +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritongrpcclient/model_config_pb2.py +0 -0
- {tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonhttpclient/__init__.py +0 -0
- {tritonclient-2.34.0.dist-info → tritonclient-2.36.0.dist-info}/LICENSE.txt +0 -0
- {tritonclient-2.34.0.dist-info → tritonclient-2.36.0.dist-info}/WHEEL +0 -0
- {tritonclient-2.34.0.dist-info → tritonclient-2.36.0.dist-info}/top_level.txt +0 -0
{tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/_client.py
RENAMED
|
@@ -1532,6 +1532,7 @@ class InferenceServerClient(InferenceServerClientBase):
|
|
|
1532
1532
|
sequence_id=0,
|
|
1533
1533
|
sequence_start=False,
|
|
1534
1534
|
sequence_end=False,
|
|
1535
|
+
enable_empty_final_response=False,
|
|
1535
1536
|
priority=0,
|
|
1536
1537
|
timeout=None,
|
|
1537
1538
|
parameters=None):
|
|
@@ -1571,6 +1572,18 @@ class InferenceServerClient(InferenceServerClientBase):
|
|
|
1571
1572
|
Indicates whether the request being added marks the end of the
|
|
1572
1573
|
sequence. Default value is False. This argument is ignored if
|
|
1573
1574
|
'sequence_id' is 0 or "".
|
|
1575
|
+
enable_empty_final_response: bool
|
|
1576
|
+
Indicates whether "empty" responses should be generated and sent
|
|
1577
|
+
back to the client from the server during streaming inference when
|
|
1578
|
+
they contain the TRITONSERVER_RESPONSE_COMPLETE_FINAL flag.
|
|
1579
|
+
This strictly relates to the case of models/backends that send
|
|
1580
|
+
flags-only responses (use TRITONBACKEND_ResponseFactorySendFlags(TRITONSERVER_RESPONSE_COMPLETE_FINAL)
|
|
1581
|
+
or InferenceResponseSender.send(flags=TRITONSERVER_RESPONSE_COMPLETE_FINAL))
|
|
1582
|
+
Currently, this only occurs for decoupled models, and can be
|
|
1583
|
+
used to communicate to the client when a request has received
|
|
1584
|
+
its final response from the model. If the backend sends the final
|
|
1585
|
+
flag along with a non-empty response, this arg is not needed.
|
|
1586
|
+
Default value is False.
|
|
1574
1587
|
priority : int
|
|
1575
1588
|
Indicates the priority of the request. Priority value zero
|
|
1576
1589
|
indicates that the default priority level should be used
|
|
@@ -1616,6 +1629,13 @@ class InferenceServerClient(InferenceServerClientBase):
|
|
|
1616
1629
|
priority=priority,
|
|
1617
1630
|
timeout=timeout,
|
|
1618
1631
|
parameters=parameters)
|
|
1632
|
+
|
|
1633
|
+
# Unique to streaming inference as it only pertains to decoupled models
|
|
1634
|
+
# Only attach the parameter if True, no need to send/parse when False.
|
|
1635
|
+
if enable_empty_final_response:
|
|
1636
|
+
request.parameters[
|
|
1637
|
+
'triton_enable_empty_final_response'].bool_param = True
|
|
1638
|
+
|
|
1619
1639
|
if self._verbose:
|
|
1620
1640
|
print("async_stream_infer\n{}".format(request))
|
|
1621
1641
|
# Enqueues the request to the stream
|
{tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/_utils.py
RENAMED
|
@@ -85,7 +85,7 @@ def _get_inference_request(model_name, inputs, model_version, request_id,
|
|
|
85
85
|
request.parameters['sequence_start'].bool_param = sequence_start
|
|
86
86
|
request.parameters['sequence_end'].bool_param = sequence_end
|
|
87
87
|
if priority != 0:
|
|
88
|
-
request.parameters['priority'].int64_param = priority
|
|
88
|
+
request.parameters['priority'].uint64_param = priority
|
|
89
89
|
if timeout is not None:
|
|
90
90
|
request.parameters['timeout'].int64_param = timeout
|
|
91
91
|
|
{tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/aio/__init__.py
RENAMED
|
@@ -24,9 +24,12 @@
|
|
|
24
24
|
# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
|
25
25
|
# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
26
26
|
|
|
27
|
+
import base64
|
|
28
|
+
|
|
29
|
+
import rapidjson as json
|
|
30
|
+
from google.protobuf.json_format import MessageToJson
|
|
27
31
|
from tritonclient.grpc import *
|
|
28
32
|
from .._utils import _get_inference_request, _grpc_compression_type
|
|
29
|
-
import base64
|
|
30
33
|
from ..._client import InferenceServerClientBase
|
|
31
34
|
from ..._request import Request
|
|
32
35
|
from ..._plugin import InferenceServerClientPlugin
|
{tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/model_config_pb2.py
RENAMED
|
@@ -15,7 +15,7 @@ _sym_db = _symbol_database.Default()
|
|
|
15
15
|
|
|
16
16
|
|
|
17
17
|
|
|
18
|
-
DESCRIPTOR = _descriptor_pool.Default().AddSerializedFile(b'\n\x12model_config.proto\x12\tinference\"\x96\x01\n\x10ModelRateLimiter\x12\x37\n\tresources\x18\x01 \x03(\x0b\x32$.inference.ModelRateLimiter.Resource\x12\x10\n\x08priority\x18\x02 \x01(\r\x1a\x37\n\x08Resource\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0e\n\x06global\x18\x02 \x01(\x08\x12\r\n\x05\x63ount\x18\x03 \x01(\r\"\x87\x04\n\x12ModelInstanceGroup\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x30\n\x04kind\x18\x04 \x01(\x0e\x32\".inference.ModelInstanceGroup.Kind\x12\r\n\x05\x63ount\x18\x02 \x01(\x05\x12\x31\n\x0crate_limiter\x18\x06 \x01(\x0b\x32\x1b.inference.ModelRateLimiter\x12\x0c\n\x04gpus\x18\x03 \x03(\x05\x12H\n\x11secondary_devices\x18\x08 \x03(\x0b\x32-.inference.ModelInstanceGroup.SecondaryDevice\x12\x0f\n\x07profile\x18\x05 \x03(\t\x12\x0f\n\x07passive\x18\x07 \x01(\x08\x12\x13\n\x0bhost_policy\x18\t \x01(\t\x1a\x9c\x01\n\x0fSecondaryDevice\x12O\n\x04kind\x18\x01 \x01(\x0e\x32\x41.inference.ModelInstanceGroup.SecondaryDevice.SecondaryDeviceKind\x12\x11\n\tdevice_id\x18\x02 \x01(\x03\"%\n\x13SecondaryDeviceKind\x12\x0e\n\nKIND_NVDLA\x10\x00\"A\n\x04Kind\x12\r\n\tKIND_AUTO\x10\x00\x12\x0c\n\x08KIND_GPU\x10\x01\x12\x0c\n\x08KIND_CPU\x10\x02\x12\x0e\n\nKIND_MODEL\x10\x03\"#\n\x12ModelTensorReshape\x12\r\n\x05shape\x18\x01 \x03(\x03\"\xb2\x02\n\nModelInput\x12\x0c\n\x04name\x18\x01 \x01(\t\x12&\n\tdata_type\x18\x02 \x01(\x0e\x32\x13.inference.DataType\x12,\n\x06\x66ormat\x18\x03 \x01(\x0e\x32\x1c.inference.ModelInput.Format\x12\x0c\n\x04\x64ims\x18\x04 \x03(\x03\x12.\n\x07reshape\x18\x05 \x01(\x0b\x32\x1d.inference.ModelTensorReshape\x12\x17\n\x0fis_shape_tensor\x18\x06 \x01(\x08\x12\x1a\n\x12\x61llow_ragged_batch\x18\x07 \x01(\x08\x12\x10\n\x08optional\x18\x08 \x01(\x08\";\n\x06\x46ormat\x12\x0f\n\x0b\x46ORMAT_NONE\x10\x00\x12\x0f\n\x0b\x46ORMAT_NHWC\x10\x01\x12\x0f\n\x0b\x46ORMAT_NCHW\x10\x02\"\xb2\x01\n\x0bModelOutput\x12\x0c\n\x04name\x18\x01 \x01(\t\x12&\n\tdata_type\x18\x02 
\x01(\x0e\x32\x13.inference.DataType\x12\x0c\n\x04\x64ims\x18\x03 \x03(\x03\x12.\n\x07reshape\x18\x05 \x01(\x0b\x32\x1d.inference.ModelTensorReshape\x12\x16\n\x0elabel_filename\x18\x04 \x01(\t\x12\x17\n\x0fis_shape_tensor\x18\x06 \x01(\x08\"\xd9\x02\n\nBatchInput\x12(\n\x04kind\x18\x01 \x01(\x0e\x32\x1a.inference.BatchInput.Kind\x12\x13\n\x0btarget_name\x18\x02 \x03(\t\x12&\n\tdata_type\x18\x03 \x01(\x0e\x32\x13.inference.DataType\x12\x14\n\x0csource_input\x18\x04 \x03(\t\"\xcd\x01\n\x04Kind\x12\x17\n\x13\x42\x41TCH_ELEMENT_COUNT\x10\x00\x12#\n\x1f\x42\x41TCH_ACCUMULATED_ELEMENT_COUNT\x10\x01\x12-\n)BATCH_ACCUMULATED_ELEMENT_COUNT_WITH_ZERO\x10\x02\x12$\n BATCH_MAX_ELEMENT_COUNT_AS_SHAPE\x10\x03\x12\x14\n\x10\x42\x41TCH_ITEM_SHAPE\x10\x04\x12\x1c\n\x18\x42\x41TCH_ITEM_SHAPE_FLATTEN\x10\x05\"\x8f\x01\n\x0b\x42\x61tchOutput\x12\x13\n\x0btarget_name\x18\x01 \x03(\t\x12)\n\x04kind\x18\x02 \x01(\x0e\x32\x1b.inference.BatchOutput.Kind\x12\x14\n\x0csource_input\x18\x03 \x03(\t\"*\n\x04Kind\x12\"\n\x1e\x42\x41TCH_SCATTER_WITH_INPUT_SHAPE\x10\x00\"\x90\x02\n\x12ModelVersionPolicy\x12\x36\n\x06latest\x18\x01 \x01(\x0b\x32$.inference.ModelVersionPolicy.LatestH\x00\x12\x30\n\x03\x61ll\x18\x02 \x01(\x0b\x32!.inference.ModelVersionPolicy.AllH\x00\x12:\n\x08specific\x18\x03 \x01(\x0b\x32&.inference.ModelVersionPolicy.SpecificH\x00\x1a\x1e\n\x06Latest\x12\x14\n\x0cnum_versions\x18\x01 \x01(\r\x1a\x05\n\x03\x41ll\x1a\x1c\n\x08Specific\x12\x10\n\x08versions\x18\x01 \x03(\x03\x42\x0f\n\rpolicy_choice\"\xfd\r\n\x17ModelOptimizationPolicy\x12\x37\n\x05graph\x18\x01 \x01(\x0b\x32(.inference.ModelOptimizationPolicy.Graph\x12\x42\n\x08priority\x18\x02 \x01(\x0e\x32\x30.inference.ModelOptimizationPolicy.ModelPriority\x12\x35\n\x04\x63uda\x18\x03 \x01(\x0b\x32\'.inference.ModelOptimizationPolicy.Cuda\x12X\n\x16\x65xecution_accelerators\x18\x04 \x01(\x0b\x32\x38.inference.ModelOptimizationPolicy.ExecutionAccelerators\x12R\n\x13input_pinned_memory\x18\x05 
\x01(\x0b\x32\x35.inference.ModelOptimizationPolicy.PinnedMemoryBuffer\x12S\n\x14output_pinned_memory\x18\x06 \x01(\x0b\x32\x35.inference.ModelOptimizationPolicy.PinnedMemoryBuffer\x12&\n\x1egather_kernel_buffer_threshold\x18\x07 \x01(\r\x12\x16\n\x0e\x65\x61ger_batching\x18\x08 \x01(\x08\x1a\x16\n\x05Graph\x12\r\n\x05level\x18\x01 \x01(\x05\x1a\xba\x05\n\x04\x43uda\x12\x0e\n\x06graphs\x18\x01 \x01(\x08\x12\x18\n\x10\x62usy_wait_events\x18\x02 \x01(\x08\x12\x45\n\ngraph_spec\x18\x03 \x03(\x0b\x32\x31.inference.ModelOptimizationPolicy.Cuda.GraphSpec\x12\x1a\n\x12output_copy_stream\x18\x04 \x01(\x08\x1a\xa4\x04\n\tGraphSpec\x12\x12\n\nbatch_size\x18\x01 \x01(\x05\x12K\n\x05input\x18\x02 \x03(\x0b\x32<.inference.ModelOptimizationPolicy.Cuda.GraphSpec.InputEntry\x12W\n\x11graph_lower_bound\x18\x03 \x01(\x0b\x32<.inference.ModelOptimizationPolicy.Cuda.GraphSpec.LowerBound\x1a\x14\n\x05Shape\x12\x0b\n\x03\x64im\x18\x01 \x03(\x03\x1a\xdf\x01\n\nLowerBound\x12\x12\n\nbatch_size\x18\x01 \x01(\x05\x12V\n\x05input\x18\x02 \x03(\x0b\x32G.inference.ModelOptimizationPolicy.Cuda.GraphSpec.LowerBound.InputEntry\x1a\x65\n\nInputEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\x46\n\x05value\x18\x02 \x01(\x0b\x32\x37.inference.ModelOptimizationPolicy.Cuda.GraphSpec.Shape:\x02\x38\x01\x1a\x65\n\nInputEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\x46\n\x05value\x18\x02 \x01(\x0b\x32\x37.inference.ModelOptimizationPolicy.Cuda.GraphSpec.Shape:\x02\x38\x01\x1a\xa4\x03\n\x15\x45xecutionAccelerators\x12g\n\x19gpu_execution_accelerator\x18\x01 \x03(\x0b\x32\x44.inference.ModelOptimizationPolicy.ExecutionAccelerators.Accelerator\x12g\n\x19\x63pu_execution_accelerator\x18\x02 \x03(\x0b\x32\x44.inference.ModelOptimizationPolicy.ExecutionAccelerators.Accelerator\x1a\xb8\x01\n\x0b\x41\x63\x63\x65lerator\x12\x0c\n\x04name\x18\x01 \x01(\t\x12h\n\nparameters\x18\x02 
\x03(\x0b\x32T.inference.ModelOptimizationPolicy.ExecutionAccelerators.Accelerator.ParametersEntry\x1a\x31\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\x1a$\n\x12PinnedMemoryBuffer\x12\x0e\n\x06\x65nable\x18\x01 \x01(\x08\"I\n\rModelPriority\x12\x14\n\x10PRIORITY_DEFAULT\x10\x00\x12\x10\n\x0cPRIORITY_MAX\x10\x01\x12\x10\n\x0cPRIORITY_MIN\x10\x02\"\xdb\x01\n\x10ModelQueuePolicy\x12\x41\n\x0etimeout_action\x18\x01 \x01(\x0e\x32).inference.ModelQueuePolicy.TimeoutAction\x12$\n\x1c\x64\x65\x66\x61ult_timeout_microseconds\x18\x02 \x01(\x04\x12\x1e\n\x16\x61llow_timeout_override\x18\x03 \x01(\x08\x12\x16\n\x0emax_queue_size\x18\x04 \x01(\r\"&\n\rTimeoutAction\x12\n\n\x06REJECT\x10\x00\x12\t\n\x05\x44\x45LAY\x10\x01\"\x9b\x03\n\x14ModelDynamicBatching\x12\x1c\n\x14preferred_batch_size\x18\x01 \x03(\x05\x12$\n\x1cmax_queue_delay_microseconds\x18\x02 \x01(\x04\x12\x19\n\x11preserve_ordering\x18\x03 \x01(\x08\x12\x17\n\x0fpriority_levels\x18\x04 \x01(\r\x12\x1e\n\x16\x64\x65\x66\x61ult_priority_level\x18\x05 \x01(\r\x12\x39\n\x14\x64\x65\x66\x61ult_queue_policy\x18\x06 \x01(\x0b\x32\x1b.inference.ModelQueuePolicy\x12W\n\x15priority_queue_policy\x18\x07 \x03(\x0b\x32\x38.inference.ModelDynamicBatching.PriorityQueuePolicyEntry\x1aW\n\x18PriorityQueuePolicyEntry\x12\x0b\n\x03key\x18\x01 \x01(\r\x12*\n\x05value\x18\x02 \x01(\x0b\x32\x1b.inference.ModelQueuePolicy:\x02\x38\x01\"\xef\t\n\x15ModelSequenceBatching\x12\x41\n\x06\x64irect\x18\x03 \x01(\x0b\x32/.inference.ModelSequenceBatching.StrategyDirectH\x00\x12\x41\n\x06oldest\x18\x04 \x01(\x0b\x32/.inference.ModelSequenceBatching.StrategyOldestH\x00\x12&\n\x1emax_sequence_idle_microseconds\x18\x01 \x01(\x04\x12\x44\n\rcontrol_input\x18\x02 \x03(\x0b\x32-.inference.ModelSequenceBatching.ControlInput\x12\x35\n\x05state\x18\x05 \x03(\x0b\x32&.inference.ModelSequenceBatching.State\x1a\xb1\x02\n\x07\x43ontrol\x12;\n\x04kind\x18\x01 
\x01(\x0e\x32-.inference.ModelSequenceBatching.Control.Kind\x12\x18\n\x10int32_false_true\x18\x02 \x03(\x05\x12\x17\n\x0f\x66p32_false_true\x18\x03 \x03(\x02\x12\x17\n\x0f\x62ool_false_true\x18\x05 \x03(\x08\x12&\n\tdata_type\x18\x04 \x01(\x0e\x32\x13.inference.DataType\"u\n\x04Kind\x12\x1a\n\x16\x43ONTROL_SEQUENCE_START\x10\x00\x12\x1a\n\x16\x43ONTROL_SEQUENCE_READY\x10\x01\x12\x18\n\x14\x43ONTROL_SEQUENCE_END\x10\x02\x12\x1b\n\x17\x43ONTROL_SEQUENCE_CORRID\x10\x03\x1aW\n\x0c\x43ontrolInput\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x39\n\x07\x63ontrol\x18\x02 \x03(\x0b\x32(.inference.ModelSequenceBatching.Control\x1a\x8a\x01\n\x0cInitialState\x12&\n\tdata_type\x18\x01 \x01(\x0e\x32\x13.inference.DataType\x12\x0c\n\x04\x64ims\x18\x02 \x03(\x03\x12\x13\n\tzero_data\x18\x03 \x01(\x08H\x00\x12\x13\n\tdata_file\x18\x04 \x01(\tH\x00\x12\x0c\n\x04name\x18\x05 \x01(\tB\x0c\n\nstate_data\x1a\xac\x01\n\x05State\x12\x12\n\ninput_name\x18\x01 \x01(\t\x12\x13\n\x0boutput_name\x18\x02 \x01(\t\x12&\n\tdata_type\x18\x03 \x01(\x0e\x32\x13.inference.DataType\x12\x0c\n\x04\x64ims\x18\x04 \x03(\x03\x12\x44\n\rinitial_state\x18\x05 \x03(\x0b\x32-.inference.ModelSequenceBatching.InitialState\x1aX\n\x0eStrategyDirect\x12$\n\x1cmax_queue_delay_microseconds\x18\x01 \x01(\x04\x12 \n\x18minimum_slot_utilization\x18\x02 \x01(\x02\x1au\n\x0eStrategyOldest\x12\x1f\n\x17max_candidate_sequences\x18\x01 \x01(\x05\x12\x1c\n\x14preferred_batch_size\x18\x02 \x03(\x05\x12$\n\x1cmax_queue_delay_microseconds\x18\x03 \x01(\x04\x42\x11\n\x0fstrategy_choice\"\xf6\x02\n\x0fModelEnsembling\x12-\n\x04step\x18\x01 \x03(\x0b\x32\x1f.inference.ModelEnsembling.Step\x1a\xb3\x02\n\x04Step\x12\x12\n\nmodel_name\x18\x01 \x01(\t\x12\x15\n\rmodel_version\x18\x02 \x01(\x03\x12@\n\tinput_map\x18\x03 \x03(\x0b\x32-.inference.ModelEnsembling.Step.InputMapEntry\x12\x42\n\noutput_map\x18\x04 \x03(\x0b\x32..inference.ModelEnsembling.Step.OutputMapEntry\x12\x17\n\x0fmodel_namespace\x18\x05 
\x01(\t\x1a/\n\rInputMapEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\x1a\x30\n\x0eOutputMapEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\"&\n\x0eModelParameter\x12\x14\n\x0cstring_value\x18\x01 \x01(\t\"\xd9\x02\n\x0bModelWarmup\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x12\n\nbatch_size\x18\x02 \x01(\r\x12\x32\n\x06inputs\x18\x03 \x03(\x0b\x32\".inference.ModelWarmup.InputsEntry\x12\r\n\x05\x63ount\x18\x04 \x01(\r\x1a\x97\x01\n\x05Input\x12&\n\tdata_type\x18\x01 \x01(\x0e\x32\x13.inference.DataType\x12\x0c\n\x04\x64ims\x18\x02 \x03(\x03\x12\x13\n\tzero_data\x18\x03 \x01(\x08H\x00\x12\x15\n\x0brandom_data\x18\x04 \x01(\x08H\x00\x12\x19\n\x0finput_data_file\x18\x05 \x01(\tH\x00\x42\x11\n\x0finput_data_type\x1aK\n\x0bInputsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12+\n\x05value\x18\x02 \x01(\x0b\x32\x1c.inference.ModelWarmup.Input:\x02\x38\x01\".\n\x0fModelOperations\x12\x1b\n\x13op_library_filename\x18\x01 \x03(\t\"+\n\x16ModelTransactionPolicy\x12\x11\n\tdecoupled\x18\x01 \x01(\x08\"\xe6\x01\n\x15ModelRepositoryAgents\x12\x36\n\x06\x61gents\x18\x01 \x03(\x0b\x32&.inference.ModelRepositoryAgents.Agent\x1a\x94\x01\n\x05\x41gent\x12\x0c\n\x04name\x18\x01 \x01(\t\x12J\n\nparameters\x18\x02 \x03(\x0b\x32\x36.inference.ModelRepositoryAgents.Agent.ParametersEntry\x1a\x31\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\"$\n\x12ModelResponseCache\x12\x0e\n\x06\x65nable\x18\x01 \x01(\x08\"\xb2\n\n\x0bModelConfig\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x10\n\x08platform\x18\x02 \x01(\t\x12\x0f\n\x07\x62\x61\x63kend\x18\x11 \x01(\t\x12\x35\n\x0eversion_policy\x18\x03 \x01(\x0b\x32\x1d.inference.ModelVersionPolicy\x12\x16\n\x0emax_batch_size\x18\x04 \x01(\x05\x12$\n\x05input\x18\x05 \x03(\x0b\x32\x15.inference.ModelInput\x12&\n\x06output\x18\x06 \x03(\x0b\x32\x16.inference.ModelOutput\x12*\n\x0b\x62\x61tch_input\x18\x14 
\x03(\x0b\x32\x15.inference.BatchInput\x12,\n\x0c\x62\x61tch_output\x18\x15 \x03(\x0b\x32\x16.inference.BatchOutput\x12\x38\n\x0coptimization\x18\x0c \x01(\x0b\x32\".inference.ModelOptimizationPolicy\x12;\n\x10\x64ynamic_batching\x18\x0b \x01(\x0b\x32\x1f.inference.ModelDynamicBatchingH\x00\x12=\n\x11sequence_batching\x18\r \x01(\x0b\x32 .inference.ModelSequenceBatchingH\x00\x12\x39\n\x13\x65nsemble_scheduling\x18\x0f \x01(\x0b\x32\x1a.inference.ModelEnsemblingH\x00\x12\x35\n\x0einstance_group\x18\x07 \x03(\x0b\x32\x1d.inference.ModelInstanceGroup\x12\x1e\n\x16\x64\x65\x66\x61ult_model_filename\x18\x08 \x01(\t\x12H\n\x12\x63\x63_model_filenames\x18\t \x03(\x0b\x32,.inference.ModelConfig.CcModelFilenamesEntry\x12;\n\x0bmetric_tags\x18\n \x03(\x0b\x32&.inference.ModelConfig.MetricTagsEntry\x12:\n\nparameters\x18\x0e \x03(\x0b\x32&.inference.ModelConfig.ParametersEntry\x12,\n\x0cmodel_warmup\x18\x10 \x03(\x0b\x32\x16.inference.ModelWarmup\x12\x34\n\x10model_operations\x18\x12 \x01(\x0b\x32\x1a.inference.ModelOperations\x12\x43\n\x18model_transaction_policy\x18\x13 \x01(\x0b\x32!.inference.ModelTransactionPolicy\x12\x41\n\x17model_repository_agents\x18\x17 \x01(\x0b\x32 .inference.ModelRepositoryAgents\x12\x35\n\x0eresponse_cache\x18\x18 \x01(\x0b\x32\x1d.inference.ModelResponseCache\x1a\x37\n\x15\x43\x63ModelFilenamesEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\x1a\x31\n\x0fMetricTagsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\x1aL\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12(\n\x05value\x18\x02 
\x01(\x0b\x32\x19.inference.ModelParameter:\x02\x38\x01\x42\x13\n\x11scheduling_choice*\xfa\x01\n\x08\x44\x61taType\x12\x10\n\x0cTYPE_INVALID\x10\x00\x12\r\n\tTYPE_BOOL\x10\x01\x12\x0e\n\nTYPE_UINT8\x10\x02\x12\x0f\n\x0bTYPE_UINT16\x10\x03\x12\x0f\n\x0bTYPE_UINT32\x10\x04\x12\x0f\n\x0bTYPE_UINT64\x10\x05\x12\r\n\tTYPE_INT8\x10\x06\x12\x0e\n\nTYPE_INT16\x10\x07\x12\x0e\n\nTYPE_INT32\x10\x08\x12\x0e\n\nTYPE_INT64\x10\t\x12\r\n\tTYPE_FP16\x10\n\x12\r\n\tTYPE_FP32\x10\x0b\x12\r\n\tTYPE_FP64\x10\x0c\x12\x0f\n\x0bTYPE_STRING\x10\r\x12\r\n\tTYPE_BF16\x10\x0e\x62\x06proto3')
|
|
18
|
+
DESCRIPTOR = _descriptor_pool.Default().AddSerializedFile(b'\n\x12model_config.proto\x12\tinference\"\x96\x01\n\x10ModelRateLimiter\x12\x37\n\tresources\x18\x01 \x03(\x0b\x32$.inference.ModelRateLimiter.Resource\x12\x10\n\x08priority\x18\x02 \x01(\r\x1a\x37\n\x08Resource\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0e\n\x06global\x18\x02 \x01(\x08\x12\r\n\x05\x63ount\x18\x03 \x01(\r\"\x87\x04\n\x12ModelInstanceGroup\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x30\n\x04kind\x18\x04 \x01(\x0e\x32\".inference.ModelInstanceGroup.Kind\x12\r\n\x05\x63ount\x18\x02 \x01(\x05\x12\x31\n\x0crate_limiter\x18\x06 \x01(\x0b\x32\x1b.inference.ModelRateLimiter\x12\x0c\n\x04gpus\x18\x03 \x03(\x05\x12H\n\x11secondary_devices\x18\x08 \x03(\x0b\x32-.inference.ModelInstanceGroup.SecondaryDevice\x12\x0f\n\x07profile\x18\x05 \x03(\t\x12\x0f\n\x07passive\x18\x07 \x01(\x08\x12\x13\n\x0bhost_policy\x18\t \x01(\t\x1a\x9c\x01\n\x0fSecondaryDevice\x12O\n\x04kind\x18\x01 \x01(\x0e\x32\x41.inference.ModelInstanceGroup.SecondaryDevice.SecondaryDeviceKind\x12\x11\n\tdevice_id\x18\x02 \x01(\x03\"%\n\x13SecondaryDeviceKind\x12\x0e\n\nKIND_NVDLA\x10\x00\"A\n\x04Kind\x12\r\n\tKIND_AUTO\x10\x00\x12\x0c\n\x08KIND_GPU\x10\x01\x12\x0c\n\x08KIND_CPU\x10\x02\x12\x0e\n\nKIND_MODEL\x10\x03\"#\n\x12ModelTensorReshape\x12\r\n\x05shape\x18\x01 \x03(\x03\"\xb2\x02\n\nModelInput\x12\x0c\n\x04name\x18\x01 \x01(\t\x12&\n\tdata_type\x18\x02 \x01(\x0e\x32\x13.inference.DataType\x12,\n\x06\x66ormat\x18\x03 \x01(\x0e\x32\x1c.inference.ModelInput.Format\x12\x0c\n\x04\x64ims\x18\x04 \x03(\x03\x12.\n\x07reshape\x18\x05 \x01(\x0b\x32\x1d.inference.ModelTensorReshape\x12\x17\n\x0fis_shape_tensor\x18\x06 \x01(\x08\x12\x1a\n\x12\x61llow_ragged_batch\x18\x07 \x01(\x08\x12\x10\n\x08optional\x18\x08 \x01(\x08\";\n\x06\x46ormat\x12\x0f\n\x0b\x46ORMAT_NONE\x10\x00\x12\x0f\n\x0b\x46ORMAT_NHWC\x10\x01\x12\x0f\n\x0b\x46ORMAT_NCHW\x10\x02\"\xb2\x01\n\x0bModelOutput\x12\x0c\n\x04name\x18\x01 \x01(\t\x12&\n\tdata_type\x18\x02 
\x01(\x0e\x32\x13.inference.DataType\x12\x0c\n\x04\x64ims\x18\x03 \x03(\x03\x12.\n\x07reshape\x18\x05 \x01(\x0b\x32\x1d.inference.ModelTensorReshape\x12\x16\n\x0elabel_filename\x18\x04 \x01(\t\x12\x17\n\x0fis_shape_tensor\x18\x06 \x01(\x08\"\xd9\x02\n\nBatchInput\x12(\n\x04kind\x18\x01 \x01(\x0e\x32\x1a.inference.BatchInput.Kind\x12\x13\n\x0btarget_name\x18\x02 \x03(\t\x12&\n\tdata_type\x18\x03 \x01(\x0e\x32\x13.inference.DataType\x12\x14\n\x0csource_input\x18\x04 \x03(\t\"\xcd\x01\n\x04Kind\x12\x17\n\x13\x42\x41TCH_ELEMENT_COUNT\x10\x00\x12#\n\x1f\x42\x41TCH_ACCUMULATED_ELEMENT_COUNT\x10\x01\x12-\n)BATCH_ACCUMULATED_ELEMENT_COUNT_WITH_ZERO\x10\x02\x12$\n BATCH_MAX_ELEMENT_COUNT_AS_SHAPE\x10\x03\x12\x14\n\x10\x42\x41TCH_ITEM_SHAPE\x10\x04\x12\x1c\n\x18\x42\x41TCH_ITEM_SHAPE_FLATTEN\x10\x05\"\x8f\x01\n\x0b\x42\x61tchOutput\x12\x13\n\x0btarget_name\x18\x01 \x03(\t\x12)\n\x04kind\x18\x02 \x01(\x0e\x32\x1b.inference.BatchOutput.Kind\x12\x14\n\x0csource_input\x18\x03 \x03(\t\"*\n\x04Kind\x12\"\n\x1e\x42\x41TCH_SCATTER_WITH_INPUT_SHAPE\x10\x00\"\x90\x02\n\x12ModelVersionPolicy\x12\x36\n\x06latest\x18\x01 \x01(\x0b\x32$.inference.ModelVersionPolicy.LatestH\x00\x12\x30\n\x03\x61ll\x18\x02 \x01(\x0b\x32!.inference.ModelVersionPolicy.AllH\x00\x12:\n\x08specific\x18\x03 \x01(\x0b\x32&.inference.ModelVersionPolicy.SpecificH\x00\x1a\x1e\n\x06Latest\x12\x14\n\x0cnum_versions\x18\x01 \x01(\r\x1a\x05\n\x03\x41ll\x1a\x1c\n\x08Specific\x12\x10\n\x08versions\x18\x01 \x03(\x03\x42\x0f\n\rpolicy_choice\"\xfd\r\n\x17ModelOptimizationPolicy\x12\x37\n\x05graph\x18\x01 \x01(\x0b\x32(.inference.ModelOptimizationPolicy.Graph\x12\x42\n\x08priority\x18\x02 \x01(\x0e\x32\x30.inference.ModelOptimizationPolicy.ModelPriority\x12\x35\n\x04\x63uda\x18\x03 \x01(\x0b\x32\'.inference.ModelOptimizationPolicy.Cuda\x12X\n\x16\x65xecution_accelerators\x18\x04 \x01(\x0b\x32\x38.inference.ModelOptimizationPolicy.ExecutionAccelerators\x12R\n\x13input_pinned_memory\x18\x05 
\x01(\x0b\x32\x35.inference.ModelOptimizationPolicy.PinnedMemoryBuffer\x12S\n\x14output_pinned_memory\x18\x06 \x01(\x0b\x32\x35.inference.ModelOptimizationPolicy.PinnedMemoryBuffer\x12&\n\x1egather_kernel_buffer_threshold\x18\x07 \x01(\r\x12\x16\n\x0e\x65\x61ger_batching\x18\x08 \x01(\x08\x1a\x16\n\x05Graph\x12\r\n\x05level\x18\x01 \x01(\x05\x1a\xba\x05\n\x04\x43uda\x12\x0e\n\x06graphs\x18\x01 \x01(\x08\x12\x18\n\x10\x62usy_wait_events\x18\x02 \x01(\x08\x12\x45\n\ngraph_spec\x18\x03 \x03(\x0b\x32\x31.inference.ModelOptimizationPolicy.Cuda.GraphSpec\x12\x1a\n\x12output_copy_stream\x18\x04 \x01(\x08\x1a\xa4\x04\n\tGraphSpec\x12\x12\n\nbatch_size\x18\x01 \x01(\x05\x12K\n\x05input\x18\x02 \x03(\x0b\x32<.inference.ModelOptimizationPolicy.Cuda.GraphSpec.InputEntry\x12W\n\x11graph_lower_bound\x18\x03 \x01(\x0b\x32<.inference.ModelOptimizationPolicy.Cuda.GraphSpec.LowerBound\x1a\x14\n\x05Shape\x12\x0b\n\x03\x64im\x18\x01 \x03(\x03\x1a\xdf\x01\n\nLowerBound\x12\x12\n\nbatch_size\x18\x01 \x01(\x05\x12V\n\x05input\x18\x02 \x03(\x0b\x32G.inference.ModelOptimizationPolicy.Cuda.GraphSpec.LowerBound.InputEntry\x1a\x65\n\nInputEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\x46\n\x05value\x18\x02 \x01(\x0b\x32\x37.inference.ModelOptimizationPolicy.Cuda.GraphSpec.Shape:\x02\x38\x01\x1a\x65\n\nInputEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\x46\n\x05value\x18\x02 \x01(\x0b\x32\x37.inference.ModelOptimizationPolicy.Cuda.GraphSpec.Shape:\x02\x38\x01\x1a\xa4\x03\n\x15\x45xecutionAccelerators\x12g\n\x19gpu_execution_accelerator\x18\x01 \x03(\x0b\x32\x44.inference.ModelOptimizationPolicy.ExecutionAccelerators.Accelerator\x12g\n\x19\x63pu_execution_accelerator\x18\x02 \x03(\x0b\x32\x44.inference.ModelOptimizationPolicy.ExecutionAccelerators.Accelerator\x1a\xb8\x01\n\x0b\x41\x63\x63\x65lerator\x12\x0c\n\x04name\x18\x01 \x01(\t\x12h\n\nparameters\x18\x02 
\x03(\x0b\x32T.inference.ModelOptimizationPolicy.ExecutionAccelerators.Accelerator.ParametersEntry\x1a\x31\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\x1a$\n\x12PinnedMemoryBuffer\x12\x0e\n\x06\x65nable\x18\x01 \x01(\x08\"I\n\rModelPriority\x12\x14\n\x10PRIORITY_DEFAULT\x10\x00\x12\x10\n\x0cPRIORITY_MAX\x10\x01\x12\x10\n\x0cPRIORITY_MIN\x10\x02\"\xdb\x01\n\x10ModelQueuePolicy\x12\x41\n\x0etimeout_action\x18\x01 \x01(\x0e\x32).inference.ModelQueuePolicy.TimeoutAction\x12$\n\x1c\x64\x65\x66\x61ult_timeout_microseconds\x18\x02 \x01(\x04\x12\x1e\n\x16\x61llow_timeout_override\x18\x03 \x01(\x08\x12\x16\n\x0emax_queue_size\x18\x04 \x01(\r\"&\n\rTimeoutAction\x12\n\n\x06REJECT\x10\x00\x12\t\n\x05\x44\x45LAY\x10\x01\"\x9b\x03\n\x14ModelDynamicBatching\x12\x1c\n\x14preferred_batch_size\x18\x01 \x03(\x05\x12$\n\x1cmax_queue_delay_microseconds\x18\x02 \x01(\x04\x12\x19\n\x11preserve_ordering\x18\x03 \x01(\x08\x12\x17\n\x0fpriority_levels\x18\x04 \x01(\x04\x12\x1e\n\x16\x64\x65\x66\x61ult_priority_level\x18\x05 \x01(\x04\x12\x39\n\x14\x64\x65\x66\x61ult_queue_policy\x18\x06 \x01(\x0b\x32\x1b.inference.ModelQueuePolicy\x12W\n\x15priority_queue_policy\x18\x07 \x03(\x0b\x32\x38.inference.ModelDynamicBatching.PriorityQueuePolicyEntry\x1aW\n\x18PriorityQueuePolicyEntry\x12\x0b\n\x03key\x18\x01 \x01(\x04\x12*\n\x05value\x18\x02 \x01(\x0b\x32\x1b.inference.ModelQueuePolicy:\x02\x38\x01\"\xef\t\n\x15ModelSequenceBatching\x12\x41\n\x06\x64irect\x18\x03 \x01(\x0b\x32/.inference.ModelSequenceBatching.StrategyDirectH\x00\x12\x41\n\x06oldest\x18\x04 \x01(\x0b\x32/.inference.ModelSequenceBatching.StrategyOldestH\x00\x12&\n\x1emax_sequence_idle_microseconds\x18\x01 \x01(\x04\x12\x44\n\rcontrol_input\x18\x02 \x03(\x0b\x32-.inference.ModelSequenceBatching.ControlInput\x12\x35\n\x05state\x18\x05 \x03(\x0b\x32&.inference.ModelSequenceBatching.State\x1a\xb1\x02\n\x07\x43ontrol\x12;\n\x04kind\x18\x01 
\x01(\x0e\x32-.inference.ModelSequenceBatching.Control.Kind\x12\x18\n\x10int32_false_true\x18\x02 \x03(\x05\x12\x17\n\x0f\x66p32_false_true\x18\x03 \x03(\x02\x12\x17\n\x0f\x62ool_false_true\x18\x05 \x03(\x08\x12&\n\tdata_type\x18\x04 \x01(\x0e\x32\x13.inference.DataType\"u\n\x04Kind\x12\x1a\n\x16\x43ONTROL_SEQUENCE_START\x10\x00\x12\x1a\n\x16\x43ONTROL_SEQUENCE_READY\x10\x01\x12\x18\n\x14\x43ONTROL_SEQUENCE_END\x10\x02\x12\x1b\n\x17\x43ONTROL_SEQUENCE_CORRID\x10\x03\x1aW\n\x0c\x43ontrolInput\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x39\n\x07\x63ontrol\x18\x02 \x03(\x0b\x32(.inference.ModelSequenceBatching.Control\x1a\x8a\x01\n\x0cInitialState\x12&\n\tdata_type\x18\x01 \x01(\x0e\x32\x13.inference.DataType\x12\x0c\n\x04\x64ims\x18\x02 \x03(\x03\x12\x13\n\tzero_data\x18\x03 \x01(\x08H\x00\x12\x13\n\tdata_file\x18\x04 \x01(\tH\x00\x12\x0c\n\x04name\x18\x05 \x01(\tB\x0c\n\nstate_data\x1a\xac\x01\n\x05State\x12\x12\n\ninput_name\x18\x01 \x01(\t\x12\x13\n\x0boutput_name\x18\x02 \x01(\t\x12&\n\tdata_type\x18\x03 \x01(\x0e\x32\x13.inference.DataType\x12\x0c\n\x04\x64ims\x18\x04 \x03(\x03\x12\x44\n\rinitial_state\x18\x05 \x03(\x0b\x32-.inference.ModelSequenceBatching.InitialState\x1aX\n\x0eStrategyDirect\x12$\n\x1cmax_queue_delay_microseconds\x18\x01 \x01(\x04\x12 \n\x18minimum_slot_utilization\x18\x02 \x01(\x02\x1au\n\x0eStrategyOldest\x12\x1f\n\x17max_candidate_sequences\x18\x01 \x01(\x05\x12\x1c\n\x14preferred_batch_size\x18\x02 \x03(\x05\x12$\n\x1cmax_queue_delay_microseconds\x18\x03 \x01(\x04\x42\x11\n\x0fstrategy_choice\"\xf6\x02\n\x0fModelEnsembling\x12-\n\x04step\x18\x01 \x03(\x0b\x32\x1f.inference.ModelEnsembling.Step\x1a\xb3\x02\n\x04Step\x12\x12\n\nmodel_name\x18\x01 \x01(\t\x12\x15\n\rmodel_version\x18\x02 \x01(\x03\x12@\n\tinput_map\x18\x03 \x03(\x0b\x32-.inference.ModelEnsembling.Step.InputMapEntry\x12\x42\n\noutput_map\x18\x04 \x03(\x0b\x32..inference.ModelEnsembling.Step.OutputMapEntry\x12\x17\n\x0fmodel_namespace\x18\x05 
\x01(\t\x1a/\n\rInputMapEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\x1a\x30\n\x0eOutputMapEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\"&\n\x0eModelParameter\x12\x14\n\x0cstring_value\x18\x01 \x01(\t\"\xd9\x02\n\x0bModelWarmup\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x12\n\nbatch_size\x18\x02 \x01(\r\x12\x32\n\x06inputs\x18\x03 \x03(\x0b\x32\".inference.ModelWarmup.InputsEntry\x12\r\n\x05\x63ount\x18\x04 \x01(\r\x1a\x97\x01\n\x05Input\x12&\n\tdata_type\x18\x01 \x01(\x0e\x32\x13.inference.DataType\x12\x0c\n\x04\x64ims\x18\x02 \x03(\x03\x12\x13\n\tzero_data\x18\x03 \x01(\x08H\x00\x12\x15\n\x0brandom_data\x18\x04 \x01(\x08H\x00\x12\x19\n\x0finput_data_file\x18\x05 \x01(\tH\x00\x42\x11\n\x0finput_data_type\x1aK\n\x0bInputsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12+\n\x05value\x18\x02 \x01(\x0b\x32\x1c.inference.ModelWarmup.Input:\x02\x38\x01\".\n\x0fModelOperations\x12\x1b\n\x13op_library_filename\x18\x01 \x03(\t\"+\n\x16ModelTransactionPolicy\x12\x11\n\tdecoupled\x18\x01 \x01(\x08\"\xe6\x01\n\x15ModelRepositoryAgents\x12\x36\n\x06\x61gents\x18\x01 \x03(\x0b\x32&.inference.ModelRepositoryAgents.Agent\x1a\x94\x01\n\x05\x41gent\x12\x0c\n\x04name\x18\x01 \x01(\t\x12J\n\nparameters\x18\x02 \x03(\x0b\x32\x36.inference.ModelRepositoryAgents.Agent.ParametersEntry\x1a\x31\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\"$\n\x12ModelResponseCache\x12\x0e\n\x06\x65nable\x18\x01 \x01(\x08\"\xb2\n\n\x0bModelConfig\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x10\n\x08platform\x18\x02 \x01(\t\x12\x0f\n\x07\x62\x61\x63kend\x18\x11 \x01(\t\x12\x35\n\x0eversion_policy\x18\x03 \x01(\x0b\x32\x1d.inference.ModelVersionPolicy\x12\x16\n\x0emax_batch_size\x18\x04 \x01(\x05\x12$\n\x05input\x18\x05 \x03(\x0b\x32\x15.inference.ModelInput\x12&\n\x06output\x18\x06 \x03(\x0b\x32\x16.inference.ModelOutput\x12*\n\x0b\x62\x61tch_input\x18\x14 
\x03(\x0b\x32\x15.inference.BatchInput\x12,\n\x0c\x62\x61tch_output\x18\x15 \x03(\x0b\x32\x16.inference.BatchOutput\x12\x38\n\x0coptimization\x18\x0c \x01(\x0b\x32\".inference.ModelOptimizationPolicy\x12;\n\x10\x64ynamic_batching\x18\x0b \x01(\x0b\x32\x1f.inference.ModelDynamicBatchingH\x00\x12=\n\x11sequence_batching\x18\r \x01(\x0b\x32 .inference.ModelSequenceBatchingH\x00\x12\x39\n\x13\x65nsemble_scheduling\x18\x0f \x01(\x0b\x32\x1a.inference.ModelEnsemblingH\x00\x12\x35\n\x0einstance_group\x18\x07 \x03(\x0b\x32\x1d.inference.ModelInstanceGroup\x12\x1e\n\x16\x64\x65\x66\x61ult_model_filename\x18\x08 \x01(\t\x12H\n\x12\x63\x63_model_filenames\x18\t \x03(\x0b\x32,.inference.ModelConfig.CcModelFilenamesEntry\x12;\n\x0bmetric_tags\x18\n \x03(\x0b\x32&.inference.ModelConfig.MetricTagsEntry\x12:\n\nparameters\x18\x0e \x03(\x0b\x32&.inference.ModelConfig.ParametersEntry\x12,\n\x0cmodel_warmup\x18\x10 \x03(\x0b\x32\x16.inference.ModelWarmup\x12\x34\n\x10model_operations\x18\x12 \x01(\x0b\x32\x1a.inference.ModelOperations\x12\x43\n\x18model_transaction_policy\x18\x13 \x01(\x0b\x32!.inference.ModelTransactionPolicy\x12\x41\n\x17model_repository_agents\x18\x17 \x01(\x0b\x32 .inference.ModelRepositoryAgents\x12\x35\n\x0eresponse_cache\x18\x18 \x01(\x0b\x32\x1d.inference.ModelResponseCache\x1a\x37\n\x15\x43\x63ModelFilenamesEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\x1a\x31\n\x0fMetricTagsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\x1aL\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12(\n\x05value\x18\x02 
\x01(\x0b\x32\x19.inference.ModelParameter:\x02\x38\x01\x42\x13\n\x11scheduling_choice*\xfa\x01\n\x08\x44\x61taType\x12\x10\n\x0cTYPE_INVALID\x10\x00\x12\r\n\tTYPE_BOOL\x10\x01\x12\x0e\n\nTYPE_UINT8\x10\x02\x12\x0f\n\x0bTYPE_UINT16\x10\x03\x12\x0f\n\x0bTYPE_UINT32\x10\x04\x12\x0f\n\x0bTYPE_UINT64\x10\x05\x12\r\n\tTYPE_INT8\x10\x06\x12\x0e\n\nTYPE_INT16\x10\x07\x12\x0e\n\nTYPE_INT32\x10\x08\x12\x0e\n\nTYPE_INT64\x10\t\x12\r\n\tTYPE_FP16\x10\n\x12\r\n\tTYPE_FP32\x10\x0b\x12\r\n\tTYPE_FP64\x10\x0c\x12\x0f\n\x0bTYPE_STRING\x10\r\x12\r\n\tTYPE_BF16\x10\x0e\x62\x06proto3')
|
|
19
19
|
|
|
20
20
|
_DATATYPE = DESCRIPTOR.enum_types_by_name['DataType']
|
|
21
21
|
DataType = enum_type_wrapper.EnumTypeWrapper(_DATATYPE)
|
{tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/service_pb2.py
RENAMED
|
@@ -15,7 +15,7 @@ _sym_db = _symbol_database.Default()
|
|
|
15
15
|
from tritonclient.grpc import model_config_pb2 as model__config__pb2
|
|
16
16
|
|
|
17
17
|
|
|
18
|
-
DESCRIPTOR = _descriptor_pool.Default().AddSerializedFile(b'\n\x12grpc_service.proto\x12\tinference\x1a\x12model_config.proto\"\x13\n\x11ServerLiveRequest\"\"\n\x12ServerLiveResponse\x12\x0c\n\x04live\x18\x01 \x01(\x08\"\x14\n\x12ServerReadyRequest\"$\n\x13ServerReadyResponse\x12\r\n\x05ready\x18\x01 \x01(\x08\"2\n\x11ModelReadyRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\"#\n\x12ModelReadyResponse\x12\r\n\x05ready\x18\x01 \x01(\x08\"\x17\n\x15ServerMetadataRequest\"K\n\x16ServerMetadataResponse\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\x12\x12\n\nextensions\x18\x03 \x03(\t\"5\n\x14ModelMetadataRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\"\x8d\x02\n\x15ModelMetadataResponse\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x10\n\x08versions\x18\x02 \x03(\t\x12\x10\n\x08platform\x18\x03 \x01(\t\x12?\n\x06inputs\x18\x04 \x03(\x0b\x32/.inference.ModelMetadataResponse.TensorMetadata\x12@\n\x07outputs\x18\x05 \x03(\x0b\x32/.inference.ModelMetadataResponse.TensorMetadata\x1a?\n\x0eTensorMetadata\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x10\n\x08\x64\x61tatype\x18\x02 \x01(\t\x12\r\n\x05shape\x18\x03 \x03(\x03\"i\n\x0eInferParameter\x12\x14\n\nbool_param\x18\x01 \x01(\x08H\x00\x12\x15\n\x0bint64_param\x18\x02 \x01(\x03H\x00\x12\x16\n\x0cstring_param\x18\x03 \x01(\tH\x00\x42\x12\n\x10parameter_choice\"\xd0\x01\n\x13InferTensorContents\x12\x15\n\rbool_contents\x18\x01 \x03(\x08\x12\x14\n\x0cint_contents\x18\x02 \x03(\x05\x12\x16\n\x0eint64_contents\x18\x03 \x03(\x03\x12\x15\n\ruint_contents\x18\x04 \x03(\r\x12\x17\n\x0fuint64_contents\x18\x05 \x03(\x04\x12\x15\n\rfp32_contents\x18\x06 \x03(\x02\x12\x15\n\rfp64_contents\x18\x07 \x03(\x01\x12\x16\n\x0e\x62ytes_contents\x18\x08 \x03(\x0c\"\xee\x06\n\x11ModelInferRequest\x12\x12\n\nmodel_name\x18\x01 \x01(\t\x12\x15\n\rmodel_version\x18\x02 \x01(\t\x12\n\n\x02id\x18\x03 \x01(\t\x12@\n\nparameters\x18\x04 
\x03(\x0b\x32,.inference.ModelInferRequest.ParametersEntry\x12=\n\x06inputs\x18\x05 \x03(\x0b\x32-.inference.ModelInferRequest.InferInputTensor\x12H\n\x07outputs\x18\x06 \x03(\x0b\x32\x37.inference.ModelInferRequest.InferRequestedOutputTensor\x12\x1a\n\x12raw_input_contents\x18\x07 \x03(\x0c\x1a\x94\x02\n\x10InferInputTensor\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x10\n\x08\x64\x61tatype\x18\x02 \x01(\t\x12\r\n\x05shape\x18\x03 \x03(\x03\x12Q\n\nparameters\x18\x04 \x03(\x0b\x32=.inference.ModelInferRequest.InferInputTensor.ParametersEntry\x12\x30\n\x08\x63ontents\x18\x05 \x01(\x0b\x32\x1e.inference.InferTensorContents\x1aL\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12(\n\x05value\x18\x02 \x01(\x0b\x32\x19.inference.InferParameter:\x02\x38\x01\x1a\xd5\x01\n\x1aInferRequestedOutputTensor\x12\x0c\n\x04name\x18\x01 \x01(\t\x12[\n\nparameters\x18\x02 \x03(\x0b\x32G.inference.ModelInferRequest.InferRequestedOutputTensor.ParametersEntry\x1aL\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12(\n\x05value\x18\x02 \x01(\x0b\x32\x19.inference.InferParameter:\x02\x38\x01\x1aL\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12(\n\x05value\x18\x02 \x01(\x0b\x32\x19.inference.InferParameter:\x02\x38\x01\"\xd5\x04\n\x12ModelInferResponse\x12\x12\n\nmodel_name\x18\x01 \x01(\t\x12\x15\n\rmodel_version\x18\x02 \x01(\t\x12\n\n\x02id\x18\x03 \x01(\t\x12\x41\n\nparameters\x18\x04 \x03(\x0b\x32-.inference.ModelInferResponse.ParametersEntry\x12@\n\x07outputs\x18\x05 \x03(\x0b\x32/.inference.ModelInferResponse.InferOutputTensor\x12\x1b\n\x13raw_output_contents\x18\x06 \x03(\x0c\x1a\x97\x02\n\x11InferOutputTensor\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x10\n\x08\x64\x61tatype\x18\x02 \x01(\t\x12\r\n\x05shape\x18\x03 \x03(\x03\x12S\n\nparameters\x18\x04 \x03(\x0b\x32?.inference.ModelInferResponse.InferOutputTensor.ParametersEntry\x12\x30\n\x08\x63ontents\x18\x05 \x01(\x0b\x32\x1e.inference.InferTensorContents\x1aL\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 
\x01(\t\x12(\n\x05value\x18\x02 \x01(\x0b\x32\x19.inference.InferParameter:\x02\x38\x01\x1aL\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12(\n\x05value\x18\x02 \x01(\x0b\x32\x19.inference.InferParameter:\x02\x38\x01\"h\n\x18ModelStreamInferResponse\x12\x15\n\rerror_message\x18\x01 \x01(\t\x12\x35\n\x0einfer_response\x18\x02 \x01(\x0b\x32\x1d.inference.ModelInferResponse\"3\n\x12ModelConfigRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\"=\n\x13ModelConfigResponse\x12&\n\x06\x63onfig\x18\x01 \x01(\x0b\x32\x16.inference.ModelConfig\"7\n\x16ModelStatisticsRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\".\n\x11StatisticDuration\x12\r\n\x05\x63ount\x18\x01 \x01(\x04\x12\n\n\x02ns\x18\x02 \x01(\x04\"\x9c\x03\n\x0fInferStatistics\x12-\n\x07success\x18\x01 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12*\n\x04\x66\x61il\x18\x02 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12+\n\x05queue\x18\x03 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12\x33\n\rcompute_input\x18\x04 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12\x33\n\rcompute_infer\x18\x05 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12\x34\n\x0e\x63ompute_output\x18\x06 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12/\n\tcache_hit\x18\x07 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12\x30\n\ncache_miss\x18\x08 \x01(\x0b\x32\x1c.inference.StatisticDuration\"\xca\x01\n\x14InferBatchStatistics\x12\x12\n\nbatch_size\x18\x01 \x01(\x04\x12\x33\n\rcompute_input\x18\x02 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12\x33\n\rcompute_infer\x18\x03 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12\x34\n\x0e\x63ompute_output\x18\x04 \x01(\x0b\x32\x1c.inference.StatisticDuration\"\xe5\x01\n\x0fModelStatistics\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\x12\x16\n\x0elast_inference\x18\x03 \x01(\x04\x12\x17\n\x0finference_count\x18\x04 \x01(\x04\x12\x17\n\x0f\x65xecution_count\x18\x05 
\x01(\x04\x12\x33\n\x0finference_stats\x18\x06 \x01(\x0b\x32\x1a.inference.InferStatistics\x12\x34\n\x0b\x62\x61tch_stats\x18\x07 \x03(\x0b\x32\x1f.inference.InferBatchStatistics\"J\n\x17ModelStatisticsResponse\x12/\n\x0bmodel_stats\x18\x01 \x03(\x0b\x32\x1a.inference.ModelStatistics\"\x8a\x01\n\x18ModelRepositoryParameter\x12\x14\n\nbool_param\x18\x01 \x01(\x08H\x00\x12\x15\n\x0bint64_param\x18\x02 \x01(\x03H\x00\x12\x16\n\x0cstring_param\x18\x03 \x01(\tH\x00\x12\x15\n\x0b\x62ytes_param\x18\x04 \x01(\x0cH\x00\x42\x12\n\x10parameter_choice\"@\n\x16RepositoryIndexRequest\x12\x17\n\x0frepository_name\x18\x01 \x01(\t\x12\r\n\x05ready\x18\x02 \x01(\x08\"\xa4\x01\n\x17RepositoryIndexResponse\x12=\n\x06models\x18\x01 \x03(\x0b\x32-.inference.RepositoryIndexResponse.ModelIndex\x1aJ\n\nModelIndex\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\x12\r\n\x05state\x18\x03 \x01(\t\x12\x0e\n\x06reason\x18\x04 \x01(\t\"\xec\x01\n\x1aRepositoryModelLoadRequest\x12\x17\n\x0frepository_name\x18\x01 \x01(\t\x12\x12\n\nmodel_name\x18\x02 \x01(\t\x12I\n\nparameters\x18\x03 \x03(\x0b\x32\x35.inference.RepositoryModelLoadRequest.ParametersEntry\x1aV\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\x32\n\x05value\x18\x02 \x01(\x0b\x32#.inference.ModelRepositoryParameter:\x02\x38\x01\"\x1d\n\x1bRepositoryModelLoadResponse\"\xf0\x01\n\x1cRepositoryModelUnloadRequest\x12\x17\n\x0frepository_name\x18\x01 \x01(\t\x12\x12\n\nmodel_name\x18\x02 \x01(\t\x12K\n\nparameters\x18\x03 \x03(\x0b\x32\x37.inference.RepositoryModelUnloadRequest.ParametersEntry\x1aV\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\x32\n\x05value\x18\x02 \x01(\x0b\x32#.inference.ModelRepositoryParameter:\x02\x38\x01\"\x1f\n\x1dRepositoryModelUnloadResponse\"/\n\x1fSystemSharedMemoryStatusRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\"\xa5\x02\n SystemSharedMemoryStatusResponse\x12I\n\x07regions\x18\x01 
\x03(\x0b\x32\x38.inference.SystemSharedMemoryStatusResponse.RegionsEntry\x1aL\n\x0cRegionStatus\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0b\n\x03key\x18\x02 \x01(\t\x12\x0e\n\x06offset\x18\x03 \x01(\x04\x12\x11\n\tbyte_size\x18\x04 \x01(\x04\x1ah\n\x0cRegionsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12G\n\x05value\x18\x02 \x01(\x0b\x32\x38.inference.SystemSharedMemoryStatusResponse.RegionStatus:\x02\x38\x01\"a\n!SystemSharedMemoryRegisterRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0b\n\x03key\x18\x02 \x01(\t\x12\x0e\n\x06offset\x18\x03 \x01(\x04\x12\x11\n\tbyte_size\x18\x04 \x01(\x04\"$\n\"SystemSharedMemoryRegisterResponse\"3\n#SystemSharedMemoryUnregisterRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\"&\n$SystemSharedMemoryUnregisterResponse\"-\n\x1d\x43udaSharedMemoryStatusRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\"\x95\x02\n\x1e\x43udaSharedMemoryStatusResponse\x12G\n\x07regions\x18\x01 \x03(\x0b\x32\x36.inference.CudaSharedMemoryStatusResponse.RegionsEntry\x1a\x42\n\x0cRegionStatus\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x11\n\tdevice_id\x18\x02 \x01(\x04\x12\x11\n\tbyte_size\x18\x03 \x01(\x04\x1a\x66\n\x0cRegionsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\x45\n\x05value\x18\x02 \x01(\x0b\x32\x36.inference.CudaSharedMemoryStatusResponse.RegionStatus:\x02\x38\x01\"i\n\x1f\x43udaSharedMemoryRegisterRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x12\n\nraw_handle\x18\x02 \x01(\x0c\x12\x11\n\tdevice_id\x18\x03 \x01(\x03\x12\x11\n\tbyte_size\x18\x04 \x01(\x04\"\"\n CudaSharedMemoryRegisterResponse\"1\n!CudaSharedMemoryUnregisterRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\"$\n\"CudaSharedMemoryUnregisterResponse\"\xe6\x01\n\x13TraceSettingRequest\x12>\n\x08settings\x18\x01 \x03(\x0b\x32,.inference.TraceSettingRequest.SettingsEntry\x12\x12\n\nmodel_name\x18\x02 \x01(\t\x1a\x1d\n\x0cSettingValue\x12\r\n\x05value\x18\x01 \x03(\t\x1a\\\n\rSettingsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12:\n\x05value\x18\x02 
\x01(\x0b\x32+.inference.TraceSettingRequest.SettingValue:\x02\x38\x01\"\xd5\x01\n\x14TraceSettingResponse\x12?\n\x08settings\x18\x01 \x03(\x0b\x32-.inference.TraceSettingResponse.SettingsEntry\x1a\x1d\n\x0cSettingValue\x12\r\n\x05value\x18\x01 \x03(\t\x1a]\n\rSettingsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12;\n\x05value\x18\x02 \x01(\x0b\x32,.inference.TraceSettingResponse.SettingValue:\x02\x38\x01\"\x9a\x02\n\x12LogSettingsRequest\x12=\n\x08settings\x18\x01 \x03(\x0b\x32+.inference.LogSettingsRequest.SettingsEntry\x1ah\n\x0cSettingValue\x12\x14\n\nbool_param\x18\x01 \x01(\x08H\x00\x12\x16\n\x0cuint32_param\x18\x02 \x01(\rH\x00\x12\x16\n\x0cstring_param\x18\x03 \x01(\tH\x00\x42\x12\n\x10parameter_choice\x1a[\n\rSettingsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\x39\n\x05value\x18\x02 \x01(\x0b\x32*.inference.LogSettingsRequest.SettingValue:\x02\x38\x01\"\x9d\x02\n\x13LogSettingsResponse\x12>\n\x08settings\x18\x01 \x03(\x0b\x32,.inference.LogSettingsResponse.SettingsEntry\x1ah\n\x0cSettingValue\x12\x14\n\nbool_param\x18\x01 \x01(\x08H\x00\x12\x16\n\x0cuint32_param\x18\x02 \x01(\rH\x00\x12\x16\n\x0cstring_param\x18\x03 \x01(\tH\x00\x42\x12\n\x10parameter_choice\x1a\\\n\rSettingsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12:\n\x05value\x18\x02 \x01(\x0b\x32+.inference.LogSettingsResponse.SettingValue:\x02\x38\x01\x32\xb7\x0f\n\x14GRPCInferenceService\x12K\n\nServerLive\x12\x1c.inference.ServerLiveRequest\x1a\x1d.inference.ServerLiveResponse\"\x00\x12N\n\x0bServerReady\x12\x1d.inference.ServerReadyRequest\x1a\x1e.inference.ServerReadyResponse\"\x00\x12K\n\nModelReady\x12\x1c.inference.ModelReadyRequest\x1a\x1d.inference.ModelReadyResponse\"\x00\x12W\n\x0eServerMetadata\x12 .inference.ServerMetadataRequest\x1a!.inference.ServerMetadataResponse\"\x00\x12T\n\rModelMetadata\x12\x1f.inference.ModelMetadataRequest\x1a 
.inference.ModelMetadataResponse\"\x00\x12K\n\nModelInfer\x12\x1c.inference.ModelInferRequest\x1a\x1d.inference.ModelInferResponse\"\x00\x12[\n\x10ModelStreamInfer\x12\x1c.inference.ModelInferRequest\x1a#.inference.ModelStreamInferResponse\"\x00(\x01\x30\x01\x12N\n\x0bModelConfig\x12\x1d.inference.ModelConfigRequest\x1a\x1e.inference.ModelConfigResponse\"\x00\x12Z\n\x0fModelStatistics\x12!.inference.ModelStatisticsRequest\x1a\".inference.ModelStatisticsResponse\"\x00\x12Z\n\x0fRepositoryIndex\x12!.inference.RepositoryIndexRequest\x1a\".inference.RepositoryIndexResponse\"\x00\x12\x66\n\x13RepositoryModelLoad\x12%.inference.RepositoryModelLoadRequest\x1a&.inference.RepositoryModelLoadResponse\"\x00\x12l\n\x15RepositoryModelUnload\x12\'.inference.RepositoryModelUnloadRequest\x1a(.inference.RepositoryModelUnloadResponse\"\x00\x12u\n\x18SystemSharedMemoryStatus\x12*.inference.SystemSharedMemoryStatusRequest\x1a+.inference.SystemSharedMemoryStatusResponse\"\x00\x12{\n\x1aSystemSharedMemoryRegister\x12,.inference.SystemSharedMemoryRegisterRequest\x1a-.inference.SystemSharedMemoryRegisterResponse\"\x00\x12\x81\x01\n\x1cSystemSharedMemoryUnregister\x12..inference.SystemSharedMemoryUnregisterRequest\x1a/.inference.SystemSharedMemoryUnregisterResponse\"\x00\x12o\n\x16\x43udaSharedMemoryStatus\x12(.inference.CudaSharedMemoryStatusRequest\x1a).inference.CudaSharedMemoryStatusResponse\"\x00\x12u\n\x18\x43udaSharedMemoryRegister\x12*.inference.CudaSharedMemoryRegisterRequest\x1a+.inference.CudaSharedMemoryRegisterResponse\"\x00\x12{\n\x1a\x43udaSharedMemoryUnregister\x12,.inference.CudaSharedMemoryUnregisterRequest\x1a-.inference.CudaSharedMemoryUnregisterResponse\"\x00\x12Q\n\x0cTraceSetting\x12\x1e.inference.TraceSettingRequest\x1a\x1f.inference.TraceSettingResponse\"\x00\x12N\n\x0bLogSettings\x12\x1d.inference.LogSettingsRequest\x1a\x1e.inference.LogSettingsResponse\"\x00\x62\x06proto3')
|
|
18
|
+
DESCRIPTOR = _descriptor_pool.Default().AddSerializedFile(b'\n\x12grpc_service.proto\x12\tinference\x1a\x12model_config.proto\"\x13\n\x11ServerLiveRequest\"\"\n\x12ServerLiveResponse\x12\x0c\n\x04live\x18\x01 \x01(\x08\"\x14\n\x12ServerReadyRequest\"$\n\x13ServerReadyResponse\x12\r\n\x05ready\x18\x01 \x01(\x08\"2\n\x11ModelReadyRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\"#\n\x12ModelReadyResponse\x12\r\n\x05ready\x18\x01 \x01(\x08\"\x17\n\x15ServerMetadataRequest\"K\n\x16ServerMetadataResponse\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\x12\x12\n\nextensions\x18\x03 \x03(\t\"5\n\x14ModelMetadataRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\"\x8d\x02\n\x15ModelMetadataResponse\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x10\n\x08versions\x18\x02 \x03(\t\x12\x10\n\x08platform\x18\x03 \x01(\t\x12?\n\x06inputs\x18\x04 \x03(\x0b\x32/.inference.ModelMetadataResponse.TensorMetadata\x12@\n\x07outputs\x18\x05 \x03(\x0b\x32/.inference.ModelMetadataResponse.TensorMetadata\x1a?\n\x0eTensorMetadata\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x10\n\x08\x64\x61tatype\x18\x02 \x01(\t\x12\r\n\x05shape\x18\x03 \x03(\x03\"\x99\x01\n\x0eInferParameter\x12\x14\n\nbool_param\x18\x01 \x01(\x08H\x00\x12\x15\n\x0bint64_param\x18\x02 \x01(\x03H\x00\x12\x16\n\x0cstring_param\x18\x03 \x01(\tH\x00\x12\x16\n\x0c\x64ouble_param\x18\x04 \x01(\x01H\x00\x12\x16\n\x0cuint64_param\x18\x05 \x01(\x04H\x00\x42\x12\n\x10parameter_choice\"\xd0\x01\n\x13InferTensorContents\x12\x15\n\rbool_contents\x18\x01 \x03(\x08\x12\x14\n\x0cint_contents\x18\x02 \x03(\x05\x12\x16\n\x0eint64_contents\x18\x03 \x03(\x03\x12\x15\n\ruint_contents\x18\x04 \x03(\r\x12\x17\n\x0fuint64_contents\x18\x05 \x03(\x04\x12\x15\n\rfp32_contents\x18\x06 \x03(\x02\x12\x15\n\rfp64_contents\x18\x07 \x03(\x01\x12\x16\n\x0e\x62ytes_contents\x18\x08 \x03(\x0c\"\xee\x06\n\x11ModelInferRequest\x12\x12\n\nmodel_name\x18\x01 \x01(\t\x12\x15\n\rmodel_version\x18\x02 
\x01(\t\x12\n\n\x02id\x18\x03 \x01(\t\x12@\n\nparameters\x18\x04 \x03(\x0b\x32,.inference.ModelInferRequest.ParametersEntry\x12=\n\x06inputs\x18\x05 \x03(\x0b\x32-.inference.ModelInferRequest.InferInputTensor\x12H\n\x07outputs\x18\x06 \x03(\x0b\x32\x37.inference.ModelInferRequest.InferRequestedOutputTensor\x12\x1a\n\x12raw_input_contents\x18\x07 \x03(\x0c\x1a\x94\x02\n\x10InferInputTensor\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x10\n\x08\x64\x61tatype\x18\x02 \x01(\t\x12\r\n\x05shape\x18\x03 \x03(\x03\x12Q\n\nparameters\x18\x04 \x03(\x0b\x32=.inference.ModelInferRequest.InferInputTensor.ParametersEntry\x12\x30\n\x08\x63ontents\x18\x05 \x01(\x0b\x32\x1e.inference.InferTensorContents\x1aL\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12(\n\x05value\x18\x02 \x01(\x0b\x32\x19.inference.InferParameter:\x02\x38\x01\x1a\xd5\x01\n\x1aInferRequestedOutputTensor\x12\x0c\n\x04name\x18\x01 \x01(\t\x12[\n\nparameters\x18\x02 \x03(\x0b\x32G.inference.ModelInferRequest.InferRequestedOutputTensor.ParametersEntry\x1aL\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12(\n\x05value\x18\x02 \x01(\x0b\x32\x19.inference.InferParameter:\x02\x38\x01\x1aL\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12(\n\x05value\x18\x02 \x01(\x0b\x32\x19.inference.InferParameter:\x02\x38\x01\"\xd5\x04\n\x12ModelInferResponse\x12\x12\n\nmodel_name\x18\x01 \x01(\t\x12\x15\n\rmodel_version\x18\x02 \x01(\t\x12\n\n\x02id\x18\x03 \x01(\t\x12\x41\n\nparameters\x18\x04 \x03(\x0b\x32-.inference.ModelInferResponse.ParametersEntry\x12@\n\x07outputs\x18\x05 \x03(\x0b\x32/.inference.ModelInferResponse.InferOutputTensor\x12\x1b\n\x13raw_output_contents\x18\x06 \x03(\x0c\x1a\x97\x02\n\x11InferOutputTensor\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x10\n\x08\x64\x61tatype\x18\x02 \x01(\t\x12\r\n\x05shape\x18\x03 \x03(\x03\x12S\n\nparameters\x18\x04 \x03(\x0b\x32?.inference.ModelInferResponse.InferOutputTensor.ParametersEntry\x12\x30\n\x08\x63ontents\x18\x05 
\x01(\x0b\x32\x1e.inference.InferTensorContents\x1aL\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12(\n\x05value\x18\x02 \x01(\x0b\x32\x19.inference.InferParameter:\x02\x38\x01\x1aL\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12(\n\x05value\x18\x02 \x01(\x0b\x32\x19.inference.InferParameter:\x02\x38\x01\"h\n\x18ModelStreamInferResponse\x12\x15\n\rerror_message\x18\x01 \x01(\t\x12\x35\n\x0einfer_response\x18\x02 \x01(\x0b\x32\x1d.inference.ModelInferResponse\"3\n\x12ModelConfigRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\"=\n\x13ModelConfigResponse\x12&\n\x06\x63onfig\x18\x01 \x01(\x0b\x32\x16.inference.ModelConfig\"7\n\x16ModelStatisticsRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\".\n\x11StatisticDuration\x12\r\n\x05\x63ount\x18\x01 \x01(\x04\x12\n\n\x02ns\x18\x02 \x01(\x04\"\x9c\x03\n\x0fInferStatistics\x12-\n\x07success\x18\x01 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12*\n\x04\x66\x61il\x18\x02 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12+\n\x05queue\x18\x03 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12\x33\n\rcompute_input\x18\x04 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12\x33\n\rcompute_infer\x18\x05 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12\x34\n\x0e\x63ompute_output\x18\x06 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12/\n\tcache_hit\x18\x07 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12\x30\n\ncache_miss\x18\x08 \x01(\x0b\x32\x1c.inference.StatisticDuration\"\xca\x01\n\x14InferBatchStatistics\x12\x12\n\nbatch_size\x18\x01 \x01(\x04\x12\x33\n\rcompute_input\x18\x02 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12\x33\n\rcompute_infer\x18\x03 \x01(\x0b\x32\x1c.inference.StatisticDuration\x12\x34\n\x0e\x63ompute_output\x18\x04 \x01(\x0b\x32\x1c.inference.StatisticDuration\":\n\x0bMemoryUsage\x12\x0c\n\x04type\x18\x01 \x01(\t\x12\n\n\x02id\x18\x02 \x01(\x03\x12\x11\n\tbyte_size\x18\x03 
\x01(\x04\"\x93\x02\n\x0fModelStatistics\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\x12\x16\n\x0elast_inference\x18\x03 \x01(\x04\x12\x17\n\x0finference_count\x18\x04 \x01(\x04\x12\x17\n\x0f\x65xecution_count\x18\x05 \x01(\x04\x12\x33\n\x0finference_stats\x18\x06 \x01(\x0b\x32\x1a.inference.InferStatistics\x12\x34\n\x0b\x62\x61tch_stats\x18\x07 \x03(\x0b\x32\x1f.inference.InferBatchStatistics\x12,\n\x0cmemory_usage\x18\x08 \x03(\x0b\x32\x16.inference.MemoryUsage\"J\n\x17ModelStatisticsResponse\x12/\n\x0bmodel_stats\x18\x01 \x03(\x0b\x32\x1a.inference.ModelStatistics\"\x8a\x01\n\x18ModelRepositoryParameter\x12\x14\n\nbool_param\x18\x01 \x01(\x08H\x00\x12\x15\n\x0bint64_param\x18\x02 \x01(\x03H\x00\x12\x16\n\x0cstring_param\x18\x03 \x01(\tH\x00\x12\x15\n\x0b\x62ytes_param\x18\x04 \x01(\x0cH\x00\x42\x12\n\x10parameter_choice\"@\n\x16RepositoryIndexRequest\x12\x17\n\x0frepository_name\x18\x01 \x01(\t\x12\r\n\x05ready\x18\x02 \x01(\x08\"\xa4\x01\n\x17RepositoryIndexResponse\x12=\n\x06models\x18\x01 \x03(\x0b\x32-.inference.RepositoryIndexResponse.ModelIndex\x1aJ\n\nModelIndex\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0f\n\x07version\x18\x02 \x01(\t\x12\r\n\x05state\x18\x03 \x01(\t\x12\x0e\n\x06reason\x18\x04 \x01(\t\"\xec\x01\n\x1aRepositoryModelLoadRequest\x12\x17\n\x0frepository_name\x18\x01 \x01(\t\x12\x12\n\nmodel_name\x18\x02 \x01(\t\x12I\n\nparameters\x18\x03 \x03(\x0b\x32\x35.inference.RepositoryModelLoadRequest.ParametersEntry\x1aV\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\x32\n\x05value\x18\x02 \x01(\x0b\x32#.inference.ModelRepositoryParameter:\x02\x38\x01\"\x1d\n\x1bRepositoryModelLoadResponse\"\xf0\x01\n\x1cRepositoryModelUnloadRequest\x12\x17\n\x0frepository_name\x18\x01 \x01(\t\x12\x12\n\nmodel_name\x18\x02 \x01(\t\x12K\n\nparameters\x18\x03 \x03(\x0b\x32\x37.inference.RepositoryModelUnloadRequest.ParametersEntry\x1aV\n\x0fParametersEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\x32\n\x05value\x18\x02 
\x01(\x0b\x32#.inference.ModelRepositoryParameter:\x02\x38\x01\"\x1f\n\x1dRepositoryModelUnloadResponse\"/\n\x1fSystemSharedMemoryStatusRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\"\xa5\x02\n SystemSharedMemoryStatusResponse\x12I\n\x07regions\x18\x01 \x03(\x0b\x32\x38.inference.SystemSharedMemoryStatusResponse.RegionsEntry\x1aL\n\x0cRegionStatus\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0b\n\x03key\x18\x02 \x01(\t\x12\x0e\n\x06offset\x18\x03 \x01(\x04\x12\x11\n\tbyte_size\x18\x04 \x01(\x04\x1ah\n\x0cRegionsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12G\n\x05value\x18\x02 \x01(\x0b\x32\x38.inference.SystemSharedMemoryStatusResponse.RegionStatus:\x02\x38\x01\"a\n!SystemSharedMemoryRegisterRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0b\n\x03key\x18\x02 \x01(\t\x12\x0e\n\x06offset\x18\x03 \x01(\x04\x12\x11\n\tbyte_size\x18\x04 \x01(\x04\"$\n\"SystemSharedMemoryRegisterResponse\"3\n#SystemSharedMemoryUnregisterRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\"&\n$SystemSharedMemoryUnregisterResponse\"-\n\x1d\x43udaSharedMemoryStatusRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\"\x95\x02\n\x1e\x43udaSharedMemoryStatusResponse\x12G\n\x07regions\x18\x01 \x03(\x0b\x32\x36.inference.CudaSharedMemoryStatusResponse.RegionsEntry\x1a\x42\n\x0cRegionStatus\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x11\n\tdevice_id\x18\x02 \x01(\x04\x12\x11\n\tbyte_size\x18\x03 \x01(\x04\x1a\x66\n\x0cRegionsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\x45\n\x05value\x18\x02 \x01(\x0b\x32\x36.inference.CudaSharedMemoryStatusResponse.RegionStatus:\x02\x38\x01\"i\n\x1f\x43udaSharedMemoryRegisterRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x12\n\nraw_handle\x18\x02 \x01(\x0c\x12\x11\n\tdevice_id\x18\x03 \x01(\x03\x12\x11\n\tbyte_size\x18\x04 \x01(\x04\"\"\n CudaSharedMemoryRegisterResponse\"1\n!CudaSharedMemoryUnregisterRequest\x12\x0c\n\x04name\x18\x01 \x01(\t\"$\n\"CudaSharedMemoryUnregisterResponse\"\xe6\x01\n\x13TraceSettingRequest\x12>\n\x08settings\x18\x01 
\x03(\x0b\x32,.inference.TraceSettingRequest.SettingsEntry\x12\x12\n\nmodel_name\x18\x02 \x01(\t\x1a\x1d\n\x0cSettingValue\x12\r\n\x05value\x18\x01 \x03(\t\x1a\\\n\rSettingsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12:\n\x05value\x18\x02 \x01(\x0b\x32+.inference.TraceSettingRequest.SettingValue:\x02\x38\x01\"\xd5\x01\n\x14TraceSettingResponse\x12?\n\x08settings\x18\x01 \x03(\x0b\x32-.inference.TraceSettingResponse.SettingsEntry\x1a\x1d\n\x0cSettingValue\x12\r\n\x05value\x18\x01 \x03(\t\x1a]\n\rSettingsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12;\n\x05value\x18\x02 \x01(\x0b\x32,.inference.TraceSettingResponse.SettingValue:\x02\x38\x01\"\x9a\x02\n\x12LogSettingsRequest\x12=\n\x08settings\x18\x01 \x03(\x0b\x32+.inference.LogSettingsRequest.SettingsEntry\x1ah\n\x0cSettingValue\x12\x14\n\nbool_param\x18\x01 \x01(\x08H\x00\x12\x16\n\x0cuint32_param\x18\x02 \x01(\rH\x00\x12\x16\n\x0cstring_param\x18\x03 \x01(\tH\x00\x42\x12\n\x10parameter_choice\x1a[\n\rSettingsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\x39\n\x05value\x18\x02 \x01(\x0b\x32*.inference.LogSettingsRequest.SettingValue:\x02\x38\x01\"\x9d\x02\n\x13LogSettingsResponse\x12>\n\x08settings\x18\x01 \x03(\x0b\x32,.inference.LogSettingsResponse.SettingsEntry\x1ah\n\x0cSettingValue\x12\x14\n\nbool_param\x18\x01 \x01(\x08H\x00\x12\x16\n\x0cuint32_param\x18\x02 \x01(\rH\x00\x12\x16\n\x0cstring_param\x18\x03 \x01(\tH\x00\x42\x12\n\x10parameter_choice\x1a\\\n\rSettingsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12:\n\x05value\x18\x02 \x01(\x0b\x32+.inference.LogSettingsResponse.SettingValue:\x02\x38\x01\x32\xb7\x0f\n\x14GRPCInferenceService\x12K\n\nServerLive\x12\x1c.inference.ServerLiveRequest\x1a\x1d.inference.ServerLiveResponse\"\x00\x12N\n\x0bServerReady\x12\x1d.inference.ServerReadyRequest\x1a\x1e.inference.ServerReadyResponse\"\x00\x12K\n\nModelReady\x12\x1c.inference.ModelReadyRequest\x1a\x1d.inference.ModelReadyResponse\"\x00\x12W\n\x0eServerMetadata\x12 
.inference.ServerMetadataRequest\x1a!.inference.ServerMetadataResponse\"\x00\x12T\n\rModelMetadata\x12\x1f.inference.ModelMetadataRequest\x1a .inference.ModelMetadataResponse\"\x00\x12K\n\nModelInfer\x12\x1c.inference.ModelInferRequest\x1a\x1d.inference.ModelInferResponse\"\x00\x12[\n\x10ModelStreamInfer\x12\x1c.inference.ModelInferRequest\x1a#.inference.ModelStreamInferResponse\"\x00(\x01\x30\x01\x12N\n\x0bModelConfig\x12\x1d.inference.ModelConfigRequest\x1a\x1e.inference.ModelConfigResponse\"\x00\x12Z\n\x0fModelStatistics\x12!.inference.ModelStatisticsRequest\x1a\".inference.ModelStatisticsResponse\"\x00\x12Z\n\x0fRepositoryIndex\x12!.inference.RepositoryIndexRequest\x1a\".inference.RepositoryIndexResponse\"\x00\x12\x66\n\x13RepositoryModelLoad\x12%.inference.RepositoryModelLoadRequest\x1a&.inference.RepositoryModelLoadResponse\"\x00\x12l\n\x15RepositoryModelUnload\x12\'.inference.RepositoryModelUnloadRequest\x1a(.inference.RepositoryModelUnloadResponse\"\x00\x12u\n\x18SystemSharedMemoryStatus\x12*.inference.SystemSharedMemoryStatusRequest\x1a+.inference.SystemSharedMemoryStatusResponse\"\x00\x12{\n\x1aSystemSharedMemoryRegister\x12,.inference.SystemSharedMemoryRegisterRequest\x1a-.inference.SystemSharedMemoryRegisterResponse\"\x00\x12\x81\x01\n\x1cSystemSharedMemoryUnregister\x12..inference.SystemSharedMemoryUnregisterRequest\x1a/.inference.SystemSharedMemoryUnregisterResponse\"\x00\x12o\n\x16\x43udaSharedMemoryStatus\x12(.inference.CudaSharedMemoryStatusRequest\x1a).inference.CudaSharedMemoryStatusResponse\"\x00\x12u\n\x18\x43udaSharedMemoryRegister\x12*.inference.CudaSharedMemoryRegisterRequest\x1a+.inference.CudaSharedMemoryRegisterResponse\"\x00\x12{\n\x1a\x43udaSharedMemoryUnregister\x12,.inference.CudaSharedMemoryUnregisterRequest\x1a-.inference.CudaSharedMemoryUnregisterResponse\"\x00\x12Q\n\x0cTraceSetting\x12\x1e.inference.TraceSettingRequest\x1a\x1f.inference.TraceSettingResponse\"\x00\x12N\n\x0bLogSettings\x12\x1d.inference.LogSettingsRequest\x1a\x1e.i
nference.LogSettingsResponse\"\x00\x62\x06proto3')
|
|
19
19
|
|
|
20
20
|
|
|
21
21
|
|
|
@@ -49,6 +49,7 @@ _MODELSTATISTICSREQUEST = DESCRIPTOR.message_types_by_name['ModelStatisticsReque
|
|
|
49
49
|
_STATISTICDURATION = DESCRIPTOR.message_types_by_name['StatisticDuration']
|
|
50
50
|
_INFERSTATISTICS = DESCRIPTOR.message_types_by_name['InferStatistics']
|
|
51
51
|
_INFERBATCHSTATISTICS = DESCRIPTOR.message_types_by_name['InferBatchStatistics']
|
|
52
|
+
_MEMORYUSAGE = DESCRIPTOR.message_types_by_name['MemoryUsage']
|
|
52
53
|
_MODELSTATISTICS = DESCRIPTOR.message_types_by_name['ModelStatistics']
|
|
53
54
|
_MODELSTATISTICSRESPONSE = DESCRIPTOR.message_types_by_name['ModelStatisticsResponse']
|
|
54
55
|
_MODELREPOSITORYPARAMETER = DESCRIPTOR.message_types_by_name['ModelRepositoryParameter']
|
|
@@ -308,6 +309,13 @@ InferBatchStatistics = _reflection.GeneratedProtocolMessageType('InferBatchStati
|
|
|
308
309
|
})
|
|
309
310
|
_sym_db.RegisterMessage(InferBatchStatistics)
|
|
310
311
|
|
|
312
|
+
MemoryUsage = _reflection.GeneratedProtocolMessageType('MemoryUsage', (_message.Message,), {
|
|
313
|
+
'DESCRIPTOR' : _MEMORYUSAGE,
|
|
314
|
+
'__module__' : 'grpc_service_pb2'
|
|
315
|
+
# @@protoc_insertion_point(class_scope:inference.MemoryUsage)
|
|
316
|
+
})
|
|
317
|
+
_sym_db.RegisterMessage(MemoryUsage)
|
|
318
|
+
|
|
311
319
|
ModelStatistics = _reflection.GeneratedProtocolMessageType('ModelStatistics', (_message.Message,), {
|
|
312
320
|
'DESCRIPTOR' : _MODELSTATISTICS,
|
|
313
321
|
'__module__' : 'grpc_service_pb2'
|
|
@@ -655,124 +663,126 @@ if _descriptor._USE_C_DESCRIPTORS == False:
|
|
|
655
663
|
_MODELMETADATARESPONSE._serialized_end=686
|
|
656
664
|
_MODELMETADATARESPONSE_TENSORMETADATA._serialized_start=623
|
|
657
665
|
_MODELMETADATARESPONSE_TENSORMETADATA._serialized_end=686
|
|
658
|
-
_INFERPARAMETER._serialized_start=
|
|
659
|
-
_INFERPARAMETER._serialized_end=
|
|
660
|
-
_INFERTENSORCONTENTS._serialized_start=
|
|
661
|
-
_INFERTENSORCONTENTS._serialized_end=
|
|
662
|
-
_MODELINFERREQUEST._serialized_start=
|
|
663
|
-
_MODELINFERREQUEST._serialized_end=
|
|
664
|
-
_MODELINFERREQUEST_INFERINPUTTENSOR._serialized_start=
|
|
665
|
-
_MODELINFERREQUEST_INFERINPUTTENSOR._serialized_end=
|
|
666
|
-
_MODELINFERREQUEST_INFERINPUTTENSOR_PARAMETERSENTRY._serialized_start=
|
|
667
|
-
_MODELINFERREQUEST_INFERINPUTTENSOR_PARAMETERSENTRY._serialized_end=
|
|
668
|
-
_MODELINFERREQUEST_INFERREQUESTEDOUTPUTTENSOR._serialized_start=
|
|
669
|
-
_MODELINFERREQUEST_INFERREQUESTEDOUTPUTTENSOR._serialized_end=
|
|
670
|
-
_MODELINFERREQUEST_INFERREQUESTEDOUTPUTTENSOR_PARAMETERSENTRY._serialized_start=
|
|
671
|
-
_MODELINFERREQUEST_INFERREQUESTEDOUTPUTTENSOR_PARAMETERSENTRY._serialized_end=
|
|
672
|
-
_MODELINFERREQUEST_PARAMETERSENTRY._serialized_start=
|
|
673
|
-
_MODELINFERREQUEST_PARAMETERSENTRY._serialized_end=
|
|
674
|
-
_MODELINFERRESPONSE._serialized_start=
|
|
675
|
-
_MODELINFERRESPONSE._serialized_end=
|
|
676
|
-
_MODELINFERRESPONSE_INFEROUTPUTTENSOR._serialized_start=
|
|
677
|
-
_MODELINFERRESPONSE_INFEROUTPUTTENSOR._serialized_end=
|
|
678
|
-
_MODELINFERRESPONSE_INFEROUTPUTTENSOR_PARAMETERSENTRY._serialized_start=
|
|
679
|
-
_MODELINFERRESPONSE_INFEROUTPUTTENSOR_PARAMETERSENTRY._serialized_end=
|
|
680
|
-
_MODELINFERRESPONSE_PARAMETERSENTRY._serialized_start=
|
|
681
|
-
_MODELINFERRESPONSE_PARAMETERSENTRY._serialized_end=
|
|
682
|
-
_MODELSTREAMINFERRESPONSE._serialized_start=
|
|
683
|
-
_MODELSTREAMINFERRESPONSE._serialized_end=
|
|
684
|
-
_MODELCONFIGREQUEST._serialized_start=
|
|
685
|
-
_MODELCONFIGREQUEST._serialized_end=
|
|
686
|
-
_MODELCONFIGRESPONSE._serialized_start=
|
|
687
|
-
_MODELCONFIGRESPONSE._serialized_end=
|
|
688
|
-
_MODELSTATISTICSREQUEST._serialized_start=
|
|
689
|
-
_MODELSTATISTICSREQUEST._serialized_end=
|
|
690
|
-
_STATISTICDURATION._serialized_start=
|
|
691
|
-
_STATISTICDURATION._serialized_end=
|
|
692
|
-
_INFERSTATISTICS._serialized_start=
|
|
693
|
-
_INFERSTATISTICS._serialized_end=
|
|
694
|
-
_INFERBATCHSTATISTICS._serialized_start=
|
|
695
|
-
_INFERBATCHSTATISTICS._serialized_end=
|
|
696
|
-
|
|
697
|
-
|
|
698
|
-
|
|
699
|
-
|
|
700
|
-
|
|
701
|
-
|
|
702
|
-
|
|
703
|
-
|
|
704
|
-
|
|
705
|
-
|
|
706
|
-
|
|
707
|
-
|
|
708
|
-
|
|
709
|
-
|
|
710
|
-
|
|
711
|
-
|
|
712
|
-
|
|
713
|
-
|
|
714
|
-
|
|
715
|
-
|
|
716
|
-
|
|
717
|
-
|
|
718
|
-
|
|
719
|
-
|
|
720
|
-
|
|
721
|
-
|
|
722
|
-
|
|
723
|
-
|
|
724
|
-
|
|
725
|
-
|
|
726
|
-
|
|
727
|
-
|
|
728
|
-
|
|
729
|
-
|
|
730
|
-
|
|
731
|
-
|
|
732
|
-
|
|
733
|
-
|
|
734
|
-
|
|
735
|
-
|
|
736
|
-
|
|
737
|
-
|
|
738
|
-
|
|
739
|
-
|
|
740
|
-
|
|
741
|
-
|
|
742
|
-
|
|
743
|
-
|
|
744
|
-
|
|
745
|
-
|
|
746
|
-
|
|
747
|
-
|
|
748
|
-
|
|
749
|
-
|
|
750
|
-
|
|
751
|
-
|
|
752
|
-
|
|
753
|
-
|
|
754
|
-
|
|
755
|
-
|
|
756
|
-
|
|
757
|
-
|
|
758
|
-
|
|
759
|
-
|
|
760
|
-
|
|
761
|
-
|
|
762
|
-
|
|
763
|
-
|
|
764
|
-
|
|
765
|
-
|
|
766
|
-
|
|
767
|
-
|
|
768
|
-
|
|
769
|
-
|
|
770
|
-
|
|
771
|
-
|
|
772
|
-
|
|
773
|
-
|
|
774
|
-
|
|
775
|
-
|
|
776
|
-
|
|
777
|
-
|
|
666
|
+
_INFERPARAMETER._serialized_start=689
|
|
667
|
+
_INFERPARAMETER._serialized_end=842
|
|
668
|
+
_INFERTENSORCONTENTS._serialized_start=845
|
|
669
|
+
_INFERTENSORCONTENTS._serialized_end=1053
|
|
670
|
+
_MODELINFERREQUEST._serialized_start=1056
|
|
671
|
+
_MODELINFERREQUEST._serialized_end=1934
|
|
672
|
+
_MODELINFERREQUEST_INFERINPUTTENSOR._serialized_start=1364
|
|
673
|
+
_MODELINFERREQUEST_INFERINPUTTENSOR._serialized_end=1640
|
|
674
|
+
_MODELINFERREQUEST_INFERINPUTTENSOR_PARAMETERSENTRY._serialized_start=1564
|
|
675
|
+
_MODELINFERREQUEST_INFERINPUTTENSOR_PARAMETERSENTRY._serialized_end=1640
|
|
676
|
+
_MODELINFERREQUEST_INFERREQUESTEDOUTPUTTENSOR._serialized_start=1643
|
|
677
|
+
_MODELINFERREQUEST_INFERREQUESTEDOUTPUTTENSOR._serialized_end=1856
|
|
678
|
+
_MODELINFERREQUEST_INFERREQUESTEDOUTPUTTENSOR_PARAMETERSENTRY._serialized_start=1564
|
|
679
|
+
_MODELINFERREQUEST_INFERREQUESTEDOUTPUTTENSOR_PARAMETERSENTRY._serialized_end=1640
|
|
680
|
+
_MODELINFERREQUEST_PARAMETERSENTRY._serialized_start=1564
|
|
681
|
+
_MODELINFERREQUEST_PARAMETERSENTRY._serialized_end=1640
|
|
682
|
+
_MODELINFERRESPONSE._serialized_start=1937
|
|
683
|
+
_MODELINFERRESPONSE._serialized_end=2534
|
|
684
|
+
_MODELINFERRESPONSE_INFEROUTPUTTENSOR._serialized_start=2177
|
|
685
|
+
_MODELINFERRESPONSE_INFEROUTPUTTENSOR._serialized_end=2456
|
|
686
|
+
_MODELINFERRESPONSE_INFEROUTPUTTENSOR_PARAMETERSENTRY._serialized_start=1564
|
|
687
|
+
_MODELINFERRESPONSE_INFEROUTPUTTENSOR_PARAMETERSENTRY._serialized_end=1640
|
|
688
|
+
_MODELINFERRESPONSE_PARAMETERSENTRY._serialized_start=1564
|
|
689
|
+
_MODELINFERRESPONSE_PARAMETERSENTRY._serialized_end=1640
|
|
690
|
+
_MODELSTREAMINFERRESPONSE._serialized_start=2536
|
|
691
|
+
_MODELSTREAMINFERRESPONSE._serialized_end=2640
|
|
692
|
+
_MODELCONFIGREQUEST._serialized_start=2642
|
|
693
|
+
_MODELCONFIGREQUEST._serialized_end=2693
|
|
694
|
+
_MODELCONFIGRESPONSE._serialized_start=2695
|
|
695
|
+
_MODELCONFIGRESPONSE._serialized_end=2756
|
|
696
|
+
_MODELSTATISTICSREQUEST._serialized_start=2758
|
|
697
|
+
_MODELSTATISTICSREQUEST._serialized_end=2813
|
|
698
|
+
_STATISTICDURATION._serialized_start=2815
|
|
699
|
+
_STATISTICDURATION._serialized_end=2861
|
|
700
|
+
_INFERSTATISTICS._serialized_start=2864
|
|
701
|
+
_INFERSTATISTICS._serialized_end=3276
|
|
702
|
+
_INFERBATCHSTATISTICS._serialized_start=3279
|
|
703
|
+
_INFERBATCHSTATISTICS._serialized_end=3481
|
|
704
|
+
_MEMORYUSAGE._serialized_start=3483
|
|
705
|
+
_MEMORYUSAGE._serialized_end=3541
|
|
706
|
+
_MODELSTATISTICS._serialized_start=3544
|
|
707
|
+
_MODELSTATISTICS._serialized_end=3819
|
|
708
|
+
_MODELSTATISTICSRESPONSE._serialized_start=3821
|
|
709
|
+
_MODELSTATISTICSRESPONSE._serialized_end=3895
|
|
710
|
+
_MODELREPOSITORYPARAMETER._serialized_start=3898
|
|
711
|
+
_MODELREPOSITORYPARAMETER._serialized_end=4036
|
|
712
|
+
_REPOSITORYINDEXREQUEST._serialized_start=4038
|
|
713
|
+
_REPOSITORYINDEXREQUEST._serialized_end=4102
|
|
714
|
+
_REPOSITORYINDEXRESPONSE._serialized_start=4105
|
|
715
|
+
_REPOSITORYINDEXRESPONSE._serialized_end=4269
|
|
716
|
+
_REPOSITORYINDEXRESPONSE_MODELINDEX._serialized_start=4195
|
|
717
|
+
_REPOSITORYINDEXRESPONSE_MODELINDEX._serialized_end=4269
|
|
718
|
+
_REPOSITORYMODELLOADREQUEST._serialized_start=4272
|
|
719
|
+
_REPOSITORYMODELLOADREQUEST._serialized_end=4508
|
|
720
|
+
_REPOSITORYMODELLOADREQUEST_PARAMETERSENTRY._serialized_start=4422
|
|
721
|
+
_REPOSITORYMODELLOADREQUEST_PARAMETERSENTRY._serialized_end=4508
|
|
722
|
+
_REPOSITORYMODELLOADRESPONSE._serialized_start=4510
|
|
723
|
+
_REPOSITORYMODELLOADRESPONSE._serialized_end=4539
|
|
724
|
+
_REPOSITORYMODELUNLOADREQUEST._serialized_start=4542
|
|
725
|
+
_REPOSITORYMODELUNLOADREQUEST._serialized_end=4782
|
|
726
|
+
_REPOSITORYMODELUNLOADREQUEST_PARAMETERSENTRY._serialized_start=4422
|
|
727
|
+
_REPOSITORYMODELUNLOADREQUEST_PARAMETERSENTRY._serialized_end=4508
|
|
728
|
+
_REPOSITORYMODELUNLOADRESPONSE._serialized_start=4784
|
|
729
|
+
_REPOSITORYMODELUNLOADRESPONSE._serialized_end=4815
|
|
730
|
+
_SYSTEMSHAREDMEMORYSTATUSREQUEST._serialized_start=4817
|
|
731
|
+
_SYSTEMSHAREDMEMORYSTATUSREQUEST._serialized_end=4864
|
|
732
|
+
_SYSTEMSHAREDMEMORYSTATUSRESPONSE._serialized_start=4867
|
|
733
|
+
_SYSTEMSHAREDMEMORYSTATUSRESPONSE._serialized_end=5160
|
|
734
|
+
_SYSTEMSHAREDMEMORYSTATUSRESPONSE_REGIONSTATUS._serialized_start=4978
|
|
735
|
+
_SYSTEMSHAREDMEMORYSTATUSRESPONSE_REGIONSTATUS._serialized_end=5054
|
|
736
|
+
_SYSTEMSHAREDMEMORYSTATUSRESPONSE_REGIONSENTRY._serialized_start=5056
|
|
737
|
+
_SYSTEMSHAREDMEMORYSTATUSRESPONSE_REGIONSENTRY._serialized_end=5160
|
|
738
|
+
_SYSTEMSHAREDMEMORYREGISTERREQUEST._serialized_start=5162
|
|
739
|
+
_SYSTEMSHAREDMEMORYREGISTERREQUEST._serialized_end=5259
|
|
740
|
+
_SYSTEMSHAREDMEMORYREGISTERRESPONSE._serialized_start=5261
|
|
741
|
+
_SYSTEMSHAREDMEMORYREGISTERRESPONSE._serialized_end=5297
|
|
742
|
+
_SYSTEMSHAREDMEMORYUNREGISTERREQUEST._serialized_start=5299
|
|
743
|
+
_SYSTEMSHAREDMEMORYUNREGISTERREQUEST._serialized_end=5350
|
|
744
|
+
_SYSTEMSHAREDMEMORYUNREGISTERRESPONSE._serialized_start=5352
|
|
745
|
+
_SYSTEMSHAREDMEMORYUNREGISTERRESPONSE._serialized_end=5390
|
|
746
|
+
_CUDASHAREDMEMORYSTATUSREQUEST._serialized_start=5392
|
|
747
|
+
_CUDASHAREDMEMORYSTATUSREQUEST._serialized_end=5437
|
|
748
|
+
_CUDASHAREDMEMORYSTATUSRESPONSE._serialized_start=5440
|
|
749
|
+
_CUDASHAREDMEMORYSTATUSRESPONSE._serialized_end=5717
|
|
750
|
+
_CUDASHAREDMEMORYSTATUSRESPONSE_REGIONSTATUS._serialized_start=5547
|
|
751
|
+
_CUDASHAREDMEMORYSTATUSRESPONSE_REGIONSTATUS._serialized_end=5613
|
|
752
|
+
_CUDASHAREDMEMORYSTATUSRESPONSE_REGIONSENTRY._serialized_start=5615
|
|
753
|
+
_CUDASHAREDMEMORYSTATUSRESPONSE_REGIONSENTRY._serialized_end=5717
|
|
754
|
+
_CUDASHAREDMEMORYREGISTERREQUEST._serialized_start=5719
|
|
755
|
+
_CUDASHAREDMEMORYREGISTERREQUEST._serialized_end=5824
|
|
756
|
+
_CUDASHAREDMEMORYREGISTERRESPONSE._serialized_start=5826
|
|
757
|
+
_CUDASHAREDMEMORYREGISTERRESPONSE._serialized_end=5860
|
|
758
|
+
_CUDASHAREDMEMORYUNREGISTERREQUEST._serialized_start=5862
|
|
759
|
+
_CUDASHAREDMEMORYUNREGISTERREQUEST._serialized_end=5911
|
|
760
|
+
_CUDASHAREDMEMORYUNREGISTERRESPONSE._serialized_start=5913
|
|
761
|
+
_CUDASHAREDMEMORYUNREGISTERRESPONSE._serialized_end=5949
|
|
762
|
+
_TRACESETTINGREQUEST._serialized_start=5952
|
|
763
|
+
_TRACESETTINGREQUEST._serialized_end=6182
|
|
764
|
+
_TRACESETTINGREQUEST_SETTINGVALUE._serialized_start=6059
|
|
765
|
+
_TRACESETTINGREQUEST_SETTINGVALUE._serialized_end=6088
|
|
766
|
+
_TRACESETTINGREQUEST_SETTINGSENTRY._serialized_start=6090
|
|
767
|
+
_TRACESETTINGREQUEST_SETTINGSENTRY._serialized_end=6182
|
|
768
|
+
_TRACESETTINGRESPONSE._serialized_start=6185
|
|
769
|
+
_TRACESETTINGRESPONSE._serialized_end=6398
|
|
770
|
+
_TRACESETTINGRESPONSE_SETTINGVALUE._serialized_start=6059
|
|
771
|
+
_TRACESETTINGRESPONSE_SETTINGVALUE._serialized_end=6088
|
|
772
|
+
_TRACESETTINGRESPONSE_SETTINGSENTRY._serialized_start=6305
|
|
773
|
+
_TRACESETTINGRESPONSE_SETTINGSENTRY._serialized_end=6398
|
|
774
|
+
_LOGSETTINGSREQUEST._serialized_start=6401
|
|
775
|
+
_LOGSETTINGSREQUEST._serialized_end=6683
|
|
776
|
+
_LOGSETTINGSREQUEST_SETTINGVALUE._serialized_start=6486
|
|
777
|
+
_LOGSETTINGSREQUEST_SETTINGVALUE._serialized_end=6590
|
|
778
|
+
_LOGSETTINGSREQUEST_SETTINGSENTRY._serialized_start=6592
|
|
779
|
+
_LOGSETTINGSREQUEST_SETTINGSENTRY._serialized_end=6683
|
|
780
|
+
_LOGSETTINGSRESPONSE._serialized_start=6686
|
|
781
|
+
_LOGSETTINGSRESPONSE._serialized_end=6971
|
|
782
|
+
_LOGSETTINGSRESPONSE_SETTINGVALUE._serialized_start=6486
|
|
783
|
+
_LOGSETTINGSRESPONSE_SETTINGVALUE._serialized_end=6590
|
|
784
|
+
_LOGSETTINGSRESPONSE_SETTINGSENTRY._serialized_start=6879
|
|
785
|
+
_LOGSETTINGSRESPONSE_SETTINGSENTRY._serialized_end=6971
|
|
786
|
+
_GRPCINFERENCESERVICE._serialized_start=6974
|
|
787
|
+
_GRPCINFERENCESERVICE._serialized_end=8949
|
|
778
788
|
# @@protoc_insertion_point(module_scope)
|
|
@@ -0,0 +1,266 @@
|
|
|
1
|
+
# Copyright 2023, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
#
|
|
3
|
+
# Redistribution and use in source and binary forms, with or without
|
|
4
|
+
# modification, are permitted provided that the following conditions
|
|
5
|
+
# are met:
|
|
6
|
+
# * Redistributions of source code must retain the above copyright
|
|
7
|
+
# notice, this list of conditions and the following disclaimer.
|
|
8
|
+
# * Redistributions in binary form must reproduce the above copyright
|
|
9
|
+
# notice, this list of conditions and the following disclaimer in the
|
|
10
|
+
# documentation and/or other materials provided with the distribution.
|
|
11
|
+
# * Neither the name of NVIDIA CORPORATION nor the names of its
|
|
12
|
+
# contributors may be used to endorse or promote products derived
|
|
13
|
+
# from this software without specific prior written permission.
|
|
14
|
+
#
|
|
15
|
+
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS ``AS IS'' AND ANY
|
|
16
|
+
# EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
17
|
+
# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
|
|
18
|
+
# PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
|
|
19
|
+
# CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
|
|
20
|
+
# EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
|
|
21
|
+
# PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
|
|
22
|
+
# PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
|
|
23
|
+
# OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
24
|
+
# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
|
25
|
+
# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
26
|
+
|
|
27
|
+
################################################################################
|
|
28
|
+
# This file contains the DLPack API wrapped in Python style (see
|
|
29
|
+
# 'dlpack.h' for detail) and the utilities for Triton client to interact
|
|
30
|
+
# with DLPack
|
|
31
|
+
#
|
|
32
|
+
# Ref:
|
|
33
|
+
# https://github.com/dmlc/dlpack/blob/main/include/dlpack/dlpack.h
|
|
34
|
+
# https://github.com/dmlc/dlpack/blob/main/apps/numpy_dlpack/dlpack/from_numpy.py
|
|
35
|
+
################################################################################
|
|
36
|
+
|
|
37
|
+
import ctypes
|
|
38
|
+
|
|
39
|
+
# Need to explicitly set the res / arg types for pythonapi functions to
|
|
40
|
+
# work properly
|
|
41
|
+
ctypes.pythonapi.PyMem_RawMalloc.restype = ctypes.c_void_p
|
|
42
|
+
ctypes.pythonapi.PyMem_RawFree.argtypes = [ctypes.c_void_p]
|
|
43
|
+
|
|
44
|
+
ctypes.pythonapi.PyCapsule_New.restype = ctypes.py_object
|
|
45
|
+
ctypes.pythonapi.PyCapsule_New.argtypes = [
|
|
46
|
+
ctypes.c_void_p, ctypes.c_char_p, ctypes.c_void_p
|
|
47
|
+
]
|
|
48
|
+
|
|
49
|
+
ctypes.pythonapi.PyCapsule_GetPointer.restype = ctypes.c_void_p
|
|
50
|
+
ctypes.pythonapi.PyCapsule_GetPointer.argtypes = [
|
|
51
|
+
ctypes.py_object, ctypes.c_char_p
|
|
52
|
+
]
|
|
53
|
+
|
|
54
|
+
c_str_dltensor = b"dltensor"
|
|
55
|
+
|
|
56
|
+
|
|
57
|
+
class DLDeviceType(ctypes.c_int):
    """Integer codes for DLPack device types (see 'dlpack.h').

    The codes are plain class attributes on a ``ctypes.c_int`` subclass,
    so the class can be used both as a namespace for the constants and
    as the ctypes field type for a device-type member.
    """

    # CPU and CUDA flavours
    kDLCPU = 1
    kDLCUDA = 2
    kDLCUDAHost = 3

    # Other device types
    kDLOpenCL = 4
    kDLVulkan = 7
    kDLMetal = 8
    kDLVPI = 9
    kDLROCM = 10
    kDLROCMHost = 11
    kDLExtDev = 12
    kDLCUDAManaged = 13
    kDLOneAPI = 14
    kDLWebGPU = 15
    kDLHexagon = 16
|
|
72
|
+
|
|
73
|
+
|
|
74
|
+
class DLDevice(ctypes.Structure):
    """ctypes layout of a DLPack device: a device type plus a device id."""

    _fields_ = [
        # One of the DLDeviceType codes
        ("device_type", DLDeviceType),
        # Index of the device within its type
        ("device_id", ctypes.c_int),
    ]
|
|
79
|
+
|
|
80
|
+
|
|
81
|
+
class DLDataTypeCode(ctypes.c_uint8):
    """Integer codes for DLPack data type categories (see 'dlpack.h').

    Stored as class attributes on a ``ctypes.c_uint8`` subclass so the
    class doubles as the ctypes field type for a type-code member.
    """

    # Integer categories
    kDLInt = 0
    kDLUInt = 1

    # Floating point, pointer, and remaining categories
    kDLFloat = 2
    kDLOpaquePointer = 3
    kDLBfloat = 4
    kDLComplex = 5
    kDLBool = 6
|
|
89
|
+
|
|
90
|
+
|
|
91
|
+
class DLDataType(ctypes.Structure):
    """ctypes layout of a DLPack data type: type code, bit width and lanes."""

    _fields_ = [
        # One of the DLDataTypeCode codes
        ("type_code", DLDataTypeCode),
        # Number of bits of a single lane
        ("bits", ctypes.c_uint8),
        # Number of lanes of the type
        ("lanes", ctypes.c_uint16),
    ]
|
|
97
|
+
|
|
98
|
+
|
|
99
|
+
class DLTensor(ctypes.Structure):
    """ctypes layout of a DLPack tensor descriptor.

    Field order matters: it defines the in-memory layout shared with
    whatever consumes the DLPack capsule.
    """

    _fields_ = [
        # Address of the tensor data
        ("data", ctypes.c_void_p),
        # Device the data lives on
        ("device", DLDevice),
        # Number of dimensions
        ("ndim", ctypes.c_int),
        # Element data type
        ("dtype", DLDataType),
        # Pointer to 'ndim' extents
        ("shape", ctypes.POINTER(ctypes.c_int64)),
        # Pointer to 'ndim' strides; may be a null pointer
        ("strides", ctypes.POINTER(ctypes.c_int64)),
        # Offset in bytes applied to 'data'
        ("byte_offset", ctypes.c_uint64),
    ]
|
|
109
|
+
|
|
110
|
+
|
|
111
|
+
class DLManagedTensor(ctypes.Structure):
    """ctypes layout of a DLPack managed tensor.

    Bundles the tensor descriptor with an opaque manager context and the
    callback used to release the managed tensor.
    """

    _fields_ = [
        # The tensor being shared
        ("dl_tensor", DLTensor),
        # Opaque pointer handed back to 'deleter' through this struct
        ("manager_ctx", ctypes.c_void_p),
        # Callback taking the address of this struct
        ("deleter", ctypes.CFUNCTYPE(None, ctypes.c_void_p)),
    ]
|
|
117
|
+
|
|
118
|
+
|
|
119
|
+
# Utilities
|
|
120
|
+
|
|
121
|
+
|
|
122
|
+
def _raise_error(msg):
|
|
123
|
+
"""
|
|
124
|
+
Raise error with the provided message
|
|
125
|
+
"""
|
|
126
|
+
raise Exception(msg=msg) from None
|
|
127
|
+
|
|
128
|
+
|
|
129
|
+
# Use as managed context in DLPack that doesn't hold ownership of the
|
|
130
|
+
# data content.
|
|
131
|
+
class DataViewContext:
    """Manager context for a DLPack tensor that only views its data.

    The context does not own the data content; it only keeps alive the
    ctypes objects (shape array, strides pointer) that the tensor
    descriptor points at.
    """

    def __init__(self, shape) -> None:
        # DLPack expects the extents as a C array of int64
        shape_array_type = ctypes.c_int64 * len(shape)
        self._shape = shape_array_type(*shape)
        # Null strides pointer: the data is compact and row-major
        self._strides = ctypes.POINTER(ctypes.c_int64)()

    def as_manager_ctx(self) -> ctypes.c_void_p:
        """Return a void pointer suitable for 'DLManagedTensor.manager_ctx'.

        Takes one extra reference on this context and one on the ctypes
        pointer object wrapping it, so both outlive this call.
        """
        self_ref = ctypes.py_object(self)
        self_ref_ptr = ctypes.pointer(self_ref)
        incref = ctypes.pythonapi.Py_IncRef
        incref(self_ref)
        incref(ctypes.py_object(self_ref_ptr))
        return ctypes.cast(self_ref_ptr, ctypes.c_void_p)
|
|
146
|
+
|
|
147
|
+
|
|
148
|
+
@ctypes.CFUNCTYPE(None, ctypes.c_void_p)
def managed_tensor_deleter(handle: ctypes.c_void_p) -> None:
    """Release the DLManagedTensor located at address 'handle'.

    Drops two references through the tensor's 'manager_ctx' and then
    frees the struct itself with PyMem_RawFree.
    """
    managed = DLManagedTensor.from_address(handle)
    ctx_ptr_type = ctypes.POINTER(ctypes.py_object)
    ctx_ptr = ctypes.cast(managed.manager_ctx, ctx_ptr_type)
    ctx_obj = ctx_ptr.contents
    # NOTE(review): presumably these balance the two Py_IncRef calls in
    # DataViewContext.as_manager_ctx -- confirm, since 'ctx_ptr' is
    # produced by a fresh ctypes.cast here.
    ctypes.pythonapi.Py_DecRef(ctx_obj)
    ctypes.pythonapi.Py_DecRef(ctypes.py_object(ctx_ptr))
    # The struct is freed last, after its fields have been read
    ctypes.pythonapi.PyMem_RawFree(handle)
|
|
157
|
+
|
|
158
|
+
|
|
159
|
+
@ctypes.CFUNCTYPE(None, ctypes.c_void_p)
def pycapsule_deleter(handle: ctypes.c_void_p) -> None:
    """Destructor callback for the PyCapsule wrapping a DLManagedTensor.

    If the capsule is still valid under the "dltensor" name, the managed
    tensor it points to is released and the capsule's destructor is
    cleared. Otherwise nothing is done.
    """
    capsule: ctypes.py_object = ctypes.cast(handle, ctypes.py_object)
    api = ctypes.pythonapi
    # NOTE(review): presumably a capsule that fails this check has been
    # taken over by a consumer -- confirm against the DLPack protocol.
    if not api.PyCapsule_IsValid(capsule, c_str_dltensor):
        return
    tensor_address = api.PyCapsule_GetPointer(capsule, c_str_dltensor)
    managed_tensor_deleter(tensor_address)
    api.PyCapsule_SetDestructor(capsule, None)
|
|
167
|
+
|
|
168
|
+
|
|
169
|
+
def triton_to_dlpack_dtype(dtype):
    """Convert a Triton data type name to the matching DLPack data type.

    Parameters
    ----------
    dtype : str
        Triton data type name, e.g. "INT32" or "FP16".

    Returns
    -------
    DLDataType
        The DLPack data type with a single lane.

    Raises
    ------
    Exception
        If 'dtype' is "BYTES" or is not a known Triton data type name.
    """
    if dtype == "BYTES":
        _raise_error("DLPack currently doesn't suppose BYTES type")

    # Triton data type name -> (DLPack type code, bits per element)
    layouts = {
        # 'dlpack.h' documents bool as 8 bits wide; a 1-bit declaration
        # makes the element size round down to 0 bytes.
        "BOOL": (DLDataTypeCode.kDLBool, 8),
        "INT8": (DLDataTypeCode.kDLInt, 8),
        "INT16": (DLDataTypeCode.kDLInt, 16),
        "INT32": (DLDataTypeCode.kDLInt, 32),
        "INT64": (DLDataTypeCode.kDLInt, 64),
        "UINT8": (DLDataTypeCode.kDLUInt, 8),
        "UINT16": (DLDataTypeCode.kDLUInt, 16),
        "UINT32": (DLDataTypeCode.kDLUInt, 32),
        "UINT64": (DLDataTypeCode.kDLUInt, 64),
        "FP16": (DLDataTypeCode.kDLFloat, 16),
        "FP32": (DLDataTypeCode.kDLFloat, 32),
        "FP64": (DLDataTypeCode.kDLFloat, 64),
        "BF16": (DLDataTypeCode.kDLBfloat, 16),
    }
    try:
        layout = layouts.get(dtype)
    except TypeError:
        # Unhashable input cannot name a data type; report it as unknown
        layout = None
    if layout is None:
        _raise_error(
            "Can not covert unknown data type '{}' to DLPack data type".format(
                dtype))
    type_code, bits = layout
    return DLDataType(type_code, bits, 1)
|
|
216
|
+
|
|
217
|
+
|
|
218
|
+
def is_device_supported(device: DLDevice):
    """Return whether the device type in 'device[0]' is a supported one.

    Supported device types are CPU, CUDA and CUDA host.
    """
    device_type = device[0]
    supported_types = [
        DLDeviceType.kDLCPU,
        DLDeviceType.kDLCUDA,
        DLDeviceType.kDLCUDAHost,
    ]
    return device_type in supported_types
|
|
222
|
+
|
|
223
|
+
|
|
224
|
+
def is_contiguous_data(ndim: ctypes.c_int,
                       shape: ctypes.POINTER(ctypes.c_int64),
                       stride: ctypes.POINTER(ctypes.c_int64)):
    """Return True if 'stride' describes compact, row-major data.

    A missing 'stride' (None, or a falsy value such as a null pointer)
    counts as contiguous. Otherwise every stride, walking from the last
    dimension to the first, must equal the product of the extents of
    all later dimensions.
    """
    if stride is not None and stride:
        expected_stride = 1
        # Walk the dimensions from innermost to outermost
        for axis in range(ndim)[::-1]:
            if stride[axis] != expected_stride:
                return False
            expected_stride *= shape[axis]
    return True
|
|
237
|
+
|
|
238
|
+
|
|
239
|
+
def get_byte_size(dtype: DLDataType, ndim: ctypes.c_int,
                  shape: ctypes.POINTER(ctypes.c_int64)):
    """Return the byte size of a tensor with the given type and shape.

    The size of one element is 'bits * lanes' of 'dtype' floor-divided
    by 8, and it is multiplied by the first 'ndim' extents in 'shape'.
    """
    # Assume 8 bits in a byte
    total_bytes = dtype.bits * dtype.lanes // 8
    for axis in range(ndim):
        total_bytes *= shape[axis]
    return total_bytes
|
|
245
|
+
|
|
246
|
+
|
|
247
|
+
def get_dlpack_capsule(dlpack_obj, stream=None):
    """Extract the DLPack PyCapsule from 'dlpack_obj'.

    Parameters
    ----------
    dlpack_obj : object
        Either an object implementing '__dlpack__' and
        '__dlpack_device__', or (old interface) the PyCapsule itself.
    stream : object
        Forwarded to '__dlpack__' only when the object reports a CUDA
        device. Ignored otherwise.

    Returns
    -------
    object
        The result of 'dlpack_obj.__dlpack__', or 'dlpack_obj' itself
        when it does not define '__dlpack__'.

    Raises
    ------
    Exception
        If '__dlpack__' is defined without '__dlpack_device__', or if
        the reported device type is not supported.
    """
    if not hasattr(dlpack_obj, '__dlpack__'):
        # Old interface where PyCapsule object is passed directly
        return dlpack_obj

    if not hasattr(dlpack_obj, '__dlpack_device__'):
        _raise_error(
            "DLPack expects '__dlpack_device__' if '__dlpack__' has been defined"
        )
    device = dlpack_obj.__dlpack_device__()
    if not is_device_supported(device):
        _raise_error("DLPack device type {} is not supported".format(
            device[0]))

    # Have to condition on the device type as, using numpy as example,
    # some DLPack implementations don't accept 'stream' as an argument.
    # 'device' is a (device type, device id) pair, so only its first
    # item can be compared with a device type code.
    if device[0] != DLDeviceType.kDLCUDA:
        return dlpack_obj.__dlpack__()
    # Passed by keyword so that implementations declaring 'stream' as
    # keyword-only accept the call as well.
    return dlpack_obj.__dlpack__(stream=stream)
|
|
@@ -0,0 +1,79 @@
|
|
|
1
|
+
# Copyright 2023, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
#
|
|
3
|
+
# Redistribution and use in source and binary forms, with or without
|
|
4
|
+
# modification, are permitted provided that the following conditions
|
|
5
|
+
# are met:
|
|
6
|
+
# * Redistributions of source code must retain the above copyright
|
|
7
|
+
# notice, this list of conditions and the following disclaimer.
|
|
8
|
+
# * Redistributions in binary form must reproduce the above copyright
|
|
9
|
+
# notice, this list of conditions and the following disclaimer in the
|
|
10
|
+
# documentation and/or other materials provided with the distribution.
|
|
11
|
+
# * Neither the name of NVIDIA CORPORATION nor the names of its
|
|
12
|
+
# contributors may be used to endorse or promote products derived
|
|
13
|
+
# from this software without specific prior written permission.
|
|
14
|
+
#
|
|
15
|
+
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS ``AS IS'' AND ANY
|
|
16
|
+
# EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
17
|
+
# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
|
|
18
|
+
# PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
|
|
19
|
+
# CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
|
|
20
|
+
# EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
|
|
21
|
+
# PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
|
|
22
|
+
# PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
|
|
23
|
+
# OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
24
|
+
# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
|
25
|
+
# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
26
|
+
|
|
27
|
+
import ctypes
|
|
28
|
+
from . import _dlpack
|
|
29
|
+
import collections
|
|
30
|
+
|
|
31
|
+
|
|
32
|
+
class SharedMemoryTensor:
    """An object of SharedMemoryTensor class is a view of the shared memory
    region that follows DLPack specification. This object should be considered
    invalidated if there is modification on the corresponding shared memory
    region.

    https://dmlc.github.io/dlpack/latest/python_spec.html

    """

    def __init__(self, dtype: str, shape: collections.abc.Iterable,
                 shm_addr: ctypes.c_void_p, offset: ctypes.c_uint64,
                 byte_size: ctypes.c_uint64, device_id: ctypes.c_int) -> None:
        """Record the description of the shared memory view.

        Parameters
        ----------
        dtype : str
            Triton data type name of the tensor elements.
        shape : iterable
            Extents of the tensor; its length is used as the number of
            dimensions.
        shm_addr : ctypes.c_void_p
            Value stored as the DLPack tensor's data pointer.
        offset : ctypes.c_uint64
            Value stored as the DLPack tensor's byte offset.
        byte_size : ctypes.c_uint64
            Byte size of the view.
        device_id : ctypes.c_int
            A value of -1 selects the CPU device (id 0); any other
            value selects the CUDA device with that id.
        """
        self._dtype = dtype
        self._shape = shape
        self._shm_addr = shm_addr
        self._offset = offset
        self._byte_size = byte_size
        self._device_id = device_id
        if device_id.value != -1:
            self._dl_device = (_dlpack.DLDeviceType.kDLCUDA, device_id.value)
        else:
            self._dl_device = (_dlpack.DLDeviceType.kDLCPU, 0)

    def __dlpack__(self, stream=None):
        """Return a "dltensor" PyCapsule describing this view.

        'stream' is accepted for protocol compatibility and is not used.

        Raises
        ------
        MemoryError
            If the DLManagedTensor struct cannot be allocated.
        Exception
            If the data type cannot be expressed in DLPack.
        """
        context = _dlpack.DataViewContext(self._shape)
        # Convert the data type before allocating, so that an
        # unsupported type cannot leave the raw allocation behind.
        dl_dtype = _dlpack.triton_to_dlpack_dtype(self._dtype)

        size = ctypes.c_size_t(ctypes.sizeof(_dlpack.DLManagedTensor))
        address = ctypes.pythonapi.PyMem_RawMalloc(size)
        if not address:
            # A NULL result is surfaced by ctypes as None
            raise MemoryError("failed to allocate memory for DLManagedTensor")

        dl_managed_tensor = _dlpack.DLManagedTensor.from_address(address)
        dl_managed_tensor.dl_tensor.data = self._shm_addr
        dl_managed_tensor.dl_tensor.device = self._dl_device
        dl_managed_tensor.dl_tensor.dtype = dl_dtype
        dl_managed_tensor.dl_tensor.ndim = len(self._shape)
        dl_managed_tensor.dl_tensor.shape = context._shape
        dl_managed_tensor.dl_tensor.strides = context._strides
        dl_managed_tensor.dl_tensor.byte_offset = self._offset
        # The context takes extra references on itself here, keeping the
        # shape array alive after this method returns.
        dl_managed_tensor.manager_ctx = context.as_manager_ctx()
        dl_managed_tensor.deleter = _dlpack.managed_tensor_deleter
        pycapsule = ctypes.pythonapi.PyCapsule_New(
            ctypes.byref(dl_managed_tensor),
            _dlpack.c_str_dltensor,
            _dlpack.pycapsule_deleter,
        )
        return pycapsule

    def __dlpack_device__(self):
        """Return the (device type, device id) pair of this view."""
        return self._dl_device
|
|
@@ -0,0 +1,42 @@
|
|
|
1
|
+
tritonclient-2.36.0.data/data/LICENSE.txt,sha256=NMqy92YzgvtkIas9IW34i27ARqi_sCunXDu-t-EqxL8,1533
|
|
2
|
+
tritonclient-2.36.0.data/purelib/tritonclient/__init__.py,sha256=erynU-5HRlcIz1tx1Ve0kdCnzAXfNFeUYB5bx2fnL4Y,1542
|
|
3
|
+
tritonclient-2.36.0.data/purelib/tritonclient/_auth.py,sha256=sXf16LlDoQj1qI3GSnFa1mgOv0zhwFmB0OHofkIwVh0,2047
|
|
4
|
+
tritonclient-2.36.0.data/purelib/tritonclient/_client.py,sha256=8-VaArNooS9zKRY0aYTW9xvphmNa5vgWy7PDbBnGVw4,2964
|
|
5
|
+
tritonclient-2.36.0.data/purelib/tritonclient/_plugin.py,sha256=hAaX9FakQBsbh5DZVAlcDujVwrV4EddcmPxMp3puxX0,2069
|
|
6
|
+
tritonclient-2.36.0.data/purelib/tritonclient/_request.py,sha256=RmGnJpiRxTi33mn8Nl7ivGFqeKjicj_HhShtgOTci8I,1789
|
|
7
|
+
tritonclient-2.36.0.data/purelib/tritonclient/grpc/__init__.py,sha256=MDsTzhwtE6603Ixkf6g_N3_5OCqhoDdCZT0KuZFtAmI,2959
|
|
8
|
+
tritonclient-2.36.0.data/purelib/tritonclient/grpc/_client.py,sha256=tGQzAF8ld7JKKgIHYmLvSItGQNHz7CuoTLcW_YyMbuk,69184
|
|
9
|
+
tritonclient-2.36.0.data/purelib/tritonclient/grpc/_infer_input.py,sha256=5cfHBc7lVxWq36HGG12xgnQlx_-3OG8L0fQ18AK3zjA,7213
|
|
10
|
+
tritonclient-2.36.0.data/purelib/tritonclient/grpc/_infer_result.py,sha256=gWA8LO7SiA7BsJnC8TGVh0kfE3hEmRrXNpXRSqMmOwY,6193
|
|
11
|
+
tritonclient-2.36.0.data/purelib/tritonclient/grpc/_infer_stream.py,sha256=AYGC7pD2jXkFQr0wq1moUE1MDgICMMTHVbCFvlujvl8,6618
|
|
12
|
+
tritonclient-2.36.0.data/purelib/tritonclient/grpc/_requested_output.py,sha256=SUHrwwH0RA2Uge6imndW5hNdzhcZtNhrV_0DRwFep8U,4409
|
|
13
|
+
tritonclient-2.36.0.data/purelib/tritonclient/grpc/_utils.py,sha256=aMF8Vi6TtZve7BJ8QlZ6FjQr1MLkPs0PIg7iV5DVxXo,4954
|
|
14
|
+
tritonclient-2.36.0.data/purelib/tritonclient/grpc/model_config_pb2.py,sha256=KL3whNLO69fTXi4RBrdMDQ1OPsOrPPpjYx1xZCsnA78,46321
|
|
15
|
+
tritonclient-2.36.0.data/purelib/tritonclient/grpc/service_pb2.py,sha256=4DTipBPPoTBFW8FwKCD1BMYYHSxhKizuyYW0vYhg1bg,55250
|
|
16
|
+
tritonclient-2.36.0.data/purelib/tritonclient/grpc/service_pb2_grpc.py,sha256=BRXBBgehQgx_LSLqiw_N0zqFl4NYDhstm6AJHP3uxBw,37795
|
|
17
|
+
tritonclient-2.36.0.data/purelib/tritonclient/grpc/aio/__init__.py,sha256=b4AFQnhd_ujj9eGAEGhpqKlfjDtx9AMLJgrdn77OSEI,33059
|
|
18
|
+
tritonclient-2.36.0.data/purelib/tritonclient/grpc/aio/auth/__init__.py,sha256=nOIwuyXvzV1Dha2ZFX5vRjFhgsDa-cBdP2wSWNA6g1w,1573
|
|
19
|
+
tritonclient-2.36.0.data/purelib/tritonclient/grpc/auth/__init__.py,sha256=1JifMIv8ipug7qUP4joArCyRsEXjxV-DIhvrJ2Kj5Rk,1574
|
|
20
|
+
tritonclient-2.36.0.data/purelib/tritonclient/http/__init__.py,sha256=tbJXG_x_NV7x9LbR2h7DAImiwM3a2uA7HBMKfDhpX1A,2128
|
|
21
|
+
tritonclient-2.36.0.data/purelib/tritonclient/http/_client.py,sha256=R8QDM_hFJACsvly0QheM7_ZRLkUrOEp6RMhPOLVUO1g,61716
|
|
22
|
+
tritonclient-2.36.0.data/purelib/tritonclient/http/_infer_input.py,sha256=eEYQEiK8AzAAW5zJq_c_thbxdHq0mAAjdWgeZYv5EoY,9506
|
|
23
|
+
tritonclient-2.36.0.data/purelib/tritonclient/http/_infer_result.py,sha256=vQIcWxxThgvFSnChZwZebKIJW-pSawXG1nVi6ncCYYE,9920
|
|
24
|
+
tritonclient-2.36.0.data/purelib/tritonclient/http/_requested_output.py,sha256=QU-07jLHbKh1S7hCoqvqjPxrHWeb0CsJ8Qd3077AU1U,4695
|
|
25
|
+
tritonclient-2.36.0.data/purelib/tritonclient/http/_utils.py,sha256=rMw1Ojz3UFsbPjrvU4nKVLH65TPJbujMJXhw7klZynk,5118
|
|
26
|
+
tritonclient-2.36.0.data/purelib/tritonclient/http/aio/__init__.py,sha256=edd6GlMqiAb2kJG2jWlBs2P0B6cjAIYig4hEcFs4U68,30390
|
|
27
|
+
tritonclient-2.36.0.data/purelib/tritonclient/http/aio/auth/__init__.py,sha256=2hd0vpFKURRLz9MjB6sf1Tnfq3bzLdhgG_VJBFwj6vA,1575
|
|
28
|
+
tritonclient-2.36.0.data/purelib/tritonclient/http/auth/__init__.py,sha256=1JifMIv8ipug7qUP4joArCyRsEXjxV-DIhvrJ2Kj5Rk,1574
|
|
29
|
+
tritonclient-2.36.0.data/purelib/tritonclient/utils/__init__.py,sha256=JVWOJ5YCglG1gJWgfJGsWrCK4PgzFA_2kz3bag3nZ8E,10557
|
|
30
|
+
tritonclient-2.36.0.data/purelib/tritonclient/utils/_dlpack.py,sha256=eEUc-F0pBO6p8vBtN7KC5bB29DdkYH4wS9YtQPn1oKw,8963
|
|
31
|
+
tritonclient-2.36.0.data/purelib/tritonclient/utils/_shared_memory_tensor.py,sha256=Ei9P4xecCckED_lQ7xXL98NJNNuE_89gIW54B4Sh0MY,3688
|
|
32
|
+
tritonclient-2.36.0.data/purelib/tritonclientutils/__init__.py,sha256=D9hxs7FZaDd50ql_jLvaDFOwH8gCOp2LeFTaW1purzo,1821
|
|
33
|
+
tritonclient-2.36.0.data/purelib/tritongrpcclient/__init__.py,sha256=hRAS-HadBCUVAzEFi2ZNW0Cbtd2-x09mmG0bXu-Q3iI,1818
|
|
34
|
+
tritonclient-2.36.0.data/purelib/tritongrpcclient/grpc_service_pb2.py,sha256=L8UJUpxXzI0AA8YbGActcCUiaYQodaZBRLlOEDcbtEU,1842
|
|
35
|
+
tritonclient-2.36.0.data/purelib/tritongrpcclient/grpc_service_pb2_grpc.py,sha256=YN64p5Y7HZ7eMLnM596As4WAQ2FKh828Rda7jVXF9TM,1852
|
|
36
|
+
tritonclient-2.36.0.data/purelib/tritongrpcclient/model_config_pb2.py,sha256=Mk94wHJMdtG4Ptj0QSTVz7uRDsfX-l4zmN0dPeqiIZE,1852
|
|
37
|
+
tritonclient-2.36.0.data/purelib/tritonhttpclient/__init__.py,sha256=IHIoNJAlBvjTut2ySmh9c0Iw1DyJzc4a5IcYbrzLw3Q,1818
|
|
38
|
+
tritonclient-2.36.0.dist-info/LICENSE.txt,sha256=NMqy92YzgvtkIas9IW34i27ARqi_sCunXDu-t-EqxL8,1533
|
|
39
|
+
tritonclient-2.36.0.dist-info/METADATA,sha256=8H9_Zw6bxz11Sptyuqm93tyy5CApNy8m_Mg4VLivr9k,2716
|
|
40
|
+
tritonclient-2.36.0.dist-info/WHEEL,sha256=HVOIUsWA--OEoo_LBcXUZ_J2MMLFJ69mOq_A9H3ARGY,93
|
|
41
|
+
tritonclient-2.36.0.dist-info/top_level.txt,sha256=J2zLu0JxoFexDB102feHPD6J3JXAUEYUInFJZM9yEkM,65
|
|
42
|
+
tritonclient-2.36.0.dist-info/RECORD,,
|
|
@@ -1,40 +0,0 @@
|
|
|
1
|
-
tritonclient-2.34.0.data/data/LICENSE.txt,sha256=NMqy92YzgvtkIas9IW34i27ARqi_sCunXDu-t-EqxL8,1533
|
|
2
|
-
tritonclient-2.34.0.data/purelib/tritonclient/__init__.py,sha256=erynU-5HRlcIz1tx1Ve0kdCnzAXfNFeUYB5bx2fnL4Y,1542
|
|
3
|
-
tritonclient-2.34.0.data/purelib/tritonclient/_auth.py,sha256=sXf16LlDoQj1qI3GSnFa1mgOv0zhwFmB0OHofkIwVh0,2047
|
|
4
|
-
tritonclient-2.34.0.data/purelib/tritonclient/_client.py,sha256=8-VaArNooS9zKRY0aYTW9xvphmNa5vgWy7PDbBnGVw4,2964
|
|
5
|
-
tritonclient-2.34.0.data/purelib/tritonclient/_plugin.py,sha256=hAaX9FakQBsbh5DZVAlcDujVwrV4EddcmPxMp3puxX0,2069
|
|
6
|
-
tritonclient-2.34.0.data/purelib/tritonclient/_request.py,sha256=RmGnJpiRxTi33mn8Nl7ivGFqeKjicj_HhShtgOTci8I,1789
|
|
7
|
-
tritonclient-2.34.0.data/purelib/tritonclient/grpc/__init__.py,sha256=MDsTzhwtE6603Ixkf6g_N3_5OCqhoDdCZT0KuZFtAmI,2959
|
|
8
|
-
tritonclient-2.34.0.data/purelib/tritonclient/grpc/_client.py,sha256=HT1E8nMsi5TYjeRRuhLIwT3gD17_223M2nN8spSdzi4,67932
|
|
9
|
-
tritonclient-2.34.0.data/purelib/tritonclient/grpc/_infer_input.py,sha256=5cfHBc7lVxWq36HGG12xgnQlx_-3OG8L0fQ18AK3zjA,7213
|
|
10
|
-
tritonclient-2.34.0.data/purelib/tritonclient/grpc/_infer_result.py,sha256=gWA8LO7SiA7BsJnC8TGVh0kfE3hEmRrXNpXRSqMmOwY,6193
|
|
11
|
-
tritonclient-2.34.0.data/purelib/tritonclient/grpc/_infer_stream.py,sha256=AYGC7pD2jXkFQr0wq1moUE1MDgICMMTHVbCFvlujvl8,6618
|
|
12
|
-
tritonclient-2.34.0.data/purelib/tritonclient/grpc/_requested_output.py,sha256=SUHrwwH0RA2Uge6imndW5hNdzhcZtNhrV_0DRwFep8U,4409
|
|
13
|
-
tritonclient-2.34.0.data/purelib/tritonclient/grpc/_utils.py,sha256=JdmHVv7efZg_Wiuf4tW6Q5hyqK_v9k_9aw7C4Mh3U38,4953
|
|
14
|
-
tritonclient-2.34.0.data/purelib/tritonclient/grpc/model_config_pb2.py,sha256=UI9ApQ47f5WzOtQX0KnNnXzwCA-Ady0VHimxLlKYi4M,46315
|
|
15
|
-
tritonclient-2.34.0.data/purelib/tritonclient/grpc/service_pb2.py,sha256=q3bQJtgKaCFJlWSZxkZjOmCU0BRNG3S5_1QaiV-oG58,54542
|
|
16
|
-
tritonclient-2.34.0.data/purelib/tritonclient/grpc/service_pb2_grpc.py,sha256=BRXBBgehQgx_LSLqiw_N0zqFl4NYDhstm6AJHP3uxBw,37795
|
|
17
|
-
tritonclient-2.34.0.data/purelib/tritonclient/grpc/aio/__init__.py,sha256=8gEdEltJSzd3GF_xSrLG1gh3aGuvX7aQzigi1WPbw1I,32979
|
|
18
|
-
tritonclient-2.34.0.data/purelib/tritonclient/grpc/aio/auth/__init__.py,sha256=nOIwuyXvzV1Dha2ZFX5vRjFhgsDa-cBdP2wSWNA6g1w,1573
|
|
19
|
-
tritonclient-2.34.0.data/purelib/tritonclient/grpc/auth/__init__.py,sha256=1JifMIv8ipug7qUP4joArCyRsEXjxV-DIhvrJ2Kj5Rk,1574
|
|
20
|
-
tritonclient-2.34.0.data/purelib/tritonclient/http/__init__.py,sha256=tbJXG_x_NV7x9LbR2h7DAImiwM3a2uA7HBMKfDhpX1A,2128
|
|
21
|
-
tritonclient-2.34.0.data/purelib/tritonclient/http/_client.py,sha256=R8QDM_hFJACsvly0QheM7_ZRLkUrOEp6RMhPOLVUO1g,61716
|
|
22
|
-
tritonclient-2.34.0.data/purelib/tritonclient/http/_infer_input.py,sha256=eEYQEiK8AzAAW5zJq_c_thbxdHq0mAAjdWgeZYv5EoY,9506
|
|
23
|
-
tritonclient-2.34.0.data/purelib/tritonclient/http/_infer_result.py,sha256=vQIcWxxThgvFSnChZwZebKIJW-pSawXG1nVi6ncCYYE,9920
|
|
24
|
-
tritonclient-2.34.0.data/purelib/tritonclient/http/_requested_output.py,sha256=QU-07jLHbKh1S7hCoqvqjPxrHWeb0CsJ8Qd3077AU1U,4695
|
|
25
|
-
tritonclient-2.34.0.data/purelib/tritonclient/http/_utils.py,sha256=rMw1Ojz3UFsbPjrvU4nKVLH65TPJbujMJXhw7klZynk,5118
|
|
26
|
-
tritonclient-2.34.0.data/purelib/tritonclient/http/aio/__init__.py,sha256=edd6GlMqiAb2kJG2jWlBs2P0B6cjAIYig4hEcFs4U68,30390
|
|
27
|
-
tritonclient-2.34.0.data/purelib/tritonclient/http/aio/auth/__init__.py,sha256=2hd0vpFKURRLz9MjB6sf1Tnfq3bzLdhgG_VJBFwj6vA,1575
|
|
28
|
-
tritonclient-2.34.0.data/purelib/tritonclient/http/auth/__init__.py,sha256=1JifMIv8ipug7qUP4joArCyRsEXjxV-DIhvrJ2Kj5Rk,1574
|
|
29
|
-
tritonclient-2.34.0.data/purelib/tritonclient/utils/__init__.py,sha256=0aKf-KpxgWFqMIXT-5msg_Y4LNCDMe33VyuTcuyRNM4,10503
|
|
30
|
-
tritonclient-2.34.0.data/purelib/tritonclientutils/__init__.py,sha256=D9hxs7FZaDd50ql_jLvaDFOwH8gCOp2LeFTaW1purzo,1821
|
|
31
|
-
tritonclient-2.34.0.data/purelib/tritongrpcclient/__init__.py,sha256=hRAS-HadBCUVAzEFi2ZNW0Cbtd2-x09mmG0bXu-Q3iI,1818
|
|
32
|
-
tritonclient-2.34.0.data/purelib/tritongrpcclient/grpc_service_pb2.py,sha256=L8UJUpxXzI0AA8YbGActcCUiaYQodaZBRLlOEDcbtEU,1842
|
|
33
|
-
tritonclient-2.34.0.data/purelib/tritongrpcclient/grpc_service_pb2_grpc.py,sha256=YN64p5Y7HZ7eMLnM596As4WAQ2FKh828Rda7jVXF9TM,1852
|
|
34
|
-
tritonclient-2.34.0.data/purelib/tritongrpcclient/model_config_pb2.py,sha256=Mk94wHJMdtG4Ptj0QSTVz7uRDsfX-l4zmN0dPeqiIZE,1852
|
|
35
|
-
tritonclient-2.34.0.data/purelib/tritonhttpclient/__init__.py,sha256=IHIoNJAlBvjTut2ySmh9c0Iw1DyJzc4a5IcYbrzLw3Q,1818
|
|
36
|
-
tritonclient-2.34.0.dist-info/LICENSE.txt,sha256=NMqy92YzgvtkIas9IW34i27ARqi_sCunXDu-t-EqxL8,1533
|
|
37
|
-
tritonclient-2.34.0.dist-info/METADATA,sha256=F7faWwgsiTKETF7NL6g7-V_CFRR4JXHye0X3Oy4XyEI,2716
|
|
38
|
-
tritonclient-2.34.0.dist-info/WHEEL,sha256=HVOIUsWA--OEoo_LBcXUZ_J2MMLFJ69mOq_A9H3ARGY,93
|
|
39
|
-
tritonclient-2.34.0.dist-info/top_level.txt,sha256=J2zLu0JxoFexDB102feHPD6J3JXAUEYUInFJZM9yEkM,65
|
|
40
|
-
tritonclient-2.34.0.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/_infer_input.py
RENAMED
|
File without changes
|
{tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/_infer_result.py
RENAMED
|
File without changes
|
{tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/_infer_stream.py
RENAMED
|
File without changes
|
{tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/_requested_output.py
RENAMED
|
File without changes
|
{tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/aio/auth/__init__.py
RENAMED
|
File without changes
|
{tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/auth/__init__.py
RENAMED
|
File without changes
|
{tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/grpc/service_pb2_grpc.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/http/_infer_input.py
RENAMED
|
File without changes
|
{tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/http/_infer_result.py
RENAMED
|
File without changes
|
{tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/http/_requested_output.py
RENAMED
|
File without changes
|
|
File without changes
|
{tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/http/aio/__init__.py
RENAMED
|
File without changes
|
{tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/http/aio/auth/__init__.py
RENAMED
|
File without changes
|
{tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritonclient/http/auth/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritongrpcclient/grpc_service_pb2.py
RENAMED
|
File without changes
|
|
File without changes
|
{tritonclient-2.34.0.data → tritonclient-2.36.0.data}/purelib/tritongrpcclient/model_config_pb2.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|