google-cloud-ai_platform-v1 0.34.0 → 0.35.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -14,7 +14,7 @@ require 'google/cloud/aiplatform/v1/types_pb'
14
14
  require 'google/protobuf/struct_pb'
15
15
 
16
16
 
17
- descriptor_data = "\n3google/cloud/aiplatform/v1/prediction_service.proto\x12\x1agoogle.cloud.aiplatform.v1\x1a\x1cgoogle/api/annotations.proto\x1a\x17google/api/client.proto\x1a\x1fgoogle/api/field_behavior.proto\x1a\x19google/api/httpbody.proto\x1a\x19google/api/resource.proto\x1a,google/cloud/aiplatform/v1/explanation.proto\x1a&google/cloud/aiplatform/v1/types.proto\x1a\x1cgoogle/protobuf/struct.proto\"\xaa\x01\n\x0ePredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12.\n\tinstances\x18\x02 \x03(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x02\x12*\n\nparameters\x18\x03 \x01(\x0b\x32\x16.google.protobuf.Value\"\x80\x02\n\x0fPredictResponse\x12+\n\x0bpredictions\x18\x01 \x03(\x0b\x32\x16.google.protobuf.Value\x12\x19\n\x11\x64\x65ployed_model_id\x18\x02 \x01(\t\x12\x36\n\x05model\x18\x03 \x01(\tB\'\xe0\x41\x03\xfa\x41!\n\x1f\x61iplatform.googleapis.com/Model\x12\x1d\n\x10model_version_id\x18\x05 \x01(\tB\x03\xe0\x41\x03\x12\x1f\n\x12model_display_name\x18\x04 \x01(\tB\x03\xe0\x41\x03\x12-\n\x08metadata\x18\x06 \x01(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x03\"z\n\x11RawPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\'\n\thttp_body\x18\x02 \x01(\x0b\x32\x14.google.api.HttpBody\"\xc3\x01\n\x17StreamingPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\x32\n\x06inputs\x18\x02 \x03(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\x12\x36\n\nparameters\x18\x03 \x01(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\"\x87\x01\n\x18StreamingPredictResponse\x12\x33\n\x07outputs\x18\x01 \x03(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\x12\x36\n\nparameters\x18\x02 \x01(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\"\x9d\x02\n\x0e\x45xplainRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12.\n\tinstances\x18\x02 
\x03(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x02\x12*\n\nparameters\x18\x04 \x01(\x0b\x32\x16.google.protobuf.Value\x12V\n\x19\x65xplanation_spec_override\x18\x05 \x01(\x0b\x32\x33.google.cloud.aiplatform.v1.ExplanationSpecOverride\x12\x19\n\x11\x64\x65ployed_model_id\x18\x03 \x01(\t\"\x98\x01\n\x0f\x45xplainResponse\x12=\n\x0c\x65xplanations\x18\x01 \x03(\x0b\x32\'.google.cloud.aiplatform.v1.Explanation\x12\x19\n\x11\x64\x65ployed_model_id\x18\x02 \x01(\t\x12+\n\x0bpredictions\x18\x03 \x03(\x0b\x32\x16.google.protobuf.Value\"\x82\x01\n\x12\x43ountTokensRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12.\n\tinstances\x18\x02 \x03(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x02\"N\n\x13\x43ountTokensResponse\x12\x14\n\x0ctotal_tokens\x18\x01 \x01(\x05\x12!\n\x19total_billable_characters\x18\x02 \x01(\x05\x32\x8f\t\n\x11PredictionService\x12\x94\x02\n\x07Predict\x12*.google.cloud.aiplatform.v1.PredictRequest\x1a+.google.cloud.aiplatform.v1.PredictResponse\"\xaf\x01\x82\xd3\xe4\x93\x02\x88\x01\"9/v1/{endpoint=projects/*/locations/*/endpoints/*}:predict:\x01*ZH\"C/v1/{endpoint=projects/*/locations/*/publishers/*/models/*}:predict:\x01*\xda\x41\x1d\x65ndpoint,instances,parameters\x12\xfe\x01\n\nRawPredict\x12-.google.cloud.aiplatform.v1.RawPredictRequest\x1a\x14.google.api.HttpBody\"\xaa\x01\x82\xd3\xe4\x93\x02\x8e\x01\"</v1/{endpoint=projects/*/locations/*/endpoints/*}:rawPredict:\x01*ZK\"F/v1/{endpoint=projects/*/locations/*/publishers/*/models/*}:rawPredict:\x01*\xda\x41\x12\x65ndpoint,http_body\x12\xb5\x02\n\x16ServerStreamingPredict\x12\x33.google.cloud.aiplatform.v1.StreamingPredictRequest\x1a\x34.google.cloud.aiplatform.v1.StreamingPredictResponse\"\xad\x01\x82\xd3\xe4\x93\x02\xa6\x01\"H/v1/{endpoint=projects/*/locations/*/endpoints/*}:serverStreamingPredict:\x01*ZW\"R/v1/{endpoint=projects/*/locations/*/publishers/*/models/*}:serverStreamingPredict:\x01*0\x01\x12\xda\x01\n\x07\x45xplain\x12*.
google.cloud.aiplatform.v1.ExplainRequest\x1a+.google.cloud.aiplatform.v1.ExplainResponse\"v\x82\xd3\xe4\x93\x02>\"9/v1/{endpoint=projects/*/locations/*/endpoints/*}:explain:\x01*\xda\x41/endpoint,instances,parameters,deployed_model_id\x1aM\xca\x41\x19\x61iplatform.googleapis.com\xd2\x41.https://www.googleapis.com/auth/cloud-platformB\xd4\x01\n\x1e\x63om.google.cloud.aiplatform.v1B\x16PredictionServiceProtoP\x01Z>cloud.google.com/go/aiplatform/apiv1/aiplatformpb;aiplatformpb\xaa\x02\x1aGoogle.Cloud.AIPlatform.V1\xca\x02\x1aGoogle\\Cloud\\AIPlatform\\V1\xea\x02\x1dGoogle::Cloud::AIPlatform::V1b\x06proto3"
17
+ descriptor_data = "\n3google/cloud/aiplatform/v1/prediction_service.proto\x12\x1agoogle.cloud.aiplatform.v1\x1a\x1cgoogle/api/annotations.proto\x1a\x17google/api/client.proto\x1a\x1fgoogle/api/field_behavior.proto\x1a\x19google/api/httpbody.proto\x1a\x19google/api/resource.proto\x1a,google/cloud/aiplatform/v1/explanation.proto\x1a&google/cloud/aiplatform/v1/types.proto\x1a\x1cgoogle/protobuf/struct.proto\"\xaa\x01\n\x0ePredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12.\n\tinstances\x18\x02 \x03(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x02\x12*\n\nparameters\x18\x03 \x01(\x0b\x32\x16.google.protobuf.Value\"\x80\x02\n\x0fPredictResponse\x12+\n\x0bpredictions\x18\x01 \x03(\x0b\x32\x16.google.protobuf.Value\x12\x19\n\x11\x64\x65ployed_model_id\x18\x02 \x01(\t\x12\x36\n\x05model\x18\x03 \x01(\tB\'\xe0\x41\x03\xfa\x41!\n\x1f\x61iplatform.googleapis.com/Model\x12\x1d\n\x10model_version_id\x18\x05 \x01(\tB\x03\xe0\x41\x03\x12\x1f\n\x12model_display_name\x18\x04 \x01(\tB\x03\xe0\x41\x03\x12-\n\x08metadata\x18\x06 \x01(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x03\"z\n\x11RawPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\'\n\thttp_body\x18\x02 \x01(\x0b\x32\x14.google.api.HttpBody\"\xc0\x01\n\x14\x44irectPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\x32\n\x06inputs\x18\x02 \x03(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\x12\x36\n\nparameters\x18\x03 \x01(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\"\x84\x01\n\x15\x44irectPredictResponse\x12\x33\n\x07outputs\x18\x01 \x03(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\x12\x36\n\nparameters\x18\x02 \x01(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\"{\n\x17\x44irectRawPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 
\x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\x13\n\x0bmethod_name\x18\x02 \x01(\t\x12\r\n\x05input\x18\x03 \x01(\x0c\"*\n\x18\x44irectRawPredictResponse\x12\x0e\n\x06output\x18\x01 \x01(\x0c\"\xc3\x01\n\x17StreamingPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\x32\n\x06inputs\x18\x02 \x03(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\x12\x36\n\nparameters\x18\x03 \x01(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\"\x87\x01\n\x18StreamingPredictResponse\x12\x33\n\x07outputs\x18\x01 \x03(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\x12\x36\n\nparameters\x18\x02 \x01(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\"~\n\x1aStreamingRawPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\x13\n\x0bmethod_name\x18\x02 \x01(\t\x12\r\n\x05input\x18\x03 \x01(\x0c\"-\n\x1bStreamingRawPredictResponse\x12\x0e\n\x06output\x18\x01 \x01(\x0c\"\x9d\x02\n\x0e\x45xplainRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12.\n\tinstances\x18\x02 \x03(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x02\x12*\n\nparameters\x18\x04 \x01(\x0b\x32\x16.google.protobuf.Value\x12V\n\x19\x65xplanation_spec_override\x18\x05 \x01(\x0b\x32\x33.google.cloud.aiplatform.v1.ExplanationSpecOverride\x12\x19\n\x11\x64\x65ployed_model_id\x18\x03 \x01(\t\"\x98\x01\n\x0f\x45xplainResponse\x12=\n\x0c\x65xplanations\x18\x01 \x03(\x0b\x32\'.google.cloud.aiplatform.v1.Explanation\x12\x19\n\x11\x64\x65ployed_model_id\x18\x02 \x01(\t\x12+\n\x0bpredictions\x18\x03 \x03(\x0b\x32\x16.google.protobuf.Value\"\x82\x01\n\x12\x43ountTokensRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12.\n\tinstances\x18\x02 \x03(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x02\"N\n\x13\x43ountTokensResponse\x12\x14\n\x0ctotal_tokens\x18\x01 
\x01(\x05\x12!\n\x19total_billable_characters\x18\x02 \x01(\x05\x32\xb6\x0e\n\x11PredictionService\x12\x94\x02\n\x07Predict\x12*.google.cloud.aiplatform.v1.PredictRequest\x1a+.google.cloud.aiplatform.v1.PredictResponse\"\xaf\x01\x82\xd3\xe4\x93\x02\x88\x01\"9/v1/{endpoint=projects/*/locations/*/endpoints/*}:predict:\x01*ZH\"C/v1/{endpoint=projects/*/locations/*/publishers/*/models/*}:predict:\x01*\xda\x41\x1d\x65ndpoint,instances,parameters\x12\xfe\x01\n\nRawPredict\x12-.google.cloud.aiplatform.v1.RawPredictRequest\x1a\x14.google.api.HttpBody\"\xaa\x01\x82\xd3\xe4\x93\x02\x8e\x01\"</v1/{endpoint=projects/*/locations/*/endpoints/*}:rawPredict:\x01*ZK\"F/v1/{endpoint=projects/*/locations/*/publishers/*/models/*}:rawPredict:\x01*\xda\x41\x12\x65ndpoint,http_body\x12\xc0\x01\n\rDirectPredict\x12\x30.google.cloud.aiplatform.v1.DirectPredictRequest\x1a\x31.google.cloud.aiplatform.v1.DirectPredictResponse\"J\x82\xd3\xe4\x93\x02\x44\"?/v1/{endpoint=projects/*/locations/*/endpoints/*}:directPredict:\x01*\x12\xcc\x01\n\x10\x44irectRawPredict\x12\x33.google.cloud.aiplatform.v1.DirectRawPredictRequest\x1a\x34.google.cloud.aiplatform.v1.DirectRawPredictResponse\"M\x82\xd3\xe4\x93\x02G\"B/v1/{endpoint=projects/*/locations/*/endpoints/*}:directRawPredict:\x01*\x12\x83\x01\n\x10StreamingPredict\x12\x33.google.cloud.aiplatform.v1.StreamingPredictRequest\x1a\x34.google.cloud.aiplatform.v1.StreamingPredictResponse\"\x00(\x01\x30\x01\x12\xb5\x02\n\x16ServerStreamingPredict\x12\x33.google.cloud.aiplatform.v1.StreamingPredictRequest\x1a\x34.google.cloud.aiplatform.v1.StreamingPredictResponse\"\xad\x01\x82\xd3\xe4\x93\x02\xa6\x01\"H/v1/{endpoint=projects/*/locations/*/endpoints/*}:serverStreamingPredict:\x01*ZW\"R/v1/{endpoint=projects/*/locations/*/publishers/*/models/*}:serverStreamingPredict:\x01*0\x01\x12\x8c\x01\n\x13StreamingRawPredict\x12\x36.google.cloud.aiplatform.v1.StreamingRawPredictRequest\x1a\x37.google.cloud.aiplatform.v1.StreamingRawPredictResponse\"\x00(\x01\x30\x01\x12\x
da\x01\n\x07\x45xplain\x12*.google.cloud.aiplatform.v1.ExplainRequest\x1a+.google.cloud.aiplatform.v1.ExplainResponse\"v\x82\xd3\xe4\x93\x02>\"9/v1/{endpoint=projects/*/locations/*/endpoints/*}:explain:\x01*\xda\x41/endpoint,instances,parameters,deployed_model_id\x1aM\xca\x41\x19\x61iplatform.googleapis.com\xd2\x41.https://www.googleapis.com/auth/cloud-platformB\xd4\x01\n\x1e\x63om.google.cloud.aiplatform.v1B\x16PredictionServiceProtoP\x01Z>cloud.google.com/go/aiplatform/apiv1/aiplatformpb;aiplatformpb\xaa\x02\x1aGoogle.Cloud.AIPlatform.V1\xca\x02\x1aGoogle\\Cloud\\AIPlatform\\V1\xea\x02\x1dGoogle::Cloud::AIPlatform::V1b\x06proto3"
18
18
 
19
19
  pool = Google::Protobuf::DescriptorPool.generated_pool
20
20
 
@@ -51,8 +51,14 @@ module Google
51
51
  PredictRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.PredictRequest").msgclass
52
52
  PredictResponse = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.PredictResponse").msgclass
53
53
  RawPredictRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.RawPredictRequest").msgclass
54
+ DirectPredictRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.DirectPredictRequest").msgclass
55
+ DirectPredictResponse = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.DirectPredictResponse").msgclass
56
+ DirectRawPredictRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.DirectRawPredictRequest").msgclass
57
+ DirectRawPredictResponse = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.DirectRawPredictResponse").msgclass
54
58
  StreamingPredictRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.StreamingPredictRequest").msgclass
55
59
  StreamingPredictResponse = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.StreamingPredictResponse").msgclass
60
+ StreamingRawPredictRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.StreamingRawPredictRequest").msgclass
61
+ StreamingRawPredictResponse = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.StreamingRawPredictResponse").msgclass
56
62
  ExplainRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.ExplainRequest").msgclass
57
63
  ExplainResponse = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.ExplainResponse").msgclass
58
64
  CountTokensRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.CountTokensRequest").msgclass
@@ -47,9 +47,19 @@ module Google
47
47
  # [DeployedModel][google.cloud.aiplatform.v1.DeployedModel] that served this
48
48
  # prediction.
49
49
  rpc :RawPredict, ::Google::Cloud::AIPlatform::V1::RawPredictRequest, ::Google::Api::HttpBody
50
+ # Perform a unary online prediction request for Vertex first-party products
51
+ # and frameworks.
52
+ rpc :DirectPredict, ::Google::Cloud::AIPlatform::V1::DirectPredictRequest, ::Google::Cloud::AIPlatform::V1::DirectPredictResponse
53
+ # Perform an online prediction request through gRPC.
54
+ rpc :DirectRawPredict, ::Google::Cloud::AIPlatform::V1::DirectRawPredictRequest, ::Google::Cloud::AIPlatform::V1::DirectRawPredictResponse
55
+ # Perform a streaming online prediction request for Vertex first-party
56
+ # products and frameworks.
57
+ rpc :StreamingPredict, stream(::Google::Cloud::AIPlatform::V1::StreamingPredictRequest), stream(::Google::Cloud::AIPlatform::V1::StreamingPredictResponse)
50
58
  # Perform a server-side streaming online prediction request for Vertex
51
59
  # LLM streaming.
52
60
  rpc :ServerStreamingPredict, ::Google::Cloud::AIPlatform::V1::StreamingPredictRequest, stream(::Google::Cloud::AIPlatform::V1::StreamingPredictResponse)
61
+ # Perform a streaming online prediction request through gRPC.
62
+ rpc :StreamingRawPredict, stream(::Google::Cloud::AIPlatform::V1::StreamingRawPredictRequest), stream(::Google::Cloud::AIPlatform::V1::StreamingRawPredictResponse)
53
63
  # Perform an online explanation.
54
64
  #
55
65
  # If
@@ -304,6 +304,19 @@ module Google
304
304
  # seconds: 360 # 6 minutes
305
305
  # total_poll_timeout:
306
306
  # seconds: 54000 # 90 minutes
307
+ # @!attribute [rw] auto_populated_fields
308
+ # @return [::Array<::String>]
309
+ # List of top-level fields of the request message that should be
310
+ # automatically populated by the client libraries based on their
311
+ # (google.api.field_info).format. Currently supported format: UUID4.
312
+ #
313
+ # Example of a YAML configuration:
314
+ #
315
+ # publishing:
316
+ # method_settings:
317
+ # - selector: google.example.v1.ExampleService.CreateExample
318
+ # auto_populated_fields:
319
+ # - request_id
307
320
  class MethodSettings
308
321
  include ::Google::Protobuf::MessageExts
309
322
  extend ::Google::Protobuf::MessageExts::ClassMethods
@@ -0,0 +1,64 @@
1
+ # frozen_string_literal: true
2
+
3
+ # Copyright 2023 Google LLC
4
+ #
5
+ # Licensed under the Apache License, Version 2.0 (the "License");
6
+ # you may not use this file except in compliance with the License.
7
+ # You may obtain a copy of the License at
8
+ #
9
+ # https://www.apache.org/licenses/LICENSE-2.0
10
+ #
11
+ # Unless required by applicable law or agreed to in writing, software
12
+ # distributed under the License is distributed on an "AS IS" BASIS,
13
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14
+ # See the License for the specific language governing permissions and
15
+ # limitations under the License.
16
+
17
+ # Auto-generated by gapic-generator-ruby. DO NOT EDIT!
18
+
19
+
20
+ module Google
21
+ module Cloud
22
+ module AIPlatform
23
+ module V1
24
+ # Request message for ComputeTokens RPC call.
25
+ # @!attribute [rw] endpoint
26
+ # @return [::String]
27
+ # Required. The name of the Endpoint requested to get lists of tokens and
28
+ # token ids.
29
+ # @!attribute [rw] instances
30
+ # @return [::Array<::Google::Protobuf::Value>]
31
+ # Required. The instances that are the input to token computing API call.
32
+ # Schema is identical to the prediction schema of the text model, even for
33
+ # the non-text models, like chat models, or Codey models.
34
+ class ComputeTokensRequest
35
+ include ::Google::Protobuf::MessageExts
36
+ extend ::Google::Protobuf::MessageExts::ClassMethods
37
+ end
38
+
39
+ # Tokens info with a list of tokens and the corresponding list of token ids.
40
+ # @!attribute [rw] tokens
41
+ # @return [::Array<::String>]
42
+ # A list of tokens from the input.
43
+ # @!attribute [rw] token_ids
44
+ # @return [::Array<::Integer>]
45
+ # A list of token ids from the input.
46
+ class TokensInfo
47
+ include ::Google::Protobuf::MessageExts
48
+ extend ::Google::Protobuf::MessageExts::ClassMethods
49
+ end
50
+
51
+ # Response message for ComputeTokens RPC call.
52
+ # @!attribute [rw] tokens_info
53
+ # @return [::Array<::Google::Cloud::AIPlatform::V1::TokensInfo>]
54
+ # Lists of tokens info from the input. A ComputeTokensRequest could have
55
+ # multiple instances with a prompt in each instance. We also need to return
56
+ # lists of tokens info for the request with multiple instances.
57
+ class ComputeTokensResponse
58
+ include ::Google::Protobuf::MessageExts
59
+ extend ::Google::Protobuf::MessageExts::ClassMethods
60
+ end
61
+ end
62
+ end
63
+ end
64
+ end
@@ -663,6 +663,31 @@ module Google
663
663
  # (Vertex AI makes this value available to your container code as the
664
664
  # [`AIP_DEPLOYED_MODEL_ID` environment
665
665
  # variable](https://cloud.google.com/vertex-ai/docs/predictions/custom-container-requirements#aip-variables).)
666
+ # @!attribute [rw] grpc_ports
667
+ # @return [::Array<::Google::Cloud::AIPlatform::V1::Port>]
668
+ # Immutable. List of ports to expose from the container. Vertex AI sends gRPC
669
+ # prediction requests that it receives to the first port on this list. Vertex
670
+ # AI also sends liveness and health checks to this port.
671
+ #
672
+ # If you do not specify this field, gRPC requests to the container will be
673
+ # disabled.
674
+ #
675
+ # Vertex AI does not use ports other than the first one listed. This field
676
+ # corresponds to the `ports` field of the Kubernetes Containers v1 core API.
677
+ # @!attribute [rw] deployment_timeout
678
+ # @return [::Google::Protobuf::Duration]
679
+ # Immutable. Deployment timeout.
680
+ # Limit for deployment timeout is 2 hours.
681
+ # @!attribute [rw] shared_memory_size_mb
682
+ # @return [::Integer]
683
+ # Immutable. The amount of the VM memory to reserve as the shared memory for
684
+ # the model in megabytes.
685
+ # @!attribute [rw] startup_probe
686
+ # @return [::Google::Cloud::AIPlatform::V1::Probe]
687
+ # Immutable. Specification for Kubernetes startup probe.
688
+ # @!attribute [rw] health_probe
689
+ # @return [::Google::Cloud::AIPlatform::V1::Probe]
690
+ # Immutable. Specification for Kubernetes readiness probe.
666
691
  class ModelContainerSpec
667
692
  include ::Google::Protobuf::MessageExts
668
693
  extend ::Google::Protobuf::MessageExts::ClassMethods
@@ -712,6 +737,42 @@ module Google
712
737
  GENIE = 5
713
738
  end
714
739
  end
740
+
741
+ # Probe describes a health check to be performed against a container to
742
+ # determine whether it is alive or ready to receive traffic.
743
+ # @!attribute [rw] exec
744
+ # @return [::Google::Cloud::AIPlatform::V1::Probe::ExecAction]
745
+ # Exec specifies the action to take.
746
+ # @!attribute [rw] period_seconds
747
+ # @return [::Integer]
748
+ # How often (in seconds) to perform the probe. Defaults to 10 seconds.
749
+ # Minimum value is 1. Must be less than timeout_seconds.
750
+ #
751
+ # Maps to Kubernetes probe argument 'periodSeconds'.
752
+ # @!attribute [rw] timeout_seconds
753
+ # @return [::Integer]
754
+ # Number of seconds after which the probe times out. Defaults to 1 second.
755
+ # Minimum value is 1. Must be greater than or equal to period_seconds.
756
+ #
757
+ # Maps to Kubernetes probe argument 'timeoutSeconds'.
758
+ class Probe
759
+ include ::Google::Protobuf::MessageExts
760
+ extend ::Google::Protobuf::MessageExts::ClassMethods
761
+
762
+ # ExecAction specifies a command to execute.
763
+ # @!attribute [rw] command
764
+ # @return [::Array<::String>]
765
+ # Command is the command line to execute inside the container, the working
766
+ # directory for the command is root ('/') in the container's filesystem.
767
+ # The command is simply exec'd, it is not run inside a shell, so
768
+ # traditional shell instructions ('|', etc) won't work. To use a shell, you
769
+ # need to explicitly call out to that shell. Exit status of 0 is treated as
770
+ # live/healthy and non-zero is unhealthy.
771
+ class ExecAction
772
+ include ::Google::Protobuf::MessageExts
773
+ extend ::Google::Protobuf::MessageExts::ClassMethods
774
+ end
775
+ end
715
776
  end
716
777
  end
717
778
  end
@@ -115,7 +115,72 @@ module Google
115
115
  end
116
116
 
117
117
  # Request message for
118
- # [PredictionService.StreamingPredict][google.cloud.aiplatform.v1.PredictionService.StreamingPredict].
118
+ # {::Google::Cloud::AIPlatform::V1::PredictionService::Client#direct_predict PredictionService.DirectPredict}.
119
+ # @!attribute [rw] endpoint
120
+ # @return [::String]
121
+ # Required. The name of the Endpoint requested to serve the prediction.
122
+ # Format:
123
+ # `projects/{project}/locations/{location}/endpoints/{endpoint}`
124
+ # @!attribute [rw] inputs
125
+ # @return [::Array<::Google::Cloud::AIPlatform::V1::Tensor>]
126
+ # The prediction input.
127
+ # @!attribute [rw] parameters
128
+ # @return [::Google::Cloud::AIPlatform::V1::Tensor]
129
+ # The parameters that govern the prediction.
130
+ class DirectPredictRequest
131
+ include ::Google::Protobuf::MessageExts
132
+ extend ::Google::Protobuf::MessageExts::ClassMethods
133
+ end
134
+
135
+ # Response message for
136
+ # {::Google::Cloud::AIPlatform::V1::PredictionService::Client#direct_predict PredictionService.DirectPredict}.
137
+ # @!attribute [rw] outputs
138
+ # @return [::Array<::Google::Cloud::AIPlatform::V1::Tensor>]
139
+ # The prediction output.
140
+ # @!attribute [rw] parameters
141
+ # @return [::Google::Cloud::AIPlatform::V1::Tensor]
142
+ # The parameters that govern the prediction.
143
+ class DirectPredictResponse
144
+ include ::Google::Protobuf::MessageExts
145
+ extend ::Google::Protobuf::MessageExts::ClassMethods
146
+ end
147
+
148
+ # Request message for
149
+ # {::Google::Cloud::AIPlatform::V1::PredictionService::Client#direct_raw_predict PredictionService.DirectRawPredict}.
150
+ # @!attribute [rw] endpoint
151
+ # @return [::String]
152
+ # Required. The name of the Endpoint requested to serve the prediction.
153
+ # Format:
154
+ # `projects/{project}/locations/{location}/endpoints/{endpoint}`
155
+ # @!attribute [rw] method_name
156
+ # @return [::String]
157
+ # Fully qualified name of the API method being invoked to perform
158
+ # predictions.
159
+ #
160
+ # Format:
161
+ # `/namespace.Service/Method/`
162
+ # Example:
163
+ # `/tensorflow.serving.PredictionService/Predict`
164
+ # @!attribute [rw] input
165
+ # @return [::String]
166
+ # The prediction input.
167
+ class DirectRawPredictRequest
168
+ include ::Google::Protobuf::MessageExts
169
+ extend ::Google::Protobuf::MessageExts::ClassMethods
170
+ end
171
+
172
+ # Response message for
173
+ # {::Google::Cloud::AIPlatform::V1::PredictionService::Client#direct_raw_predict PredictionService.DirectRawPredict}.
174
+ # @!attribute [rw] output
175
+ # @return [::String]
176
+ # The prediction output.
177
+ class DirectRawPredictResponse
178
+ include ::Google::Protobuf::MessageExts
179
+ extend ::Google::Protobuf::MessageExts::ClassMethods
180
+ end
181
+
182
+ # Request message for
183
+ # {::Google::Cloud::AIPlatform::V1::PredictionService::Client#streaming_predict PredictionService.StreamingPredict}.
119
184
  #
120
185
  # The first message must contain
121
186
  # {::Google::Cloud::AIPlatform::V1::StreamingPredictRequest#endpoint endpoint} field
@@ -137,7 +202,7 @@ module Google
137
202
  end
138
203
 
139
204
  # Response message for
140
- # [PredictionService.StreamingPredict][google.cloud.aiplatform.v1.PredictionService.StreamingPredict].
205
+ # {::Google::Cloud::AIPlatform::V1::PredictionService::Client#streaming_predict PredictionService.StreamingPredict}.
141
206
  # @!attribute [rw] outputs
142
207
  # @return [::Array<::Google::Cloud::AIPlatform::V1::Tensor>]
143
208
  # The prediction output.
@@ -149,6 +214,51 @@ module Google
149
214
  extend ::Google::Protobuf::MessageExts::ClassMethods
150
215
  end
151
216
 
217
+ # Request message for
218
+ # {::Google::Cloud::AIPlatform::V1::PredictionService::Client#streaming_raw_predict PredictionService.StreamingRawPredict}.
219
+ #
220
+ # The first message must contain
221
+ # {::Google::Cloud::AIPlatform::V1::StreamingRawPredictRequest#endpoint endpoint}
222
+ # and
223
+ # {::Google::Cloud::AIPlatform::V1::StreamingRawPredictRequest#method_name method_name}
224
+ # fields and optionally
225
+ # {::Google::Cloud::AIPlatform::V1::StreamingRawPredictRequest#input input}. The
226
+ # subsequent messages must contain
227
+ # {::Google::Cloud::AIPlatform::V1::StreamingRawPredictRequest#input input}.
228
+ # {::Google::Cloud::AIPlatform::V1::StreamingRawPredictRequest#method_name method_name}
229
+ # in the subsequent messages has no effect.
230
+ # @!attribute [rw] endpoint
231
+ # @return [::String]
232
+ # Required. The name of the Endpoint requested to serve the prediction.
233
+ # Format:
234
+ # `projects/{project}/locations/{location}/endpoints/{endpoint}`
235
+ # @!attribute [rw] method_name
236
+ # @return [::String]
237
+ # Fully qualified name of the API method being invoked to perform
238
+ # predictions.
239
+ #
240
+ # Format:
241
+ # `/namespace.Service/Method/`
242
+ # Example:
243
+ # `/tensorflow.serving.PredictionService/Predict`
244
+ # @!attribute [rw] input
245
+ # @return [::String]
246
+ # The prediction input.
247
+ class StreamingRawPredictRequest
248
+ include ::Google::Protobuf::MessageExts
249
+ extend ::Google::Protobuf::MessageExts::ClassMethods
250
+ end
251
+
252
+ # Response message for
253
+ # {::Google::Cloud::AIPlatform::V1::PredictionService::Client#streaming_raw_predict PredictionService.StreamingRawPredict}.
254
+ # @!attribute [rw] output
255
+ # @return [::String]
256
+ # The prediction output.
257
+ class StreamingRawPredictResponse
258
+ include ::Google::Protobuf::MessageExts
259
+ extend ::Google::Protobuf::MessageExts::ClassMethods
260
+ end
261
+
152
262
  # Request message for
153
263
  # {::Google::Cloud::AIPlatform::V1::PredictionService::Client#explain PredictionService.Explain}.
154
264
  # @!attribute [rw] endpoint
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: google-cloud-ai_platform-v1
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.34.0
4
+ version: 0.35.0
5
5
  platform: ruby
6
6
  authors:
7
7
  - Google LLC
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2023-11-20 00:00:00.000000000 Z
11
+ date: 2023-12-04 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: gapic-common
@@ -260,6 +260,10 @@ files:
260
260
  - lib/google/cloud/ai_platform/v1/job_service/credentials.rb
261
261
  - lib/google/cloud/ai_platform/v1/job_service/operations.rb
262
262
  - lib/google/cloud/ai_platform/v1/job_service/paths.rb
263
+ - lib/google/cloud/ai_platform/v1/llm_utility_service.rb
264
+ - lib/google/cloud/ai_platform/v1/llm_utility_service/client.rb
265
+ - lib/google/cloud/ai_platform/v1/llm_utility_service/credentials.rb
266
+ - lib/google/cloud/ai_platform/v1/llm_utility_service/paths.rb
263
267
  - lib/google/cloud/ai_platform/v1/match_service.rb
264
268
  - lib/google/cloud/ai_platform/v1/match_service/client.rb
265
269
  - lib/google/cloud/ai_platform/v1/match_service/credentials.rb
@@ -371,6 +375,8 @@ files:
371
375
  - lib/google/cloud/aiplatform/v1/job_service_services_pb.rb
372
376
  - lib/google/cloud/aiplatform/v1/job_state_pb.rb
373
377
  - lib/google/cloud/aiplatform/v1/lineage_subgraph_pb.rb
378
+ - lib/google/cloud/aiplatform/v1/llm_utility_service_pb.rb
379
+ - lib/google/cloud/aiplatform/v1/llm_utility_service_services_pb.rb
374
380
  - lib/google/cloud/aiplatform/v1/machine_resources_pb.rb
375
381
  - lib/google/cloud/aiplatform/v1/manual_batch_tuning_parameters_pb.rb
376
382
  - lib/google/cloud/aiplatform/v1/match_service_pb.rb
@@ -478,6 +484,7 @@ files:
478
484
  - proto_docs/google/cloud/aiplatform/v1/job_service.rb
479
485
  - proto_docs/google/cloud/aiplatform/v1/job_state.rb
480
486
  - proto_docs/google/cloud/aiplatform/v1/lineage_subgraph.rb
487
+ - proto_docs/google/cloud/aiplatform/v1/llm_utility_service.rb
481
488
  - proto_docs/google/cloud/aiplatform/v1/machine_resources.rb
482
489
  - proto_docs/google/cloud/aiplatform/v1/manual_batch_tuning_parameters.rb
483
490
  - proto_docs/google/cloud/aiplatform/v1/match_service.rb