google-cloud-ai_platform-v1 0.34.0 → 0.35.0

Sign up to get free protection for your applications and to get access to all the features.
@@ -14,7 +14,7 @@ require 'google/cloud/aiplatform/v1/types_pb'
14
14
  require 'google/protobuf/struct_pb'
15
15
 
16
16
 
17
- descriptor_data = "\n3google/cloud/aiplatform/v1/prediction_service.proto\x12\x1agoogle.cloud.aiplatform.v1\x1a\x1cgoogle/api/annotations.proto\x1a\x17google/api/client.proto\x1a\x1fgoogle/api/field_behavior.proto\x1a\x19google/api/httpbody.proto\x1a\x19google/api/resource.proto\x1a,google/cloud/aiplatform/v1/explanation.proto\x1a&google/cloud/aiplatform/v1/types.proto\x1a\x1cgoogle/protobuf/struct.proto\"\xaa\x01\n\x0ePredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12.\n\tinstances\x18\x02 \x03(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x02\x12*\n\nparameters\x18\x03 \x01(\x0b\x32\x16.google.protobuf.Value\"\x80\x02\n\x0fPredictResponse\x12+\n\x0bpredictions\x18\x01 \x03(\x0b\x32\x16.google.protobuf.Value\x12\x19\n\x11\x64\x65ployed_model_id\x18\x02 \x01(\t\x12\x36\n\x05model\x18\x03 \x01(\tB\'\xe0\x41\x03\xfa\x41!\n\x1f\x61iplatform.googleapis.com/Model\x12\x1d\n\x10model_version_id\x18\x05 \x01(\tB\x03\xe0\x41\x03\x12\x1f\n\x12model_display_name\x18\x04 \x01(\tB\x03\xe0\x41\x03\x12-\n\x08metadata\x18\x06 \x01(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x03\"z\n\x11RawPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\'\n\thttp_body\x18\x02 \x01(\x0b\x32\x14.google.api.HttpBody\"\xc3\x01\n\x17StreamingPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\x32\n\x06inputs\x18\x02 \x03(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\x12\x36\n\nparameters\x18\x03 \x01(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\"\x87\x01\n\x18StreamingPredictResponse\x12\x33\n\x07outputs\x18\x01 \x03(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\x12\x36\n\nparameters\x18\x02 \x01(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\"\x9d\x02\n\x0e\x45xplainRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12.\n\tinstances\x18\x02 
\x03(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x02\x12*\n\nparameters\x18\x04 \x01(\x0b\x32\x16.google.protobuf.Value\x12V\n\x19\x65xplanation_spec_override\x18\x05 \x01(\x0b\x32\x33.google.cloud.aiplatform.v1.ExplanationSpecOverride\x12\x19\n\x11\x64\x65ployed_model_id\x18\x03 \x01(\t\"\x98\x01\n\x0f\x45xplainResponse\x12=\n\x0c\x65xplanations\x18\x01 \x03(\x0b\x32\'.google.cloud.aiplatform.v1.Explanation\x12\x19\n\x11\x64\x65ployed_model_id\x18\x02 \x01(\t\x12+\n\x0bpredictions\x18\x03 \x03(\x0b\x32\x16.google.protobuf.Value\"\x82\x01\n\x12\x43ountTokensRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12.\n\tinstances\x18\x02 \x03(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x02\"N\n\x13\x43ountTokensResponse\x12\x14\n\x0ctotal_tokens\x18\x01 \x01(\x05\x12!\n\x19total_billable_characters\x18\x02 \x01(\x05\x32\x8f\t\n\x11PredictionService\x12\x94\x02\n\x07Predict\x12*.google.cloud.aiplatform.v1.PredictRequest\x1a+.google.cloud.aiplatform.v1.PredictResponse\"\xaf\x01\x82\xd3\xe4\x93\x02\x88\x01\"9/v1/{endpoint=projects/*/locations/*/endpoints/*}:predict:\x01*ZH\"C/v1/{endpoint=projects/*/locations/*/publishers/*/models/*}:predict:\x01*\xda\x41\x1d\x65ndpoint,instances,parameters\x12\xfe\x01\n\nRawPredict\x12-.google.cloud.aiplatform.v1.RawPredictRequest\x1a\x14.google.api.HttpBody\"\xaa\x01\x82\xd3\xe4\x93\x02\x8e\x01\"</v1/{endpoint=projects/*/locations/*/endpoints/*}:rawPredict:\x01*ZK\"F/v1/{endpoint=projects/*/locations/*/publishers/*/models/*}:rawPredict:\x01*\xda\x41\x12\x65ndpoint,http_body\x12\xb5\x02\n\x16ServerStreamingPredict\x12\x33.google.cloud.aiplatform.v1.StreamingPredictRequest\x1a\x34.google.cloud.aiplatform.v1.StreamingPredictResponse\"\xad\x01\x82\xd3\xe4\x93\x02\xa6\x01\"H/v1/{endpoint=projects/*/locations/*/endpoints/*}:serverStreamingPredict:\x01*ZW\"R/v1/{endpoint=projects/*/locations/*/publishers/*/models/*}:serverStreamingPredict:\x01*0\x01\x12\xda\x01\n\x07\x45xplain\x12*.
google.cloud.aiplatform.v1.ExplainRequest\x1a+.google.cloud.aiplatform.v1.ExplainResponse\"v\x82\xd3\xe4\x93\x02>\"9/v1/{endpoint=projects/*/locations/*/endpoints/*}:explain:\x01*\xda\x41/endpoint,instances,parameters,deployed_model_id\x1aM\xca\x41\x19\x61iplatform.googleapis.com\xd2\x41.https://www.googleapis.com/auth/cloud-platformB\xd4\x01\n\x1e\x63om.google.cloud.aiplatform.v1B\x16PredictionServiceProtoP\x01Z>cloud.google.com/go/aiplatform/apiv1/aiplatformpb;aiplatformpb\xaa\x02\x1aGoogle.Cloud.AIPlatform.V1\xca\x02\x1aGoogle\\Cloud\\AIPlatform\\V1\xea\x02\x1dGoogle::Cloud::AIPlatform::V1b\x06proto3"
17
+ descriptor_data = "\n3google/cloud/aiplatform/v1/prediction_service.proto\x12\x1agoogle.cloud.aiplatform.v1\x1a\x1cgoogle/api/annotations.proto\x1a\x17google/api/client.proto\x1a\x1fgoogle/api/field_behavior.proto\x1a\x19google/api/httpbody.proto\x1a\x19google/api/resource.proto\x1a,google/cloud/aiplatform/v1/explanation.proto\x1a&google/cloud/aiplatform/v1/types.proto\x1a\x1cgoogle/protobuf/struct.proto\"\xaa\x01\n\x0ePredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12.\n\tinstances\x18\x02 \x03(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x02\x12*\n\nparameters\x18\x03 \x01(\x0b\x32\x16.google.protobuf.Value\"\x80\x02\n\x0fPredictResponse\x12+\n\x0bpredictions\x18\x01 \x03(\x0b\x32\x16.google.protobuf.Value\x12\x19\n\x11\x64\x65ployed_model_id\x18\x02 \x01(\t\x12\x36\n\x05model\x18\x03 \x01(\tB\'\xe0\x41\x03\xfa\x41!\n\x1f\x61iplatform.googleapis.com/Model\x12\x1d\n\x10model_version_id\x18\x05 \x01(\tB\x03\xe0\x41\x03\x12\x1f\n\x12model_display_name\x18\x04 \x01(\tB\x03\xe0\x41\x03\x12-\n\x08metadata\x18\x06 \x01(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x03\"z\n\x11RawPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\'\n\thttp_body\x18\x02 \x01(\x0b\x32\x14.google.api.HttpBody\"\xc0\x01\n\x14\x44irectPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\x32\n\x06inputs\x18\x02 \x03(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\x12\x36\n\nparameters\x18\x03 \x01(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\"\x84\x01\n\x15\x44irectPredictResponse\x12\x33\n\x07outputs\x18\x01 \x03(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\x12\x36\n\nparameters\x18\x02 \x01(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\"{\n\x17\x44irectRawPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 
\x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\x13\n\x0bmethod_name\x18\x02 \x01(\t\x12\r\n\x05input\x18\x03 \x01(\x0c\"*\n\x18\x44irectRawPredictResponse\x12\x0e\n\x06output\x18\x01 \x01(\x0c\"\xc3\x01\n\x17StreamingPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\x32\n\x06inputs\x18\x02 \x03(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\x12\x36\n\nparameters\x18\x03 \x01(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\"\x87\x01\n\x18StreamingPredictResponse\x12\x33\n\x07outputs\x18\x01 \x03(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\x12\x36\n\nparameters\x18\x02 \x01(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\"~\n\x1aStreamingRawPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\x13\n\x0bmethod_name\x18\x02 \x01(\t\x12\r\n\x05input\x18\x03 \x01(\x0c\"-\n\x1bStreamingRawPredictResponse\x12\x0e\n\x06output\x18\x01 \x01(\x0c\"\x9d\x02\n\x0e\x45xplainRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12.\n\tinstances\x18\x02 \x03(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x02\x12*\n\nparameters\x18\x04 \x01(\x0b\x32\x16.google.protobuf.Value\x12V\n\x19\x65xplanation_spec_override\x18\x05 \x01(\x0b\x32\x33.google.cloud.aiplatform.v1.ExplanationSpecOverride\x12\x19\n\x11\x64\x65ployed_model_id\x18\x03 \x01(\t\"\x98\x01\n\x0f\x45xplainResponse\x12=\n\x0c\x65xplanations\x18\x01 \x03(\x0b\x32\'.google.cloud.aiplatform.v1.Explanation\x12\x19\n\x11\x64\x65ployed_model_id\x18\x02 \x01(\t\x12+\n\x0bpredictions\x18\x03 \x03(\x0b\x32\x16.google.protobuf.Value\"\x82\x01\n\x12\x43ountTokensRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12.\n\tinstances\x18\x02 \x03(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x02\"N\n\x13\x43ountTokensResponse\x12\x14\n\x0ctotal_tokens\x18\x01 
\x01(\x05\x12!\n\x19total_billable_characters\x18\x02 \x01(\x05\x32\xb6\x0e\n\x11PredictionService\x12\x94\x02\n\x07Predict\x12*.google.cloud.aiplatform.v1.PredictRequest\x1a+.google.cloud.aiplatform.v1.PredictResponse\"\xaf\x01\x82\xd3\xe4\x93\x02\x88\x01\"9/v1/{endpoint=projects/*/locations/*/endpoints/*}:predict:\x01*ZH\"C/v1/{endpoint=projects/*/locations/*/publishers/*/models/*}:predict:\x01*\xda\x41\x1d\x65ndpoint,instances,parameters\x12\xfe\x01\n\nRawPredict\x12-.google.cloud.aiplatform.v1.RawPredictRequest\x1a\x14.google.api.HttpBody\"\xaa\x01\x82\xd3\xe4\x93\x02\x8e\x01\"</v1/{endpoint=projects/*/locations/*/endpoints/*}:rawPredict:\x01*ZK\"F/v1/{endpoint=projects/*/locations/*/publishers/*/models/*}:rawPredict:\x01*\xda\x41\x12\x65ndpoint,http_body\x12\xc0\x01\n\rDirectPredict\x12\x30.google.cloud.aiplatform.v1.DirectPredictRequest\x1a\x31.google.cloud.aiplatform.v1.DirectPredictResponse\"J\x82\xd3\xe4\x93\x02\x44\"?/v1/{endpoint=projects/*/locations/*/endpoints/*}:directPredict:\x01*\x12\xcc\x01\n\x10\x44irectRawPredict\x12\x33.google.cloud.aiplatform.v1.DirectRawPredictRequest\x1a\x34.google.cloud.aiplatform.v1.DirectRawPredictResponse\"M\x82\xd3\xe4\x93\x02G\"B/v1/{endpoint=projects/*/locations/*/endpoints/*}:directRawPredict:\x01*\x12\x83\x01\n\x10StreamingPredict\x12\x33.google.cloud.aiplatform.v1.StreamingPredictRequest\x1a\x34.google.cloud.aiplatform.v1.StreamingPredictResponse\"\x00(\x01\x30\x01\x12\xb5\x02\n\x16ServerStreamingPredict\x12\x33.google.cloud.aiplatform.v1.StreamingPredictRequest\x1a\x34.google.cloud.aiplatform.v1.StreamingPredictResponse\"\xad\x01\x82\xd3\xe4\x93\x02\xa6\x01\"H/v1/{endpoint=projects/*/locations/*/endpoints/*}:serverStreamingPredict:\x01*ZW\"R/v1/{endpoint=projects/*/locations/*/publishers/*/models/*}:serverStreamingPredict:\x01*0\x01\x12\x8c\x01\n\x13StreamingRawPredict\x12\x36.google.cloud.aiplatform.v1.StreamingRawPredictRequest\x1a\x37.google.cloud.aiplatform.v1.StreamingRawPredictResponse\"\x00(\x01\x30\x01\x12\x
da\x01\n\x07\x45xplain\x12*.google.cloud.aiplatform.v1.ExplainRequest\x1a+.google.cloud.aiplatform.v1.ExplainResponse\"v\x82\xd3\xe4\x93\x02>\"9/v1/{endpoint=projects/*/locations/*/endpoints/*}:explain:\x01*\xda\x41/endpoint,instances,parameters,deployed_model_id\x1aM\xca\x41\x19\x61iplatform.googleapis.com\xd2\x41.https://www.googleapis.com/auth/cloud-platformB\xd4\x01\n\x1e\x63om.google.cloud.aiplatform.v1B\x16PredictionServiceProtoP\x01Z>cloud.google.com/go/aiplatform/apiv1/aiplatformpb;aiplatformpb\xaa\x02\x1aGoogle.Cloud.AIPlatform.V1\xca\x02\x1aGoogle\\Cloud\\AIPlatform\\V1\xea\x02\x1dGoogle::Cloud::AIPlatform::V1b\x06proto3"
18
18
 
19
19
  pool = Google::Protobuf::DescriptorPool.generated_pool
20
20
 
@@ -51,8 +51,14 @@ module Google
51
51
  PredictRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.PredictRequest").msgclass
52
52
  PredictResponse = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.PredictResponse").msgclass
53
53
  RawPredictRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.RawPredictRequest").msgclass
54
+ DirectPredictRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.DirectPredictRequest").msgclass
55
+ DirectPredictResponse = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.DirectPredictResponse").msgclass
56
+ DirectRawPredictRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.DirectRawPredictRequest").msgclass
57
+ DirectRawPredictResponse = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.DirectRawPredictResponse").msgclass
54
58
  StreamingPredictRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.StreamingPredictRequest").msgclass
55
59
  StreamingPredictResponse = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.StreamingPredictResponse").msgclass
60
+ StreamingRawPredictRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.StreamingRawPredictRequest").msgclass
61
+ StreamingRawPredictResponse = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.StreamingRawPredictResponse").msgclass
56
62
  ExplainRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.ExplainRequest").msgclass
57
63
  ExplainResponse = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.ExplainResponse").msgclass
58
64
  CountTokensRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.CountTokensRequest").msgclass
@@ -47,9 +47,19 @@ module Google
47
47
  # [DeployedModel][google.cloud.aiplatform.v1.DeployedModel] that served this
48
48
  # prediction.
49
49
  rpc :RawPredict, ::Google::Cloud::AIPlatform::V1::RawPredictRequest, ::Google::Api::HttpBody
50
+ # Perform a unary online prediction request for Vertex first-party products
51
+ # and frameworks.
52
+ rpc :DirectPredict, ::Google::Cloud::AIPlatform::V1::DirectPredictRequest, ::Google::Cloud::AIPlatform::V1::DirectPredictResponse
53
+ # Perform an online prediction request through gRPC.
54
+ rpc :DirectRawPredict, ::Google::Cloud::AIPlatform::V1::DirectRawPredictRequest, ::Google::Cloud::AIPlatform::V1::DirectRawPredictResponse
55
+ # Perform a streaming online prediction request for Vertex first-party
56
+ # products and frameworks.
57
+ rpc :StreamingPredict, stream(::Google::Cloud::AIPlatform::V1::StreamingPredictRequest), stream(::Google::Cloud::AIPlatform::V1::StreamingPredictResponse)
50
58
  # Perform a server-side streaming online prediction request for Vertex
51
59
  # LLM streaming.
52
60
  rpc :ServerStreamingPredict, ::Google::Cloud::AIPlatform::V1::StreamingPredictRequest, stream(::Google::Cloud::AIPlatform::V1::StreamingPredictResponse)
61
+ # Perform a streaming online prediction request through gRPC.
62
+ rpc :StreamingRawPredict, stream(::Google::Cloud::AIPlatform::V1::StreamingRawPredictRequest), stream(::Google::Cloud::AIPlatform::V1::StreamingRawPredictResponse)
53
63
  # Perform an online explanation.
54
64
  #
55
65
  # If
@@ -304,6 +304,19 @@ module Google
304
304
  # seconds: 360 # 6 minutes
305
305
  # total_poll_timeout:
306
306
  # seconds: 54000 # 90 minutes
307
+ # @!attribute [rw] auto_populated_fields
308
+ # @return [::Array<::String>]
309
+ # List of top-level fields of the request message that should be
310
+ # automatically populated by the client libraries based on their
311
+ # (google.api.field_info).format. Currently supported format: UUID4.
312
+ #
313
+ # Example of a YAML configuration:
314
+ #
315
+ # publishing:
316
+ # method_settings:
317
+ # - selector: google.example.v1.ExampleService.CreateExample
318
+ # auto_populated_fields:
319
+ # - request_id
307
320
  class MethodSettings
308
321
  include ::Google::Protobuf::MessageExts
309
322
  extend ::Google::Protobuf::MessageExts::ClassMethods
@@ -0,0 +1,64 @@
1
+ # frozen_string_literal: true
2
+
3
+ # Copyright 2023 Google LLC
4
+ #
5
+ # Licensed under the Apache License, Version 2.0 (the "License");
6
+ # you may not use this file except in compliance with the License.
7
+ # You may obtain a copy of the License at
8
+ #
9
+ # https://www.apache.org/licenses/LICENSE-2.0
10
+ #
11
+ # Unless required by applicable law or agreed to in writing, software
12
+ # distributed under the License is distributed on an "AS IS" BASIS,
13
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14
+ # See the License for the specific language governing permissions and
15
+ # limitations under the License.
16
+
17
+ # Auto-generated by gapic-generator-ruby. DO NOT EDIT!
18
+
19
+
20
+ module Google
21
+ module Cloud
22
+ module AIPlatform
23
+ module V1
24
+ # Request message for ComputeTokens RPC call.
25
+ # @!attribute [rw] endpoint
26
+ # @return [::String]
27
+ # Required. The name of the Endpoint requested to get lists of tokens and
28
+ # token ids.
29
+ # @!attribute [rw] instances
30
+ # @return [::Array<::Google::Protobuf::Value>]
31
+ # Required. The instances that are the input to token computing API call.
32
+ # Schema is identical to the prediction schema of the text model, even for
33
+ # the non-text models, like chat models, or Codey models.
34
+ class ComputeTokensRequest
35
+ include ::Google::Protobuf::MessageExts
36
+ extend ::Google::Protobuf::MessageExts::ClassMethods
37
+ end
38
+
39
+ # Tokens info with a list of tokens and the corresponding list of token ids.
40
+ # @!attribute [rw] tokens
41
+ # @return [::Array<::String>]
42
+ # A list of tokens from the input.
43
+ # @!attribute [rw] token_ids
44
+ # @return [::Array<::Integer>]
45
+ # A list of token ids from the input.
46
+ class TokensInfo
47
+ include ::Google::Protobuf::MessageExts
48
+ extend ::Google::Protobuf::MessageExts::ClassMethods
49
+ end
50
+
51
+ # Response message for ComputeTokens RPC call.
52
+ # @!attribute [rw] tokens_info
53
+ # @return [::Array<::Google::Cloud::AIPlatform::V1::TokensInfo>]
54
+ # Lists of tokens info from the input. A ComputeTokensRequest could have
55
+ # multiple instances with a prompt in each instance. We also need to return
56
+ # lists of tokens info for the request with multiple instances.
57
+ class ComputeTokensResponse
58
+ include ::Google::Protobuf::MessageExts
59
+ extend ::Google::Protobuf::MessageExts::ClassMethods
60
+ end
61
+ end
62
+ end
63
+ end
64
+ end
@@ -663,6 +663,31 @@ module Google
663
663
  # (Vertex AI makes this value available to your container code as the
664
664
  # [`AIP_DEPLOYED_MODEL_ID` environment
665
665
  # variable](https://cloud.google.com/vertex-ai/docs/predictions/custom-container-requirements#aip-variables).)
666
+ # @!attribute [rw] grpc_ports
667
+ # @return [::Array<::Google::Cloud::AIPlatform::V1::Port>]
668
+ # Immutable. List of ports to expose from the container. Vertex AI sends gRPC
669
+ # prediction requests that it receives to the first port on this list. Vertex
670
+ # AI also sends liveness and health checks to this port.
671
+ #
672
+ # If you do not specify this field, gRPC requests to the container will be
673
+ # disabled.
674
+ #
675
+ # Vertex AI does not use ports other than the first one listed. This field
676
+ # corresponds to the `ports` field of the Kubernetes Containers v1 core API.
677
+ # @!attribute [rw] deployment_timeout
678
+ # @return [::Google::Protobuf::Duration]
679
+ # Immutable. Deployment timeout.
680
+ # Limit for deployment timeout is 2 hours.
681
+ # @!attribute [rw] shared_memory_size_mb
682
+ # @return [::Integer]
683
+ # Immutable. The amount of the VM memory to reserve as the shared memory for
684
+ # the model in megabytes.
685
+ # @!attribute [rw] startup_probe
686
+ # @return [::Google::Cloud::AIPlatform::V1::Probe]
687
+ # Immutable. Specification for Kubernetes startup probe.
688
+ # @!attribute [rw] health_probe
689
+ # @return [::Google::Cloud::AIPlatform::V1::Probe]
690
+ # Immutable. Specification for Kubernetes readiness probe.
666
691
  class ModelContainerSpec
667
692
  include ::Google::Protobuf::MessageExts
668
693
  extend ::Google::Protobuf::MessageExts::ClassMethods
@@ -712,6 +737,42 @@ module Google
712
737
  GENIE = 5
713
738
  end
714
739
  end
740
+
741
+ # Probe describes a health check to be performed against a container to
742
+ # determine whether it is alive or ready to receive traffic.
743
+ # @!attribute [rw] exec
744
+ # @return [::Google::Cloud::AIPlatform::V1::Probe::ExecAction]
745
+ # Exec specifies the action to take.
746
+ # @!attribute [rw] period_seconds
747
+ # @return [::Integer]
748
+ # How often (in seconds) to perform the probe. Defaults to 10 seconds.
749
+ # Minimum value is 1. Must be less than timeout_seconds.
750
+ #
751
+ # Maps to Kubernetes probe argument 'periodSeconds'.
752
+ # @!attribute [rw] timeout_seconds
753
+ # @return [::Integer]
754
+ # Number of seconds after which the probe times out. Defaults to 1 second.
755
+ # Minimum value is 1. Must be greater than or equal to period_seconds.
756
+ #
757
+ # Maps to Kubernetes probe argument 'timeoutSeconds'.
758
+ class Probe
759
+ include ::Google::Protobuf::MessageExts
760
+ extend ::Google::Protobuf::MessageExts::ClassMethods
761
+
762
+ # ExecAction specifies a command to execute.
763
+ # @!attribute [rw] command
764
+ # @return [::Array<::String>]
765
+ # Command is the command line to execute inside the container, the working
766
+ # directory for the command is root ('/') in the container's filesystem.
767
+ # The command is simply exec'd, it is not run inside a shell, so
768
+ # traditional shell instructions ('|', etc) won't work. To use a shell, you
769
+ # need to explicitly call out to that shell. Exit status of 0 is treated as
770
+ # live/healthy and non-zero is unhealthy.
771
+ class ExecAction
772
+ include ::Google::Protobuf::MessageExts
773
+ extend ::Google::Protobuf::MessageExts::ClassMethods
774
+ end
775
+ end
715
776
  end
716
777
  end
717
778
  end
@@ -115,7 +115,72 @@ module Google
115
115
  end
116
116
 
117
117
  # Request message for
118
- # [PredictionService.StreamingPredict][google.cloud.aiplatform.v1.PredictionService.StreamingPredict].
118
+ # {::Google::Cloud::AIPlatform::V1::PredictionService::Client#direct_predict PredictionService.DirectPredict}.
119
+ # @!attribute [rw] endpoint
120
+ # @return [::String]
121
+ # Required. The name of the Endpoint requested to serve the prediction.
122
+ # Format:
123
+ # `projects/{project}/locations/{location}/endpoints/{endpoint}`
124
+ # @!attribute [rw] inputs
125
+ # @return [::Array<::Google::Cloud::AIPlatform::V1::Tensor>]
126
+ # The prediction input.
127
+ # @!attribute [rw] parameters
128
+ # @return [::Google::Cloud::AIPlatform::V1::Tensor]
129
+ # The parameters that govern the prediction.
130
+ class DirectPredictRequest
131
+ include ::Google::Protobuf::MessageExts
132
+ extend ::Google::Protobuf::MessageExts::ClassMethods
133
+ end
134
+
135
+ # Response message for
136
+ # {::Google::Cloud::AIPlatform::V1::PredictionService::Client#direct_predict PredictionService.DirectPredict}.
137
+ # @!attribute [rw] outputs
138
+ # @return [::Array<::Google::Cloud::AIPlatform::V1::Tensor>]
139
+ # The prediction output.
140
+ # @!attribute [rw] parameters
141
+ # @return [::Google::Cloud::AIPlatform::V1::Tensor]
142
+ # The parameters that govern the prediction.
143
+ class DirectPredictResponse
144
+ include ::Google::Protobuf::MessageExts
145
+ extend ::Google::Protobuf::MessageExts::ClassMethods
146
+ end
147
+
148
+ # Request message for
149
+ # {::Google::Cloud::AIPlatform::V1::PredictionService::Client#direct_raw_predict PredictionService.DirectRawPredict}.
150
+ # @!attribute [rw] endpoint
151
+ # @return [::String]
152
+ # Required. The name of the Endpoint requested to serve the prediction.
153
+ # Format:
154
+ # `projects/{project}/locations/{location}/endpoints/{endpoint}`
155
+ # @!attribute [rw] method_name
156
+ # @return [::String]
157
+ # Fully qualified name of the API method being invoked to perform
158
+ # predictions.
159
+ #
160
+ # Format:
161
+ # `/namespace.Service/Method/`
162
+ # Example:
163
+ # `/tensorflow.serving.PredictionService/Predict`
164
+ # @!attribute [rw] input
165
+ # @return [::String]
166
+ # The prediction input.
167
+ class DirectRawPredictRequest
168
+ include ::Google::Protobuf::MessageExts
169
+ extend ::Google::Protobuf::MessageExts::ClassMethods
170
+ end
171
+
172
+ # Response message for
173
+ # {::Google::Cloud::AIPlatform::V1::PredictionService::Client#direct_raw_predict PredictionService.DirectRawPredict}.
174
+ # @!attribute [rw] output
175
+ # @return [::String]
176
+ # The prediction output.
177
+ class DirectRawPredictResponse
178
+ include ::Google::Protobuf::MessageExts
179
+ extend ::Google::Protobuf::MessageExts::ClassMethods
180
+ end
181
+
182
+ # Request message for
183
+ # {::Google::Cloud::AIPlatform::V1::PredictionService::Client#streaming_predict PredictionService.StreamingPredict}.
119
184
  #
120
185
  # The first message must contain
121
186
  # {::Google::Cloud::AIPlatform::V1::StreamingPredictRequest#endpoint endpoint} field
@@ -137,7 +202,7 @@ module Google
137
202
  end
138
203
 
139
204
  # Response message for
140
- # [PredictionService.StreamingPredict][google.cloud.aiplatform.v1.PredictionService.StreamingPredict].
205
+ # {::Google::Cloud::AIPlatform::V1::PredictionService::Client#streaming_predict PredictionService.StreamingPredict}.
141
206
  # @!attribute [rw] outputs
142
207
  # @return [::Array<::Google::Cloud::AIPlatform::V1::Tensor>]
143
208
  # The prediction output.
@@ -149,6 +214,51 @@ module Google
149
214
  extend ::Google::Protobuf::MessageExts::ClassMethods
150
215
  end
151
216
 
217
+ # Request message for
218
+ # {::Google::Cloud::AIPlatform::V1::PredictionService::Client#streaming_raw_predict PredictionService.StreamingRawPredict}.
219
+ #
220
+ # The first message must contain
221
+ # {::Google::Cloud::AIPlatform::V1::StreamingRawPredictRequest#endpoint endpoint}
222
+ # and
223
+ # {::Google::Cloud::AIPlatform::V1::StreamingRawPredictRequest#method_name method_name}
224
+ # fields and optionally
225
+ # {::Google::Cloud::AIPlatform::V1::StreamingRawPredictRequest#input input}. The
226
+ # subsequent messages must contain
227
+ # {::Google::Cloud::AIPlatform::V1::StreamingRawPredictRequest#input input}.
228
+ # {::Google::Cloud::AIPlatform::V1::StreamingRawPredictRequest#method_name method_name}
229
+ # in the subsequent messages has no effect.
230
+ # @!attribute [rw] endpoint
231
+ # @return [::String]
232
+ # Required. The name of the Endpoint requested to serve the prediction.
233
+ # Format:
234
+ # `projects/{project}/locations/{location}/endpoints/{endpoint}`
235
+ # @!attribute [rw] method_name
236
+ # @return [::String]
237
+ # Fully qualified name of the API method being invoked to perform
238
+ # predictions.
239
+ #
240
+ # Format:
241
+ # `/namespace.Service/Method/`
242
+ # Example:
243
+ # `/tensorflow.serving.PredictionService/Predict`
244
+ # @!attribute [rw] input
245
+ # @return [::String]
246
+ # The prediction input.
247
+ class StreamingRawPredictRequest
248
+ include ::Google::Protobuf::MessageExts
249
+ extend ::Google::Protobuf::MessageExts::ClassMethods
250
+ end
251
+
252
+ # Response message for
253
+ # {::Google::Cloud::AIPlatform::V1::PredictionService::Client#streaming_raw_predict PredictionService.StreamingRawPredict}.
254
+ # @!attribute [rw] output
255
+ # @return [::String]
256
+ # The prediction output.
257
+ class StreamingRawPredictResponse
258
+ include ::Google::Protobuf::MessageExts
259
+ extend ::Google::Protobuf::MessageExts::ClassMethods
260
+ end
261
+
152
262
  # Request message for
153
263
  # {::Google::Cloud::AIPlatform::V1::PredictionService::Client#explain PredictionService.Explain}.
154
264
  # @!attribute [rw] endpoint
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: google-cloud-ai_platform-v1
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.34.0
4
+ version: 0.35.0
5
5
  platform: ruby
6
6
  authors:
7
7
  - Google LLC
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2023-11-20 00:00:00.000000000 Z
11
+ date: 2023-12-04 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: gapic-common
@@ -260,6 +260,10 @@ files:
260
260
  - lib/google/cloud/ai_platform/v1/job_service/credentials.rb
261
261
  - lib/google/cloud/ai_platform/v1/job_service/operations.rb
262
262
  - lib/google/cloud/ai_platform/v1/job_service/paths.rb
263
+ - lib/google/cloud/ai_platform/v1/llm_utility_service.rb
264
+ - lib/google/cloud/ai_platform/v1/llm_utility_service/client.rb
265
+ - lib/google/cloud/ai_platform/v1/llm_utility_service/credentials.rb
266
+ - lib/google/cloud/ai_platform/v1/llm_utility_service/paths.rb
263
267
  - lib/google/cloud/ai_platform/v1/match_service.rb
264
268
  - lib/google/cloud/ai_platform/v1/match_service/client.rb
265
269
  - lib/google/cloud/ai_platform/v1/match_service/credentials.rb
@@ -371,6 +375,8 @@ files:
371
375
  - lib/google/cloud/aiplatform/v1/job_service_services_pb.rb
372
376
  - lib/google/cloud/aiplatform/v1/job_state_pb.rb
373
377
  - lib/google/cloud/aiplatform/v1/lineage_subgraph_pb.rb
378
+ - lib/google/cloud/aiplatform/v1/llm_utility_service_pb.rb
379
+ - lib/google/cloud/aiplatform/v1/llm_utility_service_services_pb.rb
374
380
  - lib/google/cloud/aiplatform/v1/machine_resources_pb.rb
375
381
  - lib/google/cloud/aiplatform/v1/manual_batch_tuning_parameters_pb.rb
376
382
  - lib/google/cloud/aiplatform/v1/match_service_pb.rb
@@ -478,6 +484,7 @@ files:
478
484
  - proto_docs/google/cloud/aiplatform/v1/job_service.rb
479
485
  - proto_docs/google/cloud/aiplatform/v1/job_state.rb
480
486
  - proto_docs/google/cloud/aiplatform/v1/lineage_subgraph.rb
487
+ - proto_docs/google/cloud/aiplatform/v1/llm_utility_service.rb
481
488
  - proto_docs/google/cloud/aiplatform/v1/machine_resources.rb
482
489
  - proto_docs/google/cloud/aiplatform/v1/manual_batch_tuning_parameters.rb
483
490
  - proto_docs/google/cloud/aiplatform/v1/match_service.rb