google-cloud-ai_platform-v1 0.34.0 → 0.35.0
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/lib/google/cloud/ai_platform/v1/llm_utility_service/client.rb +528 -0
- data/lib/google/cloud/ai_platform/v1/llm_utility_service/credentials.rb +47 -0
- data/lib/google/cloud/ai_platform/v1/llm_utility_service/paths.rb +78 -0
- data/lib/google/cloud/ai_platform/v1/llm_utility_service.rb +49 -0
- data/lib/google/cloud/ai_platform/v1/prediction_service/client.rb +374 -0
- data/lib/google/cloud/ai_platform/v1/version.rb +1 -1
- data/lib/google/cloud/ai_platform/v1.rb +2 -1
- data/lib/google/cloud/aiplatform/v1/llm_utility_service_pb.rb +52 -0
- data/lib/google/cloud/aiplatform/v1/llm_utility_service_services_pb.rb +47 -0
- data/lib/google/cloud/aiplatform/v1/model_pb.rb +5 -1
- data/lib/google/cloud/aiplatform/v1/prediction_service_pb.rb +7 -1
- data/lib/google/cloud/aiplatform/v1/prediction_service_services_pb.rb +10 -0
- data/proto_docs/google/api/client.rb +13 -0
- data/proto_docs/google/cloud/aiplatform/v1/llm_utility_service.rb +64 -0
- data/proto_docs/google/cloud/aiplatform/v1/model.rb +61 -0
- data/proto_docs/google/cloud/aiplatform/v1/prediction_service.rb +112 -2
- metadata +9 -2
@@ -14,7 +14,7 @@ require 'google/cloud/aiplatform/v1/types_pb'
|
|
14
14
|
require 'google/protobuf/struct_pb'
|
15
15
|
|
16
16
|
|
17
|
-
descriptor_data = "\n3google/cloud/aiplatform/v1/prediction_service.proto\x12\x1agoogle.cloud.aiplatform.v1\x1a\x1cgoogle/api/annotations.proto\x1a\x17google/api/client.proto\x1a\x1fgoogle/api/field_behavior.proto\x1a\x19google/api/httpbody.proto\x1a\x19google/api/resource.proto\x1a,google/cloud/aiplatform/v1/explanation.proto\x1a&google/cloud/aiplatform/v1/types.proto\x1a\x1cgoogle/protobuf/struct.proto\"\xaa\x01\n\x0ePredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12.\n\tinstances\x18\x02 \x03(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x02\x12*\n\nparameters\x18\x03 \x01(\x0b\x32\x16.google.protobuf.Value\"\x80\x02\n\x0fPredictResponse\x12+\n\x0bpredictions\x18\x01 \x03(\x0b\x32\x16.google.protobuf.Value\x12\x19\n\x11\x64\x65ployed_model_id\x18\x02 \x01(\t\x12\x36\n\x05model\x18\x03 \x01(\tB\'\xe0\x41\x03\xfa\x41!\n\x1f\x61iplatform.googleapis.com/Model\x12\x1d\n\x10model_version_id\x18\x05 \x01(\tB\x03\xe0\x41\x03\x12\x1f\n\x12model_display_name\x18\x04 \x01(\tB\x03\xe0\x41\x03\x12-\n\x08metadata\x18\x06 \x01(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x03\"z\n\x11RawPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\'\n\thttp_body\x18\x02 \x01(\x0b\x32\x14.google.api.HttpBody\"\xc3\x01\n\x17StreamingPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\x32\n\x06inputs\x18\x02 \x03(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\x12\x36\n\nparameters\x18\x03 \x01(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\"\x87\x01\n\x18StreamingPredictResponse\x12\x33\n\x07outputs\x18\x01 \x03(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\x12\x36\n\nparameters\x18\x02 \x01(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\"\x9d\x02\n\x0e\x45xplainRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12.\n\tinstances\x18\x02 
\x03(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x02\x12*\n\nparameters\x18\x04 \x01(\x0b\x32\x16.google.protobuf.Value\x12V\n\x19\x65xplanation_spec_override\x18\x05 \x01(\x0b\x32\x33.google.cloud.aiplatform.v1.ExplanationSpecOverride\x12\x19\n\x11\x64\x65ployed_model_id\x18\x03 \x01(\t\"\x98\x01\n\x0f\x45xplainResponse\x12=\n\x0c\x65xplanations\x18\x01 \x03(\x0b\x32\'.google.cloud.aiplatform.v1.Explanation\x12\x19\n\x11\x64\x65ployed_model_id\x18\x02 \x01(\t\x12+\n\x0bpredictions\x18\x03 \x03(\x0b\x32\x16.google.protobuf.Value\"\x82\x01\n\x12\x43ountTokensRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12.\n\tinstances\x18\x02 \x03(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x02\"N\n\x13\x43ountTokensResponse\x12\x14\n\x0ctotal_tokens\x18\x01 \x01(\x05\x12!\n\x19total_billable_characters\x18\x02 \x01(\x05\x32\
|
17
|
+
descriptor_data = "\n3google/cloud/aiplatform/v1/prediction_service.proto\x12\x1agoogle.cloud.aiplatform.v1\x1a\x1cgoogle/api/annotations.proto\x1a\x17google/api/client.proto\x1a\x1fgoogle/api/field_behavior.proto\x1a\x19google/api/httpbody.proto\x1a\x19google/api/resource.proto\x1a,google/cloud/aiplatform/v1/explanation.proto\x1a&google/cloud/aiplatform/v1/types.proto\x1a\x1cgoogle/protobuf/struct.proto\"\xaa\x01\n\x0ePredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12.\n\tinstances\x18\x02 \x03(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x02\x12*\n\nparameters\x18\x03 \x01(\x0b\x32\x16.google.protobuf.Value\"\x80\x02\n\x0fPredictResponse\x12+\n\x0bpredictions\x18\x01 \x03(\x0b\x32\x16.google.protobuf.Value\x12\x19\n\x11\x64\x65ployed_model_id\x18\x02 \x01(\t\x12\x36\n\x05model\x18\x03 \x01(\tB\'\xe0\x41\x03\xfa\x41!\n\x1f\x61iplatform.googleapis.com/Model\x12\x1d\n\x10model_version_id\x18\x05 \x01(\tB\x03\xe0\x41\x03\x12\x1f\n\x12model_display_name\x18\x04 \x01(\tB\x03\xe0\x41\x03\x12-\n\x08metadata\x18\x06 \x01(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x03\"z\n\x11RawPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\'\n\thttp_body\x18\x02 \x01(\x0b\x32\x14.google.api.HttpBody\"\xc0\x01\n\x14\x44irectPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\x32\n\x06inputs\x18\x02 \x03(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\x12\x36\n\nparameters\x18\x03 \x01(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\"\x84\x01\n\x15\x44irectPredictResponse\x12\x33\n\x07outputs\x18\x01 \x03(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\x12\x36\n\nparameters\x18\x02 \x01(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\"{\n\x17\x44irectRawPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 
\x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\x13\n\x0bmethod_name\x18\x02 \x01(\t\x12\r\n\x05input\x18\x03 \x01(\x0c\"*\n\x18\x44irectRawPredictResponse\x12\x0e\n\x06output\x18\x01 \x01(\x0c\"\xc3\x01\n\x17StreamingPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\x32\n\x06inputs\x18\x02 \x03(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\x12\x36\n\nparameters\x18\x03 \x01(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\"\x87\x01\n\x18StreamingPredictResponse\x12\x33\n\x07outputs\x18\x01 \x03(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\x12\x36\n\nparameters\x18\x02 \x01(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\"~\n\x1aStreamingRawPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\x13\n\x0bmethod_name\x18\x02 \x01(\t\x12\r\n\x05input\x18\x03 \x01(\x0c\"-\n\x1bStreamingRawPredictResponse\x12\x0e\n\x06output\x18\x01 \x01(\x0c\"\x9d\x02\n\x0e\x45xplainRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12.\n\tinstances\x18\x02 \x03(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x02\x12*\n\nparameters\x18\x04 \x01(\x0b\x32\x16.google.protobuf.Value\x12V\n\x19\x65xplanation_spec_override\x18\x05 \x01(\x0b\x32\x33.google.cloud.aiplatform.v1.ExplanationSpecOverride\x12\x19\n\x11\x64\x65ployed_model_id\x18\x03 \x01(\t\"\x98\x01\n\x0f\x45xplainResponse\x12=\n\x0c\x65xplanations\x18\x01 \x03(\x0b\x32\'.google.cloud.aiplatform.v1.Explanation\x12\x19\n\x11\x64\x65ployed_model_id\x18\x02 \x01(\t\x12+\n\x0bpredictions\x18\x03 \x03(\x0b\x32\x16.google.protobuf.Value\"\x82\x01\n\x12\x43ountTokensRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12.\n\tinstances\x18\x02 \x03(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x02\"N\n\x13\x43ountTokensResponse\x12\x14\n\x0ctotal_tokens\x18\x01 
\x01(\x05\x12!\n\x19total_billable_characters\x18\x02 \x01(\x05\x32\xb6\x0e\n\x11PredictionService\x12\x94\x02\n\x07Predict\x12*.google.cloud.aiplatform.v1.PredictRequest\x1a+.google.cloud.aiplatform.v1.PredictResponse\"\xaf\x01\x82\xd3\xe4\x93\x02\x88\x01\"9/v1/{endpoint=projects/*/locations/*/endpoints/*}:predict:\x01*ZH\"C/v1/{endpoint=projects/*/locations/*/publishers/*/models/*}:predict:\x01*\xda\x41\x1d\x65ndpoint,instances,parameters\x12\xfe\x01\n\nRawPredict\x12-.google.cloud.aiplatform.v1.RawPredictRequest\x1a\x14.google.api.HttpBody\"\xaa\x01\x82\xd3\xe4\x93\x02\x8e\x01\"</v1/{endpoint=projects/*/locations/*/endpoints/*}:rawPredict:\x01*ZK\"F/v1/{endpoint=projects/*/locations/*/publishers/*/models/*}:rawPredict:\x01*\xda\x41\x12\x65ndpoint,http_body\x12\xc0\x01\n\rDirectPredict\x12\x30.google.cloud.aiplatform.v1.DirectPredictRequest\x1a\x31.google.cloud.aiplatform.v1.DirectPredictResponse\"J\x82\xd3\xe4\x93\x02\x44\"?/v1/{endpoint=projects/*/locations/*/endpoints/*}:directPredict:\x01*\x12\xcc\x01\n\x10\x44irectRawPredict\x12\x33.google.cloud.aiplatform.v1.DirectRawPredictRequest\x1a\x34.google.cloud.aiplatform.v1.DirectRawPredictResponse\"M\x82\xd3\xe4\x93\x02G\"B/v1/{endpoint=projects/*/locations/*/endpoints/*}:directRawPredict:\x01*\x12\x83\x01\n\x10StreamingPredict\x12\x33.google.cloud.aiplatform.v1.StreamingPredictRequest\x1a\x34.google.cloud.aiplatform.v1.StreamingPredictResponse\"\x00(\x01\x30\x01\x12\xb5\x02\n\x16ServerStreamingPredict\x12\x33.google.cloud.aiplatform.v1.StreamingPredictRequest\x1a\x34.google.cloud.aiplatform.v1.StreamingPredictResponse\"\xad\x01\x82\xd3\xe4\x93\x02\xa6\x01\"H/v1/{endpoint=projects/*/locations/*/endpoints/*}:serverStreamingPredict:\x01*ZW\"R/v1/{endpoint=projects/*/locations/*/publishers/*/models/*}:serverStreamingPredict:\x01*0\x01\x12\x8c\x01\n\x13StreamingRawPredict\x12\x36.google.cloud.aiplatform.v1.StreamingRawPredictRequest\x1a\x37.google.cloud.aiplatform.v1.StreamingRawPredictResponse\"\x00(\x01\x30\x01\x12\x
da\x01\n\x07\x45xplain\x12*.google.cloud.aiplatform.v1.ExplainRequest\x1a+.google.cloud.aiplatform.v1.ExplainResponse\"v\x82\xd3\xe4\x93\x02>\"9/v1/{endpoint=projects/*/locations/*/endpoints/*}:explain:\x01*\xda\x41/endpoint,instances,parameters,deployed_model_id\x1aM\xca\x41\x19\x61iplatform.googleapis.com\xd2\x41.https://www.googleapis.com/auth/cloud-platformB\xd4\x01\n\x1e\x63om.google.cloud.aiplatform.v1B\x16PredictionServiceProtoP\x01Z>cloud.google.com/go/aiplatform/apiv1/aiplatformpb;aiplatformpb\xaa\x02\x1aGoogle.Cloud.AIPlatform.V1\xca\x02\x1aGoogle\\Cloud\\AIPlatform\\V1\xea\x02\x1dGoogle::Cloud::AIPlatform::V1b\x06proto3"
|
18
18
|
|
19
19
|
pool = Google::Protobuf::DescriptorPool.generated_pool
|
20
20
|
|
@@ -51,8 +51,14 @@ module Google
|
|
51
51
|
PredictRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.PredictRequest").msgclass
|
52
52
|
PredictResponse = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.PredictResponse").msgclass
|
53
53
|
RawPredictRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.RawPredictRequest").msgclass
|
54
|
+
DirectPredictRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.DirectPredictRequest").msgclass
|
55
|
+
DirectPredictResponse = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.DirectPredictResponse").msgclass
|
56
|
+
DirectRawPredictRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.DirectRawPredictRequest").msgclass
|
57
|
+
DirectRawPredictResponse = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.DirectRawPredictResponse").msgclass
|
54
58
|
StreamingPredictRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.StreamingPredictRequest").msgclass
|
55
59
|
StreamingPredictResponse = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.StreamingPredictResponse").msgclass
|
60
|
+
StreamingRawPredictRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.StreamingRawPredictRequest").msgclass
|
61
|
+
StreamingRawPredictResponse = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.StreamingRawPredictResponse").msgclass
|
56
62
|
ExplainRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.ExplainRequest").msgclass
|
57
63
|
ExplainResponse = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.ExplainResponse").msgclass
|
58
64
|
CountTokensRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.CountTokensRequest").msgclass
|
@@ -47,9 +47,19 @@ module Google
|
|
47
47
|
# [DeployedModel][google.cloud.aiplatform.v1.DeployedModel] that served this
|
48
48
|
# prediction.
|
49
49
|
rpc :RawPredict, ::Google::Cloud::AIPlatform::V1::RawPredictRequest, ::Google::Api::HttpBody
|
50
|
+
# Perform a unary online prediction request for Vertex first-party products
|
51
|
+
# and frameworks.
|
52
|
+
rpc :DirectPredict, ::Google::Cloud::AIPlatform::V1::DirectPredictRequest, ::Google::Cloud::AIPlatform::V1::DirectPredictResponse
|
53
|
+
# Perform an online prediction request through gRPC.
|
54
|
+
rpc :DirectRawPredict, ::Google::Cloud::AIPlatform::V1::DirectRawPredictRequest, ::Google::Cloud::AIPlatform::V1::DirectRawPredictResponse
|
55
|
+
# Perform a streaming online prediction request for Vertex first-party
|
56
|
+
# products and frameworks.
|
57
|
+
rpc :StreamingPredict, stream(::Google::Cloud::AIPlatform::V1::StreamingPredictRequest), stream(::Google::Cloud::AIPlatform::V1::StreamingPredictResponse)
|
50
58
|
# Perform a server-side streaming online prediction request for Vertex
|
51
59
|
# LLM streaming.
|
52
60
|
rpc :ServerStreamingPredict, ::Google::Cloud::AIPlatform::V1::StreamingPredictRequest, stream(::Google::Cloud::AIPlatform::V1::StreamingPredictResponse)
|
61
|
+
# Perform a streaming online prediction request through gRPC.
|
62
|
+
rpc :StreamingRawPredict, stream(::Google::Cloud::AIPlatform::V1::StreamingRawPredictRequest), stream(::Google::Cloud::AIPlatform::V1::StreamingRawPredictResponse)
|
53
63
|
# Perform an online explanation.
|
54
64
|
#
|
55
65
|
# If
|
@@ -304,6 +304,19 @@ module Google
|
|
304
304
|
# seconds: 360 # 6 minutes
|
305
305
|
# total_poll_timeout:
|
306
306
|
# seconds: 54000 # 90 minutes
|
307
|
+
# @!attribute [rw] auto_populated_fields
|
308
|
+
# @return [::Array<::String>]
|
309
|
+
# List of top-level fields of the request message, that should be
|
310
|
+
# automatically populated by the client libraries based on their
|
311
|
+
# (google.api.field_info).format. Currently supported format: UUID4.
|
312
|
+
#
|
313
|
+
# Example of a YAML configuration:
|
314
|
+
#
|
315
|
+
# publishing:
|
316
|
+
# method_settings:
|
317
|
+
# - selector: google.example.v1.ExampleService.CreateExample
|
318
|
+
# auto_populated_fields:
|
319
|
+
# - request_id
|
307
320
|
class MethodSettings
|
308
321
|
include ::Google::Protobuf::MessageExts
|
309
322
|
extend ::Google::Protobuf::MessageExts::ClassMethods
|
@@ -0,0 +1,64 @@
|
|
1
|
+
# frozen_string_literal: true
|
2
|
+
|
3
|
+
# Copyright 2023 Google LLC
|
4
|
+
#
|
5
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
6
|
+
# you may not use this file except in compliance with the License.
|
7
|
+
# You may obtain a copy of the License at
|
8
|
+
#
|
9
|
+
# https://www.apache.org/licenses/LICENSE-2.0
|
10
|
+
#
|
11
|
+
# Unless required by applicable law or agreed to in writing, software
|
12
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
13
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
14
|
+
# See the License for the specific language governing permissions and
|
15
|
+
# limitations under the License.
|
16
|
+
|
17
|
+
# Auto-generated by gapic-generator-ruby. DO NOT EDIT!
|
18
|
+
|
19
|
+
|
20
|
+
module Google
|
21
|
+
module Cloud
|
22
|
+
module AIPlatform
|
23
|
+
module V1
|
24
|
+
# Request message for ComputeTokens RPC call.
|
25
|
+
# @!attribute [rw] endpoint
|
26
|
+
# @return [::String]
|
27
|
+
# Required. The name of the Endpoint requested to get lists of tokens and
|
28
|
+
# token ids.
|
29
|
+
# @!attribute [rw] instances
|
30
|
+
# @return [::Array<::Google::Protobuf::Value>]
|
31
|
+
# Required. The instances that are the input to token computing API call.
|
32
|
+
# Schema is identical to the prediction schema of the text model, even for
|
33
|
+
# the non-text models, like chat models, or Codey models.
|
34
|
+
class ComputeTokensRequest
|
35
|
+
include ::Google::Protobuf::MessageExts
|
36
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
37
|
+
end
|
38
|
+
|
39
|
+
# Tokens info with a list of tokens and the corresponding list of token ids.
|
40
|
+
# @!attribute [rw] tokens
|
41
|
+
# @return [::Array<::String>]
|
42
|
+
# A list of tokens from the input.
|
43
|
+
# @!attribute [rw] token_ids
|
44
|
+
# @return [::Array<::Integer>]
|
45
|
+
# A list of token ids from the input.
|
46
|
+
class TokensInfo
|
47
|
+
include ::Google::Protobuf::MessageExts
|
48
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
49
|
+
end
|
50
|
+
|
51
|
+
# Response message for ComputeTokens RPC call.
|
52
|
+
# @!attribute [rw] tokens_info
|
53
|
+
# @return [::Array<::Google::Cloud::AIPlatform::V1::TokensInfo>]
|
54
|
+
# Lists of tokens info from the input. A ComputeTokensRequest could have
|
55
|
+
# multiple instances with a prompt in each instance. We also need to return
|
56
|
+
# lists of tokens info for the request with multiple instances.
|
57
|
+
class ComputeTokensResponse
|
58
|
+
include ::Google::Protobuf::MessageExts
|
59
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
60
|
+
end
|
61
|
+
end
|
62
|
+
end
|
63
|
+
end
|
64
|
+
end
|
@@ -663,6 +663,31 @@ module Google
|
|
663
663
|
# (Vertex AI makes this value available to your container code as the
|
664
664
|
# [`AIP_DEPLOYED_MODEL_ID` environment
|
665
665
|
# variable](https://cloud.google.com/vertex-ai/docs/predictions/custom-container-requirements#aip-variables).)
|
666
|
+
# @!attribute [rw] grpc_ports
|
667
|
+
# @return [::Array<::Google::Cloud::AIPlatform::V1::Port>]
|
668
|
+
# Immutable. List of ports to expose from the container. Vertex AI sends gRPC
|
669
|
+
# prediction requests that it receives to the first port on this list. Vertex
|
670
|
+
# AI also sends liveness and health checks to this port.
|
671
|
+
#
|
672
|
+
# If you do not specify this field, gRPC requests to the container will be
|
673
|
+
# disabled.
|
674
|
+
#
|
675
|
+
# Vertex AI does not use ports other than the first one listed. This field
|
676
|
+
# corresponds to the `ports` field of the Kubernetes Containers v1 core API.
|
677
|
+
# @!attribute [rw] deployment_timeout
|
678
|
+
# @return [::Google::Protobuf::Duration]
|
679
|
+
# Immutable. Deployment timeout.
|
680
|
+
# Limit for deployment timeout is 2 hours.
|
681
|
+
# @!attribute [rw] shared_memory_size_mb
|
682
|
+
# @return [::Integer]
|
683
|
+
# Immutable. The amount of the VM memory to reserve as the shared memory for
|
684
|
+
# the model in megabytes.
|
685
|
+
# @!attribute [rw] startup_probe
|
686
|
+
# @return [::Google::Cloud::AIPlatform::V1::Probe]
|
687
|
+
# Immutable. Specification for Kubernetes startup probe.
|
688
|
+
# @!attribute [rw] health_probe
|
689
|
+
# @return [::Google::Cloud::AIPlatform::V1::Probe]
|
690
|
+
# Immutable. Specification for Kubernetes readiness probe.
|
666
691
|
class ModelContainerSpec
|
667
692
|
include ::Google::Protobuf::MessageExts
|
668
693
|
extend ::Google::Protobuf::MessageExts::ClassMethods
|
@@ -712,6 +737,42 @@ module Google
|
|
712
737
|
GENIE = 5
|
713
738
|
end
|
714
739
|
end
|
740
|
+
|
741
|
+
# Probe describes a health check to be performed against a container to
|
742
|
+
# determine whether it is alive or ready to receive traffic.
|
743
|
+
# @!attribute [rw] exec
|
744
|
+
# @return [::Google::Cloud::AIPlatform::V1::Probe::ExecAction]
|
745
|
+
# Exec specifies the action to take.
|
746
|
+
# @!attribute [rw] period_seconds
|
747
|
+
# @return [::Integer]
|
748
|
+
# How often (in seconds) to perform the probe. Defaults to 10 seconds.
|
749
|
+
# Minimum value is 1. Must be less than timeout_seconds.
|
750
|
+
#
|
751
|
+
# Maps to Kubernetes probe argument 'periodSeconds'.
|
752
|
+
# @!attribute [rw] timeout_seconds
|
753
|
+
# @return [::Integer]
|
754
|
+
# Number of seconds after which the probe times out. Defaults to 1 second.
|
755
|
+
# Minimum value is 1. Must be greater than or equal to period_seconds.
|
756
|
+
#
|
757
|
+
# Maps to Kubernetes probe argument 'timeoutSeconds'.
|
758
|
+
class Probe
|
759
|
+
include ::Google::Protobuf::MessageExts
|
760
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
761
|
+
|
762
|
+
# ExecAction specifies a command to execute.
|
763
|
+
# @!attribute [rw] command
|
764
|
+
# @return [::Array<::String>]
|
765
|
+
# Command is the command line to execute inside the container, the working
|
766
|
+
# directory for the command is root ('/') in the container's filesystem.
|
767
|
+
# The command is simply exec'd, it is not run inside a shell, so
|
768
|
+
# traditional shell instructions ('|', etc) won't work. To use a shell, you
|
769
|
+
# need to explicitly call out to that shell. Exit status of 0 is treated as
|
770
|
+
# live/healthy and non-zero is unhealthy.
|
771
|
+
class ExecAction
|
772
|
+
include ::Google::Protobuf::MessageExts
|
773
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
774
|
+
end
|
775
|
+
end
|
715
776
|
end
|
716
777
|
end
|
717
778
|
end
|
@@ -115,7 +115,72 @@ module Google
|
|
115
115
|
end
|
116
116
|
|
117
117
|
# Request message for
|
118
|
-
#
|
118
|
+
# {::Google::Cloud::AIPlatform::V1::PredictionService::Client#direct_predict PredictionService.DirectPredict}.
|
119
|
+
# @!attribute [rw] endpoint
|
120
|
+
# @return [::String]
|
121
|
+
# Required. The name of the Endpoint requested to serve the prediction.
|
122
|
+
# Format:
|
123
|
+
# `projects/{project}/locations/{location}/endpoints/{endpoint}`
|
124
|
+
# @!attribute [rw] inputs
|
125
|
+
# @return [::Array<::Google::Cloud::AIPlatform::V1::Tensor>]
|
126
|
+
# The prediction input.
|
127
|
+
# @!attribute [rw] parameters
|
128
|
+
# @return [::Google::Cloud::AIPlatform::V1::Tensor]
|
129
|
+
# The parameters that govern the prediction.
|
130
|
+
class DirectPredictRequest
|
131
|
+
include ::Google::Protobuf::MessageExts
|
132
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
133
|
+
end
|
134
|
+
|
135
|
+
# Response message for
|
136
|
+
# {::Google::Cloud::AIPlatform::V1::PredictionService::Client#direct_predict PredictionService.DirectPredict}.
|
137
|
+
# @!attribute [rw] outputs
|
138
|
+
# @return [::Array<::Google::Cloud::AIPlatform::V1::Tensor>]
|
139
|
+
# The prediction output.
|
140
|
+
# @!attribute [rw] parameters
|
141
|
+
# @return [::Google::Cloud::AIPlatform::V1::Tensor]
|
142
|
+
# The parameters that govern the prediction.
|
143
|
+
class DirectPredictResponse
|
144
|
+
include ::Google::Protobuf::MessageExts
|
145
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
146
|
+
end
|
147
|
+
|
148
|
+
# Request message for
|
149
|
+
# {::Google::Cloud::AIPlatform::V1::PredictionService::Client#direct_raw_predict PredictionService.DirectRawPredict}.
|
150
|
+
# @!attribute [rw] endpoint
|
151
|
+
# @return [::String]
|
152
|
+
# Required. The name of the Endpoint requested to serve the prediction.
|
153
|
+
# Format:
|
154
|
+
# `projects/{project}/locations/{location}/endpoints/{endpoint}`
|
155
|
+
# @!attribute [rw] method_name
|
156
|
+
# @return [::String]
|
157
|
+
# Fully qualified name of the API method being invoked to perform
|
158
|
+
# predictions.
|
159
|
+
#
|
160
|
+
# Format:
|
161
|
+
# `/namespace.Service/Method`
|
162
|
+
# Example:
|
163
|
+
# `/tensorflow.serving.PredictionService/Predict`
|
164
|
+
# @!attribute [rw] input
|
165
|
+
# @return [::String]
|
166
|
+
# The prediction input.
|
167
|
+
class DirectRawPredictRequest
|
168
|
+
include ::Google::Protobuf::MessageExts
|
169
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
170
|
+
end
|
171
|
+
|
172
|
+
# Response message for
|
173
|
+
# {::Google::Cloud::AIPlatform::V1::PredictionService::Client#direct_raw_predict PredictionService.DirectRawPredict}.
|
174
|
+
# @!attribute [rw] output
|
175
|
+
# @return [::String]
|
176
|
+
# The prediction output.
|
177
|
+
class DirectRawPredictResponse
|
178
|
+
include ::Google::Protobuf::MessageExts
|
179
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
180
|
+
end
|
181
|
+
|
182
|
+
# Request message for
|
183
|
+
# {::Google::Cloud::AIPlatform::V1::PredictionService::Client#streaming_predict PredictionService.StreamingPredict}.
|
119
184
|
#
|
120
185
|
# The first message must contain
|
121
186
|
# {::Google::Cloud::AIPlatform::V1::StreamingPredictRequest#endpoint endpoint} field
|
@@ -137,7 +202,7 @@ module Google
|
|
137
202
|
end
|
138
203
|
|
139
204
|
# Response message for
|
140
|
-
#
|
205
|
+
# {::Google::Cloud::AIPlatform::V1::PredictionService::Client#streaming_predict PredictionService.StreamingPredict}.
|
141
206
|
# @!attribute [rw] outputs
|
142
207
|
# @return [::Array<::Google::Cloud::AIPlatform::V1::Tensor>]
|
143
208
|
# The prediction output.
|
@@ -149,6 +214,51 @@ module Google
|
|
149
214
|
extend ::Google::Protobuf::MessageExts::ClassMethods
|
150
215
|
end
|
151
216
|
|
217
|
+
# Request message for
|
218
|
+
# {::Google::Cloud::AIPlatform::V1::PredictionService::Client#streaming_raw_predict PredictionService.StreamingRawPredict}.
|
219
|
+
#
|
220
|
+
# The first message must contain
|
221
|
+
# {::Google::Cloud::AIPlatform::V1::StreamingRawPredictRequest#endpoint endpoint}
|
222
|
+
# and
|
223
|
+
# {::Google::Cloud::AIPlatform::V1::StreamingRawPredictRequest#method_name method_name}
|
224
|
+
# fields and optionally
|
225
|
+
# {::Google::Cloud::AIPlatform::V1::StreamingRawPredictRequest#input input}. The
|
226
|
+
# subsequent messages must contain
|
227
|
+
# {::Google::Cloud::AIPlatform::V1::StreamingRawPredictRequest#input input}.
|
228
|
+
# {::Google::Cloud::AIPlatform::V1::StreamingRawPredictRequest#method_name method_name}
|
229
|
+
# in the subsequent messages has no effect.
|
230
|
+
# @!attribute [rw] endpoint
|
231
|
+
# @return [::String]
|
232
|
+
# Required. The name of the Endpoint requested to serve the prediction.
|
233
|
+
# Format:
|
234
|
+
# `projects/{project}/locations/{location}/endpoints/{endpoint}`
|
235
|
+
# @!attribute [rw] method_name
|
236
|
+
# @return [::String]
|
237
|
+
# Fully qualified name of the API method being invoked to perform
|
238
|
+
# predictions.
|
239
|
+
#
|
240
|
+
# Format:
|
241
|
+
# `/namespace.Service/Method`
|
242
|
+
# Example:
|
243
|
+
# `/tensorflow.serving.PredictionService/Predict`
|
244
|
+
# @!attribute [rw] input
|
245
|
+
# @return [::String]
|
246
|
+
# The prediction input.
|
247
|
+
class StreamingRawPredictRequest
|
248
|
+
include ::Google::Protobuf::MessageExts
|
249
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
250
|
+
end
|
251
|
+
|
252
|
+
# Response message for
|
253
|
+
# {::Google::Cloud::AIPlatform::V1::PredictionService::Client#streaming_raw_predict PredictionService.StreamingRawPredict}.
|
254
|
+
# @!attribute [rw] output
|
255
|
+
# @return [::String]
|
256
|
+
# The prediction output.
|
257
|
+
class StreamingRawPredictResponse
|
258
|
+
include ::Google::Protobuf::MessageExts
|
259
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
260
|
+
end
|
261
|
+
|
152
262
|
# Request message for
|
153
263
|
# {::Google::Cloud::AIPlatform::V1::PredictionService::Client#explain PredictionService.Explain}.
|
154
264
|
# @!attribute [rw] endpoint
|
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: google-cloud-ai_platform-v1
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.34.0
|
4
|
+
version: 0.35.0
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Google LLC
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date: 2023-
|
11
|
+
date: 2023-12-04 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: gapic-common
|
@@ -260,6 +260,10 @@ files:
|
|
260
260
|
- lib/google/cloud/ai_platform/v1/job_service/credentials.rb
|
261
261
|
- lib/google/cloud/ai_platform/v1/job_service/operations.rb
|
262
262
|
- lib/google/cloud/ai_platform/v1/job_service/paths.rb
|
263
|
+
- lib/google/cloud/ai_platform/v1/llm_utility_service.rb
|
264
|
+
- lib/google/cloud/ai_platform/v1/llm_utility_service/client.rb
|
265
|
+
- lib/google/cloud/ai_platform/v1/llm_utility_service/credentials.rb
|
266
|
+
- lib/google/cloud/ai_platform/v1/llm_utility_service/paths.rb
|
263
267
|
- lib/google/cloud/ai_platform/v1/match_service.rb
|
264
268
|
- lib/google/cloud/ai_platform/v1/match_service/client.rb
|
265
269
|
- lib/google/cloud/ai_platform/v1/match_service/credentials.rb
|
@@ -371,6 +375,8 @@ files:
|
|
371
375
|
- lib/google/cloud/aiplatform/v1/job_service_services_pb.rb
|
372
376
|
- lib/google/cloud/aiplatform/v1/job_state_pb.rb
|
373
377
|
- lib/google/cloud/aiplatform/v1/lineage_subgraph_pb.rb
|
378
|
+
- lib/google/cloud/aiplatform/v1/llm_utility_service_pb.rb
|
379
|
+
- lib/google/cloud/aiplatform/v1/llm_utility_service_services_pb.rb
|
374
380
|
- lib/google/cloud/aiplatform/v1/machine_resources_pb.rb
|
375
381
|
- lib/google/cloud/aiplatform/v1/manual_batch_tuning_parameters_pb.rb
|
376
382
|
- lib/google/cloud/aiplatform/v1/match_service_pb.rb
|
@@ -478,6 +484,7 @@ files:
|
|
478
484
|
- proto_docs/google/cloud/aiplatform/v1/job_service.rb
|
479
485
|
- proto_docs/google/cloud/aiplatform/v1/job_state.rb
|
480
486
|
- proto_docs/google/cloud/aiplatform/v1/lineage_subgraph.rb
|
487
|
+
- proto_docs/google/cloud/aiplatform/v1/llm_utility_service.rb
|
481
488
|
- proto_docs/google/cloud/aiplatform/v1/machine_resources.rb
|
482
489
|
- proto_docs/google/cloud/aiplatform/v1/manual_batch_tuning_parameters.rb
|
483
490
|
- proto_docs/google/cloud/aiplatform/v1/match_service.rb
|