google-cloud-ai_platform-v1 0.34.0 → 0.35.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/lib/google/cloud/ai_platform/v1/llm_utility_service/client.rb +528 -0
- data/lib/google/cloud/ai_platform/v1/llm_utility_service/credentials.rb +47 -0
- data/lib/google/cloud/ai_platform/v1/llm_utility_service/paths.rb +78 -0
- data/lib/google/cloud/ai_platform/v1/llm_utility_service.rb +49 -0
- data/lib/google/cloud/ai_platform/v1/prediction_service/client.rb +374 -0
- data/lib/google/cloud/ai_platform/v1/version.rb +1 -1
- data/lib/google/cloud/ai_platform/v1.rb +2 -1
- data/lib/google/cloud/aiplatform/v1/llm_utility_service_pb.rb +52 -0
- data/lib/google/cloud/aiplatform/v1/llm_utility_service_services_pb.rb +47 -0
- data/lib/google/cloud/aiplatform/v1/model_pb.rb +5 -1
- data/lib/google/cloud/aiplatform/v1/prediction_service_pb.rb +7 -1
- data/lib/google/cloud/aiplatform/v1/prediction_service_services_pb.rb +10 -0
- data/proto_docs/google/api/client.rb +13 -0
- data/proto_docs/google/cloud/aiplatform/v1/llm_utility_service.rb +64 -0
- data/proto_docs/google/cloud/aiplatform/v1/model.rb +61 -0
- data/proto_docs/google/cloud/aiplatform/v1/prediction_service.rb +112 -2
- metadata +9 -2
@@ -14,7 +14,7 @@ require 'google/cloud/aiplatform/v1/types_pb'
|
|
14
14
|
require 'google/protobuf/struct_pb'
|
15
15
|
|
16
16
|
|
17
|
-
descriptor_data = "\n3google/cloud/aiplatform/v1/prediction_service.proto\x12\x1agoogle.cloud.aiplatform.v1\x1a\x1cgoogle/api/annotations.proto\x1a\x17google/api/client.proto\x1a\x1fgoogle/api/field_behavior.proto\x1a\x19google/api/httpbody.proto\x1a\x19google/api/resource.proto\x1a,google/cloud/aiplatform/v1/explanation.proto\x1a&google/cloud/aiplatform/v1/types.proto\x1a\x1cgoogle/protobuf/struct.proto\"\xaa\x01\n\x0ePredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12.\n\tinstances\x18\x02 \x03(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x02\x12*\n\nparameters\x18\x03 \x01(\x0b\x32\x16.google.protobuf.Value\"\x80\x02\n\x0fPredictResponse\x12+\n\x0bpredictions\x18\x01 \x03(\x0b\x32\x16.google.protobuf.Value\x12\x19\n\x11\x64\x65ployed_model_id\x18\x02 \x01(\t\x12\x36\n\x05model\x18\x03 \x01(\tB\'\xe0\x41\x03\xfa\x41!\n\x1f\x61iplatform.googleapis.com/Model\x12\x1d\n\x10model_version_id\x18\x05 \x01(\tB\x03\xe0\x41\x03\x12\x1f\n\x12model_display_name\x18\x04 \x01(\tB\x03\xe0\x41\x03\x12-\n\x08metadata\x18\x06 \x01(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x03\"z\n\x11RawPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\'\n\thttp_body\x18\x02 \x01(\x0b\x32\x14.google.api.HttpBody\"\xc3\x01\n\x17StreamingPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\x32\n\x06inputs\x18\x02 \x03(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\x12\x36\n\nparameters\x18\x03 \x01(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\"\x87\x01\n\x18StreamingPredictResponse\x12\x33\n\x07outputs\x18\x01 \x03(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\x12\x36\n\nparameters\x18\x02 \x01(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\"\x9d\x02\n\x0e\x45xplainRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12.\n\tinstances\x18\x02 
\x03(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x02\x12*\n\nparameters\x18\x04 \x01(\x0b\x32\x16.google.protobuf.Value\x12V\n\x19\x65xplanation_spec_override\x18\x05 \x01(\x0b\x32\x33.google.cloud.aiplatform.v1.ExplanationSpecOverride\x12\x19\n\x11\x64\x65ployed_model_id\x18\x03 \x01(\t\"\x98\x01\n\x0f\x45xplainResponse\x12=\n\x0c\x65xplanations\x18\x01 \x03(\x0b\x32\'.google.cloud.aiplatform.v1.Explanation\x12\x19\n\x11\x64\x65ployed_model_id\x18\x02 \x01(\t\x12+\n\x0bpredictions\x18\x03 \x03(\x0b\x32\x16.google.protobuf.Value\"\x82\x01\n\x12\x43ountTokensRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12.\n\tinstances\x18\x02 \x03(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x02\"N\n\x13\x43ountTokensResponse\x12\x14\n\x0ctotal_tokens\x18\x01 \x01(\x05\x12!\n\x19total_billable_characters\x18\x02 \x01(\x05\x32\
|
17
|
+
descriptor_data = "\n3google/cloud/aiplatform/v1/prediction_service.proto\x12\x1agoogle.cloud.aiplatform.v1\x1a\x1cgoogle/api/annotations.proto\x1a\x17google/api/client.proto\x1a\x1fgoogle/api/field_behavior.proto\x1a\x19google/api/httpbody.proto\x1a\x19google/api/resource.proto\x1a,google/cloud/aiplatform/v1/explanation.proto\x1a&google/cloud/aiplatform/v1/types.proto\x1a\x1cgoogle/protobuf/struct.proto\"\xaa\x01\n\x0ePredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12.\n\tinstances\x18\x02 \x03(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x02\x12*\n\nparameters\x18\x03 \x01(\x0b\x32\x16.google.protobuf.Value\"\x80\x02\n\x0fPredictResponse\x12+\n\x0bpredictions\x18\x01 \x03(\x0b\x32\x16.google.protobuf.Value\x12\x19\n\x11\x64\x65ployed_model_id\x18\x02 \x01(\t\x12\x36\n\x05model\x18\x03 \x01(\tB\'\xe0\x41\x03\xfa\x41!\n\x1f\x61iplatform.googleapis.com/Model\x12\x1d\n\x10model_version_id\x18\x05 \x01(\tB\x03\xe0\x41\x03\x12\x1f\n\x12model_display_name\x18\x04 \x01(\tB\x03\xe0\x41\x03\x12-\n\x08metadata\x18\x06 \x01(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x03\"z\n\x11RawPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\'\n\thttp_body\x18\x02 \x01(\x0b\x32\x14.google.api.HttpBody\"\xc0\x01\n\x14\x44irectPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\x32\n\x06inputs\x18\x02 \x03(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\x12\x36\n\nparameters\x18\x03 \x01(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\"\x84\x01\n\x15\x44irectPredictResponse\x12\x33\n\x07outputs\x18\x01 \x03(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\x12\x36\n\nparameters\x18\x02 \x01(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\"{\n\x17\x44irectRawPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 
\x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\x13\n\x0bmethod_name\x18\x02 \x01(\t\x12\r\n\x05input\x18\x03 \x01(\x0c\"*\n\x18\x44irectRawPredictResponse\x12\x0e\n\x06output\x18\x01 \x01(\x0c\"\xc3\x01\n\x17StreamingPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\x32\n\x06inputs\x18\x02 \x03(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\x12\x36\n\nparameters\x18\x03 \x01(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\"\x87\x01\n\x18StreamingPredictResponse\x12\x33\n\x07outputs\x18\x01 \x03(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\x12\x36\n\nparameters\x18\x02 \x01(\x0b\x32\".google.cloud.aiplatform.v1.Tensor\"~\n\x1aStreamingRawPredictRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12\x13\n\x0bmethod_name\x18\x02 \x01(\t\x12\r\n\x05input\x18\x03 \x01(\x0c\"-\n\x1bStreamingRawPredictResponse\x12\x0e\n\x06output\x18\x01 \x01(\x0c\"\x9d\x02\n\x0e\x45xplainRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12.\n\tinstances\x18\x02 \x03(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x02\x12*\n\nparameters\x18\x04 \x01(\x0b\x32\x16.google.protobuf.Value\x12V\n\x19\x65xplanation_spec_override\x18\x05 \x01(\x0b\x32\x33.google.cloud.aiplatform.v1.ExplanationSpecOverride\x12\x19\n\x11\x64\x65ployed_model_id\x18\x03 \x01(\t\"\x98\x01\n\x0f\x45xplainResponse\x12=\n\x0c\x65xplanations\x18\x01 \x03(\x0b\x32\'.google.cloud.aiplatform.v1.Explanation\x12\x19\n\x11\x64\x65ployed_model_id\x18\x02 \x01(\t\x12+\n\x0bpredictions\x18\x03 \x03(\x0b\x32\x16.google.protobuf.Value\"\x82\x01\n\x12\x43ountTokensRequest\x12<\n\x08\x65ndpoint\x18\x01 \x01(\tB*\xe0\x41\x02\xfa\x41$\n\"aiplatform.googleapis.com/Endpoint\x12.\n\tinstances\x18\x02 \x03(\x0b\x32\x16.google.protobuf.ValueB\x03\xe0\x41\x02\"N\n\x13\x43ountTokensResponse\x12\x14\n\x0ctotal_tokens\x18\x01 
\x01(\x05\x12!\n\x19total_billable_characters\x18\x02 \x01(\x05\x32\xb6\x0e\n\x11PredictionService\x12\x94\x02\n\x07Predict\x12*.google.cloud.aiplatform.v1.PredictRequest\x1a+.google.cloud.aiplatform.v1.PredictResponse\"\xaf\x01\x82\xd3\xe4\x93\x02\x88\x01\"9/v1/{endpoint=projects/*/locations/*/endpoints/*}:predict:\x01*ZH\"C/v1/{endpoint=projects/*/locations/*/publishers/*/models/*}:predict:\x01*\xda\x41\x1d\x65ndpoint,instances,parameters\x12\xfe\x01\n\nRawPredict\x12-.google.cloud.aiplatform.v1.RawPredictRequest\x1a\x14.google.api.HttpBody\"\xaa\x01\x82\xd3\xe4\x93\x02\x8e\x01\"</v1/{endpoint=projects/*/locations/*/endpoints/*}:rawPredict:\x01*ZK\"F/v1/{endpoint=projects/*/locations/*/publishers/*/models/*}:rawPredict:\x01*\xda\x41\x12\x65ndpoint,http_body\x12\xc0\x01\n\rDirectPredict\x12\x30.google.cloud.aiplatform.v1.DirectPredictRequest\x1a\x31.google.cloud.aiplatform.v1.DirectPredictResponse\"J\x82\xd3\xe4\x93\x02\x44\"?/v1/{endpoint=projects/*/locations/*/endpoints/*}:directPredict:\x01*\x12\xcc\x01\n\x10\x44irectRawPredict\x12\x33.google.cloud.aiplatform.v1.DirectRawPredictRequest\x1a\x34.google.cloud.aiplatform.v1.DirectRawPredictResponse\"M\x82\xd3\xe4\x93\x02G\"B/v1/{endpoint=projects/*/locations/*/endpoints/*}:directRawPredict:\x01*\x12\x83\x01\n\x10StreamingPredict\x12\x33.google.cloud.aiplatform.v1.StreamingPredictRequest\x1a\x34.google.cloud.aiplatform.v1.StreamingPredictResponse\"\x00(\x01\x30\x01\x12\xb5\x02\n\x16ServerStreamingPredict\x12\x33.google.cloud.aiplatform.v1.StreamingPredictRequest\x1a\x34.google.cloud.aiplatform.v1.StreamingPredictResponse\"\xad\x01\x82\xd3\xe4\x93\x02\xa6\x01\"H/v1/{endpoint=projects/*/locations/*/endpoints/*}:serverStreamingPredict:\x01*ZW\"R/v1/{endpoint=projects/*/locations/*/publishers/*/models/*}:serverStreamingPredict:\x01*0\x01\x12\x8c\x01\n\x13StreamingRawPredict\x12\x36.google.cloud.aiplatform.v1.StreamingRawPredictRequest\x1a\x37.google.cloud.aiplatform.v1.StreamingRawPredictResponse\"\x00(\x01\x30\x01\x12\x
da\x01\n\x07\x45xplain\x12*.google.cloud.aiplatform.v1.ExplainRequest\x1a+.google.cloud.aiplatform.v1.ExplainResponse\"v\x82\xd3\xe4\x93\x02>\"9/v1/{endpoint=projects/*/locations/*/endpoints/*}:explain:\x01*\xda\x41/endpoint,instances,parameters,deployed_model_id\x1aM\xca\x41\x19\x61iplatform.googleapis.com\xd2\x41.https://www.googleapis.com/auth/cloud-platformB\xd4\x01\n\x1e\x63om.google.cloud.aiplatform.v1B\x16PredictionServiceProtoP\x01Z>cloud.google.com/go/aiplatform/apiv1/aiplatformpb;aiplatformpb\xaa\x02\x1aGoogle.Cloud.AIPlatform.V1\xca\x02\x1aGoogle\\Cloud\\AIPlatform\\V1\xea\x02\x1dGoogle::Cloud::AIPlatform::V1b\x06proto3"
|
18
18
|
|
19
19
|
pool = Google::Protobuf::DescriptorPool.generated_pool
|
20
20
|
|
@@ -51,8 +51,14 @@ module Google
|
|
51
51
|
PredictRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.PredictRequest").msgclass
|
52
52
|
PredictResponse = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.PredictResponse").msgclass
|
53
53
|
RawPredictRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.RawPredictRequest").msgclass
|
54
|
+
DirectPredictRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.DirectPredictRequest").msgclass
|
55
|
+
DirectPredictResponse = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.DirectPredictResponse").msgclass
|
56
|
+
DirectRawPredictRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.DirectRawPredictRequest").msgclass
|
57
|
+
DirectRawPredictResponse = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.DirectRawPredictResponse").msgclass
|
54
58
|
StreamingPredictRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.StreamingPredictRequest").msgclass
|
55
59
|
StreamingPredictResponse = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.StreamingPredictResponse").msgclass
|
60
|
+
StreamingRawPredictRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.StreamingRawPredictRequest").msgclass
|
61
|
+
StreamingRawPredictResponse = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.StreamingRawPredictResponse").msgclass
|
56
62
|
ExplainRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.ExplainRequest").msgclass
|
57
63
|
ExplainResponse = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.ExplainResponse").msgclass
|
58
64
|
CountTokensRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.CountTokensRequest").msgclass
|
@@ -47,9 +47,19 @@ module Google
|
|
47
47
|
# [DeployedModel][google.cloud.aiplatform.v1.DeployedModel] that served this
|
48
48
|
# prediction.
|
49
49
|
rpc :RawPredict, ::Google::Cloud::AIPlatform::V1::RawPredictRequest, ::Google::Api::HttpBody
|
50
|
+
# Perform a unary online prediction request for Vertex first-party products
|
51
|
+
# and frameworks.
|
52
|
+
rpc :DirectPredict, ::Google::Cloud::AIPlatform::V1::DirectPredictRequest, ::Google::Cloud::AIPlatform::V1::DirectPredictResponse
|
53
|
+
# Perform an online prediction request through gRPC.
|
54
|
+
rpc :DirectRawPredict, ::Google::Cloud::AIPlatform::V1::DirectRawPredictRequest, ::Google::Cloud::AIPlatform::V1::DirectRawPredictResponse
|
55
|
+
# Perform a streaming online prediction request for Vertex first-party
|
56
|
+
# products and frameworks.
|
57
|
+
rpc :StreamingPredict, stream(::Google::Cloud::AIPlatform::V1::StreamingPredictRequest), stream(::Google::Cloud::AIPlatform::V1::StreamingPredictResponse)
|
50
58
|
# Perform a server-side streaming online prediction request for Vertex
|
51
59
|
# LLM streaming.
|
52
60
|
rpc :ServerStreamingPredict, ::Google::Cloud::AIPlatform::V1::StreamingPredictRequest, stream(::Google::Cloud::AIPlatform::V1::StreamingPredictResponse)
|
61
|
+
# Perform a streaming online prediction request through gRPC.
|
62
|
+
rpc :StreamingRawPredict, stream(::Google::Cloud::AIPlatform::V1::StreamingRawPredictRequest), stream(::Google::Cloud::AIPlatform::V1::StreamingRawPredictResponse)
|
53
63
|
# Perform an online explanation.
|
54
64
|
#
|
55
65
|
# If
|
@@ -304,6 +304,19 @@ module Google
|
|
304
304
|
# seconds: 360 # 6 minutes
|
305
305
|
# total_poll_timeout:
|
306
306
|
# seconds: 54000 # 90 minutes
|
307
|
+
# @!attribute [rw] auto_populated_fields
|
308
|
+
# @return [::Array<::String>]
|
309
|
+
# List of top-level fields of the request message, that should be
|
310
|
+
# automatically populated by the client libraries based on their
|
311
|
+
# (google.api.field_info).format. Currently supported format: UUID4.
|
312
|
+
#
|
313
|
+
# Example of a YAML configuration:
|
314
|
+
#
|
315
|
+
# publishing:
|
316
|
+
# method_settings:
|
317
|
+
# - selector: google.example.v1.ExampleService.CreateExample
|
318
|
+
# auto_populated_fields:
|
319
|
+
# - request_id
|
307
320
|
class MethodSettings
|
308
321
|
include ::Google::Protobuf::MessageExts
|
309
322
|
extend ::Google::Protobuf::MessageExts::ClassMethods
|
@@ -0,0 +1,64 @@
|
|
1
|
+
# frozen_string_literal: true
|
2
|
+
|
3
|
+
# Copyright 2023 Google LLC
|
4
|
+
#
|
5
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
6
|
+
# you may not use this file except in compliance with the License.
|
7
|
+
# You may obtain a copy of the License at
|
8
|
+
#
|
9
|
+
# https://www.apache.org/licenses/LICENSE-2.0
|
10
|
+
#
|
11
|
+
# Unless required by applicable law or agreed to in writing, software
|
12
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
13
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
14
|
+
# See the License for the specific language governing permissions and
|
15
|
+
# limitations under the License.
|
16
|
+
|
17
|
+
# Auto-generated by gapic-generator-ruby. DO NOT EDIT!
|
18
|
+
|
19
|
+
|
20
|
+
module Google
|
21
|
+
module Cloud
|
22
|
+
module AIPlatform
|
23
|
+
module V1
|
24
|
+
# Request message for ComputeTokens RPC call.
|
25
|
+
# @!attribute [rw] endpoint
|
26
|
+
# @return [::String]
|
27
|
+
# Required. The name of the Endpoint requested to get lists of tokens and
|
28
|
+
# token ids.
|
29
|
+
# @!attribute [rw] instances
|
30
|
+
# @return [::Array<::Google::Protobuf::Value>]
|
31
|
+
# Required. The instances that are the input to token computing API call.
|
32
|
+
# Schema is identical to the prediction schema of the text model, even for
|
33
|
+
# the non-text models, like chat models, or Codey models.
|
34
|
+
class ComputeTokensRequest
|
35
|
+
include ::Google::Protobuf::MessageExts
|
36
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
37
|
+
end
|
38
|
+
|
39
|
+
# Tokens info with a list of tokens and the corresponding list of token ids.
|
40
|
+
# @!attribute [rw] tokens
|
41
|
+
# @return [::Array<::String>]
|
42
|
+
# A list of tokens from the input.
|
43
|
+
# @!attribute [rw] token_ids
|
44
|
+
# @return [::Array<::Integer>]
|
45
|
+
# A list of token ids from the input.
|
46
|
+
class TokensInfo
|
47
|
+
include ::Google::Protobuf::MessageExts
|
48
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
49
|
+
end
|
50
|
+
|
51
|
+
# Response message for ComputeTokens RPC call.
|
52
|
+
# @!attribute [rw] tokens_info
|
53
|
+
# @return [::Array<::Google::Cloud::AIPlatform::V1::TokensInfo>]
|
54
|
+
# Lists of tokens info from the input. A ComputeTokensRequest could have
|
55
|
+
# multiple instances with a prompt in each instance. We also need to return
|
56
|
+
# lists of tokens info for the request with multiple instances.
|
57
|
+
class ComputeTokensResponse
|
58
|
+
include ::Google::Protobuf::MessageExts
|
59
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
60
|
+
end
|
61
|
+
end
|
62
|
+
end
|
63
|
+
end
|
64
|
+
end
|
@@ -663,6 +663,31 @@ module Google
|
|
663
663
|
# (Vertex AI makes this value available to your container code as the
|
664
664
|
# [`AIP_DEPLOYED_MODEL_ID` environment
|
665
665
|
# variable](https://cloud.google.com/vertex-ai/docs/predictions/custom-container-requirements#aip-variables).)
|
666
|
+
# @!attribute [rw] grpc_ports
|
667
|
+
# @return [::Array<::Google::Cloud::AIPlatform::V1::Port>]
|
668
|
+
# Immutable. List of ports to expose from the container. Vertex AI sends gRPC
|
669
|
+
# prediction requests that it receives to the first port on this list. Vertex
|
670
|
+
# AI also sends liveness and health checks to this port.
|
671
|
+
#
|
672
|
+
# If you do not specify this field, gRPC requests to the container will be
|
673
|
+
# disabled.
|
674
|
+
#
|
675
|
+
# Vertex AI does not use ports other than the first one listed. This field
|
676
|
+
# corresponds to the `ports` field of the Kubernetes Containers v1 core API.
|
677
|
+
# @!attribute [rw] deployment_timeout
|
678
|
+
# @return [::Google::Protobuf::Duration]
|
679
|
+
# Immutable. Deployment timeout.
|
680
|
+
# Limit for deployment timeout is 2 hours.
|
681
|
+
# @!attribute [rw] shared_memory_size_mb
|
682
|
+
# @return [::Integer]
|
683
|
+
# Immutable. The amount of the VM memory to reserve as the shared memory for
|
684
|
+
# the model in megabytes.
|
685
|
+
# @!attribute [rw] startup_probe
|
686
|
+
# @return [::Google::Cloud::AIPlatform::V1::Probe]
|
687
|
+
# Immutable. Specification for Kubernetes startup probe.
|
688
|
+
# @!attribute [rw] health_probe
|
689
|
+
# @return [::Google::Cloud::AIPlatform::V1::Probe]
|
690
|
+
# Immutable. Specification for Kubernetes readiness probe.
|
666
691
|
class ModelContainerSpec
|
667
692
|
include ::Google::Protobuf::MessageExts
|
668
693
|
extend ::Google::Protobuf::MessageExts::ClassMethods
|
@@ -712,6 +737,42 @@ module Google
|
|
712
737
|
GENIE = 5
|
713
738
|
end
|
714
739
|
end
|
740
|
+
|
741
|
+
# Probe describes a health check to be performed against a container to
|
742
|
+
# determine whether it is alive or ready to receive traffic.
|
743
|
+
# @!attribute [rw] exec
|
744
|
+
# @return [::Google::Cloud::AIPlatform::V1::Probe::ExecAction]
|
745
|
+
# Exec specifies the action to take.
|
746
|
+
# @!attribute [rw] period_seconds
|
747
|
+
# @return [::Integer]
|
748
|
+
# How often (in seconds) to perform the probe. Defaults to 10 seconds.
|
749
|
+
# Minimum value is 1. Must be less than timeout_seconds.
|
750
|
+
#
|
751
|
+
# Maps to Kubernetes probe argument 'periodSeconds'.
|
752
|
+
# @!attribute [rw] timeout_seconds
|
753
|
+
# @return [::Integer]
|
754
|
+
# Number of seconds after which the probe times out. Defaults to 1 second.
|
755
|
+
# Minimum value is 1. Must be greater than or equal to period_seconds.
|
756
|
+
#
|
757
|
+
# Maps to Kubernetes probe argument 'timeoutSeconds'.
|
758
|
+
class Probe
|
759
|
+
include ::Google::Protobuf::MessageExts
|
760
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
761
|
+
|
762
|
+
# ExecAction specifies a command to execute.
|
763
|
+
# @!attribute [rw] command
|
764
|
+
# @return [::Array<::String>]
|
765
|
+
# Command is the command line to execute inside the container, the working
|
766
|
+
# directory for the command is root ('/') in the container's filesystem.
|
767
|
+
# The command is simply exec'd, it is not run inside a shell, so
|
768
|
+
# traditional shell instructions ('|', etc) won't work. To use a shell, you
|
769
|
+
# need to explicitly call out to that shell. Exit status of 0 is treated as
|
770
|
+
# live/healthy and non-zero is unhealthy.
|
771
|
+
class ExecAction
|
772
|
+
include ::Google::Protobuf::MessageExts
|
773
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
774
|
+
end
|
775
|
+
end
|
715
776
|
end
|
716
777
|
end
|
717
778
|
end
|
@@ -115,7 +115,72 @@ module Google
|
|
115
115
|
end
|
116
116
|
|
117
117
|
# Request message for
|
118
|
-
#
|
118
|
+
# {::Google::Cloud::AIPlatform::V1::PredictionService::Client#direct_predict PredictionService.DirectPredict}.
|
119
|
+
# @!attribute [rw] endpoint
|
120
|
+
# @return [::String]
|
121
|
+
# Required. The name of the Endpoint requested to serve the prediction.
|
122
|
+
# Format:
|
123
|
+
# `projects/{project}/locations/{location}/endpoints/{endpoint}`
|
124
|
+
# @!attribute [rw] inputs
|
125
|
+
# @return [::Array<::Google::Cloud::AIPlatform::V1::Tensor>]
|
126
|
+
# The prediction input.
|
127
|
+
# @!attribute [rw] parameters
|
128
|
+
# @return [::Google::Cloud::AIPlatform::V1::Tensor]
|
129
|
+
# The parameters that govern the prediction.
|
130
|
+
class DirectPredictRequest
|
131
|
+
include ::Google::Protobuf::MessageExts
|
132
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
133
|
+
end
|
134
|
+
|
135
|
+
# Response message for
|
136
|
+
# {::Google::Cloud::AIPlatform::V1::PredictionService::Client#direct_predict PredictionService.DirectPredict}.
|
137
|
+
# @!attribute [rw] outputs
|
138
|
+
# @return [::Array<::Google::Cloud::AIPlatform::V1::Tensor>]
|
139
|
+
# The prediction output.
|
140
|
+
# @!attribute [rw] parameters
|
141
|
+
# @return [::Google::Cloud::AIPlatform::V1::Tensor]
|
142
|
+
# The parameters that govern the prediction.
|
143
|
+
class DirectPredictResponse
|
144
|
+
include ::Google::Protobuf::MessageExts
|
145
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
146
|
+
end
|
147
|
+
|
148
|
+
# Request message for
|
149
|
+
# {::Google::Cloud::AIPlatform::V1::PredictionService::Client#direct_raw_predict PredictionService.DirectRawPredict}.
|
150
|
+
# @!attribute [rw] endpoint
|
151
|
+
# @return [::String]
|
152
|
+
# Required. The name of the Endpoint requested to serve the prediction.
|
153
|
+
# Format:
|
154
|
+
# `projects/{project}/locations/{location}/endpoints/{endpoint}`
|
155
|
+
# @!attribute [rw] method_name
|
156
|
+
# @return [::String]
|
157
|
+
# Fully qualified name of the API method being invoked to perform
|
158
|
+
# predictions.
|
159
|
+
#
|
160
|
+
# Format:
|
161
|
+
# `/namespace.Service/Method/`
|
162
|
+
# Example:
|
163
|
+
# `/tensorflow.serving.PredictionService/Predict`
|
164
|
+
# @!attribute [rw] input
|
165
|
+
# @return [::String]
|
166
|
+
# The prediction input.
|
167
|
+
class DirectRawPredictRequest
|
168
|
+
include ::Google::Protobuf::MessageExts
|
169
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
170
|
+
end
|
171
|
+
|
172
|
+
# Response message for
|
173
|
+
# {::Google::Cloud::AIPlatform::V1::PredictionService::Client#direct_raw_predict PredictionService.DirectRawPredict}.
|
174
|
+
# @!attribute [rw] output
|
175
|
+
# @return [::String]
|
176
|
+
# The prediction output.
|
177
|
+
class DirectRawPredictResponse
|
178
|
+
include ::Google::Protobuf::MessageExts
|
179
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
180
|
+
end
|
181
|
+
|
182
|
+
# Request message for
|
183
|
+
# {::Google::Cloud::AIPlatform::V1::PredictionService::Client#streaming_predict PredictionService.StreamingPredict}.
|
119
184
|
#
|
120
185
|
# The first message must contain
|
121
186
|
# {::Google::Cloud::AIPlatform::V1::StreamingPredictRequest#endpoint endpoint} field
|
@@ -137,7 +202,7 @@ module Google
|
|
137
202
|
end
|
138
203
|
|
139
204
|
# Response message for
|
140
|
-
#
|
205
|
+
# {::Google::Cloud::AIPlatform::V1::PredictionService::Client#streaming_predict PredictionService.StreamingPredict}.
|
141
206
|
# @!attribute [rw] outputs
|
142
207
|
# @return [::Array<::Google::Cloud::AIPlatform::V1::Tensor>]
|
143
208
|
# The prediction output.
|
@@ -149,6 +214,51 @@ module Google
|
|
149
214
|
extend ::Google::Protobuf::MessageExts::ClassMethods
|
150
215
|
end
|
151
216
|
|
217
|
+
# Request message for
|
218
|
+
# {::Google::Cloud::AIPlatform::V1::PredictionService::Client#streaming_raw_predict PredictionService.StreamingRawPredict}.
|
219
|
+
#
|
220
|
+
# The first message must contain
|
221
|
+
# {::Google::Cloud::AIPlatform::V1::StreamingRawPredictRequest#endpoint endpoint}
|
222
|
+
# and
|
223
|
+
# {::Google::Cloud::AIPlatform::V1::StreamingRawPredictRequest#method_name method_name}
|
224
|
+
# fields and optionally
|
225
|
+
# {::Google::Cloud::AIPlatform::V1::StreamingRawPredictRequest#input input}. The
|
226
|
+
# subsequent messages must contain
|
227
|
+
# {::Google::Cloud::AIPlatform::V1::StreamingRawPredictRequest#input input}.
|
228
|
+
# {::Google::Cloud::AIPlatform::V1::StreamingRawPredictRequest#method_name method_name}
|
229
|
+
# in the subsequent messages has no effect.
|
230
|
+
# @!attribute [rw] endpoint
|
231
|
+
# @return [::String]
|
232
|
+
# Required. The name of the Endpoint requested to serve the prediction.
|
233
|
+
# Format:
|
234
|
+
# `projects/{project}/locations/{location}/endpoints/{endpoint}`
|
235
|
+
# @!attribute [rw] method_name
|
236
|
+
# @return [::String]
|
237
|
+
# Fully qualified name of the API method being invoked to perform
|
238
|
+
# predictions.
|
239
|
+
#
|
240
|
+
# Format:
|
241
|
+
# `/namespace.Service/Method/`
|
242
|
+
# Example:
|
243
|
+
# `/tensorflow.serving.PredictionService/Predict`
|
244
|
+
# @!attribute [rw] input
|
245
|
+
# @return [::String]
|
246
|
+
# The prediction input.
|
247
|
+
class StreamingRawPredictRequest
|
248
|
+
include ::Google::Protobuf::MessageExts
|
249
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
250
|
+
end
|
251
|
+
|
252
|
+
# Response message for
|
253
|
+
# {::Google::Cloud::AIPlatform::V1::PredictionService::Client#streaming_raw_predict PredictionService.StreamingRawPredict}.
|
254
|
+
# @!attribute [rw] output
|
255
|
+
# @return [::String]
|
256
|
+
# The prediction output.
|
257
|
+
class StreamingRawPredictResponse
|
258
|
+
include ::Google::Protobuf::MessageExts
|
259
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
260
|
+
end
|
261
|
+
|
152
262
|
# Request message for
|
153
263
|
# {::Google::Cloud::AIPlatform::V1::PredictionService::Client#explain PredictionService.Explain}.
|
154
264
|
# @!attribute [rw] endpoint
|
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: google-cloud-ai_platform-v1
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.34.0
|
4
|
+
version: 0.35.0
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Google LLC
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date: 2023-
|
11
|
+
date: 2023-12-04 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: gapic-common
|
@@ -260,6 +260,10 @@ files:
|
|
260
260
|
- lib/google/cloud/ai_platform/v1/job_service/credentials.rb
|
261
261
|
- lib/google/cloud/ai_platform/v1/job_service/operations.rb
|
262
262
|
- lib/google/cloud/ai_platform/v1/job_service/paths.rb
|
263
|
+
- lib/google/cloud/ai_platform/v1/llm_utility_service.rb
|
264
|
+
- lib/google/cloud/ai_platform/v1/llm_utility_service/client.rb
|
265
|
+
- lib/google/cloud/ai_platform/v1/llm_utility_service/credentials.rb
|
266
|
+
- lib/google/cloud/ai_platform/v1/llm_utility_service/paths.rb
|
263
267
|
- lib/google/cloud/ai_platform/v1/match_service.rb
|
264
268
|
- lib/google/cloud/ai_platform/v1/match_service/client.rb
|
265
269
|
- lib/google/cloud/ai_platform/v1/match_service/credentials.rb
|
@@ -371,6 +375,8 @@ files:
|
|
371
375
|
- lib/google/cloud/aiplatform/v1/job_service_services_pb.rb
|
372
376
|
- lib/google/cloud/aiplatform/v1/job_state_pb.rb
|
373
377
|
- lib/google/cloud/aiplatform/v1/lineage_subgraph_pb.rb
|
378
|
+
- lib/google/cloud/aiplatform/v1/llm_utility_service_pb.rb
|
379
|
+
- lib/google/cloud/aiplatform/v1/llm_utility_service_services_pb.rb
|
374
380
|
- lib/google/cloud/aiplatform/v1/machine_resources_pb.rb
|
375
381
|
- lib/google/cloud/aiplatform/v1/manual_batch_tuning_parameters_pb.rb
|
376
382
|
- lib/google/cloud/aiplatform/v1/match_service_pb.rb
|
@@ -478,6 +484,7 @@ files:
|
|
478
484
|
- proto_docs/google/cloud/aiplatform/v1/job_service.rb
|
479
485
|
- proto_docs/google/cloud/aiplatform/v1/job_state.rb
|
480
486
|
- proto_docs/google/cloud/aiplatform/v1/lineage_subgraph.rb
|
487
|
+
- proto_docs/google/cloud/aiplatform/v1/llm_utility_service.rb
|
481
488
|
- proto_docs/google/cloud/aiplatform/v1/machine_resources.rb
|
482
489
|
- proto_docs/google/cloud/aiplatform/v1/manual_batch_tuning_parameters.rb
|
483
490
|
- proto_docs/google/cloud/aiplatform/v1/match_service.rb
|