google-apis-aiplatform_v1beta1 0.35.0 → 0.37.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/CHANGELOG.md +9 -0
- data/lib/google/apis/aiplatform_v1beta1/classes.rb +1069 -81
- data/lib/google/apis/aiplatform_v1beta1/gem_version.rb +3 -3
- data/lib/google/apis/aiplatform_v1beta1/representations.rb +435 -1
- data/lib/google/apis/aiplatform_v1beta1/service.rb +320 -6
- metadata +4 -7
@@ -474,7 +474,7 @@ module Google
|
|
474
474
|
end
|
475
475
|
end
|
476
476
|
|
477
|
-
# Create API error message for Vertex Pipeline.
|
477
|
+
# Create API error message for Vertex Pipeline.
|
478
478
|
class CloudAiPlatformCommonCreatePipelineJobApiErrorDetail
|
479
479
|
include Google::Apis::Core::Hashable
|
480
480
|
|
@@ -840,7 +840,8 @@ module Google
|
|
840
840
|
end
|
841
841
|
end
|
842
842
|
|
843
|
-
# The generic reusable api auth config.
|
843
|
+
# The generic reusable api auth config. Deprecated. Please use AuthConfig (
|
844
|
+
# google/cloud/aiplatform/master/auth.proto) instead.
|
844
845
|
class GoogleCloudAiplatformV1beta1ApiAuth
|
845
846
|
include Google::Apis::Core::Hashable
|
846
847
|
|
@@ -1310,15 +1311,22 @@ module Google
|
|
1310
1311
|
class GoogleCloudAiplatformV1beta1AuthConfigApiKeyConfig
|
1311
1312
|
include Google::Apis::Core::Hashable
|
1312
1313
|
|
1313
|
-
#
|
1314
|
+
# Optional. The name of the SecretManager secret version resource storing the
|
1314
1315
|
# API key. Format: `projects/`project`/secrets/`secret`/versions/`version`` -
|
1315
|
-
# If
|
1316
|
-
#
|
1317
|
-
#
|
1316
|
+
# If both `api_key_secret` and `api_key_string` are specified, this field takes
|
1317
|
+
# precedence over `api_key_string`. - If specified, the `secretmanager.versions.
|
1318
|
+
# access` permission should be granted to Vertex AI Extension Service Agent (
|
1319
|
+
# https://cloud.google.com/vertex-ai/docs/general/access-control#service-agents)
|
1320
|
+
# on the specified resource.
|
1318
1321
|
# Corresponds to the JSON property `apiKeySecret`
|
1319
1322
|
# @return [String]
|
1320
1323
|
attr_accessor :api_key_secret
|
1321
1324
|
|
1325
|
+
# Optional. The API key to be used in the request directly.
|
1326
|
+
# Corresponds to the JSON property `apiKeyString`
|
1327
|
+
# @return [String]
|
1328
|
+
attr_accessor :api_key_string
|
1329
|
+
|
1322
1330
|
# Required. The location of the API key.
|
1323
1331
|
# Corresponds to the JSON property `httpElementLocation`
|
1324
1332
|
# @return [String]
|
@@ -1337,6 +1345,7 @@ module Google
|
|
1337
1345
|
# Update properties of this object
|
1338
1346
|
def update!(**args)
|
1339
1347
|
@api_key_secret = args[:api_key_secret] if args.key?(:api_key_secret)
|
1348
|
+
@api_key_string = args[:api_key_string] if args.key?(:api_key_string)
|
1340
1349
|
@http_element_location = args[:http_element_location] if args.key?(:http_element_location)
|
1341
1350
|
@name = args[:name] if args.key?(:name)
|
1342
1351
|
end
|
@@ -1460,22 +1469,22 @@ module Google
|
|
1460
1469
|
class GoogleCloudAiplatformV1beta1AutomaticResources
|
1461
1470
|
include Google::Apis::Core::Hashable
|
1462
1471
|
|
1463
|
-
# Immutable. The maximum number of replicas
|
1464
|
-
#
|
1465
|
-
#
|
1466
|
-
#
|
1467
|
-
#
|
1468
|
-
#
|
1469
|
-
#
|
1470
|
-
#
|
1472
|
+
# Immutable. The maximum number of replicas that may be deployed on when the
|
1473
|
+
# traffic against it increases. If the requested value is too large, the
|
1474
|
+
# deployment will error, but if deployment succeeds then the ability to scale to
|
1475
|
+
# that many replicas is guaranteed (barring service outages). If traffic
|
1476
|
+
# increases beyond what its replicas at maximum may handle, a portion of the
|
1477
|
+
# traffic will be dropped. If this value is not provided, no upper bound for
|
1478
|
+
# scaling under heavy traffic will be assumed, though Vertex AI may be unable to
|
1479
|
+
# scale beyond a certain replica number.
|
1471
1480
|
# Corresponds to the JSON property `maxReplicaCount`
|
1472
1481
|
# @return [Fixnum]
|
1473
1482
|
attr_accessor :max_replica_count
|
1474
1483
|
|
1475
|
-
# Immutable. The minimum number of replicas
|
1476
|
-
#
|
1477
|
-
#
|
1478
|
-
#
|
1484
|
+
# Immutable. The minimum number of replicas that will be always deployed on. If
|
1485
|
+
# traffic against it increases, it may dynamically be deployed onto more
|
1486
|
+
# replicas up to max_replica_count, and as traffic decreases, some of these
|
1487
|
+
# extra replicas may be freed. If the requested value is too large, the
|
1479
1488
|
# deployment will error.
|
1480
1489
|
# Corresponds to the JSON property `minReplicaCount`
|
1481
1490
|
# @return [Fixnum]
|
@@ -1492,6 +1501,48 @@ module Google
|
|
1492
1501
|
end
|
1493
1502
|
end
|
1494
1503
|
|
1504
|
+
# The configs for autorater. This is applicable to both EvaluateInstances and
|
1505
|
+
# EvaluateDataset.
|
1506
|
+
class GoogleCloudAiplatformV1beta1AutoraterConfig
|
1507
|
+
include Google::Apis::Core::Hashable
|
1508
|
+
|
1509
|
+
# Optional. The fully qualified name of the publisher model or tuned autorater
|
1510
|
+
# endpoint to use. Publisher model format: `projects/`project`/locations/`
|
1511
|
+
# location`/publishers/*/models/*` Tuned model endpoint format: `projects/`
|
1512
|
+
# project`/locations/`location`/endpoints/`endpoint``
|
1513
|
+
# Corresponds to the JSON property `autoraterModel`
|
1514
|
+
# @return [String]
|
1515
|
+
attr_accessor :autorater_model
|
1516
|
+
|
1517
|
+
# Optional. Whether to flip the candidate and baseline responses. This is only
|
1518
|
+
# applicable to the pairwise metric. If enabled, also provide PairwiseMetricSpec.
|
1519
|
+
# candidate_response_field_name and PairwiseMetricSpec.
|
1520
|
+
# baseline_response_field_name. When rendering PairwiseMetricSpec.
|
1521
|
+
# metric_prompt_template, the candidate and baseline fields will be flipped for
|
1522
|
+
# half of the samples to reduce bias.
|
1523
|
+
# Corresponds to the JSON property `flipEnabled`
|
1524
|
+
# @return [Boolean]
|
1525
|
+
attr_accessor :flip_enabled
|
1526
|
+
alias_method :flip_enabled?, :flip_enabled
|
1527
|
+
|
1528
|
+
# Optional. Number of samples for each instance in the dataset. If not specified,
|
1529
|
+
# the default is 4. Minimum value is 1, maximum value is 32.
|
1530
|
+
# Corresponds to the JSON property `samplingCount`
|
1531
|
+
# @return [Fixnum]
|
1532
|
+
attr_accessor :sampling_count
|
1533
|
+
|
1534
|
+
def initialize(**args)
|
1535
|
+
update!(**args)
|
1536
|
+
end
|
1537
|
+
|
1538
|
+
# Update properties of this object
|
1539
|
+
def update!(**args)
|
1540
|
+
@autorater_model = args[:autorater_model] if args.key?(:autorater_model)
|
1541
|
+
@flip_enabled = args[:flip_enabled] if args.key?(:flip_enabled)
|
1542
|
+
@sampling_count = args[:sampling_count] if args.key?(:sampling_count)
|
1543
|
+
end
|
1544
|
+
end
|
1545
|
+
|
1495
1546
|
# The metric specification that defines the target resource utilization (CPU
|
1496
1547
|
# utilization, accelerator's duty cycle, and so on) for calculating the desired
|
1497
1548
|
# replica count.
|
@@ -2738,7 +2789,7 @@ module Google
|
|
2738
2789
|
end
|
2739
2790
|
end
|
2740
2791
|
|
2741
|
-
# Content blob.
|
2792
|
+
# Content blob.
|
2742
2793
|
class GoogleCloudAiplatformV1beta1Blob
|
2743
2794
|
include Google::Apis::Core::Hashable
|
2744
2795
|
|
@@ -2748,6 +2799,13 @@ module Google
|
|
2748
2799
|
# @return [String]
|
2749
2800
|
attr_accessor :data
|
2750
2801
|
|
2802
|
+
# Optional. Display name of the blob. Used to provide a label or filename to
|
2803
|
+
# distinguish blobs. This field is only returned in PromptMessage for prompt
|
2804
|
+
# management. It is not currently used in the Gemini GenerateContent calls.
|
2805
|
+
# Corresponds to the JSON property `displayName`
|
2806
|
+
# @return [String]
|
2807
|
+
attr_accessor :display_name
|
2808
|
+
|
2751
2809
|
# Required. The IANA standard MIME type of the source data.
|
2752
2810
|
# Corresponds to the JSON property `mimeType`
|
2753
2811
|
# @return [String]
|
@@ -2760,6 +2818,7 @@ module Google
|
|
2760
2818
|
# Update properties of this object
|
2761
2819
|
def update!(**args)
|
2762
2820
|
@data = args[:data] if args.key?(:data)
|
2821
|
+
@display_name = args[:display_name] if args.key?(:display_name)
|
2763
2822
|
@mime_type = args[:mime_type] if args.key?(:mime_type)
|
2764
2823
|
end
|
2765
2824
|
end
|
@@ -2844,7 +2903,7 @@ module Google
|
|
2844
2903
|
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1Content>]
|
2845
2904
|
attr_accessor :contents
|
2846
2905
|
|
2847
|
-
# Output only.
|
2906
|
+
# Output only. Creation time of the cache entry.
|
2848
2907
|
# Corresponds to the JSON property `createTime`
|
2849
2908
|
# @return [String]
|
2850
2909
|
attr_accessor :create_time
|
@@ -2861,8 +2920,9 @@ module Google
|
|
2861
2920
|
# @return [String]
|
2862
2921
|
attr_accessor :expire_time
|
2863
2922
|
|
2864
|
-
# Immutable. The name of the
|
2865
|
-
# projects/`
|
2923
|
+
# Immutable. The name of the `Model` to use for cached content. Currently, only
|
2924
|
+
# the published Gemini base models are supported, in form of projects/`PROJECT`/
|
2925
|
+
# locations/`LOCATION`/publishers/google/models/`MODEL`
|
2866
2926
|
# Corresponds to the JSON property `model`
|
2867
2927
|
# @return [String]
|
2868
2928
|
attr_accessor :model
|
@@ -4152,6 +4212,11 @@ module Google
|
|
4152
4212
|
class GoogleCloudAiplatformV1beta1CountTokensResponse
|
4153
4213
|
include Google::Apis::Core::Hashable
|
4154
4214
|
|
4215
|
+
# Output only. List of modalities that were processed in the request input.
|
4216
|
+
# Corresponds to the JSON property `promptTokensDetails`
|
4217
|
+
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ModalityTokenCount>]
|
4218
|
+
attr_accessor :prompt_tokens_details
|
4219
|
+
|
4155
4220
|
# The total number of billable characters counted across all instances from the
|
4156
4221
|
# request.
|
4157
4222
|
# Corresponds to the JSON property `totalBillableCharacters`
|
@@ -4169,6 +4234,7 @@ module Google
|
|
4169
4234
|
|
4170
4235
|
# Update properties of this object
|
4171
4236
|
def update!(**args)
|
4237
|
+
@prompt_tokens_details = args[:prompt_tokens_details] if args.key?(:prompt_tokens_details)
|
4172
4238
|
@total_billable_characters = args[:total_billable_characters] if args.key?(:total_billable_characters)
|
4173
4239
|
@total_tokens = args[:total_tokens] if args.key?(:total_tokens)
|
4174
4240
|
end
|
@@ -5504,7 +5570,8 @@ module Google
|
|
5504
5570
|
# @return [String]
|
5505
5571
|
attr_accessor :model_reference
|
5506
5572
|
|
5507
|
-
# Output only. Identifier. The resource name of the Dataset.
|
5573
|
+
# Output only. Identifier. The resource name of the Dataset. Format: `projects/`
|
5574
|
+
# project`/locations/`location`/datasets/`dataset``
|
5508
5575
|
# Corresponds to the JSON property `name`
|
5509
5576
|
# @return [String]
|
5510
5577
|
attr_accessor :name
|
@@ -5752,7 +5819,9 @@ module Google
|
|
5752
5819
|
# @return [String]
|
5753
5820
|
attr_accessor :model_reference
|
5754
5821
|
|
5755
|
-
# Output only. Identifier. The resource name of the DatasetVersion.
|
5822
|
+
# Output only. Identifier. The resource name of the DatasetVersion. Format: `
|
5823
|
+
# projects/`project`/locations/`location`/datasets/`dataset`/datasetVersions/`
|
5824
|
+
# dataset_version``
|
5756
5825
|
# Corresponds to the JSON property `name`
|
5757
5826
|
# @return [String]
|
5758
5827
|
attr_accessor :name
|
@@ -5793,8 +5862,8 @@ module Google
|
|
5793
5862
|
end
|
5794
5863
|
end
|
5795
5864
|
|
5796
|
-
# A description of resources that are dedicated to a DeployedModel
|
5797
|
-
# need a higher degree of manual configuration.
|
5865
|
+
# A description of resources that are dedicated to a DeployedModel or
|
5866
|
+
# DeployedIndex, and that need a higher degree of manual configuration.
|
5798
5867
|
class GoogleCloudAiplatformV1beta1DedicatedResources
|
5799
5868
|
include Google::Apis::Core::Hashable
|
5800
5869
|
|
@@ -5820,36 +5889,33 @@ module Google
|
|
5820
5889
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1MachineSpec]
|
5821
5890
|
attr_accessor :machine_spec
|
5822
5891
|
|
5823
|
-
# Immutable. The maximum number of replicas
|
5824
|
-
#
|
5825
|
-
#
|
5826
|
-
#
|
5827
|
-
#
|
5828
|
-
#
|
5829
|
-
#
|
5830
|
-
#
|
5831
|
-
#
|
5832
|
-
#
|
5833
|
-
# selected machine type).
|
5892
|
+
# Immutable. The maximum number of replicas that may be deployed on when the
|
5893
|
+
# traffic against it increases. If the requested value is too large, the
|
5894
|
+
# deployment will error, but if deployment succeeds then the ability to scale to
|
5895
|
+
# that many replicas is guaranteed (barring service outages). If traffic
|
5896
|
+
# increases beyond what its replicas at maximum may handle, a portion of the
|
5897
|
+
# traffic will be dropped. If this value is not provided, will use
|
5898
|
+
# min_replica_count as the default value. The value of this field impacts the
|
5899
|
+
# charge against Vertex CPU and GPU quotas. Specifically, you will be charged
|
5900
|
+
# for (max_replica_count * number of cores in the selected machine type) and (
|
5901
|
+
# max_replica_count * number of GPUs per replica in the selected machine type).
|
5834
5902
|
# Corresponds to the JSON property `maxReplicaCount`
|
5835
5903
|
# @return [Fixnum]
|
5836
5904
|
attr_accessor :max_replica_count
|
5837
5905
|
|
5838
|
-
# Required. Immutable. The minimum number of machine replicas
|
5839
|
-
#
|
5840
|
-
#
|
5841
|
-
#
|
5842
|
-
# be freed.
|
5906
|
+
# Required. Immutable. The minimum number of machine replicas that will be
|
5907
|
+
# always deployed on. This value must be greater than or equal to 1. If traffic
|
5908
|
+
# increases, it may dynamically be deployed onto more replicas, and as traffic
|
5909
|
+
# decreases, some of these extra replicas may be freed.
|
5843
5910
|
# Corresponds to the JSON property `minReplicaCount`
|
5844
5911
|
# @return [Fixnum]
|
5845
5912
|
attr_accessor :min_replica_count
|
5846
5913
|
|
5847
5914
|
# Optional. Number of required available replicas for the deployment to succeed.
|
5848
|
-
# This field is only needed when partial
|
5849
|
-
#
|
5850
|
-
#
|
5851
|
-
#
|
5852
|
-
# be min_replica_count.
|
5915
|
+
# This field is only needed when partial deployment/mutation is desired. If set,
|
5916
|
+
# the deploy/mutate operation will succeed once available_replica_count reaches
|
5917
|
+
# required_replica_count, and the rest of the replicas will be retried. If not
|
5918
|
+
# set, the default required_replica_count will be min_replica_count.
|
5853
5919
|
# Corresponds to the JSON property `requiredReplicaCount`
|
5854
5920
|
# @return [Fixnum]
|
5855
5921
|
attr_accessor :required_replica_count
|
@@ -6259,8 +6325,8 @@ module Google
|
|
6259
6325
|
attr_accessor :accept_eula
|
6260
6326
|
alias_method :accept_eula?, :accept_eula
|
6261
6327
|
|
6262
|
-
# A description of resources that are dedicated to a DeployedModel
|
6263
|
-
# need a higher degree of manual configuration.
|
6328
|
+
# A description of resources that are dedicated to a DeployedModel or
|
6329
|
+
# DeployedIndex, and that need a higher degree of manual configuration.
|
6264
6330
|
# Corresponds to the JSON property `dedicatedResources`
|
6265
6331
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DedicatedResources]
|
6266
6332
|
attr_accessor :dedicated_resources
|
@@ -6277,9 +6343,11 @@ module Google
|
|
6277
6343
|
# @return [String]
|
6278
6344
|
attr_accessor :hugging_face_access_token
|
6279
6345
|
|
6280
|
-
# Required. The
|
6281
|
-
#
|
6282
|
-
#
|
6346
|
+
# Required. The model to deploy. Format: 1. `publishers/`publisher`/models/`
|
6347
|
+
# publisher_model`@`version_id``, or `publishers/hf-`hugging-face-author`/models/
|
6348
|
+
# `hugging-face-model-name`@001`. 2. Hugging Face model ID like `google/gemma-2-
|
6349
|
+
# 2b-it`. 3. Custom model Google Cloud Storage URI like `gs://bucket`. 4. Custom
|
6350
|
+
# model zip file like `https://abc.com/a.zip`.
|
6283
6351
|
# Corresponds to the JSON property `model`
|
6284
6352
|
# @return [String]
|
6285
6353
|
attr_accessor :model
|
@@ -6340,8 +6408,8 @@ module Google
|
|
6340
6408
|
# @return [String]
|
6341
6409
|
attr_accessor :create_time
|
6342
6410
|
|
6343
|
-
# A description of resources that are dedicated to a DeployedModel
|
6344
|
-
# need a higher degree of manual configuration.
|
6411
|
+
# A description of resources that are dedicated to a DeployedModel or
|
6412
|
+
# DeployedIndex, and that need a higher degree of manual configuration.
|
6345
6413
|
# Corresponds to the JSON property `dedicatedResources`
|
6346
6414
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DedicatedResources]
|
6347
6415
|
attr_accessor :dedicated_resources
|
@@ -6553,8 +6621,8 @@ module Google
|
|
6553
6621
|
# @return [String]
|
6554
6622
|
attr_accessor :create_time
|
6555
6623
|
|
6556
|
-
# A description of resources that are dedicated to a DeployedModel
|
6557
|
-
# need a higher degree of manual configuration.
|
6624
|
+
# A description of resources that are dedicated to a DeployedModel or
|
6625
|
+
# DeployedIndex, and that need a higher degree of manual configuration.
|
6558
6626
|
# Corresponds to the JSON property `dedicatedResources`
|
6559
6627
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DedicatedResources]
|
6560
6628
|
attr_accessor :dedicated_resources
|
@@ -6630,6 +6698,11 @@ module Google
|
|
6630
6698
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1PrivateEndpoints]
|
6631
6699
|
attr_accessor :private_endpoints
|
6632
6700
|
|
6701
|
+
# Configuration for rolling deployments.
|
6702
|
+
# Corresponds to the JSON property `rolloutOptions`
|
6703
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1RolloutOptions]
|
6704
|
+
attr_accessor :rollout_options
|
6705
|
+
|
6633
6706
|
# The service account that the DeployedModel's container runs as. Specify the
|
6634
6707
|
# email address of the service account. If this service account is not specified,
|
6635
6708
|
# the container runs as a service account that doesn't have access to the
|
@@ -6646,6 +6719,11 @@ module Google
|
|
6646
6719
|
# @return [String]
|
6647
6720
|
attr_accessor :shared_resources
|
6648
6721
|
|
6722
|
+
# Configuration for Speculative Decoding.
|
6723
|
+
# Corresponds to the JSON property `speculativeDecodingSpec`
|
6724
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1SpeculativeDecodingSpec]
|
6725
|
+
attr_accessor :speculative_decoding_spec
|
6726
|
+
|
6649
6727
|
# Runtime status of the deployed model.
|
6650
6728
|
# Corresponds to the JSON property `status`
|
6651
6729
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DeployedModelStatus]
|
@@ -6676,8 +6754,10 @@ module Google
|
|
6676
6754
|
@model = args[:model] if args.key?(:model)
|
6677
6755
|
@model_version_id = args[:model_version_id] if args.key?(:model_version_id)
|
6678
6756
|
@private_endpoints = args[:private_endpoints] if args.key?(:private_endpoints)
|
6757
|
+
@rollout_options = args[:rollout_options] if args.key?(:rollout_options)
|
6679
6758
|
@service_account = args[:service_account] if args.key?(:service_account)
|
6680
6759
|
@shared_resources = args[:shared_resources] if args.key?(:shared_resources)
|
6760
|
+
@speculative_decoding_spec = args[:speculative_decoding_spec] if args.key?(:speculative_decoding_spec)
|
6681
6761
|
@status = args[:status] if args.key?(:status)
|
6682
6762
|
@system_labels = args[:system_labels] if args.key?(:system_labels)
|
6683
6763
|
end
|
@@ -6749,8 +6829,8 @@ module Google
|
|
6749
6829
|
# @return [String]
|
6750
6830
|
attr_accessor :create_time
|
6751
6831
|
|
6752
|
-
# A description of resources that are dedicated to a DeployedModel
|
6753
|
-
# need a higher degree of manual configuration.
|
6832
|
+
# A description of resources that are dedicated to a DeployedModel or
|
6833
|
+
# DeployedIndex, and that need a higher degree of manual configuration.
|
6754
6834
|
# Corresponds to the JSON property `dedicatedResources`
|
6755
6835
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DedicatedResources]
|
6756
6836
|
attr_accessor :dedicated_resources
|
@@ -7047,9 +7127,9 @@ module Google
|
|
7047
7127
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DistillationHyperParameters]
|
7048
7128
|
attr_accessor :hyper_parameters
|
7049
7129
|
|
7050
|
-
#
|
7051
|
-
#
|
7052
|
-
#
|
7130
|
+
# Deprecated. A path in a Cloud Storage bucket, which will be treated as the
|
7131
|
+
# root output directory of the distillation pipeline. It is used by the system
|
7132
|
+
# to generate the paths of output artifacts.
|
7053
7133
|
# Corresponds to the JSON property `pipelineRootDirectory`
|
7054
7134
|
# @return [String]
|
7055
7135
|
attr_accessor :pipeline_root_directory
|
@@ -7060,7 +7140,7 @@ module Google
|
|
7060
7140
|
# @return [String]
|
7061
7141
|
attr_accessor :student_model
|
7062
7142
|
|
7063
|
-
#
|
7143
|
+
# Deprecated. Cloud Storage path to file containing training dataset for tuning.
|
7064
7144
|
# The dataset must be formatted as a JSONL file.
|
7065
7145
|
# Corresponds to the JSON property `trainingDatasetUri`
|
7066
7146
|
# @return [String]
|
@@ -7232,6 +7312,11 @@ module Google
|
|
7232
7312
|
# @return [String]
|
7233
7313
|
attr_accessor :etag
|
7234
7314
|
|
7315
|
+
# Configuration for GenAiAdvancedFeatures.
|
7316
|
+
# Corresponds to the JSON property `genAiAdvancedFeaturesConfig`
|
7317
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GenAiAdvancedFeaturesConfig]
|
7318
|
+
attr_accessor :gen_ai_advanced_features_config
|
7319
|
+
|
7235
7320
|
# The labels with user-defined metadata to organize your Endpoints. Label keys
|
7236
7321
|
# and values can be no longer than 64 characters (Unicode codepoints), can only
|
7237
7322
|
# contain lowercase letters, numeric characters, underscores and dashes.
|
@@ -7318,6 +7403,7 @@ module Google
|
|
7318
7403
|
@enable_private_service_connect = args[:enable_private_service_connect] if args.key?(:enable_private_service_connect)
|
7319
7404
|
@encryption_spec = args[:encryption_spec] if args.key?(:encryption_spec)
|
7320
7405
|
@etag = args[:etag] if args.key?(:etag)
|
7406
|
+
@gen_ai_advanced_features_config = args[:gen_ai_advanced_features_config] if args.key?(:gen_ai_advanced_features_config)
|
7321
7407
|
@labels = args[:labels] if args.key?(:labels)
|
7322
7408
|
@model_deployment_monitoring_job = args[:model_deployment_monitoring_job] if args.key?(:model_deployment_monitoring_job)
|
7323
7409
|
@name = args[:name] if args.key?(:name)
|
@@ -7545,10 +7631,54 @@ module Google
|
|
7545
7631
|
end
|
7546
7632
|
end
|
7547
7633
|
|
7634
|
+
# Request message for EvaluationService.EvaluateDataset.
|
7635
|
+
class GoogleCloudAiplatformV1beta1EvaluateDatasetRequest
|
7636
|
+
include Google::Apis::Core::Hashable
|
7637
|
+
|
7638
|
+
# The configs for autorater. This is applicable to both EvaluateInstances and
|
7639
|
+
# EvaluateDataset.
|
7640
|
+
# Corresponds to the JSON property `autoraterConfig`
|
7641
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1AutoraterConfig]
|
7642
|
+
attr_accessor :autorater_config
|
7643
|
+
|
7644
|
+
# The dataset used for evaluation.
|
7645
|
+
# Corresponds to the JSON property `dataset`
|
7646
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1EvaluationDataset]
|
7647
|
+
attr_accessor :dataset
|
7648
|
+
|
7649
|
+
# Required. The metrics used for evaluation.
|
7650
|
+
# Corresponds to the JSON property `metrics`
|
7651
|
+
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1Metric>]
|
7652
|
+
attr_accessor :metrics
|
7653
|
+
|
7654
|
+
# Config for evaluation output.
|
7655
|
+
# Corresponds to the JSON property `outputConfig`
|
7656
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1OutputConfig]
|
7657
|
+
attr_accessor :output_config
|
7658
|
+
|
7659
|
+
def initialize(**args)
|
7660
|
+
update!(**args)
|
7661
|
+
end
|
7662
|
+
|
7663
|
+
# Update properties of this object
|
7664
|
+
def update!(**args)
|
7665
|
+
@autorater_config = args[:autorater_config] if args.key?(:autorater_config)
|
7666
|
+
@dataset = args[:dataset] if args.key?(:dataset)
|
7667
|
+
@metrics = args[:metrics] if args.key?(:metrics)
|
7668
|
+
@output_config = args[:output_config] if args.key?(:output_config)
|
7669
|
+
end
|
7670
|
+
end
|
7671
|
+
|
7548
7672
|
# Request message for EvaluationService.EvaluateInstances.
|
7549
7673
|
class GoogleCloudAiplatformV1beta1EvaluateInstancesRequest
|
7550
7674
|
include Google::Apis::Core::Hashable
|
7551
7675
|
|
7676
|
+
# The configs for autorater. This is applicable to both EvaluateInstances and
|
7677
|
+
# EvaluateDataset.
|
7678
|
+
# Corresponds to the JSON property `autoraterConfig`
|
7679
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1AutoraterConfig]
|
7680
|
+
attr_accessor :autorater_config
|
7681
|
+
|
7552
7682
|
# Input for bleu metric.
|
7553
7683
|
# Corresponds to the JSON property `bleuInput`
|
7554
7684
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1BleuInput]
|
@@ -7710,6 +7840,7 @@ module Google
|
|
7710
7840
|
|
7711
7841
|
# Update properties of this object
|
7712
7842
|
def update!(**args)
|
7843
|
+
@autorater_config = args[:autorater_config] if args.key?(:autorater_config)
|
7713
7844
|
@bleu_input = args[:bleu_input] if args.key?(:bleu_input)
|
7714
7845
|
@coherence_input = args[:coherence_input] if args.key?(:coherence_input)
|
7715
7846
|
@comet_input = args[:comet_input] if args.key?(:comet_input)
|
@@ -8049,6 +8180,31 @@ module Google
|
|
8049
8180
|
end
|
8050
8181
|
end
|
8051
8182
|
|
8183
|
+
# The dataset used for evaluation.
|
8184
|
+
class GoogleCloudAiplatformV1beta1EvaluationDataset
|
8185
|
+
include Google::Apis::Core::Hashable
|
8186
|
+
|
8187
|
+
# The BigQuery location for the input content.
|
8188
|
+
# Corresponds to the JSON property `bigquerySource`
|
8189
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1BigQuerySource]
|
8190
|
+
attr_accessor :bigquery_source
|
8191
|
+
|
8192
|
+
# The Google Cloud Storage location for the input content.
|
8193
|
+
# Corresponds to the JSON property `gcsSource`
|
8194
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GcsSource]
|
8195
|
+
attr_accessor :gcs_source
|
8196
|
+
|
8197
|
+
def initialize(**args)
|
8198
|
+
update!(**args)
|
8199
|
+
end
|
8200
|
+
|
8201
|
+
# Update properties of this object
|
8202
|
+
def update!(**args)
|
8203
|
+
@bigquery_source = args[:bigquery_source] if args.key?(:bigquery_source)
|
8204
|
+
@gcs_source = args[:gcs_source] if args.key?(:gcs_source)
|
8205
|
+
end
|
8206
|
+
end
|
8207
|
+
|
8052
8208
|
# An edge describing the relationship between an Artifact and an Execution in a
|
8053
8209
|
# lineage graph.
|
8054
8210
|
class GoogleCloudAiplatformV1beta1Event
|
@@ -9572,6 +9728,51 @@ module Google
|
|
9572
9728
|
end
|
9573
9729
|
end
|
9574
9730
|
|
9731
|
+
# Runtime operation information for ModelGardenService.ExportPublisherModel.
|
9732
|
+
class GoogleCloudAiplatformV1beta1ExportPublisherModelOperationMetadata
|
9733
|
+
include Google::Apis::Core::Hashable
|
9734
|
+
|
9735
|
+
# Generic Metadata shared by all operations.
|
9736
|
+
# Corresponds to the JSON property `genericMetadata`
|
9737
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GenericOperationMetadata]
|
9738
|
+
attr_accessor :generic_metadata
|
9739
|
+
|
9740
|
+
def initialize(**args)
|
9741
|
+
update!(**args)
|
9742
|
+
end
|
9743
|
+
|
9744
|
+
# Update properties of this object
|
9745
|
+
def update!(**args)
|
9746
|
+
@generic_metadata = args[:generic_metadata] if args.key?(:generic_metadata)
|
9747
|
+
end
|
9748
|
+
end
|
9749
|
+
|
9750
|
+
# Response message for ModelGardenService.ExportPublisherModel.
|
9751
|
+
class GoogleCloudAiplatformV1beta1ExportPublisherModelResponse
|
9752
|
+
include Google::Apis::Core::Hashable
|
9753
|
+
|
9754
|
+
# The destination uri of the model weights.
|
9755
|
+
# Corresponds to the JSON property `destinationUri`
|
9756
|
+
# @return [String]
|
9757
|
+
attr_accessor :destination_uri
|
9758
|
+
|
9759
|
+
# The name of the PublisherModel resource. Format: `publishers/`publisher`/
|
9760
|
+
# models/`publisher_model`@`version_id``
|
9761
|
+
# Corresponds to the JSON property `publisherModel`
|
9762
|
+
# @return [String]
|
9763
|
+
attr_accessor :publisher_model
|
9764
|
+
|
9765
|
+
def initialize(**args)
|
9766
|
+
update!(**args)
|
9767
|
+
end
|
9768
|
+
|
9769
|
+
# Update properties of this object
|
9770
|
+
def update!(**args)
|
9771
|
+
@destination_uri = args[:destination_uri] if args.key?(:destination_uri)
|
9772
|
+
@publisher_model = args[:publisher_model] if args.key?(:publisher_model)
|
9773
|
+
end
|
9774
|
+
end
|
9775
|
+
|
9575
9776
|
# Request message for TensorboardService.ExportTensorboardTimeSeriesData.
|
9576
9777
|
class GoogleCloudAiplatformV1beta1ExportTensorboardTimeSeriesDataRequest
|
9577
9778
|
include Google::Apis::Core::Hashable
|
@@ -12183,6 +12384,14 @@ module Google
|
|
12183
12384
|
class GoogleCloudAiplatformV1beta1FileData
|
12184
12385
|
include Google::Apis::Core::Hashable
|
12185
12386
|
|
12387
|
+
# Optional. Display name of the file data. Used to provide a label or filename
|
12388
|
+
# to distinguish file datas. This field is only returned in PromptMessage for
|
12389
|
+
# prompt management. It is not currently used in the Gemini GenerateContent
|
12390
|
+
# calls.
|
12391
|
+
# Corresponds to the JSON property `displayName`
|
12392
|
+
# @return [String]
|
12393
|
+
attr_accessor :display_name
|
12394
|
+
|
12186
12395
|
# Required. URI.
|
12187
12396
|
# Corresponds to the JSON property `fileUri`
|
12188
12397
|
# @return [String]
|
@@ -12199,6 +12408,7 @@ module Google
|
|
12199
12408
|
|
12200
12409
|
# Update properties of this object
|
12201
12410
|
def update!(**args)
|
12411
|
+
@display_name = args[:display_name] if args.key?(:display_name)
|
12202
12412
|
@file_uri = args[:file_uri] if args.key?(:file_uri)
|
12203
12413
|
@mime_type = args[:mime_type] if args.key?(:mime_type)
|
12204
12414
|
end
|
@@ -12881,6 +13091,47 @@ module Google
|
|
12881
13091
|
end
|
12882
13092
|
end
|
12883
13093
|
|
13094
|
+
# Configuration for GenAiAdvancedFeatures.
|
13095
|
+
class GoogleCloudAiplatformV1beta1GenAiAdvancedFeaturesConfig
|
13096
|
+
include Google::Apis::Core::Hashable
|
13097
|
+
|
13098
|
+
# Configuration for Retrieval Augmented Generation feature.
|
13099
|
+
# Corresponds to the JSON property `ragConfig`
|
13100
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GenAiAdvancedFeaturesConfigRagConfig]
|
13101
|
+
attr_accessor :rag_config
|
13102
|
+
|
13103
|
+
def initialize(**args)
|
13104
|
+
update!(**args)
|
13105
|
+
end
|
13106
|
+
|
13107
|
+
# Update properties of this object
|
13108
|
+
def update!(**args)
|
13109
|
+
@rag_config = args[:rag_config] if args.key?(:rag_config)
|
13110
|
+
end
|
13111
|
+
end
|
13112
|
+
|
13113
|
+
# Configuration for Retrieval Augmented Generation feature.
|
13114
|
+
class GoogleCloudAiplatformV1beta1GenAiAdvancedFeaturesConfigRagConfig
|
13115
|
+
include Google::Apis::Core::Hashable
|
13116
|
+
|
13117
|
+
# If true, enable Retrieval Augmented Generation in ChatCompletion request. Once
|
13118
|
+
# enabled, the endpoint will be identified as a GenAI endpoint and the Arthedain
|
13119
|
+
# router will be used.
|
13120
|
+
# Corresponds to the JSON property `enableRag`
|
13121
|
+
# @return [Boolean]
|
13122
|
+
attr_accessor :enable_rag
|
13123
|
+
alias_method :enable_rag?, :enable_rag
|
13124
|
+
|
13125
|
+
def initialize(**args)
|
13126
|
+
update!(**args)
|
13127
|
+
end
|
13128
|
+
|
13129
|
+
# Update properties of this object
|
13130
|
+
def update!(**args)
|
13131
|
+
@enable_rag = args[:enable_rag] if args.key?(:enable_rag)
|
13132
|
+
end
|
13133
|
+
end
|
13134
|
+
|
12884
13135
|
# Request message for NotebookInternalService.GenerateAccessToken.
|
12885
13136
|
class GoogleCloudAiplatformV1beta1GenerateAccessTokenRequest
|
12886
13137
|
include Google::Apis::Core::Hashable
|
@@ -13028,6 +13279,11 @@ module Google
|
|
13028
13279
|
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1Candidate>]
|
13029
13280
|
attr_accessor :candidates
|
13030
13281
|
|
13282
|
+
# Output only. Timestamp when the request is made to the server.
|
13283
|
+
# Corresponds to the JSON property `createTime`
|
13284
|
+
# @return [String]
|
13285
|
+
attr_accessor :create_time
|
13286
|
+
|
13031
13287
|
# Output only. The model version used to generate the response.
|
13032
13288
|
# Corresponds to the JSON property `modelVersion`
|
13033
13289
|
# @return [String]
|
@@ -13038,6 +13294,12 @@ module Google
|
|
13038
13294
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GenerateContentResponsePromptFeedback]
|
13039
13295
|
attr_accessor :prompt_feedback
|
13040
13296
|
|
13297
|
+
# Output only. response_id is used to identify each response. It is the encoding
|
13298
|
+
# of the event_id.
|
13299
|
+
# Corresponds to the JSON property `responseId`
|
13300
|
+
# @return [String]
|
13301
|
+
attr_accessor :response_id
|
13302
|
+
|
13041
13303
|
# Usage metadata about response(s).
|
13042
13304
|
# Corresponds to the JSON property `usageMetadata`
|
13043
13305
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GenerateContentResponseUsageMetadata]
|
@@ -13050,8 +13312,10 @@ module Google
|
|
13050
13312
|
# Update properties of this object
|
13051
13313
|
def update!(**args)
|
13052
13314
|
@candidates = args[:candidates] if args.key?(:candidates)
|
13315
|
+
@create_time = args[:create_time] if args.key?(:create_time)
|
13053
13316
|
@model_version = args[:model_version] if args.key?(:model_version)
|
13054
13317
|
@prompt_feedback = args[:prompt_feedback] if args.key?(:prompt_feedback)
|
13318
|
+
@response_id = args[:response_id] if args.key?(:response_id)
|
13055
13319
|
@usage_metadata = args[:usage_metadata] if args.key?(:usage_metadata)
|
13056
13320
|
end
|
13057
13321
|
end
|
@@ -13091,6 +13355,11 @@ module Google
|
|
13091
13355
|
class GoogleCloudAiplatformV1beta1GenerateContentResponseUsageMetadata
|
13092
13356
|
include Google::Apis::Core::Hashable
|
13093
13357
|
|
13358
|
+
# Output only. List of modalities of the cached content in the request input.
|
13359
|
+
# Corresponds to the JSON property `cacheTokensDetails`
|
13360
|
+
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ModalityTokenCount>]
|
13361
|
+
attr_accessor :cache_tokens_details
|
13362
|
+
|
13094
13363
|
# Output only. Number of tokens in the cached part in the input (the cached
|
13095
13364
|
# content).
|
13096
13365
|
# Corresponds to the JSON property `cachedContentTokenCount`
|
@@ -13102,6 +13371,11 @@ module Google
|
|
13102
13371
|
# @return [Fixnum]
|
13103
13372
|
attr_accessor :candidates_token_count
|
13104
13373
|
|
13374
|
+
# Output only. List of modalities that were returned in the response.
|
13375
|
+
# Corresponds to the JSON property `candidatesTokensDetails`
|
13376
|
+
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ModalityTokenCount>]
|
13377
|
+
attr_accessor :candidates_tokens_details
|
13378
|
+
|
13105
13379
|
# Number of tokens in the request. When `cached_content` is set, this is still
|
13106
13380
|
# the total effective prompt size meaning this includes the number of tokens in
|
13107
13381
|
# the cached content.
|
@@ -13109,6 +13383,11 @@ module Google
|
|
13109
13383
|
# @return [Fixnum]
|
13110
13384
|
attr_accessor :prompt_token_count
|
13111
13385
|
|
13386
|
+
# Output only. List of modalities that were processed in the request input.
|
13387
|
+
# Corresponds to the JSON property `promptTokensDetails`
|
13388
|
+
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ModalityTokenCount>]
|
13389
|
+
attr_accessor :prompt_tokens_details
|
13390
|
+
|
13112
13391
|
# Total token count for prompt and response candidates.
|
13113
13392
|
# Corresponds to the JSON property `totalTokenCount`
|
13114
13393
|
# @return [Fixnum]
|
@@ -13120,9 +13399,12 @@ module Google
|
|
13120
13399
|
|
13121
13400
|
# Update properties of this object
|
13122
13401
|
def update!(**args)
|
13402
|
+
@cache_tokens_details = args[:cache_tokens_details] if args.key?(:cache_tokens_details)
|
13123
13403
|
@cached_content_token_count = args[:cached_content_token_count] if args.key?(:cached_content_token_count)
|
13124
13404
|
@candidates_token_count = args[:candidates_token_count] if args.key?(:candidates_token_count)
|
13405
|
+
@candidates_tokens_details = args[:candidates_tokens_details] if args.key?(:candidates_tokens_details)
|
13125
13406
|
@prompt_token_count = args[:prompt_token_count] if args.key?(:prompt_token_count)
|
13407
|
+
@prompt_tokens_details = args[:prompt_tokens_details] if args.key?(:prompt_tokens_details)
|
13126
13408
|
@total_token_count = args[:total_token_count] if args.key?(:total_token_count)
|
13127
13409
|
end
|
13128
13410
|
end
|
@@ -13189,6 +13471,11 @@ module Google
|
|
13189
13471
|
# @return [Fixnum]
|
13190
13472
|
attr_accessor :max_output_tokens
|
13191
13473
|
|
13474
|
+
# Optional. If specified, the media resolution specified will be used.
|
13475
|
+
# Corresponds to the JSON property `mediaResolution`
|
13476
|
+
# @return [String]
|
13477
|
+
attr_accessor :media_resolution
|
13478
|
+
|
13192
13479
|
# Optional. Positive penalties.
|
13193
13480
|
# Corresponds to the JSON property `presencePenalty`
|
13194
13481
|
# @return [Float]
|
@@ -13246,11 +13533,6 @@ module Google
|
|
13246
13533
|
# @return [Float]
|
13247
13534
|
attr_accessor :temperature
|
13248
13535
|
|
13249
|
-
# Optional. If specified, the token resolution specified will be used.
|
13250
|
-
# Corresponds to the JSON property `tokenResolution`
|
13251
|
-
# @return [String]
|
13252
|
-
attr_accessor :token_resolution
|
13253
|
-
|
13254
13536
|
# Optional. If specified, top-k sampling will be used.
|
13255
13537
|
# Corresponds to the JSON property `topK`
|
13256
13538
|
# @return [Float]
|
@@ -13272,6 +13554,7 @@ module Google
|
|
13272
13554
|
@frequency_penalty = args[:frequency_penalty] if args.key?(:frequency_penalty)
|
13273
13555
|
@logprobs = args[:logprobs] if args.key?(:logprobs)
|
13274
13556
|
@max_output_tokens = args[:max_output_tokens] if args.key?(:max_output_tokens)
|
13557
|
+
@media_resolution = args[:media_resolution] if args.key?(:media_resolution)
|
13275
13558
|
@presence_penalty = args[:presence_penalty] if args.key?(:presence_penalty)
|
13276
13559
|
@response_logprobs = args[:response_logprobs] if args.key?(:response_logprobs)
|
13277
13560
|
@response_mime_type = args[:response_mime_type] if args.key?(:response_mime_type)
|
@@ -13282,7 +13565,6 @@ module Google
|
|
13282
13565
|
@speech_config = args[:speech_config] if args.key?(:speech_config)
|
13283
13566
|
@stop_sequences = args[:stop_sequences] if args.key?(:stop_sequences)
|
13284
13567
|
@temperature = args[:temperature] if args.key?(:temperature)
|
13285
|
-
@token_resolution = args[:token_resolution] if args.key?(:token_resolution)
|
13286
13568
|
@top_k = args[:top_k] if args.key?(:top_k)
|
13287
13569
|
@top_p = args[:top_p] if args.key?(:top_p)
|
13288
13570
|
end
|
@@ -16075,6 +16357,32 @@ module Google
|
|
16075
16357
|
end
|
16076
16358
|
end
|
16077
16359
|
|
16360
|
+
# Response message for ModelService.ListModelVersionCheckpoints
|
16361
|
+
class GoogleCloudAiplatformV1beta1ListModelVersionCheckpointsResponse
|
16362
|
+
include Google::Apis::Core::Hashable
|
16363
|
+
|
16364
|
+
# List of Model Version checkpoints.
|
16365
|
+
# Corresponds to the JSON property `checkpoints`
|
16366
|
+
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ModelVersionCheckpoint>]
|
16367
|
+
attr_accessor :checkpoints
|
16368
|
+
|
16369
|
+
# A token to retrieve the next page of results. Pass to
|
16370
|
+
# ListModelVersionCheckpointsRequest.page_token to obtain that page.
|
16371
|
+
# Corresponds to the JSON property `nextPageToken`
|
16372
|
+
# @return [String]
|
16373
|
+
attr_accessor :next_page_token
|
16374
|
+
|
16375
|
+
def initialize(**args)
|
16376
|
+
update!(**args)
|
16377
|
+
end
|
16378
|
+
|
16379
|
+
# Update properties of this object
|
16380
|
+
def update!(**args)
|
16381
|
+
@checkpoints = args[:checkpoints] if args.key?(:checkpoints)
|
16382
|
+
@next_page_token = args[:next_page_token] if args.key?(:next_page_token)
|
16383
|
+
end
|
16384
|
+
end
|
16385
|
+
|
16078
16386
|
# Response message for ModelService.ListModelVersions
|
16079
16387
|
class GoogleCloudAiplatformV1beta1ListModelVersionsResponse
|
16080
16388
|
include Google::Apis::Core::Hashable
|
@@ -17147,6 +17455,58 @@ module Google
|
|
17147
17455
|
end
|
17148
17456
|
end
|
17149
17457
|
|
17458
|
+
# The metric used for dataset level evaluation.
|
17459
|
+
class GoogleCloudAiplatformV1beta1Metric
|
17460
|
+
include Google::Apis::Core::Hashable
|
17461
|
+
|
17462
|
+
# Optional. The aggregation metrics to use.
|
17463
|
+
# Corresponds to the JSON property `aggregationMetrics`
|
17464
|
+
# @return [Array<String>]
|
17465
|
+
attr_accessor :aggregation_metrics
|
17466
|
+
|
17467
|
+
# Spec for bleu score metric - calculates the precision of n-grams in the
|
17468
|
+
# prediction as compared to reference - returns a score ranging between 0 and 1.
|
17469
|
+
# Corresponds to the JSON property `bleuSpec`
|
17470
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1BleuSpec]
|
17471
|
+
attr_accessor :bleu_spec
|
17472
|
+
|
17473
|
+
# Spec for exact match metric - returns 1 if prediction and reference exactly
|
17474
|
+
# match, otherwise 0.
|
17475
|
+
# Corresponds to the JSON property `exactMatchSpec`
|
17476
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ExactMatchSpec]
|
17477
|
+
attr_accessor :exact_match_spec
|
17478
|
+
|
17479
|
+
# Spec for pairwise metric.
|
17480
|
+
# Corresponds to the JSON property `pairwiseMetricSpec`
|
17481
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1PairwiseMetricSpec]
|
17482
|
+
attr_accessor :pairwise_metric_spec
|
17483
|
+
|
17484
|
+
# Spec for pointwise metric.
|
17485
|
+
# Corresponds to the JSON property `pointwiseMetricSpec`
|
17486
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1PointwiseMetricSpec]
|
17487
|
+
attr_accessor :pointwise_metric_spec
|
17488
|
+
|
17489
|
+
# Spec for rouge score metric - calculates the recall of n-grams in prediction
|
17490
|
+
# as compared to reference - returns a score ranging between 0 and 1.
|
17491
|
+
# Corresponds to the JSON property `rougeSpec`
|
17492
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1RougeSpec]
|
17493
|
+
attr_accessor :rouge_spec
|
17494
|
+
|
17495
|
+
def initialize(**args)
|
17496
|
+
update!(**args)
|
17497
|
+
end
|
17498
|
+
|
17499
|
+
# Update properties of this object
|
17500
|
+
def update!(**args)
|
17501
|
+
@aggregation_metrics = args[:aggregation_metrics] if args.key?(:aggregation_metrics)
|
17502
|
+
@bleu_spec = args[:bleu_spec] if args.key?(:bleu_spec)
|
17503
|
+
@exact_match_spec = args[:exact_match_spec] if args.key?(:exact_match_spec)
|
17504
|
+
@pairwise_metric_spec = args[:pairwise_metric_spec] if args.key?(:pairwise_metric_spec)
|
17505
|
+
@pointwise_metric_spec = args[:pointwise_metric_spec] if args.key?(:pointwise_metric_spec)
|
17506
|
+
@rouge_spec = args[:rouge_spec] if args.key?(:rouge_spec)
|
17507
|
+
end
|
17508
|
+
end
|
17509
|
+
|
17150
17510
|
# Input for MetricX metric.
|
17151
17511
|
class GoogleCloudAiplatformV1beta1MetricxInput
|
17152
17512
|
include Google::Apis::Core::Hashable
|
@@ -17665,6 +18025,31 @@ module Google
|
|
17665
18025
|
end
|
17666
18026
|
end
|
17667
18027
|
|
18028
|
+
# Represents token counting info for a single modality.
|
18029
|
+
class GoogleCloudAiplatformV1beta1ModalityTokenCount
|
18030
|
+
include Google::Apis::Core::Hashable
|
18031
|
+
|
18032
|
+
# The modality associated with this token count.
|
18033
|
+
# Corresponds to the JSON property `modality`
|
18034
|
+
# @return [String]
|
18035
|
+
attr_accessor :modality
|
18036
|
+
|
18037
|
+
# Number of tokens.
|
18038
|
+
# Corresponds to the JSON property `tokenCount`
|
18039
|
+
# @return [Fixnum]
|
18040
|
+
attr_accessor :token_count
|
18041
|
+
|
18042
|
+
def initialize(**args)
|
18043
|
+
update!(**args)
|
18044
|
+
end
|
18045
|
+
|
18046
|
+
# Update properties of this object
|
18047
|
+
def update!(**args)
|
18048
|
+
@modality = args[:modality] if args.key?(:modality)
|
18049
|
+
@token_count = args[:token_count] if args.key?(:token_count)
|
18050
|
+
end
|
18051
|
+
end
|
18052
|
+
|
17668
18053
|
# A trained machine learning Model.
|
17669
18054
|
class GoogleCloudAiplatformV1beta1Model
|
17670
18055
|
include Google::Apis::Core::Hashable
|
@@ -17694,6 +18079,11 @@ module Google
|
|
17694
18079
|
# @return [String]
|
17695
18080
|
attr_accessor :create_time
|
17696
18081
|
|
18082
|
+
# The default checkpoint id of a model version.
|
18083
|
+
# Corresponds to the JSON property `defaultCheckpointId`
|
18084
|
+
# @return [String]
|
18085
|
+
attr_accessor :default_checkpoint_id
|
18086
|
+
|
17697
18087
|
# Output only. The pointers to DeployedModels created from this Model. Note that
|
17698
18088
|
# Model could have been deployed to Endpoints in different Locations.
|
17699
18089
|
# Corresponds to the JSON property `deployedModels`
|
@@ -17908,6 +18298,7 @@ module Google
|
|
17908
18298
|
@base_model_source = args[:base_model_source] if args.key?(:base_model_source)
|
17909
18299
|
@container_spec = args[:container_spec] if args.key?(:container_spec)
|
17910
18300
|
@create_time = args[:create_time] if args.key?(:create_time)
|
18301
|
+
@default_checkpoint_id = args[:default_checkpoint_id] if args.key?(:default_checkpoint_id)
|
17911
18302
|
@deployed_models = args[:deployed_models] if args.key?(:deployed_models)
|
17912
18303
|
@description = args[:description] if args.key?(:description)
|
17913
18304
|
@display_name = args[:display_name] if args.key?(:display_name)
|
@@ -18110,6 +18501,12 @@ module Google
|
|
18110
18501
|
# @return [String]
|
18111
18502
|
attr_accessor :image_uri
|
18112
18503
|
|
18504
|
+
# Probe describes a health check to be performed against a container to
|
18505
|
+
# determine whether it is alive or ready to receive traffic.
|
18506
|
+
# Corresponds to the JSON property `livenessProbe`
|
18507
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1Probe]
|
18508
|
+
attr_accessor :liveness_probe
|
18509
|
+
|
18113
18510
|
# Immutable. List of ports to expose from the container. Vertex AI sends any
|
18114
18511
|
# prediction requests that it receives to the first port on this list. Vertex AI
|
18115
18512
|
# also sends [liveness and health checks](https://cloud.google.com/vertex-ai/
|
@@ -18172,6 +18569,7 @@ module Google
|
|
18172
18569
|
@health_probe = args[:health_probe] if args.key?(:health_probe)
|
18173
18570
|
@health_route = args[:health_route] if args.key?(:health_route)
|
18174
18571
|
@image_uri = args[:image_uri] if args.key?(:image_uri)
|
18572
|
+
@liveness_probe = args[:liveness_probe] if args.key?(:liveness_probe)
|
18175
18573
|
@ports = args[:ports] if args.key?(:ports)
|
18176
18574
|
@predict_route = args[:predict_route] if args.key?(:predict_route)
|
18177
18575
|
@shared_memory_size_mb = args[:shared_memory_size_mb] if args.key?(:shared_memory_size_mb)
|
@@ -18909,7 +19307,7 @@ module Google
|
|
18909
19307
|
# model in SavedModel format. * `tf-js` A [TensorFlow.js](https://www.tensorflow.
|
18910
19308
|
# org/js) model that can be used in the browser and in Node.js using JavaScript.
|
18911
19309
|
# * `core-ml` Used for iOS mobile devices. * `custom-trained` A Model that was
|
18912
|
-
# uploaded or trained by custom code.
|
19310
|
+
# uploaded or trained by custom code. * `genie` A tuned Model Garden model.
|
18913
19311
|
# Corresponds to the JSON property `id`
|
18914
19312
|
# @return [String]
|
18915
19313
|
attr_accessor :id
|
@@ -18935,6 +19333,17 @@ module Google
|
|
18935
19333
|
# @return [String]
|
18936
19334
|
attr_accessor :public_model_name
|
18937
19335
|
|
19336
|
+
# Optional. Whether to avoid pulling the model from the HF cache.
|
19337
|
+
# Corresponds to the JSON property `skipHfModelCache`
|
19338
|
+
# @return [Boolean]
|
19339
|
+
attr_accessor :skip_hf_model_cache
|
19340
|
+
alias_method :skip_hf_model_cache?, :skip_hf_model_cache
|
19341
|
+
|
19342
|
+
# Optional. The model garden source model version ID.
|
19343
|
+
# Corresponds to the JSON property `versionId`
|
19344
|
+
# @return [String]
|
19345
|
+
attr_accessor :version_id
|
19346
|
+
|
18938
19347
|
def initialize(**args)
|
18939
19348
|
update!(**args)
|
18940
19349
|
end
|
@@ -18942,6 +19351,8 @@ module Google
|
|
18942
19351
|
# Update properties of this object
|
18943
19352
|
def update!(**args)
|
18944
19353
|
@public_model_name = args[:public_model_name] if args.key?(:public_model_name)
|
19354
|
+
@skip_hf_model_cache = args[:skip_hf_model_cache] if args.key?(:skip_hf_model_cache)
|
19355
|
+
@version_id = args[:version_id] if args.key?(:version_id)
|
18945
19356
|
end
|
18946
19357
|
end
|
18947
19358
|
|
@@ -20594,6 +21005,45 @@ module Google
|
|
20594
21005
|
end
|
20595
21006
|
end
|
20596
21007
|
|
21008
|
+
# Describes the machine learning model version checkpoint.
|
21009
|
+
class GoogleCloudAiplatformV1beta1ModelVersionCheckpoint
|
21010
|
+
include Google::Apis::Core::Hashable
|
21011
|
+
|
21012
|
+
# The ID of the checkpoint.
|
21013
|
+
# Corresponds to the JSON property `checkpointId`
|
21014
|
+
# @return [String]
|
21015
|
+
attr_accessor :checkpoint_id
|
21016
|
+
|
21017
|
+
# The epoch of the checkpoint.
|
21018
|
+
# Corresponds to the JSON property `epoch`
|
21019
|
+
# @return [Fixnum]
|
21020
|
+
attr_accessor :epoch
|
21021
|
+
|
21022
|
+
# Identifier. The resource name of the ModelVersionCheckpoint. Format: `projects/
|
21023
|
+
# `project`/locations/`location`/models/`model`/versions/`version`/checkpoints/`
|
21024
|
+
# checkpoint``
|
21025
|
+
# Corresponds to the JSON property `name`
|
21026
|
+
# @return [String]
|
21027
|
+
attr_accessor :name
|
21028
|
+
|
21029
|
+
# The step of the checkpoint.
|
21030
|
+
# Corresponds to the JSON property `step`
|
21031
|
+
# @return [Fixnum]
|
21032
|
+
attr_accessor :step
|
21033
|
+
|
21034
|
+
def initialize(**args)
|
21035
|
+
update!(**args)
|
21036
|
+
end
|
21037
|
+
|
21038
|
+
# Update properties of this object
|
21039
|
+
def update!(**args)
|
21040
|
+
@checkpoint_id = args[:checkpoint_id] if args.key?(:checkpoint_id)
|
21041
|
+
@epoch = args[:epoch] if args.key?(:epoch)
|
21042
|
+
@name = args[:name] if args.key?(:name)
|
21043
|
+
@step = args[:step] if args.key?(:step)
|
21044
|
+
end
|
21045
|
+
end
|
21046
|
+
|
20597
21047
|
# Runtime operation information for IndexEndpointService.MutateDeployedIndex.
|
20598
21048
|
class GoogleCloudAiplatformV1beta1MutateDeployedIndexOperationMetadata
|
20599
21049
|
include Google::Apis::Core::Hashable
|
@@ -21703,8 +22153,8 @@ module Google
|
|
21703
22153
|
# @return [String]
|
21704
22154
|
attr_accessor :notebook_runtime_template_resource_name
|
21705
22155
|
|
21706
|
-
#
|
21707
|
-
#
|
22156
|
+
# The Schedule resource name if this job is triggered by one. Format: `projects/`
|
22157
|
+
# project_id`/locations/`location`/schedules/`schedule_id``
|
21708
22158
|
# Corresponds to the JSON property `scheduleResourceName`
|
21709
22159
|
# @return [String]
|
21710
22160
|
attr_accessor :schedule_resource_name
|
@@ -22067,6 +22517,11 @@ module Google
|
|
22067
22517
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ShieldedVmConfig]
|
22068
22518
|
attr_accessor :shielded_vm_config
|
22069
22519
|
|
22520
|
+
# Notebook Software Config.
|
22521
|
+
# Corresponds to the JSON property `softwareConfig`
|
22522
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1NotebookSoftwareConfig]
|
22523
|
+
attr_accessor :software_config
|
22524
|
+
|
22070
22525
|
# Output only. Timestamp when this NotebookRuntime was most recently updated.
|
22071
22526
|
# Corresponds to the JSON property `updateTime`
|
22072
22527
|
# @return [String]
|
@@ -22107,6 +22562,7 @@ module Google
|
|
22107
22562
|
@satisfies_pzs = args[:satisfies_pzs] if args.key?(:satisfies_pzs)
|
22108
22563
|
@service_account = args[:service_account] if args.key?(:service_account)
|
22109
22564
|
@shielded_vm_config = args[:shielded_vm_config] if args.key?(:shielded_vm_config)
|
22565
|
+
@software_config = args[:software_config] if args.key?(:software_config)
|
22110
22566
|
@update_time = args[:update_time] if args.key?(:update_time)
|
22111
22567
|
@version = args[:version] if args.key?(:version)
|
22112
22568
|
end
|
@@ -22225,6 +22681,11 @@ module Google
|
|
22225
22681
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ShieldedVmConfig]
|
22226
22682
|
attr_accessor :shielded_vm_config
|
22227
22683
|
|
22684
|
+
# Notebook Software Config.
|
22685
|
+
# Corresponds to the JSON property `softwareConfig`
|
22686
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1NotebookSoftwareConfig]
|
22687
|
+
attr_accessor :software_config
|
22688
|
+
|
22228
22689
|
# Output only. Timestamp when this NotebookRuntimeTemplate was most recently
|
22229
22690
|
# updated.
|
22230
22691
|
# Corresponds to the JSON property `updateTime`
|
@@ -22254,6 +22715,7 @@ module Google
|
|
22254
22715
|
@notebook_runtime_type = args[:notebook_runtime_type] if args.key?(:notebook_runtime_type)
|
22255
22716
|
@service_account = args[:service_account] if args.key?(:service_account)
|
22256
22717
|
@shielded_vm_config = args[:shielded_vm_config] if args.key?(:shielded_vm_config)
|
22718
|
+
@software_config = args[:software_config] if args.key?(:software_config)
|
22257
22719
|
@update_time = args[:update_time] if args.key?(:update_time)
|
22258
22720
|
end
|
22259
22721
|
end
|
@@ -22277,6 +22739,51 @@ module Google
|
|
22277
22739
|
end
|
22278
22740
|
end
|
22279
22741
|
|
22742
|
+
# Notebook Software Config.
|
22743
|
+
class GoogleCloudAiplatformV1beta1NotebookSoftwareConfig
|
22744
|
+
include Google::Apis::Core::Hashable
|
22745
|
+
|
22746
|
+
# Optional. Environment variables to be passed to the container. Maximum limit
|
22747
|
+
# is 100.
|
22748
|
+
# Corresponds to the JSON property `env`
|
22749
|
+
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1EnvVar>]
|
22750
|
+
attr_accessor :env
|
22751
|
+
|
22752
|
+
# Post startup script config.
|
22753
|
+
# Corresponds to the JSON property `postStartupScriptConfig`
|
22754
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1PostStartupScriptConfig]
|
22755
|
+
attr_accessor :post_startup_script_config
|
22756
|
+
|
22757
|
+
def initialize(**args)
|
22758
|
+
update!(**args)
|
22759
|
+
end
|
22760
|
+
|
22761
|
+
# Update properties of this object
|
22762
|
+
def update!(**args)
|
22763
|
+
@env = args[:env] if args.key?(:env)
|
22764
|
+
@post_startup_script_config = args[:post_startup_script_config] if args.key?(:post_startup_script_config)
|
22765
|
+
end
|
22766
|
+
end
|
22767
|
+
|
22768
|
+
# Config for evaluation output.
|
22769
|
+
class GoogleCloudAiplatformV1beta1OutputConfig
|
22770
|
+
include Google::Apis::Core::Hashable
|
22771
|
+
|
22772
|
+
# The Google Cloud Storage location where the output is to be written to.
|
22773
|
+
# Corresponds to the JSON property `gcsDestination`
|
22774
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GcsDestination]
|
22775
|
+
attr_accessor :gcs_destination
|
22776
|
+
|
22777
|
+
def initialize(**args)
|
22778
|
+
update!(**args)
|
22779
|
+
end
|
22780
|
+
|
22781
|
+
# Update properties of this object
|
22782
|
+
def update!(**args)
|
22783
|
+
@gcs_destination = args[:gcs_destination] if args.key?(:gcs_destination)
|
22784
|
+
end
|
22785
|
+
end
|
22786
|
+
|
22280
22787
|
# PSC config that is used to automatically create forwarding rule via
|
22281
22788
|
# ServiceConnectionMap.
|
22282
22789
|
class GoogleCloudAiplatformV1beta1PscAutomationConfig
|
@@ -22383,18 +22890,36 @@ module Google
|
|
22383
22890
|
class GoogleCloudAiplatformV1beta1PairwiseMetricSpec
|
22384
22891
|
include Google::Apis::Core::Hashable
|
22385
22892
|
|
22893
|
+
# Optional. The field name of the baseline response.
|
22894
|
+
# Corresponds to the JSON property `baselineResponseFieldName`
|
22895
|
+
# @return [String]
|
22896
|
+
attr_accessor :baseline_response_field_name
|
22897
|
+
|
22898
|
+
# Optional. The field name of the candidate response.
|
22899
|
+
# Corresponds to the JSON property `candidateResponseFieldName`
|
22900
|
+
# @return [String]
|
22901
|
+
attr_accessor :candidate_response_field_name
|
22902
|
+
|
22386
22903
|
# Required. Metric prompt template for pairwise metric.
|
22387
22904
|
# Corresponds to the JSON property `metricPromptTemplate`
|
22388
22905
|
# @return [String]
|
22389
22906
|
attr_accessor :metric_prompt_template
|
22390
22907
|
|
22908
|
+
# Optional. System instructions for pairwise metric.
|
22909
|
+
# Corresponds to the JSON property `systemInstruction`
|
22910
|
+
# @return [String]
|
22911
|
+
attr_accessor :system_instruction
|
22912
|
+
|
22391
22913
|
def initialize(**args)
|
22392
22914
|
update!(**args)
|
22393
22915
|
end
|
22394
22916
|
|
22395
22917
|
# Update properties of this object
|
22396
22918
|
def update!(**args)
|
22919
|
+
@baseline_response_field_name = args[:baseline_response_field_name] if args.key?(:baseline_response_field_name)
|
22920
|
+
@candidate_response_field_name = args[:candidate_response_field_name] if args.key?(:candidate_response_field_name)
|
22397
22921
|
@metric_prompt_template = args[:metric_prompt_template] if args.key?(:metric_prompt_template)
|
22922
|
+
@system_instruction = args[:system_instruction] if args.key?(:system_instruction)
|
22398
22923
|
end
|
22399
22924
|
end
|
22400
22925
|
|
@@ -22691,7 +23216,7 @@ module Google
|
|
22691
23216
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1FunctionResponse]
|
22692
23217
|
attr_accessor :function_response
|
22693
23218
|
|
22694
|
-
# Content blob.
|
23219
|
+
# Content blob.
|
22695
23220
|
# Corresponds to the JSON property `inlineData`
|
22696
23221
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1Blob]
|
22697
23222
|
attr_accessor :inline_data
|
@@ -22701,6 +23226,12 @@ module Google
|
|
22701
23226
|
# @return [String]
|
22702
23227
|
attr_accessor :text
|
22703
23228
|
|
23229
|
+
# Output only. Indicates whether the part is a thought from the model.
|
23230
|
+
# Corresponds to the JSON property `thought`
|
23231
|
+
# @return [Boolean]
|
23232
|
+
attr_accessor :thought
|
23233
|
+
alias_method :thought?, :thought
|
23234
|
+
|
22704
23235
|
# Metadata describes the input video content.
|
22705
23236
|
# Corresponds to the JSON property `videoMetadata`
|
22706
23237
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1VideoMetadata]
|
@@ -22719,6 +23250,7 @@ module Google
|
|
22719
23250
|
@function_response = args[:function_response] if args.key?(:function_response)
|
22720
23251
|
@inline_data = args[:inline_data] if args.key?(:inline_data)
|
22721
23252
|
@text = args[:text] if args.key?(:text)
|
23253
|
+
@thought = args[:thought] if args.key?(:thought)
|
22722
23254
|
@video_metadata = args[:video_metadata] if args.key?(:video_metadata)
|
22723
23255
|
end
|
22724
23256
|
end
|
@@ -23785,6 +24317,11 @@ module Google
|
|
23785
24317
|
# @return [String]
|
23786
24318
|
attr_accessor :metric_prompt_template
|
23787
24319
|
|
24320
|
+
# Optional. System instructions for pointwise metric.
|
24321
|
+
# Corresponds to the JSON property `systemInstruction`
|
24322
|
+
# @return [String]
|
24323
|
+
attr_accessor :system_instruction
|
24324
|
+
|
23788
24325
|
def initialize(**args)
|
23789
24326
|
update!(**args)
|
23790
24327
|
end
|
@@ -23792,6 +24329,7 @@ module Google
|
|
23792
24329
|
# Update properties of this object
|
23793
24330
|
def update!(**args)
|
23794
24331
|
@metric_prompt_template = args[:metric_prompt_template] if args.key?(:metric_prompt_template)
|
24332
|
+
@system_instruction = args[:system_instruction] if args.key?(:system_instruction)
|
23795
24333
|
end
|
23796
24334
|
end
|
23797
24335
|
|
@@ -23815,6 +24353,39 @@ module Google
|
|
23815
24353
|
end
|
23816
24354
|
end
|
23817
24355
|
|
24356
|
+
# Post startup script config.
|
24357
|
+
class GoogleCloudAiplatformV1beta1PostStartupScriptConfig
|
24358
|
+
include Google::Apis::Core::Hashable
|
24359
|
+
|
24360
|
+
# Optional. Post startup script to run after runtime is started.
|
24361
|
+
# Corresponds to the JSON property `postStartupScript`
|
24362
|
+
# @return [String]
|
24363
|
+
attr_accessor :post_startup_script
|
24364
|
+
|
24365
|
+
# Optional. Post startup script behavior that defines download and execution
|
24366
|
+
# behavior.
|
24367
|
+
# Corresponds to the JSON property `postStartupScriptBehavior`
|
24368
|
+
# @return [String]
|
24369
|
+
attr_accessor :post_startup_script_behavior
|
24370
|
+
|
24371
|
+
# Optional. Post startup script url to download. Example: https://bucket/script.
|
24372
|
+
# sh
|
24373
|
+
# Corresponds to the JSON property `postStartupScriptUrl`
|
24374
|
+
# @return [String]
|
24375
|
+
attr_accessor :post_startup_script_url
|
24376
|
+
|
24377
|
+
def initialize(**args)
|
24378
|
+
update!(**args)
|
24379
|
+
end
|
24380
|
+
|
24381
|
+
# Update properties of this object
|
24382
|
+
def update!(**args)
|
24383
|
+
@post_startup_script = args[:post_startup_script] if args.key?(:post_startup_script)
|
24384
|
+
@post_startup_script_behavior = args[:post_startup_script_behavior] if args.key?(:post_startup_script_behavior)
|
24385
|
+
@post_startup_script_url = args[:post_startup_script_url] if args.key?(:post_startup_script_url)
|
24386
|
+
end
|
24387
|
+
end
|
24388
|
+
|
23818
24389
|
# The configuration for the prebuilt speaker to use.
|
23819
24390
|
class GoogleCloudAiplatformV1beta1PrebuiltVoiceConfig
|
23820
24391
|
include Google::Apis::Core::Hashable
|
@@ -24221,6 +24792,28 @@ module Google
|
|
24221
24792
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ProbeExecAction]
|
24222
24793
|
attr_accessor :exec
|
24223
24794
|
|
24795
|
+
# Number of consecutive failures before the probe is considered failed. Defaults
|
24796
|
+
# to 3. Minimum value is 1. Maps to Kubernetes probe argument 'failureThreshold'.
|
24797
|
+
# Corresponds to the JSON property `failureThreshold`
|
24798
|
+
# @return [Fixnum]
|
24799
|
+
attr_accessor :failure_threshold
|
24800
|
+
|
24801
|
+
# GrpcAction checks the health of a container using a gRPC service.
|
24802
|
+
# Corresponds to the JSON property `grpc`
|
24803
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ProbeGrpcAction]
|
24804
|
+
attr_accessor :grpc
|
24805
|
+
|
24806
|
+
# HttpGetAction describes an action based on HTTP Get requests.
|
24807
|
+
# Corresponds to the JSON property `httpGet`
|
24808
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ProbeHttpGetAction]
|
24809
|
+
attr_accessor :http_get
|
24810
|
+
|
24811
|
+
# Number of seconds to wait before starting the probe. Defaults to 0. Minimum
|
24812
|
+
# value is 0. Maps to Kubernetes probe argument 'initialDelaySeconds'.
|
24813
|
+
# Corresponds to the JSON property `initialDelaySeconds`
|
24814
|
+
# @return [Fixnum]
|
24815
|
+
attr_accessor :initial_delay_seconds
|
24816
|
+
|
24224
24817
|
# How often (in seconds) to perform the probe. Default to 10 seconds. Minimum
|
24225
24818
|
# value is 1. Must be less than timeout_seconds. Maps to Kubernetes probe
|
24226
24819
|
# argument 'periodSeconds'.
|
@@ -24228,6 +24821,19 @@ module Google
|
|
24228
24821
|
# @return [Fixnum]
|
24229
24822
|
attr_accessor :period_seconds
|
24230
24823
|
|
24824
|
+
# Number of consecutive successes before the probe is considered successful.
|
24825
|
+
# Defaults to 1. Minimum value is 1. Maps to Kubernetes probe argument '
|
24826
|
+
# successThreshold'.
|
24827
|
+
# Corresponds to the JSON property `successThreshold`
|
24828
|
+
# @return [Fixnum]
|
24829
|
+
attr_accessor :success_threshold
|
24830
|
+
|
24831
|
+
# TcpSocketAction probes the health of a container by opening a TCP socket
|
24832
|
+
# connection.
|
24833
|
+
# Corresponds to the JSON property `tcpSocket`
|
24834
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ProbeTcpSocketAction]
|
24835
|
+
attr_accessor :tcp_socket
|
24836
|
+
|
24231
24837
|
# Number of seconds after which the probe times out. Defaults to 1 second.
|
24232
24838
|
# Minimum value is 1. Must be greater or equal to period_seconds. Maps to
|
24233
24839
|
# Kubernetes probe argument 'timeoutSeconds'.
|
@@ -24242,7 +24848,13 @@ module Google
|
|
24242
24848
|
# Update properties of this object
|
24243
24849
|
def update!(**args)
|
24244
24850
|
@exec = args[:exec] if args.key?(:exec)
|
24851
|
+
@failure_threshold = args[:failure_threshold] if args.key?(:failure_threshold)
|
24852
|
+
@grpc = args[:grpc] if args.key?(:grpc)
|
24853
|
+
@http_get = args[:http_get] if args.key?(:http_get)
|
24854
|
+
@initial_delay_seconds = args[:initial_delay_seconds] if args.key?(:initial_delay_seconds)
|
24245
24855
|
@period_seconds = args[:period_seconds] if args.key?(:period_seconds)
|
24856
|
+
@success_threshold = args[:success_threshold] if args.key?(:success_threshold)
|
24857
|
+
@tcp_socket = args[:tcp_socket] if args.key?(:tcp_socket)
|
24246
24858
|
@timeout_seconds = args[:timeout_seconds] if args.key?(:timeout_seconds)
|
24247
24859
|
end
|
24248
24860
|
end
|
@@ -24271,6 +24883,133 @@ module Google
|
|
24271
24883
|
end
|
24272
24884
|
end
|
24273
24885
|
|
24886
|
+
# GrpcAction checks the health of a container using a gRPC service.
|
24887
|
+
class GoogleCloudAiplatformV1beta1ProbeGrpcAction
|
24888
|
+
include Google::Apis::Core::Hashable
|
24889
|
+
|
24890
|
+
# Port number of the gRPC service. Number must be in the range 1 to 65535.
|
24891
|
+
# Corresponds to the JSON property `port`
|
24892
|
+
# @return [Fixnum]
|
24893
|
+
attr_accessor :port
|
24894
|
+
|
24895
|
+
# Service is the name of the service to place in the gRPC HealthCheckRequest (
|
24896
|
+
# see https://github.com/grpc/grpc/blob/master/doc/health-checking.md). If this
|
24897
|
+
# is not specified, the default behavior is defined by gRPC.
|
24898
|
+
# Corresponds to the JSON property `service`
|
24899
|
+
# @return [String]
|
24900
|
+
attr_accessor :service
|
24901
|
+
|
24902
|
+
def initialize(**args)
|
24903
|
+
update!(**args)
|
24904
|
+
end
|
24905
|
+
|
24906
|
+
# Update properties of this object
|
24907
|
+
def update!(**args)
|
24908
|
+
@port = args[:port] if args.key?(:port)
|
24909
|
+
@service = args[:service] if args.key?(:service)
|
24910
|
+
end
|
24911
|
+
end
|
24912
|
+
|
24913
|
+
# HttpGetAction describes an action based on HTTP Get requests.
|
24914
|
+
class GoogleCloudAiplatformV1beta1ProbeHttpGetAction
|
24915
|
+
include Google::Apis::Core::Hashable
|
24916
|
+
|
24917
|
+
# Host name to connect to, defaults to the model serving container's IP. You
|
24918
|
+
# probably want to set "Host" in httpHeaders instead.
|
24919
|
+
# Corresponds to the JSON property `host`
|
24920
|
+
# @return [String]
|
24921
|
+
attr_accessor :host
|
24922
|
+
|
24923
|
+
# Custom headers to set in the request. HTTP allows repeated headers.
|
24924
|
+
# Corresponds to the JSON property `httpHeaders`
|
24925
|
+
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ProbeHttpHeader>]
|
24926
|
+
attr_accessor :http_headers
|
24927
|
+
|
24928
|
+
# Path to access on the HTTP server.
|
24929
|
+
# Corresponds to the JSON property `path`
|
24930
|
+
# @return [String]
|
24931
|
+
attr_accessor :path
|
24932
|
+
|
24933
|
+
# Number of the port to access on the container. Number must be in the range 1
|
24934
|
+
# to 65535.
|
24935
|
+
# Corresponds to the JSON property `port`
|
24936
|
+
# @return [Fixnum]
|
24937
|
+
attr_accessor :port
|
24938
|
+
|
24939
|
+
# Scheme to use for connecting to the host. Defaults to HTTP. Acceptable values
|
24940
|
+
# are "HTTP" or "HTTPS".
|
24941
|
+
# Corresponds to the JSON property `scheme`
|
24942
|
+
# @return [String]
|
24943
|
+
attr_accessor :scheme
|
24944
|
+
|
24945
|
+
def initialize(**args)
|
24946
|
+
update!(**args)
|
24947
|
+
end
|
24948
|
+
|
24949
|
+
# Update properties of this object
|
24950
|
+
def update!(**args)
|
24951
|
+
@host = args[:host] if args.key?(:host)
|
24952
|
+
@http_headers = args[:http_headers] if args.key?(:http_headers)
|
24953
|
+
@path = args[:path] if args.key?(:path)
|
24954
|
+
@port = args[:port] if args.key?(:port)
|
24955
|
+
@scheme = args[:scheme] if args.key?(:scheme)
|
24956
|
+
end
|
24957
|
+
end
|
24958
|
+
|
24959
|
+
# HttpHeader describes a custom header to be used in HTTP probes
|
24960
|
+
class GoogleCloudAiplatformV1beta1ProbeHttpHeader
|
24961
|
+
include Google::Apis::Core::Hashable
|
24962
|
+
|
24963
|
+
# The header field name. This will be canonicalized upon output, so case-variant
|
24964
|
+
# names will be understood as the same header.
|
24965
|
+
# Corresponds to the JSON property `name`
|
24966
|
+
# @return [String]
|
24967
|
+
attr_accessor :name
|
24968
|
+
|
24969
|
+
# The header field value
|
24970
|
+
# Corresponds to the JSON property `value`
|
24971
|
+
# @return [String]
|
24972
|
+
attr_accessor :value
|
24973
|
+
|
24974
|
+
def initialize(**args)
|
24975
|
+
update!(**args)
|
24976
|
+
end
|
24977
|
+
|
24978
|
+
# Update properties of this object
|
24979
|
+
def update!(**args)
|
24980
|
+
@name = args[:name] if args.key?(:name)
|
24981
|
+
@value = args[:value] if args.key?(:value)
|
24982
|
+
end
|
24983
|
+
end
|
24984
|
+
|
24985
|
+
# TcpSocketAction probes the health of a container by opening a TCP socket
|
24986
|
+
# connection.
|
24987
|
+
class GoogleCloudAiplatformV1beta1ProbeTcpSocketAction
|
24988
|
+
include Google::Apis::Core::Hashable
|
24989
|
+
|
24990
|
+
# Optional: Host name to connect to, defaults to the model serving container's
|
24991
|
+
# IP.
|
24992
|
+
# Corresponds to the JSON property `host`
|
24993
|
+
# @return [String]
|
24994
|
+
attr_accessor :host
|
24995
|
+
|
24996
|
+
# Number of the port to access on the container. Number must be in the range 1
|
24997
|
+
# to 65535.
|
24998
|
+
# Corresponds to the JSON property `port`
|
24999
|
+
# @return [Fixnum]
|
25000
|
+
attr_accessor :port
|
25001
|
+
|
25002
|
+
def initialize(**args)
|
25003
|
+
update!(**args)
|
25004
|
+
end
|
25005
|
+
|
25006
|
+
# Update properties of this object
|
25007
|
+
def update!(**args)
|
25008
|
+
@host = args[:host] if args.key?(:host)
|
25009
|
+
@port = args[:port] if args.key?(:port)
|
25010
|
+
end
|
25011
|
+
end
|
25012
|
+
|
24274
25013
|
# PscAutomatedEndpoints defines the output of the forwarding rule automatically
|
24275
25014
|
# created by each PscAutomationConfig.
|
24276
25015
|
class GoogleCloudAiplatformV1beta1PscAutomatedEndpoints
|
@@ -24536,8 +25275,8 @@ module Google
|
|
24536
25275
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ModelContainerSpec]
|
24537
25276
|
attr_accessor :container_spec
|
24538
25277
|
|
24539
|
-
# A description of resources that are dedicated to a DeployedModel
|
24540
|
-
# need a higher degree of manual configuration.
|
25278
|
+
# A description of resources that are dedicated to a DeployedModel or
|
25279
|
+
# DeployedIndex, and that need a higher degree of manual configuration.
|
24541
25280
|
# Corresponds to the JSON property `dedicatedResources`
|
24542
25281
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DedicatedResources]
|
24543
25282
|
attr_accessor :dedicated_resources
|
@@ -25867,6 +26606,11 @@ module Google
|
|
25867
26606
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1RagEmbeddingModelConfig]
|
25868
26607
|
attr_accessor :rag_embedding_model_config
|
25869
26608
|
|
26609
|
+
# Output only. Number of RagFiles in the RagCorpus.
|
26610
|
+
# Corresponds to the JSON property `ragFilesCount`
|
26611
|
+
# @return [Fixnum]
|
26612
|
+
attr_accessor :rag_files_count
|
26613
|
+
|
25870
26614
|
# Config for the Vector DB to use for RAG.
|
25871
26615
|
# Corresponds to the JSON property `ragVectorDbConfig`
|
25872
26616
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1RagVectorDbConfig]
|
@@ -25899,6 +26643,7 @@ module Google
|
|
25899
26643
|
@display_name = args[:display_name] if args.key?(:display_name)
|
25900
26644
|
@name = args[:name] if args.key?(:name)
|
25901
26645
|
@rag_embedding_model_config = args[:rag_embedding_model_config] if args.key?(:rag_embedding_model_config)
|
26646
|
+
@rag_files_count = args[:rag_files_count] if args.key?(:rag_files_count)
|
25902
26647
|
@rag_vector_db_config = args[:rag_vector_db_config] if args.key?(:rag_vector_db_config)
|
25903
26648
|
@update_time = args[:update_time] if args.key?(:update_time)
|
25904
26649
|
@vector_db_config = args[:vector_db_config] if args.key?(:vector_db_config)
|
@@ -26215,6 +26960,11 @@ module Google
|
|
26215
26960
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1RagFileParsingConfigLayoutParser]
|
26216
26961
|
attr_accessor :layout_parser
|
26217
26962
|
|
26963
|
+
# Specifies the advanced parsing for RagFiles.
|
26964
|
+
# Corresponds to the JSON property `llmParser`
|
26965
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1RagFileParsingConfigLlmParser]
|
26966
|
+
attr_accessor :llm_parser
|
26967
|
+
|
26218
26968
|
# Whether to use advanced PDF parsing.
|
26219
26969
|
# Corresponds to the JSON property `useAdvancedPdfParsing`
|
26220
26970
|
# @return [Boolean]
|
@@ -26229,6 +26979,7 @@ module Google
|
|
26229
26979
|
def update!(**args)
|
26230
26980
|
@advanced_parser = args[:advanced_parser] if args.key?(:advanced_parser)
|
26231
26981
|
@layout_parser = args[:layout_parser] if args.key?(:layout_parser)
|
26982
|
+
@llm_parser = args[:llm_parser] if args.key?(:llm_parser)
|
26232
26983
|
@use_advanced_pdf_parsing = args[:use_advanced_pdf_parsing] if args.key?(:use_advanced_pdf_parsing)
|
26233
26984
|
end
|
26234
26985
|
end
|
@@ -26286,6 +27037,41 @@ module Google
|
|
26286
27037
|
end
|
26287
27038
|
end
|
26288
27039
|
|
27040
|
+
# Specifies the advanced parsing for RagFiles.
|
27041
|
+
class GoogleCloudAiplatformV1beta1RagFileParsingConfigLlmParser
|
27042
|
+
include Google::Apis::Core::Hashable
|
27043
|
+
|
27044
|
+
# The prompt to use for parsing. If not specified, a default prompt will be used.
|
27045
|
+
# Corresponds to the JSON property `customParsingPrompt`
|
27046
|
+
# @return [String]
|
27047
|
+
attr_accessor :custom_parsing_prompt
|
27048
|
+
|
27049
|
+
# The maximum number of requests the job is allowed to make to the LLM model per
|
27050
|
+
# minute. Consult https://cloud.google.com/vertex-ai/generative-ai/docs/quotas
|
27051
|
+
# and your document size to set an appropriate value here. If unspecified, a
|
27052
|
+
# default value of 5000 QPM would be used.
|
27053
|
+
# Corresponds to the JSON property `maxParsingRequestsPerMin`
|
27054
|
+
# @return [Fixnum]
|
27055
|
+
attr_accessor :max_parsing_requests_per_min
|
27056
|
+
|
27057
|
+
# The name of a LLM model used for parsing. Format: * `projects/`project_id`/
|
27058
|
+
# locations/`location`/publishers/`publisher`/models/`model``
|
27059
|
+
# Corresponds to the JSON property `modelName`
|
27060
|
+
# @return [String]
|
27061
|
+
attr_accessor :model_name
|
27062
|
+
|
27063
|
+
def initialize(**args)
|
27064
|
+
update!(**args)
|
27065
|
+
end
|
27066
|
+
|
27067
|
+
# Update properties of this object
|
27068
|
+
def update!(**args)
|
27069
|
+
@custom_parsing_prompt = args[:custom_parsing_prompt] if args.key?(:custom_parsing_prompt)
|
27070
|
+
@max_parsing_requests_per_min = args[:max_parsing_requests_per_min] if args.key?(:max_parsing_requests_per_min)
|
27071
|
+
@model_name = args[:model_name] if args.key?(:model_name)
|
27072
|
+
end
|
27073
|
+
end
|
27074
|
+
|
26289
27075
|
# Specifies the transformation config for RagFiles.
|
26290
27076
|
class GoogleCloudAiplatformV1beta1RagFileTransformationConfig
|
26291
27077
|
include Google::Apis::Core::Hashable
|
@@ -26524,7 +27310,8 @@ module Google
|
|
26524
27310
|
class GoogleCloudAiplatformV1beta1RagVectorDbConfig
|
26525
27311
|
include Google::Apis::Core::Hashable
|
26526
27312
|
|
26527
|
-
# The generic reusable api auth config.
|
27313
|
+
# The generic reusable api auth config. Deprecated. Please use AuthConfig (
|
27314
|
+
# google/cloud/aiplatform/master/auth.proto) instead.
|
26528
27315
|
# Corresponds to the JSON property `apiAuth`
|
26529
27316
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ApiAuth]
|
26530
27317
|
attr_accessor :api_auth
|
@@ -27803,6 +28590,34 @@ module Google
|
|
27803
28590
|
end
|
27804
28591
|
end
|
27805
28592
|
|
28593
|
+
# Retrieval config.
|
28594
|
+
class GoogleCloudAiplatformV1beta1RetrievalConfig
|
28595
|
+
include Google::Apis::Core::Hashable
|
28596
|
+
|
28597
|
+
# The language code of the user.
|
28598
|
+
# Corresponds to the JSON property `languageCode`
|
28599
|
+
# @return [String]
|
28600
|
+
attr_accessor :language_code
|
28601
|
+
|
28602
|
+
# An object that represents a latitude/longitude pair. This is expressed as a
|
28603
|
+
# pair of doubles to represent degrees latitude and degrees longitude. Unless
|
28604
|
+
# specified otherwise, this object must conform to the WGS84 standard. Values
|
28605
|
+
# must be within normalized ranges.
|
28606
|
+
# Corresponds to the JSON property `latLng`
|
28607
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleTypeLatLng]
|
28608
|
+
attr_accessor :lat_lng
|
28609
|
+
|
28610
|
+
def initialize(**args)
|
28611
|
+
update!(**args)
|
28612
|
+
end
|
28613
|
+
|
28614
|
+
# Update properties of this object
|
28615
|
+
def update!(**args)
|
28616
|
+
@language_code = args[:language_code] if args.key?(:language_code)
|
28617
|
+
@lat_lng = args[:lat_lng] if args.key?(:lat_lng)
|
28618
|
+
end
|
28619
|
+
end
|
28620
|
+
|
27806
28621
|
# Metadata related to retrieval in the grounding flow.
|
27807
28622
|
class GoogleCloudAiplatformV1beta1RetrievalMetadata
|
27808
28623
|
include Google::Apis::Core::Hashable
|
@@ -27930,6 +28745,59 @@ module Google
|
|
27930
28745
|
end
|
27931
28746
|
end
|
27932
28747
|
|
28748
|
+
# Configuration for rolling deployments.
|
28749
|
+
class GoogleCloudAiplatformV1beta1RolloutOptions
|
28750
|
+
include Google::Apis::Core::Hashable
|
28751
|
+
|
28752
|
+
# Percentage of allowed additional replicas. For autoscaling deployments, this
|
28753
|
+
# refers to the target replica count.
|
28754
|
+
# Corresponds to the JSON property `maxSurgePercentage`
|
28755
|
+
# @return [Fixnum]
|
28756
|
+
attr_accessor :max_surge_percentage
|
28757
|
+
|
28758
|
+
# Absolute count of allowed additional replicas.
|
28759
|
+
# Corresponds to the JSON property `maxSurgeReplicas`
|
28760
|
+
# @return [Fixnum]
|
28761
|
+
attr_accessor :max_surge_replicas
|
28762
|
+
|
28763
|
+
# Percentage of replicas allowed to be unavailable. For autoscaling deployments,
|
28764
|
+
# this refers to the target replica count.
|
28765
|
+
# Corresponds to the JSON property `maxUnavailablePercentage`
|
28766
|
+
# @return [Fixnum]
|
28767
|
+
attr_accessor :max_unavailable_percentage
|
28768
|
+
|
28769
|
+
# Absolute count of replicas allowed to be unavailable.
|
28770
|
+
# Corresponds to the JSON property `maxUnavailableReplicas`
|
28771
|
+
# @return [Fixnum]
|
28772
|
+
attr_accessor :max_unavailable_replicas
|
28773
|
+
|
28774
|
+
# ID of the DeployedModel that this deployment should replace.
|
28775
|
+
# Corresponds to the JSON property `previousDeployedModel`
|
28776
|
+
# @return [String]
|
28777
|
+
attr_accessor :previous_deployed_model
|
28778
|
+
|
28779
|
+
# Output only. Read-only. Revision number determines the relative priority of
|
28780
|
+
# DeployedModels in the same rollout. The DeployedModel with the largest
|
28781
|
+
# revision number specifies the intended state of the deployment.
|
28782
|
+
# Corresponds to the JSON property `revisionNumber`
|
28783
|
+
# @return [Fixnum]
|
28784
|
+
attr_accessor :revision_number
|
28785
|
+
|
28786
|
+
def initialize(**args)
|
28787
|
+
update!(**args)
|
28788
|
+
end
|
28789
|
+
|
28790
|
+
# Update properties of this object
|
28791
|
+
def update!(**args)
|
28792
|
+
@max_surge_percentage = args[:max_surge_percentage] if args.key?(:max_surge_percentage)
|
28793
|
+
@max_surge_replicas = args[:max_surge_replicas] if args.key?(:max_surge_replicas)
|
28794
|
+
@max_unavailable_percentage = args[:max_unavailable_percentage] if args.key?(:max_unavailable_percentage)
|
28795
|
+
@max_unavailable_replicas = args[:max_unavailable_replicas] if args.key?(:max_unavailable_replicas)
|
28796
|
+
@previous_deployed_model = args[:previous_deployed_model] if args.key?(:previous_deployed_model)
|
28797
|
+
@revision_number = args[:revision_number] if args.key?(:revision_number)
|
28798
|
+
end
|
28799
|
+
end
|
28800
|
+
|
27933
28801
|
# Input for rouge metric.
|
27934
28802
|
class GoogleCloudAiplatformV1beta1RougeInput
|
27935
28803
|
include Google::Apis::Core::Hashable
|
@@ -32218,8 +33086,9 @@ module Google
|
|
32218
33086
|
class GoogleCloudAiplatformV1beta1SchemaTextDataItem
|
32219
33087
|
include Google::Apis::Core::Hashable
|
32220
33088
|
|
32221
|
-
# Output only. Google Cloud Storage URI points to the original text in
|
32222
|
-
# bucket. The text file is up to 10MB
|
33089
|
+
# Output only. Google Cloud Storage URI points to a copy of the original text in
|
33090
|
+
# the Vertex-managed bucket in the user's project. The text file is up to 10MB
|
33091
|
+
# in size.
|
32223
33092
|
# Corresponds to the JSON property `gcsUri`
|
32224
33093
|
# @return [String]
|
32225
33094
|
attr_accessor :gcs_uri
|
@@ -36520,6 +37389,81 @@ module Google
|
|
36520
37389
|
end
|
36521
37390
|
end
|
36522
37391
|
|
37392
|
+
# Configuration for Speculative Decoding.
|
37393
|
+
class GoogleCloudAiplatformV1beta1SpeculativeDecodingSpec
|
37394
|
+
include Google::Apis::Core::Hashable
|
37395
|
+
|
37396
|
+
# Draft model speculation works by using the smaller model to generate candidate
|
37397
|
+
# tokens for speculative decoding.
|
37398
|
+
# Corresponds to the JSON property `draftModelSpeculation`
|
37399
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1SpeculativeDecodingSpecDraftModelSpeculation]
|
37400
|
+
attr_accessor :draft_model_speculation
|
37401
|
+
|
37402
|
+
# N-Gram speculation works by trying to find matching tokens in the previous
|
37403
|
+
# prompt sequence and use those as speculation for generating new tokens.
|
37404
|
+
# Corresponds to the JSON property `ngramSpeculation`
|
37405
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1SpeculativeDecodingSpecNgramSpeculation]
|
37406
|
+
attr_accessor :ngram_speculation
|
37407
|
+
|
37408
|
+
# The number of speculative tokens to generate at each step.
|
37409
|
+
# Corresponds to the JSON property `speculativeTokenCount`
|
37410
|
+
# @return [Fixnum]
|
37411
|
+
attr_accessor :speculative_token_count
|
37412
|
+
|
37413
|
+
def initialize(**args)
|
37414
|
+
update!(**args)
|
37415
|
+
end
|
37416
|
+
|
37417
|
+
# Update properties of this object
|
37418
|
+
def update!(**args)
|
37419
|
+
@draft_model_speculation = args[:draft_model_speculation] if args.key?(:draft_model_speculation)
|
37420
|
+
@ngram_speculation = args[:ngram_speculation] if args.key?(:ngram_speculation)
|
37421
|
+
@speculative_token_count = args[:speculative_token_count] if args.key?(:speculative_token_count)
|
37422
|
+
end
|
37423
|
+
end
|
37424
|
+
|
37425
|
+
# Draft model speculation works by using the smaller model to generate candidate
|
37426
|
+
# tokens for speculative decoding.
|
37427
|
+
class GoogleCloudAiplatformV1beta1SpeculativeDecodingSpecDraftModelSpeculation
|
37428
|
+
include Google::Apis::Core::Hashable
|
37429
|
+
|
37430
|
+
# Required. The resource name of the draft model.
|
37431
|
+
# Corresponds to the JSON property `draftModel`
|
37432
|
+
# @return [String]
|
37433
|
+
attr_accessor :draft_model
|
37434
|
+
|
37435
|
+
def initialize(**args)
|
37436
|
+
update!(**args)
|
37437
|
+
end
|
37438
|
+
|
37439
|
+
# Update properties of this object
|
37440
|
+
def update!(**args)
|
37441
|
+
@draft_model = args[:draft_model] if args.key?(:draft_model)
|
37442
|
+
end
|
37443
|
+
end
|
37444
|
+
|
37445
|
+
# N-Gram speculation works by trying to find matching tokens in the previous
|
37446
|
+
# prompt sequence and use those as speculation for generating new tokens.
|
37447
|
+
class GoogleCloudAiplatformV1beta1SpeculativeDecodingSpecNgramSpeculation
|
37448
|
+
include Google::Apis::Core::Hashable
|
37449
|
+
|
37450
|
+
# The number of last N input tokens used as ngram to search/match against the
|
37451
|
+
# previous prompt sequence. This is equal to the N in N-Gram. The default value
|
37452
|
+
# is 3 if not specified.
|
37453
|
+
# Corresponds to the JSON property `ngramSize`
|
37454
|
+
# @return [Fixnum]
|
37455
|
+
attr_accessor :ngram_size
|
37456
|
+
|
37457
|
+
def initialize(**args)
|
37458
|
+
update!(**args)
|
37459
|
+
end
|
37460
|
+
|
37461
|
+
# Update properties of this object
|
37462
|
+
def update!(**args)
|
37463
|
+
@ngram_size = args[:ngram_size] if args.key?(:ngram_size)
|
37464
|
+
end
|
37465
|
+
end
|
37466
|
+
|
36523
37467
|
# The speech generation config.
|
36524
37468
|
class GoogleCloudAiplatformV1beta1SpeechConfig
|
36525
37469
|
include Google::Apis::Core::Hashable
|
@@ -38245,6 +39189,12 @@ module Google
|
|
38245
39189
|
class GoogleCloudAiplatformV1beta1SupervisedTuningDataStats
|
38246
39190
|
include Google::Apis::Core::Hashable
|
38247
39191
|
|
39192
|
+
# Output only. For each index in `truncated_example_indices`, the user-facing
|
39193
|
+
# reason why the example was dropped. Must not include example itself.
|
39194
|
+
# Corresponds to the JSON property `droppedExampleReasons`
|
39195
|
+
# @return [Array<String>]
|
39196
|
+
attr_accessor :dropped_example_reasons
|
39197
|
+
|
38248
39198
|
# Output only. Number of billable characters in the tuning dataset.
|
38249
39199
|
# Corresponds to the JSON property `totalBillableCharacterCount`
|
38250
39200
|
# @return [Fixnum]
|
@@ -38255,7 +39205,9 @@ module Google
|
|
38255
39205
|
# @return [Fixnum]
|
38256
39206
|
attr_accessor :total_billable_token_count
|
38257
39207
|
|
38258
|
-
# The number of examples in the dataset that have been
|
39208
|
+
# Output only. The number of examples in the dataset that have been dropped. An
|
39209
|
+
# example can be dropped for reasons including: too many tokens, contains an
|
39210
|
+
# invalid image, contains too many images, etc.
|
38259
39211
|
# Corresponds to the JSON property `totalTruncatedExampleCount`
|
38260
39212
|
# @return [Fixnum]
|
38261
39213
|
attr_accessor :total_truncated_example_count
|
@@ -38265,7 +39217,8 @@ module Google
|
|
38265
39217
|
# @return [Fixnum]
|
38266
39218
|
attr_accessor :total_tuning_character_count
|
38267
39219
|
|
38268
|
-
# A partial sample of the indices (starting from 1) of the
|
39220
|
+
# Output only. A partial sample of the indices (starting from 1) of the dropped
|
39221
|
+
# examples.
|
38269
39222
|
# Corresponds to the JSON property `truncatedExampleIndices`
|
38270
39223
|
# @return [Array<Fixnum>]
|
38271
39224
|
attr_accessor :truncated_example_indices
|
@@ -38306,6 +39259,7 @@ module Google
|
|
38306
39259
|
|
38307
39260
|
# Update properties of this object
|
38308
39261
|
def update!(**args)
|
39262
|
+
@dropped_example_reasons = args[:dropped_example_reasons] if args.key?(:dropped_example_reasons)
|
38309
39263
|
@total_billable_character_count = args[:total_billable_character_count] if args.key?(:total_billable_character_count)
|
38310
39264
|
@total_billable_token_count = args[:total_billable_token_count] if args.key?(:total_billable_token_count)
|
38311
39265
|
@total_truncated_example_count = args[:total_truncated_example_count] if args.key?(:total_truncated_example_count)
|
@@ -39426,6 +40380,11 @@ module Google
|
|
39426
40380
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1FunctionCallingConfig]
|
39427
40381
|
attr_accessor :function_calling_config
|
39428
40382
|
|
40383
|
+
# Retrieval config.
|
40384
|
+
# Corresponds to the JSON property `retrievalConfig`
|
40385
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1RetrievalConfig]
|
40386
|
+
attr_accessor :retrieval_config
|
40387
|
+
|
39429
40388
|
def initialize(**args)
|
39430
40389
|
update!(**args)
|
39431
40390
|
end
|
@@ -39433,6 +40392,7 @@ module Google
|
|
39433
40392
|
# Update properties of this object
|
39434
40393
|
def update!(**args)
|
39435
40394
|
@function_calling_config = args[:function_calling_config] if args.key?(:function_calling_config)
|
40395
|
+
@retrieval_config = args[:retrieval_config] if args.key?(:retrieval_config)
|
39436
40396
|
end
|
39437
40397
|
end
|
39438
40398
|
|
@@ -40815,7 +41775,7 @@ module Google
|
|
40815
41775
|
end
|
40816
41776
|
end
|
40817
41777
|
|
40818
|
-
# The Model Registry Model and Online Prediction Endpoint
|
41778
|
+
# The Model Registry Model and Online Prediction Endpoint associated with this
|
40819
41779
|
# TuningJob.
|
40820
41780
|
class GoogleCloudAiplatformV1beta1TunedModel
|
40821
41781
|
include Google::Apis::Core::Hashable
|
@@ -41005,7 +41965,7 @@ module Google
|
|
41005
41965
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1SupervisedTuningSpec]
|
41006
41966
|
attr_accessor :supervised_tuning_spec
|
41007
41967
|
|
41008
|
-
# The Model Registry Model and Online Prediction Endpoint
|
41968
|
+
# The Model Registry Model and Online Prediction Endpoint associated with this
|
41009
41969
|
# TuningJob.
|
41010
41970
|
# Corresponds to the JSON property `tunedModel`
|
41011
41971
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1TunedModel]
|
@@ -43004,6 +43964,34 @@ module Google
|
|
43004
43964
|
end
|
43005
43965
|
end
|
43006
43966
|
|
43967
|
+
# An object that represents a latitude/longitude pair. This is expressed as a
|
43968
|
+
# pair of doubles to represent degrees latitude and degrees longitude. Unless
|
43969
|
+
# specified otherwise, this object must conform to the WGS84 standard. Values
|
43970
|
+
# must be within normalized ranges.
|
43971
|
+
class GoogleTypeLatLng
|
43972
|
+
include Google::Apis::Core::Hashable
|
43973
|
+
|
43974
|
+
# The latitude in degrees. It must be in the range [-90.0, +90.0].
|
43975
|
+
# Corresponds to the JSON property `latitude`
|
43976
|
+
# @return [Float]
|
43977
|
+
attr_accessor :latitude
|
43978
|
+
|
43979
|
+
# The longitude in degrees. It must be in the range [-180.0, +180.0].
|
43980
|
+
# Corresponds to the JSON property `longitude`
|
43981
|
+
# @return [Float]
|
43982
|
+
attr_accessor :longitude
|
43983
|
+
|
43984
|
+
def initialize(**args)
|
43985
|
+
update!(**args)
|
43986
|
+
end
|
43987
|
+
|
43988
|
+
# Update properties of this object
|
43989
|
+
def update!(**args)
|
43990
|
+
@latitude = args[:latitude] if args.key?(:latitude)
|
43991
|
+
@longitude = args[:longitude] if args.key?(:longitude)
|
43992
|
+
end
|
43993
|
+
end
|
43994
|
+
|
43007
43995
|
# Represents an amount of money with its currency type.
|
43008
43996
|
class GoogleTypeMoney
|
43009
43997
|
include Google::Apis::Core::Hashable
|