google-apis-aiplatform_v1beta1 0.36.0 → 0.37.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/CHANGELOG.md +5 -0
- data/lib/google/apis/aiplatform_v1beta1/classes.rb +845 -66
- data/lib/google/apis/aiplatform_v1beta1/gem_version.rb +3 -3
- data/lib/google/apis/aiplatform_v1beta1/representations.rb +347 -0
- data/lib/google/apis/aiplatform_v1beta1/service.rb +193 -4
- metadata +4 -7
@@ -474,7 +474,7 @@ module Google
|
|
474
474
|
end
|
475
475
|
end
|
476
476
|
|
477
|
-
# Create API error message for Vertex Pipeline.
|
477
|
+
# Create API error message for Vertex Pipeline.
|
478
478
|
class CloudAiPlatformCommonCreatePipelineJobApiErrorDetail
|
479
479
|
include Google::Apis::Core::Hashable
|
480
480
|
|
@@ -840,7 +840,8 @@ module Google
|
|
840
840
|
end
|
841
841
|
end
|
842
842
|
|
843
|
-
# The generic reusable api auth config.
|
843
|
+
# The generic reusable api auth config. Deprecated. Please use AuthConfig (
|
844
|
+
# google/cloud/aiplatform/master/auth.proto) instead.
|
844
845
|
class GoogleCloudAiplatformV1beta1ApiAuth
|
845
846
|
include Google::Apis::Core::Hashable
|
846
847
|
|
@@ -1468,22 +1469,22 @@ module Google
|
|
1468
1469
|
class GoogleCloudAiplatformV1beta1AutomaticResources
|
1469
1470
|
include Google::Apis::Core::Hashable
|
1470
1471
|
|
1471
|
-
# Immutable. The maximum number of replicas
|
1472
|
-
#
|
1473
|
-
#
|
1474
|
-
#
|
1475
|
-
#
|
1476
|
-
#
|
1477
|
-
#
|
1478
|
-
#
|
1472
|
+
# Immutable. The maximum number of replicas that may be deployed on when the
|
1473
|
+
# traffic against it increases. If the requested value is too large, the
|
1474
|
+
# deployment will error, but if deployment succeeds then the ability to scale to
|
1475
|
+
# that many replicas is guaranteed (barring service outages). If traffic
|
1476
|
+
# increases beyond what its replicas at maximum may handle, a portion of the
|
1477
|
+
# traffic will be dropped. If this value is not provided, no upper bound for
|
1478
|
+
# scaling under heavy traffic will be assumed, though Vertex AI may be unable to
|
1479
|
+
# scale beyond certain replica number.
|
1479
1480
|
# Corresponds to the JSON property `maxReplicaCount`
|
1480
1481
|
# @return [Fixnum]
|
1481
1482
|
attr_accessor :max_replica_count
|
1482
1483
|
|
1483
|
-
# Immutable. The minimum number of replicas
|
1484
|
-
#
|
1485
|
-
#
|
1486
|
-
#
|
1484
|
+
# Immutable. The minimum number of replicas that will be always deployed on. If
|
1485
|
+
# traffic against it increases, it may dynamically be deployed onto more
|
1486
|
+
# replicas up to max_replica_count, and as traffic decreases, some of these
|
1487
|
+
# extra replicas may be freed. If the requested value is too large, the
|
1487
1488
|
# deployment will error.
|
1488
1489
|
# Corresponds to the JSON property `minReplicaCount`
|
1489
1490
|
# @return [Fixnum]
|
@@ -1500,6 +1501,48 @@ module Google
|
|
1500
1501
|
end
|
1501
1502
|
end
|
1502
1503
|
|
1504
|
+
# The configs for autorater. This is applicable to both EvaluateInstances and
|
1505
|
+
# EvaluateDataset.
|
1506
|
+
class GoogleCloudAiplatformV1beta1AutoraterConfig
|
1507
|
+
include Google::Apis::Core::Hashable
|
1508
|
+
|
1509
|
+
# Optional. The fully qualified name of the publisher model or tuned autorater
|
1510
|
+
# endpoint to use. Publisher model format: `projects/`project`/locations/`
|
1511
|
+
# location`/publishers/*/models/*` Tuned model endpoint format: `projects/`
|
1512
|
+
# project`/locations/`location`/endpoints/`endpoint``
|
1513
|
+
# Corresponds to the JSON property `autoraterModel`
|
1514
|
+
# @return [String]
|
1515
|
+
attr_accessor :autorater_model
|
1516
|
+
|
1517
|
+
# Optional. Whether to flip the candidate and baseline responses. This is only
|
1518
|
+
# applicable to the pairwise metric. If enabled, also provide PairwiseMetricSpec.
|
1519
|
+
# candidate_response_field_name and PairwiseMetricSpec.
|
1520
|
+
# baseline_response_field_name. When rendering PairwiseMetricSpec.
|
1521
|
+
# metric_prompt_template, the candidate and baseline fields will be flipped for
|
1522
|
+
# half of the samples to reduce bias.
|
1523
|
+
# Corresponds to the JSON property `flipEnabled`
|
1524
|
+
# @return [Boolean]
|
1525
|
+
attr_accessor :flip_enabled
|
1526
|
+
alias_method :flip_enabled?, :flip_enabled
|
1527
|
+
|
1528
|
+
# Optional. Number of samples for each instance in the dataset. If not specified,
|
1529
|
+
# the default is 4. Minimum value is 1, maximum value is 32.
|
1530
|
+
# Corresponds to the JSON property `samplingCount`
|
1531
|
+
# @return [Fixnum]
|
1532
|
+
attr_accessor :sampling_count
|
1533
|
+
|
1534
|
+
def initialize(**args)
|
1535
|
+
update!(**args)
|
1536
|
+
end
|
1537
|
+
|
1538
|
+
# Update properties of this object
|
1539
|
+
def update!(**args)
|
1540
|
+
@autorater_model = args[:autorater_model] if args.key?(:autorater_model)
|
1541
|
+
@flip_enabled = args[:flip_enabled] if args.key?(:flip_enabled)
|
1542
|
+
@sampling_count = args[:sampling_count] if args.key?(:sampling_count)
|
1543
|
+
end
|
1544
|
+
end
|
1545
|
+
|
1503
1546
|
# The metric specification that defines the target resource utilization (CPU
|
1504
1547
|
# utilization, accelerator's duty cycle, and so on) for calculating the desired
|
1505
1548
|
# replica count.
|
@@ -2756,6 +2799,13 @@ module Google
|
|
2756
2799
|
# @return [String]
|
2757
2800
|
attr_accessor :data
|
2758
2801
|
|
2802
|
+
# Optional. Display name of the blob. Used to provide a label or filename to
|
2803
|
+
# distinguish blobs. This field is only returned in PromptMessage for prompt
|
2804
|
+
# management. It is not currently used in the Gemini GenerateContent calls.
|
2805
|
+
# Corresponds to the JSON property `displayName`
|
2806
|
+
# @return [String]
|
2807
|
+
attr_accessor :display_name
|
2808
|
+
|
2759
2809
|
# Required. The IANA standard MIME type of the source data.
|
2760
2810
|
# Corresponds to the JSON property `mimeType`
|
2761
2811
|
# @return [String]
|
@@ -2768,6 +2818,7 @@ module Google
|
|
2768
2818
|
# Update properties of this object
|
2769
2819
|
def update!(**args)
|
2770
2820
|
@data = args[:data] if args.key?(:data)
|
2821
|
+
@display_name = args[:display_name] if args.key?(:display_name)
|
2771
2822
|
@mime_type = args[:mime_type] if args.key?(:mime_type)
|
2772
2823
|
end
|
2773
2824
|
end
|
@@ -2852,7 +2903,7 @@ module Google
|
|
2852
2903
|
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1Content>]
|
2853
2904
|
attr_accessor :contents
|
2854
2905
|
|
2855
|
-
# Output only.
|
2906
|
+
# Output only. Creation time of the cache entry.
|
2856
2907
|
# Corresponds to the JSON property `createTime`
|
2857
2908
|
# @return [String]
|
2858
2909
|
attr_accessor :create_time
|
@@ -2869,8 +2920,9 @@ module Google
|
|
2869
2920
|
# @return [String]
|
2870
2921
|
attr_accessor :expire_time
|
2871
2922
|
|
2872
|
-
# Immutable. The name of the
|
2873
|
-
# projects/`
|
2923
|
+
# Immutable. The name of the `Model` to use for cached content. Currently, only
|
2924
|
+
# the published Gemini base models are supported, in the form of projects/`PROJECT`/
|
2925
|
+
# locations/`LOCATION`/publishers/google/models/`MODEL`
|
2874
2926
|
# Corresponds to the JSON property `model`
|
2875
2927
|
# @return [String]
|
2876
2928
|
attr_accessor :model
|
@@ -4160,6 +4212,11 @@ module Google
|
|
4160
4212
|
class GoogleCloudAiplatformV1beta1CountTokensResponse
|
4161
4213
|
include Google::Apis::Core::Hashable
|
4162
4214
|
|
4215
|
+
# Output only. List of modalities that were processed in the request input.
|
4216
|
+
# Corresponds to the JSON property `promptTokensDetails`
|
4217
|
+
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ModalityTokenCount>]
|
4218
|
+
attr_accessor :prompt_tokens_details
|
4219
|
+
|
4163
4220
|
# The total number of billable characters counted across all instances from the
|
4164
4221
|
# request.
|
4165
4222
|
# Corresponds to the JSON property `totalBillableCharacters`
|
@@ -4177,6 +4234,7 @@ module Google
|
|
4177
4234
|
|
4178
4235
|
# Update properties of this object
|
4179
4236
|
def update!(**args)
|
4237
|
+
@prompt_tokens_details = args[:prompt_tokens_details] if args.key?(:prompt_tokens_details)
|
4180
4238
|
@total_billable_characters = args[:total_billable_characters] if args.key?(:total_billable_characters)
|
4181
4239
|
@total_tokens = args[:total_tokens] if args.key?(:total_tokens)
|
4182
4240
|
end
|
@@ -5761,7 +5819,9 @@ module Google
|
|
5761
5819
|
# @return [String]
|
5762
5820
|
attr_accessor :model_reference
|
5763
5821
|
|
5764
|
-
# Output only. Identifier. The resource name of the DatasetVersion.
|
5822
|
+
# Output only. Identifier. The resource name of the DatasetVersion. Format: `
|
5823
|
+
# projects/`project`/locations/`location`/datasets/`dataset`/datasetVersions/`
|
5824
|
+
# dataset_version``
|
5765
5825
|
# Corresponds to the JSON property `name`
|
5766
5826
|
# @return [String]
|
5767
5827
|
attr_accessor :name
|
@@ -5802,8 +5862,8 @@ module Google
|
|
5802
5862
|
end
|
5803
5863
|
end
|
5804
5864
|
|
5805
|
-
# A description of resources that are dedicated to a DeployedModel
|
5806
|
-
# need a higher degree of manual configuration.
|
5865
|
+
# A description of resources that are dedicated to a DeployedModel or
|
5866
|
+
# DeployedIndex, and that need a higher degree of manual configuration.
|
5807
5867
|
class GoogleCloudAiplatformV1beta1DedicatedResources
|
5808
5868
|
include Google::Apis::Core::Hashable
|
5809
5869
|
|
@@ -5829,36 +5889,33 @@ module Google
|
|
5829
5889
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1MachineSpec]
|
5830
5890
|
attr_accessor :machine_spec
|
5831
5891
|
|
5832
|
-
# Immutable. The maximum number of replicas
|
5833
|
-
#
|
5834
|
-
#
|
5835
|
-
#
|
5836
|
-
#
|
5837
|
-
#
|
5838
|
-
#
|
5839
|
-
#
|
5840
|
-
#
|
5841
|
-
#
|
5842
|
-
# selected machine type).
|
5892
|
+
# Immutable. The maximum number of replicas that may be deployed on when the
|
5893
|
+
# traffic against it increases. If the requested value is too large, the
|
5894
|
+
# deployment will error, but if deployment succeeds then the ability to scale to
|
5895
|
+
# that many replicas is guaranteed (barring service outages). If traffic
|
5896
|
+
# increases beyond what its replicas at maximum may handle, a portion of the
|
5897
|
+
# traffic will be dropped. If this value is not provided, will use
|
5898
|
+
# min_replica_count as the default value. The value of this field impacts the
|
5899
|
+
# charge against Vertex CPU and GPU quotas. Specifically, you will be charged
|
5900
|
+
# for (max_replica_count * number of cores in the selected machine type) and (
|
5901
|
+
# max_replica_count * number of GPUs per replica in the selected machine type).
|
5843
5902
|
# Corresponds to the JSON property `maxReplicaCount`
|
5844
5903
|
# @return [Fixnum]
|
5845
5904
|
attr_accessor :max_replica_count
|
5846
5905
|
|
5847
|
-
# Required. Immutable. The minimum number of machine replicas
|
5848
|
-
#
|
5849
|
-
#
|
5850
|
-
#
|
5851
|
-
# be freed.
|
5906
|
+
# Required. Immutable. The minimum number of machine replicas that will be
|
5907
|
+
# always deployed on. This value must be greater than or equal to 1. If traffic
|
5908
|
+
# increases, it may dynamically be deployed onto more replicas, and as traffic
|
5909
|
+
# decreases, some of these extra replicas may be freed.
|
5852
5910
|
# Corresponds to the JSON property `minReplicaCount`
|
5853
5911
|
# @return [Fixnum]
|
5854
5912
|
attr_accessor :min_replica_count
|
5855
5913
|
|
5856
5914
|
# Optional. Number of required available replicas for the deployment to succeed.
|
5857
|
-
# This field is only needed when partial
|
5858
|
-
#
|
5859
|
-
#
|
5860
|
-
#
|
5861
|
-
# be min_replica_count.
|
5915
|
+
# This field is only needed when partial deployment/mutation is desired. If set,
|
5916
|
+
# the deploy/mutate operation will succeed once available_replica_count reaches
|
5917
|
+
# required_replica_count, and the rest of the replicas will be retried. If not
|
5918
|
+
# set, the default required_replica_count will be min_replica_count.
|
5862
5919
|
# Corresponds to the JSON property `requiredReplicaCount`
|
5863
5920
|
# @return [Fixnum]
|
5864
5921
|
attr_accessor :required_replica_count
|
@@ -6268,8 +6325,8 @@ module Google
|
|
6268
6325
|
attr_accessor :accept_eula
|
6269
6326
|
alias_method :accept_eula?, :accept_eula
|
6270
6327
|
|
6271
|
-
# A description of resources that are dedicated to a DeployedModel
|
6272
|
-
# need a higher degree of manual configuration.
|
6328
|
+
# A description of resources that are dedicated to a DeployedModel or
|
6329
|
+
# DeployedIndex, and that need a higher degree of manual configuration.
|
6273
6330
|
# Corresponds to the JSON property `dedicatedResources`
|
6274
6331
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DedicatedResources]
|
6275
6332
|
attr_accessor :dedicated_resources
|
@@ -6286,9 +6343,11 @@ module Google
|
|
6286
6343
|
# @return [String]
|
6287
6344
|
attr_accessor :hugging_face_access_token
|
6288
6345
|
|
6289
|
-
# Required. The
|
6290
|
-
#
|
6291
|
-
#
|
6346
|
+
# Required. The model to deploy. Format: 1. `publishers/`publisher`/models/`
|
6347
|
+
# publisher_model`@`version_id``, or `publishers/hf-`hugging-face-author`/models/
|
6348
|
+
# `hugging-face-model-name`@001`. 2. Hugging Face model ID like `google/gemma-2-
|
6349
|
+
# 2b-it`. 3. Custom model Google Cloud Storage URI like `gs://bucket`. 4. Custom
|
6350
|
+
# model zip file like `https://abc.com/a.zip`.
|
6292
6351
|
# Corresponds to the JSON property `model`
|
6293
6352
|
# @return [String]
|
6294
6353
|
attr_accessor :model
|
@@ -6349,8 +6408,8 @@ module Google
|
|
6349
6408
|
# @return [String]
|
6350
6409
|
attr_accessor :create_time
|
6351
6410
|
|
6352
|
-
# A description of resources that are dedicated to a DeployedModel
|
6353
|
-
# need a higher degree of manual configuration.
|
6411
|
+
# A description of resources that are dedicated to a DeployedModel or
|
6412
|
+
# DeployedIndex, and that need a higher degree of manual configuration.
|
6354
6413
|
# Corresponds to the JSON property `dedicatedResources`
|
6355
6414
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DedicatedResources]
|
6356
6415
|
attr_accessor :dedicated_resources
|
@@ -6562,8 +6621,8 @@ module Google
|
|
6562
6621
|
# @return [String]
|
6563
6622
|
attr_accessor :create_time
|
6564
6623
|
|
6565
|
-
# A description of resources that are dedicated to a DeployedModel
|
6566
|
-
# need a higher degree of manual configuration.
|
6624
|
+
# A description of resources that are dedicated to a DeployedModel or
|
6625
|
+
# DeployedIndex, and that need a higher degree of manual configuration.
|
6567
6626
|
# Corresponds to the JSON property `dedicatedResources`
|
6568
6627
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DedicatedResources]
|
6569
6628
|
attr_accessor :dedicated_resources
|
@@ -6639,6 +6698,11 @@ module Google
|
|
6639
6698
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1PrivateEndpoints]
|
6640
6699
|
attr_accessor :private_endpoints
|
6641
6700
|
|
6701
|
+
# Configuration for rolling deployments.
|
6702
|
+
# Corresponds to the JSON property `rolloutOptions`
|
6703
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1RolloutOptions]
|
6704
|
+
attr_accessor :rollout_options
|
6705
|
+
|
6642
6706
|
# The service account that the DeployedModel's container runs as. Specify the
|
6643
6707
|
# email address of the service account. If this service account is not specified,
|
6644
6708
|
# the container runs as a service account that doesn't have access to the
|
@@ -6655,6 +6719,11 @@ module Google
|
|
6655
6719
|
# @return [String]
|
6656
6720
|
attr_accessor :shared_resources
|
6657
6721
|
|
6722
|
+
# Configuration for Speculative Decoding.
|
6723
|
+
# Corresponds to the JSON property `speculativeDecodingSpec`
|
6724
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1SpeculativeDecodingSpec]
|
6725
|
+
attr_accessor :speculative_decoding_spec
|
6726
|
+
|
6658
6727
|
# Runtime status of the deployed model.
|
6659
6728
|
# Corresponds to the JSON property `status`
|
6660
6729
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DeployedModelStatus]
|
@@ -6685,8 +6754,10 @@ module Google
|
|
6685
6754
|
@model = args[:model] if args.key?(:model)
|
6686
6755
|
@model_version_id = args[:model_version_id] if args.key?(:model_version_id)
|
6687
6756
|
@private_endpoints = args[:private_endpoints] if args.key?(:private_endpoints)
|
6757
|
+
@rollout_options = args[:rollout_options] if args.key?(:rollout_options)
|
6688
6758
|
@service_account = args[:service_account] if args.key?(:service_account)
|
6689
6759
|
@shared_resources = args[:shared_resources] if args.key?(:shared_resources)
|
6760
|
+
@speculative_decoding_spec = args[:speculative_decoding_spec] if args.key?(:speculative_decoding_spec)
|
6690
6761
|
@status = args[:status] if args.key?(:status)
|
6691
6762
|
@system_labels = args[:system_labels] if args.key?(:system_labels)
|
6692
6763
|
end
|
@@ -6758,8 +6829,8 @@ module Google
|
|
6758
6829
|
# @return [String]
|
6759
6830
|
attr_accessor :create_time
|
6760
6831
|
|
6761
|
-
# A description of resources that are dedicated to a DeployedModel
|
6762
|
-
# need a higher degree of manual configuration.
|
6832
|
+
# A description of resources that are dedicated to a DeployedModel or
|
6833
|
+
# DeployedIndex, and that need a higher degree of manual configuration.
|
6763
6834
|
# Corresponds to the JSON property `dedicatedResources`
|
6764
6835
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DedicatedResources]
|
6765
6836
|
attr_accessor :dedicated_resources
|
@@ -7241,6 +7312,11 @@ module Google
|
|
7241
7312
|
# @return [String]
|
7242
7313
|
attr_accessor :etag
|
7243
7314
|
|
7315
|
+
# Configuration for GenAiAdvancedFeatures.
|
7316
|
+
# Corresponds to the JSON property `genAiAdvancedFeaturesConfig`
|
7317
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GenAiAdvancedFeaturesConfig]
|
7318
|
+
attr_accessor :gen_ai_advanced_features_config
|
7319
|
+
|
7244
7320
|
# The labels with user-defined metadata to organize your Endpoints. Label keys
|
7245
7321
|
# and values can be no longer than 64 characters (Unicode codepoints), can only
|
7246
7322
|
# contain lowercase letters, numeric characters, underscores and dashes.
|
@@ -7327,6 +7403,7 @@ module Google
|
|
7327
7403
|
@enable_private_service_connect = args[:enable_private_service_connect] if args.key?(:enable_private_service_connect)
|
7328
7404
|
@encryption_spec = args[:encryption_spec] if args.key?(:encryption_spec)
|
7329
7405
|
@etag = args[:etag] if args.key?(:etag)
|
7406
|
+
@gen_ai_advanced_features_config = args[:gen_ai_advanced_features_config] if args.key?(:gen_ai_advanced_features_config)
|
7330
7407
|
@labels = args[:labels] if args.key?(:labels)
|
7331
7408
|
@model_deployment_monitoring_job = args[:model_deployment_monitoring_job] if args.key?(:model_deployment_monitoring_job)
|
7332
7409
|
@name = args[:name] if args.key?(:name)
|
@@ -7554,10 +7631,54 @@ module Google
|
|
7554
7631
|
end
|
7555
7632
|
end
|
7556
7633
|
|
7634
|
+
# Request message for EvaluationService.EvaluateDataset.
|
7635
|
+
class GoogleCloudAiplatformV1beta1EvaluateDatasetRequest
|
7636
|
+
include Google::Apis::Core::Hashable
|
7637
|
+
|
7638
|
+
# The configs for autorater. This is applicable to both EvaluateInstances and
|
7639
|
+
# EvaluateDataset.
|
7640
|
+
# Corresponds to the JSON property `autoraterConfig`
|
7641
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1AutoraterConfig]
|
7642
|
+
attr_accessor :autorater_config
|
7643
|
+
|
7644
|
+
# The dataset used for evaluation.
|
7645
|
+
# Corresponds to the JSON property `dataset`
|
7646
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1EvaluationDataset]
|
7647
|
+
attr_accessor :dataset
|
7648
|
+
|
7649
|
+
# Required. The metrics used for evaluation.
|
7650
|
+
# Corresponds to the JSON property `metrics`
|
7651
|
+
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1Metric>]
|
7652
|
+
attr_accessor :metrics
|
7653
|
+
|
7654
|
+
# Config for evaluation output.
|
7655
|
+
# Corresponds to the JSON property `outputConfig`
|
7656
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1OutputConfig]
|
7657
|
+
attr_accessor :output_config
|
7658
|
+
|
7659
|
+
def initialize(**args)
|
7660
|
+
update!(**args)
|
7661
|
+
end
|
7662
|
+
|
7663
|
+
# Update properties of this object
|
7664
|
+
def update!(**args)
|
7665
|
+
@autorater_config = args[:autorater_config] if args.key?(:autorater_config)
|
7666
|
+
@dataset = args[:dataset] if args.key?(:dataset)
|
7667
|
+
@metrics = args[:metrics] if args.key?(:metrics)
|
7668
|
+
@output_config = args[:output_config] if args.key?(:output_config)
|
7669
|
+
end
|
7670
|
+
end
|
7671
|
+
|
7557
7672
|
# Request message for EvaluationService.EvaluateInstances.
|
7558
7673
|
class GoogleCloudAiplatformV1beta1EvaluateInstancesRequest
|
7559
7674
|
include Google::Apis::Core::Hashable
|
7560
7675
|
|
7676
|
+
# The configs for autorater. This is applicable to both EvaluateInstances and
|
7677
|
+
# EvaluateDataset.
|
7678
|
+
# Corresponds to the JSON property `autoraterConfig`
|
7679
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1AutoraterConfig]
|
7680
|
+
attr_accessor :autorater_config
|
7681
|
+
|
7561
7682
|
# Input for bleu metric.
|
7562
7683
|
# Corresponds to the JSON property `bleuInput`
|
7563
7684
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1BleuInput]
|
@@ -7719,6 +7840,7 @@ module Google
|
|
7719
7840
|
|
7720
7841
|
# Update properties of this object
|
7721
7842
|
def update!(**args)
|
7843
|
+
@autorater_config = args[:autorater_config] if args.key?(:autorater_config)
|
7722
7844
|
@bleu_input = args[:bleu_input] if args.key?(:bleu_input)
|
7723
7845
|
@coherence_input = args[:coherence_input] if args.key?(:coherence_input)
|
7724
7846
|
@comet_input = args[:comet_input] if args.key?(:comet_input)
|
@@ -8058,6 +8180,31 @@ module Google
|
|
8058
8180
|
end
|
8059
8181
|
end
|
8060
8182
|
|
8183
|
+
# The dataset used for evaluation.
|
8184
|
+
class GoogleCloudAiplatformV1beta1EvaluationDataset
|
8185
|
+
include Google::Apis::Core::Hashable
|
8186
|
+
|
8187
|
+
# The BigQuery location for the input content.
|
8188
|
+
# Corresponds to the JSON property `bigquerySource`
|
8189
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1BigQuerySource]
|
8190
|
+
attr_accessor :bigquery_source
|
8191
|
+
|
8192
|
+
# The Google Cloud Storage location for the input content.
|
8193
|
+
# Corresponds to the JSON property `gcsSource`
|
8194
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GcsSource]
|
8195
|
+
attr_accessor :gcs_source
|
8196
|
+
|
8197
|
+
def initialize(**args)
|
8198
|
+
update!(**args)
|
8199
|
+
end
|
8200
|
+
|
8201
|
+
# Update properties of this object
|
8202
|
+
def update!(**args)
|
8203
|
+
@bigquery_source = args[:bigquery_source] if args.key?(:bigquery_source)
|
8204
|
+
@gcs_source = args[:gcs_source] if args.key?(:gcs_source)
|
8205
|
+
end
|
8206
|
+
end
|
8207
|
+
|
8061
8208
|
# An edge describing the relationship between an Artifact and an Execution in a
|
8062
8209
|
# lineage graph.
|
8063
8210
|
class GoogleCloudAiplatformV1beta1Event
|
@@ -9581,6 +9728,51 @@ module Google
|
|
9581
9728
|
end
|
9582
9729
|
end
|
9583
9730
|
|
9731
|
+
# Runtime operation information for ModelGardenService.ExportPublisherModel.
|
9732
|
+
class GoogleCloudAiplatformV1beta1ExportPublisherModelOperationMetadata
|
9733
|
+
include Google::Apis::Core::Hashable
|
9734
|
+
|
9735
|
+
# Generic Metadata shared by all operations.
|
9736
|
+
# Corresponds to the JSON property `genericMetadata`
|
9737
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GenericOperationMetadata]
|
9738
|
+
attr_accessor :generic_metadata
|
9739
|
+
|
9740
|
+
def initialize(**args)
|
9741
|
+
update!(**args)
|
9742
|
+
end
|
9743
|
+
|
9744
|
+
# Update properties of this object
|
9745
|
+
def update!(**args)
|
9746
|
+
@generic_metadata = args[:generic_metadata] if args.key?(:generic_metadata)
|
9747
|
+
end
|
9748
|
+
end
|
9749
|
+
|
9750
|
+
# Response message for ModelGardenService.ExportPublisherModel.
|
9751
|
+
class GoogleCloudAiplatformV1beta1ExportPublisherModelResponse
|
9752
|
+
include Google::Apis::Core::Hashable
|
9753
|
+
|
9754
|
+
# The destination uri of the model weights.
|
9755
|
+
# Corresponds to the JSON property `destinationUri`
|
9756
|
+
# @return [String]
|
9757
|
+
attr_accessor :destination_uri
|
9758
|
+
|
9759
|
+
# The name of the PublisherModel resource. Format: `publishers/`publisher`/
|
9760
|
+
# models/`publisher_model`@`version_id``
|
9761
|
+
# Corresponds to the JSON property `publisherModel`
|
9762
|
+
# @return [String]
|
9763
|
+
attr_accessor :publisher_model
|
9764
|
+
|
9765
|
+
def initialize(**args)
|
9766
|
+
update!(**args)
|
9767
|
+
end
|
9768
|
+
|
9769
|
+
# Update properties of this object
|
9770
|
+
def update!(**args)
|
9771
|
+
@destination_uri = args[:destination_uri] if args.key?(:destination_uri)
|
9772
|
+
@publisher_model = args[:publisher_model] if args.key?(:publisher_model)
|
9773
|
+
end
|
9774
|
+
end
|
9775
|
+
|
9584
9776
|
# Request message for TensorboardService.ExportTensorboardTimeSeriesData.
|
9585
9777
|
class GoogleCloudAiplatformV1beta1ExportTensorboardTimeSeriesDataRequest
|
9586
9778
|
include Google::Apis::Core::Hashable
|
@@ -12192,6 +12384,14 @@ module Google
|
|
12192
12384
|
class GoogleCloudAiplatformV1beta1FileData
|
12193
12385
|
include Google::Apis::Core::Hashable
|
12194
12386
|
|
12387
|
+
# Optional. Display name of the file data. Used to provide a label or filename
|
12388
|
+
# to distinguish file data items. This field is only returned in PromptMessage for
|
12389
|
+
# prompt management. It is not currently used in the Gemini GenerateContent
|
12390
|
+
# calls.
|
12391
|
+
# Corresponds to the JSON property `displayName`
|
12392
|
+
# @return [String]
|
12393
|
+
attr_accessor :display_name
|
12394
|
+
|
12195
12395
|
# Required. URI.
|
12196
12396
|
# Corresponds to the JSON property `fileUri`
|
12197
12397
|
# @return [String]
|
@@ -12208,6 +12408,7 @@ module Google
|
|
12208
12408
|
|
12209
12409
|
# Update properties of this object
|
12210
12410
|
def update!(**args)
|
12411
|
+
@display_name = args[:display_name] if args.key?(:display_name)
|
12211
12412
|
@file_uri = args[:file_uri] if args.key?(:file_uri)
|
12212
12413
|
@mime_type = args[:mime_type] if args.key?(:mime_type)
|
12213
12414
|
end
|
@@ -12890,6 +13091,47 @@ module Google
|
|
12890
13091
|
end
|
12891
13092
|
end
|
12892
13093
|
|
13094
|
+
# Configuration for GenAiAdvancedFeatures.
|
13095
|
+
class GoogleCloudAiplatformV1beta1GenAiAdvancedFeaturesConfig
|
13096
|
+
include Google::Apis::Core::Hashable
|
13097
|
+
|
13098
|
+
# Configuration for Retrieval Augmented Generation feature.
|
13099
|
+
# Corresponds to the JSON property `ragConfig`
|
13100
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GenAiAdvancedFeaturesConfigRagConfig]
|
13101
|
+
attr_accessor :rag_config
|
13102
|
+
|
13103
|
+
def initialize(**args)
|
13104
|
+
update!(**args)
|
13105
|
+
end
|
13106
|
+
|
13107
|
+
# Update properties of this object
|
13108
|
+
def update!(**args)
|
13109
|
+
@rag_config = args[:rag_config] if args.key?(:rag_config)
|
13110
|
+
end
|
13111
|
+
end
|
13112
|
+
|
13113
|
+
# Configuration for Retrieval Augmented Generation feature.
|
13114
|
+
class GoogleCloudAiplatformV1beta1GenAiAdvancedFeaturesConfigRagConfig
|
13115
|
+
include Google::Apis::Core::Hashable
|
13116
|
+
|
13117
|
+
# If true, enable Retrieval Augmented Generation in ChatCompletion request. Once
|
13118
|
+
# enabled, the endpoint will be identified as GenAI endpoint and Arthedain
|
13119
|
+
# router will be used.
|
13120
|
+
# Corresponds to the JSON property `enableRag`
|
13121
|
+
# @return [Boolean]
|
13122
|
+
attr_accessor :enable_rag
|
13123
|
+
alias_method :enable_rag?, :enable_rag
|
13124
|
+
|
13125
|
+
def initialize(**args)
|
13126
|
+
update!(**args)
|
13127
|
+
end
|
13128
|
+
|
13129
|
+
# Update properties of this object
|
13130
|
+
def update!(**args)
|
13131
|
+
@enable_rag = args[:enable_rag] if args.key?(:enable_rag)
|
13132
|
+
end
|
13133
|
+
end
|
13134
|
+
|
12893
13135
|
# Request message for NotebookInternalService.GenerateAccessToken.
|
12894
13136
|
class GoogleCloudAiplatformV1beta1GenerateAccessTokenRequest
|
12895
13137
|
include Google::Apis::Core::Hashable
|
@@ -13037,6 +13279,11 @@ module Google
|
|
13037
13279
|
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1Candidate>]
|
13038
13280
|
attr_accessor :candidates
|
13039
13281
|
|
13282
|
+
# Output only. Timestamp when the request is made to the server.
|
13283
|
+
# Corresponds to the JSON property `createTime`
|
13284
|
+
# @return [String]
|
13285
|
+
attr_accessor :create_time
|
13286
|
+
|
13040
13287
|
# Output only. The model version used to generate the response.
|
13041
13288
|
# Corresponds to the JSON property `modelVersion`
|
13042
13289
|
# @return [String]
|
@@ -13047,6 +13294,12 @@ module Google
|
|
13047
13294
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GenerateContentResponsePromptFeedback]
|
13048
13295
|
attr_accessor :prompt_feedback
|
13049
13296
|
|
13297
|
+
# Output only. response_id is used to identify each response. It is the encoding
|
13298
|
+
# of the event_id.
|
13299
|
+
# Corresponds to the JSON property `responseId`
|
13300
|
+
# @return [String]
|
13301
|
+
attr_accessor :response_id
|
13302
|
+
|
13050
13303
|
# Usage metadata about response(s).
|
13051
13304
|
# Corresponds to the JSON property `usageMetadata`
|
13052
13305
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GenerateContentResponseUsageMetadata]
|
@@ -13059,8 +13312,10 @@ module Google
|
|
13059
13312
|
# Update properties of this object
|
13060
13313
|
def update!(**args)
|
13061
13314
|
@candidates = args[:candidates] if args.key?(:candidates)
|
13315
|
+
@create_time = args[:create_time] if args.key?(:create_time)
|
13062
13316
|
@model_version = args[:model_version] if args.key?(:model_version)
|
13063
13317
|
@prompt_feedback = args[:prompt_feedback] if args.key?(:prompt_feedback)
|
13318
|
+
@response_id = args[:response_id] if args.key?(:response_id)
|
13064
13319
|
@usage_metadata = args[:usage_metadata] if args.key?(:usage_metadata)
|
13065
13320
|
end
|
13066
13321
|
end
|
@@ -13100,6 +13355,11 @@ module Google
|
|
13100
13355
|
class GoogleCloudAiplatformV1beta1GenerateContentResponseUsageMetadata
|
13101
13356
|
include Google::Apis::Core::Hashable
|
13102
13357
|
|
13358
|
+
# Output only. List of modalities of the cached content in the request input.
|
13359
|
+
# Corresponds to the JSON property `cacheTokensDetails`
|
13360
|
+
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ModalityTokenCount>]
|
13361
|
+
attr_accessor :cache_tokens_details
|
13362
|
+
|
13103
13363
|
# Output only. Number of tokens in the cached part in the input (the cached
|
13104
13364
|
# content).
|
13105
13365
|
# Corresponds to the JSON property `cachedContentTokenCount`
|
@@ -13111,6 +13371,11 @@ module Google
|
|
13111
13371
|
# @return [Fixnum]
|
13112
13372
|
attr_accessor :candidates_token_count
|
13113
13373
|
|
13374
|
+
# Output only. List of modalities that were returned in the response.
|
13375
|
+
# Corresponds to the JSON property `candidatesTokensDetails`
|
13376
|
+
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ModalityTokenCount>]
|
13377
|
+
attr_accessor :candidates_tokens_details
|
13378
|
+
|
13114
13379
|
# Number of tokens in the request. When `cached_content` is set, this is still
|
13115
13380
|
# the total effective prompt size meaning this includes the number of tokens in
|
13116
13381
|
# the cached content.
|
@@ -13118,6 +13383,11 @@ module Google
|
|
13118
13383
|
# @return [Fixnum]
|
13119
13384
|
attr_accessor :prompt_token_count
|
13120
13385
|
|
13386
|
+
# Output only. List of modalities that were processed in the request input.
|
13387
|
+
# Corresponds to the JSON property `promptTokensDetails`
|
13388
|
+
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ModalityTokenCount>]
|
13389
|
+
attr_accessor :prompt_tokens_details
|
13390
|
+
|
13121
13391
|
# Total token count for prompt and response candidates.
|
13122
13392
|
# Corresponds to the JSON property `totalTokenCount`
|
13123
13393
|
# @return [Fixnum]
|
@@ -13129,9 +13399,12 @@ module Google
|
|
13129
13399
|
|
13130
13400
|
# Update properties of this object
|
13131
13401
|
def update!(**args)
|
13402
|
+
@cache_tokens_details = args[:cache_tokens_details] if args.key?(:cache_tokens_details)
|
13132
13403
|
@cached_content_token_count = args[:cached_content_token_count] if args.key?(:cached_content_token_count)
|
13133
13404
|
@candidates_token_count = args[:candidates_token_count] if args.key?(:candidates_token_count)
|
13405
|
+
@candidates_tokens_details = args[:candidates_tokens_details] if args.key?(:candidates_tokens_details)
|
13134
13406
|
@prompt_token_count = args[:prompt_token_count] if args.key?(:prompt_token_count)
|
13407
|
+
@prompt_tokens_details = args[:prompt_tokens_details] if args.key?(:prompt_tokens_details)
|
13135
13408
|
@total_token_count = args[:total_token_count] if args.key?(:total_token_count)
|
13136
13409
|
end
|
13137
13410
|
end
|
@@ -16084,6 +16357,32 @@ module Google
|
|
16084
16357
|
end
|
16085
16358
|
end
|
16086
16359
|
|
16360
|
+
# Response message for ModelService.ListModelVersionCheckpoints
|
16361
|
+
class GoogleCloudAiplatformV1beta1ListModelVersionCheckpointsResponse
|
16362
|
+
include Google::Apis::Core::Hashable
|
16363
|
+
|
16364
|
+
# List of Model Version checkpoints.
|
16365
|
+
# Corresponds to the JSON property `checkpoints`
|
16366
|
+
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ModelVersionCheckpoint>]
|
16367
|
+
attr_accessor :checkpoints
|
16368
|
+
|
16369
|
+
# A token to retrieve the next page of results. Pass to
|
16370
|
+
# ListModelVersionCheckpointsRequest.page_token to obtain that page.
|
16371
|
+
# Corresponds to the JSON property `nextPageToken`
|
16372
|
+
# @return [String]
|
16373
|
+
attr_accessor :next_page_token
|
16374
|
+
|
16375
|
+
def initialize(**args)
|
16376
|
+
update!(**args)
|
16377
|
+
end
|
16378
|
+
|
16379
|
+
# Update properties of this object
|
16380
|
+
def update!(**args)
|
16381
|
+
@checkpoints = args[:checkpoints] if args.key?(:checkpoints)
|
16382
|
+
@next_page_token = args[:next_page_token] if args.key?(:next_page_token)
|
16383
|
+
end
|
16384
|
+
end
|
16385
|
+
|
16087
16386
|
# Response message for ModelService.ListModelVersions
|
16088
16387
|
class GoogleCloudAiplatformV1beta1ListModelVersionsResponse
|
16089
16388
|
include Google::Apis::Core::Hashable
|
@@ -17156,6 +17455,58 @@ module Google
|
|
17156
17455
|
end
|
17157
17456
|
end
|
17158
17457
|
|
17458
|
+
# The metric used for dataset level evaluation.
|
17459
|
+
class GoogleCloudAiplatformV1beta1Metric
|
17460
|
+
include Google::Apis::Core::Hashable
|
17461
|
+
|
17462
|
+
# Optional. The aggregation metrics to use.
|
17463
|
+
# Corresponds to the JSON property `aggregationMetrics`
|
17464
|
+
# @return [Array<String>]
|
17465
|
+
attr_accessor :aggregation_metrics
|
17466
|
+
|
17467
|
+
# Spec for bleu score metric - calculates the precision of n-grams in the
|
17468
|
+
# prediction as compared to reference - returns a score ranging between 0 to 1.
|
17469
|
+
# Corresponds to the JSON property `bleuSpec`
|
17470
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1BleuSpec]
|
17471
|
+
attr_accessor :bleu_spec
|
17472
|
+
|
17473
|
+
# Spec for exact match metric - returns 1 if prediction and reference exactly
|
17474
|
+
# matches, otherwise 0.
|
17475
|
+
# Corresponds to the JSON property `exactMatchSpec`
|
17476
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ExactMatchSpec]
|
17477
|
+
attr_accessor :exact_match_spec
|
17478
|
+
|
17479
|
+
# Spec for pairwise metric.
|
17480
|
+
# Corresponds to the JSON property `pairwiseMetricSpec`
|
17481
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1PairwiseMetricSpec]
|
17482
|
+
attr_accessor :pairwise_metric_spec
|
17483
|
+
|
17484
|
+
# Spec for pointwise metric.
|
17485
|
+
# Corresponds to the JSON property `pointwiseMetricSpec`
|
17486
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1PointwiseMetricSpec]
|
17487
|
+
attr_accessor :pointwise_metric_spec
|
17488
|
+
|
17489
|
+
# Spec for rouge score metric - calculates the recall of n-grams in prediction
|
17490
|
+
# as compared to reference - returns a score ranging between 0 and 1.
|
17491
|
+
# Corresponds to the JSON property `rougeSpec`
|
17492
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1RougeSpec]
|
17493
|
+
attr_accessor :rouge_spec
|
17494
|
+
|
17495
|
+
def initialize(**args)
|
17496
|
+
update!(**args)
|
17497
|
+
end
|
17498
|
+
|
17499
|
+
# Update properties of this object
|
17500
|
+
def update!(**args)
|
17501
|
+
@aggregation_metrics = args[:aggregation_metrics] if args.key?(:aggregation_metrics)
|
17502
|
+
@bleu_spec = args[:bleu_spec] if args.key?(:bleu_spec)
|
17503
|
+
@exact_match_spec = args[:exact_match_spec] if args.key?(:exact_match_spec)
|
17504
|
+
@pairwise_metric_spec = args[:pairwise_metric_spec] if args.key?(:pairwise_metric_spec)
|
17505
|
+
@pointwise_metric_spec = args[:pointwise_metric_spec] if args.key?(:pointwise_metric_spec)
|
17506
|
+
@rouge_spec = args[:rouge_spec] if args.key?(:rouge_spec)
|
17507
|
+
end
|
17508
|
+
end
|
17509
|
+
|
17159
17510
|
# Input for MetricX metric.
|
17160
17511
|
class GoogleCloudAiplatformV1beta1MetricxInput
|
17161
17512
|
include Google::Apis::Core::Hashable
|
@@ -17674,6 +18025,31 @@ module Google
|
|
17674
18025
|
end
|
17675
18026
|
end
|
17676
18027
|
|
18028
|
+
# Represents token counting info for a single modality.
|
18029
|
+
class GoogleCloudAiplatformV1beta1ModalityTokenCount
|
18030
|
+
include Google::Apis::Core::Hashable
|
18031
|
+
|
18032
|
+
# The modality associated with this token count.
|
18033
|
+
# Corresponds to the JSON property `modality`
|
18034
|
+
# @return [String]
|
18035
|
+
attr_accessor :modality
|
18036
|
+
|
18037
|
+
# Number of tokens.
|
18038
|
+
# Corresponds to the JSON property `tokenCount`
|
18039
|
+
# @return [Fixnum]
|
18040
|
+
attr_accessor :token_count
|
18041
|
+
|
18042
|
+
def initialize(**args)
|
18043
|
+
update!(**args)
|
18044
|
+
end
|
18045
|
+
|
18046
|
+
# Update properties of this object
|
18047
|
+
def update!(**args)
|
18048
|
+
@modality = args[:modality] if args.key?(:modality)
|
18049
|
+
@token_count = args[:token_count] if args.key?(:token_count)
|
18050
|
+
end
|
18051
|
+
end
|
18052
|
+
|
17677
18053
|
# A trained machine learning Model.
|
17678
18054
|
class GoogleCloudAiplatformV1beta1Model
|
17679
18055
|
include Google::Apis::Core::Hashable
|
@@ -17703,6 +18079,11 @@ module Google
|
|
17703
18079
|
# @return [String]
|
17704
18080
|
attr_accessor :create_time
|
17705
18081
|
|
18082
|
+
# The default checkpoint id of a model version.
|
18083
|
+
# Corresponds to the JSON property `defaultCheckpointId`
|
18084
|
+
# @return [String]
|
18085
|
+
attr_accessor :default_checkpoint_id
|
18086
|
+
|
17706
18087
|
# Output only. The pointers to DeployedModels created from this Model. Note that
|
17707
18088
|
# Model could have been deployed to Endpoints in different Locations.
|
17708
18089
|
# Corresponds to the JSON property `deployedModels`
|
@@ -17917,6 +18298,7 @@ module Google
|
|
17917
18298
|
@base_model_source = args[:base_model_source] if args.key?(:base_model_source)
|
17918
18299
|
@container_spec = args[:container_spec] if args.key?(:container_spec)
|
17919
18300
|
@create_time = args[:create_time] if args.key?(:create_time)
|
18301
|
+
@default_checkpoint_id = args[:default_checkpoint_id] if args.key?(:default_checkpoint_id)
|
17920
18302
|
@deployed_models = args[:deployed_models] if args.key?(:deployed_models)
|
17921
18303
|
@description = args[:description] if args.key?(:description)
|
17922
18304
|
@display_name = args[:display_name] if args.key?(:display_name)
|
@@ -18925,7 +19307,7 @@ module Google
|
|
18925
19307
|
# model in SavedModel format. * `tf-js` A [TensorFlow.js](https://www.tensorflow.
|
18926
19308
|
# org/js) model that can be used in the browser and in Node.js using JavaScript.
|
18927
19309
|
# * `core-ml` Used for iOS mobile devices. * `custom-trained` A Model that was
|
18928
|
-
# uploaded or trained by custom code.
|
19310
|
+
# uploaded or trained by custom code. * `genie` A tuned Model Garden model.
|
18929
19311
|
# Corresponds to the JSON property `id`
|
18930
19312
|
# @return [String]
|
18931
19313
|
attr_accessor :id
|
@@ -18951,6 +19333,17 @@ module Google
|
|
18951
19333
|
# @return [String]
|
18952
19334
|
attr_accessor :public_model_name
|
18953
19335
|
|
19336
|
+
# Optional. Whether to avoid pulling the model from the HF cache.
|
19337
|
+
# Corresponds to the JSON property `skipHfModelCache`
|
19338
|
+
# @return [Boolean]
|
19339
|
+
attr_accessor :skip_hf_model_cache
|
19340
|
+
alias_method :skip_hf_model_cache?, :skip_hf_model_cache
|
19341
|
+
|
19342
|
+
# Optional. The model garden source model version ID.
|
19343
|
+
# Corresponds to the JSON property `versionId`
|
19344
|
+
# @return [String]
|
19345
|
+
attr_accessor :version_id
|
19346
|
+
|
18954
19347
|
def initialize(**args)
|
18955
19348
|
update!(**args)
|
18956
19349
|
end
|
@@ -18958,6 +19351,8 @@ module Google
|
|
18958
19351
|
# Update properties of this object
|
18959
19352
|
def update!(**args)
|
18960
19353
|
@public_model_name = args[:public_model_name] if args.key?(:public_model_name)
|
19354
|
+
@skip_hf_model_cache = args[:skip_hf_model_cache] if args.key?(:skip_hf_model_cache)
|
19355
|
+
@version_id = args[:version_id] if args.key?(:version_id)
|
18961
19356
|
end
|
18962
19357
|
end
|
18963
19358
|
|
@@ -20610,6 +21005,45 @@ module Google
|
|
20610
21005
|
end
|
20611
21006
|
end
|
20612
21007
|
|
21008
|
+
# Describes the machine learning model version checkpoint.
|
21009
|
+
class GoogleCloudAiplatformV1beta1ModelVersionCheckpoint
|
21010
|
+
include Google::Apis::Core::Hashable
|
21011
|
+
|
21012
|
+
# The ID of the checkpoint.
|
21013
|
+
# Corresponds to the JSON property `checkpointId`
|
21014
|
+
# @return [String]
|
21015
|
+
attr_accessor :checkpoint_id
|
21016
|
+
|
21017
|
+
# The epoch of the checkpoint.
|
21018
|
+
# Corresponds to the JSON property `epoch`
|
21019
|
+
# @return [Fixnum]
|
21020
|
+
attr_accessor :epoch
|
21021
|
+
|
21022
|
+
# Identifier. The resource name of the ModelVersionCheckpoint. Format: `projects/
|
21023
|
+
# `project`/locations/`location`/models/`model`/versions/`version`/checkpoints/`
|
21024
|
+
# checkpoint``
|
21025
|
+
# Corresponds to the JSON property `name`
|
21026
|
+
# @return [String]
|
21027
|
+
attr_accessor :name
|
21028
|
+
|
21029
|
+
# The step of the checkpoint.
|
21030
|
+
# Corresponds to the JSON property `step`
|
21031
|
+
# @return [Fixnum]
|
21032
|
+
attr_accessor :step
|
21033
|
+
|
21034
|
+
def initialize(**args)
|
21035
|
+
update!(**args)
|
21036
|
+
end
|
21037
|
+
|
21038
|
+
# Update properties of this object
|
21039
|
+
def update!(**args)
|
21040
|
+
@checkpoint_id = args[:checkpoint_id] if args.key?(:checkpoint_id)
|
21041
|
+
@epoch = args[:epoch] if args.key?(:epoch)
|
21042
|
+
@name = args[:name] if args.key?(:name)
|
21043
|
+
@step = args[:step] if args.key?(:step)
|
21044
|
+
end
|
21045
|
+
end
|
21046
|
+
|
20613
21047
|
# Runtime operation information for IndexEndpointService.MutateDeployedIndex.
|
20614
21048
|
class GoogleCloudAiplatformV1beta1MutateDeployedIndexOperationMetadata
|
20615
21049
|
include Google::Apis::Core::Hashable
|
@@ -21719,8 +22153,8 @@ module Google
|
|
21719
22153
|
# @return [String]
|
21720
22154
|
attr_accessor :notebook_runtime_template_resource_name
|
21721
22155
|
|
21722
|
-
#
|
21723
|
-
#
|
22156
|
+
# The Schedule resource name if this job is triggered by one. Format: `projects/`
|
22157
|
+
# project_id`/locations/`location`/schedules/`schedule_id``
|
21724
22158
|
# Corresponds to the JSON property `scheduleResourceName`
|
21725
22159
|
# @return [String]
|
21726
22160
|
attr_accessor :schedule_resource_name
|
@@ -22083,6 +22517,11 @@ module Google
|
|
22083
22517
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ShieldedVmConfig]
|
22084
22518
|
attr_accessor :shielded_vm_config
|
22085
22519
|
|
22520
|
+
# Notebook Software Config.
|
22521
|
+
# Corresponds to the JSON property `softwareConfig`
|
22522
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1NotebookSoftwareConfig]
|
22523
|
+
attr_accessor :software_config
|
22524
|
+
|
22086
22525
|
# Output only. Timestamp when this NotebookRuntime was most recently updated.
|
22087
22526
|
# Corresponds to the JSON property `updateTime`
|
22088
22527
|
# @return [String]
|
@@ -22123,6 +22562,7 @@ module Google
|
|
22123
22562
|
@satisfies_pzs = args[:satisfies_pzs] if args.key?(:satisfies_pzs)
|
22124
22563
|
@service_account = args[:service_account] if args.key?(:service_account)
|
22125
22564
|
@shielded_vm_config = args[:shielded_vm_config] if args.key?(:shielded_vm_config)
|
22565
|
+
@software_config = args[:software_config] if args.key?(:software_config)
|
22126
22566
|
@update_time = args[:update_time] if args.key?(:update_time)
|
22127
22567
|
@version = args[:version] if args.key?(:version)
|
22128
22568
|
end
|
@@ -22241,6 +22681,11 @@ module Google
|
|
22241
22681
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ShieldedVmConfig]
|
22242
22682
|
attr_accessor :shielded_vm_config
|
22243
22683
|
|
22684
|
+
# Notebook Software Config.
|
22685
|
+
# Corresponds to the JSON property `softwareConfig`
|
22686
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1NotebookSoftwareConfig]
|
22687
|
+
attr_accessor :software_config
|
22688
|
+
|
22244
22689
|
# Output only. Timestamp when this NotebookRuntimeTemplate was most recently
|
22245
22690
|
# updated.
|
22246
22691
|
# Corresponds to the JSON property `updateTime`
|
@@ -22270,6 +22715,7 @@ module Google
|
|
22270
22715
|
@notebook_runtime_type = args[:notebook_runtime_type] if args.key?(:notebook_runtime_type)
|
22271
22716
|
@service_account = args[:service_account] if args.key?(:service_account)
|
22272
22717
|
@shielded_vm_config = args[:shielded_vm_config] if args.key?(:shielded_vm_config)
|
22718
|
+
@software_config = args[:software_config] if args.key?(:software_config)
|
22273
22719
|
@update_time = args[:update_time] if args.key?(:update_time)
|
22274
22720
|
end
|
22275
22721
|
end
|
@@ -22293,6 +22739,51 @@ module Google
|
|
22293
22739
|
end
|
22294
22740
|
end
|
22295
22741
|
|
22742
|
+
# Notebook Software Config.
|
22743
|
+
class GoogleCloudAiplatformV1beta1NotebookSoftwareConfig
|
22744
|
+
include Google::Apis::Core::Hashable
|
22745
|
+
|
22746
|
+
# Optional. Environment variables to be passed to the container. Maximum limit
|
22747
|
+
# is 100.
|
22748
|
+
# Corresponds to the JSON property `env`
|
22749
|
+
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1EnvVar>]
|
22750
|
+
attr_accessor :env
|
22751
|
+
|
22752
|
+
# Post startup script config.
|
22753
|
+
# Corresponds to the JSON property `postStartupScriptConfig`
|
22754
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1PostStartupScriptConfig]
|
22755
|
+
attr_accessor :post_startup_script_config
|
22756
|
+
|
22757
|
+
def initialize(**args)
|
22758
|
+
update!(**args)
|
22759
|
+
end
|
22760
|
+
|
22761
|
+
# Update properties of this object
|
22762
|
+
def update!(**args)
|
22763
|
+
@env = args[:env] if args.key?(:env)
|
22764
|
+
@post_startup_script_config = args[:post_startup_script_config] if args.key?(:post_startup_script_config)
|
22765
|
+
end
|
22766
|
+
end
|
22767
|
+
|
22768
|
+
# Config for evaluation output.
|
22769
|
+
class GoogleCloudAiplatformV1beta1OutputConfig
|
22770
|
+
include Google::Apis::Core::Hashable
|
22771
|
+
|
22772
|
+
# The Google Cloud Storage location where the output is to be written to.
|
22773
|
+
# Corresponds to the JSON property `gcsDestination`
|
22774
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GcsDestination]
|
22775
|
+
attr_accessor :gcs_destination
|
22776
|
+
|
22777
|
+
def initialize(**args)
|
22778
|
+
update!(**args)
|
22779
|
+
end
|
22780
|
+
|
22781
|
+
# Update properties of this object
|
22782
|
+
def update!(**args)
|
22783
|
+
@gcs_destination = args[:gcs_destination] if args.key?(:gcs_destination)
|
22784
|
+
end
|
22785
|
+
end
|
22786
|
+
|
22296
22787
|
# PSC config that is used to automatically create forwarding rule via
|
22297
22788
|
# ServiceConnectionMap.
|
22298
22789
|
class GoogleCloudAiplatformV1beta1PscAutomationConfig
|
@@ -22399,18 +22890,36 @@ module Google
|
|
22399
22890
|
class GoogleCloudAiplatformV1beta1PairwiseMetricSpec
|
22400
22891
|
include Google::Apis::Core::Hashable
|
22401
22892
|
|
22893
|
+
# Optional. The field name of the baseline response.
|
22894
|
+
# Corresponds to the JSON property `baselineResponseFieldName`
|
22895
|
+
# @return [String]
|
22896
|
+
attr_accessor :baseline_response_field_name
|
22897
|
+
|
22898
|
+
# Optional. The field name of the candidate response.
|
22899
|
+
# Corresponds to the JSON property `candidateResponseFieldName`
|
22900
|
+
# @return [String]
|
22901
|
+
attr_accessor :candidate_response_field_name
|
22902
|
+
|
22402
22903
|
# Required. Metric prompt template for pairwise metric.
|
22403
22904
|
# Corresponds to the JSON property `metricPromptTemplate`
|
22404
22905
|
# @return [String]
|
22405
22906
|
attr_accessor :metric_prompt_template
|
22406
22907
|
|
22908
|
+
# Optional. System instructions for pairwise metric.
|
22909
|
+
# Corresponds to the JSON property `systemInstruction`
|
22910
|
+
# @return [String]
|
22911
|
+
attr_accessor :system_instruction
|
22912
|
+
|
22407
22913
|
def initialize(**args)
|
22408
22914
|
update!(**args)
|
22409
22915
|
end
|
22410
22916
|
|
22411
22917
|
# Update properties of this object
|
22412
22918
|
def update!(**args)
|
22919
|
+
@baseline_response_field_name = args[:baseline_response_field_name] if args.key?(:baseline_response_field_name)
|
22920
|
+
@candidate_response_field_name = args[:candidate_response_field_name] if args.key?(:candidate_response_field_name)
|
22413
22921
|
@metric_prompt_template = args[:metric_prompt_template] if args.key?(:metric_prompt_template)
|
22922
|
+
@system_instruction = args[:system_instruction] if args.key?(:system_instruction)
|
22414
22923
|
end
|
22415
22924
|
end
|
22416
22925
|
|
@@ -22717,7 +23226,7 @@ module Google
|
|
22717
23226
|
# @return [String]
|
22718
23227
|
attr_accessor :text
|
22719
23228
|
|
22720
|
-
#
|
23229
|
+
# Output only. Indicates if the part is thought from the model.
|
22721
23230
|
# Corresponds to the JSON property `thought`
|
22722
23231
|
# @return [Boolean]
|
22723
23232
|
attr_accessor :thought
|
@@ -23808,6 +24317,11 @@ module Google
|
|
23808
24317
|
# @return [String]
|
23809
24318
|
attr_accessor :metric_prompt_template
|
23810
24319
|
|
24320
|
+
# Optional. System instructions for pointwise metric.
|
24321
|
+
# Corresponds to the JSON property `systemInstruction`
|
24322
|
+
# @return [String]
|
24323
|
+
attr_accessor :system_instruction
|
24324
|
+
|
23811
24325
|
def initialize(**args)
|
23812
24326
|
update!(**args)
|
23813
24327
|
end
|
@@ -23815,6 +24329,7 @@ module Google
|
|
23815
24329
|
# Update properties of this object
|
23816
24330
|
def update!(**args)
|
23817
24331
|
@metric_prompt_template = args[:metric_prompt_template] if args.key?(:metric_prompt_template)
|
24332
|
+
@system_instruction = args[:system_instruction] if args.key?(:system_instruction)
|
23818
24333
|
end
|
23819
24334
|
end
|
23820
24335
|
|
@@ -23838,6 +24353,39 @@ module Google
|
|
23838
24353
|
end
|
23839
24354
|
end
|
23840
24355
|
|
24356
|
+
# Post startup script config.
|
24357
|
+
class GoogleCloudAiplatformV1beta1PostStartupScriptConfig
|
24358
|
+
include Google::Apis::Core::Hashable
|
24359
|
+
|
24360
|
+
# Optional. Post startup script to run after runtime is started.
|
24361
|
+
# Corresponds to the JSON property `postStartupScript`
|
24362
|
+
# @return [String]
|
24363
|
+
attr_accessor :post_startup_script
|
24364
|
+
|
24365
|
+
# Optional. Post startup script behavior that defines download and execution
|
24366
|
+
# behavior.
|
24367
|
+
# Corresponds to the JSON property `postStartupScriptBehavior`
|
24368
|
+
# @return [String]
|
24369
|
+
attr_accessor :post_startup_script_behavior
|
24370
|
+
|
24371
|
+
# Optional. Post startup script url to download. Example: https://bucket/script.
|
24372
|
+
# sh
|
24373
|
+
# Corresponds to the JSON property `postStartupScriptUrl`
|
24374
|
+
# @return [String]
|
24375
|
+
attr_accessor :post_startup_script_url
|
24376
|
+
|
24377
|
+
def initialize(**args)
|
24378
|
+
update!(**args)
|
24379
|
+
end
|
24380
|
+
|
24381
|
+
# Update properties of this object
|
24382
|
+
def update!(**args)
|
24383
|
+
@post_startup_script = args[:post_startup_script] if args.key?(:post_startup_script)
|
24384
|
+
@post_startup_script_behavior = args[:post_startup_script_behavior] if args.key?(:post_startup_script_behavior)
|
24385
|
+
@post_startup_script_url = args[:post_startup_script_url] if args.key?(:post_startup_script_url)
|
24386
|
+
end
|
24387
|
+
end
|
24388
|
+
|
23841
24389
|
# The configuration for the prebuilt speaker to use.
|
23842
24390
|
class GoogleCloudAiplatformV1beta1PrebuiltVoiceConfig
|
23843
24391
|
include Google::Apis::Core::Hashable
|
@@ -24244,6 +24792,12 @@ module Google
|
|
24244
24792
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ProbeExecAction]
|
24245
24793
|
attr_accessor :exec
|
24246
24794
|
|
24795
|
+
# Number of consecutive failures before the probe is considered failed. Defaults
|
24796
|
+
# to 3. Minimum value is 1. Maps to Kubernetes probe argument 'failureThreshold'.
|
24797
|
+
# Corresponds to the JSON property `failureThreshold`
|
24798
|
+
# @return [Fixnum]
|
24799
|
+
attr_accessor :failure_threshold
|
24800
|
+
|
24247
24801
|
# GrpcAction checks the health of a container using a gRPC service.
|
24248
24802
|
# Corresponds to the JSON property `grpc`
|
24249
24803
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ProbeGrpcAction]
|
@@ -24254,6 +24808,12 @@ module Google
|
|
24254
24808
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ProbeHttpGetAction]
|
24255
24809
|
attr_accessor :http_get
|
24256
24810
|
|
24811
|
+
# Number of seconds to wait before starting the probe. Defaults to 0. Minimum
|
24812
|
+
# value is 0. Maps to Kubernetes probe argument 'initialDelaySeconds'.
|
24813
|
+
# Corresponds to the JSON property `initialDelaySeconds`
|
24814
|
+
# @return [Fixnum]
|
24815
|
+
attr_accessor :initial_delay_seconds
|
24816
|
+
|
24257
24817
|
# How often (in seconds) to perform the probe. Default to 10 seconds. Minimum
|
24258
24818
|
# value is 1. Must be less than timeout_seconds. Maps to Kubernetes probe
|
24259
24819
|
# argument 'periodSeconds'.
|
@@ -24261,6 +24821,13 @@ module Google
|
|
24261
24821
|
# @return [Fixnum]
|
24262
24822
|
attr_accessor :period_seconds
|
24263
24823
|
|
24824
|
+
# Number of consecutive successes before the probe is considered successful.
|
24825
|
+
# Defaults to 1. Minimum value is 1. Maps to Kubernetes probe argument '
|
24826
|
+
# successThreshold'.
|
24827
|
+
# Corresponds to the JSON property `successThreshold`
|
24828
|
+
# @return [Fixnum]
|
24829
|
+
attr_accessor :success_threshold
|
24830
|
+
|
24264
24831
|
# TcpSocketAction probes the health of a container by opening a TCP socket
|
24265
24832
|
# connection.
|
24266
24833
|
# Corresponds to the JSON property `tcpSocket`
|
@@ -24281,9 +24848,12 @@ module Google
|
|
24281
24848
|
# Update properties of this object
|
24282
24849
|
def update!(**args)
|
24283
24850
|
@exec = args[:exec] if args.key?(:exec)
|
24851
|
+
@failure_threshold = args[:failure_threshold] if args.key?(:failure_threshold)
|
24284
24852
|
@grpc = args[:grpc] if args.key?(:grpc)
|
24285
24853
|
@http_get = args[:http_get] if args.key?(:http_get)
|
24854
|
+
@initial_delay_seconds = args[:initial_delay_seconds] if args.key?(:initial_delay_seconds)
|
24286
24855
|
@period_seconds = args[:period_seconds] if args.key?(:period_seconds)
|
24856
|
+
@success_threshold = args[:success_threshold] if args.key?(:success_threshold)
|
24287
24857
|
@tcp_socket = args[:tcp_socket] if args.key?(:tcp_socket)
|
24288
24858
|
@timeout_seconds = args[:timeout_seconds] if args.key?(:timeout_seconds)
|
24289
24859
|
end
|
@@ -24705,8 +25275,8 @@ module Google
|
|
24705
25275
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ModelContainerSpec]
|
24706
25276
|
attr_accessor :container_spec
|
24707
25277
|
|
24708
|
-
# A description of resources that are dedicated to a DeployedModel
|
24709
|
-
# need a higher degree of manual configuration.
|
25278
|
+
# A description of resources that are dedicated to a DeployedModel or
|
25279
|
+
# DeployedIndex, and that need a higher degree of manual configuration.
|
24710
25280
|
# Corresponds to the JSON property `dedicatedResources`
|
24711
25281
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DedicatedResources]
|
24712
25282
|
attr_accessor :dedicated_resources
|
@@ -26036,6 +26606,11 @@ module Google
|
|
26036
26606
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1RagEmbeddingModelConfig]
|
26037
26607
|
attr_accessor :rag_embedding_model_config
|
26038
26608
|
|
26609
|
+
# Output only. Number of RagFiles in the RagCorpus.
|
26610
|
+
# Corresponds to the JSON property `ragFilesCount`
|
26611
|
+
# @return [Fixnum]
|
26612
|
+
attr_accessor :rag_files_count
|
26613
|
+
|
26039
26614
|
# Config for the Vector DB to use for RAG.
|
26040
26615
|
# Corresponds to the JSON property `ragVectorDbConfig`
|
26041
26616
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1RagVectorDbConfig]
|
@@ -26068,6 +26643,7 @@ module Google
|
|
26068
26643
|
@display_name = args[:display_name] if args.key?(:display_name)
|
26069
26644
|
@name = args[:name] if args.key?(:name)
|
26070
26645
|
@rag_embedding_model_config = args[:rag_embedding_model_config] if args.key?(:rag_embedding_model_config)
|
26646
|
+
@rag_files_count = args[:rag_files_count] if args.key?(:rag_files_count)
|
26071
26647
|
@rag_vector_db_config = args[:rag_vector_db_config] if args.key?(:rag_vector_db_config)
|
26072
26648
|
@update_time = args[:update_time] if args.key?(:update_time)
|
26073
26649
|
@vector_db_config = args[:vector_db_config] if args.key?(:vector_db_config)
|
@@ -26478,7 +27054,8 @@ module Google
|
|
26478
27054
|
# @return [Fixnum]
|
26479
27055
|
attr_accessor :max_parsing_requests_per_min
|
26480
27056
|
|
26481
|
-
# The name of a LLM model used for parsing. Format: `
|
27057
|
+
# The name of a LLM model used for parsing. Format: * `projects/`project_id`/
|
27058
|
+
# locations/`location`/publishers/`publisher`/models/`model``
|
26482
27059
|
# Corresponds to the JSON property `modelName`
|
26483
27060
|
# @return [String]
|
26484
27061
|
attr_accessor :model_name
|
@@ -26733,7 +27310,8 @@ module Google
|
|
26733
27310
|
class GoogleCloudAiplatformV1beta1RagVectorDbConfig
|
26734
27311
|
include Google::Apis::Core::Hashable
|
26735
27312
|
|
26736
|
-
# The generic reusable api auth config.
|
27313
|
+
# The generic reusable api auth config. Deprecated. Please use AuthConfig (
|
27314
|
+
# google/cloud/aiplatform/master/auth.proto) instead.
|
26737
27315
|
# Corresponds to the JSON property `apiAuth`
|
26738
27316
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ApiAuth]
|
26739
27317
|
attr_accessor :api_auth
|
@@ -28012,6 +28590,34 @@ module Google
|
|
28012
28590
|
end
|
28013
28591
|
end
|
28014
28592
|
|
28593
|
+
# Retrieval config.
|
28594
|
+
class GoogleCloudAiplatformV1beta1RetrievalConfig
|
28595
|
+
include Google::Apis::Core::Hashable
|
28596
|
+
|
28597
|
+
# The language code of the user.
|
28598
|
+
# Corresponds to the JSON property `languageCode`
|
28599
|
+
# @return [String]
|
28600
|
+
attr_accessor :language_code
|
28601
|
+
|
28602
|
+
# An object that represents a latitude/longitude pair. This is expressed as a
|
28603
|
+
# pair of doubles to represent degrees latitude and degrees longitude. Unless
|
28604
|
+
# specified otherwise, this object must conform to the WGS84 standard. Values
|
28605
|
+
# must be within normalized ranges.
|
28606
|
+
# Corresponds to the JSON property `latLng`
|
28607
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleTypeLatLng]
|
28608
|
+
attr_accessor :lat_lng
|
28609
|
+
|
28610
|
+
def initialize(**args)
|
28611
|
+
update!(**args)
|
28612
|
+
end
|
28613
|
+
|
28614
|
+
# Update properties of this object
|
28615
|
+
def update!(**args)
|
28616
|
+
@language_code = args[:language_code] if args.key?(:language_code)
|
28617
|
+
@lat_lng = args[:lat_lng] if args.key?(:lat_lng)
|
28618
|
+
end
|
28619
|
+
end
|
28620
|
+
|
28015
28621
|
# Metadata related to retrieval in the grounding flow.
|
28016
28622
|
class GoogleCloudAiplatformV1beta1RetrievalMetadata
|
28017
28623
|
include Google::Apis::Core::Hashable
|
@@ -28139,6 +28745,59 @@ module Google
|
|
28139
28745
|
end
|
28140
28746
|
end
|
28141
28747
|
|
28748
|
+
# Configuration for rolling deployments.
|
28749
|
+
class GoogleCloudAiplatformV1beta1RolloutOptions
|
28750
|
+
include Google::Apis::Core::Hashable
|
28751
|
+
|
28752
|
+
# Percentage of allowed additional replicas. For autoscaling deployments, this
|
28753
|
+
# refers to the target replica count.
|
28754
|
+
# Corresponds to the JSON property `maxSurgePercentage`
|
28755
|
+
# @return [Fixnum]
|
28756
|
+
attr_accessor :max_surge_percentage
|
28757
|
+
|
28758
|
+
# Absolute count of allowed additional replicas.
|
28759
|
+
# Corresponds to the JSON property `maxSurgeReplicas`
|
28760
|
+
# @return [Fixnum]
|
28761
|
+
attr_accessor :max_surge_replicas
|
28762
|
+
|
28763
|
+
# Percentage of replicas allowed to be unavailable. For autoscaling deployments,
|
28764
|
+
# this refers to the target replica count.
|
28765
|
+
# Corresponds to the JSON property `maxUnavailablePercentage`
|
28766
|
+
# @return [Fixnum]
|
28767
|
+
attr_accessor :max_unavailable_percentage
|
28768
|
+
|
28769
|
+
# Absolute count of replicas allowed to be unavailable.
|
28770
|
+
# Corresponds to the JSON property `maxUnavailableReplicas`
|
28771
|
+
# @return [Fixnum]
|
28772
|
+
attr_accessor :max_unavailable_replicas
|
28773
|
+
|
28774
|
+
# ID of the DeployedModel that this deployment should replace.
|
28775
|
+
# Corresponds to the JSON property `previousDeployedModel`
|
28776
|
+
# @return [String]
|
28777
|
+
attr_accessor :previous_deployed_model
|
28778
|
+
|
28779
|
+
# Output only. Read-only. Revision number determines the relative priority of
|
28780
|
+
# DeployedModels in the same rollout. The DeployedModel with the largest
|
28781
|
+
# revision number specifies the intended state of the deployment.
|
28782
|
+
# Corresponds to the JSON property `revisionNumber`
|
28783
|
+
# @return [Fixnum]
|
28784
|
+
attr_accessor :revision_number
|
28785
|
+
|
28786
|
+
def initialize(**args)
|
28787
|
+
update!(**args)
|
28788
|
+
end
|
28789
|
+
|
28790
|
+
# Update properties of this object
|
28791
|
+
def update!(**args)
|
28792
|
+
@max_surge_percentage = args[:max_surge_percentage] if args.key?(:max_surge_percentage)
|
28793
|
+
@max_surge_replicas = args[:max_surge_replicas] if args.key?(:max_surge_replicas)
|
28794
|
+
@max_unavailable_percentage = args[:max_unavailable_percentage] if args.key?(:max_unavailable_percentage)
|
28795
|
+
@max_unavailable_replicas = args[:max_unavailable_replicas] if args.key?(:max_unavailable_replicas)
|
28796
|
+
@previous_deployed_model = args[:previous_deployed_model] if args.key?(:previous_deployed_model)
|
28797
|
+
@revision_number = args[:revision_number] if args.key?(:revision_number)
|
28798
|
+
end
|
28799
|
+
end
|
28800
|
+
|
28142
28801
|
# Input for rouge metric.
|
28143
28802
|
class GoogleCloudAiplatformV1beta1RougeInput
|
28144
28803
|
include Google::Apis::Core::Hashable
|
@@ -32427,8 +33086,9 @@ module Google
|
|
32427
33086
|
class GoogleCloudAiplatformV1beta1SchemaTextDataItem
|
32428
33087
|
include Google::Apis::Core::Hashable
|
32429
33088
|
|
32430
|
-
# Output only. Google Cloud Storage URI points to the original text in
|
32431
|
-
# bucket. The text file is up to 10MB
|
33089
|
+
# Output only. Google Cloud Storage URI points to a copy of the original text in
|
33090
|
+
# the Vertex-managed bucket in the user's project. The text file is up to 10MB
|
33091
|
+
# in size.
|
32432
33092
|
# Corresponds to the JSON property `gcsUri`
|
32433
33093
|
# @return [String]
|
32434
33094
|
attr_accessor :gcs_uri
|
@@ -36729,6 +37389,81 @@ module Google
|
|
36729
37389
|
end
|
36730
37390
|
end
|
36731
37391
|
|
37392
|
+
# Configuration for Speculative Decoding.
|
37393
|
+
class GoogleCloudAiplatformV1beta1SpeculativeDecodingSpec
|
37394
|
+
include Google::Apis::Core::Hashable
|
37395
|
+
|
37396
|
+
# Draft model speculation works by using the smaller model to generate candidate
|
37397
|
+
# tokens for speculative decoding.
|
37398
|
+
# Corresponds to the JSON property `draftModelSpeculation`
|
37399
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1SpeculativeDecodingSpecDraftModelSpeculation]
|
37400
|
+
attr_accessor :draft_model_speculation
|
37401
|
+
|
37402
|
+
# N-Gram speculation works by trying to find matching tokens in the previous
|
37403
|
+
# prompt sequence and use those as speculation for generating new tokens.
|
37404
|
+
# Corresponds to the JSON property `ngramSpeculation`
|
37405
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1SpeculativeDecodingSpecNgramSpeculation]
|
37406
|
+
attr_accessor :ngram_speculation
|
37407
|
+
|
37408
|
+
# The number of speculative tokens to generate at each step.
|
37409
|
+
# Corresponds to the JSON property `speculativeTokenCount`
|
37410
|
+
# @return [Fixnum]
|
37411
|
+
attr_accessor :speculative_token_count
|
37412
|
+
|
37413
|
+
def initialize(**args)
|
37414
|
+
update!(**args)
|
37415
|
+
end
|
37416
|
+
|
37417
|
+
# Update properties of this object
|
37418
|
+
def update!(**args)
|
37419
|
+
@draft_model_speculation = args[:draft_model_speculation] if args.key?(:draft_model_speculation)
|
37420
|
+
@ngram_speculation = args[:ngram_speculation] if args.key?(:ngram_speculation)
|
37421
|
+
@speculative_token_count = args[:speculative_token_count] if args.key?(:speculative_token_count)
|
37422
|
+
end
|
37423
|
+
end
|
37424
|
+
|
37425
|
+
# Draft model speculation works by using the smaller model to generate candidate
|
37426
|
+
# tokens for speculative decoding.
|
37427
|
+
class GoogleCloudAiplatformV1beta1SpeculativeDecodingSpecDraftModelSpeculation
|
37428
|
+
include Google::Apis::Core::Hashable
|
37429
|
+
|
37430
|
+
# Required. The resource name of the draft model.
|
37431
|
+
# Corresponds to the JSON property `draftModel`
|
37432
|
+
# @return [String]
|
37433
|
+
attr_accessor :draft_model
|
37434
|
+
|
37435
|
+
def initialize(**args)
|
37436
|
+
update!(**args)
|
37437
|
+
end
|
37438
|
+
|
37439
|
+
# Update properties of this object
|
37440
|
+
def update!(**args)
|
37441
|
+
@draft_model = args[:draft_model] if args.key?(:draft_model)
|
37442
|
+
end
|
37443
|
+
end
|
37444
|
+
|
37445
|
+
# N-Gram speculation works by trying to find matching tokens in the previous
|
37446
|
+
# prompt sequence and use those as speculation for generating new tokens.
|
37447
|
+
class GoogleCloudAiplatformV1beta1SpeculativeDecodingSpecNgramSpeculation
|
37448
|
+
include Google::Apis::Core::Hashable
|
37449
|
+
|
37450
|
+
# The number of last N input tokens used as ngram to search/match against the
|
37451
|
+
# previous prompt sequence. This is equal to the N in N-Gram. The default value
|
37452
|
+
# is 3 if not specified.
|
37453
|
+
# Corresponds to the JSON property `ngramSize`
|
37454
|
+
# @return [Fixnum]
|
37455
|
+
attr_accessor :ngram_size
|
37456
|
+
|
37457
|
+
def initialize(**args)
|
37458
|
+
update!(**args)
|
37459
|
+
end
|
37460
|
+
|
37461
|
+
# Update properties of this object
|
37462
|
+
def update!(**args)
|
37463
|
+
@ngram_size = args[:ngram_size] if args.key?(:ngram_size)
|
37464
|
+
end
|
37465
|
+
end
|
37466
|
+
|
36732
37467
|
# The speech generation config.
|
36733
37468
|
class GoogleCloudAiplatformV1beta1SpeechConfig
|
36734
37469
|
include Google::Apis::Core::Hashable
|
@@ -38454,6 +39189,12 @@ module Google
|
|
38454
39189
|
class GoogleCloudAiplatformV1beta1SupervisedTuningDataStats
|
38455
39190
|
include Google::Apis::Core::Hashable
|
38456
39191
|
|
39192
|
+
# Output only. For each index in `truncated_example_indices`, the user-facing
|
39193
|
+
# reason why the example was dropped. Must not include example itself.
|
39194
|
+
# Corresponds to the JSON property `droppedExampleReasons`
|
39195
|
+
# @return [Array<String>]
|
39196
|
+
attr_accessor :dropped_example_reasons
|
39197
|
+
|
38457
39198
|
# Output only. Number of billable characters in the tuning dataset.
|
38458
39199
|
# Corresponds to the JSON property `totalBillableCharacterCount`
|
38459
39200
|
# @return [Fixnum]
|
@@ -38464,7 +39205,9 @@ module Google
|
|
38464
39205
|
# @return [Fixnum]
|
38465
39206
|
attr_accessor :total_billable_token_count
|
38466
39207
|
|
38467
|
-
# The number of examples in the dataset that have been
|
39208
|
+
# Output only. The number of examples in the dataset that have been dropped. An
|
39209
|
+
# example can be dropped for reasons including: too many tokens, contains an
|
39210
|
+
# invalid image, contains too many images, etc.
|
38468
39211
|
# Corresponds to the JSON property `totalTruncatedExampleCount`
|
38469
39212
|
# @return [Fixnum]
|
38470
39213
|
attr_accessor :total_truncated_example_count
|
@@ -38474,7 +39217,8 @@ module Google
|
|
38474
39217
|
# @return [Fixnum]
|
38475
39218
|
attr_accessor :total_tuning_character_count
|
38476
39219
|
|
38477
|
-
# A partial sample of the indices (starting from 1) of the
|
39220
|
+
# Output only. A partial sample of the indices (starting from 1) of the dropped
|
39221
|
+
# examples.
|
38478
39222
|
# Corresponds to the JSON property `truncatedExampleIndices`
|
38479
39223
|
# @return [Array<Fixnum>]
|
38480
39224
|
attr_accessor :truncated_example_indices
|
@@ -38515,6 +39259,7 @@ module Google
|
|
38515
39259
|
|
38516
39260
|
# Update properties of this object
|
38517
39261
|
def update!(**args)
|
39262
|
+
@dropped_example_reasons = args[:dropped_example_reasons] if args.key?(:dropped_example_reasons)
|
38518
39263
|
@total_billable_character_count = args[:total_billable_character_count] if args.key?(:total_billable_character_count)
|
38519
39264
|
@total_billable_token_count = args[:total_billable_token_count] if args.key?(:total_billable_token_count)
|
38520
39265
|
@total_truncated_example_count = args[:total_truncated_example_count] if args.key?(:total_truncated_example_count)
|
@@ -39635,6 +40380,11 @@ module Google
|
|
39635
40380
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1FunctionCallingConfig]
|
39636
40381
|
attr_accessor :function_calling_config
|
39637
40382
|
|
40383
|
+
# Retrieval config.
|
40384
|
+
# Corresponds to the JSON property `retrievalConfig`
|
40385
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1RetrievalConfig]
|
40386
|
+
attr_accessor :retrieval_config
|
40387
|
+
|
39638
40388
|
def initialize(**args)
|
39639
40389
|
update!(**args)
|
39640
40390
|
end
|
@@ -39642,6 +40392,7 @@ module Google
|
|
39642
40392
|
# Update properties of this object
|
39643
40393
|
def update!(**args)
|
39644
40394
|
@function_calling_config = args[:function_calling_config] if args.key?(:function_calling_config)
|
40395
|
+
@retrieval_config = args[:retrieval_config] if args.key?(:retrieval_config)
|
39645
40396
|
end
|
39646
40397
|
end
|
39647
40398
|
|
@@ -41024,7 +41775,7 @@ module Google
|
|
41024
41775
|
end
|
41025
41776
|
end
|
41026
41777
|
|
41027
|
-
# The Model Registry Model and Online Prediction Endpoint
|
41778
|
+
# The Model Registry Model and Online Prediction Endpoint associated with this
|
41028
41779
|
# TuningJob.
|
41029
41780
|
class GoogleCloudAiplatformV1beta1TunedModel
|
41030
41781
|
include Google::Apis::Core::Hashable
|
@@ -41214,7 +41965,7 @@ module Google
|
|
41214
41965
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1SupervisedTuningSpec]
|
41215
41966
|
attr_accessor :supervised_tuning_spec
|
41216
41967
|
|
41217
|
-
# The Model Registry Model and Online Prediction Endpoint
|
41968
|
+
# The Model Registry Model and Online Prediction Endpoint associated with this
|
41218
41969
|
# TuningJob.
|
41219
41970
|
# Corresponds to the JSON property `tunedModel`
|
41220
41971
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1TunedModel]
|
@@ -43213,6 +43964,34 @@ module Google
|
|
43213
43964
|
end
|
43214
43965
|
end
|
43215
43966
|
|
43967
|
+
# An object that represents a latitude/longitude pair. This is expressed as a
|
43968
|
+
# pair of doubles to represent degrees latitude and degrees longitude. Unless
|
43969
|
+
# specified otherwise, this object must conform to the WGS84 standard. Values
|
43970
|
+
# must be within normalized ranges.
|
43971
|
+
class GoogleTypeLatLng
|
43972
|
+
include Google::Apis::Core::Hashable
|
43973
|
+
|
43974
|
+
# The latitude in degrees. It must be in the range [-90.0, +90.0].
|
43975
|
+
# Corresponds to the JSON property `latitude`
|
43976
|
+
# @return [Float]
|
43977
|
+
attr_accessor :latitude
|
43978
|
+
|
43979
|
+
# The longitude in degrees. It must be in the range [-180.0, +180.0].
|
43980
|
+
# Corresponds to the JSON property `longitude`
|
43981
|
+
# @return [Float]
|
43982
|
+
attr_accessor :longitude
|
43983
|
+
|
43984
|
+
def initialize(**args)
|
43985
|
+
update!(**args)
|
43986
|
+
end
|
43987
|
+
|
43988
|
+
# Update properties of this object
|
43989
|
+
def update!(**args)
|
43990
|
+
@latitude = args[:latitude] if args.key?(:latitude)
|
43991
|
+
@longitude = args[:longitude] if args.key?(:longitude)
|
43992
|
+
end
|
43993
|
+
end
|
43994
|
+
|
43216
43995
|
# Represents an amount of money with its currency type.
|
43217
43996
|
class GoogleTypeMoney
|
43218
43997
|
include Google::Apis::Core::Hashable
|