google-apis-aiplatform_v1beta1 0.36.0 → 0.38.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/CHANGELOG.md +9 -0
- data/lib/google/apis/aiplatform_v1beta1/classes.rb +1226 -73
- data/lib/google/apis/aiplatform_v1beta1/gem_version.rb +3 -3
- data/lib/google/apis/aiplatform_v1beta1/representations.rb +514 -0
- data/lib/google/apis/aiplatform_v1beta1/service.rb +193 -4
- metadata +4 -7
@@ -41,6 +41,11 @@ module Google
|
|
41
41
|
# @return [Array<String>]
|
42
42
|
attr_accessor :rai_media_filtered_reasons
|
43
43
|
|
44
|
+
# List of videos, used to align naming with the external response.
|
45
|
+
# Corresponds to the JSON property `videos`
|
46
|
+
# @return [Array<Google::Apis::AiplatformV1beta1::CloudAiLargeModelsVisionGenerateVideoResponseVideo>]
|
47
|
+
attr_accessor :videos
|
48
|
+
|
44
49
|
def initialize(**args)
|
45
50
|
update!(**args)
|
46
51
|
end
|
@@ -50,6 +55,38 @@ module Google
|
|
50
55
|
@generated_samples = args[:generated_samples] if args.key?(:generated_samples)
|
51
56
|
@rai_media_filtered_count = args[:rai_media_filtered_count] if args.key?(:rai_media_filtered_count)
|
52
57
|
@rai_media_filtered_reasons = args[:rai_media_filtered_reasons] if args.key?(:rai_media_filtered_reasons)
|
58
|
+
@videos = args[:videos] if args.key?(:videos)
|
59
|
+
end
|
60
|
+
end
|
61
|
+
|
62
|
+
#
|
63
|
+
class CloudAiLargeModelsVisionGenerateVideoResponseVideo
|
64
|
+
include Google::Apis::Core::Hashable
|
65
|
+
|
66
|
+
# Base64 encoded bytes string representing the video.
|
67
|
+
# Corresponds to the JSON property `bytesBase64Encoded`
|
68
|
+
# @return [String]
|
69
|
+
attr_accessor :bytes_base64_encoded
|
70
|
+
|
71
|
+
# Cloud Storage URI where the generated video is written.
|
72
|
+
# Corresponds to the JSON property `gcsUri`
|
73
|
+
# @return [String]
|
74
|
+
attr_accessor :gcs_uri
|
75
|
+
|
76
|
+
# The MIME type of the content of the video. - video/mp4
|
77
|
+
# Corresponds to the JSON property `mimeType`
|
78
|
+
# @return [String]
|
79
|
+
attr_accessor :mime_type
|
80
|
+
|
81
|
+
def initialize(**args)
|
82
|
+
update!(**args)
|
83
|
+
end
|
84
|
+
|
85
|
+
# Update properties of this object
|
86
|
+
def update!(**args)
|
87
|
+
@bytes_base64_encoded = args[:bytes_base64_encoded] if args.key?(:bytes_base64_encoded)
|
88
|
+
@gcs_uri = args[:gcs_uri] if args.key?(:gcs_uri)
|
89
|
+
@mime_type = args[:mime_type] if args.key?(:mime_type)
|
53
90
|
end
|
54
91
|
end
|
55
92
|
|
@@ -450,6 +487,11 @@ module Google
|
|
450
487
|
# @return [String]
|
451
488
|
attr_accessor :encoding
|
452
489
|
|
490
|
+
# Text/Expanded text input for Help Me Write.
|
491
|
+
# Corresponds to the JSON property `text`
|
492
|
+
# @return [String]
|
493
|
+
attr_accessor :text
|
494
|
+
|
453
495
|
# Path to another storage (typically Google Cloud Storage).
|
454
496
|
# Corresponds to the JSON property `uri`
|
455
497
|
# @return [String]
|
@@ -469,12 +511,13 @@ module Google
|
|
469
511
|
def update!(**args)
|
470
512
|
@encoded_video = args[:encoded_video] if args.key?(:encoded_video)
|
471
513
|
@encoding = args[:encoding] if args.key?(:encoding)
|
514
|
+
@text = args[:text] if args.key?(:text)
|
472
515
|
@uri = args[:uri] if args.key?(:uri)
|
473
516
|
@video = args[:video] if args.key?(:video)
|
474
517
|
end
|
475
518
|
end
|
476
519
|
|
477
|
-
# Create API error message for Vertex Pipeline.
|
520
|
+
# Create API error message for Vertex Pipeline.
|
478
521
|
class CloudAiPlatformCommonCreatePipelineJobApiErrorDetail
|
479
522
|
include Google::Apis::Core::Hashable
|
480
523
|
|
@@ -840,7 +883,8 @@ module Google
|
|
840
883
|
end
|
841
884
|
end
|
842
885
|
|
843
|
-
# The generic reusable api auth config.
|
886
|
+
# The generic reusable api auth config. Deprecated. Please use AuthConfig (
|
887
|
+
# google/cloud/aiplatform/master/auth.proto) instead.
|
844
888
|
class GoogleCloudAiplatformV1beta1ApiAuth
|
845
889
|
include Google::Apis::Core::Hashable
|
846
890
|
|
@@ -1468,22 +1512,22 @@ module Google
|
|
1468
1512
|
class GoogleCloudAiplatformV1beta1AutomaticResources
|
1469
1513
|
include Google::Apis::Core::Hashable
|
1470
1514
|
|
1471
|
-
# Immutable. The maximum number of replicas
|
1472
|
-
#
|
1473
|
-
#
|
1474
|
-
#
|
1475
|
-
#
|
1476
|
-
#
|
1477
|
-
#
|
1478
|
-
#
|
1515
|
+
# Immutable. The maximum number of replicas that may be deployed on when the
|
1516
|
+
# traffic against it increases. If the requested value is too large, the
|
1517
|
+
# deployment will error, but if deployment succeeds then the ability to scale to
|
1518
|
+
# that many replicas is guaranteed (barring service outages). If traffic
|
1519
|
+
# increases beyond what its replicas at maximum may handle, a portion of the
|
1520
|
+
# traffic will be dropped. If this value is not provided, no upper bound for
|
1521
|
+
# scaling under heavy traffic will be assumed, though Vertex AI may be unable to
|
1522
|
+
# scale beyond certain replica number.
|
1479
1523
|
# Corresponds to the JSON property `maxReplicaCount`
|
1480
1524
|
# @return [Fixnum]
|
1481
1525
|
attr_accessor :max_replica_count
|
1482
1526
|
|
1483
|
-
# Immutable. The minimum number of replicas
|
1484
|
-
#
|
1485
|
-
#
|
1486
|
-
#
|
1527
|
+
# Immutable. The minimum number of replicas that will be always deployed on. If
|
1528
|
+
# traffic against it increases, it may dynamically be deployed onto more
|
1529
|
+
# replicas up to max_replica_count, and as traffic decreases, some of these
|
1530
|
+
# extra replicas may be freed. If the requested value is too large, the
|
1487
1531
|
# deployment will error.
|
1488
1532
|
# Corresponds to the JSON property `minReplicaCount`
|
1489
1533
|
# @return [Fixnum]
|
@@ -1500,6 +1544,48 @@ module Google
|
|
1500
1544
|
end
|
1501
1545
|
end
|
1502
1546
|
|
1547
|
+
# The configs for autorater. This is applicable to both EvaluateInstances and
|
1548
|
+
# EvaluateDataset.
|
1549
|
+
class GoogleCloudAiplatformV1beta1AutoraterConfig
|
1550
|
+
include Google::Apis::Core::Hashable
|
1551
|
+
|
1552
|
+
# Optional. The fully qualified name of the publisher model or tuned autorater
|
1553
|
+
# endpoint to use. Publisher model format: `projects/`project`/locations/`
|
1554
|
+
# location`/publishers/*/models/*` Tuned model endpoint format: `projects/`
|
1555
|
+
# project`/locations/`location`/endpoints/`endpoint``
|
1556
|
+
# Corresponds to the JSON property `autoraterModel`
|
1557
|
+
# @return [String]
|
1558
|
+
attr_accessor :autorater_model
|
1559
|
+
|
1560
|
+
# Optional. Whether to flip the candidate and baseline responses. This is only
|
1561
|
+
# applicable to the pairwise metric. If enabled, also provide PairwiseMetricSpec.
|
1562
|
+
# candidate_response_field_name and PairwiseMetricSpec.
|
1563
|
+
# baseline_response_field_name. When rendering PairwiseMetricSpec.
|
1564
|
+
# metric_prompt_template, the candidate and baseline fields will be flipped for
|
1565
|
+
# half of the samples to reduce bias.
|
1566
|
+
# Corresponds to the JSON property `flipEnabled`
|
1567
|
+
# @return [Boolean]
|
1568
|
+
attr_accessor :flip_enabled
|
1569
|
+
alias_method :flip_enabled?, :flip_enabled
|
1570
|
+
|
1571
|
+
# Optional. Number of samples for each instance in the dataset. If not specified,
|
1572
|
+
# the default is 4. Minimum value is 1, maximum value is 32.
|
1573
|
+
# Corresponds to the JSON property `samplingCount`
|
1574
|
+
# @return [Fixnum]
|
1575
|
+
attr_accessor :sampling_count
|
1576
|
+
|
1577
|
+
def initialize(**args)
|
1578
|
+
update!(**args)
|
1579
|
+
end
|
1580
|
+
|
1581
|
+
# Update properties of this object
|
1582
|
+
def update!(**args)
|
1583
|
+
@autorater_model = args[:autorater_model] if args.key?(:autorater_model)
|
1584
|
+
@flip_enabled = args[:flip_enabled] if args.key?(:flip_enabled)
|
1585
|
+
@sampling_count = args[:sampling_count] if args.key?(:sampling_count)
|
1586
|
+
end
|
1587
|
+
end
|
1588
|
+
|
1503
1589
|
# The metric specification that defines the target resource utilization (CPU
|
1504
1590
|
# utilization, accelerator's duty cycle, and so on) for calculating the desired
|
1505
1591
|
# replica count.
|
@@ -2756,6 +2842,13 @@ module Google
|
|
2756
2842
|
# @return [String]
|
2757
2843
|
attr_accessor :data
|
2758
2844
|
|
2845
|
+
# Optional. Display name of the blob. Used to provide a label or filename to
|
2846
|
+
# distinguish blobs. This field is only returned in PromptMessage for prompt
|
2847
|
+
# management. It is not currently used in the Gemini GenerateContent calls.
|
2848
|
+
# Corresponds to the JSON property `displayName`
|
2849
|
+
# @return [String]
|
2850
|
+
attr_accessor :display_name
|
2851
|
+
|
2759
2852
|
# Required. The IANA standard MIME type of the source data.
|
2760
2853
|
# Corresponds to the JSON property `mimeType`
|
2761
2854
|
# @return [String]
|
@@ -2768,6 +2861,7 @@ module Google
|
|
2768
2861
|
# Update properties of this object
|
2769
2862
|
def update!(**args)
|
2770
2863
|
@data = args[:data] if args.key?(:data)
|
2864
|
+
@display_name = args[:display_name] if args.key?(:display_name)
|
2771
2865
|
@mime_type = args[:mime_type] if args.key?(:mime_type)
|
2772
2866
|
end
|
2773
2867
|
end
|
@@ -2852,7 +2946,7 @@ module Google
|
|
2852
2946
|
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1Content>]
|
2853
2947
|
attr_accessor :contents
|
2854
2948
|
|
2855
|
-
# Output only.
|
2949
|
+
# Output only. Creation time of the cache entry.
|
2856
2950
|
# Corresponds to the JSON property `createTime`
|
2857
2951
|
# @return [String]
|
2858
2952
|
attr_accessor :create_time
|
@@ -2869,8 +2963,9 @@ module Google
|
|
2869
2963
|
# @return [String]
|
2870
2964
|
attr_accessor :expire_time
|
2871
2965
|
|
2872
|
-
# Immutable. The name of the
|
2873
|
-
# projects/`
|
2966
|
+
# Immutable. The name of the `Model` to use for cached content. Currently, only
|
2967
|
+
# the published Gemini base models are supported, in the form of projects/`PROJECT`/
|
2968
|
+
# locations/`LOCATION`/publishers/google/models/`MODEL`
|
2874
2969
|
# Corresponds to the JSON property `model`
|
2875
2970
|
# @return [String]
|
2876
2971
|
attr_accessor :model
|
@@ -4160,6 +4255,11 @@ module Google
|
|
4160
4255
|
class GoogleCloudAiplatformV1beta1CountTokensResponse
|
4161
4256
|
include Google::Apis::Core::Hashable
|
4162
4257
|
|
4258
|
+
# Output only. List of modalities that were processed in the request input.
|
4259
|
+
# Corresponds to the JSON property `promptTokensDetails`
|
4260
|
+
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ModalityTokenCount>]
|
4261
|
+
attr_accessor :prompt_tokens_details
|
4262
|
+
|
4163
4263
|
# The total number of billable characters counted across all instances from the
|
4164
4264
|
# request.
|
4165
4265
|
# Corresponds to the JSON property `totalBillableCharacters`
|
@@ -4177,6 +4277,7 @@ module Google
|
|
4177
4277
|
|
4178
4278
|
# Update properties of this object
|
4179
4279
|
def update!(**args)
|
4280
|
+
@prompt_tokens_details = args[:prompt_tokens_details] if args.key?(:prompt_tokens_details)
|
4180
4281
|
@total_billable_characters = args[:total_billable_characters] if args.key?(:total_billable_characters)
|
4181
4282
|
@total_tokens = args[:total_tokens] if args.key?(:total_tokens)
|
4182
4283
|
end
|
@@ -5761,7 +5862,9 @@ module Google
|
|
5761
5862
|
# @return [String]
|
5762
5863
|
attr_accessor :model_reference
|
5763
5864
|
|
5764
|
-
# Output only. Identifier. The resource name of the DatasetVersion.
|
5865
|
+
# Output only. Identifier. The resource name of the DatasetVersion. Format: `
|
5866
|
+
# projects/`project`/locations/`location`/datasets/`dataset`/datasetVersions/`
|
5867
|
+
# dataset_version``
|
5765
5868
|
# Corresponds to the JSON property `name`
|
5766
5869
|
# @return [String]
|
5767
5870
|
attr_accessor :name
|
@@ -5802,8 +5905,8 @@ module Google
|
|
5802
5905
|
end
|
5803
5906
|
end
|
5804
5907
|
|
5805
|
-
# A description of resources that are dedicated to a DeployedModel
|
5806
|
-
# need a higher degree of manual configuration.
|
5908
|
+
# A description of resources that are dedicated to a DeployedModel or
|
5909
|
+
# DeployedIndex, and that need a higher degree of manual configuration.
|
5807
5910
|
class GoogleCloudAiplatformV1beta1DedicatedResources
|
5808
5911
|
include Google::Apis::Core::Hashable
|
5809
5912
|
|
@@ -5829,36 +5932,33 @@ module Google
|
|
5829
5932
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1MachineSpec]
|
5830
5933
|
attr_accessor :machine_spec
|
5831
5934
|
|
5832
|
-
# Immutable. The maximum number of replicas
|
5833
|
-
#
|
5834
|
-
#
|
5835
|
-
#
|
5836
|
-
#
|
5837
|
-
#
|
5838
|
-
#
|
5839
|
-
#
|
5840
|
-
#
|
5841
|
-
#
|
5842
|
-
# selected machine type).
|
5935
|
+
# Immutable. The maximum number of replicas that may be deployed on when the
|
5936
|
+
# traffic against it increases. If the requested value is too large, the
|
5937
|
+
# deployment will error, but if deployment succeeds then the ability to scale to
|
5938
|
+
# that many replicas is guaranteed (barring service outages). If traffic
|
5939
|
+
# increases beyond what its replicas at maximum may handle, a portion of the
|
5940
|
+
# traffic will be dropped. If this value is not provided, will use
|
5941
|
+
# min_replica_count as the default value. The value of this field impacts the
|
5942
|
+
# charge against Vertex CPU and GPU quotas. Specifically, you will be charged
|
5943
|
+
# for (max_replica_count * number of cores in the selected machine type) and (
|
5944
|
+
# max_replica_count * number of GPUs per replica in the selected machine type).
|
5843
5945
|
# Corresponds to the JSON property `maxReplicaCount`
|
5844
5946
|
# @return [Fixnum]
|
5845
5947
|
attr_accessor :max_replica_count
|
5846
5948
|
|
5847
|
-
# Required. Immutable. The minimum number of machine replicas
|
5848
|
-
#
|
5849
|
-
#
|
5850
|
-
#
|
5851
|
-
# be freed.
|
5949
|
+
# Required. Immutable. The minimum number of machine replicas that will be
|
5950
|
+
# always deployed on. This value must be greater than or equal to 1. If traffic
|
5951
|
+
# increases, it may dynamically be deployed onto more replicas, and as traffic
|
5952
|
+
# decreases, some of these extra replicas may be freed.
|
5852
5953
|
# Corresponds to the JSON property `minReplicaCount`
|
5853
5954
|
# @return [Fixnum]
|
5854
5955
|
attr_accessor :min_replica_count
|
5855
5956
|
|
5856
5957
|
# Optional. Number of required available replicas for the deployment to succeed.
|
5857
|
-
# This field is only needed when partial
|
5858
|
-
#
|
5859
|
-
#
|
5860
|
-
#
|
5861
|
-
# be min_replica_count.
|
5958
|
+
# This field is only needed when partial deployment/mutation is desired. If set,
|
5959
|
+
# the deploy/mutate operation will succeed once available_replica_count reaches
|
5960
|
+
# required_replica_count, and the rest of the replicas will be retried. If not
|
5961
|
+
# set, the default required_replica_count will be min_replica_count.
|
5862
5962
|
# Corresponds to the JSON property `requiredReplicaCount`
|
5863
5963
|
# @return [Fixnum]
|
5864
5964
|
attr_accessor :required_replica_count
|
@@ -6268,8 +6368,8 @@ module Google
|
|
6268
6368
|
attr_accessor :accept_eula
|
6269
6369
|
alias_method :accept_eula?, :accept_eula
|
6270
6370
|
|
6271
|
-
# A description of resources that are dedicated to a DeployedModel
|
6272
|
-
# need a higher degree of manual configuration.
|
6371
|
+
# A description of resources that are dedicated to a DeployedModel or
|
6372
|
+
# DeployedIndex, and that need a higher degree of manual configuration.
|
6273
6373
|
# Corresponds to the JSON property `dedicatedResources`
|
6274
6374
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DedicatedResources]
|
6275
6375
|
attr_accessor :dedicated_resources
|
@@ -6286,9 +6386,11 @@ module Google
|
|
6286
6386
|
# @return [String]
|
6287
6387
|
attr_accessor :hugging_face_access_token
|
6288
6388
|
|
6289
|
-
# Required. The
|
6290
|
-
#
|
6291
|
-
#
|
6389
|
+
# Required. The model to deploy. Format: 1. `publishers/`publisher`/models/`
|
6390
|
+
# publisher_model`@`version_id``, or `publishers/hf-`hugging-face-author`/models/
|
6391
|
+
# `hugging-face-model-name`@001`. 2. Hugging Face model ID like `google/gemma-2-
|
6392
|
+
# 2b-it`. 3. Custom model Google Cloud Storage URI like `gs://bucket`. 4. Custom
|
6393
|
+
# model zip file like `https://abc.com/a.zip`.
|
6292
6394
|
# Corresponds to the JSON property `model`
|
6293
6395
|
# @return [String]
|
6294
6396
|
attr_accessor :model
|
@@ -6314,6 +6416,165 @@ module Google
|
|
6314
6416
|
end
|
6315
6417
|
end
|
6316
6418
|
|
6419
|
+
# Request message for ModelGardenService.Deploy.
|
6420
|
+
class GoogleCloudAiplatformV1beta1DeployRequest
|
6421
|
+
include Google::Apis::Core::Hashable
|
6422
|
+
|
6423
|
+
# The deploy config to use for the deployment.
|
6424
|
+
# Corresponds to the JSON property `deployConfig`
|
6425
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DeployRequestDeployConfig]
|
6426
|
+
attr_accessor :deploy_config
|
6427
|
+
|
6428
|
+
# The endpoint config to use for the deployment.
|
6429
|
+
# Corresponds to the JSON property `endpointConfig`
|
6430
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DeployRequestEndpointConfig]
|
6431
|
+
attr_accessor :endpoint_config
|
6432
|
+
|
6433
|
+
# The Hugging Face model to deploy. Format: Hugging Face model ID like `google/
|
6434
|
+
# gemma-2-2b-it`.
|
6435
|
+
# Corresponds to the JSON property `huggingFaceModelId`
|
6436
|
+
# @return [String]
|
6437
|
+
attr_accessor :hugging_face_model_id
|
6438
|
+
|
6439
|
+
# The model config to use for the deployment.
|
6440
|
+
# Corresponds to the JSON property `modelConfig`
|
6441
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DeployRequestModelConfig]
|
6442
|
+
attr_accessor :model_config
|
6443
|
+
|
6444
|
+
# The Model Garden model to deploy. Format: `publishers/`publisher`/models/`
|
6445
|
+
# publisher_model`@`version_id``, or `publishers/hf-`hugging-face-author`/models/
|
6446
|
+
# `hugging-face-model-name`@001`.
|
6447
|
+
# Corresponds to the JSON property `publisherModelName`
|
6448
|
+
# @return [String]
|
6449
|
+
attr_accessor :publisher_model_name
|
6450
|
+
|
6451
|
+
def initialize(**args)
|
6452
|
+
update!(**args)
|
6453
|
+
end
|
6454
|
+
|
6455
|
+
# Update properties of this object
|
6456
|
+
def update!(**args)
|
6457
|
+
@deploy_config = args[:deploy_config] if args.key?(:deploy_config)
|
6458
|
+
@endpoint_config = args[:endpoint_config] if args.key?(:endpoint_config)
|
6459
|
+
@hugging_face_model_id = args[:hugging_face_model_id] if args.key?(:hugging_face_model_id)
|
6460
|
+
@model_config = args[:model_config] if args.key?(:model_config)
|
6461
|
+
@publisher_model_name = args[:publisher_model_name] if args.key?(:publisher_model_name)
|
6462
|
+
end
|
6463
|
+
end
|
6464
|
+
|
6465
|
+
# The deploy config to use for the deployment.
|
6466
|
+
class GoogleCloudAiplatformV1beta1DeployRequestDeployConfig
|
6467
|
+
include Google::Apis::Core::Hashable
|
6468
|
+
|
6469
|
+
# A description of resources that are dedicated to a DeployedModel or
|
6470
|
+
# DeployedIndex, and that need a higher degree of manual configuration.
|
6471
|
+
# Corresponds to the JSON property `dedicatedResources`
|
6472
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DedicatedResources]
|
6473
|
+
attr_accessor :dedicated_resources
|
6474
|
+
|
6475
|
+
# Optional. If true, enable the QMT fast tryout feature for this model if
|
6476
|
+
# possible.
|
6477
|
+
# Corresponds to the JSON property `fastTryoutEnabled`
|
6478
|
+
# @return [Boolean]
|
6479
|
+
attr_accessor :fast_tryout_enabled
|
6480
|
+
alias_method :fast_tryout_enabled?, :fast_tryout_enabled
|
6481
|
+
|
6482
|
+
def initialize(**args)
|
6483
|
+
update!(**args)
|
6484
|
+
end
|
6485
|
+
|
6486
|
+
# Update properties of this object
|
6487
|
+
def update!(**args)
|
6488
|
+
@dedicated_resources = args[:dedicated_resources] if args.key?(:dedicated_resources)
|
6489
|
+
@fast_tryout_enabled = args[:fast_tryout_enabled] if args.key?(:fast_tryout_enabled)
|
6490
|
+
end
|
6491
|
+
end
|
6492
|
+
|
6493
|
+
# The endpoint config to use for the deployment.
|
6494
|
+
class GoogleCloudAiplatformV1beta1DeployRequestEndpointConfig
|
6495
|
+
include Google::Apis::Core::Hashable
|
6496
|
+
|
6497
|
+
# Optional. If true, the endpoint will be exposed through a dedicated DNS [
|
6498
|
+
# Endpoint.dedicated_endpoint_dns]. Your request to the dedicated DNS will be
|
6499
|
+
# isolated from other users' traffic and will have better performance and
|
6500
|
+
# reliability. Note: Once you enable a dedicated endpoint, you won't be able to
|
6501
|
+
# send requests to the shared DNS `region`-aiplatform.googleapis.com. The
|
6502
|
+
# limitations will be removed soon.
|
6503
|
+
# Corresponds to the JSON property `dedicatedEndpointEnabled`
|
6504
|
+
# @return [Boolean]
|
6505
|
+
attr_accessor :dedicated_endpoint_enabled
|
6506
|
+
alias_method :dedicated_endpoint_enabled?, :dedicated_endpoint_enabled
|
6507
|
+
|
6508
|
+
# Optional. The user-specified display name of the endpoint. If not set, a
|
6509
|
+
# default name will be used.
|
6510
|
+
# Corresponds to the JSON property `endpointDisplayName`
|
6511
|
+
# @return [String]
|
6512
|
+
attr_accessor :endpoint_display_name
|
6513
|
+
|
6514
|
+
def initialize(**args)
|
6515
|
+
update!(**args)
|
6516
|
+
end
|
6517
|
+
|
6518
|
+
# Update properties of this object
|
6519
|
+
def update!(**args)
|
6520
|
+
@dedicated_endpoint_enabled = args[:dedicated_endpoint_enabled] if args.key?(:dedicated_endpoint_enabled)
|
6521
|
+
@endpoint_display_name = args[:endpoint_display_name] if args.key?(:endpoint_display_name)
|
6522
|
+
end
|
6523
|
+
end
|
6524
|
+
|
6525
|
+
# The model config to use for the deployment.
|
6526
|
+
class GoogleCloudAiplatformV1beta1DeployRequestModelConfig
|
6527
|
+
include Google::Apis::Core::Hashable
|
6528
|
+
|
6529
|
+
# Optional. Whether the user accepts the End User License Agreement (EULA) for
|
6530
|
+
# the model.
|
6531
|
+
# Corresponds to the JSON property `acceptEula`
|
6532
|
+
# @return [Boolean]
|
6533
|
+
attr_accessor :accept_eula
|
6534
|
+
alias_method :accept_eula?, :accept_eula
|
6535
|
+
|
6536
|
+
# Specification of a container for serving predictions. Some fields in this
|
6537
|
+
# message correspond to fields in the [Kubernetes Container v1 core
|
6538
|
+
# specification](https://kubernetes.io/docs/reference/generated/kubernetes-api/
|
6539
|
+
# v1.23/#container-v1-core).
|
6540
|
+
# Corresponds to the JSON property `containerSpec`
|
6541
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ModelContainerSpec]
|
6542
|
+
attr_accessor :container_spec
|
6543
|
+
|
6544
|
+
# Optional. The Hugging Face read access token used to access the model
|
6545
|
+
# artifacts of gated models.
|
6546
|
+
# Corresponds to the JSON property `huggingFaceAccessToken`
|
6547
|
+
# @return [String]
|
6548
|
+
attr_accessor :hugging_face_access_token
|
6549
|
+
|
6550
|
+
# Optional. If true, the model will deploy with a cached version instead of
|
6551
|
+
# directly downloading the model artifacts from Hugging Face. This is suitable
|
6552
|
+
# for VPC-SC users with limited internet access.
|
6553
|
+
# Corresponds to the JSON property `huggingFaceCacheEnabled`
|
6554
|
+
# @return [Boolean]
|
6555
|
+
attr_accessor :hugging_face_cache_enabled
|
6556
|
+
alias_method :hugging_face_cache_enabled?, :hugging_face_cache_enabled
|
6557
|
+
|
6558
|
+
# Optional. The user-specified display name of the uploaded model. If not set, a
|
6559
|
+
# default name will be used.
|
6560
|
+
# Corresponds to the JSON property `modelDisplayName`
|
6561
|
+
# @return [String]
|
6562
|
+
attr_accessor :model_display_name
|
6563
|
+
|
6564
|
+
def initialize(**args)
|
6565
|
+
update!(**args)
|
6566
|
+
end
|
6567
|
+
|
6568
|
+
# Update properties of this object
|
6569
|
+
def update!(**args)
|
6570
|
+
@accept_eula = args[:accept_eula] if args.key?(:accept_eula)
|
6571
|
+
@container_spec = args[:container_spec] if args.key?(:container_spec)
|
6572
|
+
@hugging_face_access_token = args[:hugging_face_access_token] if args.key?(:hugging_face_access_token)
|
6573
|
+
@hugging_face_cache_enabled = args[:hugging_face_cache_enabled] if args.key?(:hugging_face_cache_enabled)
|
6574
|
+
@model_display_name = args[:model_display_name] if args.key?(:model_display_name)
|
6575
|
+
end
|
6576
|
+
end
|
6577
|
+
|
6317
6578
|
# Runtime operation information for SolverService.DeploySolver.
|
6318
6579
|
class GoogleCloudAiplatformV1beta1DeploySolverOperationMetadata
|
6319
6580
|
include Google::Apis::Core::Hashable
|
@@ -6349,8 +6610,8 @@ module Google
|
|
6349
6610
|
# @return [String]
|
6350
6611
|
attr_accessor :create_time
|
6351
6612
|
|
6352
|
-
# A description of resources that are dedicated to a DeployedModel
|
6353
|
-
# need a higher degree of manual configuration.
|
6613
|
+
# A description of resources that are dedicated to a DeployedModel or
|
6614
|
+
# DeployedIndex, and that need a higher degree of manual configuration.
|
6354
6615
|
# Corresponds to the JSON property `dedicatedResources`
|
6355
6616
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DedicatedResources]
|
6356
6617
|
attr_accessor :dedicated_resources
|
@@ -6562,8 +6823,8 @@ module Google
|
|
6562
6823
|
# @return [String]
|
6563
6824
|
attr_accessor :create_time
|
6564
6825
|
|
6565
|
-
# A description of resources that are dedicated to a DeployedModel
|
6566
|
-
# need a higher degree of manual configuration.
|
6826
|
+
# A description of resources that are dedicated to a DeployedModel or
|
6827
|
+
# DeployedIndex, and that need a higher degree of manual configuration.
|
6567
6828
|
# Corresponds to the JSON property `dedicatedResources`
|
6568
6829
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DedicatedResources]
|
6569
6830
|
attr_accessor :dedicated_resources
|
@@ -6639,6 +6900,11 @@ module Google
|
|
6639
6900
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1PrivateEndpoints]
|
6640
6901
|
attr_accessor :private_endpoints
|
6641
6902
|
|
6903
|
+
# Configuration for rolling deployments.
|
6904
|
+
# Corresponds to the JSON property `rolloutOptions`
|
6905
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1RolloutOptions]
|
6906
|
+
attr_accessor :rollout_options
|
6907
|
+
|
6642
6908
|
# The service account that the DeployedModel's container runs as. Specify the
|
6643
6909
|
# email address of the service account. If this service account is not specified,
|
6644
6910
|
# the container runs as a service account that doesn't have access to the
|
@@ -6655,6 +6921,11 @@ module Google
|
|
6655
6921
|
# @return [String]
|
6656
6922
|
attr_accessor :shared_resources
|
6657
6923
|
|
6924
|
+
# Configuration for Speculative Decoding.
|
6925
|
+
# Corresponds to the JSON property `speculativeDecodingSpec`
|
6926
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1SpeculativeDecodingSpec]
|
6927
|
+
attr_accessor :speculative_decoding_spec
|
6928
|
+
|
6658
6929
|
# Runtime status of the deployed model.
|
6659
6930
|
# Corresponds to the JSON property `status`
|
6660
6931
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DeployedModelStatus]
|
@@ -6685,8 +6956,10 @@ module Google
|
|
6685
6956
|
@model = args[:model] if args.key?(:model)
|
6686
6957
|
@model_version_id = args[:model_version_id] if args.key?(:model_version_id)
|
6687
6958
|
@private_endpoints = args[:private_endpoints] if args.key?(:private_endpoints)
|
6959
|
+
@rollout_options = args[:rollout_options] if args.key?(:rollout_options)
|
6688
6960
|
@service_account = args[:service_account] if args.key?(:service_account)
|
6689
6961
|
@shared_resources = args[:shared_resources] if args.key?(:shared_resources)
|
6962
|
+
@speculative_decoding_spec = args[:speculative_decoding_spec] if args.key?(:speculative_decoding_spec)
|
6690
6963
|
@status = args[:status] if args.key?(:status)
|
6691
6964
|
@system_labels = args[:system_labels] if args.key?(:system_labels)
|
6692
6965
|
end
|
@@ -6758,8 +7031,8 @@ module Google
|
|
6758
7031
|
# @return [String]
|
6759
7032
|
attr_accessor :create_time
|
6760
7033
|
|
6761
|
-
# A description of resources that are dedicated to a DeployedModel
|
6762
|
-
# need a higher degree of manual configuration.
|
7034
|
+
# A description of resources that are dedicated to a DeployedModel or
|
7035
|
+
# DeployedIndex, and that need a higher degree of manual configuration.
|
6763
7036
|
# Corresponds to the JSON property `dedicatedResources`
|
6764
7037
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DedicatedResources]
|
6765
7038
|
attr_accessor :dedicated_resources
|
@@ -7241,6 +7514,11 @@ module Google
|
|
7241
7514
|
# @return [String]
|
7242
7515
|
attr_accessor :etag
|
7243
7516
|
|
7517
|
+
# Configuration for GenAiAdvancedFeatures.
|
7518
|
+
# Corresponds to the JSON property `genAiAdvancedFeaturesConfig`
|
7519
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GenAiAdvancedFeaturesConfig]
|
7520
|
+
attr_accessor :gen_ai_advanced_features_config
|
7521
|
+
|
7244
7522
|
# The labels with user-defined metadata to organize your Endpoints. Label keys
|
7245
7523
|
# and values can be no longer than 64 characters (Unicode codepoints), can only
|
7246
7524
|
# contain lowercase letters, numeric characters, underscores and dashes.
|
@@ -7327,6 +7605,7 @@ module Google
|
|
7327
7605
|
@enable_private_service_connect = args[:enable_private_service_connect] if args.key?(:enable_private_service_connect)
|
7328
7606
|
@encryption_spec = args[:encryption_spec] if args.key?(:encryption_spec)
|
7329
7607
|
@etag = args[:etag] if args.key?(:etag)
|
7608
|
+
@gen_ai_advanced_features_config = args[:gen_ai_advanced_features_config] if args.key?(:gen_ai_advanced_features_config)
|
7330
7609
|
@labels = args[:labels] if args.key?(:labels)
|
7331
7610
|
@model_deployment_monitoring_job = args[:model_deployment_monitoring_job] if args.key?(:model_deployment_monitoring_job)
|
7332
7611
|
@name = args[:name] if args.key?(:name)
|
@@ -7340,6 +7619,20 @@ module Google
|
|
7340
7619
|
end
|
7341
7620
|
end
|
7342
7621
|
|
7622
|
+
# Tool to search public web data, powered by Vertex AI Search and Sec4
|
7623
|
+
# compliance.
|
7624
|
+
class GoogleCloudAiplatformV1beta1EnterpriseWebSearch
|
7625
|
+
include Google::Apis::Core::Hashable
|
7626
|
+
|
7627
|
+
def initialize(**args)
|
7628
|
+
update!(**args)
|
7629
|
+
end
|
7630
|
+
|
7631
|
+
# Update properties of this object
|
7632
|
+
def update!(**args)
|
7633
|
+
end
|
7634
|
+
end
|
7635
|
+
|
7343
7636
|
# Selector for entityId. Getting ids from the given source.
|
7344
7637
|
class GoogleCloudAiplatformV1beta1EntityIdSelector
|
7345
7638
|
include Google::Apis::Core::Hashable
|
@@ -7554,10 +7847,54 @@ module Google
|
|
7554
7847
|
end
|
7555
7848
|
end
|
7556
7849
|
|
7850
|
+
# Request message for EvaluationService.EvaluateDataset.
|
7851
|
+
class GoogleCloudAiplatformV1beta1EvaluateDatasetRequest
|
7852
|
+
include Google::Apis::Core::Hashable
|
7853
|
+
|
7854
|
+
# The configs for autorater. This is applicable to both EvaluateInstances and
|
7855
|
+
# EvaluateDataset.
|
7856
|
+
# Corresponds to the JSON property `autoraterConfig`
|
7857
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1AutoraterConfig]
|
7858
|
+
attr_accessor :autorater_config
|
7859
|
+
|
7860
|
+
# The dataset used for evaluation.
|
7861
|
+
# Corresponds to the JSON property `dataset`
|
7862
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1EvaluationDataset]
|
7863
|
+
attr_accessor :dataset
|
7864
|
+
|
7865
|
+
# Required. The metrics used for evaluation.
|
7866
|
+
# Corresponds to the JSON property `metrics`
|
7867
|
+
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1Metric>]
|
7868
|
+
attr_accessor :metrics
|
7869
|
+
|
7870
|
+
# Config for evaluation output.
|
7871
|
+
# Corresponds to the JSON property `outputConfig`
|
7872
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1OutputConfig]
|
7873
|
+
attr_accessor :output_config
|
7874
|
+
|
7875
|
+
def initialize(**args)
|
7876
|
+
update!(**args)
|
7877
|
+
end
|
7878
|
+
|
7879
|
+
# Update properties of this object
|
7880
|
+
def update!(**args)
|
7881
|
+
@autorater_config = args[:autorater_config] if args.key?(:autorater_config)
|
7882
|
+
@dataset = args[:dataset] if args.key?(:dataset)
|
7883
|
+
@metrics = args[:metrics] if args.key?(:metrics)
|
7884
|
+
@output_config = args[:output_config] if args.key?(:output_config)
|
7885
|
+
end
|
7886
|
+
end
|
7887
|
+
|
7557
7888
|
# Request message for EvaluationService.EvaluateInstances.
|
7558
7889
|
class GoogleCloudAiplatformV1beta1EvaluateInstancesRequest
|
7559
7890
|
include Google::Apis::Core::Hashable
|
7560
7891
|
|
7892
|
+
# The configs for autorater. This is applicable to both EvaluateInstances and
|
7893
|
+
# EvaluateDataset.
|
7894
|
+
# Corresponds to the JSON property `autoraterConfig`
|
7895
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1AutoraterConfig]
|
7896
|
+
attr_accessor :autorater_config
|
7897
|
+
|
7561
7898
|
# Input for bleu metric.
|
7562
7899
|
# Corresponds to the JSON property `bleuInput`
|
7563
7900
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1BleuInput]
|
@@ -7719,6 +8056,7 @@ module Google
|
|
7719
8056
|
|
7720
8057
|
# Update properties of this object
|
7721
8058
|
def update!(**args)
|
8059
|
+
@autorater_config = args[:autorater_config] if args.key?(:autorater_config)
|
7722
8060
|
@bleu_input = args[:bleu_input] if args.key?(:bleu_input)
|
7723
8061
|
@coherence_input = args[:coherence_input] if args.key?(:coherence_input)
|
7724
8062
|
@comet_input = args[:comet_input] if args.key?(:comet_input)
|
@@ -8058,6 +8396,31 @@ module Google
|
|
8058
8396
|
end
|
8059
8397
|
end
|
8060
8398
|
|
8399
|
+
# The dataset used for evaluation.
|
8400
|
+
class GoogleCloudAiplatformV1beta1EvaluationDataset
|
8401
|
+
include Google::Apis::Core::Hashable
|
8402
|
+
|
8403
|
+
# The BigQuery location for the input content.
|
8404
|
+
# Corresponds to the JSON property `bigquerySource`
|
8405
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1BigQuerySource]
|
8406
|
+
attr_accessor :bigquery_source
|
8407
|
+
|
8408
|
+
# The Google Cloud Storage location for the input content.
|
8409
|
+
# Corresponds to the JSON property `gcsSource`
|
8410
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GcsSource]
|
8411
|
+
attr_accessor :gcs_source
|
8412
|
+
|
8413
|
+
def initialize(**args)
|
8414
|
+
update!(**args)
|
8415
|
+
end
|
8416
|
+
|
8417
|
+
# Update properties of this object
|
8418
|
+
def update!(**args)
|
8419
|
+
@bigquery_source = args[:bigquery_source] if args.key?(:bigquery_source)
|
8420
|
+
@gcs_source = args[:gcs_source] if args.key?(:gcs_source)
|
8421
|
+
end
|
8422
|
+
end
|
8423
|
+
|
8061
8424
|
# An edge describing the relationship between an Artifact and an Execution in a
|
8062
8425
|
# lineage graph.
|
8063
8426
|
class GoogleCloudAiplatformV1beta1Event
|
@@ -9581,6 +9944,51 @@ module Google
|
|
9581
9944
|
end
|
9582
9945
|
end
|
9583
9946
|
|
9947
|
+
# Runtime operation information for ModelGardenService.ExportPublisherModel.
|
9948
|
+
class GoogleCloudAiplatformV1beta1ExportPublisherModelOperationMetadata
|
9949
|
+
include Google::Apis::Core::Hashable
|
9950
|
+
|
9951
|
+
# Generic Metadata shared by all operations.
|
9952
|
+
# Corresponds to the JSON property `genericMetadata`
|
9953
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GenericOperationMetadata]
|
9954
|
+
attr_accessor :generic_metadata
|
9955
|
+
|
9956
|
+
def initialize(**args)
|
9957
|
+
update!(**args)
|
9958
|
+
end
|
9959
|
+
|
9960
|
+
# Update properties of this object
|
9961
|
+
def update!(**args)
|
9962
|
+
@generic_metadata = args[:generic_metadata] if args.key?(:generic_metadata)
|
9963
|
+
end
|
9964
|
+
end
|
9965
|
+
|
9966
|
+
# Response message for ModelGardenService.ExportPublisherModel.
|
9967
|
+
class GoogleCloudAiplatformV1beta1ExportPublisherModelResponse
|
9968
|
+
include Google::Apis::Core::Hashable
|
9969
|
+
|
9970
|
+
# The destination uri of the model weights.
|
9971
|
+
# Corresponds to the JSON property `destinationUri`
|
9972
|
+
# @return [String]
|
9973
|
+
attr_accessor :destination_uri
|
9974
|
+
|
9975
|
+
# The name of the PublisherModel resource. Format: `publishers/`publisher`/
|
9976
|
+
# models/`publisher_model`@`version_id``
|
9977
|
+
# Corresponds to the JSON property `publisherModel`
|
9978
|
+
# @return [String]
|
9979
|
+
attr_accessor :publisher_model
|
9980
|
+
|
9981
|
+
def initialize(**args)
|
9982
|
+
update!(**args)
|
9983
|
+
end
|
9984
|
+
|
9985
|
+
# Update properties of this object
|
9986
|
+
def update!(**args)
|
9987
|
+
@destination_uri = args[:destination_uri] if args.key?(:destination_uri)
|
9988
|
+
@publisher_model = args[:publisher_model] if args.key?(:publisher_model)
|
9989
|
+
end
|
9990
|
+
end
|
9991
|
+
|
9584
9992
|
# Request message for TensorboardService.ExportTensorboardTimeSeriesData.
|
9585
9993
|
class GoogleCloudAiplatformV1beta1ExportTensorboardTimeSeriesDataRequest
|
9586
9994
|
include Google::Apis::Core::Hashable
|
@@ -12192,6 +12600,14 @@ module Google
|
|
12192
12600
|
class GoogleCloudAiplatformV1beta1FileData
|
12193
12601
|
include Google::Apis::Core::Hashable
|
12194
12602
|
|
12603
|
+
# Optional. Display name of the file data. Used to provide a label or filename
|
12604
|
+
# to distinguish between file data items. This field is only returned in PromptMessage for
|
12605
|
+
# prompt management. It is not currently used in the Gemini GenerateContent
|
12606
|
+
# calls.
|
12607
|
+
# Corresponds to the JSON property `displayName`
|
12608
|
+
# @return [String]
|
12609
|
+
attr_accessor :display_name
|
12610
|
+
|
12195
12611
|
# Required. URI.
|
12196
12612
|
# Corresponds to the JSON property `fileUri`
|
12197
12613
|
# @return [String]
|
@@ -12208,6 +12624,7 @@ module Google
|
|
12208
12624
|
|
12209
12625
|
# Update properties of this object
|
12210
12626
|
def update!(**args)
|
12627
|
+
@display_name = args[:display_name] if args.key?(:display_name)
|
12211
12628
|
@file_uri = args[:file_uri] if args.key?(:file_uri)
|
12212
12629
|
@mime_type = args[:mime_type] if args.key?(:mime_type)
|
12213
12630
|
end
|
@@ -12890,6 +13307,47 @@ module Google
|
|
12890
13307
|
end
|
12891
13308
|
end
|
12892
13309
|
|
13310
|
+
# Configuration for GenAiAdvancedFeatures.
|
13311
|
+
class GoogleCloudAiplatformV1beta1GenAiAdvancedFeaturesConfig
|
13312
|
+
include Google::Apis::Core::Hashable
|
13313
|
+
|
13314
|
+
# Configuration for Retrieval Augmented Generation feature.
|
13315
|
+
# Corresponds to the JSON property `ragConfig`
|
13316
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GenAiAdvancedFeaturesConfigRagConfig]
|
13317
|
+
attr_accessor :rag_config
|
13318
|
+
|
13319
|
+
def initialize(**args)
|
13320
|
+
update!(**args)
|
13321
|
+
end
|
13322
|
+
|
13323
|
+
# Update properties of this object
|
13324
|
+
def update!(**args)
|
13325
|
+
@rag_config = args[:rag_config] if args.key?(:rag_config)
|
13326
|
+
end
|
13327
|
+
end
|
13328
|
+
|
13329
|
+
# Configuration for Retrieval Augmented Generation feature.
|
13330
|
+
class GoogleCloudAiplatformV1beta1GenAiAdvancedFeaturesConfigRagConfig
|
13331
|
+
include Google::Apis::Core::Hashable
|
13332
|
+
|
13333
|
+
# If true, enable Retrieval Augmented Generation in ChatCompletion request. Once
|
13334
|
+
# enabled, the endpoint will be identified as a GenAI endpoint and the Arthedain
|
13335
|
+
# router will be used.
|
13336
|
+
# Corresponds to the JSON property `enableRag`
|
13337
|
+
# @return [Boolean]
|
13338
|
+
attr_accessor :enable_rag
|
13339
|
+
alias_method :enable_rag?, :enable_rag
|
13340
|
+
|
13341
|
+
def initialize(**args)
|
13342
|
+
update!(**args)
|
13343
|
+
end
|
13344
|
+
|
13345
|
+
# Update properties of this object
|
13346
|
+
def update!(**args)
|
13347
|
+
@enable_rag = args[:enable_rag] if args.key?(:enable_rag)
|
13348
|
+
end
|
13349
|
+
end
|
13350
|
+
|
12893
13351
|
# Request message for NotebookInternalService.GenerateAccessToken.
|
12894
13352
|
class GoogleCloudAiplatformV1beta1GenerateAccessTokenRequest
|
12895
13353
|
include Google::Apis::Core::Hashable
|
@@ -13037,6 +13495,11 @@ module Google
|
|
13037
13495
|
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1Candidate>]
|
13038
13496
|
attr_accessor :candidates
|
13039
13497
|
|
13498
|
+
# Output only. Timestamp when the request is made to the server.
|
13499
|
+
# Corresponds to the JSON property `createTime`
|
13500
|
+
# @return [String]
|
13501
|
+
attr_accessor :create_time
|
13502
|
+
|
13040
13503
|
# Output only. The model version used to generate the response.
|
13041
13504
|
# Corresponds to the JSON property `modelVersion`
|
13042
13505
|
# @return [String]
|
@@ -13047,6 +13510,12 @@ module Google
|
|
13047
13510
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GenerateContentResponsePromptFeedback]
|
13048
13511
|
attr_accessor :prompt_feedback
|
13049
13512
|
|
13513
|
+
# Output only. response_id is used to identify each response. It is the encoding
|
13514
|
+
# of the event_id.
|
13515
|
+
# Corresponds to the JSON property `responseId`
|
13516
|
+
# @return [String]
|
13517
|
+
attr_accessor :response_id
|
13518
|
+
|
13050
13519
|
# Usage metadata about response(s).
|
13051
13520
|
# Corresponds to the JSON property `usageMetadata`
|
13052
13521
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GenerateContentResponseUsageMetadata]
|
@@ -13059,8 +13528,10 @@ module Google
|
|
13059
13528
|
# Update properties of this object
|
13060
13529
|
def update!(**args)
|
13061
13530
|
@candidates = args[:candidates] if args.key?(:candidates)
|
13531
|
+
@create_time = args[:create_time] if args.key?(:create_time)
|
13062
13532
|
@model_version = args[:model_version] if args.key?(:model_version)
|
13063
13533
|
@prompt_feedback = args[:prompt_feedback] if args.key?(:prompt_feedback)
|
13534
|
+
@response_id = args[:response_id] if args.key?(:response_id)
|
13064
13535
|
@usage_metadata = args[:usage_metadata] if args.key?(:usage_metadata)
|
13065
13536
|
end
|
13066
13537
|
end
|
@@ -13100,6 +13571,11 @@ module Google
|
|
13100
13571
|
class GoogleCloudAiplatformV1beta1GenerateContentResponseUsageMetadata
|
13101
13572
|
include Google::Apis::Core::Hashable
|
13102
13573
|
|
13574
|
+
# Output only. List of modalities of the cached content in the request input.
|
13575
|
+
# Corresponds to the JSON property `cacheTokensDetails`
|
13576
|
+
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ModalityTokenCount>]
|
13577
|
+
attr_accessor :cache_tokens_details
|
13578
|
+
|
13103
13579
|
# Output only. Number of tokens in the cached part in the input (the cached
|
13104
13580
|
# content).
|
13105
13581
|
# Corresponds to the JSON property `cachedContentTokenCount`
|
@@ -13111,6 +13587,11 @@ module Google
|
|
13111
13587
|
# @return [Fixnum]
|
13112
13588
|
attr_accessor :candidates_token_count
|
13113
13589
|
|
13590
|
+
# Output only. List of modalities that were returned in the response.
|
13591
|
+
# Corresponds to the JSON property `candidatesTokensDetails`
|
13592
|
+
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ModalityTokenCount>]
|
13593
|
+
attr_accessor :candidates_tokens_details
|
13594
|
+
|
13114
13595
|
# Number of tokens in the request. When `cached_content` is set, this is still
|
13115
13596
|
# the total effective prompt size meaning this includes the number of tokens in
|
13116
13597
|
# the cached content.
|
@@ -13118,7 +13599,24 @@ module Google
|
|
13118
13599
|
# @return [Fixnum]
|
13119
13600
|
attr_accessor :prompt_token_count
|
13120
13601
|
|
13121
|
-
#
|
13602
|
+
# Output only. List of modalities that were processed in the request input.
|
13603
|
+
# Corresponds to the JSON property `promptTokensDetails`
|
13604
|
+
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ModalityTokenCount>]
|
13605
|
+
attr_accessor :prompt_tokens_details
|
13606
|
+
|
13607
|
+
# Output only. Number of tokens present in tool-use prompt(s).
|
13608
|
+
# Corresponds to the JSON property `toolUsePromptTokenCount`
|
13609
|
+
# @return [Fixnum]
|
13610
|
+
attr_accessor :tool_use_prompt_token_count
|
13611
|
+
|
13612
|
+
# Output only. List of modalities that were processed for tool-use request
|
13613
|
+
# inputs.
|
13614
|
+
# Corresponds to the JSON property `toolUsePromptTokensDetails`
|
13615
|
+
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ModalityTokenCount>]
|
13616
|
+
attr_accessor :tool_use_prompt_tokens_details
|
13617
|
+
|
13618
|
+
# Total token count for prompt, response candidates, and tool-use prompts (if
|
13619
|
+
# present).
|
13122
13620
|
# Corresponds to the JSON property `totalTokenCount`
|
13123
13621
|
# @return [Fixnum]
|
13124
13622
|
attr_accessor :total_token_count
|
@@ -13129,9 +13627,14 @@ module Google
|
|
13129
13627
|
|
13130
13628
|
# Update properties of this object
|
13131
13629
|
def update!(**args)
|
13630
|
+
@cache_tokens_details = args[:cache_tokens_details] if args.key?(:cache_tokens_details)
|
13132
13631
|
@cached_content_token_count = args[:cached_content_token_count] if args.key?(:cached_content_token_count)
|
13133
13632
|
@candidates_token_count = args[:candidates_token_count] if args.key?(:candidates_token_count)
|
13633
|
+
@candidates_tokens_details = args[:candidates_tokens_details] if args.key?(:candidates_tokens_details)
|
13134
13634
|
@prompt_token_count = args[:prompt_token_count] if args.key?(:prompt_token_count)
|
13635
|
+
@prompt_tokens_details = args[:prompt_tokens_details] if args.key?(:prompt_tokens_details)
|
13636
|
+
@tool_use_prompt_token_count = args[:tool_use_prompt_token_count] if args.key?(:tool_use_prompt_token_count)
|
13637
|
+
@tool_use_prompt_tokens_details = args[:tool_use_prompt_tokens_details] if args.key?(:tool_use_prompt_tokens_details)
|
13135
13638
|
@total_token_count = args[:total_token_count] if args.key?(:total_token_count)
|
13136
13639
|
end
|
13137
13640
|
end
|
@@ -13155,6 +13658,11 @@ module Google
|
|
13155
13658
|
# @return [Array<String>]
|
13156
13659
|
attr_accessor :rai_media_filtered_reasons
|
13157
13660
|
|
13661
|
+
# List of video bytes or Cloud Storage URIs of the generated videos.
|
13662
|
+
# Corresponds to the JSON property `videos`
|
13663
|
+
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GenerateVideoResponseVideo>]
|
13664
|
+
attr_accessor :videos
|
13665
|
+
|
13158
13666
|
def initialize(**args)
|
13159
13667
|
update!(**args)
|
13160
13668
|
end
|
@@ -13164,6 +13672,38 @@ module Google
|
|
13164
13672
|
@generated_samples = args[:generated_samples] if args.key?(:generated_samples)
|
13165
13673
|
@rai_media_filtered_count = args[:rai_media_filtered_count] if args.key?(:rai_media_filtered_count)
|
13166
13674
|
@rai_media_filtered_reasons = args[:rai_media_filtered_reasons] if args.key?(:rai_media_filtered_reasons)
|
13675
|
+
@videos = args[:videos] if args.key?(:videos)
|
13676
|
+
end
|
13677
|
+
end
|
13678
|
+
|
13679
|
+
# A generated video.
|
13680
|
+
class GoogleCloudAiplatformV1beta1GenerateVideoResponseVideo
|
13681
|
+
include Google::Apis::Core::Hashable
|
13682
|
+
|
13683
|
+
# Base64 encoded bytes string representing the video.
|
13684
|
+
# Corresponds to the JSON property `bytesBase64Encoded`
|
13685
|
+
# @return [String]
|
13686
|
+
attr_accessor :bytes_base64_encoded
|
13687
|
+
|
13688
|
+
# Cloud Storage URI where the generated video is written.
|
13689
|
+
# Corresponds to the JSON property `gcsUri`
|
13690
|
+
# @return [String]
|
13691
|
+
attr_accessor :gcs_uri
|
13692
|
+
|
13693
|
+
# The MIME type of the content of the video. - video/mp4
|
13694
|
+
# Corresponds to the JSON property `mimeType`
|
13695
|
+
# @return [String]
|
13696
|
+
attr_accessor :mime_type
|
13697
|
+
|
13698
|
+
def initialize(**args)
|
13699
|
+
update!(**args)
|
13700
|
+
end
|
13701
|
+
|
13702
|
+
# Update properties of this object
|
13703
|
+
def update!(**args)
|
13704
|
+
@bytes_base64_encoded = args[:bytes_base64_encoded] if args.key?(:bytes_base64_encoded)
|
13705
|
+
@gcs_uri = args[:gcs_uri] if args.key?(:gcs_uri)
|
13706
|
+
@mime_type = args[:mime_type] if args.key?(:mime_type)
|
13167
13707
|
end
|
13168
13708
|
end
|
13169
13709
|
|
@@ -16084,6 +16624,32 @@ module Google
|
|
16084
16624
|
end
|
16085
16625
|
end
|
16086
16626
|
|
16627
|
+
# Response message for ModelService.ListModelVersionCheckpoints
|
16628
|
+
class GoogleCloudAiplatformV1beta1ListModelVersionCheckpointsResponse
|
16629
|
+
include Google::Apis::Core::Hashable
|
16630
|
+
|
16631
|
+
# List of Model Version checkpoints.
|
16632
|
+
# Corresponds to the JSON property `checkpoints`
|
16633
|
+
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ModelVersionCheckpoint>]
|
16634
|
+
attr_accessor :checkpoints
|
16635
|
+
|
16636
|
+
# A token to retrieve the next page of results. Pass to
|
16637
|
+
# ListModelVersionCheckpointsRequest.page_token to obtain that page.
|
16638
|
+
# Corresponds to the JSON property `nextPageToken`
|
16639
|
+
# @return [String]
|
16640
|
+
attr_accessor :next_page_token
|
16641
|
+
|
16642
|
+
def initialize(**args)
|
16643
|
+
update!(**args)
|
16644
|
+
end
|
16645
|
+
|
16646
|
+
# Update properties of this object
|
16647
|
+
def update!(**args)
|
16648
|
+
@checkpoints = args[:checkpoints] if args.key?(:checkpoints)
|
16649
|
+
@next_page_token = args[:next_page_token] if args.key?(:next_page_token)
|
16650
|
+
end
|
16651
|
+
end
|
16652
|
+
|
16087
16653
|
# Response message for ModelService.ListModelVersions
|
16088
16654
|
class GoogleCloudAiplatformV1beta1ListModelVersionsResponse
|
16089
16655
|
include Google::Apis::Core::Hashable
|
@@ -16866,6 +17432,12 @@ module Google
|
|
16866
17432
|
# @return [String]
|
16867
17433
|
attr_accessor :machine_type
|
16868
17434
|
|
17435
|
+
# Optional. Immutable. The number of nodes per replica for multihost GPU
|
17436
|
+
# deployments.
|
17437
|
+
# Corresponds to the JSON property `multihostGpuNodeCount`
|
17438
|
+
# @return [Fixnum]
|
17439
|
+
attr_accessor :multihost_gpu_node_count
|
17440
|
+
|
16869
17441
|
# A ReservationAffinity can be used to configure a Vertex AI resource (e.g., a
|
16870
17442
|
# DeployedModel) to draw its Compute Engine resources from a Shared Reservation,
|
16871
17443
|
# or exclusively from on-demand capacity.
|
@@ -16888,6 +17460,7 @@ module Google
|
|
16888
17460
|
@accelerator_count = args[:accelerator_count] if args.key?(:accelerator_count)
|
16889
17461
|
@accelerator_type = args[:accelerator_type] if args.key?(:accelerator_type)
|
16890
17462
|
@machine_type = args[:machine_type] if args.key?(:machine_type)
|
17463
|
+
@multihost_gpu_node_count = args[:multihost_gpu_node_count] if args.key?(:multihost_gpu_node_count)
|
16891
17464
|
@reservation_affinity = args[:reservation_affinity] if args.key?(:reservation_affinity)
|
16892
17465
|
@tpu_topology = args[:tpu_topology] if args.key?(:tpu_topology)
|
16893
17466
|
end
|
@@ -17156,6 +17729,58 @@ module Google
|
|
17156
17729
|
end
|
17157
17730
|
end
|
17158
17731
|
|
17732
|
+
# The metric used for dataset level evaluation.
|
17733
|
+
class GoogleCloudAiplatformV1beta1Metric
|
17734
|
+
include Google::Apis::Core::Hashable
|
17735
|
+
|
17736
|
+
# Optional. The aggregation metrics to use.
|
17737
|
+
# Corresponds to the JSON property `aggregationMetrics`
|
17738
|
+
# @return [Array<String>]
|
17739
|
+
attr_accessor :aggregation_metrics
|
17740
|
+
|
17741
|
+
# Spec for bleu score metric - calculates the precision of n-grams in the
|
17742
|
+
# prediction as compared to reference - returns a score ranging between 0 and 1.
|
17743
|
+
# Corresponds to the JSON property `bleuSpec`
|
17744
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1BleuSpec]
|
17745
|
+
attr_accessor :bleu_spec
|
17746
|
+
|
17747
|
+
# Spec for exact match metric - returns 1 if prediction and reference exactly
|
17748
|
+
# match, otherwise 0.
|
17749
|
+
# Corresponds to the JSON property `exactMatchSpec`
|
17750
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ExactMatchSpec]
|
17751
|
+
attr_accessor :exact_match_spec
|
17752
|
+
|
17753
|
+
# Spec for pairwise metric.
|
17754
|
+
# Corresponds to the JSON property `pairwiseMetricSpec`
|
17755
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1PairwiseMetricSpec]
|
17756
|
+
attr_accessor :pairwise_metric_spec
|
17757
|
+
|
17758
|
+
# Spec for pointwise metric.
|
17759
|
+
# Corresponds to the JSON property `pointwiseMetricSpec`
|
17760
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1PointwiseMetricSpec]
|
17761
|
+
attr_accessor :pointwise_metric_spec
|
17762
|
+
|
17763
|
+
# Spec for rouge score metric - calculates the recall of n-grams in prediction
|
17764
|
+
# as compared to reference - returns a score ranging between 0 and 1.
|
17765
|
+
# Corresponds to the JSON property `rougeSpec`
|
17766
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1RougeSpec]
|
17767
|
+
attr_accessor :rouge_spec
|
17768
|
+
|
17769
|
+
def initialize(**args)
|
17770
|
+
update!(**args)
|
17771
|
+
end
|
17772
|
+
|
17773
|
+
# Update properties of this object
|
17774
|
+
def update!(**args)
|
17775
|
+
@aggregation_metrics = args[:aggregation_metrics] if args.key?(:aggregation_metrics)
|
17776
|
+
@bleu_spec = args[:bleu_spec] if args.key?(:bleu_spec)
|
17777
|
+
@exact_match_spec = args[:exact_match_spec] if args.key?(:exact_match_spec)
|
17778
|
+
@pairwise_metric_spec = args[:pairwise_metric_spec] if args.key?(:pairwise_metric_spec)
|
17779
|
+
@pointwise_metric_spec = args[:pointwise_metric_spec] if args.key?(:pointwise_metric_spec)
|
17780
|
+
@rouge_spec = args[:rouge_spec] if args.key?(:rouge_spec)
|
17781
|
+
end
|
17782
|
+
end
|
17783
|
+
|
17159
17784
|
# Input for MetricX metric.
|
17160
17785
|
class GoogleCloudAiplatformV1beta1MetricxInput
|
17161
17786
|
include Google::Apis::Core::Hashable
|
@@ -17674,6 +18299,31 @@ module Google
|
|
17674
18299
|
end
|
17675
18300
|
end
|
17676
18301
|
|
18302
|
+
# Represents token counting info for a single modality.
|
18303
|
+
class GoogleCloudAiplatformV1beta1ModalityTokenCount
|
18304
|
+
include Google::Apis::Core::Hashable
|
18305
|
+
|
18306
|
+
# The modality associated with this token count.
|
18307
|
+
# Corresponds to the JSON property `modality`
|
18308
|
+
# @return [String]
|
18309
|
+
attr_accessor :modality
|
18310
|
+
|
18311
|
+
# Number of tokens.
|
18312
|
+
# Corresponds to the JSON property `tokenCount`
|
18313
|
+
# @return [Fixnum]
|
18314
|
+
attr_accessor :token_count
|
18315
|
+
|
18316
|
+
def initialize(**args)
|
18317
|
+
update!(**args)
|
18318
|
+
end
|
18319
|
+
|
18320
|
+
# Update properties of this object
|
18321
|
+
def update!(**args)
|
18322
|
+
@modality = args[:modality] if args.key?(:modality)
|
18323
|
+
@token_count = args[:token_count] if args.key?(:token_count)
|
18324
|
+
end
|
18325
|
+
end
|
18326
|
+
|
17677
18327
|
# A trained machine learning Model.
|
17678
18328
|
class GoogleCloudAiplatformV1beta1Model
|
17679
18329
|
include Google::Apis::Core::Hashable
|
@@ -17703,6 +18353,11 @@ module Google
|
|
17703
18353
|
# @return [String]
|
17704
18354
|
attr_accessor :create_time
|
17705
18355
|
|
18356
|
+
# The default checkpoint id of a model version.
|
18357
|
+
# Corresponds to the JSON property `defaultCheckpointId`
|
18358
|
+
# @return [String]
|
18359
|
+
attr_accessor :default_checkpoint_id
|
18360
|
+
|
17706
18361
|
# Output only. The pointers to DeployedModels created from this Model. Note that
|
17707
18362
|
# Model could have been deployed to Endpoints in different Locations.
|
17708
18363
|
# Corresponds to the JSON property `deployedModels`
|
@@ -17917,6 +18572,7 @@ module Google
|
|
17917
18572
|
@base_model_source = args[:base_model_source] if args.key?(:base_model_source)
|
17918
18573
|
@container_spec = args[:container_spec] if args.key?(:container_spec)
|
17919
18574
|
@create_time = args[:create_time] if args.key?(:create_time)
|
18575
|
+
@default_checkpoint_id = args[:default_checkpoint_id] if args.key?(:default_checkpoint_id)
|
17920
18576
|
@deployed_models = args[:deployed_models] if args.key?(:deployed_models)
|
17921
18577
|
@description = args[:description] if args.key?(:description)
|
17922
18578
|
@display_name = args[:display_name] if args.key?(:display_name)
|
@@ -18925,7 +19581,7 @@ module Google
|
|
18925
19581
|
# model in SavedModel format. * `tf-js` A [TensorFlow.js](https://www.tensorflow.
|
18926
19582
|
# org/js) model that can be used in the browser and in Node.js using JavaScript.
|
18927
19583
|
# * `core-ml` Used for iOS mobile devices. * `custom-trained` A Model that was
|
18928
|
-
# uploaded or trained by custom code.
|
19584
|
+
# uploaded or trained by custom code. * `genie` A tuned Model Garden model.
|
18929
19585
|
# Corresponds to the JSON property `id`
|
18930
19586
|
# @return [String]
|
18931
19587
|
attr_accessor :id
|
@@ -18951,6 +19607,17 @@ module Google
|
|
18951
19607
|
# @return [String]
|
18952
19608
|
attr_accessor :public_model_name
|
18953
19609
|
|
19610
|
+
# Optional. Whether to avoid pulling the model from the HF cache.
|
19611
|
+
# Corresponds to the JSON property `skipHfModelCache`
|
19612
|
+
# @return [Boolean]
|
19613
|
+
attr_accessor :skip_hf_model_cache
|
19614
|
+
alias_method :skip_hf_model_cache?, :skip_hf_model_cache
|
19615
|
+
|
19616
|
+
# Optional. The model garden source model version ID.
|
19617
|
+
# Corresponds to the JSON property `versionId`
|
19618
|
+
# @return [String]
|
19619
|
+
attr_accessor :version_id
|
19620
|
+
|
18954
19621
|
def initialize(**args)
|
18955
19622
|
update!(**args)
|
18956
19623
|
end
|
@@ -18958,6 +19625,8 @@ module Google
|
|
18958
19625
|
# Update properties of this object
|
18959
19626
|
def update!(**args)
|
18960
19627
|
@public_model_name = args[:public_model_name] if args.key?(:public_model_name)
|
19628
|
+
@skip_hf_model_cache = args[:skip_hf_model_cache] if args.key?(:skip_hf_model_cache)
|
19629
|
+
@version_id = args[:version_id] if args.key?(:version_id)
|
18961
19630
|
end
|
18962
19631
|
end
|
18963
19632
|
|
@@ -20610,6 +21279,45 @@ module Google
|
|
20610
21279
|
end
|
20611
21280
|
end
|
20612
21281
|
|
21282
|
+
# Describes the machine learning model version checkpoint.
|
21283
|
+
class GoogleCloudAiplatformV1beta1ModelVersionCheckpoint
|
21284
|
+
include Google::Apis::Core::Hashable
|
21285
|
+
|
21286
|
+
# The ID of the checkpoint.
|
21287
|
+
# Corresponds to the JSON property `checkpointId`
|
21288
|
+
# @return [String]
|
21289
|
+
attr_accessor :checkpoint_id
|
21290
|
+
|
21291
|
+
# The epoch of the checkpoint.
|
21292
|
+
# Corresponds to the JSON property `epoch`
|
21293
|
+
# @return [Fixnum]
|
21294
|
+
attr_accessor :epoch
|
21295
|
+
|
21296
|
+
# Identifier. The resource name of the ModelVersionCheckpoint. Format: `projects/
|
21297
|
+
# `project`/locations/`location`/models/`model`/versions/`version`/checkpoints/`
|
21298
|
+
# checkpoint``
|
21299
|
+
# Corresponds to the JSON property `name`
|
21300
|
+
# @return [String]
|
21301
|
+
attr_accessor :name
|
21302
|
+
|
21303
|
+
# The step of the checkpoint.
|
21304
|
+
# Corresponds to the JSON property `step`
|
21305
|
+
# @return [Fixnum]
|
21306
|
+
attr_accessor :step
|
21307
|
+
|
21308
|
+
def initialize(**args)
|
21309
|
+
update!(**args)
|
21310
|
+
end
|
21311
|
+
|
21312
|
+
# Update properties of this object
|
21313
|
+
def update!(**args)
|
21314
|
+
@checkpoint_id = args[:checkpoint_id] if args.key?(:checkpoint_id)
|
21315
|
+
@epoch = args[:epoch] if args.key?(:epoch)
|
21316
|
+
@name = args[:name] if args.key?(:name)
|
21317
|
+
@step = args[:step] if args.key?(:step)
|
21318
|
+
end
|
21319
|
+
end
|
21320
|
+
|
20613
21321
|
# Runtime operation information for IndexEndpointService.MutateDeployedIndex.
|
20614
21322
|
class GoogleCloudAiplatformV1beta1MutateDeployedIndexOperationMetadata
|
20615
21323
|
include Google::Apis::Core::Hashable
|
@@ -21719,8 +22427,8 @@ module Google
|
|
21719
22427
|
# @return [String]
|
21720
22428
|
attr_accessor :notebook_runtime_template_resource_name
|
21721
22429
|
|
21722
|
-
#
|
21723
|
-
#
|
22430
|
+
# The Schedule resource name if this job is triggered by one. Format: `projects/`
|
22431
|
+
# project_id`/locations/`location`/schedules/`schedule_id``
|
21724
22432
|
# Corresponds to the JSON property `scheduleResourceName`
|
21725
22433
|
# @return [String]
|
21726
22434
|
attr_accessor :schedule_resource_name
|
@@ -22083,6 +22791,11 @@ module Google
|
|
22083
22791
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ShieldedVmConfig]
|
22084
22792
|
attr_accessor :shielded_vm_config
|
22085
22793
|
|
22794
|
+
# Notebook Software Config.
|
22795
|
+
# Corresponds to the JSON property `softwareConfig`
|
22796
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1NotebookSoftwareConfig]
|
22797
|
+
attr_accessor :software_config
|
22798
|
+
|
22086
22799
|
# Output only. Timestamp when this NotebookRuntime was most recently updated.
|
22087
22800
|
# Corresponds to the JSON property `updateTime`
|
22088
22801
|
# @return [String]
|
@@ -22123,6 +22836,7 @@ module Google
|
|
22123
22836
|
@satisfies_pzs = args[:satisfies_pzs] if args.key?(:satisfies_pzs)
|
22124
22837
|
@service_account = args[:service_account] if args.key?(:service_account)
|
22125
22838
|
@shielded_vm_config = args[:shielded_vm_config] if args.key?(:shielded_vm_config)
|
22839
|
+
@software_config = args[:software_config] if args.key?(:software_config)
|
22126
22840
|
@update_time = args[:update_time] if args.key?(:update_time)
|
22127
22841
|
@version = args[:version] if args.key?(:version)
|
22128
22842
|
end
|
@@ -22241,6 +22955,11 @@ module Google
|
|
22241
22955
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ShieldedVmConfig]
|
22242
22956
|
attr_accessor :shielded_vm_config
|
22243
22957
|
|
22958
|
+
# Notebook Software Config.
|
22959
|
+
# Corresponds to the JSON property `softwareConfig`
|
22960
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1NotebookSoftwareConfig]
|
22961
|
+
attr_accessor :software_config
|
22962
|
+
|
22244
22963
|
# Output only. Timestamp when this NotebookRuntimeTemplate was most recently
|
22245
22964
|
# updated.
|
22246
22965
|
# Corresponds to the JSON property `updateTime`
|
@@ -22270,6 +22989,7 @@ module Google
|
|
22270
22989
|
@notebook_runtime_type = args[:notebook_runtime_type] if args.key?(:notebook_runtime_type)
|
22271
22990
|
@service_account = args[:service_account] if args.key?(:service_account)
|
22272
22991
|
@shielded_vm_config = args[:shielded_vm_config] if args.key?(:shielded_vm_config)
|
22992
|
+
@software_config = args[:software_config] if args.key?(:software_config)
|
22273
22993
|
@update_time = args[:update_time] if args.key?(:update_time)
|
22274
22994
|
end
|
22275
22995
|
end
|
@@ -22293,6 +23013,51 @@ module Google
|
|
22293
23013
|
end
|
22294
23014
|
end
|
22295
23015
|
|
23016
|
+
# Notebook Software Config.
|
23017
|
+
class GoogleCloudAiplatformV1beta1NotebookSoftwareConfig
|
23018
|
+
include Google::Apis::Core::Hashable
|
23019
|
+
|
23020
|
+
# Optional. Environment variables to be passed to the container. Maximum limit
|
23021
|
+
# is 100.
|
23022
|
+
# Corresponds to the JSON property `env`
|
23023
|
+
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1EnvVar>]
|
23024
|
+
attr_accessor :env
|
23025
|
+
|
23026
|
+
# Post startup script config.
|
23027
|
+
# Corresponds to the JSON property `postStartupScriptConfig`
|
23028
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1PostStartupScriptConfig]
|
23029
|
+
attr_accessor :post_startup_script_config
|
23030
|
+
|
23031
|
+
def initialize(**args)
|
23032
|
+
update!(**args)
|
23033
|
+
end
|
23034
|
+
|
23035
|
+
# Update properties of this object
|
23036
|
+
def update!(**args)
|
23037
|
+
@env = args[:env] if args.key?(:env)
|
23038
|
+
@post_startup_script_config = args[:post_startup_script_config] if args.key?(:post_startup_script_config)
|
23039
|
+
end
|
23040
|
+
end
|
23041
|
+
|
23042
|
+
# Config for evaluation output.
|
23043
|
+
class GoogleCloudAiplatformV1beta1OutputConfig
|
23044
|
+
include Google::Apis::Core::Hashable
|
23045
|
+
|
23046
|
+
# The Google Cloud Storage location where the output is to be written to.
|
23047
|
+
# Corresponds to the JSON property `gcsDestination`
|
23048
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GcsDestination]
|
23049
|
+
attr_accessor :gcs_destination
|
23050
|
+
|
23051
|
+
def initialize(**args)
|
23052
|
+
update!(**args)
|
23053
|
+
end
|
23054
|
+
|
23055
|
+
# Update properties of this object
|
23056
|
+
def update!(**args)
|
23057
|
+
@gcs_destination = args[:gcs_destination] if args.key?(:gcs_destination)
|
23058
|
+
end
|
23059
|
+
end
|
23060
|
+
|
22296
23061
|
# PSC config that is used to automatically create forwarding rule via
|
22297
23062
|
# ServiceConnectionMap.
|
22298
23063
|
class GoogleCloudAiplatformV1beta1PscAutomationConfig
|
@@ -22399,18 +23164,36 @@ module Google
|
|
22399
23164
|
class GoogleCloudAiplatformV1beta1PairwiseMetricSpec
|
22400
23165
|
include Google::Apis::Core::Hashable
|
22401
23166
|
|
23167
|
+
# Optional. The field name of the baseline response.
|
23168
|
+
# Corresponds to the JSON property `baselineResponseFieldName`
|
23169
|
+
# @return [String]
|
23170
|
+
attr_accessor :baseline_response_field_name
|
23171
|
+
|
23172
|
+
# Optional. The field name of the candidate response.
|
23173
|
+
# Corresponds to the JSON property `candidateResponseFieldName`
|
23174
|
+
# @return [String]
|
23175
|
+
attr_accessor :candidate_response_field_name
|
23176
|
+
|
22402
23177
|
# Required. Metric prompt template for pairwise metric.
|
22403
23178
|
# Corresponds to the JSON property `metricPromptTemplate`
|
22404
23179
|
# @return [String]
|
22405
23180
|
attr_accessor :metric_prompt_template
|
22406
23181
|
|
23182
|
+
# Optional. System instructions for pairwise metric.
|
23183
|
+
# Corresponds to the JSON property `systemInstruction`
|
23184
|
+
# @return [String]
|
23185
|
+
attr_accessor :system_instruction
|
23186
|
+
|
22407
23187
|
def initialize(**args)
|
22408
23188
|
update!(**args)
|
22409
23189
|
end
|
22410
23190
|
|
22411
23191
|
# Update properties of this object
|
22412
23192
|
def update!(**args)
|
23193
|
+
@baseline_response_field_name = args[:baseline_response_field_name] if args.key?(:baseline_response_field_name)
|
23194
|
+
@candidate_response_field_name = args[:candidate_response_field_name] if args.key?(:candidate_response_field_name)
|
22413
23195
|
@metric_prompt_template = args[:metric_prompt_template] if args.key?(:metric_prompt_template)
|
23196
|
+
@system_instruction = args[:system_instruction] if args.key?(:system_instruction)
|
22414
23197
|
end
|
22415
23198
|
end
|
22416
23199
|
|
@@ -22717,7 +23500,7 @@ module Google
|
|
22717
23500
|
# @return [String]
|
22718
23501
|
attr_accessor :text
|
22719
23502
|
|
22720
|
-
#
|
23503
|
+
# Output only. Indicates if the part is thought from the model.
|
22721
23504
|
# Corresponds to the JSON property `thought`
|
22722
23505
|
# @return [Boolean]
|
22723
23506
|
attr_accessor :thought
|
@@ -23808,6 +24591,11 @@ module Google
|
|
23808
24591
|
# @return [String]
|
23809
24592
|
attr_accessor :metric_prompt_template
|
23810
24593
|
|
24594
|
+
# Optional. System instructions for pointwise metric.
|
24595
|
+
# Corresponds to the JSON property `systemInstruction`
|
24596
|
+
# @return [String]
|
24597
|
+
attr_accessor :system_instruction
|
24598
|
+
|
23811
24599
|
def initialize(**args)
|
23812
24600
|
update!(**args)
|
23813
24601
|
end
|
@@ -23815,6 +24603,7 @@ module Google
|
|
23815
24603
|
# Update properties of this object
|
23816
24604
|
def update!(**args)
|
23817
24605
|
@metric_prompt_template = args[:metric_prompt_template] if args.key?(:metric_prompt_template)
|
24606
|
+
@system_instruction = args[:system_instruction] if args.key?(:system_instruction)
|
23818
24607
|
end
|
23819
24608
|
end
|
23820
24609
|
|
@@ -23838,6 +24627,39 @@ module Google
|
|
23838
24627
|
end
|
23839
24628
|
end
|
23840
24629
|
|
24630
|
+
# Post startup script config.
|
24631
|
+
class GoogleCloudAiplatformV1beta1PostStartupScriptConfig
|
24632
|
+
include Google::Apis::Core::Hashable
|
24633
|
+
|
24634
|
+
# Optional. Post startup script to run after runtime is started.
|
24635
|
+
# Corresponds to the JSON property `postStartupScript`
|
24636
|
+
# @return [String]
|
24637
|
+
attr_accessor :post_startup_script
|
24638
|
+
|
24639
|
+
# Optional. Post startup script behavior that defines download and execution
|
24640
|
+
# behavior.
|
24641
|
+
# Corresponds to the JSON property `postStartupScriptBehavior`
|
24642
|
+
# @return [String]
|
24643
|
+
attr_accessor :post_startup_script_behavior
|
24644
|
+
|
24645
|
+
# Optional. Post startup script url to download. Example: https://bucket/script.
|
24646
|
+
# sh
|
24647
|
+
# Corresponds to the JSON property `postStartupScriptUrl`
|
24648
|
+
# @return [String]
|
24649
|
+
attr_accessor :post_startup_script_url
|
24650
|
+
|
24651
|
+
def initialize(**args)
|
24652
|
+
update!(**args)
|
24653
|
+
end
|
24654
|
+
|
24655
|
+
# Update properties of this object
|
24656
|
+
def update!(**args)
|
24657
|
+
@post_startup_script = args[:post_startup_script] if args.key?(:post_startup_script)
|
24658
|
+
@post_startup_script_behavior = args[:post_startup_script_behavior] if args.key?(:post_startup_script_behavior)
|
24659
|
+
@post_startup_script_url = args[:post_startup_script_url] if args.key?(:post_startup_script_url)
|
24660
|
+
end
|
24661
|
+
end
|
24662
|
+
|
23841
24663
|
# The configuration for the prebuilt speaker to use.
|
23842
24664
|
class GoogleCloudAiplatformV1beta1PrebuiltVoiceConfig
|
23843
24665
|
include Google::Apis::Core::Hashable
|
@@ -24244,6 +25066,12 @@ module Google
|
|
24244
25066
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ProbeExecAction]
|
24245
25067
|
attr_accessor :exec
|
24246
25068
|
|
25069
|
+
# Number of consecutive failures before the probe is considered failed. Defaults
|
25070
|
+
# to 3. Minimum value is 1. Maps to Kubernetes probe argument 'failureThreshold'.
|
25071
|
+
# Corresponds to the JSON property `failureThreshold`
|
25072
|
+
# @return [Fixnum]
|
25073
|
+
attr_accessor :failure_threshold
|
25074
|
+
|
24247
25075
|
# GrpcAction checks the health of a container using a gRPC service.
|
24248
25076
|
# Corresponds to the JSON property `grpc`
|
24249
25077
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ProbeGrpcAction]
|
@@ -24254,6 +25082,12 @@ module Google
|
|
24254
25082
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ProbeHttpGetAction]
|
24255
25083
|
attr_accessor :http_get
|
24256
25084
|
|
25085
|
+
# Number of seconds to wait before starting the probe. Defaults to 0. Minimum
|
25086
|
+
# value is 0. Maps to Kubernetes probe argument 'initialDelaySeconds'.
|
25087
|
+
# Corresponds to the JSON property `initialDelaySeconds`
|
25088
|
+
# @return [Fixnum]
|
25089
|
+
attr_accessor :initial_delay_seconds
|
25090
|
+
|
24257
25091
|
# How often (in seconds) to perform the probe. Default to 10 seconds. Minimum
|
24258
25092
|
# value is 1. Must be less than timeout_seconds. Maps to Kubernetes probe
|
24259
25093
|
# argument 'periodSeconds'.
|
@@ -24261,6 +25095,13 @@ module Google
|
|
24261
25095
|
# @return [Fixnum]
|
24262
25096
|
attr_accessor :period_seconds
|
24263
25097
|
|
25098
|
+
# Number of consecutive successes before the probe is considered successful.
|
25099
|
+
# Defaults to 1. Minimum value is 1. Maps to Kubernetes probe argument '
|
25100
|
+
# successThreshold'.
|
25101
|
+
# Corresponds to the JSON property `successThreshold`
|
25102
|
+
# @return [Fixnum]
|
25103
|
+
attr_accessor :success_threshold
|
25104
|
+
|
24264
25105
|
# TcpSocketAction probes the health of a container by opening a TCP socket
|
24265
25106
|
# connection.
|
24266
25107
|
# Corresponds to the JSON property `tcpSocket`
|
@@ -24281,9 +25122,12 @@ module Google
|
|
24281
25122
|
# Update properties of this object
|
24282
25123
|
def update!(**args)
|
24283
25124
|
@exec = args[:exec] if args.key?(:exec)
|
25125
|
+
@failure_threshold = args[:failure_threshold] if args.key?(:failure_threshold)
|
24284
25126
|
@grpc = args[:grpc] if args.key?(:grpc)
|
24285
25127
|
@http_get = args[:http_get] if args.key?(:http_get)
|
25128
|
+
@initial_delay_seconds = args[:initial_delay_seconds] if args.key?(:initial_delay_seconds)
|
24286
25129
|
@period_seconds = args[:period_seconds] if args.key?(:period_seconds)
|
25130
|
+
@success_threshold = args[:success_threshold] if args.key?(:success_threshold)
|
24287
25131
|
@tcp_socket = args[:tcp_socket] if args.key?(:tcp_socket)
|
24288
25132
|
@timeout_seconds = args[:timeout_seconds] if args.key?(:timeout_seconds)
|
24289
25133
|
end
|
@@ -24705,8 +25549,8 @@ module Google
|
|
24705
25549
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ModelContainerSpec]
|
24706
25550
|
attr_accessor :container_spec
|
24707
25551
|
|
24708
|
-
# A description of resources that are dedicated to a DeployedModel
|
24709
|
-
# need a higher degree of manual configuration.
|
25552
|
+
# A description of resources that are dedicated to a DeployedModel or
|
25553
|
+
# DeployedIndex, and that need a higher degree of manual configuration.
|
24710
25554
|
# Corresponds to the JSON property `dedicatedResources`
|
24711
25555
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DedicatedResources]
|
24712
25556
|
attr_accessor :dedicated_resources
|
@@ -26036,6 +26880,11 @@ module Google
|
|
26036
26880
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1RagEmbeddingModelConfig]
|
26037
26881
|
attr_accessor :rag_embedding_model_config
|
26038
26882
|
|
26883
|
+
# Output only. Number of RagFiles in the RagCorpus.
|
26884
|
+
# Corresponds to the JSON property `ragFilesCount`
|
26885
|
+
# @return [Fixnum]
|
26886
|
+
attr_accessor :rag_files_count
|
26887
|
+
|
26039
26888
|
# Config for the Vector DB to use for RAG.
|
26040
26889
|
# Corresponds to the JSON property `ragVectorDbConfig`
|
26041
26890
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1RagVectorDbConfig]
|
@@ -26068,6 +26917,7 @@ module Google
|
|
26068
26917
|
@display_name = args[:display_name] if args.key?(:display_name)
|
26069
26918
|
@name = args[:name] if args.key?(:name)
|
26070
26919
|
@rag_embedding_model_config = args[:rag_embedding_model_config] if args.key?(:rag_embedding_model_config)
|
26920
|
+
@rag_files_count = args[:rag_files_count] if args.key?(:rag_files_count)
|
26071
26921
|
@rag_vector_db_config = args[:rag_vector_db_config] if args.key?(:rag_vector_db_config)
|
26072
26922
|
@update_time = args[:update_time] if args.key?(:update_time)
|
26073
26923
|
@vector_db_config = args[:vector_db_config] if args.key?(:vector_db_config)
|
@@ -26478,7 +27328,8 @@ module Google
|
|
26478
27328
|
# @return [Fixnum]
|
26479
27329
|
attr_accessor :max_parsing_requests_per_min
|
26480
27330
|
|
26481
|
-
# The name of a LLM model used for parsing. Format: `
|
27331
|
+
# The name of a LLM model used for parsing. Format: * `projects/`project_id`/
|
27332
|
+
# locations/`location`/publishers/`publisher`/models/`model``
|
26482
27333
|
# Corresponds to the JSON property `modelName`
|
26483
27334
|
# @return [String]
|
26484
27335
|
attr_accessor :model_name
|
@@ -26733,7 +27584,8 @@ module Google
|
|
26733
27584
|
class GoogleCloudAiplatformV1beta1RagVectorDbConfig
|
26734
27585
|
include Google::Apis::Core::Hashable
|
26735
27586
|
|
26736
|
-
# The generic reusable api auth config.
|
27587
|
+
# The generic reusable api auth config. Deprecated. Please use AuthConfig (
|
27588
|
+
# google/cloud/aiplatform/master/auth.proto) instead.
|
26737
27589
|
# Corresponds to the JSON property `apiAuth`
|
26738
27590
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ApiAuth]
|
26739
27591
|
attr_accessor :api_auth
|
@@ -27413,6 +28265,11 @@ module Google
|
|
27413
28265
|
# @return [Array<Hash<String,Object>>]
|
27414
28266
|
attr_accessor :class_methods
|
27415
28267
|
|
28268
|
+
# The specification of a Reasoning Engine deployment.
|
28269
|
+
# Corresponds to the JSON property `deploymentSpec`
|
28270
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ReasoningEngineSpecDeploymentSpec]
|
28271
|
+
attr_accessor :deployment_spec
|
28272
|
+
|
27416
28273
|
# User provided package spec like pickled object and package requirements.
|
27417
28274
|
# Corresponds to the JSON property `packageSpec`
|
27418
28275
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ReasoningEngineSpecPackageSpec]
|
@@ -27425,10 +28282,40 @@ module Google
|
|
27425
28282
|
# Update properties of this object
|
27426
28283
|
def update!(**args)
|
27427
28284
|
@class_methods = args[:class_methods] if args.key?(:class_methods)
|
28285
|
+
@deployment_spec = args[:deployment_spec] if args.key?(:deployment_spec)
|
27428
28286
|
@package_spec = args[:package_spec] if args.key?(:package_spec)
|
27429
28287
|
end
|
27430
28288
|
end
|
27431
28289
|
|
28290
|
+
# The specification of a Reasoning Engine deployment.
|
28291
|
+
class GoogleCloudAiplatformV1beta1ReasoningEngineSpecDeploymentSpec
|
28292
|
+
include Google::Apis::Core::Hashable
|
28293
|
+
|
28294
|
+
# Optional. Environment variables to be set with the Reasoning Engine deployment.
|
28295
|
+
# The environment variables can be updated through the UpdateReasoningEngine
|
28296
|
+
# API.
|
28297
|
+
# Corresponds to the JSON property `env`
|
28298
|
+
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1EnvVar>]
|
28299
|
+
attr_accessor :env
|
28300
|
+
|
28301
|
+
# Optional. Environment variables where the value is a secret in Cloud Secret
|
28302
|
+
# Manager. To use this feature, add 'Secret Manager Secret Accessor' role (roles/
|
28303
|
+
# secretmanager.secretAccessor) to AI Platform Reasoning Engine Service Agent.
|
28304
|
+
# Corresponds to the JSON property `secretEnv`
|
28305
|
+
# @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1SecretEnvVar>]
|
28306
|
+
attr_accessor :secret_env
|
28307
|
+
|
28308
|
+
def initialize(**args)
|
28309
|
+
update!(**args)
|
28310
|
+
end
|
28311
|
+
|
28312
|
+
# Update properties of this object
|
28313
|
+
def update!(**args)
|
28314
|
+
@env = args[:env] if args.key?(:env)
|
28315
|
+
@secret_env = args[:secret_env] if args.key?(:secret_env)
|
28316
|
+
end
|
28317
|
+
end
|
28318
|
+
|
27432
28319
|
# User provided package spec like pickled object and package requirements.
|
27433
28320
|
class GoogleCloudAiplatformV1beta1ReasoningEngineSpecPackageSpec
|
27434
28321
|
include Google::Apis::Core::Hashable
|
@@ -27742,7 +28629,7 @@ module Google
|
|
27742
28629
|
attr_accessor :reservation_affinity_type
|
27743
28630
|
|
27744
28631
|
# Optional. Corresponds to the label values of a reservation resource. This must
|
27745
|
-
# be the full resource name of the reservation.
|
28632
|
+
# be the full resource name of the reservation or reservation block.
|
27746
28633
|
# Corresponds to the JSON property `values`
|
27747
28634
|
# @return [Array<String>]
|
27748
28635
|
attr_accessor :values
|
@@ -27989,8 +28876,9 @@ module Google
|
|
27989
28876
|
attr_accessor :disable_attribution
|
27990
28877
|
alias_method :disable_attribution?, :disable_attribution
|
27991
28878
|
|
27992
|
-
# Retrieve from Vertex AI Search datastore for grounding.
|
27993
|
-
# google.com/products/agent-
|
28879
|
+
# Retrieve from Vertex AI Search datastore or engine for grounding. datastore
|
28880
|
+
# and engine are mutually exclusive. See https://cloud.google.com/products/agent-
|
28881
|
+
# builder
|
27994
28882
|
# Corresponds to the JSON property `vertexAiSearch`
|
27995
28883
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1VertexAiSearch]
|
27996
28884
|
attr_accessor :vertex_ai_search
|
@@ -28012,6 +28900,34 @@ module Google
|
|
28012
28900
|
end
|
28013
28901
|
end
|
28014
28902
|
|
28903
|
+
# Retrieval config.
|
28904
|
+
class GoogleCloudAiplatformV1beta1RetrievalConfig
|
28905
|
+
include Google::Apis::Core::Hashable
|
28906
|
+
|
28907
|
+
# The language code of the user.
|
28908
|
+
# Corresponds to the JSON property `languageCode`
|
28909
|
+
# @return [String]
|
28910
|
+
attr_accessor :language_code
|
28911
|
+
|
28912
|
+
# An object that represents a latitude/longitude pair. This is expressed as a
|
28913
|
+
# pair of doubles to represent degrees latitude and degrees longitude. Unless
|
28914
|
+
# specified otherwise, this object must conform to the WGS84 standard. Values
|
28915
|
+
# must be within normalized ranges.
|
28916
|
+
# Corresponds to the JSON property `latLng`
|
28917
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleTypeLatLng]
|
28918
|
+
attr_accessor :lat_lng
|
28919
|
+
|
28920
|
+
def initialize(**args)
|
28921
|
+
update!(**args)
|
28922
|
+
end
|
28923
|
+
|
28924
|
+
# Update properties of this object
|
28925
|
+
def update!(**args)
|
28926
|
+
@language_code = args[:language_code] if args.key?(:language_code)
|
28927
|
+
@lat_lng = args[:lat_lng] if args.key?(:lat_lng)
|
28928
|
+
end
|
28929
|
+
end
|
28930
|
+
|
28015
28931
|
# Metadata related to retrieval in the grounding flow.
|
28016
28932
|
class GoogleCloudAiplatformV1beta1RetrievalMetadata
|
28017
28933
|
include Google::Apis::Core::Hashable
|
@@ -28139,6 +29055,59 @@ module Google
|
|
28139
29055
|
end
|
28140
29056
|
end
|
28141
29057
|
|
29058
|
+
# Configuration for rolling deployments.
|
29059
|
+
class GoogleCloudAiplatformV1beta1RolloutOptions
|
29060
|
+
include Google::Apis::Core::Hashable
|
29061
|
+
|
29062
|
+
# Percentage of allowed additional replicas. For autoscaling deployments, this
|
29063
|
+
# refers to the target replica count.
|
29064
|
+
# Corresponds to the JSON property `maxSurgePercentage`
|
29065
|
+
# @return [Fixnum]
|
29066
|
+
attr_accessor :max_surge_percentage
|
29067
|
+
|
29068
|
+
# Absolute count of allowed additional replicas.
|
29069
|
+
# Corresponds to the JSON property `maxSurgeReplicas`
|
29070
|
+
# @return [Fixnum]
|
29071
|
+
attr_accessor :max_surge_replicas
|
29072
|
+
|
29073
|
+
# Percentage of replicas allowed to be unavailable. For autoscaling deployments,
|
29074
|
+
# this refers to the target replica count.
|
29075
|
+
# Corresponds to the JSON property `maxUnavailablePercentage`
|
29076
|
+
# @return [Fixnum]
|
29077
|
+
attr_accessor :max_unavailable_percentage
|
29078
|
+
|
29079
|
+
# Absolute count of replicas allowed to be unavailable.
|
29080
|
+
# Corresponds to the JSON property `maxUnavailableReplicas`
|
29081
|
+
# @return [Fixnum]
|
29082
|
+
attr_accessor :max_unavailable_replicas
|
29083
|
+
|
29084
|
+
# ID of the DeployedModel that this deployment should replace.
|
29085
|
+
# Corresponds to the JSON property `previousDeployedModel`
|
29086
|
+
# @return [String]
|
29087
|
+
attr_accessor :previous_deployed_model
|
29088
|
+
|
29089
|
+
# Output only. Read-only. Revision number determines the relative priority of
|
29090
|
+
# DeployedModels in the same rollout. The DeployedModel with the largest
|
29091
|
+
# revision number specifies the intended state of the deployment.
|
29092
|
+
# Corresponds to the JSON property `revisionNumber`
|
29093
|
+
# @return [Fixnum]
|
29094
|
+
attr_accessor :revision_number
|
29095
|
+
|
29096
|
+
def initialize(**args)
|
29097
|
+
update!(**args)
|
29098
|
+
end
|
29099
|
+
|
29100
|
+
# Update properties of this object
|
29101
|
+
def update!(**args)
|
29102
|
+
@max_surge_percentage = args[:max_surge_percentage] if args.key?(:max_surge_percentage)
|
29103
|
+
@max_surge_replicas = args[:max_surge_replicas] if args.key?(:max_surge_replicas)
|
29104
|
+
@max_unavailable_percentage = args[:max_unavailable_percentage] if args.key?(:max_unavailable_percentage)
|
29105
|
+
@max_unavailable_replicas = args[:max_unavailable_replicas] if args.key?(:max_unavailable_replicas)
|
29106
|
+
@previous_deployed_model = args[:previous_deployed_model] if args.key?(:previous_deployed_model)
|
29107
|
+
@revision_number = args[:revision_number] if args.key?(:revision_number)
|
29108
|
+
end
|
29109
|
+
end
|
29110
|
+
|
28142
29111
|
# Input for rouge metric.
|
28143
29112
|
class GoogleCloudAiplatformV1beta1RougeInput
|
28144
29113
|
include Google::Apis::Core::Hashable
|
@@ -32427,8 +33396,9 @@ module Google
|
|
32427
33396
|
class GoogleCloudAiplatformV1beta1SchemaTextDataItem
|
32428
33397
|
include Google::Apis::Core::Hashable
|
32429
33398
|
|
32430
|
-
# Output only. Google Cloud Storage URI points to the original text in
|
32431
|
-
# bucket. The text file is up to 10MB
|
33399
|
+
# Output only. Google Cloud Storage URI points to a copy of the original text in
|
33400
|
+
# the Vertex-managed bucket in the user's project. The text file is up to 10MB
|
33401
|
+
# in size.
|
32432
33402
|
# Corresponds to the JSON property `gcsUri`
|
32433
33403
|
# @return [String]
|
32434
33404
|
attr_accessor :gcs_uri
|
@@ -36362,6 +37332,62 @@ module Google
|
|
36362
37332
|
end
|
36363
37333
|
end
|
36364
37334
|
|
37335
|
+
# Represents an environment variable where the value is a secret in Cloud Secret
|
37336
|
+
# Manager.
|
37337
|
+
class GoogleCloudAiplatformV1beta1SecretEnvVar
|
37338
|
+
include Google::Apis::Core::Hashable
|
37339
|
+
|
37340
|
+
# Required. Name of the secret environment variable.
|
37341
|
+
# Corresponds to the JSON property `name`
|
37342
|
+
# @return [String]
|
37343
|
+
attr_accessor :name
|
37344
|
+
|
37345
|
+
# Reference to a secret stored in the Cloud Secret Manager that will provide the
|
37346
|
+
# value for this environment variable.
|
37347
|
+
# Corresponds to the JSON property `secretRef`
|
37348
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1SecretRef]
|
37349
|
+
attr_accessor :secret_ref
|
37350
|
+
|
37351
|
+
def initialize(**args)
|
37352
|
+
update!(**args)
|
37353
|
+
end
|
37354
|
+
|
37355
|
+
# Update properties of this object
|
37356
|
+
def update!(**args)
|
37357
|
+
@name = args[:name] if args.key?(:name)
|
37358
|
+
@secret_ref = args[:secret_ref] if args.key?(:secret_ref)
|
37359
|
+
end
|
37360
|
+
end
|
37361
|
+
|
37362
|
+
# Reference to a secret stored in the Cloud Secret Manager that will provide the
|
37363
|
+
# value for this environment variable.
|
37364
|
+
class GoogleCloudAiplatformV1beta1SecretRef
|
37365
|
+
include Google::Apis::Core::Hashable
|
37366
|
+
|
37367
|
+
# Required. The name of the secret in Cloud Secret Manager. Format: `secret_name`
|
37368
|
+
# if the secret is in the same project. projects/`project`/secrets/`secret_name`
|
37369
|
+
# if the secret is in a different project.
|
37370
|
+
# Corresponds to the JSON property `secret`
|
37371
|
+
# @return [String]
|
37372
|
+
attr_accessor :secret
|
37373
|
+
|
37374
|
+
# The Cloud Secret Manager secret version. Can be 'latest' for the latest
|
37375
|
+
# version, an integer for a specific version, or a version alias.
|
37376
|
+
# Corresponds to the JSON property `version`
|
37377
|
+
# @return [String]
|
37378
|
+
attr_accessor :version
|
37379
|
+
|
37380
|
+
def initialize(**args)
|
37381
|
+
update!(**args)
|
37382
|
+
end
|
37383
|
+
|
37384
|
+
# Update properties of this object
|
37385
|
+
def update!(**args)
|
37386
|
+
@secret = args[:secret] if args.key?(:secret)
|
37387
|
+
@version = args[:version] if args.key?(:version)
|
37388
|
+
end
|
37389
|
+
end
|
37390
|
+
|
36365
37391
|
# Segment of the content.
|
36366
37392
|
class GoogleCloudAiplatformV1beta1Segment
|
36367
37393
|
include Google::Apis::Core::Hashable
|
@@ -36729,6 +37755,81 @@ module Google
|
|
36729
37755
|
end
|
36730
37756
|
end
|
36731
37757
|
|
37758
|
+
# Configuration for Speculative Decoding.
|
37759
|
+
class GoogleCloudAiplatformV1beta1SpeculativeDecodingSpec
|
37760
|
+
include Google::Apis::Core::Hashable
|
37761
|
+
|
37762
|
+
# Draft model speculation works by using the smaller model to generate candidate
|
37763
|
+
# tokens for speculative decoding.
|
37764
|
+
# Corresponds to the JSON property `draftModelSpeculation`
|
37765
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1SpeculativeDecodingSpecDraftModelSpeculation]
|
37766
|
+
attr_accessor :draft_model_speculation
|
37767
|
+
|
37768
|
+
# N-Gram speculation works by trying to find matching tokens in the previous
|
37769
|
+
# prompt sequence and use those as speculation for generating new tokens.
|
37770
|
+
# Corresponds to the JSON property `ngramSpeculation`
|
37771
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1SpeculativeDecodingSpecNgramSpeculation]
|
37772
|
+
attr_accessor :ngram_speculation
|
37773
|
+
|
37774
|
+
# The number of speculative tokens to generate at each step.
|
37775
|
+
# Corresponds to the JSON property `speculativeTokenCount`
|
37776
|
+
# @return [Fixnum]
|
37777
|
+
attr_accessor :speculative_token_count
|
37778
|
+
|
37779
|
+
def initialize(**args)
|
37780
|
+
update!(**args)
|
37781
|
+
end
|
37782
|
+
|
37783
|
+
# Update properties of this object
|
37784
|
+
def update!(**args)
|
37785
|
+
@draft_model_speculation = args[:draft_model_speculation] if args.key?(:draft_model_speculation)
|
37786
|
+
@ngram_speculation = args[:ngram_speculation] if args.key?(:ngram_speculation)
|
37787
|
+
@speculative_token_count = args[:speculative_token_count] if args.key?(:speculative_token_count)
|
37788
|
+
end
|
37789
|
+
end
|
37790
|
+
|
37791
|
+
# Draft model speculation works by using the smaller model to generate candidate
|
37792
|
+
# tokens for speculative decoding.
|
37793
|
+
class GoogleCloudAiplatformV1beta1SpeculativeDecodingSpecDraftModelSpeculation
|
37794
|
+
include Google::Apis::Core::Hashable
|
37795
|
+
|
37796
|
+
# Required. The resource name of the draft model.
|
37797
|
+
# Corresponds to the JSON property `draftModel`
|
37798
|
+
# @return [String]
|
37799
|
+
attr_accessor :draft_model
|
37800
|
+
|
37801
|
+
def initialize(**args)
|
37802
|
+
update!(**args)
|
37803
|
+
end
|
37804
|
+
|
37805
|
+
# Update properties of this object
|
37806
|
+
def update!(**args)
|
37807
|
+
@draft_model = args[:draft_model] if args.key?(:draft_model)
|
37808
|
+
end
|
37809
|
+
end
|
37810
|
+
|
37811
|
+
# N-Gram speculation works by trying to find matching tokens in the previous
|
37812
|
+
# prompt sequence and use those as speculation for generating new tokens.
|
37813
|
+
class GoogleCloudAiplatformV1beta1SpeculativeDecodingSpecNgramSpeculation
|
37814
|
+
include Google::Apis::Core::Hashable
|
37815
|
+
|
37816
|
+
# The number of last N input tokens used as ngram to search/match against the
|
37817
|
+
# previous prompt sequence. This is equal to the N in N-Gram. The default value
|
37818
|
+
# is 3 if not specified.
|
37819
|
+
# Corresponds to the JSON property `ngramSize`
|
37820
|
+
# @return [Fixnum]
|
37821
|
+
attr_accessor :ngram_size
|
37822
|
+
|
37823
|
+
def initialize(**args)
|
37824
|
+
update!(**args)
|
37825
|
+
end
|
37826
|
+
|
37827
|
+
# Update properties of this object
|
37828
|
+
def update!(**args)
|
37829
|
+
@ngram_size = args[:ngram_size] if args.key?(:ngram_size)
|
37830
|
+
end
|
37831
|
+
end
|
37832
|
+
|
36732
37833
|
# The speech generation config.
|
36733
37834
|
class GoogleCloudAiplatformV1beta1SpeechConfig
|
36734
37835
|
include Google::Apis::Core::Hashable
|
@@ -38454,6 +39555,12 @@ module Google
|
|
38454
39555
|
class GoogleCloudAiplatformV1beta1SupervisedTuningDataStats
|
38455
39556
|
include Google::Apis::Core::Hashable
|
38456
39557
|
|
39558
|
+
# Output only. For each index in `truncated_example_indices`, the user-facing
|
39559
|
+
# reason why the example was dropped. Must not include example itself.
|
39560
|
+
# Corresponds to the JSON property `droppedExampleReasons`
|
39561
|
+
# @return [Array<String>]
|
39562
|
+
attr_accessor :dropped_example_reasons
|
39563
|
+
|
38457
39564
|
# Output only. Number of billable characters in the tuning dataset.
|
38458
39565
|
# Corresponds to the JSON property `totalBillableCharacterCount`
|
38459
39566
|
# @return [Fixnum]
|
@@ -38464,7 +39571,9 @@ module Google
|
|
38464
39571
|
# @return [Fixnum]
|
38465
39572
|
attr_accessor :total_billable_token_count
|
38466
39573
|
|
38467
|
-
# The number of examples in the dataset that have been
|
39574
|
+
# Output only. The number of examples in the dataset that have been dropped. An
|
39575
|
+
# example can be dropped for reasons including: too many tokens, contains an
|
39576
|
+
# invalid image, contains too many images, etc.
|
38468
39577
|
# Corresponds to the JSON property `totalTruncatedExampleCount`
|
38469
39578
|
# @return [Fixnum]
|
38470
39579
|
attr_accessor :total_truncated_example_count
|
@@ -38474,7 +39583,8 @@ module Google
|
|
38474
39583
|
# @return [Fixnum]
|
38475
39584
|
attr_accessor :total_tuning_character_count
|
38476
39585
|
|
38477
|
-
# A partial sample of the indices (starting from 1) of the
|
39586
|
+
# Output only. A partial sample of the indices (starting from 1) of the dropped
|
39587
|
+
# examples.
|
38478
39588
|
# Corresponds to the JSON property `truncatedExampleIndices`
|
38479
39589
|
# @return [Array<Fixnum>]
|
38480
39590
|
attr_accessor :truncated_example_indices
|
@@ -38515,6 +39625,7 @@ module Google
|
|
38515
39625
|
|
38516
39626
|
# Update properties of this object
|
38517
39627
|
def update!(**args)
|
39628
|
+
@dropped_example_reasons = args[:dropped_example_reasons] if args.key?(:dropped_example_reasons)
|
38518
39629
|
@total_billable_character_count = args[:total_billable_character_count] if args.key?(:total_billable_character_count)
|
38519
39630
|
@total_billable_token_count = args[:total_billable_token_count] if args.key?(:total_billable_token_count)
|
38520
39631
|
@total_truncated_example_count = args[:total_truncated_example_count] if args.key?(:total_truncated_example_count)
|
@@ -39445,6 +40556,12 @@ module Google
|
|
39445
40556
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ToolCodeExecution]
|
39446
40557
|
attr_accessor :code_execution
|
39447
40558
|
|
40559
|
+
# Tool to search public web data, powered by Vertex AI Search and Sec4
|
40560
|
+
# compliance.
|
40561
|
+
# Corresponds to the JSON property `enterpriseWebSearch`
|
40562
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1EnterpriseWebSearch]
|
40563
|
+
attr_accessor :enterprise_web_search
|
40564
|
+
|
39448
40565
|
# Optional. Function tool type. One or more function declarations to be passed
|
39449
40566
|
# to the model along with the current user query. Model may decide to call a
|
39450
40567
|
# subset of these functions by populating FunctionCall in the response. User
|
@@ -39478,6 +40595,7 @@ module Google
|
|
39478
40595
|
# Update properties of this object
|
39479
40596
|
def update!(**args)
|
39480
40597
|
@code_execution = args[:code_execution] if args.key?(:code_execution)
|
40598
|
+
@enterprise_web_search = args[:enterprise_web_search] if args.key?(:enterprise_web_search)
|
39481
40599
|
@function_declarations = args[:function_declarations] if args.key?(:function_declarations)
|
39482
40600
|
@google_search = args[:google_search] if args.key?(:google_search)
|
39483
40601
|
@google_search_retrieval = args[:google_search_retrieval] if args.key?(:google_search_retrieval)
|
@@ -39635,6 +40753,11 @@ module Google
|
|
39635
40753
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1FunctionCallingConfig]
|
39636
40754
|
attr_accessor :function_calling_config
|
39637
40755
|
|
40756
|
+
# Retrieval config.
|
40757
|
+
# Corresponds to the JSON property `retrievalConfig`
|
40758
|
+
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1RetrievalConfig]
|
40759
|
+
attr_accessor :retrieval_config
|
40760
|
+
|
39638
40761
|
def initialize(**args)
|
39639
40762
|
update!(**args)
|
39640
40763
|
end
|
@@ -39642,6 +40765,7 @@ module Google
|
|
39642
40765
|
# Update properties of this object
|
39643
40766
|
def update!(**args)
|
39644
40767
|
@function_calling_config = args[:function_calling_config] if args.key?(:function_calling_config)
|
40768
|
+
@retrieval_config = args[:retrieval_config] if args.key?(:retrieval_config)
|
39645
40769
|
end
|
39646
40770
|
end
|
39647
40771
|
|
@@ -41024,7 +42148,7 @@ module Google
|
|
41024
42148
|
end
|
41025
42149
|
end
|
41026
42150
|
|
41027
|
-
# The Model Registry Model and Online Prediction Endpoint
|
42151
|
+
# The Model Registry Model and Online Prediction Endpoint associated with this
|
41028
42152
|
# TuningJob.
|
41029
42153
|
class GoogleCloudAiplatformV1beta1TunedModel
|
41030
42154
|
include Google::Apis::Core::Hashable
|
@@ -41214,7 +42338,7 @@ module Google
|
|
41214
42338
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1SupervisedTuningSpec]
|
41215
42339
|
attr_accessor :supervised_tuning_spec
|
41216
42340
|
|
41217
|
-
# The Model Registry Model and Online Prediction Endpoint
|
42341
|
+
# The Model Registry Model and Online Prediction Endpoint associated with this
|
41218
42342
|
# TuningJob.
|
41219
42343
|
# Corresponds to the JSON property `tunedModel`
|
41220
42344
|
# @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1TunedModel]
|
@@ -42075,12 +43199,13 @@ module Google
|
|
42075
43199
|
end
|
42076
43200
|
end
|
42077
43201
|
|
42078
|
-
# Retrieve from Vertex AI Search datastore for grounding.
|
42079
|
-
# google.com/products/agent-
|
43202
|
+
# Retrieve from Vertex AI Search datastore or engine for grounding. datastore
|
43203
|
+
# and engine are mutually exclusive. See https://cloud.google.com/products/agent-
|
43204
|
+
# builder
|
42080
43205
|
class GoogleCloudAiplatformV1beta1VertexAiSearch
|
42081
43206
|
include Google::Apis::Core::Hashable
|
42082
43207
|
|
42083
|
-
#
|
43208
|
+
# Optional. Fully-qualified Vertex AI Search data store resource ID. Format: `
|
42084
43209
|
# projects/`project`/locations/`location`/collections/`collection`/dataStores/`
|
42085
43210
|
# dataStore``
|
42086
43211
|
# Corresponds to the JSON property `datastore`
|
@@ -43213,6 +44338,34 @@ module Google
|
|
43213
44338
|
end
|
43214
44339
|
end
|
43215
44340
|
|
44341
|
+
# An object that represents a latitude/longitude pair. This is expressed as a
|
44342
|
+
# pair of doubles to represent degrees latitude and degrees longitude. Unless
|
44343
|
+
# specified otherwise, this object must conform to the WGS84 standard. Values
|
44344
|
+
# must be within normalized ranges.
|
44345
|
+
class GoogleTypeLatLng
|
44346
|
+
include Google::Apis::Core::Hashable
|
44347
|
+
|
44348
|
+
# The latitude in degrees. It must be in the range [-90.0, +90.0].
|
44349
|
+
# Corresponds to the JSON property `latitude`
|
44350
|
+
# @return [Float]
|
44351
|
+
attr_accessor :latitude
|
44352
|
+
|
44353
|
+
# The longitude in degrees. It must be in the range [-180.0, +180.0].
|
44354
|
+
# Corresponds to the JSON property `longitude`
|
44355
|
+
# @return [Float]
|
44356
|
+
attr_accessor :longitude
|
44357
|
+
|
44358
|
+
def initialize(**args)
|
44359
|
+
update!(**args)
|
44360
|
+
end
|
44361
|
+
|
44362
|
+
# Update properties of this object
|
44363
|
+
def update!(**args)
|
44364
|
+
@latitude = args[:latitude] if args.key?(:latitude)
|
44365
|
+
@longitude = args[:longitude] if args.key?(:longitude)
|
44366
|
+
end
|
44367
|
+
end
|
44368
|
+
|
43216
44369
|
# Represents an amount of money with its currency type.
|
43217
44370
|
class GoogleTypeMoney
|
43218
44371
|
include Google::Apis::Core::Hashable
|