google-apis-aiplatform_v1beta1 0.35.0 → 0.37.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -474,7 +474,7 @@ module Google
474
474
  end
475
475
  end
476
476
 
477
- # Create API error message for Vertex Pipeline. Next Id: 3.
477
+ # Create API error message for Vertex Pipeline.
478
478
  class CloudAiPlatformCommonCreatePipelineJobApiErrorDetail
479
479
  include Google::Apis::Core::Hashable
480
480
 
@@ -840,7 +840,8 @@ module Google
840
840
  end
841
841
  end
842
842
 
843
- # The generic reusable api auth config.
843
+ # The generic reusable api auth config. Deprecated. Please use AuthConfig (
844
+ # google/cloud/aiplatform/master/auth.proto) instead.
844
845
  class GoogleCloudAiplatformV1beta1ApiAuth
845
846
  include Google::Apis::Core::Hashable
846
847
 
@@ -1310,15 +1311,22 @@ module Google
1310
1311
  class GoogleCloudAiplatformV1beta1AuthConfigApiKeyConfig
1311
1312
  include Google::Apis::Core::Hashable
1312
1313
 
1313
- # Required. The name of the SecretManager secret version resource storing the
1314
+ # Optional. The name of the SecretManager secret version resource storing the
1314
1315
  # API key. Format: `projects/`project`/secrets/`secret`/versions/`version`` -
1315
- # If specified, the `secretmanager.versions.access` permission should be granted
1316
- # to Vertex AI Extension Service Agent (https://cloud.google.com/vertex-ai/docs/
1317
- # general/access-control#service-agents) on the specified resource.
1316
+ # If both `api_key_secret` and `api_key_string` are specified, this field takes
1317
+ # precedence over `api_key_string`. - If specified, the `secretmanager.versions.
1318
+ # access` permission should be granted to Vertex AI Extension Service Agent (
1319
+ # https://cloud.google.com/vertex-ai/docs/general/access-control#service-agents)
1320
+ # on the specified resource.
1318
1321
  # Corresponds to the JSON property `apiKeySecret`
1319
1322
  # @return [String]
1320
1323
  attr_accessor :api_key_secret
1321
1324
 
1325
+ # Optional. The API key to be used in the request directly.
1326
+ # Corresponds to the JSON property `apiKeyString`
1327
+ # @return [String]
1328
+ attr_accessor :api_key_string
1329
+
1322
1330
  # Required. The location of the API key.
1323
1331
  # Corresponds to the JSON property `httpElementLocation`
1324
1332
  # @return [String]
@@ -1337,6 +1345,7 @@ module Google
1337
1345
  # Update properties of this object
1338
1346
  def update!(**args)
1339
1347
  @api_key_secret = args[:api_key_secret] if args.key?(:api_key_secret)
1348
+ @api_key_string = args[:api_key_string] if args.key?(:api_key_string)
1340
1349
  @http_element_location = args[:http_element_location] if args.key?(:http_element_location)
1341
1350
  @name = args[:name] if args.key?(:name)
1342
1351
  end
@@ -1460,22 +1469,22 @@ module Google
1460
1469
  class GoogleCloudAiplatformV1beta1AutomaticResources
1461
1470
  include Google::Apis::Core::Hashable
1462
1471
 
1463
- # Immutable. The maximum number of replicas this DeployedModel may be deployed
1464
- # on when the traffic against it increases. If the requested value is too large,
1465
- # the deployment will error, but if deployment succeeds then the ability to
1466
- # scale the model to that many replicas is guaranteed (barring service outages).
1467
- # If traffic against the DeployedModel increases beyond what its replicas at
1468
- # maximum may handle, a portion of the traffic will be dropped. If this value is
1469
- # not provided, a no upper bound for scaling under heavy traffic will be assume,
1470
- # though Vertex AI may be unable to scale beyond certain replica number.
1472
+ # Immutable. The maximum number of replicas that may be deployed on when the
1473
+ # traffic against it increases. If the requested value is too large, the
1474
+ # deployment will error, but if deployment succeeds then the ability to scale to
1475
+ # that many replicas is guaranteed (barring service outages). If traffic
1476
+ # increases beyond what its replicas at maximum may handle, a portion of the
1477
+ # traffic will be dropped. If this value is not provided, no upper bound for
1478
+ # scaling under heavy traffic will be assumed, though Vertex AI may be unable to
1479
+ # scale beyond a certain replica number.
1471
1480
  # Corresponds to the JSON property `maxReplicaCount`
1472
1481
  # @return [Fixnum]
1473
1482
  attr_accessor :max_replica_count
1474
1483
 
1475
- # Immutable. The minimum number of replicas this DeployedModel will be always
1476
- # deployed on. If traffic against it increases, it may dynamically be deployed
1477
- # onto more replicas up to max_replica_count, and as traffic decreases, some of
1478
- # these extra replicas may be freed. If the requested value is too large, the
1484
+ # Immutable. The minimum number of replicas that will be always deployed on. If
1485
+ # traffic against it increases, it may dynamically be deployed onto more
1486
+ # replicas up to max_replica_count, and as traffic decreases, some of these
1487
+ # extra replicas may be freed. If the requested value is too large, the
1479
1488
  # deployment will error.
1480
1489
  # Corresponds to the JSON property `minReplicaCount`
1481
1490
  # @return [Fixnum]
@@ -1492,6 +1501,48 @@ module Google
1492
1501
  end
1493
1502
  end
1494
1503
 
1504
+ # Configuration for the autorater. Applicable to both EvaluateInstances and
1505
+ # EvaluateDataset.
1506
+ class GoogleCloudAiplatformV1beta1AutoraterConfig
1507
+ include Google::Apis::Core::Hashable
1508
+
1509
+ # Optional. The fully qualified name of the publisher model or tuned autorater
1510
+ # endpoint to use. Publisher model format: `projects/`project`/locations/`
1511
+ # location`/publishers/*/models/*` Tuned model endpoint format: `projects/`
1512
+ # project`/locations/`location`/endpoints/`endpoint``
1513
+ # Corresponds to the JSON property `autoraterModel`
1514
+ # @return [String]
1515
+ attr_accessor :autorater_model
1516
+
1517
+ # Optional. Whether to flip the candidate and baseline responses. This is only
1518
+ # applicable to the pairwise metric. If enabled, also provide PairwiseMetricSpec.
1519
+ # candidate_response_field_name and PairwiseMetricSpec.
1520
+ # baseline_response_field_name. When rendering PairwiseMetricSpec.
1521
+ # metric_prompt_template, the candidate and baseline fields will be flipped for
1522
+ # half of the samples to reduce bias.
1523
+ # Corresponds to the JSON property `flipEnabled`
1524
+ # @return [Boolean]
1525
+ attr_accessor :flip_enabled
1526
+ alias_method :flip_enabled?, :flip_enabled
1527
+
1528
+ # Optional. Number of samples for each instance in the dataset. If not specified,
1529
+ # the default is 4. Minimum value is 1, maximum value is 32.
1530
+ # Corresponds to the JSON property `samplingCount`
1531
+ # @return [Fixnum]
1532
+ attr_accessor :sampling_count
1533
+
1534
+ def initialize(**args)
1535
+ update!(**args)
1536
+ end
1537
+
1538
+ # Update properties of this object. Only keys present in args are assigned.
1539
+ def update!(**args)
1540
+ @autorater_model = args[:autorater_model] if args.key?(:autorater_model)
1541
+ @flip_enabled = args[:flip_enabled] if args.key?(:flip_enabled)
1542
+ @sampling_count = args[:sampling_count] if args.key?(:sampling_count)
1543
+ end
1544
+ end
1545
+
1495
1546
  # The metric specification that defines the target resource utilization (CPU
1496
1547
  # utilization, accelerator's duty cycle, and so on) for calculating the desired
1497
1548
  # replica count.
@@ -2738,7 +2789,7 @@ module Google
2738
2789
  end
2739
2790
  end
2740
2791
 
2741
- # Content blob. It's preferred to send as text directly rather than raw bytes.
2792
+ # Content blob.
2742
2793
  class GoogleCloudAiplatformV1beta1Blob
2743
2794
  include Google::Apis::Core::Hashable
2744
2795
 
@@ -2748,6 +2799,13 @@ module Google
2748
2799
  # @return [String]
2749
2800
  attr_accessor :data
2750
2801
 
2802
+ # Optional. Display name of the blob. Used to provide a label or filename to
2803
+ # distinguish blobs. This field is only returned in PromptMessage for prompt
2804
+ # management. It is not currently used in the Gemini GenerateContent calls.
2805
+ # Corresponds to the JSON property `displayName`
2806
+ # @return [String]
2807
+ attr_accessor :display_name
2808
+
2751
2809
  # Required. The IANA standard MIME type of the source data.
2752
2810
  # Corresponds to the JSON property `mimeType`
2753
2811
  # @return [String]
@@ -2760,6 +2818,7 @@ module Google
2760
2818
  # Update properties of this object
2761
2819
  def update!(**args)
2762
2820
  @data = args[:data] if args.key?(:data)
2821
+ @display_name = args[:display_name] if args.key?(:display_name)
2763
2822
  @mime_type = args[:mime_type] if args.key?(:mime_type)
2764
2823
  end
2765
2824
  end
@@ -2844,7 +2903,7 @@ module Google
2844
2903
  # @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1Content>]
2845
2904
  attr_accessor :contents
2846
2905
 
2847
- # Output only. Creatation time of the cache entry.
2906
+ # Output only. Creation time of the cache entry.
2848
2907
  # Corresponds to the JSON property `createTime`
2849
2908
  # @return [String]
2850
2909
  attr_accessor :create_time
@@ -2861,8 +2920,9 @@ module Google
2861
2920
  # @return [String]
2862
2921
  attr_accessor :expire_time
2863
2922
 
2864
- # Immutable. The name of the publisher model to use for cached content. Format:
2865
- # projects/`project`/locations/`location`/publishers/`publisher`/models/`model`
2923
+ # Immutable. The name of the `Model` to use for cached content. Currently, only
2924
+ # the published Gemini base models are supported, in form of projects/`PROJECT`/
2925
+ # locations/`LOCATION`/publishers/google/models/`MODEL`
2866
2926
  # Corresponds to the JSON property `model`
2867
2927
  # @return [String]
2868
2928
  attr_accessor :model
@@ -4152,6 +4212,11 @@ module Google
4152
4212
  class GoogleCloudAiplatformV1beta1CountTokensResponse
4153
4213
  include Google::Apis::Core::Hashable
4154
4214
 
4215
+ # Output only. List of modalities that were processed in the request input.
4216
+ # Corresponds to the JSON property `promptTokensDetails`
4217
+ # @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ModalityTokenCount>]
4218
+ attr_accessor :prompt_tokens_details
4219
+
4155
4220
  # The total number of billable characters counted across all instances from the
4156
4221
  # request.
4157
4222
  # Corresponds to the JSON property `totalBillableCharacters`
@@ -4169,6 +4234,7 @@ module Google
4169
4234
 
4170
4235
  # Update properties of this object
4171
4236
  def update!(**args)
4237
+ @prompt_tokens_details = args[:prompt_tokens_details] if args.key?(:prompt_tokens_details)
4172
4238
  @total_billable_characters = args[:total_billable_characters] if args.key?(:total_billable_characters)
4173
4239
  @total_tokens = args[:total_tokens] if args.key?(:total_tokens)
4174
4240
  end
@@ -5504,7 +5570,8 @@ module Google
5504
5570
  # @return [String]
5505
5571
  attr_accessor :model_reference
5506
5572
 
5507
- # Output only. Identifier. The resource name of the Dataset.
5573
+ # Output only. Identifier. The resource name of the Dataset. Format: `projects/`
5574
+ # project`/locations/`location`/datasets/`dataset``
5508
5575
  # Corresponds to the JSON property `name`
5509
5576
  # @return [String]
5510
5577
  attr_accessor :name
@@ -5752,7 +5819,9 @@ module Google
5752
5819
  # @return [String]
5753
5820
  attr_accessor :model_reference
5754
5821
 
5755
- # Output only. Identifier. The resource name of the DatasetVersion.
5822
+ # Output only. Identifier. The resource name of the DatasetVersion. Format: `
5823
+ # projects/`project`/locations/`location`/datasets/`dataset`/datasetVersions/`
5824
+ # dataset_version``
5756
5825
  # Corresponds to the JSON property `name`
5757
5826
  # @return [String]
5758
5827
  attr_accessor :name
@@ -5793,8 +5862,8 @@ module Google
5793
5862
  end
5794
5863
  end
5795
5864
 
5796
- # A description of resources that are dedicated to a DeployedModel, and that
5797
- # need a higher degree of manual configuration.
5865
+ # A description of resources that are dedicated to a DeployedModel or
5866
+ # DeployedIndex, and that need a higher degree of manual configuration.
5798
5867
  class GoogleCloudAiplatformV1beta1DedicatedResources
5799
5868
  include Google::Apis::Core::Hashable
5800
5869
 
@@ -5820,36 +5889,33 @@ module Google
5820
5889
  # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1MachineSpec]
5821
5890
  attr_accessor :machine_spec
5822
5891
 
5823
- # Immutable. The maximum number of replicas this DeployedModel may be deployed
5824
- # on when the traffic against it increases. If the requested value is too large,
5825
- # the deployment will error, but if deployment succeeds then the ability to
5826
- # scale the model to that many replicas is guaranteed (barring service outages).
5827
- # If traffic against the DeployedModel increases beyond what its replicas at
5828
- # maximum may handle, a portion of the traffic will be dropped. If this value is
5829
- # not provided, will use min_replica_count as the default value. The value of
5830
- # this field impacts the charge against Vertex CPU and GPU quotas. Specifically,
5831
- # you will be charged for (max_replica_count * number of cores in the selected
5832
- # machine type) and (max_replica_count * number of GPUs per replica in the
5833
- # selected machine type).
5892
+ # Immutable. The maximum number of replicas that may be deployed on when the
5893
+ # traffic against it increases. If the requested value is too large, the
5894
+ # deployment will error, but if deployment succeeds then the ability to scale to
5895
+ # that many replicas is guaranteed (barring service outages). If traffic
5896
+ # increases beyond what its replicas at maximum may handle, a portion of the
5897
+ # traffic will be dropped. If this value is not provided, will use
5898
+ # min_replica_count as the default value. The value of this field impacts the
5899
+ # charge against Vertex CPU and GPU quotas. Specifically, you will be charged
5900
+ # for (max_replica_count * number of cores in the selected machine type) and (
5901
+ # max_replica_count * number of GPUs per replica in the selected machine type).
5834
5902
  # Corresponds to the JSON property `maxReplicaCount`
5835
5903
  # @return [Fixnum]
5836
5904
  attr_accessor :max_replica_count
5837
5905
 
5838
- # Required. Immutable. The minimum number of machine replicas this DeployedModel
5839
- # will be always deployed on. This value must be greater than or equal to 1. If
5840
- # traffic against the DeployedModel increases, it may dynamically be deployed
5841
- # onto more replicas, and as traffic decreases, some of these extra replicas may
5842
- # be freed.
5906
+ # Required. Immutable. The minimum number of machine replicas that will be
5907
+ # always deployed on. This value must be greater than or equal to 1. If traffic
5908
+ # increases, it may dynamically be deployed onto more replicas, and as traffic
5909
+ # decreases, some of these extra replicas may be freed.
5843
5910
  # Corresponds to the JSON property `minReplicaCount`
5844
5911
  # @return [Fixnum]
5845
5912
  attr_accessor :min_replica_count
5846
5913
 
5847
5914
  # Optional. Number of required available replicas for the deployment to succeed.
5848
- # This field is only needed when partial model deployment/mutation is desired.
5849
- # If set, the model deploy/mutate operation will succeed once
5850
- # available_replica_count reaches required_replica_count, and the rest of the
5851
- # replicas will be retried. If not set, the default required_replica_count will
5852
- # be min_replica_count.
5915
+ # This field is only needed when partial deployment/mutation is desired. If set,
5916
+ # the deploy/mutate operation will succeed once available_replica_count reaches
5917
+ # required_replica_count, and the rest of the replicas will be retried. If not
5918
+ # set, the default required_replica_count will be min_replica_count.
5853
5919
  # Corresponds to the JSON property `requiredReplicaCount`
5854
5920
  # @return [Fixnum]
5855
5921
  attr_accessor :required_replica_count
@@ -6259,8 +6325,8 @@ module Google
6259
6325
  attr_accessor :accept_eula
6260
6326
  alias_method :accept_eula?, :accept_eula
6261
6327
 
6262
- # A description of resources that are dedicated to a DeployedModel, and that
6263
- # need a higher degree of manual configuration.
6328
+ # A description of resources that are dedicated to a DeployedModel or
6329
+ # DeployedIndex, and that need a higher degree of manual configuration.
6264
6330
  # Corresponds to the JSON property `dedicatedResources`
6265
6331
  # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DedicatedResources]
6266
6332
  attr_accessor :dedicated_resources
@@ -6277,9 +6343,11 @@ module Google
6277
6343
  # @return [String]
6278
6344
  attr_accessor :hugging_face_access_token
6279
6345
 
6280
- # Required. The name of the PublisherModel resource. Format: `publishers/`
6281
- # publisher`/models/`publisher_model`@`version_id``, or `publishers/hf-`hugging-
6282
- # face-author`/models/`hugging-face-model-name`@001`
6346
+ # Required. The model to deploy. Format: 1. `publishers/`publisher`/models/`
6347
+ # publisher_model`@`version_id``, or `publishers/hf-`hugging-face-author`/models/
6348
+ # `hugging-face-model-name`@001`. 2. Hugging Face model ID like `google/gemma-2-
6349
+ # 2b-it`. 3. Custom model Google Cloud Storage URI like `gs://bucket`. 4. Custom
6350
+ # model zip file like `https://abc.com/a.zip`.
6283
6351
  # Corresponds to the JSON property `model`
6284
6352
  # @return [String]
6285
6353
  attr_accessor :model
@@ -6340,8 +6408,8 @@ module Google
6340
6408
  # @return [String]
6341
6409
  attr_accessor :create_time
6342
6410
 
6343
- # A description of resources that are dedicated to a DeployedModel, and that
6344
- # need a higher degree of manual configuration.
6411
+ # A description of resources that are dedicated to a DeployedModel or
6412
+ # DeployedIndex, and that need a higher degree of manual configuration.
6345
6413
  # Corresponds to the JSON property `dedicatedResources`
6346
6414
  # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DedicatedResources]
6347
6415
  attr_accessor :dedicated_resources
@@ -6553,8 +6621,8 @@ module Google
6553
6621
  # @return [String]
6554
6622
  attr_accessor :create_time
6555
6623
 
6556
- # A description of resources that are dedicated to a DeployedModel, and that
6557
- # need a higher degree of manual configuration.
6624
+ # A description of resources that are dedicated to a DeployedModel or
6625
+ # DeployedIndex, and that need a higher degree of manual configuration.
6558
6626
  # Corresponds to the JSON property `dedicatedResources`
6559
6627
  # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DedicatedResources]
6560
6628
  attr_accessor :dedicated_resources
@@ -6630,6 +6698,11 @@ module Google
6630
6698
  # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1PrivateEndpoints]
6631
6699
  attr_accessor :private_endpoints
6632
6700
 
6701
+ # Configuration for rolling deployments.
6702
+ # Corresponds to the JSON property `rolloutOptions`
6703
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1RolloutOptions]
6704
+ attr_accessor :rollout_options
6705
+
6633
6706
  # The service account that the DeployedModel's container runs as. Specify the
6634
6707
  # email address of the service account. If this service account is not specified,
6635
6708
  # the container runs as a service account that doesn't have access to the
@@ -6646,6 +6719,11 @@ module Google
6646
6719
  # @return [String]
6647
6720
  attr_accessor :shared_resources
6648
6721
 
6722
+ # Configuration for Speculative Decoding.
6723
+ # Corresponds to the JSON property `speculativeDecodingSpec`
6724
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1SpeculativeDecodingSpec]
6725
+ attr_accessor :speculative_decoding_spec
6726
+
6649
6727
  # Runtime status of the deployed model.
6650
6728
  # Corresponds to the JSON property `status`
6651
6729
  # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DeployedModelStatus]
@@ -6676,8 +6754,10 @@ module Google
6676
6754
  @model = args[:model] if args.key?(:model)
6677
6755
  @model_version_id = args[:model_version_id] if args.key?(:model_version_id)
6678
6756
  @private_endpoints = args[:private_endpoints] if args.key?(:private_endpoints)
6757
+ @rollout_options = args[:rollout_options] if args.key?(:rollout_options)
6679
6758
  @service_account = args[:service_account] if args.key?(:service_account)
6680
6759
  @shared_resources = args[:shared_resources] if args.key?(:shared_resources)
6760
+ @speculative_decoding_spec = args[:speculative_decoding_spec] if args.key?(:speculative_decoding_spec)
6681
6761
  @status = args[:status] if args.key?(:status)
6682
6762
  @system_labels = args[:system_labels] if args.key?(:system_labels)
6683
6763
  end
@@ -6749,8 +6829,8 @@ module Google
6749
6829
  # @return [String]
6750
6830
  attr_accessor :create_time
6751
6831
 
6752
- # A description of resources that are dedicated to a DeployedModel, and that
6753
- # need a higher degree of manual configuration.
6832
+ # A description of resources that are dedicated to a DeployedModel or
6833
+ # DeployedIndex, and that need a higher degree of manual configuration.
6754
6834
  # Corresponds to the JSON property `dedicatedResources`
6755
6835
  # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DedicatedResources]
6756
6836
  attr_accessor :dedicated_resources
@@ -7047,9 +7127,9 @@ module Google
7047
7127
  # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DistillationHyperParameters]
7048
7128
  attr_accessor :hyper_parameters
7049
7129
 
7050
- # Required. Deprecated. A path in a Cloud Storage bucket, which will be treated
7051
- # as the root output directory of the distillation pipeline. It is used by the
7052
- # system to generate the paths of output artifacts.
7130
+ # Deprecated. A path in a Cloud Storage bucket, which will be treated as the
7131
+ # root output directory of the distillation pipeline. It is used by the system
7132
+ # to generate the paths of output artifacts.
7053
7133
  # Corresponds to the JSON property `pipelineRootDirectory`
7054
7134
  # @return [String]
7055
7135
  attr_accessor :pipeline_root_directory
@@ -7060,7 +7140,7 @@ module Google
7060
7140
  # @return [String]
7061
7141
  attr_accessor :student_model
7062
7142
 
7063
- # Required. Cloud Storage path to file containing training dataset for tuning.
7143
+ # Deprecated. Cloud Storage path to file containing training dataset for tuning.
7064
7144
  # The dataset must be formatted as a JSONL file.
7065
7145
  # Corresponds to the JSON property `trainingDatasetUri`
7066
7146
  # @return [String]
@@ -7232,6 +7312,11 @@ module Google
7232
7312
  # @return [String]
7233
7313
  attr_accessor :etag
7234
7314
 
7315
+ # Configuration for GenAiAdvancedFeatures.
7316
+ # Corresponds to the JSON property `genAiAdvancedFeaturesConfig`
7317
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GenAiAdvancedFeaturesConfig]
7318
+ attr_accessor :gen_ai_advanced_features_config
7319
+
7235
7320
  # The labels with user-defined metadata to organize your Endpoints. Label keys
7236
7321
  # and values can be no longer than 64 characters (Unicode codepoints), can only
7237
7322
  # contain lowercase letters, numeric characters, underscores and dashes.
@@ -7318,6 +7403,7 @@ module Google
7318
7403
  @enable_private_service_connect = args[:enable_private_service_connect] if args.key?(:enable_private_service_connect)
7319
7404
  @encryption_spec = args[:encryption_spec] if args.key?(:encryption_spec)
7320
7405
  @etag = args[:etag] if args.key?(:etag)
7406
+ @gen_ai_advanced_features_config = args[:gen_ai_advanced_features_config] if args.key?(:gen_ai_advanced_features_config)
7321
7407
  @labels = args[:labels] if args.key?(:labels)
7322
7408
  @model_deployment_monitoring_job = args[:model_deployment_monitoring_job] if args.key?(:model_deployment_monitoring_job)
7323
7409
  @name = args[:name] if args.key?(:name)
@@ -7545,10 +7631,54 @@ module Google
7545
7631
  end
7546
7632
  end
7547
7633
 
7634
+ # Request message for EvaluationService.EvaluateDataset.
7635
+ class GoogleCloudAiplatformV1beta1EvaluateDatasetRequest
7636
+ include Google::Apis::Core::Hashable
7637
+
7638
+ # Configuration for the autorater. Applicable to both EvaluateInstances and
7639
+ # EvaluateDataset.
7640
+ # Corresponds to the JSON property `autoraterConfig`
7641
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1AutoraterConfig]
7642
+ attr_accessor :autorater_config
7643
+
7644
+ # The dataset used for evaluation.
7645
+ # Corresponds to the JSON property `dataset`
7646
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1EvaluationDataset]
7647
+ attr_accessor :dataset
7648
+
7649
+ # Required. The metrics used for evaluation.
7650
+ # Corresponds to the JSON property `metrics`
7651
+ # @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1Metric>]
7652
+ attr_accessor :metrics
7653
+
7654
+ # Configuration for the evaluation output.
7655
+ # Corresponds to the JSON property `outputConfig`
7656
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1OutputConfig]
7657
+ attr_accessor :output_config
7658
+
7659
+ def initialize(**args)
7660
+ update!(**args)
7661
+ end
7662
+
7663
+ # Update properties of this object. Only keys present in args are assigned.
7664
+ def update!(**args)
7665
+ @autorater_config = args[:autorater_config] if args.key?(:autorater_config)
7666
+ @dataset = args[:dataset] if args.key?(:dataset)
7667
+ @metrics = args[:metrics] if args.key?(:metrics)
7668
+ @output_config = args[:output_config] if args.key?(:output_config)
7669
+ end
7670
+ end
7671
+
7548
7672
  # Request message for EvaluationService.EvaluateInstances.
7549
7673
  class GoogleCloudAiplatformV1beta1EvaluateInstancesRequest
7550
7674
  include Google::Apis::Core::Hashable
7551
7675
 
7676
+ # The configs for autorater. This is applicable to both EvaluateInstances and
7677
+ # EvaluateDataset.
7678
+ # Corresponds to the JSON property `autoraterConfig`
7679
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1AutoraterConfig]
7680
+ attr_accessor :autorater_config
7681
+
7552
7682
  # Input for bleu metric.
7553
7683
  # Corresponds to the JSON property `bleuInput`
7554
7684
  # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1BleuInput]
@@ -7710,6 +7840,7 @@ module Google
7710
7840
 
7711
7841
  # Update properties of this object
7712
7842
  def update!(**args)
7843
+ @autorater_config = args[:autorater_config] if args.key?(:autorater_config)
7713
7844
  @bleu_input = args[:bleu_input] if args.key?(:bleu_input)
7714
7845
  @coherence_input = args[:coherence_input] if args.key?(:coherence_input)
7715
7846
  @comet_input = args[:comet_input] if args.key?(:comet_input)
@@ -8049,6 +8180,31 @@ module Google
8049
8180
  end
8050
8181
  end
8051
8182
 
8183
+ # The dataset used for evaluation.
8184
+ class GoogleCloudAiplatformV1beta1EvaluationDataset
8185
+ include Google::Apis::Core::Hashable
8186
+
8187
+ # The BigQuery location for the input content.
8188
+ # Corresponds to the JSON property `bigquerySource`
8189
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1BigQuerySource]
8190
+ attr_accessor :bigquery_source
8191
+
8192
+ # The Google Cloud Storage location for the input content.
8193
+ # Corresponds to the JSON property `gcsSource`
8194
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GcsSource]
8195
+ attr_accessor :gcs_source
8196
+
8197
+ def initialize(**args)
8198
+ update!(**args)
8199
+ end
8200
+
8201
+ # Update properties of this object. Only keys present in args are assigned.
8202
+ def update!(**args)
8203
+ @bigquery_source = args[:bigquery_source] if args.key?(:bigquery_source)
8204
+ @gcs_source = args[:gcs_source] if args.key?(:gcs_source)
8205
+ end
8206
+ end
8207
+
8052
8208
  # An edge describing the relationship between an Artifact and an Execution in a
8053
8209
  # lineage graph.
8054
8210
  class GoogleCloudAiplatformV1beta1Event
@@ -9572,6 +9728,51 @@ module Google
9572
9728
  end
9573
9729
  end
9574
9730
 
9731
+ # Runtime operation information for ModelGardenService.ExportPublisherModel.
9732
+ class GoogleCloudAiplatformV1beta1ExportPublisherModelOperationMetadata
9733
+ include Google::Apis::Core::Hashable
9734
+
9735
+ # Generic metadata shared by all operations.
9736
+ # Corresponds to the JSON property `genericMetadata`
9737
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GenericOperationMetadata]
9738
+ attr_accessor :generic_metadata
9739
+
9740
+ def initialize(**args)
9741
+ update!(**args)
9742
+ end
9743
+
9744
+ # Update properties of this object. Only keys present in args are assigned.
9745
+ def update!(**args)
9746
+ @generic_metadata = args[:generic_metadata] if args.key?(:generic_metadata)
9747
+ end
9748
+ end
9749
+
9750
+ # Response message for ModelGardenService.ExportPublisherModel.
9751
+ class GoogleCloudAiplatformV1beta1ExportPublisherModelResponse
9752
+ include Google::Apis::Core::Hashable
9753
+
9754
+ # The destination URI of the model weights.
9755
+ # Corresponds to the JSON property `destinationUri`
9756
+ # @return [String]
9757
+ attr_accessor :destination_uri
9758
+
9759
+ # The name of the PublisherModel resource. Format: `publishers/`publisher`/
9760
+ # models/`publisher_model`@`version_id``
9761
+ # Corresponds to the JSON property `publisherModel`
9762
+ # @return [String]
9763
+ attr_accessor :publisher_model
9764
+
9765
+ def initialize(**args)
9766
+ update!(**args)
9767
+ end
9768
+
9769
+ # Update properties of this object. Only keys present in args are assigned.
9770
+ def update!(**args)
9771
+ @destination_uri = args[:destination_uri] if args.key?(:destination_uri)
9772
+ @publisher_model = args[:publisher_model] if args.key?(:publisher_model)
9773
+ end
9774
+ end
9775
+
9575
9776
  # Request message for TensorboardService.ExportTensorboardTimeSeriesData.
9576
9777
  class GoogleCloudAiplatformV1beta1ExportTensorboardTimeSeriesDataRequest
9577
9778
  include Google::Apis::Core::Hashable
@@ -12183,6 +12384,14 @@ module Google
12183
12384
  class GoogleCloudAiplatformV1beta1FileData
12184
12385
  include Google::Apis::Core::Hashable
12185
12386
 
12387
+ # Optional. Display name of the file data. Used to provide a label or filename
12388
+ # to distinguish file data entries. This field is only returned in PromptMessage for
12389
+ # prompt management. It is not currently used in the Gemini GenerateContent
12390
+ # calls.
12391
+ # Corresponds to the JSON property `displayName`
12392
+ # @return [String]
12393
+ attr_accessor :display_name
12394
+
12186
12395
  # Required. URI.
12187
12396
  # Corresponds to the JSON property `fileUri`
12188
12397
  # @return [String]
@@ -12199,6 +12408,7 @@ module Google
12199
12408
 
12200
12409
  # Update properties of this object
12201
12410
  def update!(**args)
12411
+ @display_name = args[:display_name] if args.key?(:display_name)
12202
12412
  @file_uri = args[:file_uri] if args.key?(:file_uri)
12203
12413
  @mime_type = args[:mime_type] if args.key?(:mime_type)
12204
12414
  end
@@ -12881,6 +13091,47 @@ module Google
12881
13091
  end
12882
13092
  end
12883
13093
 
13094
+ # Configuration for GenAiAdvancedFeatures.
13095
+ class GoogleCloudAiplatformV1beta1GenAiAdvancedFeaturesConfig
13096
+ include Google::Apis::Core::Hashable
13097
+
13098
+ # Configuration for Retrieval Augmented Generation feature.
13099
+ # Corresponds to the JSON property `ragConfig`
13100
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GenAiAdvancedFeaturesConfigRagConfig]
13101
+ attr_accessor :rag_config
13102
+
13103
+ def initialize(**args)
13104
+ update!(**args)
13105
+ end
13106
+
13107
+ # Update properties of this object
13108
+ def update!(**args)
13109
+ @rag_config = args[:rag_config] if args.key?(:rag_config)
13110
+ end
13111
+ end
13112
+
13113
+ # Configuration for Retrieval Augmented Generation feature.
13114
+ class GoogleCloudAiplatformV1beta1GenAiAdvancedFeaturesConfigRagConfig
13115
+ include Google::Apis::Core::Hashable
13116
+
13117
+ # If true, enable Retrieval Augmented Generation in ChatCompletion request. Once
13118
+ # enabled, the endpoint will be identified as GenAI endpoint and Arthedain
13119
+ # router will be used.
13120
+ # Corresponds to the JSON property `enableRag`
13121
+ # @return [Boolean]
13122
+ attr_accessor :enable_rag
13123
+ alias_method :enable_rag?, :enable_rag
13124
+
13125
+ def initialize(**args)
13126
+ update!(**args)
13127
+ end
13128
+
13129
+ # Update properties of this object
13130
+ def update!(**args)
13131
+ @enable_rag = args[:enable_rag] if args.key?(:enable_rag)
13132
+ end
13133
+ end
13134
+
12884
13135
  # Request message for NotebookInternalService.GenerateAccessToken.
12885
13136
  class GoogleCloudAiplatformV1beta1GenerateAccessTokenRequest
12886
13137
  include Google::Apis::Core::Hashable
@@ -13028,6 +13279,11 @@ module Google
13028
13279
  # @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1Candidate>]
13029
13280
  attr_accessor :candidates
13030
13281
 
13282
+ # Output only. Timestamp when the request is made to the server.
13283
+ # Corresponds to the JSON property `createTime`
13284
+ # @return [String]
13285
+ attr_accessor :create_time
13286
+
13031
13287
  # Output only. The model version used to generate the response.
13032
13288
  # Corresponds to the JSON property `modelVersion`
13033
13289
  # @return [String]
@@ -13038,6 +13294,12 @@ module Google
13038
13294
  # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GenerateContentResponsePromptFeedback]
13039
13295
  attr_accessor :prompt_feedback
13040
13296
 
13297
+ # Output only. response_id is used to identify each response. It is the encoding
13298
+ # of the event_id.
13299
+ # Corresponds to the JSON property `responseId`
13300
+ # @return [String]
13301
+ attr_accessor :response_id
13302
+
13041
13303
  # Usage metadata about response(s).
13042
13304
  # Corresponds to the JSON property `usageMetadata`
13043
13305
  # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GenerateContentResponseUsageMetadata]
@@ -13050,8 +13312,10 @@ module Google
13050
13312
  # Update properties of this object
13051
13313
  def update!(**args)
13052
13314
  @candidates = args[:candidates] if args.key?(:candidates)
13315
+ @create_time = args[:create_time] if args.key?(:create_time)
13053
13316
  @model_version = args[:model_version] if args.key?(:model_version)
13054
13317
  @prompt_feedback = args[:prompt_feedback] if args.key?(:prompt_feedback)
13318
+ @response_id = args[:response_id] if args.key?(:response_id)
13055
13319
  @usage_metadata = args[:usage_metadata] if args.key?(:usage_metadata)
13056
13320
  end
13057
13321
  end
@@ -13091,6 +13355,11 @@ module Google
13091
13355
  class GoogleCloudAiplatformV1beta1GenerateContentResponseUsageMetadata
13092
13356
  include Google::Apis::Core::Hashable
13093
13357
 
13358
+ # Output only. List of modalities of the cached content in the request input.
13359
+ # Corresponds to the JSON property `cacheTokensDetails`
13360
+ # @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ModalityTokenCount>]
13361
+ attr_accessor :cache_tokens_details
13362
+
13094
13363
  # Output only. Number of tokens in the cached part in the input (the cached
13095
13364
  # content).
13096
13365
  # Corresponds to the JSON property `cachedContentTokenCount`
@@ -13102,6 +13371,11 @@ module Google
13102
13371
  # @return [Fixnum]
13103
13372
  attr_accessor :candidates_token_count
13104
13373
 
13374
+ # Output only. List of modalities that were returned in the response.
13375
+ # Corresponds to the JSON property `candidatesTokensDetails`
13376
+ # @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ModalityTokenCount>]
13377
+ attr_accessor :candidates_tokens_details
13378
+
13105
13379
  # Number of tokens in the request. When `cached_content` is set, this is still
13106
13380
  # the total effective prompt size meaning this includes the number of tokens in
13107
13381
  # the cached content.
@@ -13109,6 +13383,11 @@ module Google
13109
13383
  # @return [Fixnum]
13110
13384
  attr_accessor :prompt_token_count
13111
13385
 
13386
+ # Output only. List of modalities that were processed in the request input.
13387
+ # Corresponds to the JSON property `promptTokensDetails`
13388
+ # @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ModalityTokenCount>]
13389
+ attr_accessor :prompt_tokens_details
13390
+
13112
13391
  # Total token count for prompt and response candidates.
13113
13392
  # Corresponds to the JSON property `totalTokenCount`
13114
13393
  # @return [Fixnum]
@@ -13120,9 +13399,12 @@ module Google
13120
13399
 
13121
13400
  # Update properties of this object
13122
13401
  def update!(**args)
13402
+ @cache_tokens_details = args[:cache_tokens_details] if args.key?(:cache_tokens_details)
13123
13403
  @cached_content_token_count = args[:cached_content_token_count] if args.key?(:cached_content_token_count)
13124
13404
  @candidates_token_count = args[:candidates_token_count] if args.key?(:candidates_token_count)
13405
+ @candidates_tokens_details = args[:candidates_tokens_details] if args.key?(:candidates_tokens_details)
13125
13406
  @prompt_token_count = args[:prompt_token_count] if args.key?(:prompt_token_count)
13407
+ @prompt_tokens_details = args[:prompt_tokens_details] if args.key?(:prompt_tokens_details)
13126
13408
  @total_token_count = args[:total_token_count] if args.key?(:total_token_count)
13127
13409
  end
13128
13410
  end
@@ -13189,6 +13471,11 @@ module Google
13189
13471
  # @return [Fixnum]
13190
13472
  attr_accessor :max_output_tokens
13191
13473
 
13474
+ # Optional. If specified, the media resolution specified will be used.
13475
+ # Corresponds to the JSON property `mediaResolution`
13476
+ # @return [String]
13477
+ attr_accessor :media_resolution
13478
+
13192
13479
  # Optional. Positive penalties.
13193
13480
  # Corresponds to the JSON property `presencePenalty`
13194
13481
  # @return [Float]
@@ -13246,11 +13533,6 @@ module Google
13246
13533
  # @return [Float]
13247
13534
  attr_accessor :temperature
13248
13535
 
13249
- # Optional. If specified, the token resolution specified will be used.
13250
- # Corresponds to the JSON property `tokenResolution`
13251
- # @return [String]
13252
- attr_accessor :token_resolution
13253
-
13254
13536
  # Optional. If specified, top-k sampling will be used.
13255
13537
  # Corresponds to the JSON property `topK`
13256
13538
  # @return [Float]
@@ -13272,6 +13554,7 @@ module Google
13272
13554
  @frequency_penalty = args[:frequency_penalty] if args.key?(:frequency_penalty)
13273
13555
  @logprobs = args[:logprobs] if args.key?(:logprobs)
13274
13556
  @max_output_tokens = args[:max_output_tokens] if args.key?(:max_output_tokens)
13557
+ @media_resolution = args[:media_resolution] if args.key?(:media_resolution)
13275
13558
  @presence_penalty = args[:presence_penalty] if args.key?(:presence_penalty)
13276
13559
  @response_logprobs = args[:response_logprobs] if args.key?(:response_logprobs)
13277
13560
  @response_mime_type = args[:response_mime_type] if args.key?(:response_mime_type)
@@ -13282,7 +13565,6 @@ module Google
13282
13565
  @speech_config = args[:speech_config] if args.key?(:speech_config)
13283
13566
  @stop_sequences = args[:stop_sequences] if args.key?(:stop_sequences)
13284
13567
  @temperature = args[:temperature] if args.key?(:temperature)
13285
- @token_resolution = args[:token_resolution] if args.key?(:token_resolution)
13286
13568
  @top_k = args[:top_k] if args.key?(:top_k)
13287
13569
  @top_p = args[:top_p] if args.key?(:top_p)
13288
13570
  end
@@ -16075,6 +16357,32 @@ module Google
16075
16357
  end
16076
16358
  end
16077
16359
 
16360
+ # Response message for ModelService.ListModelVersionCheckpoints
16361
+ class GoogleCloudAiplatformV1beta1ListModelVersionCheckpointsResponse
16362
+ include Google::Apis::Core::Hashable
16363
+
16364
+ # List of Model Version checkpoints.
16365
+ # Corresponds to the JSON property `checkpoints`
16366
+ # @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ModelVersionCheckpoint>]
16367
+ attr_accessor :checkpoints
16368
+
16369
+ # A token to retrieve the next page of results. Pass to
16370
+ # ListModelVersionCheckpointsRequest.page_token to obtain that page.
16371
+ # Corresponds to the JSON property `nextPageToken`
16372
+ # @return [String]
16373
+ attr_accessor :next_page_token
16374
+
16375
+ def initialize(**args)
16376
+ update!(**args)
16377
+ end
16378
+
16379
+ # Update properties of this object
16380
+ def update!(**args)
16381
+ @checkpoints = args[:checkpoints] if args.key?(:checkpoints)
16382
+ @next_page_token = args[:next_page_token] if args.key?(:next_page_token)
16383
+ end
16384
+ end
16385
+
16078
16386
  # Response message for ModelService.ListModelVersions
16079
16387
  class GoogleCloudAiplatformV1beta1ListModelVersionsResponse
16080
16388
  include Google::Apis::Core::Hashable
@@ -17147,6 +17455,58 @@ module Google
17147
17455
  end
17148
17456
  end
17149
17457
 
17458
+ # The metric used for dataset level evaluation.
17459
+ class GoogleCloudAiplatformV1beta1Metric
17460
+ include Google::Apis::Core::Hashable
17461
+
17462
+ # Optional. The aggregation metrics to use.
17463
+ # Corresponds to the JSON property `aggregationMetrics`
17464
+ # @return [Array<String>]
17465
+ attr_accessor :aggregation_metrics
17466
+
17467
+ # Spec for bleu score metric - calculates the precision of n-grams in the
17468
+ # prediction as compared to reference - returns a score ranging between 0 to 1.
17469
+ # Corresponds to the JSON property `bleuSpec`
17470
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1BleuSpec]
17471
+ attr_accessor :bleu_spec
17472
+
17473
+ # Spec for exact match metric - returns 1 if prediction and reference exactly
17474
+ # matches, otherwise 0.
17475
+ # Corresponds to the JSON property `exactMatchSpec`
17476
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ExactMatchSpec]
17477
+ attr_accessor :exact_match_spec
17478
+
17479
+ # Spec for pairwise metric.
17480
+ # Corresponds to the JSON property `pairwiseMetricSpec`
17481
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1PairwiseMetricSpec]
17482
+ attr_accessor :pairwise_metric_spec
17483
+
17484
+ # Spec for pointwise metric.
17485
+ # Corresponds to the JSON property `pointwiseMetricSpec`
17486
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1PointwiseMetricSpec]
17487
+ attr_accessor :pointwise_metric_spec
17488
+
17489
+ # Spec for rouge score metric - calculates the recall of n-grams in prediction
17490
+ # as compared to reference - returns a score ranging between 0 and 1.
17491
+ # Corresponds to the JSON property `rougeSpec`
17492
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1RougeSpec]
17493
+ attr_accessor :rouge_spec
17494
+
17495
+ def initialize(**args)
17496
+ update!(**args)
17497
+ end
17498
+
17499
+ # Update properties of this object
17500
+ def update!(**args)
17501
+ @aggregation_metrics = args[:aggregation_metrics] if args.key?(:aggregation_metrics)
17502
+ @bleu_spec = args[:bleu_spec] if args.key?(:bleu_spec)
17503
+ @exact_match_spec = args[:exact_match_spec] if args.key?(:exact_match_spec)
17504
+ @pairwise_metric_spec = args[:pairwise_metric_spec] if args.key?(:pairwise_metric_spec)
17505
+ @pointwise_metric_spec = args[:pointwise_metric_spec] if args.key?(:pointwise_metric_spec)
17506
+ @rouge_spec = args[:rouge_spec] if args.key?(:rouge_spec)
17507
+ end
17508
+ end
17509
+
17150
17510
  # Input for MetricX metric.
17151
17511
  class GoogleCloudAiplatformV1beta1MetricxInput
17152
17512
  include Google::Apis::Core::Hashable
@@ -17665,6 +18025,31 @@ module Google
17665
18025
  end
17666
18026
  end
17667
18027
 
18028
+ # Represents token counting info for a single modality.
18029
+ class GoogleCloudAiplatformV1beta1ModalityTokenCount
18030
+ include Google::Apis::Core::Hashable
18031
+
18032
+ # The modality associated with this token count.
18033
+ # Corresponds to the JSON property `modality`
18034
+ # @return [String]
18035
+ attr_accessor :modality
18036
+
18037
+ # Number of tokens.
18038
+ # Corresponds to the JSON property `tokenCount`
18039
+ # @return [Fixnum]
18040
+ attr_accessor :token_count
18041
+
18042
+ def initialize(**args)
18043
+ update!(**args)
18044
+ end
18045
+
18046
+ # Update properties of this object
18047
+ def update!(**args)
18048
+ @modality = args[:modality] if args.key?(:modality)
18049
+ @token_count = args[:token_count] if args.key?(:token_count)
18050
+ end
18051
+ end
18052
+
17668
18053
  # A trained machine learning Model.
17669
18054
  class GoogleCloudAiplatformV1beta1Model
17670
18055
  include Google::Apis::Core::Hashable
@@ -17694,6 +18079,11 @@ module Google
17694
18079
  # @return [String]
17695
18080
  attr_accessor :create_time
17696
18081
 
18082
+ # The default checkpoint id of a model version.
18083
+ # Corresponds to the JSON property `defaultCheckpointId`
18084
+ # @return [String]
18085
+ attr_accessor :default_checkpoint_id
18086
+
17697
18087
  # Output only. The pointers to DeployedModels created from this Model. Note that
17698
18088
  # Model could have been deployed to Endpoints in different Locations.
17699
18089
  # Corresponds to the JSON property `deployedModels`
@@ -17908,6 +18298,7 @@ module Google
17908
18298
  @base_model_source = args[:base_model_source] if args.key?(:base_model_source)
17909
18299
  @container_spec = args[:container_spec] if args.key?(:container_spec)
17910
18300
  @create_time = args[:create_time] if args.key?(:create_time)
18301
+ @default_checkpoint_id = args[:default_checkpoint_id] if args.key?(:default_checkpoint_id)
17911
18302
  @deployed_models = args[:deployed_models] if args.key?(:deployed_models)
17912
18303
  @description = args[:description] if args.key?(:description)
17913
18304
  @display_name = args[:display_name] if args.key?(:display_name)
@@ -18110,6 +18501,12 @@ module Google
18110
18501
  # @return [String]
18111
18502
  attr_accessor :image_uri
18112
18503
 
18504
+ # Probe describes a health check to be performed against a container to
18505
+ # determine whether it is alive or ready to receive traffic.
18506
+ # Corresponds to the JSON property `livenessProbe`
18507
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1Probe]
18508
+ attr_accessor :liveness_probe
18509
+
18113
18510
  # Immutable. List of ports to expose from the container. Vertex AI sends any
18114
18511
  # prediction requests that it receives to the first port on this list. Vertex AI
18115
18512
  # also sends [liveness and health checks](https://cloud.google.com/vertex-ai/
@@ -18172,6 +18569,7 @@ module Google
18172
18569
  @health_probe = args[:health_probe] if args.key?(:health_probe)
18173
18570
  @health_route = args[:health_route] if args.key?(:health_route)
18174
18571
  @image_uri = args[:image_uri] if args.key?(:image_uri)
18572
+ @liveness_probe = args[:liveness_probe] if args.key?(:liveness_probe)
18175
18573
  @ports = args[:ports] if args.key?(:ports)
18176
18574
  @predict_route = args[:predict_route] if args.key?(:predict_route)
18177
18575
  @shared_memory_size_mb = args[:shared_memory_size_mb] if args.key?(:shared_memory_size_mb)
@@ -18909,7 +19307,7 @@ module Google
18909
19307
  # model in SavedModel format. * `tf-js` A [TensorFlow.js](https://www.tensorflow.
18910
19308
  # org/js) model that can be used in the browser and in Node.js using JavaScript.
18911
19309
  # * `core-ml` Used for iOS mobile devices. * `custom-trained` A Model that was
18912
- # uploaded or trained by custom code.
19310
+ # uploaded or trained by custom code. * `genie` A tuned Model Garden model.
18913
19311
  # Corresponds to the JSON property `id`
18914
19312
  # @return [String]
18915
19313
  attr_accessor :id
@@ -18935,6 +19333,17 @@ module Google
18935
19333
  # @return [String]
18936
19334
  attr_accessor :public_model_name
18937
19335
 
19336
+ # Optional. Whether to avoid pulling the model from the HF cache.
19337
+ # Corresponds to the JSON property `skipHfModelCache`
19338
+ # @return [Boolean]
19339
+ attr_accessor :skip_hf_model_cache
19340
+ alias_method :skip_hf_model_cache?, :skip_hf_model_cache
19341
+
19342
+ # Optional. The model garden source model version ID.
19343
+ # Corresponds to the JSON property `versionId`
19344
+ # @return [String]
19345
+ attr_accessor :version_id
19346
+
18938
19347
  def initialize(**args)
18939
19348
  update!(**args)
18940
19349
  end
@@ -18942,6 +19351,8 @@ module Google
18942
19351
  # Update properties of this object
18943
19352
  def update!(**args)
18944
19353
  @public_model_name = args[:public_model_name] if args.key?(:public_model_name)
19354
+ @skip_hf_model_cache = args[:skip_hf_model_cache] if args.key?(:skip_hf_model_cache)
19355
+ @version_id = args[:version_id] if args.key?(:version_id)
18945
19356
  end
18946
19357
  end
18947
19358
 
@@ -20594,6 +21005,45 @@ module Google
20594
21005
  end
20595
21006
  end
20596
21007
 
21008
+ # Describes the machine learning model version checkpoint.
21009
+ class GoogleCloudAiplatformV1beta1ModelVersionCheckpoint
21010
+ include Google::Apis::Core::Hashable
21011
+
21012
+ # The ID of the checkpoint.
21013
+ # Corresponds to the JSON property `checkpointId`
21014
+ # @return [String]
21015
+ attr_accessor :checkpoint_id
21016
+
21017
+ # The epoch of the checkpoint.
21018
+ # Corresponds to the JSON property `epoch`
21019
+ # @return [Fixnum]
21020
+ attr_accessor :epoch
21021
+
21022
+ # Identifier. The resource name of the ModelVersionCheckpoint. Format: `projects/
21023
+ # `project`/locations/`location`/models/`model`/versions/`version`/checkpoints/`
21024
+ # checkpoint``
21025
+ # Corresponds to the JSON property `name`
21026
+ # @return [String]
21027
+ attr_accessor :name
21028
+
21029
+ # The step of the checkpoint.
21030
+ # Corresponds to the JSON property `step`
21031
+ # @return [Fixnum]
21032
+ attr_accessor :step
21033
+
21034
+ def initialize(**args)
21035
+ update!(**args)
21036
+ end
21037
+
21038
+ # Update properties of this object
21039
+ def update!(**args)
21040
+ @checkpoint_id = args[:checkpoint_id] if args.key?(:checkpoint_id)
21041
+ @epoch = args[:epoch] if args.key?(:epoch)
21042
+ @name = args[:name] if args.key?(:name)
21043
+ @step = args[:step] if args.key?(:step)
21044
+ end
21045
+ end
21046
+
20597
21047
  # Runtime operation information for IndexEndpointService.MutateDeployedIndex.
20598
21048
  class GoogleCloudAiplatformV1beta1MutateDeployedIndexOperationMetadata
20599
21049
  include Google::Apis::Core::Hashable
@@ -21703,8 +22153,8 @@ module Google
21703
22153
  # @return [String]
21704
22154
  attr_accessor :notebook_runtime_template_resource_name
21705
22155
 
21706
- # Output only. The Schedule resource name if this job is triggered by one.
21707
- # Format: `projects/`project_id`/locations/`location`/schedules/`schedule_id``
22156
+ # The Schedule resource name if this job is triggered by one. Format: `projects/`
22157
+ # project_id`/locations/`location`/schedules/`schedule_id``
21708
22158
  # Corresponds to the JSON property `scheduleResourceName`
21709
22159
  # @return [String]
21710
22160
  attr_accessor :schedule_resource_name
@@ -22067,6 +22517,11 @@ module Google
22067
22517
  # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ShieldedVmConfig]
22068
22518
  attr_accessor :shielded_vm_config
22069
22519
 
22520
+ # Notebook Software Config.
22521
+ # Corresponds to the JSON property `softwareConfig`
22522
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1NotebookSoftwareConfig]
22523
+ attr_accessor :software_config
22524
+
22070
22525
  # Output only. Timestamp when this NotebookRuntime was most recently updated.
22071
22526
  # Corresponds to the JSON property `updateTime`
22072
22527
  # @return [String]
@@ -22107,6 +22562,7 @@ module Google
22107
22562
  @satisfies_pzs = args[:satisfies_pzs] if args.key?(:satisfies_pzs)
22108
22563
  @service_account = args[:service_account] if args.key?(:service_account)
22109
22564
  @shielded_vm_config = args[:shielded_vm_config] if args.key?(:shielded_vm_config)
22565
+ @software_config = args[:software_config] if args.key?(:software_config)
22110
22566
  @update_time = args[:update_time] if args.key?(:update_time)
22111
22567
  @version = args[:version] if args.key?(:version)
22112
22568
  end
@@ -22225,6 +22681,11 @@ module Google
22225
22681
  # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ShieldedVmConfig]
22226
22682
  attr_accessor :shielded_vm_config
22227
22683
 
22684
+ # Notebook Software Config.
22685
+ # Corresponds to the JSON property `softwareConfig`
22686
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1NotebookSoftwareConfig]
22687
+ attr_accessor :software_config
22688
+
22228
22689
  # Output only. Timestamp when this NotebookRuntimeTemplate was most recently
22229
22690
  # updated.
22230
22691
  # Corresponds to the JSON property `updateTime`
@@ -22254,6 +22715,7 @@ module Google
22254
22715
  @notebook_runtime_type = args[:notebook_runtime_type] if args.key?(:notebook_runtime_type)
22255
22716
  @service_account = args[:service_account] if args.key?(:service_account)
22256
22717
  @shielded_vm_config = args[:shielded_vm_config] if args.key?(:shielded_vm_config)
22718
+ @software_config = args[:software_config] if args.key?(:software_config)
22257
22719
  @update_time = args[:update_time] if args.key?(:update_time)
22258
22720
  end
22259
22721
  end
@@ -22277,6 +22739,51 @@ module Google
22277
22739
  end
22278
22740
  end
22279
22741
 
22742
+ # Notebook Software Config.
22743
+ class GoogleCloudAiplatformV1beta1NotebookSoftwareConfig
22744
+ include Google::Apis::Core::Hashable
22745
+
22746
+ # Optional. Environment variables to be passed to the container. Maximum limit
22747
+ # is 100.
22748
+ # Corresponds to the JSON property `env`
22749
+ # @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1EnvVar>]
22750
+ attr_accessor :env
22751
+
22752
+ # Post startup script config.
22753
+ # Corresponds to the JSON property `postStartupScriptConfig`
22754
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1PostStartupScriptConfig]
22755
+ attr_accessor :post_startup_script_config
22756
+
22757
+ def initialize(**args)
22758
+ update!(**args)
22759
+ end
22760
+
22761
+ # Update properties of this object
22762
+ def update!(**args)
22763
+ @env = args[:env] if args.key?(:env)
22764
+ @post_startup_script_config = args[:post_startup_script_config] if args.key?(:post_startup_script_config)
22765
+ end
22766
+ end
22767
+
22768
+ # Config for evaluation output.
22769
+ class GoogleCloudAiplatformV1beta1OutputConfig
22770
+ include Google::Apis::Core::Hashable
22771
+
22772
+ # The Google Cloud Storage location where the output is to be written to.
22773
+ # Corresponds to the JSON property `gcsDestination`
22774
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1GcsDestination]
22775
+ attr_accessor :gcs_destination
22776
+
22777
+ def initialize(**args)
22778
+ update!(**args)
22779
+ end
22780
+
22781
+ # Update properties of this object
22782
+ def update!(**args)
22783
+ @gcs_destination = args[:gcs_destination] if args.key?(:gcs_destination)
22784
+ end
22785
+ end
22786
+
22280
22787
  # PSC config that is used to automatically create forwarding rule via
22281
22788
  # ServiceConnectionMap.
22282
22789
  class GoogleCloudAiplatformV1beta1PscAutomationConfig
@@ -22383,18 +22890,36 @@ module Google
22383
22890
  class GoogleCloudAiplatformV1beta1PairwiseMetricSpec
22384
22891
  include Google::Apis::Core::Hashable
22385
22892
 
22893
+ # Optional. The field name of the baseline response.
22894
+ # Corresponds to the JSON property `baselineResponseFieldName`
22895
+ # @return [String]
22896
+ attr_accessor :baseline_response_field_name
22897
+
22898
+ # Optional. The field name of the candidate response.
22899
+ # Corresponds to the JSON property `candidateResponseFieldName`
22900
+ # @return [String]
22901
+ attr_accessor :candidate_response_field_name
22902
+
22386
22903
  # Required. Metric prompt template for pairwise metric.
22387
22904
  # Corresponds to the JSON property `metricPromptTemplate`
22388
22905
  # @return [String]
22389
22906
  attr_accessor :metric_prompt_template
22390
22907
 
22908
+ # Optional. System instructions for pairwise metric.
22909
+ # Corresponds to the JSON property `systemInstruction`
22910
+ # @return [String]
22911
+ attr_accessor :system_instruction
22912
+
22391
22913
  def initialize(**args)
22392
22914
  update!(**args)
22393
22915
  end
22394
22916
 
22395
22917
  # Update properties of this object
22396
22918
  def update!(**args)
22919
+ @baseline_response_field_name = args[:baseline_response_field_name] if args.key?(:baseline_response_field_name)
22920
+ @candidate_response_field_name = args[:candidate_response_field_name] if args.key?(:candidate_response_field_name)
22397
22921
  @metric_prompt_template = args[:metric_prompt_template] if args.key?(:metric_prompt_template)
22922
+ @system_instruction = args[:system_instruction] if args.key?(:system_instruction)
22398
22923
  end
22399
22924
  end
22400
22925
 
@@ -22691,7 +23216,7 @@ module Google
22691
23216
  # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1FunctionResponse]
22692
23217
  attr_accessor :function_response
22693
23218
 
22694
- # Content blob. It's preferred to send as text directly rather than raw bytes.
23219
+ # Content blob.
22695
23220
  # Corresponds to the JSON property `inlineData`
22696
23221
  # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1Blob]
22697
23222
  attr_accessor :inline_data
@@ -22701,6 +23226,12 @@ module Google
22701
23226
  # @return [String]
22702
23227
  attr_accessor :text
22703
23228
 
23229
+ # Output only. Indicates if the part is thought from the model.
23230
+ # Corresponds to the JSON property `thought`
23231
+ # @return [Boolean]
23232
+ attr_accessor :thought
23233
+ alias_method :thought?, :thought
23234
+
22704
23235
  # Metadata describes the input video content.
22705
23236
  # Corresponds to the JSON property `videoMetadata`
22706
23237
  # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1VideoMetadata]
@@ -22719,6 +23250,7 @@ module Google
22719
23250
  @function_response = args[:function_response] if args.key?(:function_response)
22720
23251
  @inline_data = args[:inline_data] if args.key?(:inline_data)
22721
23252
  @text = args[:text] if args.key?(:text)
23253
+ @thought = args[:thought] if args.key?(:thought)
22722
23254
  @video_metadata = args[:video_metadata] if args.key?(:video_metadata)
22723
23255
  end
22724
23256
  end
@@ -23785,6 +24317,11 @@ module Google
23785
24317
  # @return [String]
23786
24318
  attr_accessor :metric_prompt_template
23787
24319
 
24320
+ # Optional. System instructions for pointwise metric.
24321
+ # Corresponds to the JSON property `systemInstruction`
24322
+ # @return [String]
24323
+ attr_accessor :system_instruction
24324
+
23788
24325
  def initialize(**args)
23789
24326
  update!(**args)
23790
24327
  end
@@ -23792,6 +24329,7 @@ module Google
23792
24329
  # Update properties of this object
23793
24330
  def update!(**args)
23794
24331
  @metric_prompt_template = args[:metric_prompt_template] if args.key?(:metric_prompt_template)
24332
+ @system_instruction = args[:system_instruction] if args.key?(:system_instruction)
23795
24333
  end
23796
24334
  end
23797
24335
 
@@ -23815,6 +24353,39 @@ module Google
23815
24353
  end
23816
24354
  end
23817
24355
 
24356
+ # Post startup script config.
24357
+ class GoogleCloudAiplatformV1beta1PostStartupScriptConfig
24358
+ include Google::Apis::Core::Hashable
24359
+
24360
+ # Optional. Post startup script to run after runtime is started.
24361
+ # Corresponds to the JSON property `postStartupScript`
24362
+ # @return [String]
24363
+ attr_accessor :post_startup_script
24364
+
24365
+ # Optional. Post startup script behavior that defines download and execution
24366
+ # behavior.
24367
+ # Corresponds to the JSON property `postStartupScriptBehavior`
24368
+ # @return [String]
24369
+ attr_accessor :post_startup_script_behavior
24370
+
24371
+ # Optional. Post startup script url to download. Example: https://bucket/script.
24372
+ # sh
24373
+ # Corresponds to the JSON property `postStartupScriptUrl`
24374
+ # @return [String]
24375
+ attr_accessor :post_startup_script_url
24376
+
24377
+ def initialize(**args)
24378
+ update!(**args)
24379
+ end
24380
+
24381
+ # Update properties of this object
24382
+ def update!(**args)
24383
+ @post_startup_script = args[:post_startup_script] if args.key?(:post_startup_script)
24384
+ @post_startup_script_behavior = args[:post_startup_script_behavior] if args.key?(:post_startup_script_behavior)
24385
+ @post_startup_script_url = args[:post_startup_script_url] if args.key?(:post_startup_script_url)
24386
+ end
24387
+ end
24388
+
23818
24389
  # The configuration for the prebuilt speaker to use.
23819
24390
  class GoogleCloudAiplatformV1beta1PrebuiltVoiceConfig
23820
24391
  include Google::Apis::Core::Hashable
@@ -24221,6 +24792,28 @@ module Google
24221
24792
  # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ProbeExecAction]
24222
24793
  attr_accessor :exec
24223
24794
 
24795
+ # Number of consecutive failures before the probe is considered failed. Defaults
24796
+ # to 3. Minimum value is 1. Maps to Kubernetes probe argument 'failureThreshold'.
24797
+ # Corresponds to the JSON property `failureThreshold`
24798
+ # @return [Fixnum]
24799
+ attr_accessor :failure_threshold
24800
+
24801
+ # GrpcAction checks the health of a container using a gRPC service.
24802
+ # Corresponds to the JSON property `grpc`
24803
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ProbeGrpcAction]
24804
+ attr_accessor :grpc
24805
+
24806
+ # HttpGetAction describes an action based on HTTP Get requests.
24807
+ # Corresponds to the JSON property `httpGet`
24808
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ProbeHttpGetAction]
24809
+ attr_accessor :http_get
24810
+
24811
+ # Number of seconds to wait before starting the probe. Defaults to 0. Minimum
24812
+ # value is 0. Maps to Kubernetes probe argument 'initialDelaySeconds'.
24813
+ # Corresponds to the JSON property `initialDelaySeconds`
24814
+ # @return [Fixnum]
24815
+ attr_accessor :initial_delay_seconds
24816
+
24224
24817
  # How often (in seconds) to perform the probe. Default to 10 seconds. Minimum
24225
24818
  # value is 1. Must be less than timeout_seconds. Maps to Kubernetes probe
24226
24819
  # argument 'periodSeconds'.
@@ -24228,6 +24821,19 @@ module Google
24228
24821
  # @return [Fixnum]
24229
24822
  attr_accessor :period_seconds
24230
24823
 
24824
+ # Number of consecutive successes before the probe is considered successful.
24825
+ # Defaults to 1. Minimum value is 1. Maps to Kubernetes probe argument
24826
+ # 'successThreshold'.
24827
+ # Corresponds to the JSON property `successThreshold`
24828
+ # @return [Fixnum]
24829
+ attr_accessor :success_threshold
24830
+
24831
+ # TcpSocketAction probes the health of a container by opening a TCP socket
24832
+ # connection.
24833
+ # Corresponds to the JSON property `tcpSocket`
24834
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ProbeTcpSocketAction]
24835
+ attr_accessor :tcp_socket
24836
+
24231
24837
  # Number of seconds after which the probe times out. Defaults to 1 second.
24232
24838
  # Minimum value is 1. Must be greater than or equal to period_seconds. Maps to
24233
24839
  # Kubernetes probe argument 'timeoutSeconds'.
@@ -24242,7 +24848,13 @@ module Google
24242
24848
  # Update properties of this object
24243
24849
  def update!(**args)
24244
24850
  @exec = args[:exec] if args.key?(:exec)
24851
+ @failure_threshold = args[:failure_threshold] if args.key?(:failure_threshold)
24852
+ @grpc = args[:grpc] if args.key?(:grpc)
24853
+ @http_get = args[:http_get] if args.key?(:http_get)
24854
+ @initial_delay_seconds = args[:initial_delay_seconds] if args.key?(:initial_delay_seconds)
24245
24855
  @period_seconds = args[:period_seconds] if args.key?(:period_seconds)
24856
+ @success_threshold = args[:success_threshold] if args.key?(:success_threshold)
24857
+ @tcp_socket = args[:tcp_socket] if args.key?(:tcp_socket)
24246
24858
  @timeout_seconds = args[:timeout_seconds] if args.key?(:timeout_seconds)
24247
24859
  end
24248
24860
  end
@@ -24271,6 +24883,133 @@ module Google
24271
24883
  end
24272
24884
  end
24273
24885
 
24886
+ # GrpcAction checks the health of a container using a gRPC service.
24887
+ class GoogleCloudAiplatformV1beta1ProbeGrpcAction
24888
+ include Google::Apis::Core::Hashable
24889
+
24890
+ # Port number of the gRPC service. Number must be in the range 1 to 65535.
24891
+ # Corresponds to the JSON property `port`
24892
+ # @return [Fixnum]
24893
+ attr_accessor :port
24894
+
24895
+ # Service is the name of the service to place in the gRPC HealthCheckRequest (
24896
+ # see https://github.com/grpc/grpc/blob/master/doc/health-checking.md). If this
24897
+ # is not specified, the default behavior is defined by gRPC.
24898
+ # Corresponds to the JSON property `service`
24899
+ # @return [String]
24900
+ attr_accessor :service
24901
+
24902
+ def initialize(**args)
24903
+ update!(**args)
24904
+ end
24905
+
24906
+ # Update properties of this object
24907
+ def update!(**args)
24908
+ @port = args[:port] if args.key?(:port)
24909
+ @service = args[:service] if args.key?(:service)
24910
+ end
24911
+ end
24912
+
24913
+ # HttpGetAction describes an action based on HTTP Get requests.
24914
+ class GoogleCloudAiplatformV1beta1ProbeHttpGetAction
24915
+ include Google::Apis::Core::Hashable
24916
+
24917
+ # Host name to connect to, defaults to the model serving container's IP. You
24918
+ # probably want to set "Host" in httpHeaders instead.
24919
+ # Corresponds to the JSON property `host`
24920
+ # @return [String]
24921
+ attr_accessor :host
24922
+
24923
+ # Custom headers to set in the request. HTTP allows repeated headers.
24924
+ # Corresponds to the JSON property `httpHeaders`
24925
+ # @return [Array<Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ProbeHttpHeader>]
24926
+ attr_accessor :http_headers
24927
+
24928
+ # Path to access on the HTTP server.
24929
+ # Corresponds to the JSON property `path`
24930
+ # @return [String]
24931
+ attr_accessor :path
24932
+
24933
+ # Number of the port to access on the container. Number must be in the range 1
24934
+ # to 65535.
24935
+ # Corresponds to the JSON property `port`
24936
+ # @return [Fixnum]
24937
+ attr_accessor :port
24938
+
24939
+ # Scheme to use for connecting to the host. Defaults to HTTP. Acceptable values
24940
+ # are "HTTP" or "HTTPS".
24941
+ # Corresponds to the JSON property `scheme`
24942
+ # @return [String]
24943
+ attr_accessor :scheme
24944
+
24945
+ def initialize(**args)
24946
+ update!(**args)
24947
+ end
24948
+
24949
+ # Update properties of this object
24950
+ def update!(**args)
24951
+ @host = args[:host] if args.key?(:host)
24952
+ @http_headers = args[:http_headers] if args.key?(:http_headers)
24953
+ @path = args[:path] if args.key?(:path)
24954
+ @port = args[:port] if args.key?(:port)
24955
+ @scheme = args[:scheme] if args.key?(:scheme)
24956
+ end
24957
+ end
24958
+
24959
+ # HttpHeader describes a custom header to be used in HTTP probes.
24960
+ class GoogleCloudAiplatformV1beta1ProbeHttpHeader
24961
+ include Google::Apis::Core::Hashable
24962
+
24963
+ # The header field name. This will be canonicalized upon output, so case-variant
24964
+ # names will be understood as the same header.
24965
+ # Corresponds to the JSON property `name`
24966
+ # @return [String]
24967
+ attr_accessor :name
24968
+
24969
+ # The header field value.
24970
+ # Corresponds to the JSON property `value`
24971
+ # @return [String]
24972
+ attr_accessor :value
24973
+
24974
+ def initialize(**args)
24975
+ update!(**args)
24976
+ end
24977
+
24978
+ # Update properties of this object
24979
+ def update!(**args)
24980
+ @name = args[:name] if args.key?(:name)
24981
+ @value = args[:value] if args.key?(:value)
24982
+ end
24983
+ end
24984
+
24985
+ # TcpSocketAction probes the health of a container by opening a TCP socket
24986
+ # connection.
24987
+ class GoogleCloudAiplatformV1beta1ProbeTcpSocketAction
24988
+ include Google::Apis::Core::Hashable
24989
+
24990
+ # Optional: Host name to connect to, defaults to the model serving container's
24991
+ # IP.
24992
+ # Corresponds to the JSON property `host`
24993
+ # @return [String]
24994
+ attr_accessor :host
24995
+
24996
+ # Number of the port to access on the container. Number must be in the range 1
24997
+ # to 65535.
24998
+ # Corresponds to the JSON property `port`
24999
+ # @return [Fixnum]
25000
+ attr_accessor :port
25001
+
25002
+ def initialize(**args)
25003
+ update!(**args)
25004
+ end
25005
+
25006
+ # Update properties of this object
25007
+ def update!(**args)
25008
+ @host = args[:host] if args.key?(:host)
25009
+ @port = args[:port] if args.key?(:port)
25010
+ end
25011
+ end
25012
+
24274
25013
  # PscAutomatedEndpoints defines the output of the forwarding rule automatically
24275
25014
  # created by each PscAutomationConfig.
24276
25015
  class GoogleCloudAiplatformV1beta1PscAutomatedEndpoints
@@ -24536,8 +25275,8 @@ module Google
24536
25275
  # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ModelContainerSpec]
24537
25276
  attr_accessor :container_spec
24538
25277
 
24539
- # A description of resources that are dedicated to a DeployedModel, and that
24540
- # need a higher degree of manual configuration.
25278
+ # A description of resources that are dedicated to a DeployedModel or
25279
+ # DeployedIndex, and that need a higher degree of manual configuration.
24541
25280
  # Corresponds to the JSON property `dedicatedResources`
24542
25281
  # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1DedicatedResources]
24543
25282
  attr_accessor :dedicated_resources
@@ -25867,6 +26606,11 @@ module Google
25867
26606
  # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1RagEmbeddingModelConfig]
25868
26607
  attr_accessor :rag_embedding_model_config
25869
26608
 
26609
+ # Output only. Number of RagFiles in the RagCorpus.
26610
+ # Corresponds to the JSON property `ragFilesCount`
26611
+ # @return [Fixnum]
26612
+ attr_accessor :rag_files_count
26613
+
25870
26614
  # Config for the Vector DB to use for RAG.
25871
26615
  # Corresponds to the JSON property `ragVectorDbConfig`
25872
26616
  # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1RagVectorDbConfig]
@@ -25899,6 +26643,7 @@ module Google
25899
26643
  @display_name = args[:display_name] if args.key?(:display_name)
25900
26644
  @name = args[:name] if args.key?(:name)
25901
26645
  @rag_embedding_model_config = args[:rag_embedding_model_config] if args.key?(:rag_embedding_model_config)
26646
+ @rag_files_count = args[:rag_files_count] if args.key?(:rag_files_count)
25902
26647
  @rag_vector_db_config = args[:rag_vector_db_config] if args.key?(:rag_vector_db_config)
25903
26648
  @update_time = args[:update_time] if args.key?(:update_time)
25904
26649
  @vector_db_config = args[:vector_db_config] if args.key?(:vector_db_config)
@@ -26215,6 +26960,11 @@ module Google
26215
26960
  # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1RagFileParsingConfigLayoutParser]
26216
26961
  attr_accessor :layout_parser
26217
26962
 
26963
+ # Specifies the advanced parsing for RagFiles.
26964
+ # Corresponds to the JSON property `llmParser`
26965
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1RagFileParsingConfigLlmParser]
26966
+ attr_accessor :llm_parser
26967
+
26218
26968
  # Whether to use advanced PDF parsing.
26219
26969
  # Corresponds to the JSON property `useAdvancedPdfParsing`
26220
26970
  # @return [Boolean]
@@ -26229,6 +26979,7 @@ module Google
26229
26979
  def update!(**args)
26230
26980
  @advanced_parser = args[:advanced_parser] if args.key?(:advanced_parser)
26231
26981
  @layout_parser = args[:layout_parser] if args.key?(:layout_parser)
26982
+ @llm_parser = args[:llm_parser] if args.key?(:llm_parser)
26232
26983
  @use_advanced_pdf_parsing = args[:use_advanced_pdf_parsing] if args.key?(:use_advanced_pdf_parsing)
26233
26984
  end
26234
26985
  end
@@ -26286,6 +27037,41 @@ module Google
26286
27037
  end
26287
27038
  end
26288
27039
 
27040
+ # Specifies the advanced parsing for RagFiles.
27041
+ class GoogleCloudAiplatformV1beta1RagFileParsingConfigLlmParser
27042
+ include Google::Apis::Core::Hashable
27043
+
27044
+ # The prompt to use for parsing. If not specified, a default prompt will be used.
27045
+ # Corresponds to the JSON property `customParsingPrompt`
27046
+ # @return [String]
27047
+ attr_accessor :custom_parsing_prompt
27048
+
27049
+ # The maximum number of requests the job is allowed to make to the LLM model per
27050
+ # minute. Consult https://cloud.google.com/vertex-ai/generative-ai/docs/quotas
27051
+ # and your document size to set an appropriate value here. If unspecified, a
27052
+ # default value of 5000 QPM will be used.
27053
+ # Corresponds to the JSON property `maxParsingRequestsPerMin`
27054
+ # @return [Fixnum]
27055
+ attr_accessor :max_parsing_requests_per_min
27056
+
27057
+ # The name of an LLM model used for parsing. Format: * `projects/`project_id`/
27058
+ # locations/`location`/publishers/`publisher`/models/`model``
27059
+ # Corresponds to the JSON property `modelName`
27060
+ # @return [String]
27061
+ attr_accessor :model_name
27062
+
27063
+ def initialize(**args)
27064
+ update!(**args)
27065
+ end
27066
+
27067
+ # Update properties of this object
27068
+ def update!(**args)
27069
+ @custom_parsing_prompt = args[:custom_parsing_prompt] if args.key?(:custom_parsing_prompt)
27070
+ @max_parsing_requests_per_min = args[:max_parsing_requests_per_min] if args.key?(:max_parsing_requests_per_min)
27071
+ @model_name = args[:model_name] if args.key?(:model_name)
27072
+ end
27073
+ end
27074
+
26289
27075
  # Specifies the transformation config for RagFiles.
26290
27076
  class GoogleCloudAiplatformV1beta1RagFileTransformationConfig
26291
27077
  include Google::Apis::Core::Hashable
@@ -26524,7 +27310,8 @@ module Google
26524
27310
  class GoogleCloudAiplatformV1beta1RagVectorDbConfig
26525
27311
  include Google::Apis::Core::Hashable
26526
27312
 
26527
- # The generic reusable api auth config.
27313
+ # The generic reusable api auth config. Deprecated. Please use AuthConfig (
27314
+ # google/cloud/aiplatform/master/auth.proto) instead.
26528
27315
  # Corresponds to the JSON property `apiAuth`
26529
27316
  # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1ApiAuth]
26530
27317
  attr_accessor :api_auth
@@ -27803,6 +28590,34 @@ module Google
27803
28590
  end
27804
28591
  end
27805
28592
 
28593
+ # Retrieval config.
28594
+ class GoogleCloudAiplatformV1beta1RetrievalConfig
28595
+ include Google::Apis::Core::Hashable
28596
+
28597
+ # The language code of the user.
28598
+ # Corresponds to the JSON property `languageCode`
28599
+ # @return [String]
28600
+ attr_accessor :language_code
28601
+
28602
+ # An object that represents a latitude/longitude pair. This is expressed as a
28603
+ # pair of doubles to represent degrees latitude and degrees longitude. Unless
28604
+ # specified otherwise, this object must conform to the WGS84 standard. Values
28605
+ # must be within normalized ranges.
28606
+ # Corresponds to the JSON property `latLng`
28607
+ # @return [Google::Apis::AiplatformV1beta1::GoogleTypeLatLng]
28608
+ attr_accessor :lat_lng
28609
+
28610
+ def initialize(**args)
28611
+ update!(**args)
28612
+ end
28613
+
28614
+ # Update properties of this object
28615
+ def update!(**args)
28616
+ @language_code = args[:language_code] if args.key?(:language_code)
28617
+ @lat_lng = args[:lat_lng] if args.key?(:lat_lng)
28618
+ end
28619
+ end
28620
+
27806
28621
  # Metadata related to retrieval in the grounding flow.
27807
28622
  class GoogleCloudAiplatformV1beta1RetrievalMetadata
27808
28623
  include Google::Apis::Core::Hashable
@@ -27930,6 +28745,59 @@ module Google
27930
28745
  end
27931
28746
  end
27932
28747
 
28748
+ # Configuration for rolling deployments.
28749
+ class GoogleCloudAiplatformV1beta1RolloutOptions
28750
+ include Google::Apis::Core::Hashable
28751
+
28752
+ # Percentage of allowed additional replicas. For autoscaling deployments, this
28753
+ # refers to the target replica count.
28754
+ # Corresponds to the JSON property `maxSurgePercentage`
28755
+ # @return [Fixnum]
28756
+ attr_accessor :max_surge_percentage
28757
+
28758
+ # Absolute count of allowed additional replicas.
28759
+ # Corresponds to the JSON property `maxSurgeReplicas`
28760
+ # @return [Fixnum]
28761
+ attr_accessor :max_surge_replicas
28762
+
28763
+ # Percentage of replicas allowed to be unavailable. For autoscaling deployments,
28764
+ # this refers to the target replica count.
28765
+ # Corresponds to the JSON property `maxUnavailablePercentage`
28766
+ # @return [Fixnum]
28767
+ attr_accessor :max_unavailable_percentage
28768
+
28769
+ # Absolute count of replicas allowed to be unavailable.
28770
+ # Corresponds to the JSON property `maxUnavailableReplicas`
28771
+ # @return [Fixnum]
28772
+ attr_accessor :max_unavailable_replicas
28773
+
28774
+ # ID of the DeployedModel that this deployment should replace.
28775
+ # Corresponds to the JSON property `previousDeployedModel`
28776
+ # @return [String]
28777
+ attr_accessor :previous_deployed_model
28778
+
28779
+ # Output only. Read-only. Revision number determines the relative priority of
28780
+ # DeployedModels in the same rollout. The DeployedModel with the largest
28781
+ # revision number specifies the intended state of the deployment.
28782
+ # Corresponds to the JSON property `revisionNumber`
28783
+ # @return [Fixnum]
28784
+ attr_accessor :revision_number
28785
+
28786
+ def initialize(**args)
28787
+ update!(**args)
28788
+ end
28789
+
28790
+ # Update properties of this object
28791
+ def update!(**args)
28792
+ @max_surge_percentage = args[:max_surge_percentage] if args.key?(:max_surge_percentage)
28793
+ @max_surge_replicas = args[:max_surge_replicas] if args.key?(:max_surge_replicas)
28794
+ @max_unavailable_percentage = args[:max_unavailable_percentage] if args.key?(:max_unavailable_percentage)
28795
+ @max_unavailable_replicas = args[:max_unavailable_replicas] if args.key?(:max_unavailable_replicas)
28796
+ @previous_deployed_model = args[:previous_deployed_model] if args.key?(:previous_deployed_model)
28797
+ @revision_number = args[:revision_number] if args.key?(:revision_number)
28798
+ end
28799
+ end
28800
+
27933
28801
  # Input for rouge metric.
27934
28802
  class GoogleCloudAiplatformV1beta1RougeInput
27935
28803
  include Google::Apis::Core::Hashable
@@ -32218,8 +33086,9 @@ module Google
32218
33086
  class GoogleCloudAiplatformV1beta1SchemaTextDataItem
32219
33087
  include Google::Apis::Core::Hashable
32220
33088
 
32221
- # Output only. Google Cloud Storage URI points to the original text in user's
32222
- # bucket. The text file is up to 10MB in size.
33089
+ # Output only. Google Cloud Storage URI points to a copy of the original text in
33090
+ # the Vertex-managed bucket in the user's project. The text file is up to 10MB
33091
+ # in size.
32223
33092
  # Corresponds to the JSON property `gcsUri`
32224
33093
  # @return [String]
32225
33094
  attr_accessor :gcs_uri
@@ -36520,6 +37389,81 @@ module Google
36520
37389
  end
36521
37390
  end
36522
37391
 
37392
+ # Configuration for Speculative Decoding.
37393
+ class GoogleCloudAiplatformV1beta1SpeculativeDecodingSpec
37394
+ include Google::Apis::Core::Hashable
37395
+
37396
+ # Draft model speculation works by using the smaller model to generate candidate
37397
+ # tokens for speculative decoding.
37398
+ # Corresponds to the JSON property `draftModelSpeculation`
37399
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1SpeculativeDecodingSpecDraftModelSpeculation]
37400
+ attr_accessor :draft_model_speculation
37401
+
37402
+ # N-Gram speculation works by trying to find matching tokens in the previous
37403
+ # prompt sequence and use those as speculation for generating new tokens.
37404
+ # Corresponds to the JSON property `ngramSpeculation`
37405
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1SpeculativeDecodingSpecNgramSpeculation]
37406
+ attr_accessor :ngram_speculation
37407
+
37408
+ # The number of speculative tokens to generate at each step.
37409
+ # Corresponds to the JSON property `speculativeTokenCount`
37410
+ # @return [Fixnum]
37411
+ attr_accessor :speculative_token_count
37412
+
37413
+ def initialize(**args)
37414
+ update!(**args)
37415
+ end
37416
+
37417
+ # Update properties of this object
37418
+ def update!(**args)
37419
+ @draft_model_speculation = args[:draft_model_speculation] if args.key?(:draft_model_speculation)
37420
+ @ngram_speculation = args[:ngram_speculation] if args.key?(:ngram_speculation)
37421
+ @speculative_token_count = args[:speculative_token_count] if args.key?(:speculative_token_count)
37422
+ end
37423
+ end
37424
+
37425
+ # Draft model speculation works by using the smaller model to generate candidate
37426
+ # tokens for speculative decoding.
37427
+ class GoogleCloudAiplatformV1beta1SpeculativeDecodingSpecDraftModelSpeculation
37428
+ include Google::Apis::Core::Hashable
37429
+
37430
+ # Required. The resource name of the draft model.
37431
+ # Corresponds to the JSON property `draftModel`
37432
+ # @return [String]
37433
+ attr_accessor :draft_model
37434
+
37435
+ def initialize(**args)
37436
+ update!(**args)
37437
+ end
37438
+
37439
+ # Update properties of this object
37440
+ def update!(**args)
37441
+ @draft_model = args[:draft_model] if args.key?(:draft_model)
37442
+ end
37443
+ end
37444
+
37445
+ # N-Gram speculation works by trying to find matching tokens in the previous
37446
+ # prompt sequence and use those as speculation for generating new tokens.
37447
+ class GoogleCloudAiplatformV1beta1SpeculativeDecodingSpecNgramSpeculation
37448
+ include Google::Apis::Core::Hashable
37449
+
37450
+ # The number of last N input tokens used as ngram to search/match against the
37451
+ # previous prompt sequence. This is equal to the N in N-Gram. The default value
37452
+ # is 3 if not specified.
37453
+ # Corresponds to the JSON property `ngramSize`
37454
+ # @return [Fixnum]
37455
+ attr_accessor :ngram_size
37456
+
37457
+ def initialize(**args)
37458
+ update!(**args)
37459
+ end
37460
+
37461
+ # Update properties of this object
37462
+ def update!(**args)
37463
+ @ngram_size = args[:ngram_size] if args.key?(:ngram_size)
37464
+ end
37465
+ end
37466
+
36523
37467
  # The speech generation config.
36524
37468
  class GoogleCloudAiplatformV1beta1SpeechConfig
36525
37469
  include Google::Apis::Core::Hashable
@@ -38245,6 +39189,12 @@ module Google
38245
39189
  class GoogleCloudAiplatformV1beta1SupervisedTuningDataStats
38246
39190
  include Google::Apis::Core::Hashable
38247
39191
 
39192
+ # Output only. For each index in `truncated_example_indices`, the user-facing
39193
+ # reason why the example was dropped. Must not include the example itself.
39194
+ # Corresponds to the JSON property `droppedExampleReasons`
39195
+ # @return [Array<String>]
39196
+ attr_accessor :dropped_example_reasons
39197
+
38248
39198
  # Output only. Number of billable characters in the tuning dataset.
38249
39199
  # Corresponds to the JSON property `totalBillableCharacterCount`
38250
39200
  # @return [Fixnum]
@@ -38255,7 +39205,9 @@ module Google
38255
39205
  # @return [Fixnum]
38256
39206
  attr_accessor :total_billable_token_count
38257
39207
 
38258
- # The number of examples in the dataset that have been truncated by any amount.
39208
+ # Output only. The number of examples in the dataset that have been dropped. An
39209
+ # example can be dropped for reasons including: too many tokens, contains an
39210
+ # invalid image, contains too many images, etc.
38259
39211
  # Corresponds to the JSON property `totalTruncatedExampleCount`
38260
39212
  # @return [Fixnum]
38261
39213
  attr_accessor :total_truncated_example_count
@@ -38265,7 +39217,8 @@ module Google
38265
39217
  # @return [Fixnum]
38266
39218
  attr_accessor :total_tuning_character_count
38267
39219
 
38268
- # A partial sample of the indices (starting from 1) of the truncated examples.
39220
+ # Output only. A partial sample of the indices (starting from 1) of the dropped
39221
+ # examples.
38269
39222
  # Corresponds to the JSON property `truncatedExampleIndices`
38270
39223
  # @return [Array<Fixnum>]
38271
39224
  attr_accessor :truncated_example_indices
@@ -38306,6 +39259,7 @@ module Google
38306
39259
 
38307
39260
  # Update properties of this object
38308
39261
  def update!(**args)
39262
+ @dropped_example_reasons = args[:dropped_example_reasons] if args.key?(:dropped_example_reasons)
38309
39263
  @total_billable_character_count = args[:total_billable_character_count] if args.key?(:total_billable_character_count)
38310
39264
  @total_billable_token_count = args[:total_billable_token_count] if args.key?(:total_billable_token_count)
38311
39265
  @total_truncated_example_count = args[:total_truncated_example_count] if args.key?(:total_truncated_example_count)
@@ -39426,6 +40380,11 @@ module Google
39426
40380
  # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1FunctionCallingConfig]
39427
40381
  attr_accessor :function_calling_config
39428
40382
 
40383
+ # Retrieval config.
40384
+ # Corresponds to the JSON property `retrievalConfig`
40385
+ # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1RetrievalConfig]
40386
+ attr_accessor :retrieval_config
40387
+
39429
40388
  def initialize(**args)
39430
40389
  update!(**args)
39431
40390
  end
@@ -39433,6 +40392,7 @@ module Google
39433
40392
  # Update properties of this object
39434
40393
  def update!(**args)
39435
40394
  @function_calling_config = args[:function_calling_config] if args.key?(:function_calling_config)
40395
+ @retrieval_config = args[:retrieval_config] if args.key?(:retrieval_config)
39436
40396
  end
39437
40397
  end
39438
40398
 
@@ -40815,7 +41775,7 @@ module Google
40815
41775
  end
40816
41776
  end
40817
41777
 
40818
- # The Model Registry Model and Online Prediction Endpoint assiociated with this
41778
+ # The Model Registry Model and Online Prediction Endpoint associated with this
40819
41779
  # TuningJob.
40820
41780
  class GoogleCloudAiplatformV1beta1TunedModel
40821
41781
  include Google::Apis::Core::Hashable
@@ -41005,7 +41965,7 @@ module Google
41005
41965
  # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1SupervisedTuningSpec]
41006
41966
  attr_accessor :supervised_tuning_spec
41007
41967
 
41008
- # The Model Registry Model and Online Prediction Endpoint assiociated with this
41968
+ # The Model Registry Model and Online Prediction Endpoint associated with this
41009
41969
  # TuningJob.
41010
41970
  # Corresponds to the JSON property `tunedModel`
41011
41971
  # @return [Google::Apis::AiplatformV1beta1::GoogleCloudAiplatformV1beta1TunedModel]
@@ -43004,6 +43964,34 @@ module Google
43004
43964
  end
43005
43965
  end
43006
43966
 
43967
+ # An object that represents a latitude/longitude pair. This is expressed as a
43968
+ # pair of doubles to represent degrees latitude and degrees longitude. Unless
43969
+ # specified otherwise, this object must conform to the WGS84 standard. Values
43970
+ # must be within normalized ranges.
43971
+ class GoogleTypeLatLng
43972
+ include Google::Apis::Core::Hashable
43973
+
43974
+ # The latitude in degrees. It must be in the range [-90.0, +90.0].
43975
+ # Corresponds to the JSON property `latitude`
43976
+ # @return [Float]
43977
+ attr_accessor :latitude
43978
+
43979
+ # The longitude in degrees. It must be in the range [-180.0, +180.0].
43980
+ # Corresponds to the JSON property `longitude`
43981
+ # @return [Float]
43982
+ attr_accessor :longitude
43983
+
43984
+ def initialize(**args)
43985
+ update!(**args)
43986
+ end
43987
+
43988
+ # Update properties of this object
43989
+ def update!(**args)
43990
+ @latitude = args[:latitude] if args.key?(:latitude)
43991
+ @longitude = args[:longitude] if args.key?(:longitude)
43992
+ end
43993
+ end
43994
+
43007
43995
  # Represents an amount of money with its currency type.
43008
43996
  class GoogleTypeMoney
43009
43997
  include Google::Apis::Core::Hashable