google-apis-aiplatform_v1 0.42.0 → 0.44.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -474,7 +474,7 @@ module Google
474
474
  end
475
475
  end
476
476
 
477
- # Create API error message for Vertex Pipeline. Next Id: 3.
477
+ # Create API error message for Vertex Pipeline.
478
478
  class CloudAiPlatformCommonCreatePipelineJobApiErrorDetail
479
479
  include Google::Apis::Core::Hashable
480
480
 
@@ -840,7 +840,8 @@ module Google
840
840
  end
841
841
  end
842
842
 
843
- # The generic reusable api auth config.
843
+ # The generic reusable api auth config. Deprecated. Please use AuthConfig (
844
+ # google/cloud/aiplatform/master/auth.proto) instead.
844
845
  class GoogleCloudAiplatformV1ApiAuth
845
846
  include Google::Apis::Core::Hashable
846
847
 
@@ -1220,22 +1221,22 @@ module Google
1220
1221
  class GoogleCloudAiplatformV1AutomaticResources
1221
1222
  include Google::Apis::Core::Hashable
1222
1223
 
1223
- # Immutable. The maximum number of replicas this DeployedModel may be deployed
1224
- # on when the traffic against it increases. If the requested value is too large,
1225
- # the deployment will error, but if deployment succeeds then the ability to
1226
- # scale the model to that many replicas is guaranteed (barring service outages).
1227
- # If traffic against the DeployedModel increases beyond what its replicas at
1228
- # maximum may handle, a portion of the traffic will be dropped. If this value is
1229
- # not provided, a no upper bound for scaling under heavy traffic will be assume,
1230
- # though Vertex AI may be unable to scale beyond certain replica number.
1224
+ # Immutable. The maximum number of replicas that may be deployed on when the
1225
+ # traffic against it increases. If the requested value is too large, the
1226
+ # deployment will error, but if deployment succeeds then the ability to scale to
1227
+ # that many replicas is guaranteed (barring service outages). If traffic
1228
+ # increases beyond what its replicas at maximum may handle, a portion of the
1229
+ # traffic will be dropped. If this value is not provided, a no upper bound for
1230
+ # scaling under heavy traffic will be assume, though Vertex AI may be unable to
1231
+ # scale beyond certain replica number.
1231
1232
  # Corresponds to the JSON property `maxReplicaCount`
1232
1233
  # @return [Fixnum]
1233
1234
  attr_accessor :max_replica_count
1234
1235
 
1235
- # Immutable. The minimum number of replicas this DeployedModel will be always
1236
- # deployed on. If traffic against it increases, it may dynamically be deployed
1237
- # onto more replicas up to max_replica_count, and as traffic decreases, some of
1238
- # these extra replicas may be freed. If the requested value is too large, the
1236
+ # Immutable. The minimum number of replicas that will be always deployed on. If
1237
+ # traffic against it increases, it may dynamically be deployed onto more
1238
+ # replicas up to max_replica_count, and as traffic decreases, some of these
1239
+ # extra replicas may be freed. If the requested value is too large, the
1239
1240
  # deployment will error.
1240
1241
  # Corresponds to the JSON property `minReplicaCount`
1241
1242
  # @return [Fixnum]
@@ -1252,6 +1253,48 @@ module Google
1252
1253
  end
1253
1254
  end
1254
1255
 
1256
+ # The configs for autorater. This is applicable to both EvaluateInstances and
1257
+ # EvaluateDataset.
1258
+ class GoogleCloudAiplatformV1AutoraterConfig
1259
+ include Google::Apis::Core::Hashable
1260
+
1261
+ # Optional. The fully qualified name of the publisher model or tuned autorater
1262
+ # endpoint to use. Publisher model format: `projects/`project`/locations/`
1263
+ # location`/publishers/*/models/*` Tuned model endpoint format: `projects/`
1264
+ # project`/locations/`location`/endpoints/`endpoint``
1265
+ # Corresponds to the JSON property `autoraterModel`
1266
+ # @return [String]
1267
+ attr_accessor :autorater_model
1268
+
1269
+ # Optional. Whether to flip the candidate and baseline responses. This is only
1270
+ # applicable to the pairwise metric. If enabled, also provide PairwiseMetricSpec.
1271
+ # candidate_response_field_name and PairwiseMetricSpec.
1272
+ # baseline_response_field_name. When rendering PairwiseMetricSpec.
1273
+ # metric_prompt_template, the candidate and baseline fields will be flipped for
1274
+ # half of the samples to reduce bias.
1275
+ # Corresponds to the JSON property `flipEnabled`
1276
+ # @return [Boolean]
1277
+ attr_accessor :flip_enabled
1278
+ alias_method :flip_enabled?, :flip_enabled
1279
+
1280
+ # Optional. Number of samples for each instance in the dataset. If not specified,
1281
+ # the default is 4. Minimum value is 1, maximum value is 32.
1282
+ # Corresponds to the JSON property `samplingCount`
1283
+ # @return [Fixnum]
1284
+ attr_accessor :sampling_count
1285
+
1286
+ def initialize(**args)
1287
+ update!(**args)
1288
+ end
1289
+
1290
+ # Update properties of this object
1291
+ def update!(**args)
1292
+ @autorater_model = args[:autorater_model] if args.key?(:autorater_model)
1293
+ @flip_enabled = args[:flip_enabled] if args.key?(:flip_enabled)
1294
+ @sampling_count = args[:sampling_count] if args.key?(:sampling_count)
1295
+ end
1296
+ end
1297
+
1255
1298
  # The metric specification that defines the target resource utilization (CPU
1256
1299
  # utilization, accelerator's duty cycle, and so on) for calculating the desired
1257
1300
  # replica count.
@@ -2437,7 +2480,7 @@ module Google
2437
2480
  end
2438
2481
  end
2439
2482
 
2440
- # Content blob. It's preferred to send as text directly rather than raw bytes.
2483
+ # Content blob.
2441
2484
  class GoogleCloudAiplatformV1Blob
2442
2485
  include Google::Apis::Core::Hashable
2443
2486
 
@@ -2447,6 +2490,13 @@ module Google
2447
2490
  # @return [String]
2448
2491
  attr_accessor :data
2449
2492
 
2493
+ # Optional. Display name of the blob. Used to provide a label or filename to
2494
+ # distinguish blobs. This field is only returned in PromptMessage for prompt
2495
+ # management. It is not currently used in the Gemini GenerateContent calls.
2496
+ # Corresponds to the JSON property `displayName`
2497
+ # @return [String]
2498
+ attr_accessor :display_name
2499
+
2450
2500
  # Required. The IANA standard MIME type of the source data.
2451
2501
  # Corresponds to the JSON property `mimeType`
2452
2502
  # @return [String]
@@ -2459,6 +2509,7 @@ module Google
2459
2509
  # Update properties of this object
2460
2510
  def update!(**args)
2461
2511
  @data = args[:data] if args.key?(:data)
2512
+ @display_name = args[:display_name] if args.key?(:display_name)
2462
2513
  @mime_type = args[:mime_type] if args.key?(:mime_type)
2463
2514
  end
2464
2515
  end
@@ -2543,7 +2594,7 @@ module Google
2543
2594
  # @return [Array<Google::Apis::AiplatformV1::GoogleCloudAiplatformV1Content>]
2544
2595
  attr_accessor :contents
2545
2596
 
2546
- # Output only. Creatation time of the cache entry.
2597
+ # Output only. Creation time of the cache entry.
2547
2598
  # Corresponds to the JSON property `createTime`
2548
2599
  # @return [String]
2549
2600
  attr_accessor :create_time
@@ -2560,8 +2611,9 @@ module Google
2560
2611
  # @return [String]
2561
2612
  attr_accessor :expire_time
2562
2613
 
2563
- # Immutable. The name of the publisher model to use for cached content. Format:
2564
- # projects/`project`/locations/`location`/publishers/`publisher`/models/`model`
2614
+ # Immutable. The name of the `Model` to use for cached content. Currently, only
2615
+ # the published Gemini base models are supported, in form of projects/`PROJECT`/
2616
+ # locations/`LOCATION`/publishers/google/models/`MODEL`
2565
2617
  # Corresponds to the JSON property `model`
2566
2618
  # @return [String]
2567
2619
  attr_accessor :model
@@ -3045,6 +3097,33 @@ module Google
3045
3097
  end
3046
3098
  end
3047
3099
 
3100
+ # Result of executing the [ExecutableCode]. Always follows a `part` containing
3101
+ # the [ExecutableCode].
3102
+ class GoogleCloudAiplatformV1CodeExecutionResult
3103
+ include Google::Apis::Core::Hashable
3104
+
3105
+ # Required. Outcome of the code execution.
3106
+ # Corresponds to the JSON property `outcome`
3107
+ # @return [String]
3108
+ attr_accessor :outcome
3109
+
3110
+ # Optional. Contains stdout when code execution is successful, stderr or other
3111
+ # description otherwise.
3112
+ # Corresponds to the JSON property `output`
3113
+ # @return [String]
3114
+ attr_accessor :output
3115
+
3116
+ def initialize(**args)
3117
+ update!(**args)
3118
+ end
3119
+
3120
+ # Update properties of this object
3121
+ def update!(**args)
3122
+ @outcome = args[:outcome] if args.key?(:outcome)
3123
+ @output = args[:output] if args.key?(:output)
3124
+ end
3125
+ end
3126
+
3048
3127
  # Input for coherence metric.
3049
3128
  class GoogleCloudAiplatformV1CoherenceInput
3050
3129
  include Google::Apis::Core::Hashable
@@ -3824,6 +3903,11 @@ module Google
3824
3903
  class GoogleCloudAiplatformV1CountTokensResponse
3825
3904
  include Google::Apis::Core::Hashable
3826
3905
 
3906
+ # Output only. List of modalities that were processed in the request input.
3907
+ # Corresponds to the JSON property `promptTokensDetails`
3908
+ # @return [Array<Google::Apis::AiplatformV1::GoogleCloudAiplatformV1ModalityTokenCount>]
3909
+ attr_accessor :prompt_tokens_details
3910
+
3827
3911
  # The total number of billable characters counted across all instances from the
3828
3912
  # request.
3829
3913
  # Corresponds to the JSON property `totalBillableCharacters`
@@ -3841,6 +3925,7 @@ module Google
3841
3925
 
3842
3926
  # Update properties of this object
3843
3927
  def update!(**args)
3928
+ @prompt_tokens_details = args[:prompt_tokens_details] if args.key?(:prompt_tokens_details)
3844
3929
  @total_billable_characters = args[:total_billable_characters] if args.key?(:total_billable_characters)
3845
3930
  @total_tokens = args[:total_tokens] if args.key?(:total_tokens)
3846
3931
  end
@@ -5077,7 +5162,8 @@ module Google
5077
5162
  # @return [String]
5078
5163
  attr_accessor :model_reference
5079
5164
 
5080
- # Output only. Identifier. The resource name of the Dataset.
5165
+ # Output only. Identifier. The resource name of the Dataset. Format: `projects/`
5166
+ # project`/locations/`location`/datasets/`dataset``
5081
5167
  # Corresponds to the JSON property `name`
5082
5168
  # @return [String]
5083
5169
  attr_accessor :name
@@ -5171,7 +5257,9 @@ module Google
5171
5257
  # @return [String]
5172
5258
  attr_accessor :model_reference
5173
5259
 
5174
- # Output only. Identifier. The resource name of the DatasetVersion.
5260
+ # Output only. Identifier. The resource name of the DatasetVersion. Format: `
5261
+ # projects/`project`/locations/`location`/datasets/`dataset`/datasetVersions/`
5262
+ # dataset_version``
5175
5263
  # Corresponds to the JSON property `name`
5176
5264
  # @return [String]
5177
5265
  attr_accessor :name
@@ -5212,8 +5300,8 @@ module Google
5212
5300
  end
5213
5301
  end
5214
5302
 
5215
- # A description of resources that are dedicated to a DeployedModel, and that
5216
- # need a higher degree of manual configuration.
5303
+ # A description of resources that are dedicated to a DeployedModel or
5304
+ # DeployedIndex, and that need a higher degree of manual configuration.
5217
5305
  class GoogleCloudAiplatformV1DedicatedResources
5218
5306
  include Google::Apis::Core::Hashable
5219
5307
 
@@ -5239,36 +5327,33 @@ module Google
5239
5327
  # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1MachineSpec]
5240
5328
  attr_accessor :machine_spec
5241
5329
 
5242
- # Immutable. The maximum number of replicas this DeployedModel may be deployed
5243
- # on when the traffic against it increases. If the requested value is too large,
5244
- # the deployment will error, but if deployment succeeds then the ability to
5245
- # scale the model to that many replicas is guaranteed (barring service outages).
5246
- # If traffic against the DeployedModel increases beyond what its replicas at
5247
- # maximum may handle, a portion of the traffic will be dropped. If this value is
5248
- # not provided, will use min_replica_count as the default value. The value of
5249
- # this field impacts the charge against Vertex CPU and GPU quotas. Specifically,
5250
- # you will be charged for (max_replica_count * number of cores in the selected
5251
- # machine type) and (max_replica_count * number of GPUs per replica in the
5252
- # selected machine type).
5330
+ # Immutable. The maximum number of replicas that may be deployed on when the
5331
+ # traffic against it increases. If the requested value is too large, the
5332
+ # deployment will error, but if deployment succeeds then the ability to scale to
5333
+ # that many replicas is guaranteed (barring service outages). If traffic
5334
+ # increases beyond what its replicas at maximum may handle, a portion of the
5335
+ # traffic will be dropped. If this value is not provided, will use
5336
+ # min_replica_count as the default value. The value of this field impacts the
5337
+ # charge against Vertex CPU and GPU quotas. Specifically, you will be charged
5338
+ # for (max_replica_count * number of cores in the selected machine type) and (
5339
+ # max_replica_count * number of GPUs per replica in the selected machine type).
5253
5340
  # Corresponds to the JSON property `maxReplicaCount`
5254
5341
  # @return [Fixnum]
5255
5342
  attr_accessor :max_replica_count
5256
5343
 
5257
- # Required. Immutable. The minimum number of machine replicas this DeployedModel
5258
- # will be always deployed on. This value must be greater than or equal to 1. If
5259
- # traffic against the DeployedModel increases, it may dynamically be deployed
5260
- # onto more replicas, and as traffic decreases, some of these extra replicas may
5261
- # be freed.
5344
+ # Required. Immutable. The minimum number of machine replicas that will be
5345
+ # always deployed on. This value must be greater than or equal to 1. If traffic
5346
+ # increases, it may dynamically be deployed onto more replicas, and as traffic
5347
+ # decreases, some of these extra replicas may be freed.
5262
5348
  # Corresponds to the JSON property `minReplicaCount`
5263
5349
  # @return [Fixnum]
5264
5350
  attr_accessor :min_replica_count
5265
5351
 
5266
5352
  # Optional. Number of required available replicas for the deployment to succeed.
5267
- # This field is only needed when partial model deployment/mutation is desired.
5268
- # If set, the model deploy/mutate operation will succeed once
5269
- # available_replica_count reaches required_replica_count, and the rest of the
5270
- # replicas will be retried. If not set, the default required_replica_count will
5271
- # be min_replica_count.
5353
+ # This field is only needed when partial deployment/mutation is desired. If set,
5354
+ # the deploy/mutate operation will succeed once available_replica_count reaches
5355
+ # required_replica_count, and the rest of the replicas will be retried. If not
5356
+ # set, the default required_replica_count will be min_replica_count.
5272
5357
  # Corresponds to the JSON property `requiredReplicaCount`
5273
5358
  # @return [Fixnum]
5274
5359
  attr_accessor :required_replica_count
@@ -5683,8 +5768,8 @@ module Google
5683
5768
  # @return [String]
5684
5769
  attr_accessor :create_time
5685
5770
 
5686
- # A description of resources that are dedicated to a DeployedModel, and that
5687
- # need a higher degree of manual configuration.
5771
+ # A description of resources that are dedicated to a DeployedModel or
5772
+ # DeployedIndex, and that need a higher degree of manual configuration.
5688
5773
  # Corresponds to the JSON property `dedicatedResources`
5689
5774
  # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1DedicatedResources]
5690
5775
  attr_accessor :dedicated_resources
@@ -5896,8 +5981,8 @@ module Google
5896
5981
  # @return [String]
5897
5982
  attr_accessor :create_time
5898
5983
 
5899
- # A description of resources that are dedicated to a DeployedModel, and that
5900
- # need a higher degree of manual configuration.
5984
+ # A description of resources that are dedicated to a DeployedModel or
5985
+ # DeployedIndex, and that need a higher degree of manual configuration.
5901
5986
  # Corresponds to the JSON property `dedicatedResources`
5902
5987
  # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1DedicatedResources]
5903
5988
  attr_accessor :dedicated_resources
@@ -5991,6 +6076,11 @@ module Google
5991
6076
  # @return [String]
5992
6077
  attr_accessor :shared_resources
5993
6078
 
6079
+ # Configuration for Speculative Decoding.
6080
+ # Corresponds to the JSON property `speculativeDecodingSpec`
6081
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1SpeculativeDecodingSpec]
6082
+ attr_accessor :speculative_decoding_spec
6083
+
5994
6084
  # Runtime status of the deployed model.
5995
6085
  # Corresponds to the JSON property `status`
5996
6086
  # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1DeployedModelStatus]
@@ -6023,6 +6113,7 @@ module Google
6023
6113
  @private_endpoints = args[:private_endpoints] if args.key?(:private_endpoints)
6024
6114
  @service_account = args[:service_account] if args.key?(:service_account)
6025
6115
  @shared_resources = args[:shared_resources] if args.key?(:shared_resources)
6116
+ @speculative_decoding_spec = args[:speculative_decoding_spec] if args.key?(:speculative_decoding_spec)
6026
6117
  @status = args[:status] if args.key?(:status)
6027
6118
  @system_labels = args[:system_labels] if args.key?(:system_labels)
6028
6119
  end
@@ -6094,8 +6185,8 @@ module Google
6094
6185
  # @return [String]
6095
6186
  attr_accessor :create_time
6096
6187
 
6097
- # A description of resources that are dedicated to a DeployedModel, and that
6098
- # need a higher degree of manual configuration.
6188
+ # A description of resources that are dedicated to a DeployedModel or
6189
+ # DeployedIndex, and that need a higher degree of manual configuration.
6099
6190
  # Corresponds to the JSON property `dedicatedResources`
6100
6191
  # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1DedicatedResources]
6101
6192
  attr_accessor :dedicated_resources
@@ -6465,6 +6556,11 @@ module Google
6465
6556
  # @return [String]
6466
6557
  attr_accessor :etag
6467
6558
 
6559
+ # Configuration for GenAiAdvancedFeatures.
6560
+ # Corresponds to the JSON property `genAiAdvancedFeaturesConfig`
6561
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1GenAiAdvancedFeaturesConfig]
6562
+ attr_accessor :gen_ai_advanced_features_config
6563
+
6468
6564
  # The labels with user-defined metadata to organize your Endpoints. Label keys
6469
6565
  # and values can be no longer than 64 characters (Unicode codepoints), can only
6470
6566
  # contain lowercase letters, numeric characters, underscores and dashes.
@@ -6551,6 +6647,7 @@ module Google
6551
6647
  @enable_private_service_connect = args[:enable_private_service_connect] if args.key?(:enable_private_service_connect)
6552
6648
  @encryption_spec = args[:encryption_spec] if args.key?(:encryption_spec)
6553
6649
  @etag = args[:etag] if args.key?(:etag)
6650
+ @gen_ai_advanced_features_config = args[:gen_ai_advanced_features_config] if args.key?(:gen_ai_advanced_features_config)
6554
6651
  @labels = args[:labels] if args.key?(:labels)
6555
6652
  @model_deployment_monitoring_job = args[:model_deployment_monitoring_job] if args.key?(:model_deployment_monitoring_job)
6556
6653
  @name = args[:name] if args.key?(:name)
@@ -6778,10 +6875,54 @@ module Google
6778
6875
  end
6779
6876
  end
6780
6877
 
6878
+ # Request message for EvaluationService.EvaluateDataset.
6879
+ class GoogleCloudAiplatformV1EvaluateDatasetRequest
6880
+ include Google::Apis::Core::Hashable
6881
+
6882
+ # The configs for autorater. This is applicable to both EvaluateInstances and
6883
+ # EvaluateDataset.
6884
+ # Corresponds to the JSON property `autoraterConfig`
6885
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1AutoraterConfig]
6886
+ attr_accessor :autorater_config
6887
+
6888
+ # The dataset used for evaluation.
6889
+ # Corresponds to the JSON property `dataset`
6890
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1EvaluationDataset]
6891
+ attr_accessor :dataset
6892
+
6893
+ # Required. The metrics used for evaluation.
6894
+ # Corresponds to the JSON property `metrics`
6895
+ # @return [Array<Google::Apis::AiplatformV1::GoogleCloudAiplatformV1Metric>]
6896
+ attr_accessor :metrics
6897
+
6898
+ # Config for evaluation output.
6899
+ # Corresponds to the JSON property `outputConfig`
6900
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1OutputConfig]
6901
+ attr_accessor :output_config
6902
+
6903
+ def initialize(**args)
6904
+ update!(**args)
6905
+ end
6906
+
6907
+ # Update properties of this object
6908
+ def update!(**args)
6909
+ @autorater_config = args[:autorater_config] if args.key?(:autorater_config)
6910
+ @dataset = args[:dataset] if args.key?(:dataset)
6911
+ @metrics = args[:metrics] if args.key?(:metrics)
6912
+ @output_config = args[:output_config] if args.key?(:output_config)
6913
+ end
6914
+ end
6915
+
6781
6916
  # Request message for EvaluationService.EvaluateInstances.
6782
6917
  class GoogleCloudAiplatformV1EvaluateInstancesRequest
6783
6918
  include Google::Apis::Core::Hashable
6784
6919
 
6920
+ # The configs for autorater. This is applicable to both EvaluateInstances and
6921
+ # EvaluateDataset.
6922
+ # Corresponds to the JSON property `autoraterConfig`
6923
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1AutoraterConfig]
6924
+ attr_accessor :autorater_config
6925
+
6785
6926
  # Input for bleu metric.
6786
6927
  # Corresponds to the JSON property `bleuInput`
6787
6928
  # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1BleuInput]
@@ -6943,6 +7084,7 @@ module Google
6943
7084
 
6944
7085
  # Update properties of this object
6945
7086
  def update!(**args)
7087
+ @autorater_config = args[:autorater_config] if args.key?(:autorater_config)
6946
7088
  @bleu_input = args[:bleu_input] if args.key?(:bleu_input)
6947
7089
  @coherence_input = args[:coherence_input] if args.key?(:coherence_input)
6948
7090
  @comet_input = args[:comet_input] if args.key?(:comet_input)
@@ -7282,6 +7424,31 @@ module Google
7282
7424
  end
7283
7425
  end
7284
7426
 
7427
+ # The dataset used for evaluation.
7428
+ class GoogleCloudAiplatformV1EvaluationDataset
7429
+ include Google::Apis::Core::Hashable
7430
+
7431
+ # The BigQuery location for the input content.
7432
+ # Corresponds to the JSON property `bigquerySource`
7433
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1BigQuerySource]
7434
+ attr_accessor :bigquery_source
7435
+
7436
+ # The Google Cloud Storage location for the input content.
7437
+ # Corresponds to the JSON property `gcsSource`
7438
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1GcsSource]
7439
+ attr_accessor :gcs_source
7440
+
7441
+ def initialize(**args)
7442
+ update!(**args)
7443
+ end
7444
+
7445
+ # Update properties of this object
7446
+ def update!(**args)
7447
+ @bigquery_source = args[:bigquery_source] if args.key?(:bigquery_source)
7448
+ @gcs_source = args[:gcs_source] if args.key?(:gcs_source)
7449
+ end
7450
+ end
7451
+
7285
7452
  # An edge describing the relationship between an Artifact and an Execution in a
7286
7453
  # lineage graph.
7287
7454
  class GoogleCloudAiplatformV1Event
@@ -7577,6 +7744,33 @@ module Google
7577
7744
  end
7578
7745
  end
7579
7746
 
7747
+ # Code generated by the model that is meant to be executed, and the result
7748
+ # returned to the model. Generated when using the [FunctionDeclaration] tool and
7749
+ # [FunctionCallingConfig] mode is set to [Mode.CODE].
7750
+ class GoogleCloudAiplatformV1ExecutableCode
7751
+ include Google::Apis::Core::Hashable
7752
+
7753
+ # Required. The code to be executed.
7754
+ # Corresponds to the JSON property `code`
7755
+ # @return [String]
7756
+ attr_accessor :code
7757
+
7758
+ # Required. Programming language of the `code`.
7759
+ # Corresponds to the JSON property `language`
7760
+ # @return [String]
7761
+ attr_accessor :language
7762
+
7763
+ def initialize(**args)
7764
+ update!(**args)
7765
+ end
7766
+
7767
+ # Update properties of this object
7768
+ def update!(**args)
7769
+ @code = args[:code] if args.key?(:code)
7770
+ @language = args[:language] if args.key?(:language)
7771
+ end
7772
+ end
7773
+
7580
7774
  # Instance of a general execution.
7581
7775
  class GoogleCloudAiplatformV1Execution
7582
7776
  include Google::Apis::Core::Hashable
@@ -9785,6 +9979,22 @@ module Google
9785
9979
  attr_accessor :satisfies_pzs
9786
9980
  alias_method :satisfies_pzs?, :satisfies_pzs
9787
9981
 
9982
+ # Output only. A Service Account unique to this FeatureView. The role bigquery.
9983
+ # dataViewer should be granted to this service account to allow Vertex AI
9984
+ # Feature Store to sync data to the online store.
9985
+ # Corresponds to the JSON property `serviceAccountEmail`
9986
+ # @return [String]
9987
+ attr_accessor :service_account_email
9988
+
9989
+ # Optional. Service agent type used during data sync. By default, the Vertex AI
9990
+ # Service Agent is used. When using an IAM Policy to isolate this FeatureView
9991
+ # within a project, a separate service account should be provisioned by setting
9992
+ # this field to `SERVICE_AGENT_TYPE_FEATURE_VIEW`. This will generate a separate
9993
+ # service account to access the BigQuery source table.
9994
+ # Corresponds to the JSON property `serviceAgentType`
9995
+ # @return [String]
9996
+ attr_accessor :service_agent_type
9997
+
9788
9998
  # Configuration for Sync. Only one option is set.
9789
9999
  # Corresponds to the JSON property `syncConfig`
9790
10000
  # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1FeatureViewSyncConfig]
@@ -9816,6 +10026,8 @@ module Google
9816
10026
  @optimized_config = args[:optimized_config] if args.key?(:optimized_config)
9817
10027
  @satisfies_pzi = args[:satisfies_pzi] if args.key?(:satisfies_pzi)
9818
10028
  @satisfies_pzs = args[:satisfies_pzs] if args.key?(:satisfies_pzs)
10029
+ @service_account_email = args[:service_account_email] if args.key?(:service_account_email)
10030
+ @service_agent_type = args[:service_agent_type] if args.key?(:service_agent_type)
9819
10031
  @sync_config = args[:sync_config] if args.key?(:sync_config)
9820
10032
  @update_time = args[:update_time] if args.key?(:update_time)
9821
10033
  @vertex_rag_source = args[:vertex_rag_source] if args.key?(:vertex_rag_source)
@@ -10657,6 +10869,14 @@ module Google
10657
10869
  class GoogleCloudAiplatformV1FileData
10658
10870
  include Google::Apis::Core::Hashable
10659
10871
 
10872
+ # Optional. Display name of the file data. Used to provide a label or filename
10873
+ # to distinguish file datas. This field is only returned in PromptMessage for
10874
+ # prompt management. It is not currently used in the Gemini GenerateContent
10875
+ # calls.
10876
+ # Corresponds to the JSON property `displayName`
10877
+ # @return [String]
10878
+ attr_accessor :display_name
10879
+
10660
10880
  # Required. URI.
10661
10881
  # Corresponds to the JSON property `fileUri`
10662
10882
  # @return [String]
@@ -10673,6 +10893,7 @@ module Google
10673
10893
 
10674
10894
  # Update properties of this object
10675
10895
  def update!(**args)
10896
+ @display_name = args[:display_name] if args.key?(:display_name)
10676
10897
  @file_uri = args[:file_uri] if args.key?(:file_uri)
10677
10898
  @mime_type = args[:mime_type] if args.key?(:mime_type)
10678
10899
  end
@@ -11355,6 +11576,47 @@ module Google
11355
11576
  end
11356
11577
  end
11357
11578
 
11579
+ # Configuration for GenAiAdvancedFeatures.
11580
+ class GoogleCloudAiplatformV1GenAiAdvancedFeaturesConfig
11581
+ include Google::Apis::Core::Hashable
11582
+
11583
+ # Configuration for Retrieval Augmented Generation feature.
11584
+ # Corresponds to the JSON property `ragConfig`
11585
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1GenAiAdvancedFeaturesConfigRagConfig]
11586
+ attr_accessor :rag_config
11587
+
11588
+ def initialize(**args)
11589
+ update!(**args)
11590
+ end
11591
+
11592
+ # Update properties of this object
11593
+ def update!(**args)
11594
+ @rag_config = args[:rag_config] if args.key?(:rag_config)
11595
+ end
11596
+ end
11597
+
11598
+ # Configuration for Retrieval Augmented Generation feature.
11599
+ class GoogleCloudAiplatformV1GenAiAdvancedFeaturesConfigRagConfig
11600
+ include Google::Apis::Core::Hashable
11601
+
11602
+ # If true, enable Retrieval Augmented Generation in ChatCompletion request. Once
11603
+ # enabled, the endpoint will be identified as GenAI endpoint and Arthedain
11604
+ # router will be used.
11605
+ # Corresponds to the JSON property `enableRag`
11606
+ # @return [Boolean]
11607
+ attr_accessor :enable_rag
11608
+ alias_method :enable_rag?, :enable_rag
11609
+
11610
+ def initialize(**args)
11611
+ update!(**args)
11612
+ end
11613
+
11614
+ # Update properties of this object
11615
+ def update!(**args)
11616
+ @enable_rag = args[:enable_rag] if args.key?(:enable_rag)
11617
+ end
11618
+ end
11619
+
11358
11620
  # Request message for [PredictionService.GenerateContent].
11359
11621
  class GoogleCloudAiplatformV1GenerateContentRequest
11360
11622
  include Google::Apis::Core::Hashable
@@ -11442,6 +11704,11 @@ module Google
11442
11704
  # @return [Array<Google::Apis::AiplatformV1::GoogleCloudAiplatformV1Candidate>]
11443
11705
  attr_accessor :candidates
11444
11706
 
11707
+ # Output only. Timestamp when the request is made to the server.
11708
+ # Corresponds to the JSON property `createTime`
11709
+ # @return [String]
11710
+ attr_accessor :create_time
11711
+
11445
11712
  # Output only. The model version used to generate the response.
11446
11713
  # Corresponds to the JSON property `modelVersion`
11447
11714
  # @return [String]
@@ -11452,6 +11719,12 @@ module Google
11452
11719
  # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1GenerateContentResponsePromptFeedback]
11453
11720
  attr_accessor :prompt_feedback
11454
11721
 
11722
+ # Output only. response_id is used to identify each response. It is the encoding
11723
+ # of the event_id.
11724
+ # Corresponds to the JSON property `responseId`
11725
+ # @return [String]
11726
+ attr_accessor :response_id
11727
+
11455
11728
  # Usage metadata about response(s).
11456
11729
  # Corresponds to the JSON property `usageMetadata`
11457
11730
  # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1GenerateContentResponseUsageMetadata]
@@ -11464,8 +11737,10 @@ module Google
11464
11737
  # Update properties of this object
11465
11738
  def update!(**args)
11466
11739
  @candidates = args[:candidates] if args.key?(:candidates)
11740
+ @create_time = args[:create_time] if args.key?(:create_time)
11467
11741
  @model_version = args[:model_version] if args.key?(:model_version)
11468
11742
  @prompt_feedback = args[:prompt_feedback] if args.key?(:prompt_feedback)
11743
+ @response_id = args[:response_id] if args.key?(:response_id)
11469
11744
  @usage_metadata = args[:usage_metadata] if args.key?(:usage_metadata)
11470
11745
  end
11471
11746
  end
@@ -11505,6 +11780,11 @@ module Google
11505
11780
  class GoogleCloudAiplatformV1GenerateContentResponseUsageMetadata
11506
11781
  include Google::Apis::Core::Hashable
11507
11782
 
11783
+ # Output only. List of modalities of the cached content in the request input.
11784
+ # Corresponds to the JSON property `cacheTokensDetails`
11785
+ # @return [Array<Google::Apis::AiplatformV1::GoogleCloudAiplatformV1ModalityTokenCount>]
11786
+ attr_accessor :cache_tokens_details
11787
+
11508
11788
  # Output only. Number of tokens in the cached part in the input (the cached
11509
11789
  # content).
11510
11790
  # Corresponds to the JSON property `cachedContentTokenCount`
@@ -11516,6 +11796,11 @@ module Google
11516
11796
  # @return [Fixnum]
11517
11797
  attr_accessor :candidates_token_count
11518
11798
 
11799
+ # Output only. List of modalities that were returned in the response.
11800
+ # Corresponds to the JSON property `candidatesTokensDetails`
11801
+ # @return [Array<Google::Apis::AiplatformV1::GoogleCloudAiplatformV1ModalityTokenCount>]
11802
+ attr_accessor :candidates_tokens_details
11803
+
11519
11804
  # Number of tokens in the request. When `cached_content` is set, this is still
11520
11805
  # the total effective prompt size meaning this includes the number of tokens in
11521
11806
  # the cached content.
@@ -11523,6 +11808,11 @@ module Google
11523
11808
  # @return [Fixnum]
11524
11809
  attr_accessor :prompt_token_count
11525
11810
 
11811
+ # Output only. List of modalities that were processed in the request input.
11812
+ # Corresponds to the JSON property `promptTokensDetails`
11813
+ # @return [Array<Google::Apis::AiplatformV1::GoogleCloudAiplatformV1ModalityTokenCount>]
11814
+ attr_accessor :prompt_tokens_details
11815
+
11526
11816
  # Total token count for prompt and response candidates.
11527
11817
  # Corresponds to the JSON property `totalTokenCount`
11528
11818
  # @return [Fixnum]
@@ -11534,9 +11824,12 @@ module Google
11534
11824
 
11535
11825
  # Update properties of this object
11536
11826
  def update!(**args)
11827
+ @cache_tokens_details = args[:cache_tokens_details] if args.key?(:cache_tokens_details)
11537
11828
  @cached_content_token_count = args[:cached_content_token_count] if args.key?(:cached_content_token_count)
11538
11829
  @candidates_token_count = args[:candidates_token_count] if args.key?(:candidates_token_count)
11830
+ @candidates_tokens_details = args[:candidates_tokens_details] if args.key?(:candidates_tokens_details)
11539
11831
  @prompt_token_count = args[:prompt_token_count] if args.key?(:prompt_token_count)
11832
+ @prompt_tokens_details = args[:prompt_tokens_details] if args.key?(:prompt_tokens_details)
11540
11833
  @total_token_count = args[:total_token_count] if args.key?(:total_token_count)
11541
11834
  end
11542
11835
  end
@@ -11572,6 +11865,11 @@ module Google
11572
11865
  # @return [Fixnum]
11573
11866
  attr_accessor :max_output_tokens
11574
11867
 
11868
+ # Optional. If specified, the media resolution specified will be used.
11869
+ # Corresponds to the JSON property `mediaResolution`
11870
+ # @return [String]
11871
+ attr_accessor :media_resolution
11872
+
11575
11873
  # Optional. Positive penalties.
11576
11874
  # Corresponds to the JSON property `presencePenalty`
11577
11875
  # @return [Float]
@@ -11629,11 +11927,6 @@ module Google
11629
11927
  # @return [Float]
11630
11928
  attr_accessor :temperature
11631
11929
 
11632
- # Optional. If specified, the token resolution specified will be used.
11633
- # Corresponds to the JSON property `tokenResolution`
11634
- # @return [String]
11635
- attr_accessor :token_resolution
11636
-
11637
11930
  # Optional. If specified, top-k sampling will be used.
11638
11931
  # Corresponds to the JSON property `topK`
11639
11932
  # @return [Float]
@@ -11655,6 +11948,7 @@ module Google
11655
11948
  @frequency_penalty = args[:frequency_penalty] if args.key?(:frequency_penalty)
11656
11949
  @logprobs = args[:logprobs] if args.key?(:logprobs)
11657
11950
  @max_output_tokens = args[:max_output_tokens] if args.key?(:max_output_tokens)
11951
+ @media_resolution = args[:media_resolution] if args.key?(:media_resolution)
11658
11952
  @presence_penalty = args[:presence_penalty] if args.key?(:presence_penalty)
11659
11953
  @response_logprobs = args[:response_logprobs] if args.key?(:response_logprobs)
11660
11954
  @response_mime_type = args[:response_mime_type] if args.key?(:response_mime_type)
@@ -11665,7 +11959,6 @@ module Google
11665
11959
  @speech_config = args[:speech_config] if args.key?(:speech_config)
11666
11960
  @stop_sequences = args[:stop_sequences] if args.key?(:stop_sequences)
11667
11961
  @temperature = args[:temperature] if args.key?(:temperature)
11668
- @token_resolution = args[:token_resolution] if args.key?(:token_resolution)
11669
11962
  @top_k = args[:top_k] if args.key?(:top_k)
11670
11963
  @top_p = args[:top_p] if args.key?(:top_p)
11671
11964
  end
@@ -14265,6 +14558,32 @@ module Google
14265
14558
  end
14266
14559
  end
14267
14560
 
14561
+ # Response message for ModelService.ListModelVersionCheckpoints
14562
+ class GoogleCloudAiplatformV1ListModelVersionCheckpointsResponse
14563
+ include Google::Apis::Core::Hashable
14564
+
14565
+ # List of Model Version checkpoints.
14566
+ # Corresponds to the JSON property `checkpoints`
14567
+ # @return [Array<Google::Apis::AiplatformV1::GoogleCloudAiplatformV1ModelVersionCheckpoint>]
14568
+ attr_accessor :checkpoints
14569
+
14570
+ # A token to retrieve the next page of results. Pass to
14571
+ # ListModelVersionCheckpointsRequest.page_token to obtain that page.
14572
+ # Corresponds to the JSON property `nextPageToken`
14573
+ # @return [String]
14574
+ attr_accessor :next_page_token
14575
+
14576
+ def initialize(**args)
14577
+ update!(**args)
14578
+ end
14579
+
14580
+ # Update properties of this object
14581
+ def update!(**args)
14582
+ @checkpoints = args[:checkpoints] if args.key?(:checkpoints)
14583
+ @next_page_token = args[:next_page_token] if args.key?(:next_page_token)
14584
+ end
14585
+ end
14586
+
14268
14587
  # Response message for ModelService.ListModelVersions
14269
14588
  class GoogleCloudAiplatformV1ListModelVersionsResponse
14270
14589
  include Google::Apis::Core::Hashable
@@ -15021,6 +15340,12 @@ module Google
15021
15340
  # @return [String]
15022
15341
  attr_accessor :machine_type
15023
15342
 
15343
+ # Optional. Immutable. The number of nodes per replica for multihost GPU
15344
+ # deployments.
15345
+ # Corresponds to the JSON property `multihostGpuNodeCount`
15346
+ # @return [Fixnum]
15347
+ attr_accessor :multihost_gpu_node_count
15348
+
15024
15349
  # A ReservationAffinity can be used to configure a Vertex AI resource (e.g., a
15025
15350
  # DeployedModel) to draw its Compute Engine resources from a Shared Reservation,
15026
15351
  # or exclusively from on-demand capacity.
@@ -15043,6 +15368,7 @@ module Google
15043
15368
  @accelerator_count = args[:accelerator_count] if args.key?(:accelerator_count)
15044
15369
  @accelerator_type = args[:accelerator_type] if args.key?(:accelerator_type)
15045
15370
  @machine_type = args[:machine_type] if args.key?(:machine_type)
15371
+ @multihost_gpu_node_count = args[:multihost_gpu_node_count] if args.key?(:multihost_gpu_node_count)
15046
15372
  @reservation_affinity = args[:reservation_affinity] if args.key?(:reservation_affinity)
15047
15373
  @tpu_topology = args[:tpu_topology] if args.key?(:tpu_topology)
15048
15374
  end
@@ -15311,6 +15637,58 @@ module Google
15311
15637
  end
15312
15638
  end
15313
15639
 
15640
+ # The metric used for dataset level evaluation.
15641
+ class GoogleCloudAiplatformV1Metric
15642
+ include Google::Apis::Core::Hashable
15643
+
15644
+ # Optional. The aggregation metrics to use.
15645
+ # Corresponds to the JSON property `aggregationMetrics`
15646
+ # @return [Array<String>]
15647
+ attr_accessor :aggregation_metrics
15648
+
15649
+ # Spec for bleu score metric - calculates the precision of n-grams in the
15650
+ # prediction as compared to reference - returns a score ranging between 0 to 1.
15651
+ # Corresponds to the JSON property `bleuSpec`
15652
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1BleuSpec]
15653
+ attr_accessor :bleu_spec
15654
+
15655
+ # Spec for exact match metric - returns 1 if prediction and reference exactly
15656
+ # matches, otherwise 0.
15657
+ # Corresponds to the JSON property `exactMatchSpec`
15658
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1ExactMatchSpec]
15659
+ attr_accessor :exact_match_spec
15660
+
15661
+ # Spec for pairwise metric.
15662
+ # Corresponds to the JSON property `pairwiseMetricSpec`
15663
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1PairwiseMetricSpec]
15664
+ attr_accessor :pairwise_metric_spec
15665
+
15666
+ # Spec for pointwise metric.
15667
+ # Corresponds to the JSON property `pointwiseMetricSpec`
15668
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1PointwiseMetricSpec]
15669
+ attr_accessor :pointwise_metric_spec
15670
+
15671
+ # Spec for rouge score metric - calculates the recall of n-grams in prediction
15672
+ # as compared to reference - returns a score ranging between 0 and 1.
15673
+ # Corresponds to the JSON property `rougeSpec`
15674
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1RougeSpec]
15675
+ attr_accessor :rouge_spec
15676
+
15677
+ def initialize(**args)
15678
+ update!(**args)
15679
+ end
15680
+
15681
+ # Update properties of this object
15682
+ def update!(**args)
15683
+ @aggregation_metrics = args[:aggregation_metrics] if args.key?(:aggregation_metrics)
15684
+ @bleu_spec = args[:bleu_spec] if args.key?(:bleu_spec)
15685
+ @exact_match_spec = args[:exact_match_spec] if args.key?(:exact_match_spec)
15686
+ @pairwise_metric_spec = args[:pairwise_metric_spec] if args.key?(:pairwise_metric_spec)
15687
+ @pointwise_metric_spec = args[:pointwise_metric_spec] if args.key?(:pointwise_metric_spec)
15688
+ @rouge_spec = args[:rouge_spec] if args.key?(:rouge_spec)
15689
+ end
15690
+ end
15691
+
15314
15692
  # Input for MetricX metric.
15315
15693
  class GoogleCloudAiplatformV1MetricxInput
15316
15694
  include Google::Apis::Core::Hashable
@@ -15829,6 +16207,31 @@ module Google
15829
16207
  end
15830
16208
  end
15831
16209
 
16210
+ # Represents token counting info for a single modality.
16211
+ class GoogleCloudAiplatformV1ModalityTokenCount
16212
+ include Google::Apis::Core::Hashable
16213
+
16214
+ # The modality associated with this token count.
16215
+ # Corresponds to the JSON property `modality`
16216
+ # @return [String]
16217
+ attr_accessor :modality
16218
+
16219
+ # Number of tokens.
16220
+ # Corresponds to the JSON property `tokenCount`
16221
+ # @return [Fixnum]
16222
+ attr_accessor :token_count
16223
+
16224
+ def initialize(**args)
16225
+ update!(**args)
16226
+ end
16227
+
16228
+ # Update properties of this object
16229
+ def update!(**args)
16230
+ @modality = args[:modality] if args.key?(:modality)
16231
+ @token_count = args[:token_count] if args.key?(:token_count)
16232
+ end
16233
+ end
16234
+
15832
16235
  # A trained machine learning Model.
15833
16236
  class GoogleCloudAiplatformV1Model
15834
16237
  include Google::Apis::Core::Hashable
@@ -15863,6 +16266,11 @@ module Google
15863
16266
  # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1ModelDataStats]
15864
16267
  attr_accessor :data_stats
15865
16268
 
16269
+ # The default checkpoint id of a model version.
16270
+ # Corresponds to the JSON property `defaultCheckpointId`
16271
+ # @return [String]
16272
+ attr_accessor :default_checkpoint_id
16273
+
15866
16274
  # Output only. The pointers to DeployedModels created from this Model. Note that
15867
16275
  # Model could have been deployed to Endpoints in different Locations.
15868
16276
  # Corresponds to the JSON property `deployedModels`
@@ -16083,6 +16491,7 @@ module Google
16083
16491
  @container_spec = args[:container_spec] if args.key?(:container_spec)
16084
16492
  @create_time = args[:create_time] if args.key?(:create_time)
16085
16493
  @data_stats = args[:data_stats] if args.key?(:data_stats)
16494
+ @default_checkpoint_id = args[:default_checkpoint_id] if args.key?(:default_checkpoint_id)
16086
16495
  @deployed_models = args[:deployed_models] if args.key?(:deployed_models)
16087
16496
  @description = args[:description] if args.key?(:description)
16088
16497
  @display_name = args[:display_name] if args.key?(:display_name)
@@ -16286,6 +16695,12 @@ module Google
16286
16695
  # @return [String]
16287
16696
  attr_accessor :image_uri
16288
16697
 
16698
+ # Probe describes a health check to be performed against a container to
16699
+ # determine whether it is alive or ready to receive traffic.
16700
+ # Corresponds to the JSON property `livenessProbe`
16701
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1Probe]
16702
+ attr_accessor :liveness_probe
16703
+
16289
16704
  # Immutable. List of ports to expose from the container. Vertex AI sends any
16290
16705
  # prediction requests that it receives to the first port on this list. Vertex AI
16291
16706
  # also sends [liveness and health checks](https://cloud.google.com/vertex-ai/
@@ -16348,6 +16763,7 @@ module Google
16348
16763
  @health_probe = args[:health_probe] if args.key?(:health_probe)
16349
16764
  @health_route = args[:health_route] if args.key?(:health_route)
16350
16765
  @image_uri = args[:image_uri] if args.key?(:image_uri)
16766
+ @liveness_probe = args[:liveness_probe] if args.key?(:liveness_probe)
16351
16767
  @ports = args[:ports] if args.key?(:ports)
16352
16768
  @predict_route = args[:predict_route] if args.key?(:predict_route)
16353
16769
  @shared_memory_size_mb = args[:shared_memory_size_mb] if args.key?(:shared_memory_size_mb)
@@ -17130,7 +17546,7 @@ module Google
17130
17546
  # model in SavedModel format. * `tf-js` A [TensorFlow.js](https://www.tensorflow.
17131
17547
  # org/js) model that can be used in the browser and in Node.js using JavaScript.
17132
17548
  # * `core-ml` Used for iOS mobile devices. * `custom-trained` A Model that was
17133
- # uploaded or trained by custom code.
17549
+ # uploaded or trained by custom code. * `genie` A tuned Model Garden model.
17134
17550
  # Corresponds to the JSON property `id`
17135
17551
  # @return [String]
17136
17552
  attr_accessor :id
@@ -17156,6 +17572,17 @@ module Google
17156
17572
  # @return [String]
17157
17573
  attr_accessor :public_model_name
17158
17574
 
17575
+ # Optional. Whether to avoid pulling the model from the HF cache.
17576
+ # Corresponds to the JSON property `skipHfModelCache`
17577
+ # @return [Boolean]
17578
+ attr_accessor :skip_hf_model_cache
17579
+ alias_method :skip_hf_model_cache?, :skip_hf_model_cache
17580
+
17581
+ # Optional. The model garden source model version ID.
17582
+ # Corresponds to the JSON property `versionId`
17583
+ # @return [String]
17584
+ attr_accessor :version_id
17585
+
17159
17586
  def initialize(**args)
17160
17587
  update!(**args)
17161
17588
  end
@@ -17163,6 +17590,8 @@ module Google
17163
17590
  # Update properties of this object
17164
17591
  def update!(**args)
17165
17592
  @public_model_name = args[:public_model_name] if args.key?(:public_model_name)
17593
+ @skip_hf_model_cache = args[:skip_hf_model_cache] if args.key?(:skip_hf_model_cache)
17594
+ @version_id = args[:version_id] if args.key?(:version_id)
17166
17595
  end
17167
17596
  end
17168
17597
 
@@ -17576,6 +18005,45 @@ module Google
17576
18005
  end
17577
18006
  end
17578
18007
 
18008
+ # Describes the machine learning model version checkpoint.
18009
+ class GoogleCloudAiplatformV1ModelVersionCheckpoint
18010
+ include Google::Apis::Core::Hashable
18011
+
18012
+ # The ID of the checkpoint.
18013
+ # Corresponds to the JSON property `checkpointId`
18014
+ # @return [String]
18015
+ attr_accessor :checkpoint_id
18016
+
18017
+ # The epoch of the checkpoint.
18018
+ # Corresponds to the JSON property `epoch`
18019
+ # @return [Fixnum]
18020
+ attr_accessor :epoch
18021
+
18022
+ # Identifier. The resource name of the ModelVersionCheckpoint. Format: `projects/
18023
+ # `project`/locations/`location`/models/`model`/versions/`version`/checkpoints/`
18024
+ # checkpoint``
18025
+ # Corresponds to the JSON property `name`
18026
+ # @return [String]
18027
+ attr_accessor :name
18028
+
18029
+ # The step of the checkpoint.
18030
+ # Corresponds to the JSON property `step`
18031
+ # @return [Fixnum]
18032
+ attr_accessor :step
18033
+
18034
+ def initialize(**args)
18035
+ update!(**args)
18036
+ end
18037
+
18038
+ # Update properties of this object
18039
+ def update!(**args)
18040
+ @checkpoint_id = args[:checkpoint_id] if args.key?(:checkpoint_id)
18041
+ @epoch = args[:epoch] if args.key?(:epoch)
18042
+ @name = args[:name] if args.key?(:name)
18043
+ @step = args[:step] if args.key?(:step)
18044
+ end
18045
+ end
18046
+
17579
18047
  # Runtime operation information for IndexEndpointService.MutateDeployedIndex.
17580
18048
  class GoogleCloudAiplatformV1MutateDeployedIndexOperationMetadata
17581
18049
  include Google::Apis::Core::Hashable
@@ -18685,8 +19153,8 @@ module Google
18685
19153
  # @return [String]
18686
19154
  attr_accessor :notebook_runtime_template_resource_name
18687
19155
 
18688
- # Output only. The Schedule resource name if this job is triggered by one.
18689
- # Format: `projects/`project_id`/locations/`location`/schedules/`schedule_id``
19156
+ # The Schedule resource name if this job is triggered by one. Format: `projects/`
19157
+ # project_id`/locations/`location`/schedules/`schedule_id``
18690
19158
  # Corresponds to the JSON property `scheduleResourceName`
18691
19159
  # @return [String]
18692
19160
  attr_accessor :schedule_resource_name
@@ -19049,6 +19517,11 @@ module Google
19049
19517
  # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1ShieldedVmConfig]
19050
19518
  attr_accessor :shielded_vm_config
19051
19519
 
19520
+ # Notebook Software Config.
19521
+ # Corresponds to the JSON property `softwareConfig`
19522
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1NotebookSoftwareConfig]
19523
+ attr_accessor :software_config
19524
+
19052
19525
  # Output only. Timestamp when this NotebookRuntime was most recently updated.
19053
19526
  # Corresponds to the JSON property `updateTime`
19054
19527
  # @return [String]
@@ -19089,6 +19562,7 @@ module Google
19089
19562
  @satisfies_pzs = args[:satisfies_pzs] if args.key?(:satisfies_pzs)
19090
19563
  @service_account = args[:service_account] if args.key?(:service_account)
19091
19564
  @shielded_vm_config = args[:shielded_vm_config] if args.key?(:shielded_vm_config)
19565
+ @software_config = args[:software_config] if args.key?(:software_config)
19092
19566
  @update_time = args[:update_time] if args.key?(:update_time)
19093
19567
  @version = args[:version] if args.key?(:version)
19094
19568
  end
@@ -19207,6 +19681,11 @@ module Google
19207
19681
  # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1ShieldedVmConfig]
19208
19682
  attr_accessor :shielded_vm_config
19209
19683
 
19684
+ # Notebook Software Config.
19685
+ # Corresponds to the JSON property `softwareConfig`
19686
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1NotebookSoftwareConfig]
19687
+ attr_accessor :software_config
19688
+
19210
19689
  # Output only. Timestamp when this NotebookRuntimeTemplate was most recently
19211
19690
  # updated.
19212
19691
  # Corresponds to the JSON property `updateTime`
@@ -19236,6 +19715,7 @@ module Google
19236
19715
  @notebook_runtime_type = args[:notebook_runtime_type] if args.key?(:notebook_runtime_type)
19237
19716
  @service_account = args[:service_account] if args.key?(:service_account)
19238
19717
  @shielded_vm_config = args[:shielded_vm_config] if args.key?(:shielded_vm_config)
19718
+ @software_config = args[:software_config] if args.key?(:software_config)
19239
19719
  @update_time = args[:update_time] if args.key?(:update_time)
19240
19720
  end
19241
19721
  end
@@ -19259,6 +19739,51 @@ module Google
19259
19739
  end
19260
19740
  end
19261
19741
 
19742
+ # Notebook Software Config.
19743
+ class GoogleCloudAiplatformV1NotebookSoftwareConfig
19744
+ include Google::Apis::Core::Hashable
19745
+
19746
+ # Optional. Environment variables to be passed to the container. Maximum limit
19747
+ # is 100.
19748
+ # Corresponds to the JSON property `env`
19749
+ # @return [Array<Google::Apis::AiplatformV1::GoogleCloudAiplatformV1EnvVar>]
19750
+ attr_accessor :env
19751
+
19752
+ # Post startup script config.
19753
+ # Corresponds to the JSON property `postStartupScriptConfig`
19754
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1PostStartupScriptConfig]
19755
+ attr_accessor :post_startup_script_config
19756
+
19757
+ def initialize(**args)
19758
+ update!(**args)
19759
+ end
19760
+
19761
+ # Update properties of this object
19762
+ def update!(**args)
19763
+ @env = args[:env] if args.key?(:env)
19764
+ @post_startup_script_config = args[:post_startup_script_config] if args.key?(:post_startup_script_config)
19765
+ end
19766
+ end
19767
+
19768
+ # Config for evaluation output.
19769
+ class GoogleCloudAiplatformV1OutputConfig
19770
+ include Google::Apis::Core::Hashable
19771
+
19772
+ # The Google Cloud Storage location where the output is to be written to.
19773
+ # Corresponds to the JSON property `gcsDestination`
19774
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1GcsDestination]
19775
+ attr_accessor :gcs_destination
19776
+
19777
+ def initialize(**args)
19778
+ update!(**args)
19779
+ end
19780
+
19781
+ # Update properties of this object
19782
+ def update!(**args)
19783
+ @gcs_destination = args[:gcs_destination] if args.key?(:gcs_destination)
19784
+ end
19785
+ end
19786
+
19262
19787
  # PSC config that is used to automatically create forwarding rule via
19263
19788
  # ServiceConnectionMap.
19264
19789
  class GoogleCloudAiplatformV1PscAutomationConfig
@@ -19365,18 +19890,36 @@ module Google
19365
19890
  class GoogleCloudAiplatformV1PairwiseMetricSpec
19366
19891
  include Google::Apis::Core::Hashable
19367
19892
 
19893
+ # Optional. The field name of the baseline response.
19894
+ # Corresponds to the JSON property `baselineResponseFieldName`
19895
+ # @return [String]
19896
+ attr_accessor :baseline_response_field_name
19897
+
19898
+ # Optional. The field name of the candidate response.
19899
+ # Corresponds to the JSON property `candidateResponseFieldName`
19900
+ # @return [String]
19901
+ attr_accessor :candidate_response_field_name
19902
+
19368
19903
  # Required. Metric prompt template for pairwise metric.
19369
19904
  # Corresponds to the JSON property `metricPromptTemplate`
19370
19905
  # @return [String]
19371
19906
  attr_accessor :metric_prompt_template
19372
19907
 
19908
+ # Optional. System instructions for pairwise metric.
19909
+ # Corresponds to the JSON property `systemInstruction`
19910
+ # @return [String]
19911
+ attr_accessor :system_instruction
19912
+
19373
19913
  def initialize(**args)
19374
19914
  update!(**args)
19375
19915
  end
19376
19916
 
19377
19917
  # Update properties of this object
19378
19918
  def update!(**args)
19919
+ @baseline_response_field_name = args[:baseline_response_field_name] if args.key?(:baseline_response_field_name)
19920
+ @candidate_response_field_name = args[:candidate_response_field_name] if args.key?(:candidate_response_field_name)
19379
19921
  @metric_prompt_template = args[:metric_prompt_template] if args.key?(:metric_prompt_template)
19922
+ @system_instruction = args[:system_instruction] if args.key?(:system_instruction)
19380
19923
  end
19381
19924
  end
19382
19925
 
@@ -19640,6 +20183,19 @@ module Google
19640
20183
  class GoogleCloudAiplatformV1Part
19641
20184
  include Google::Apis::Core::Hashable
19642
20185
 
20186
+ # Result of executing the [ExecutableCode]. Always follows a `part` containing
20187
+ # the [ExecutableCode].
20188
+ # Corresponds to the JSON property `codeExecutionResult`
20189
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1CodeExecutionResult]
20190
+ attr_accessor :code_execution_result
20191
+
20192
+ # Code generated by the model that is meant to be executed, and the result
20193
+ # returned to the model. Generated when using the [FunctionDeclaration] tool and
20194
+ # [FunctionCallingConfig] mode is set to [Mode.CODE].
20195
+ # Corresponds to the JSON property `executableCode`
20196
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1ExecutableCode]
20197
+ attr_accessor :executable_code
20198
+
19643
20199
  # URI based data.
19644
20200
  # Corresponds to the JSON property `fileData`
19645
20201
  # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1FileData]
@@ -19660,7 +20216,7 @@ module Google
19660
20216
  # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1FunctionResponse]
19661
20217
  attr_accessor :function_response
19662
20218
 
19663
- # Content blob. It's preferred to send as text directly rather than raw bytes.
20219
+ # Content blob.
19664
20220
  # Corresponds to the JSON property `inlineData`
19665
20221
  # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1Blob]
19666
20222
  attr_accessor :inline_data
@@ -19681,6 +20237,8 @@ module Google
19681
20237
 
19682
20238
  # Update properties of this object
19683
20239
  def update!(**args)
20240
+ @code_execution_result = args[:code_execution_result] if args.key?(:code_execution_result)
20241
+ @executable_code = args[:executable_code] if args.key?(:executable_code)
19684
20242
  @file_data = args[:file_data] if args.key?(:file_data)
19685
20243
  @function_call = args[:function_call] if args.key?(:function_call)
19686
20244
  @function_response = args[:function_response] if args.key?(:function_response)
@@ -20521,6 +21079,11 @@ module Google
20521
21079
  # @return [String]
20522
21080
  attr_accessor :metric_prompt_template
20523
21081
 
21082
+ # Optional. System instructions for pointwise metric.
21083
+ # Corresponds to the JSON property `systemInstruction`
21084
+ # @return [String]
21085
+ attr_accessor :system_instruction
21086
+
20524
21087
  def initialize(**args)
20525
21088
  update!(**args)
20526
21089
  end
@@ -20528,6 +21091,7 @@ module Google
20528
21091
  # Update properties of this object
20529
21092
  def update!(**args)
20530
21093
  @metric_prompt_template = args[:metric_prompt_template] if args.key?(:metric_prompt_template)
21094
+ @system_instruction = args[:system_instruction] if args.key?(:system_instruction)
20531
21095
  end
20532
21096
  end
20533
21097
 
@@ -20551,6 +21115,39 @@ module Google
20551
21115
  end
20552
21116
  end
20553
21117
 
21118
+ # Post startup script config.
21119
+ class GoogleCloudAiplatformV1PostStartupScriptConfig
21120
+ include Google::Apis::Core::Hashable
21121
+
21122
+ # Optional. Post startup script to run after runtime is started.
21123
+ # Corresponds to the JSON property `postStartupScript`
21124
+ # @return [String]
21125
+ attr_accessor :post_startup_script
21126
+
21127
+ # Optional. Post startup script behavior that defines download and execution
21128
+ # behavior.
21129
+ # Corresponds to the JSON property `postStartupScriptBehavior`
21130
+ # @return [String]
21131
+ attr_accessor :post_startup_script_behavior
21132
+
21133
+ # Optional. Post startup script url to download. Example: https://bucket/script.
21134
+ # sh
21135
+ # Corresponds to the JSON property `postStartupScriptUrl`
21136
+ # @return [String]
21137
+ attr_accessor :post_startup_script_url
21138
+
21139
+ def initialize(**args)
21140
+ update!(**args)
21141
+ end
21142
+
21143
+ # Update properties of this object
21144
+ def update!(**args)
21145
+ @post_startup_script = args[:post_startup_script] if args.key?(:post_startup_script)
21146
+ @post_startup_script_behavior = args[:post_startup_script_behavior] if args.key?(:post_startup_script_behavior)
21147
+ @post_startup_script_url = args[:post_startup_script_url] if args.key?(:post_startup_script_url)
21148
+ end
21149
+ end
21150
+
20554
21151
  # The configuration for the prebuilt speaker to use.
20555
21152
  class GoogleCloudAiplatformV1PrebuiltVoiceConfig
20556
21153
  include Google::Apis::Core::Hashable
@@ -20915,6 +21512,28 @@ module Google
20915
21512
  # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1ProbeExecAction]
20916
21513
  attr_accessor :exec
20917
21514
 
21515
+ # Number of consecutive failures before the probe is considered failed. Defaults
21516
+ # to 3. Minimum value is 1. Maps to Kubernetes probe argument 'failureThreshold'.
21517
+ # Corresponds to the JSON property `failureThreshold`
21518
+ # @return [Fixnum]
21519
+ attr_accessor :failure_threshold
21520
+
21521
+ # GrpcAction checks the health of a container using a gRPC service.
21522
+ # Corresponds to the JSON property `grpc`
21523
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1ProbeGrpcAction]
21524
+ attr_accessor :grpc
21525
+
21526
+ # HttpGetAction describes an action based on HTTP Get requests.
21527
+ # Corresponds to the JSON property `httpGet`
21528
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1ProbeHttpGetAction]
21529
+ attr_accessor :http_get
21530
+
21531
+ # Number of seconds to wait before starting the probe. Defaults to 0. Minimum
21532
+ # value is 0. Maps to Kubernetes probe argument 'initialDelaySeconds'.
21533
+ # Corresponds to the JSON property `initialDelaySeconds`
21534
+ # @return [Fixnum]
21535
+ attr_accessor :initial_delay_seconds
21536
+
20918
21537
  # How often (in seconds) to perform the probe. Default to 10 seconds. Minimum
20919
21538
  # value is 1. Must be less than timeout_seconds. Maps to Kubernetes probe
20920
21539
  # argument 'periodSeconds'.
@@ -20922,6 +21541,19 @@ module Google
20922
21541
  # @return [Fixnum]
20923
21542
  attr_accessor :period_seconds
20924
21543
 
21544
+ # Number of consecutive successes before the probe is considered successful.
21545
+ # Defaults to 1. Minimum value is 1. Maps to Kubernetes probe argument '
21546
+ # successThreshold'.
21547
+ # Corresponds to the JSON property `successThreshold`
21548
+ # @return [Fixnum]
21549
+ attr_accessor :success_threshold
21550
+
21551
+ # TcpSocketAction probes the health of a container by opening a TCP socket
21552
+ # connection.
21553
+ # Corresponds to the JSON property `tcpSocket`
21554
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1ProbeTcpSocketAction]
21555
+ attr_accessor :tcp_socket
21556
+
20925
21557
  # Number of seconds after which the probe times out. Defaults to 1 second.
20926
21558
  # Minimum value is 1. Must be greater or equal to period_seconds. Maps to
20927
21559
  # Kubernetes probe argument 'timeoutSeconds'.
@@ -20936,7 +21568,13 @@ module Google
20936
21568
  # Update properties of this object
20937
21569
  def update!(**args)
20938
21570
  @exec = args[:exec] if args.key?(:exec)
21571
+ @failure_threshold = args[:failure_threshold] if args.key?(:failure_threshold)
21572
+ @grpc = args[:grpc] if args.key?(:grpc)
21573
+ @http_get = args[:http_get] if args.key?(:http_get)
21574
+ @initial_delay_seconds = args[:initial_delay_seconds] if args.key?(:initial_delay_seconds)
20939
21575
  @period_seconds = args[:period_seconds] if args.key?(:period_seconds)
21576
+ @success_threshold = args[:success_threshold] if args.key?(:success_threshold)
21577
+ @tcp_socket = args[:tcp_socket] if args.key?(:tcp_socket)
20940
21578
  @timeout_seconds = args[:timeout_seconds] if args.key?(:timeout_seconds)
20941
21579
  end
20942
21580
  end
@@ -20965,6 +21603,133 @@ module Google
20965
21603
  end
20966
21604
  end
20967
21605
 
21606
+ # GrpcAction checks the health of a container using a gRPC service.
21607
+ class GoogleCloudAiplatformV1ProbeGrpcAction
21608
+ include Google::Apis::Core::Hashable
21609
+
21610
+ # Port number of the gRPC service. Number must be in the range 1 to 65535.
21611
+ # Corresponds to the JSON property `port`
21612
+ # @return [Fixnum]
21613
+ attr_accessor :port
21614
+
21615
+ # Service is the name of the service to place in the gRPC HealthCheckRequest (
21616
+ # see https://github.com/grpc/grpc/blob/master/doc/health-checking.md). If this
21617
+ # is not specified, the default behavior is defined by gRPC.
21618
+ # Corresponds to the JSON property `service`
21619
+ # @return [String]
21620
+ attr_accessor :service
21621
+
21622
+ def initialize(**args)
21623
+ update!(**args)
21624
+ end
21625
+
21626
+ # Update properties of this object
21627
+ def update!(**args)
21628
+ @port = args[:port] if args.key?(:port)
21629
+ @service = args[:service] if args.key?(:service)
21630
+ end
21631
+ end
21632
+
21633
+ # HttpGetAction describes an action based on HTTP Get requests.
21634
+ class GoogleCloudAiplatformV1ProbeHttpGetAction
21635
+ include Google::Apis::Core::Hashable
21636
+
21637
+ # Host name to connect to, defaults to the model serving container's IP. You
21638
+ # probably want to set "Host" in httpHeaders instead.
21639
+ # Corresponds to the JSON property `host`
21640
+ # @return [String]
21641
+ attr_accessor :host
21642
+
21643
+ # Custom headers to set in the request. HTTP allows repeated headers.
21644
+ # Corresponds to the JSON property `httpHeaders`
21645
+ # @return [Array<Google::Apis::AiplatformV1::GoogleCloudAiplatformV1ProbeHttpHeader>]
21646
+ attr_accessor :http_headers
21647
+
21648
+ # Path to access on the HTTP server.
21649
+ # Corresponds to the JSON property `path`
21650
+ # @return [String]
21651
+ attr_accessor :path
21652
+
21653
+ # Number of the port to access on the container. Number must be in the range 1
21654
+ # to 65535.
21655
+ # Corresponds to the JSON property `port`
21656
+ # @return [Fixnum]
21657
+ attr_accessor :port
21658
+
21659
+ # Scheme to use for connecting to the host. Defaults to HTTP. Acceptable values
21660
+ # are "HTTP" or "HTTPS".
21661
+ # Corresponds to the JSON property `scheme`
21662
+ # @return [String]
21663
+ attr_accessor :scheme
21664
+
21665
+ def initialize(**args)
21666
+ update!(**args)
21667
+ end
21668
+
21669
+ # Update properties of this object
21670
+ def update!(**args)
21671
+ @host = args[:host] if args.key?(:host)
21672
+ @http_headers = args[:http_headers] if args.key?(:http_headers)
21673
+ @path = args[:path] if args.key?(:path)
21674
+ @port = args[:port] if args.key?(:port)
21675
+ @scheme = args[:scheme] if args.key?(:scheme)
21676
+ end
21677
+ end
21678
+
21679
+ # HttpHeader describes a custom header to be used in HTTP probes
21680
+ class GoogleCloudAiplatformV1ProbeHttpHeader
21681
+ include Google::Apis::Core::Hashable
21682
+
21683
+ # The header field name. This will be canonicalized upon output, so case-variant
21684
+ # names will be understood as the same header.
21685
+ # Corresponds to the JSON property `name`
21686
+ # @return [String]
21687
+ attr_accessor :name
21688
+
21689
+ # The header field value
21690
+ # Corresponds to the JSON property `value`
21691
+ # @return [String]
21692
+ attr_accessor :value
21693
+
21694
+ def initialize(**args)
21695
+ update!(**args)
21696
+ end
21697
+
21698
+ # Update properties of this object
21699
+ def update!(**args)
21700
+ @name = args[:name] if args.key?(:name)
21701
+ @value = args[:value] if args.key?(:value)
21702
+ end
21703
+ end
21704
+
21705
+ # TcpSocketAction probes the health of a container by opening a TCP socket
21706
+ # connection.
21707
+ class GoogleCloudAiplatformV1ProbeTcpSocketAction
21708
+ include Google::Apis::Core::Hashable
21709
+
21710
+ # Optional: Host name to connect to, defaults to the model serving container's
21711
+ # IP.
21712
+ # Corresponds to the JSON property `host`
21713
+ # @return [String]
21714
+ attr_accessor :host
21715
+
21716
+ # Number of the port to access on the container. Number must be in the range 1
21717
+ # to 65535.
21718
+ # Corresponds to the JSON property `port`
21719
+ # @return [Fixnum]
21720
+ attr_accessor :port
21721
+
21722
+ def initialize(**args)
21723
+ update!(**args)
21724
+ end
21725
+
21726
+ # Update properties of this object
21727
+ def update!(**args)
21728
+ @host = args[:host] if args.key?(:host)
21729
+ @port = args[:port] if args.key?(:port)
21730
+ end
21731
+ end
21732
+
20968
21733
  # PscAutomatedEndpoints defines the output of the forwarding rule automatically
20969
21734
  # created by each PscAutomationConfig.
20970
21735
  class GoogleCloudAiplatformV1PscAutomatedEndpoints
@@ -21200,8 +21965,8 @@ module Google
21200
21965
  # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1ModelContainerSpec]
21201
21966
  attr_accessor :container_spec
21202
21967
 
21203
- # A description of resources that are dedicated to a DeployedModel, and that
21204
- # need a higher degree of manual configuration.
21968
+ # A description of resources that are dedicated to a DeployedModel or
21969
+ # DeployedIndex, and that need a higher degree of manual configuration.
21205
21970
  # Corresponds to the JSON property `dedicatedResources`
21206
21971
  # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1DedicatedResources]
21207
21972
  attr_accessor :dedicated_resources
@@ -22755,7 +23520,8 @@ module Google
22755
23520
  class GoogleCloudAiplatformV1RagVectorDbConfig
22756
23521
  include Google::Apis::Core::Hashable
22757
23522
 
22758
- # The generic reusable api auth config.
23523
+ # The generic reusable api auth config. Deprecated. Please use AuthConfig (
23524
+ # google/cloud/aiplatform/master/auth.proto) instead.
22759
23525
  # Corresponds to the JSON property `apiAuth`
22760
23526
  # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1ApiAuth]
22761
23527
  attr_accessor :api_auth
@@ -23844,6 +24610,34 @@ module Google
23844
24610
  end
23845
24611
  end
23846
24612
 
24613
+ # Retrieval config.
24614
+ class GoogleCloudAiplatformV1RetrievalConfig
24615
+ include Google::Apis::Core::Hashable
24616
+
24617
+ # The language code of the user.
24618
+ # Corresponds to the JSON property `languageCode`
24619
+ # @return [String]
24620
+ attr_accessor :language_code
24621
+
24622
+ # An object that represents a latitude/longitude pair. This is expressed as a
24623
+ # pair of doubles to represent degrees latitude and degrees longitude. Unless
24624
+ # specified otherwise, this object must conform to the WGS84 standard. Values
24625
+ # must be within normalized ranges.
24626
+ # Corresponds to the JSON property `latLng`
24627
+ # @return [Google::Apis::AiplatformV1::GoogleTypeLatLng]
24628
+ attr_accessor :lat_lng
24629
+
24630
+ def initialize(**args)
24631
+ update!(**args)
24632
+ end
24633
+
24634
+ # Update properties of this object
24635
+ def update!(**args)
24636
+ @language_code = args[:language_code] if args.key?(:language_code)
24637
+ @lat_lng = args[:lat_lng] if args.key?(:lat_lng)
24638
+ end
24639
+ end
24640
+
23847
24641
  # Metadata related to retrieval in the grounding flow.
23848
24642
  class GoogleCloudAiplatformV1RetrievalMetadata
23849
24643
  include Google::Apis::Core::Hashable
@@ -28075,8 +28869,9 @@ module Google
28075
28869
  class GoogleCloudAiplatformV1SchemaTextDataItem
28076
28870
  include Google::Apis::Core::Hashable
28077
28871
 
28078
- # Output only. Google Cloud Storage URI points to the original text in user's
28079
- # bucket. The text file is up to 10MB in size.
28872
+ # Output only. Google Cloud Storage URI points to a copy of the original text in
28873
+ # the Vertex-managed bucket in the user's project. The text file is up to 10MB
28874
+ # in size.
28080
28875
  # Corresponds to the JSON property `gcsUri`
28081
28876
  # @return [String]
28082
28877
  attr_accessor :gcs_uri
@@ -32159,6 +32954,81 @@ module Google
32159
32954
  end
32160
32955
  end
32161
32956
 
32957
+ # Configuration for Speculative Decoding.
32958
+ class GoogleCloudAiplatformV1SpeculativeDecodingSpec
32959
+ include Google::Apis::Core::Hashable
32960
+
32961
+ # Draft model speculation works by using the smaller model to generate candidate
32962
+ # tokens for speculative decoding.
32963
+ # Corresponds to the JSON property `draftModelSpeculation`
32964
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1SpeculativeDecodingSpecDraftModelSpeculation]
32965
+ attr_accessor :draft_model_speculation
32966
+
32967
+ # N-Gram speculation works by trying to find matching tokens in the previous
32968
+ # prompt sequence and use those as speculation for generating new tokens.
32969
+ # Corresponds to the JSON property `ngramSpeculation`
32970
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1SpeculativeDecodingSpecNgramSpeculation]
32971
+ attr_accessor :ngram_speculation
32972
+
32973
+ # The number of speculative tokens to generate at each step.
32974
+ # Corresponds to the JSON property `speculativeTokenCount`
32975
+ # @return [Fixnum]
32976
+ attr_accessor :speculative_token_count
32977
+
32978
+ def initialize(**args)
32979
+ update!(**args)
32980
+ end
32981
+
32982
+ # Update properties of this object
32983
+ def update!(**args)
32984
+ @draft_model_speculation = args[:draft_model_speculation] if args.key?(:draft_model_speculation)
32985
+ @ngram_speculation = args[:ngram_speculation] if args.key?(:ngram_speculation)
32986
+ @speculative_token_count = args[:speculative_token_count] if args.key?(:speculative_token_count)
32987
+ end
32988
+ end
32989
+
32990
+ # Draft model speculation works by using the smaller model to generate candidate
32991
+ # tokens for speculative decoding.
32992
+ class GoogleCloudAiplatformV1SpeculativeDecodingSpecDraftModelSpeculation
32993
+ include Google::Apis::Core::Hashable
32994
+
32995
+ # Required. The resource name of the draft model.
32996
+ # Corresponds to the JSON property `draftModel`
32997
+ # @return [String]
32998
+ attr_accessor :draft_model
32999
+
33000
+ def initialize(**args)
33001
+ update!(**args)
33002
+ end
33003
+
33004
+ # Update properties of this object
33005
+ def update!(**args)
33006
+ @draft_model = args[:draft_model] if args.key?(:draft_model)
33007
+ end
33008
+ end
33009
+
33010
+ # N-Gram speculation works by trying to find matching tokens in the previous
33011
+ # prompt sequence and use those as speculation for generating new tokens.
33012
+ class GoogleCloudAiplatformV1SpeculativeDecodingSpecNgramSpeculation
33013
+ include Google::Apis::Core::Hashable
33014
+
33015
+ # The number of last N input tokens used as ngram to search/match against the
33016
+ # previous prompt sequence. This is equal to the N in N-Gram. The default value
33017
+ # is 3 if not specified.
33018
+ # Corresponds to the JSON property `ngramSize`
33019
+ # @return [Fixnum]
33020
+ attr_accessor :ngram_size
33021
+
33022
+ def initialize(**args)
33023
+ update!(**args)
33024
+ end
33025
+
33026
+ # Update properties of this object
33027
+ def update!(**args)
33028
+ @ngram_size = args[:ngram_size] if args.key?(:ngram_size)
33029
+ end
33030
+ end
33031
+
32162
33032
  # The speech generation config.
32163
33033
  class GoogleCloudAiplatformV1SpeechConfig
32164
33034
  include Google::Apis::Core::Hashable
@@ -32292,6 +33162,33 @@ module Google
32292
33162
  end
32293
33163
  end
32294
33164
 
33165
+ # Request message for ReasoningEngineExecutionService.StreamQuery.
33166
+ class GoogleCloudAiplatformV1StreamQueryReasoningEngineRequest
33167
+ include Google::Apis::Core::Hashable
33168
+
33169
+ # Optional. Class method to be used for the stream query. It is optional and
33170
+ # defaults to "stream_query" if unspecified.
33171
+ # Corresponds to the JSON property `classMethod`
33172
+ # @return [String]
33173
+ attr_accessor :class_method
33174
+
33175
+ # Optional. Input content provided by users in JSON object format. Examples
33176
+ # include text query, function calling parameters, media bytes, etc.
33177
+ # Corresponds to the JSON property `input`
33178
+ # @return [Hash<String,Object>]
33179
+ attr_accessor :input
33180
+
33181
+ def initialize(**args)
33182
+ update!(**args)
33183
+ end
33184
+
33185
+ # Update properties of this object
33186
+ def update!(**args)
33187
+ @class_method = args[:class_method] if args.key?(:class_method)
33188
+ @input = args[:input] if args.key?(:input)
33189
+ end
33190
+ end
33191
+
32295
33192
  # Request message for PredictionService.StreamRawPredict.
32296
33193
  class GoogleCloudAiplatformV1StreamRawPredictRequest
32297
33194
  include Google::Apis::Core::Hashable
@@ -33691,6 +34588,12 @@ module Google
33691
34588
  class GoogleCloudAiplatformV1SupervisedTuningDataStats
33692
34589
  include Google::Apis::Core::Hashable
33693
34590
 
34591
+ # Output only. For each index in `truncated_example_indices`, the user-facing
34592
+ # reason why the example was dropped. Must not include example itself.
34593
+ # Corresponds to the JSON property `droppedExampleReasons`
34594
+ # @return [Array<String>]
34595
+ attr_accessor :dropped_example_reasons
34596
+
33694
34597
  # Output only. Number of billable characters in the tuning dataset.
33695
34598
  # Corresponds to the JSON property `totalBillableCharacterCount`
33696
34599
  # @return [Fixnum]
@@ -33701,7 +34604,9 @@ module Google
33701
34604
  # @return [Fixnum]
33702
34605
  attr_accessor :total_billable_token_count
33703
34606
 
33704
- # The number of examples in the dataset that have been truncated by any amount.
34607
+ # Output only. The number of examples in the dataset that have been dropped. An
34608
+ # example can be dropped for reasons including: too many tokens, contains an
34609
+ # invalid image, contains too many images, etc.
33705
34610
  # Corresponds to the JSON property `totalTruncatedExampleCount`
33706
34611
  # @return [Fixnum]
33707
34612
  attr_accessor :total_truncated_example_count
@@ -33711,7 +34616,8 @@ module Google
33711
34616
  # @return [Fixnum]
33712
34617
  attr_accessor :total_tuning_character_count
33713
34618
 
33714
- # A partial sample of the indices (starting from 1) of the truncated examples.
34619
+ # Output only. A partial sample of the indices (starting from 1) of the dropped
34620
+ # examples.
33715
34621
  # Corresponds to the JSON property `truncatedExampleIndices`
33716
34622
  # @return [Array<Fixnum>]
33717
34623
  attr_accessor :truncated_example_indices
@@ -33752,6 +34658,7 @@ module Google
33752
34658
 
33753
34659
  # Update properties of this object
33754
34660
  def update!(**args)
34661
+ @dropped_example_reasons = args[:dropped_example_reasons] if args.key?(:dropped_example_reasons)
33755
34662
  @total_billable_character_count = args[:total_billable_character_count] if args.key?(:total_billable_character_count)
33756
34663
  @total_billable_token_count = args[:total_billable_token_count] if args.key?(:total_billable_token_count)
33757
34664
  @total_truncated_example_count = args[:total_truncated_example_count] if args.key?(:total_truncated_example_count)
@@ -34675,6 +35582,13 @@ module Google
34675
35582
  class GoogleCloudAiplatformV1Tool
34676
35583
  include Google::Apis::Core::Hashable
34677
35584
 
35585
+ # Tool that executes code generated by the model, and automatically returns the
35586
+ # result to the model. See also [ExecutableCode]and [CodeExecutionResult] which
35587
+ # are input and output to this tool.
35588
+ # Corresponds to the JSON property `codeExecution`
35589
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1ToolCodeExecution]
35590
+ attr_accessor :code_execution
35591
+
34678
35592
  # Optional. Function tool type. One or more function declarations to be passed
34679
35593
  # to the model along with the current user query. Model may decide to call a
34680
35594
  # subset of these functions by populating FunctionCall in the response. User
@@ -34707,6 +35621,7 @@ module Google
34707
35621
 
34708
35622
  # Update properties of this object
34709
35623
  def update!(**args)
35624
+ @code_execution = args[:code_execution] if args.key?(:code_execution)
34710
35625
  @function_declarations = args[:function_declarations] if args.key?(:function_declarations)
34711
35626
  @google_search = args[:google_search] if args.key?(:google_search)
34712
35627
  @google_search_retrieval = args[:google_search_retrieval] if args.key?(:google_search_retrieval)
@@ -34840,6 +35755,21 @@ module Google
34840
35755
  end
34841
35756
  end
34842
35757
 
35758
+ # Tool that executes code generated by the model, and automatically returns the
35759
+ # result to the model. See also [ExecutableCode]and [CodeExecutionResult] which
35760
+ # are input and output to this tool.
35761
+ class GoogleCloudAiplatformV1ToolCodeExecution
35762
+ include Google::Apis::Core::Hashable
35763
+
35764
+ def initialize(**args)
35765
+ update!(**args)
35766
+ end
35767
+
35768
+ # Update properties of this object
35769
+ def update!(**args)
35770
+ end
35771
+ end
35772
+
34843
35773
  # Tool config. This config is shared for all tools provided in the request.
34844
35774
  class GoogleCloudAiplatformV1ToolConfig
34845
35775
  include Google::Apis::Core::Hashable
@@ -34849,6 +35779,11 @@ module Google
34849
35779
  # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1FunctionCallingConfig]
34850
35780
  attr_accessor :function_calling_config
34851
35781
 
35782
+ # Retrieval config.
35783
+ # Corresponds to the JSON property `retrievalConfig`
35784
+ # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1RetrievalConfig]
35785
+ attr_accessor :retrieval_config
35786
+
34852
35787
  def initialize(**args)
34853
35788
  update!(**args)
34854
35789
  end
@@ -34856,6 +35791,7 @@ module Google
34856
35791
  # Update properties of this object
34857
35792
  def update!(**args)
34858
35793
  @function_calling_config = args[:function_calling_config] if args.key?(:function_calling_config)
35794
+ @retrieval_config = args[:retrieval_config] if args.key?(:retrieval_config)
34859
35795
  end
34860
35796
  end
34861
35797
 
@@ -36158,7 +37094,7 @@ module Google
36158
37094
  end
36159
37095
  end
36160
37096
 
36161
- # The Model Registry Model and Online Prediction Endpoint assiociated with this
37097
+ # The Model Registry Model and Online Prediction Endpoint associated with this
36162
37098
  # TuningJob.
36163
37099
  class GoogleCloudAiplatformV1TunedModel
36164
37100
  include Google::Apis::Core::Hashable
@@ -36325,7 +37261,7 @@ module Google
36325
37261
  # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1SupervisedTuningSpec]
36326
37262
  attr_accessor :supervised_tuning_spec
36327
37263
 
36328
- # The Model Registry Model and Online Prediction Endpoint assiociated with this
37264
+ # The Model Registry Model and Online Prediction Endpoint associated with this
36329
37265
  # TuningJob.
36330
37266
  # Corresponds to the JSON property `tunedModel`
36331
37267
  # @return [Google::Apis::AiplatformV1::GoogleCloudAiplatformV1TunedModel]
@@ -38180,6 +39116,34 @@ module Google
38180
39116
  end
38181
39117
  end
38182
39118
 
39119
+ # An object that represents a latitude/longitude pair. This is expressed as a
39120
+ # pair of doubles to represent degrees latitude and degrees longitude. Unless
39121
+ # specified otherwise, this object must conform to the WGS84 standard. Values
39122
+ # must be within normalized ranges.
39123
+ class GoogleTypeLatLng
39124
+ include Google::Apis::Core::Hashable
39125
+
39126
+ # The latitude in degrees. It must be in the range [-90.0, +90.0].
39127
+ # Corresponds to the JSON property `latitude`
39128
+ # @return [Float]
39129
+ attr_accessor :latitude
39130
+
39131
+ # The longitude in degrees. It must be in the range [-180.0, +180.0].
39132
+ # Corresponds to the JSON property `longitude`
39133
+ # @return [Float]
39134
+ attr_accessor :longitude
39135
+
39136
+ def initialize(**args)
39137
+ update!(**args)
39138
+ end
39139
+
39140
+ # Update properties of this object
39141
+ def update!(**args)
39142
+ @latitude = args[:latitude] if args.key?(:latitude)
39143
+ @longitude = args[:longitude] if args.key?(:longitude)
39144
+ end
39145
+ end
39146
+
38183
39147
  # Represents an amount of money with its currency type.
38184
39148
  class GoogleTypeMoney
38185
39149
  include Google::Apis::Core::Hashable