@datarobot/pulumi-datarobot 0.10.36 → 0.10.37

This diff compares the contents of two publicly available package versions, each released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@datarobot/pulumi-datarobot",
3
- "version": "0.10.36",
3
+ "version": "0.10.37",
4
4
  "description": "A Pulumi package for creating and managing DataRobot resources.",
5
5
  "keywords": [
6
6
  "datarobot",
package/types/input.d.ts CHANGED
@@ -121,10 +121,6 @@ export interface ArtifactSpecContainerGroupContainer {
121
121
  * Container readiness check configuration.
122
122
  */
123
123
  readinessProbe?: pulumi.Input<inputs.ArtifactSpecContainerGroupContainerReadinessProbe>;
124
- /**
125
- * Resource requirements for the container.
126
- */
127
- resourceRequest: pulumi.Input<inputs.ArtifactSpecContainerGroupContainerResourceRequest>;
128
124
  /**
129
125
  * Container startup check configuration.
130
126
  */
@@ -208,24 +204,6 @@ export interface ArtifactSpecContainerGroupContainerReadinessProbe {
208
204
  */
209
205
  timeoutSeconds?: pulumi.Input<number>;
210
206
  }
211
- export interface ArtifactSpecContainerGroupContainerResourceRequest {
212
- /**
213
- * Number of CPU cores required.
214
- */
215
- cpu: pulumi.Input<number>;
216
- /**
217
- * Number of GPUs required.
218
- */
219
- gpu?: pulumi.Input<number>;
220
- /**
221
- * GPU type required (e.g., NVIDIA-A100).
222
- */
223
- gpuType?: pulumi.Input<string>;
224
- /**
225
- * Memory required in bytes.
226
- */
227
- memory: pulumi.Input<number>;
228
- }
229
207
  export interface ArtifactSpecContainerGroupContainerStartupProbe {
230
208
  /**
231
209
  * Minimum consecutive failures for the probe to be considered failed.
@@ -1440,19 +1418,37 @@ export interface VectorDatabaseChunkingParameters {
1440
1418
  }
1441
1419
  export interface WorkloadRuntime {
1442
1420
  /**
1443
- * Autoscaling configuration. When set, takes precedence over replica_count.
1421
+ * Per-group runtime configuration.
1444
1422
  */
1445
- autoscaling?: pulumi.Input<inputs.WorkloadRuntimeAutoscaling>;
1423
+ containerGroups?: pulumi.Input<pulumi.Input<inputs.WorkloadRuntimeContainerGroup>[]>;
1424
+ }
1425
+ export interface WorkloadRuntimeContainerGroup {
1446
1426
  /**
1447
- * Number of replicas to run. Cannot be used together with `autoscaling`. Omitting this field retains the current value. Set to `0` to explicitly clear it (e.g. when switching to autoscaling).
1427
+ * Autoscaling configuration. When set, takes precedence over `replicaCount`.
1428
+ */
1429
+ autoscaling?: pulumi.Input<inputs.WorkloadRuntimeContainerGroupAutoscaling>;
1430
+ /**
1431
+ * How to select among `resourceBundles`. Defaults to `availability`.
1432
+ */
1433
+ bundleSelectionPolicy?: pulumi.Input<string>;
1434
+ /**
1435
+ * Per-container resource allocation overrides.
1436
+ */
1437
+ containers?: pulumi.Input<pulumi.Input<inputs.WorkloadRuntimeContainerGroupContainer>[]>;
1438
+ /**
1439
+ * Container group name (server-assigned, always `default`).
1440
+ */
1441
+ name?: pulumi.Input<string>;
1442
+ /**
1443
+ * Number of replicas. Cannot be set alongside `autoscaling.enabled=true`. Set to `0` to explicitly clear it.
1448
1444
  */
1449
1445
  replicaCount?: pulumi.Input<number>;
1450
1446
  /**
1451
- * Resource bundles assigned to the Workload. When empty the server infers an appropriate bundle.
1447
+ * Ordered list of resource bundle IDs. One is selected at scheduling time.
1452
1448
  */
1453
- resources?: pulumi.Input<pulumi.Input<inputs.WorkloadRuntimeResource>[]>;
1449
+ resourceBundles?: pulumi.Input<pulumi.Input<string>[]>;
1454
1450
  }
1455
- export interface WorkloadRuntimeAutoscaling {
1451
+ export interface WorkloadRuntimeContainerGroupAutoscaling {
1456
1452
  /**
1457
1453
  * Whether autoscaling is enabled. Defaults to true.
1458
1454
  */
@@ -1460,9 +1456,9 @@ export interface WorkloadRuntimeAutoscaling {
1460
1456
  /**
1461
1457
  * Scaling policies that define when and how to scale.
1462
1458
  */
1463
- policies: pulumi.Input<pulumi.Input<inputs.WorkloadRuntimeAutoscalingPolicy>[]>;
1459
+ policies: pulumi.Input<pulumi.Input<inputs.WorkloadRuntimeContainerGroupAutoscalingPolicy>[]>;
1464
1460
  }
1465
- export interface WorkloadRuntimeAutoscalingPolicy {
1461
+ export interface WorkloadRuntimeContainerGroupAutoscalingPolicy {
1466
1462
  /**
1467
1463
  * Maximum number of replicas.
1468
1464
  */
@@ -1484,9 +1480,31 @@ export interface WorkloadRuntimeAutoscalingPolicy {
1484
1480
  */
1485
1481
  target: pulumi.Input<number>;
1486
1482
  }
1487
- export interface WorkloadRuntimeResource {
1483
+ export interface WorkloadRuntimeContainerGroupContainer {
1484
+ /**
1485
+ * Container name. Must match a container declared in the artifact group.
1486
+ */
1487
+ name: pulumi.Input<string>;
1488
+ /**
1489
+ * Resource allocation for this container.
1490
+ */
1491
+ resourceAllocation?: pulumi.Input<inputs.WorkloadRuntimeContainerGroupContainerResourceAllocation>;
1492
+ }
1493
+ export interface WorkloadRuntimeContainerGroupContainerResourceAllocation {
1494
+ /**
1495
+ * CPU cores allocated to this container.
1496
+ */
1497
+ cpu?: pulumi.Input<number>;
1498
+ /**
1499
+ * GPUs allocated to this container.
1500
+ */
1501
+ gpu?: pulumi.Input<number>;
1502
+ /**
1503
+ * GPU VRAM allocated in bytes.
1504
+ */
1505
+ gpuMemory?: pulumi.Input<number>;
1488
1506
  /**
1489
- * ID of the resource bundle (e.g. `cpu.nano`).
1507
+ * RAM allocated in bytes.
1490
1508
  */
1491
- resourceBundleId: pulumi.Input<string>;
1509
+ memory?: pulumi.Input<number>;
1492
1510
  }
package/types/output.d.ts CHANGED
@@ -120,10 +120,6 @@ export interface ArtifactSpecContainerGroupContainer {
120
120
  * Container readiness check configuration.
121
121
  */
122
122
  readinessProbe?: outputs.ArtifactSpecContainerGroupContainerReadinessProbe;
123
- /**
124
- * Resource requirements for the container.
125
- */
126
- resourceRequest: outputs.ArtifactSpecContainerGroupContainerResourceRequest;
127
123
  /**
128
124
  * Container startup check configuration.
129
125
  */
@@ -207,24 +203,6 @@ export interface ArtifactSpecContainerGroupContainerReadinessProbe {
207
203
  */
208
204
  timeoutSeconds: number;
209
205
  }
210
- export interface ArtifactSpecContainerGroupContainerResourceRequest {
211
- /**
212
- * Number of CPU cores required.
213
- */
214
- cpu: number;
215
- /**
216
- * Number of GPUs required.
217
- */
218
- gpu?: number;
219
- /**
220
- * GPU type required (e.g., NVIDIA-A100).
221
- */
222
- gpuType?: string;
223
- /**
224
- * Memory required in bytes.
225
- */
226
- memory: number;
227
- }
228
206
  export interface ArtifactSpecContainerGroupContainerStartupProbe {
229
207
  /**
230
208
  * Minimum consecutive failures for the probe to be considered failed.
@@ -1439,19 +1417,37 @@ export interface VectorDatabaseChunkingParameters {
1439
1417
  }
1440
1418
  export interface WorkloadRuntime {
1441
1419
  /**
1442
- * Autoscaling configuration. When set, takes precedence over replica_count.
1420
+ * Per-group runtime configuration.
1443
1421
  */
1444
- autoscaling?: outputs.WorkloadRuntimeAutoscaling;
1422
+ containerGroups?: outputs.WorkloadRuntimeContainerGroup[];
1423
+ }
1424
+ export interface WorkloadRuntimeContainerGroup {
1445
1425
  /**
1446
- * Number of replicas to run. Cannot be used together with `autoscaling`. Omitting this field retains the current value. Set to `0` to explicitly clear it (e.g. when switching to autoscaling).
1426
+ * Autoscaling configuration. When set, takes precedence over `replicaCount`.
1427
+ */
1428
+ autoscaling?: outputs.WorkloadRuntimeContainerGroupAutoscaling;
1429
+ /**
1430
+ * How to select among `resourceBundles`. Defaults to `availability`.
1431
+ */
1432
+ bundleSelectionPolicy: string;
1433
+ /**
1434
+ * Per-container resource allocation overrides.
1435
+ */
1436
+ containers?: outputs.WorkloadRuntimeContainerGroupContainer[];
1437
+ /**
1438
+ * Container group name (server-assigned, always `default`).
1439
+ */
1440
+ name: string;
1441
+ /**
1442
+ * Number of replicas. Cannot be set alongside `autoscaling.enabled=true`. Set to `0` to explicitly clear it.
1447
1443
  */
1448
1444
  replicaCount: number;
1449
1445
  /**
1450
- * Resource bundles assigned to the Workload. When empty the server infers an appropriate bundle.
1446
+ * Ordered list of resource bundle IDs. One is selected at scheduling time.
1451
1447
  */
1452
- resources?: outputs.WorkloadRuntimeResource[];
1448
+ resourceBundles?: string[];
1453
1449
  }
1454
- export interface WorkloadRuntimeAutoscaling {
1450
+ export interface WorkloadRuntimeContainerGroupAutoscaling {
1455
1451
  /**
1456
1452
  * Whether autoscaling is enabled. Defaults to true.
1457
1453
  */
@@ -1459,9 +1455,9 @@ export interface WorkloadRuntimeAutoscaling {
1459
1455
  /**
1460
1456
  * Scaling policies that define when and how to scale.
1461
1457
  */
1462
- policies: outputs.WorkloadRuntimeAutoscalingPolicy[];
1458
+ policies: outputs.WorkloadRuntimeContainerGroupAutoscalingPolicy[];
1463
1459
  }
1464
- export interface WorkloadRuntimeAutoscalingPolicy {
1460
+ export interface WorkloadRuntimeContainerGroupAutoscalingPolicy {
1465
1461
  /**
1466
1462
  * Maximum number of replicas.
1467
1463
  */
@@ -1483,9 +1479,31 @@ export interface WorkloadRuntimeAutoscalingPolicy {
1483
1479
  */
1484
1480
  target: number;
1485
1481
  }
1486
- export interface WorkloadRuntimeResource {
1482
+ export interface WorkloadRuntimeContainerGroupContainer {
1483
+ /**
1484
+ * Container name. Must match a container declared in the artifact group.
1485
+ */
1486
+ name: string;
1487
+ /**
1488
+ * Resource allocation for this container.
1489
+ */
1490
+ resourceAllocation?: outputs.WorkloadRuntimeContainerGroupContainerResourceAllocation;
1491
+ }
1492
+ export interface WorkloadRuntimeContainerGroupContainerResourceAllocation {
1493
+ /**
1494
+ * CPU cores allocated to this container.
1495
+ */
1496
+ cpu?: number;
1497
+ /**
1498
+ * GPUs allocated to this container.
1499
+ */
1500
+ gpu?: number;
1501
+ /**
1502
+ * GPU VRAM allocated in bytes.
1503
+ */
1504
+ gpuMemory?: number;
1487
1505
  /**
1488
- * ID of the resource bundle (e.g. `cpu.nano`).
1506
+ * RAM allocated in bytes.
1489
1507
  */
1490
- resourceBundleId: string;
1508
+ memory?: number;
1491
1509
  }