@daocloud-proto/baize 0.123.0 → 0.124.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
|
@@ -12,6 +12,12 @@ export enum QueueType {
|
|
|
12
12
|
KUEUE = "KUEUE",
|
|
13
13
|
}
|
|
14
14
|
|
|
15
|
+
export enum PlacementPolicy {
|
|
16
|
+
PLACEMENT_POLICY_UNSPECIFIED = "PLACEMENT_POLICY_UNSPECIFIED",
|
|
17
|
+
BALANCED = "BALANCED",
|
|
18
|
+
GROUPED = "GROUPED",
|
|
19
|
+
}
|
|
20
|
+
|
|
15
21
|
export enum TrainingMode {
|
|
16
22
|
TRAINING_MODE_UNSPECIFIED = "TRAINING_MODE_UNSPECIFIED",
|
|
17
23
|
SINGLE = "SINGLE",
|
|
@@ -63,6 +69,7 @@ export type JobCreationBaseConfig = {
|
|
|
63
69
|
noOverrideEnvPath?: boolean
|
|
64
70
|
imageConfig?: BaizeManagement_apiImageV1alpha1Image.ImageConfig
|
|
65
71
|
preflight?: boolean
|
|
72
|
+
placement?: PlacementPolicy
|
|
66
73
|
}
|
|
67
74
|
|
|
68
75
|
export type JobRoleDifferenceConfig = {
|
|
@@ -156,6 +156,7 @@ export type InferenceServing = {
|
|
|
156
156
|
hpaConfig?: HPAConfig
|
|
157
157
|
image?: string
|
|
158
158
|
imageConfig?: BaizeManagement_apiImageV1alpha1Image.ImageConfig
|
|
159
|
+
targetGpus?: string[]
|
|
159
160
|
}
|
|
160
161
|
|
|
161
162
|
export type InferenceServingStatusModelStatus = {
|
|
@@ -215,6 +216,7 @@ export type CreateInferenceServingRequest = {
|
|
|
215
216
|
workspace?: number
|
|
216
217
|
image?: string
|
|
217
218
|
imageConfig?: BaizeManagement_apiImageV1alpha1Image.ImageConfig
|
|
219
|
+
targetGpus?: string[]
|
|
218
220
|
}
|
|
219
221
|
|
|
220
222
|
export type UpdateInferenceServingRequest = {
|
|
@@ -232,6 +234,7 @@ export type UpdateInferenceServingRequest = {
|
|
|
232
234
|
workspace?: number
|
|
233
235
|
image?: string
|
|
234
236
|
imageConfig?: BaizeManagement_apiImageV1alpha1Image.ImageConfig
|
|
237
|
+
targetGpus?: string[]
|
|
235
238
|
}
|
|
236
239
|
|
|
237
240
|
export type SingleInferenceServingRequest = {
|