npm - @civitai/client - Versions diffs - 0.2.0-beta.55 → 0.2.0-beta.57 - Mend

@civitai/client 0.2.0-beta.55 → 0.2.0-beta.57

This diff shows the differences between the contents of two publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.

Files changed (9)

package/dist/generated/index.d.ts +28 -0
package/dist/generated/index.js +2 -2
package/dist/generated/sdk.gen.d.ts +16 -0
package/dist/generated/sdk.gen.js +16 -0
package/dist/generated/types.gen.d.ts +432 -11
package/dist/generated/types.gen.js +16 -0
package/dist/utils/Air.d.ts +3 -1
package/dist/utils/Air.js +3 -3
package/package.json +1 -1

package/dist/generated/index.d.ts CHANGED Viewed

@@ -15,6 +15,7 @@ export {
   invalidateUserCache,
   invokeAceStepAudioStepTemplate,
   invokeAgeClassificationStepTemplate,
+  invokeAudioCaptioningStepTemplate,
   invokeBatchOcrSafetyClassificationStepTemplate,
   invokeBlobArchiveStepTemplate,
   invokeChatCompletionStepTemplate,
@@ -63,6 +64,10 @@ export {
   uploadConsumerBlob,
 } from './sdk.gen';
 export {
+  type AceStep15AiToolkitTrainingInput,
+  type AceStep15XlAiToolkitTrainingInput,
+  type AceStep15XlBaseAiToolkitTrainingInput,
+  type AceStep15XlSftAiToolkitTrainingInput,
   type AceStepAudioCover,
   type AceStepAudioInput,
   type AceStepAudioOutput,
@@ -91,6 +96,11 @@ export {
   ArchiveFormat,
   type AssistantMessage,
   type AudioBlob,
+  type AudioCaptioningInput,
+  type AudioCaptioningOutput,
+  type AudioCaptioningOutputItem,
+  type AudioCaptioningStep,
+  type AudioCaptioningStepTemplate,
   type BatchOcrSafetyClassificationInput,
   type BatchOcrSafetyClassificationOutput,
   type BatchOcrSafetyClassificationResult,
@@ -110,11 +120,16 @@ export {
   type ChatCompletionContentPartWritable,
   type ChatCompletionFunction,
   type ChatCompletionFunctionCall,
+  type ChatCompletionGeneratedImage,
+  type ChatCompletionGeneratedImageUrl,
+  type ChatCompletionImageConfig,
   type ChatCompletionImageUrl,
   type ChatCompletionInput,
+  type ChatCompletionJsonSchema,
   type ChatCompletionMessage,
   type ChatCompletionMessageWritable,
   type ChatCompletionOutput,
+  type ChatCompletionResponseFormat,
   type ChatCompletionStep,
   type ChatCompletionStepTemplate,
   type ChatCompletionTool,
@@ -123,6 +138,8 @@ export {
   type ChromaAiToolkitTrainingInput,
   type ClientOptions,
   CoarseMode,
+  type ComfyAnimaCreateImageGenInput,
+  type ComfyAnimaImageGenInput,
   type ComfyErnieImageGenInput,
   type ComfyErnieStandardCreateImageGenInput,
   type ComfyErnieStandardImageGenInput,
@@ -131,6 +148,9 @@ export {
   type ComfyFlux1CreateImageGenInput,
   type ComfyFlux1ImageGenInput,
   type ComfyFlux1VariantImageGenInput,
+  type ComfyFlux2DevCreateImageInput,
+  type ComfyFlux2DevEditImageInput,
+  type ComfyFlux2DevImageGenInput,
   type ComfyImageGenInput,
   type ComfyInput,
   type ComfyLtx23AudioToVideoInput,
@@ -351,6 +371,11 @@ export {
   type InvokeAgeClassificationStepTemplateErrors,
   type InvokeAgeClassificationStepTemplateResponse,
   type InvokeAgeClassificationStepTemplateResponses,
+  type InvokeAudioCaptioningStepTemplateData,
+  type InvokeAudioCaptioningStepTemplateError,
+  type InvokeAudioCaptioningStepTemplateErrors,
+  type InvokeAudioCaptioningStepTemplateResponse,
+  type InvokeAudioCaptioningStepTemplateResponses,
   type InvokeBatchOcrSafetyClassificationStepTemplateData,
   type InvokeBatchOcrSafetyClassificationStepTemplateError,
   type InvokeBatchOcrSafetyClassificationStepTemplateErrors,
@@ -567,6 +592,7 @@ export {
   type MochiVideoGenInput,
   type ModelClamScanInput,
   type ModelClamScanOutput,
+  ModelClamScanStatus,
   type ModelClamScanStep,
   type ModelClamScanStepTemplate,
   type ModelHashInput,
@@ -579,6 +605,7 @@ export {
   type ModelParseMetadataStepTemplate,
   type ModelPickleScanInput,
   type ModelPickleScanOutput,
+  ModelPickleScanStatus,
   type ModelPickleScanStep,
   type ModelPickleScanStepTemplate,
   type MusubiImageResourceTrainingInput,
@@ -721,6 +748,7 @@ export {
   type Qwen3BaseTtsInput,
   type Qwen3CustomVoiceTtsInput,
   type Qwen3TextToSpeechInput,
+  type Qwen3VoiceDesignTtsInput,
   type QwenAiToolkitTrainingInput,
   type QwenImageGenInput,
   type RefreshBlobData,

package/dist/generated/index.js CHANGED Viewed

@@ -1,3 +1,3 @@
 // This file is auto-generated by @hey-api/openapi-ts
-export { addWorkflowTag, deleteWorkflow, getBlob, getBlobArchive, getBlobContent, getBlockedContent, getConsumerBlobUploadUrl, getResource, getStreamingBlob, getWorkflow, getWorkflowStep, headBlob, invalidateResource, invalidateUserCache, invokeAceStepAudioStepTemplate, invokeAgeClassificationStepTemplate, invokeBatchOcrSafetyClassificationStepTemplate, invokeBlobArchiveStepTemplate, invokeChatCompletionStepTemplate, invokeComfyStepTemplate, invokeConvertImageStepTemplate, invokeEchoStepTemplate, invokeHumanoidImageMaskStepTemplate, invokeImageGenStepTemplate, invokeImageResourceTrainingStepTemplate, invokeImageUploadStepTemplate, invokeImageUpscalerStepTemplate, invokeMediaCaptioningStepTemplate, invokeMediaHashStepTemplate, invokeMediaRatingStepTemplate, invokeModelClamScanStepTemplate, invokeModelHashStepTemplate, invokeModelParseMetadataStepTemplate, invokeModelPickleScanStepTemplate, invokePreprocessImageStepTemplate, invokePromptEnhancementStepTemplate, invokeRepeatStepTemplate, invokeTextToImageStepTemplate, invokeTextToSpeechStepTemplate, invokeTrainingStepTemplate, invokeTranscodeStepTemplate, invokeTranscriptionStepTemplate, invokeTryOnUStepTemplate, invokeVideoEnhancementStepTemplate, invokeVideoFrameExtractionStepTemplate, invokeVideoGenStepTemplate, invokeVideoInterpolationStepTemplate, invokeVideoMetadataStepTemplate, invokeVideoUpscalerStepTemplate, invokeWdTaggingStepTemplate, invokeXGuardModerationStepTemplate, patchWorkflow, patchWorkflowStep, queryWorkflows, refreshBlob, removeAllWorkflowTags, removeWorkflowTag, submitWorkflow, updateWorkflow, updateWorkflowStep, uploadConsumerBlob, } from './sdk.gen';
-export { AnimalPoseBboxDetector, AnimalPoseEstimator, AnylineMergeWith, ArchiveFormat, BlurRegionMode, BuzzClientAccount, CoarseMode, ComfySampler, ComfyScheduler, ContainerFormat, DensePoseColormap, DensePoseModel, DepthAnythingCheckpoint, DepthAnythingV2Checkpoint, DwPoseBboxDetector, DwPoseEstimator, FileFormat, HaiperVideoGenAspectRatio, HaiperVideoGenCameraMovement, HaiperVideoGenModel, HumanoidImageMaskCategory, ImageGenOutputFormat, ImageResouceTrainingModerationStatus, ImageTransformer, JobSupport, KlingMode, KlingModel, KlingV3Operation, KlingVideoGenAspectRatio, KlingVideoGenDuration, LeresBoost, LightricksAspectRatio, MediaHashType, Metric3dBackbone, MiniMaxVideoGenModel, NsfwLevel, OutputFormat, Priority, SafeMode, Scheduler, SdCppSampleMethod, SdCppSchedule, SdCppUCacheMode, SeedanceModel, SeedreamVersion, TrainingModerationStatus, TransactionType, UpdateWorkflowStatus, Veo3AspectRatio, Veo3GenerationMode, Veo3Version, ViduVideoGenModel, ViduVideoGenStyle, WorkflowStatus, WorkflowUpgradeMode, ZoeDepthEnvironment, } from './types.gen';
+export { addWorkflowTag, deleteWorkflow, getBlob, getBlobArchive, getBlobContent, getBlockedContent, getConsumerBlobUploadUrl, getResource, getStreamingBlob, getWorkflow, getWorkflowStep, headBlob, invalidateResource, invalidateUserCache, invokeAceStepAudioStepTemplate, invokeAgeClassificationStepTemplate, invokeAudioCaptioningStepTemplate, invokeBatchOcrSafetyClassificationStepTemplate, invokeBlobArchiveStepTemplate, invokeChatCompletionStepTemplate, invokeComfyStepTemplate, invokeConvertImageStepTemplate, invokeEchoStepTemplate, invokeHumanoidImageMaskStepTemplate, invokeImageGenStepTemplate, invokeImageResourceTrainingStepTemplate, invokeImageUploadStepTemplate, invokeImageUpscalerStepTemplate, invokeMediaCaptioningStepTemplate, invokeMediaHashStepTemplate, invokeMediaRatingStepTemplate, invokeModelClamScanStepTemplate, invokeModelHashStepTemplate, invokeModelParseMetadataStepTemplate, invokeModelPickleScanStepTemplate, invokePreprocessImageStepTemplate, invokePromptEnhancementStepTemplate, invokeRepeatStepTemplate, invokeTextToImageStepTemplate, invokeTextToSpeechStepTemplate, invokeTrainingStepTemplate, invokeTranscodeStepTemplate, invokeTranscriptionStepTemplate, invokeTryOnUStepTemplate, invokeVideoEnhancementStepTemplate, invokeVideoFrameExtractionStepTemplate, invokeVideoGenStepTemplate, invokeVideoInterpolationStepTemplate, invokeVideoMetadataStepTemplate, invokeVideoUpscalerStepTemplate, invokeWdTaggingStepTemplate, invokeXGuardModerationStepTemplate, patchWorkflow, patchWorkflowStep, queryWorkflows, refreshBlob, removeAllWorkflowTags, removeWorkflowTag, submitWorkflow, updateWorkflow, updateWorkflowStep, uploadConsumerBlob, } from './sdk.gen';
+export { AnimalPoseBboxDetector, AnimalPoseEstimator, AnylineMergeWith, ArchiveFormat, BlurRegionMode, BuzzClientAccount, CoarseMode, ComfySampler, ComfyScheduler, ContainerFormat, DensePoseColormap, DensePoseModel, DepthAnythingCheckpoint, DepthAnythingV2Checkpoint, DwPoseBboxDetector, DwPoseEstimator, FileFormat, HaiperVideoGenAspectRatio, HaiperVideoGenCameraMovement, HaiperVideoGenModel, HumanoidImageMaskCategory, ImageGenOutputFormat, ImageResouceTrainingModerationStatus, ImageTransformer, JobSupport, KlingMode, KlingModel, KlingV3Operation, KlingVideoGenAspectRatio, KlingVideoGenDuration, LeresBoost, LightricksAspectRatio, MediaHashType, Metric3dBackbone, MiniMaxVideoGenModel, ModelClamScanStatus, ModelPickleScanStatus, NsfwLevel, OutputFormat, Priority, SafeMode, Scheduler, SdCppSampleMethod, SdCppSchedule, SdCppUCacheMode, SeedanceModel, SeedreamVersion, TrainingModerationStatus, TransactionType, UpdateWorkflowStatus, Veo3AspectRatio, Veo3GenerationMode, Veo3Version, ViduVideoGenModel, ViduVideoGenStyle, WorkflowStatus, WorkflowUpgradeMode, ZoeDepthEnvironment, } from './types.gen';

package/dist/generated/sdk.gen.d.ts CHANGED Viewed

@@ -46,6 +46,9 @@ import type {
   InvokeAgeClassificationStepTemplateData,
   InvokeAgeClassificationStepTemplateErrors,
   InvokeAgeClassificationStepTemplateResponses,
+  InvokeAudioCaptioningStepTemplateData,
+  InvokeAudioCaptioningStepTemplateErrors,
+  InvokeAudioCaptioningStepTemplateResponses,
   InvokeBatchOcrSafetyClassificationStepTemplateData,
   InvokeBatchOcrSafetyClassificationStepTemplateErrors,
   InvokeBatchOcrSafetyClassificationStepTemplateResponses,
@@ -308,6 +311,19 @@ export declare const invokeAgeClassificationStepTemplate: <ThrowOnError extends
   ThrowOnError,
   'fields'
 >;
+/**
+ * Audio Captioning
+ *
+ * Generates music captions, lyrics, and metadata by running the ACE-Step captioner and transcriber models.
+ */
+export declare const invokeAudioCaptioningStepTemplate: <ThrowOnError extends boolean = false>(
+  options?: Options<InvokeAudioCaptioningStepTemplateData, ThrowOnError>
+) => import('./client').RequestResult<
+  InvokeAudioCaptioningStepTemplateResponses,
+  InvokeAudioCaptioningStepTemplateErrors,
+  ThrowOnError,
+  'fields'
+>;
 export declare const invokeBatchOcrSafetyClassificationStepTemplate: <
   ThrowOnError extends boolean = false,
 >(

package/dist/generated/sdk.gen.js CHANGED Viewed

@@ -113,6 +113,22 @@ export const invokeAgeClassificationStepTemplate = (options) => {
         },
     });
 };
+/**
+ * Audio Captioning
+ *
+ * Generates music captions, lyrics, and metadata by running the ACE-Step captioner and transcriber models.
+ */
+export const invokeAudioCaptioningStepTemplate = (options) => {
+    var _a;
+    return ((_a = options === null || options === void 0 ? void 0 : options.client) !== null && _a !== void 0 ? _a : client).post({
+        url: '/v2/consumer/recipes/audioCaptioning',
+        ...options,
+        headers: {
+            'Content-Type': 'application/json',
+            ...options === null || options === void 0 ? void 0 : options.headers,
+        },
+    });
+};
 export const invokeBatchOcrSafetyClassificationStepTemplate = (options) => {
     var _a;
     return ((_a = options === null || options === void 0 ? void 0 : options.client) !== null && _a !== void 0 ? _a : client).post({

package/dist/generated/types.gen.d.ts CHANGED Viewed

@@ -96,6 +96,49 @@ export type AiToolkitTrainingInput = Omit<TrainingInput, 'engine'> & {
   triggerWord?: null | string;
   engine: 'ai-toolkit';
 };
+/**
+ * AI Toolkit training for ACE-Step 1.5 base models.
+ */
+export type AceStep15AiToolkitTrainingInput = Omit<
+  AiToolkitTrainingInput,
+  'engine' | 'ecosystem'
+> & {
+  ecosystem: 'ace_step_15';
+  engine: 'ai-toolkit';
+};
+/**
+ * AI Toolkit training for ACE-Step 1.5 XL models.
+ */
+export type AceStep15XlAiToolkitTrainingInput = Omit<
+  AiToolkitTrainingInput,
+  'engine' | 'ecosystem'
+> & {
+  modelVariant: string;
+  ecosystem: 'ace_step_15_xl';
+  engine: 'ai-toolkit';
+};
+/**
+ * AI Toolkit training for ACE-Step 1.5 XL base models.
+ */
+export type AceStep15XlBaseAiToolkitTrainingInput = Omit<
+  AceStep15XlAiToolkitTrainingInput,
+  'engine' | 'ecosystem' | 'modelVariant'
+> & {
+  modelVariant: 'base';
+  ecosystem: 'ace_step_15_xl';
+  engine: 'ai-toolkit';
+};
+/**
+ * AI Toolkit training for ACE-Step 1.5 XL SFT models.
+ */
+export type AceStep15XlSftAiToolkitTrainingInput = Omit<
+  AceStep15XlAiToolkitTrainingInput,
+  'engine' | 'ecosystem' | 'modelVariant'
+> & {
+  modelVariant: 'sft';
+  ecosystem: 'ace_step_15_xl';
+  engine: 'ai-toolkit';
+};
 /**
  * Cover image configuration for ACE Step audio output.
  * When present, the output is a WebM video with this image as the visual.
@@ -133,15 +176,73 @@ export type AceStepAudioInput = {
   /**
    * Time signature (e.g., "4" for 4/4 time)
    */
-  timeSignature?: string;
+  timeSignature?: '2' | '3' | '4' | '6';
   /**
    * Language code (e.g., "en", "zh", "ja", "ko")
    */
-  language?: string;
-  /**
-   * Musical key (e.g., "C major", "E minor")
-   */
-  key?: string;
+  language?:
+    | 'en'
+    | 'ja'
+    | 'zh'
+    | 'es'
+    | 'de'
+    | 'fr'
+    | 'pt'
+    | 'ru'
+    | 'it'
+    | 'nl'
+    | 'pl'
+    | 'tr'
+    | 'vi'
+    | 'cs'
+    | 'fa'
+    | 'id'
+    | 'ko'
+    | 'uk'
+    | 'hu'
+    | 'ar'
+    | 'sv'
+    | 'ro'
+    | 'el';
+  /**
+   * Musical key (e.g., "C major", "E minor"). Mirrors ComfyUI's
+   * TextEncodeAceStepAudio1.5 keyscale combo: 17 roots × {major, minor}.
+   */
+  key?:
+    | 'C major'
+    | 'C# major'
+    | 'Db major'
+    | 'D major'
+    | 'D# major'
+    | 'Eb major'
+    | 'E major'
+    | 'F major'
+    | 'F# major'
+    | 'Gb major'
+    | 'G major'
+    | 'G# major'
+    | 'Ab major'
+    | 'A major'
+    | 'A# major'
+    | 'Bb major'
+    | 'B major'
+    | 'C minor'
+    | 'C# minor'
+    | 'Db minor'
+    | 'D minor'
+    | 'D# minor'
+    | 'Eb minor'
+    | 'E minor'
+    | 'F minor'
+    | 'F# minor'
+    | 'Gb minor'
+    | 'G minor'
+    | 'G# minor'
+    | 'Ab minor'
+    | 'A minor'
+    | 'A# minor'
+    | 'Bb minor'
+    | 'B minor';
   /**
    * Weight for instrumental elements (0.0-1.0)
    */
@@ -177,6 +278,14 @@ export type AceStepAudioInput = {
    * non-turbo base / sft variants expect CFG on (around 4).
    */
   cfg?: number;
+  /**
+   * Optional LoRAs to apply. Each entry's strength is applied to both the
+   * diffusion model (UNET) and the dual CLIP via ComfyUI's LoraLoader.
+   * Compatibility with non-default base models is the caller's responsibility.
+   */
+  loras: {
+    [key: string]: number;
+  };
 };
 /**
  * Output from ACE Step 1.5 audio generation workflow step.
@@ -413,6 +522,11 @@ export type AssistantMessage = Omit<ChatCompletionMessage, 'role'> & {
    * Tool calls requested by the model.
    */
   tool_calls?: null | Array<ChatCompletionToolCall>;
+  /**
+   * Generated images attached to this assistant message, populated when the request
+   * included "image" in its modalities. Each entry is a base64 data URI.
+   */
+  images?: null | Array<ChatCompletionGeneratedImage>;
   role: 'assistant';
 };
 export type AudioBlob = Omit<Blob, 'type'> & {
@@ -422,6 +536,57 @@ export type AudioBlob = Omit<Blob, 'type'> & {
   duration?: null | number;
   type: 'audio';
 };
+export type AudioCaptioningInput = {
+  /**
+   * The URL of the audio file or zip archive to caption.
+   */
+  mediaUrl: string;
+  /**
+   * Sampling temperature for both ACE-Step requests.
+   */
+  temperature: number;
+  /**
+   * Maximum number of tokens to generate for each ACE-Step request.
+   */
+  maxNewTokens: number;
+};
+export type AudioCaptioningOutput = {
+  /**
+   * Combined caption, transcription, and music metadata for the first or only audio item.
+   */
+  text?: null | string;
+  /**
+   * Per-file results when the input is an archive or contains multiple audio items.
+   */
+  results: {
+    [key: string]: AudioCaptioningOutputItem;
+  };
+};
+export type AudioCaptioningOutputItem = {
+  text: string;
+  caption?: null | string;
+  lyrics?: null | string;
+  bpm?: null | string;
+  keyScale?: null | string;
+  timeSignature?: null | string;
+  duration?: null | string;
+  language?: null | string;
+};
+/**
+ * Audio Captioning
+ */
+export type AudioCaptioningStep = Omit<WorkflowStep, '$type'> & {
+  input: AudioCaptioningInput;
+  output?: AudioCaptioningOutput;
+  $type: 'audioCaptioning';
+};
+/**
+ * Audio Captioning
+ */
+export type AudioCaptioningStepTemplate = Omit<WorkflowStepTemplate, '$type'> & {
+  input: AudioCaptioningInput;
+  $type: 'audioCaptioning';
+};
 export type BatchOcrSafetyClassificationInput = {
   mediaUrls: Array<string>;
 };
@@ -639,6 +804,44 @@ export type ChatCompletionFunctionCall = {
   name: string;
   arguments: string;
 };
+/**
+ * A generated image attached to an assistant message when "image" is included in
+ * Civitai.Orchestration.Grains.Workflows.Steps.ChatCompletion.ChatCompletionInput.Modalities. Matches the OpenRouter wire shape.
+ */
+export type ChatCompletionGeneratedImage = {
+  /**
+   * Always "image_url".
+   */
+  type?: string;
+  image_url: ChatCompletionGeneratedImageUrl;
+};
+/**
+ * The image_url payload on a generated image. Currently always a base64 data URI.
+ */
+export type ChatCompletionGeneratedImageUrl = {
+  /**
+   * Base64 data URI (e.g. "data:image/png;base64,...").
+   */
+  url: string;
+};
+/**
+ * Image generation parameters used when Civitai.Orchestration.Grains.Workflows.Steps.ChatCompletion.ChatCompletionInput.Modalities contains "image".
+ * Mirrors OpenRouter's `image_config` shape on chat-completion requests.
+ */
+export type ChatCompletionImageConfig = {
+  /**
+   * Width:height aspect ratio. Examples: "1:1", "16:9", "9:16", "4:3", "3:4", "21:9".
+   */
+  aspect_ratio?: '1:1' | '16:9' | '9:16' | '4:3' | '3:4' | '21:9';
+  /**
+   * Approximate output resolution. "1K" ≈ 1MP, "2K" ≈ 2MP, etc. Engines clamp to their supported range.
+   */
+  image_size?: '0.5K' | '1K' | '2K' | '4K';
+  /**
+   * Number of images to generate. Engines may clamp to their supported maximum.
+   */
+  n?: null | number;
+};
 /**
  * Image URL details matching OpenAI API spec.
  */
@@ -727,6 +930,23 @@ export type ChatCompletionInput = {
    * Can be "auto", "none", "required", or an object specifying a particular function.
    */
   tool_choice?: null;
+  /**
+   * Output modalities the model should produce. Defaults to text-only when omitted.
+   * Supported values: "text", "image". When "image" is included, the request is routed
+   * to the image generation pipeline and returns generated images on the assistant message.
+   */
+  modalities?: null | Array<string>;
+  image_config?: ChatCompletionImageConfig;
+  responseFormat?: ChatCompletionResponseFormat;
+};
+export type ChatCompletionJsonSchema = {
+  name: string;
+  description?: null | string;
+  schema: unknown;
+  /**
+   * OpenAI strict mode. Forces additionalProperties=false and all fields required.
+   */
+  strict?: null | boolean;
 };
 /**
  * Base type for chat messages, discriminated by the "role" property.
@@ -764,6 +984,27 @@ export type ChatCompletionOutput = {
    * System fingerprint for the model configuration.
    */
   systemFingerprint?: null | string;
+  /**
+   * Parsed JSON content of `Choices[0].Message.Content`. Populated when the request
+   * specified a JSON-flavored `response_format` and the content was parseable.
+   * Reachable from downstream workflow steps via `$ref` paths like
+   * `output.parsed.<field>` — DynamicAssignmentEvaluator walks JsonElement trees
+   * the same way it walks the rest of this output.
+   */
+  parsed?: null;
+};
+/**
+ * OpenAI-compatible response_format. When Civitai.Orchestration.Grains.Workflows.Steps.ChatCompletion.ChatCompletionResponseFormat.Type is `json_object` or
+ * `json_schema`, the LLM-emitted content is parsed as JSON server-side and exposed on
+ * Civitai.Orchestration.Grains.Workflows.Steps.ChatCompletion.ChatCompletionOutput.Parsed, allowing downstream workflow steps to reference
+ * individual fields via `$ref` paths like `output.parsed.<field>`.
+ */
+export type ChatCompletionResponseFormat = {
+  /**
+   * OpenAI-compatible value: `text`, `json_object`, or `json_schema`.
+   */
+  type: string;
+  jsonSchema?: ChatCompletionJsonSchema;
 };
 /**
  * ChatCompletion
@@ -785,7 +1026,11 @@ export type ChatCompletionStepTemplate = Omit<WorkflowStepTemplate, '$type'> & {
  */
 export type ChatCompletionTool = {
   type: string;
-  function: ChatCompletionFunction;
+  function?: ChatCompletionFunction;
+  /**
+   * Server-tool parameters for providers such as OpenRouter.
+   */
+  parameters?: null;
 };
 /**
  * A tool call returned in an assistant message response.
@@ -824,6 +1069,33 @@ export declare const CoarseMode: {
   readonly ENABLE: 'enable';
 };
 export type CoarseMode = (typeof CoarseMode)[keyof typeof CoarseMode];
+export type ComfyAnimaCreateImageGenInput = Omit<
+  ComfyAnimaImageGenInput,
+  'engine' | 'ecosystem' | 'operation'
+> & {
+  width?: number;
+  height?: number;
+  operation: 'createImage';
+  ecosystem: 'anima';
+  engine: 'comfy';
+};
+export type ComfyAnimaImageGenInput = Omit<ComfyImageGenInput, 'engine' | 'ecosystem'> & {
+  operation: string;
+  prompt: string;
+  negativePrompt?: null | string;
+  sampler?: ComfySampler;
+  scheduler?: ComfyScheduler;
+  steps?: number;
+  cfgScale?: number;
+  seed?: null | number;
+  quantity?: number;
+  loras?: {
+    [key: string]: number;
+  };
+  diffuserModel?: string;
+  ecosystem: 'anima';
+  engine: 'comfy';
+};
 export type ComfyErnieImageGenInput = Omit<ComfyImageGenInput, 'engine' | 'ecosystem'> & {
   model: string;
   ecosystem: 'ernie';
@@ -935,6 +1207,41 @@ export type ComfyFlux1VariantImageGenInput = Omit<
   ecosystem: 'flux1';
   engine: 'comfy';
 };
+export type ComfyFlux2DevCreateImageInput = Omit<
+  ComfyFlux2DevImageGenInput,
+  'engine' | 'ecosystem' | 'operation'
+> & {
+  operation: 'createImage';
+  ecosystem: 'flux2Dev';
+  engine: 'comfy';
+};
+export type ComfyFlux2DevEditImageInput = Omit<
+  ComfyFlux2DevImageGenInput,
+  'engine' | 'ecosystem' | 'operation'
+> & {
+  images?: Array<string>;
+  operation: 'editImage';
+  ecosystem: 'flux2Dev';
+  engine: 'comfy';
+};
+export type ComfyFlux2DevImageGenInput = Omit<ComfyImageGenInput, 'engine' | 'ecosystem'> & {
+  operation: string;
+  prompt: string;
+  width?: number;
+  height?: number;
+  seed?: null | number;
+  quantity?: number;
+  cfgScale?: number;
+  steps?: number;
+  sampler?: ComfySampler;
+  scheduler?: ComfyScheduler;
+  negativePrompt?: null | string;
+  loras?: {
+    [key: string]: number;
+  };
+  ecosystem: 'flux2Dev';
+  engine: 'comfy';
+};
 export type ComfyImageGenInput = Omit<ImageGenInput, 'engine'> & {
   ecosystem: string;
   engine: 'comfy';
@@ -1055,6 +1362,12 @@ export type ComfyLtx23VideoGenInput = Omit<VideoGenInput, 'engine'> & {
   loras?: {
     [key: string]: number;
   };
+  /**
+   * Optional override for the LTX 2.3 diffusion-model checkpoint. When set, replaces the
+   * transformer file selected by Civitai.Orchestration.Grains.Workflows.Steps.VideoGen.ComfyLtx23VideoGenInput.Model while leaving the CLIPs, VAEs, and
+   * upscale-LoRA behavior unchanged. Use to point at a community fine-tune (e.g. SulphurAI/Sulphur-2-base).
+   */
+  diffusionModel?: null | string;
   engine: 'ltx2.3';
 };
 /**
@@ -1188,6 +1501,7 @@ export declare const ComfySampler: {
   readonly DDIM: 'ddim';
   readonly UNI_PC: 'uni_pc';
   readonly UNI_PC_BH2: 'uni_pc_bh2';
+  readonly ER_SDE: 'er_sde';
 };
 export type ComfySampler = (typeof ComfySampler)[keyof typeof ComfySampler];
 export declare const ComfyScheduler: {
@@ -3030,7 +3344,27 @@ export type ModelClamScanOutput = {
    * The raw ClamAV scan output.
    */
   output?: null | string;
+  status?: ModelClamScanStatus;
+  /**
+   * True when ClamAV reported one or more infected files (exit code 1).
+   */
+  infected?: null | boolean;
+  /**
+   * Number of infected files parsed from the ClamAV scan summary.
+   */
+  infectedFileCount?: null | number;
+  /**
+   * Number of files scanned, parsed from the ClamAV scan summary.
+   */
+  scannedFileCount?: null | number;
+};
+export declare const ModelClamScanStatus: {
+  readonly CLEAN: 'clean';
+  readonly INFECTED: 'infected';
+  readonly TIMEOUT: 'timeout';
+  readonly ERROR: 'error';
 };
+export type ModelClamScanStatus = (typeof ModelClamScanStatus)[keyof typeof ModelClamScanStatus];
 /**
  * ModelClamScan
  */
@@ -3113,8 +3447,9 @@ export type ModelParseMetadataInput = {
  */
 export type ModelParseMetadataOutput = {
   /**
-   * The raw JSON metadata header as stored in the safetensors file, or null when
-   * the model is not a safetensors file or the header could not be parsed.
+   * The `__metadata__` object from the safetensors header as a JSON string,
+   * or null when the model is not a safetensors file, the header could not be
+   * parsed, or no `__metadata__` object is present.
    */
   metadata?: null | string;
 };
@@ -3162,7 +3497,43 @@ export type ModelPickleScanOutput = {
    * Dangerous imports discovered during pickle scanning.
    */
   dangerousImports?: null | Array<string>;
+  status?: ModelPickleScanStatus;
+  /**
+   * True when one or more dangerous imports were detected.
+   */
+  dangerousImportsFound?: null | boolean;
+  /**
+   * True when picklescan was skipped (e.g. file is safetensors and cannot contain pickled code).
+   */
+  skipped?: null | boolean;
+  /**
+   * Reason picklescan was skipped, if applicable. Examples: "safetensors", "safetensors-extension".
+   */
+  skipReason?: null | string;
+  /**
+   * Number of files scanned, parsed from the picklescan summary.
+   */
+  scannedFileCount?: null | number;
+  /**
+   * Number of infected files reported by picklescan.
+   */
+  infectedFileCount?: null | number;
+  /**
+   * Number of dangerous globals reported by picklescan.
+   */
+  dangerousGlobalCount?: null | number;
+};
+export declare const ModelPickleScanStatus: {
+  readonly CLEAN: 'clean';
+  readonly DANGEROUS_IMPORTS_FOUND: 'dangerousImportsFound';
+  readonly SKIPPED_SAFETENSORS: 'skippedSafetensors';
+  readonly SKIPPED_GGUF: 'skippedGguf';
+  readonly SKIPPED: 'skipped';
+  readonly PARSE_ERROR: 'parseError';
+  readonly ERROR: 'error';
 };
+export type ModelPickleScanStatus =
+  (typeof ModelPickleScanStatus)[keyof typeof ModelPickleScanStatus];
 /**
  * ModelPickleScan
  */
@@ -3665,6 +4036,13 @@ export type PromptEnhancementInput = {
    * Optional instruction to guide how the prompt is enhanced (e.g., "expand to 77 tokens", "keep it under 20 words").
    */
   instruction?: null | string;
+  /**
+   * Optional reference images for the prompt enhancement model to consider when enhancing the prompt
+   * (subject, style, lighting, composition, color palette). Accepts URLs, data URIs, raw base64, or AIR strings.
+   * Requires the per-ecosystem prompt-analysis model to be a vision-capable LLM (configured via
+   * IPromptAnalysisGrain.SetConfigurationAsync) — non-VLM models will silently ignore the images.
+   */
+  images?: null | Array<string>;
 };
 /**
  * Output from prompt enhancement analysis.
@@ -3882,6 +4260,19 @@ export type Qwen3TextToSpeechInput = Omit<VllmOmniTextToSpeechInput, 'engine' |
   ecosystem: 'qwen3';
   engine: 'vllm-omni';
 };
+export type Qwen3VoiceDesignTtsInput = Omit<
+  Qwen3TextToSpeechInput,
+  'engine' | 'ecosystem' | 'operation'
+> & {
+  /**
+   * Natural-language description of the desired voice
+   * (e.g., "a calm middle-aged male narrator with a slight British accent").
+   */
+  instruct: string;
+  operation: 'voiceDesign';
+  ecosystem: 'qwen3';
+  engine: 'vllm-omni';
+};
 /**
  * AI Toolkit training for Qwen Image models
  */
@@ -4009,7 +4400,7 @@ export type ResourceInfo = {
   publishedAt?: null | string;
   /**
    * A boolean indicating whether this resource restricts to SFW content generation.
-   * NSFWContent covers X and AA whereas MatureContent includes R rated content.
+   * NSFWContent covers X and XXX whereas MatureContent includes R rated content.
    */
   hasNSFWContentRestriction: boolean;
 };
@@ -4235,7 +4626,7 @@ export type SeedanceVideoGenInput = Omit<VideoGenInput, 'engine'> & {
   duration: 4 | 5 | 6 | 7 | 8 | 9 | 10 | 11 | 12 | 13 | 14 | 15;
   generateAudio?: boolean;
   seed?: null | number;
-  resolution: '480p' | '720p';
+  resolution: '480p' | '720p' | '1080p';
   images?: Array<string>;
   engine: 'seedance';
 };
@@ -7423,6 +7814,36 @@ export type InvokeAgeClassificationStepTemplateResponses = {
 };
 export type InvokeAgeClassificationStepTemplateResponse =
   InvokeAgeClassificationStepTemplateResponses[keyof InvokeAgeClassificationStepTemplateResponses];
+export type InvokeAudioCaptioningStepTemplateData = {
+  body?: AudioCaptioningInput;
+  path?: never;
+  query?: {
+    experimental?: boolean;
+    allowMatureContent?: boolean;
+    whatif?: boolean;
+  };
+  url: '/v2/consumer/recipes/audioCaptioning';
+};
+export type InvokeAudioCaptioningStepTemplateErrors = {
+  /**
+   * Bad Request
+   */
+  400: ProblemDetails;
+  /**
+   * Unauthorized
+   */
+  401: ProblemDetails;
+};
+export type InvokeAudioCaptioningStepTemplateError =
+  InvokeAudioCaptioningStepTemplateErrors[keyof InvokeAudioCaptioningStepTemplateErrors];
+export type InvokeAudioCaptioningStepTemplateResponses = {
+  /**
+   * OK
+   */
+  200: AudioCaptioningOutput;
+};
+export type InvokeAudioCaptioningStepTemplateResponse =
+  InvokeAudioCaptioningStepTemplateResponses[keyof InvokeAudioCaptioningStepTemplateResponses];
 export type InvokeBatchOcrSafetyClassificationStepTemplateData = {
   body?: BatchOcrSafetyClassificationInput;
   path?: never;

package/dist/generated/types.gen.js CHANGED Viewed

@@ -61,6 +61,7 @@ export const ComfySampler = {
     DDIM: 'ddim',
     UNI_PC: 'uni_pc',
     UNI_PC_BH2: 'uni_pc_bh2',
+    ER_SDE: 'er_sde',
 };
 export const ComfyScheduler = {
     NORMAL: 'normal',
@@ -232,6 +233,21 @@ export const Metric3dBackbone = {
     VIT_GIANT2: 'vit-giant2',
 };
 export const MiniMaxVideoGenModel = { HAILOU: 'hailou' };
+export const ModelClamScanStatus = {
+    CLEAN: 'clean',
+    INFECTED: 'infected',
+    TIMEOUT: 'timeout',
+    ERROR: 'error',
+};
+export const ModelPickleScanStatus = {
+    CLEAN: 'clean',
+    DANGEROUS_IMPORTS_FOUND: 'dangerousImportsFound',
+    SKIPPED_SAFETENSORS: 'skippedSafetensors',
+    SKIPPED_GGUF: 'skippedGguf',
+    SKIPPED: 'skipped',
+    PARSE_ERROR: 'parseError',
+    ERROR: 'error',
+};
 export const NsfwLevel = {
     PG: 'pg',
     PG13: 'pg13',

package/dist/utils/Air.d.ts CHANGED Viewed

@@ -8,6 +8,8 @@ type AirProps = {
   /** Id of the resource from the source */
   id: string;
   version?: string;
+  /** Id of a specific model file within the version */
+  modelFileId?: string;
   /** The format of the model (safetensor, ckpt, diffuser, tensor rt) optional */
   format?: string;
 };
@@ -16,6 +18,6 @@ export declare abstract class Air {
   static parse(identifier: string): AirProps;
   static parseSafe(identifier: string): AirProps | undefined;
   static isAir(identifier: string): boolean;
-  static stringify({ ecosystem, type, source, id, version, format }: AirProps): string;
+  static stringify({ ecosystem, type, source, id, version, modelFileId, format }: AirProps): string;
 }
 export {};

package/dist/utils/Air.js CHANGED Viewed

@@ -1,4 +1,4 @@
-const regex = /^(?:urn:)?(?:air:)?(?:(?<ecosystem>[a-zA-Z0-9_\-\/]+):)?(?:(?<type>[a-zA-Z0-9_\-\/]+):)?(?<source>[a-zA-Z0-9_\-\/]+):(?<id>[a-zA-Z0-9_\-\/\.]+)(?:@(?<version>[a-zA-Z0-9_\-\/.]+))?(?:\.(?<format>[a-zA-Z0-9_\-]+))?$/i;
+const regex = /^(?:urn:)?(?:air:)?(?:(?<ecosystem>[a-zA-Z0-9_\-\/]+):)?(?:(?<type>[a-zA-Z0-9_\-\/]+):)?(?<source>[a-zA-Z0-9_\-\/]+):(?<id>[a-zA-Z0-9_\-\/\.]+)(?:@(?<version>[a-zA-Z0-9_\-\/.]+))?(?:\+(?<modelFileId>\d+))?(?:\.(?<format>[a-zA-Z0-9_\-]+))?$/i;
 /** https://github.com/civitai/civitai/wiki/AIR-%E2%80%90-Uniform-Resource-Names-for-AI */
 export class Air {
     static parse(identifier) {
@@ -15,7 +15,7 @@ export class Air {
     static isAir(identifier) {
         return regex.test(identifier);
     }
-    static stringify({ ecosystem, type, source, id, version, format }) {
-        return `urn:air:${ecosystem}:${type}:${source}:${id}${version ? `@${version}` : ''}${format ? `:${format}` : ''}`;
+    static stringify({ ecosystem, type, source, id, version, modelFileId, format }) {
+        return `urn:air:${ecosystem}:${type}:${source}:${id}${version ? `@${version}` : ''}${modelFileId ? `+${modelFileId}` : ''}${format ? `.${format}` : ''}`;
     }
 }

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@civitai/client",
-  "version": "0.2.0-beta.55",
+  "version": "0.2.0-beta.57",
   "description": "Civitai's javascript client for generating ai content",
   "main": "dist/index.js",
   "types": "dist/index.d.ts",