npm - @vectorx/ai-sdk - Versions diffs - 1.0.0 → 1.1.0 - Mend

@vectorx/ai-sdk 1.0.0 → 1.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (38) hide show

package/lib/ai.d.ts +1 -1
package/lib/ai.js +14 -0
package/lib/model-type.d.ts +26 -0
package/lib/models/Chat.d.ts +2 -2
package/lib/models/Default/index.d.ts +1 -0
package/lib/models/Default/index.js +27 -1
package/lib/models/Qwen25T2iPreview/index.d.ts +3 -1
package/lib/models/Qwen25T2iPreview/index.js +49 -0
package/lib/models/Qwen3VlPlus/index.d.ts +2 -0
package/lib/models/Qwen3VlPlus/index.js +66 -2
package/lib/models/QwenCosyVoiceTTS/index.d.ts +8 -0
package/lib/models/QwenCosyVoiceTTS/index.js +178 -0
package/lib/models/QwenDocTurbo/adapters/DashScope.d.ts +2 -0
package/lib/models/QwenDocTurbo/adapters/DashScope.js +86 -11
package/lib/models/QwenDocTurbo/adapters/OpenAICompat.d.ts +2 -0
package/lib/models/QwenDocTurbo/adapters/OpenAICompat.js +102 -3
package/lib/models/QwenImage/index.d.ts +3 -1
package/lib/models/QwenImage/index.js +52 -1
package/lib/models/QwenImage20/index.d.ts +91 -0
package/lib/models/QwenImage20/index.js +244 -0
package/lib/models/QwenImageEdit/index.d.ts +3 -1
package/lib/models/QwenImageEdit/index.js +52 -1
package/lib/models/QwenSketchToImage/index.d.ts +1 -1
package/lib/models/QwenStyleRepaintV1/index.d.ts +1 -1
package/lib/models/QwenStyleRepaintV1/index.js +3 -1
package/lib/models/QwenVlMax/index.d.ts +2 -0
package/lib/models/QwenVlMax/index.js +67 -2
package/lib/models/TTSModel.d.ts +11 -0
package/lib/models/TTSModel.js +75 -0
package/lib/models/Wan26Image/index.d.ts +3 -1
package/lib/models/Wan26Image/index.js +52 -1
package/lib/models/index.d.ts +25 -3
package/lib/models/index.js +49 -2
package/lib/models/react.d.ts +6 -2
package/lib/models/react.js +22 -0
package/lib/stream.js +10 -7
package/lib/tokenManager.js +11 -1
package/package.json +9 -7

package/lib/ai.d.ts CHANGED Viewed

@@ -10,7 +10,7 @@ export declare class AI {
     protected request: IAbstractRequest;
     tokenManager: TokenManager;
     constructor(request: IAbstractRequest, baseUrl: string, env: AiSdkEnv);
-    createModel(model: models.ModelName | models.MultiModalModelName): models.ReActModel;
+    createModel(model: models.ModelName | models.MultiModalModelName | models.TTSModelName): models.ReActModel;
     createAgent(options: types.IAgentOptions): Agent;
     registerFunctionTool(functionTool: types.FunctionTool): void;
 }

package/lib/ai.js CHANGED Viewed

@@ -47,19 +47,33 @@ class AI {
         this.tokenManager = new tokenManager_1.TokenManager(this.request, this.baseUrl);
     }
     createModel(model) {
+        var _a;
+        const _debug = process.env.VECTORX_DEBUG === "1";
+        if (_debug)
+            console.log("[AI:createModel] model:", model, "env:", this.env, "baseUrl:", (_a = this.baseUrl) === null || _a === void 0 ? void 0 : _a.slice(0, 50));
         if (this.env === index_1.AiSdkEnv.MiniProgram) {
             console.warn(`[${index_1.AiSdkEnv.MiniProgram}] is not supported for model creation`);
             return null;
         }
         if (!models.isValidModel(model)) {
+            console.error("[AI:createModel] invalid model:", model);
             throw new Error(`[${model}] is not supported, please check the model name`);
         }
+        if (models.isTTSModel(model)) {
+            if (_debug)
+                console.log("[AI:createModel] creating TTS model:", model);
+            return new models.ReActModel(new models.AliyunCosyVoiceTTSModel(this.tokenManager, model));
+        }
         switch (model) {
             case models.MultiModalModelName.QwenImage:
                 return new models.ReActModel(new models.QwenImageModel(this.request, models.QwenImageModel.BASE_URL, this.tokenManager));
             case models.MultiModalModelName.QwenImageEditPlus:
             case models.MultiModalModelName.QwenImageEdit:
                 return new models.ReActModel(new models.QwenImageEditModel(this.request, models.QwenImageEditModel.BASE_URL, this.tokenManager, model));
+            case models.MultiModalModelName.QwenImage20Pro:
+                return new models.ReActModel(new models.QwenImage20ProModel(this.request, models.QwenImage20ProModel.BASE_URL, this.tokenManager));
+            case models.MultiModalModelName.QwenImage20:
+                return new models.ReActModel(new models.QwenImage20FastModel(this.request, models.QwenImage20FastModel.BASE_URL, this.tokenManager));
             case models.MultiModalModelName.WanxSketchToImageLite:
                 return new models.ReActModel(new models.WanxSketchToImageLiteModel(this.request, models.WanxSketchToImageLiteModel.BASE_URL, this.tokenManager));
             case models.MultiModalModelName.QwenStyleRepaintV1:

package/lib/model-type.d.ts CHANGED Viewed

@@ -187,6 +187,32 @@ interface Usage {
     reasoning_tokens: number;
     total_tokens: number;
 }
+export interface TTSRequestOptions {
+    text: string;
+    voice: string;
+    format?: "mp3" | "wav" | "pcm" | "opus";
+    sampleRate?: 8000 | 16000 | 22050 | 24000 | 44100 | 48000;
+    volume?: number;
+    rate?: number;
+    pitch?: number;
+    instruction?: string;
+    languageHints?: string[];
+}
+export interface TTSStreamChunk {
+    audio: Buffer;
+    event: "sentence-begin" | "sentence-synthesis" | "sentence-end";
+    sentence?: {
+        index: number;
+        originalText?: string;
+    };
+}
+export type DoStreamSpeechOutput = AsyncIterableReadableStream<TTSStreamChunk>;
+export interface DoGenerateSpeechOutput {
+    audio: Buffer;
+    usage: {
+        characters: number;
+    };
+}
 export interface IAgent {
     sendMessage(input: SendMessageInput): Promise<any>;
     getHistoryMessages?(input: GetHistoryMessagesParams): Promise<GetHistoryMessagesResponse>;

package/lib/models/Chat.d.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 import type { IAbstractRequest } from "@vectorx/ai-types";
-import { DoGenerateOutput, DoStreamOutput, ModelRequestOptions, ReqOptions } from "../model-type";
-import { TokenManager } from "../tokenManager";
+import type { DoGenerateOutput, DoStreamOutput, ModelRequestOptions, ReqOptions } from "../model-type";
+import type { TokenManager } from "../tokenManager";
 export declare abstract class SimpleChatModel {
     protected req: IAbstractRequest;
     protected baseUrl: string;

package/lib/models/Default/index.d.ts CHANGED Viewed

@@ -5,6 +5,7 @@ import type { ModelName } from "../index";
 export declare class DefaultSimpleModel extends SimpleChatModel {
     modelName: ModelName;
     constructor(req: IAbstractRequest, baseUrl: string, modelName: ModelName);
+    private adaptMessages;
     protected modelRequest(data: ModelRequestOptions, options?: ReqOptions): Promise<ReadableStream<Uint8Array> | Promise<unknown>>;
     doGenerate(data: ModelRequestOptions, options?: ReqOptions): Promise<DoGenerateOutput>;
     doStream(data: ModelRequestOptions, options?: ReqOptions): Promise<DoStreamOutput>;

package/lib/models/Default/index.js CHANGED Viewed

@@ -30,24 +30,45 @@ class DefaultSimpleModel extends Chat_1.SimpleChatModel {
         super(req, baseUrl, "conversation/chat");
         this.modelName = modelName;
     }
+    adaptMessages(data) {
+        if (!data.messages)
+            return data;
+        return Object.assign(Object.assign({}, data), { messages: data.messages.map((msg) => {
+                if (typeof msg.content === "string" || !Array.isArray(msg.content))
+                    return msg;
+                return Object.assign(Object.assign({}, msg), { content: msg.content.map((item) => {
+                        if (item.type !== "text")
+                            return item;
+                        if ("content" in item)
+                            return item;
+                        if ("text" in item)
+                            return { type: "text", content: item.text };
+                        return item;
+                    }) });
+            }) });
+    }
     modelRequest(data_1) {
         return __awaiter(this, arguments, void 0, function* (data, options = {
             timeout: 30 * 1000,
         }) {
             const fetchHeaders = Object.assign({ "Content-Type": "application/json" }, ((options === null || options === void 0 ? void 0 : options.headers) || {}));
             data.stream && Object.assign(fetchHeaders, { Accept: "text/event-stream" });
+            const reqUrl = `${this.baseUrl}/${this.subUrl}`;
+            console.log("[DefaultSimpleModel:modelRequest] fetching:", reqUrl, JSON.stringify(data, null, 2));
             const { data: responseData, header } = (yield this.req.fetch({
-                url: `${this.baseUrl}/${this.subUrl}`,
+                url: reqUrl,
                 headers: Object.assign({}, fetchHeaders),
                 body: JSON.stringify(data),
                 method: "post",
                 stream: Boolean(data.stream),
             }));
+            console.log("[DefaultSimpleModel:modelRequest] response received, type:", typeof responseData, "hasHeader:", !!header);
             return (0, utils_1.handleResponseData)(responseData, header);
         });
     }
     doGenerate(data, options) {
         return __awaiter(this, void 0, void 0, function* () {
+            data = this.adaptMessages(data);
             data.model = this.modelName;
             const payload = Object.assign(Object.assign(Object.assign({}, defaultOptions), data), { stream: false });
             const res = yield this.modelRequest(payload, options);
@@ -56,9 +77,14 @@ class DefaultSimpleModel extends Chat_1.SimpleChatModel {
     }
     doStream(data, options) {
         return __awaiter(this, void 0, void 0, function* () {
+            var _a;
+            data = this.adaptMessages(data);
             data.model = this.modelName;
             const payload = Object.assign(Object.assign(Object.assign({}, defaultOptions), data), { stream: true });
+            console.log("[DefaultSimpleModel:doStream] url:", `${this.baseUrl}/${this.subUrl}`, "model:", this.modelName);
+            console.log("[DefaultSimpleModel:doStream] messages count:", (_a = payload.messages) === null || _a === void 0 ? void 0 : _a.length);
             const _stream = (yield this.modelRequest(payload, options));
+            console.log("[DefaultSimpleModel:doStream] got stream:", !!_stream, "type:", typeof _stream);
             const stream = (0, stream_1.toPolyfillReadable)(_stream);
             const standardStream = (0, stream_1.intoStandardStream)(stream);
             return (0, stream_1.createAsyncIterable)(standardStream);

package/lib/models/Qwen25T2iPreview/index.d.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 import type { IAbstractRequest } from "@vectorx/ai-types";
 import type { DoGenerateOutput, DoStreamOutput, ModelRequestOptions, ReqOptions } from "../../model-type";
-import { TokenManager } from "../../tokenManager";
+import type { TokenManager } from "../../tokenManager";
 import { SimpleChatModel } from "../Chat";
 export interface Qwen25T2iPreviewParameters {
     size?: string;
@@ -71,6 +71,8 @@ export declare class Qwen25T2iPreviewModel extends SimpleChatModel {
         parameters?: Qwen25T2iPreviewParameters;
     }): Qwen25T2iPreviewRequestOptions;
     protected modelRequest(data: Qwen25T2iPreviewRequestOptions, options?: ReqOptions): Promise<ReadableStream<Uint8Array> | Promise<unknown>>;
+    private isErrorResponse;
+    private normalizeErrorResponse;
     doGenerate(data: ModelRequestOptions, options?: ReqOptions): Promise<DoGenerateOutput>;
     doStream(data: ModelRequestOptions, options?: ReqOptions): Promise<DoStreamOutput>;
 }

package/lib/models/Qwen25T2iPreview/index.js CHANGED Viewed

@@ -149,11 +149,60 @@ class Qwen25T2iPreviewModel extends Chat_1.SimpleChatModel {
             return (0, utils_1.handleResponseData)(responseData, header);
         });
     }
+    isErrorResponse(obj) {
+        if ((obj === null || obj === void 0 ? void 0 : obj.error) && typeof obj.error === "object" && obj.error.code)
+            return true;
+        if (typeof (obj === null || obj === void 0 ? void 0 : obj.code) === "string" && !(obj === null || obj === void 0 ? void 0 : obj.output))
+            return true;
+        if (typeof (obj === null || obj === void 0 ? void 0 : obj.code) === "number" && obj.code !== 0 && !(obj === null || obj === void 0 ? void 0 : obj.output))
+            return true;
+        return false;
+    }
+    normalizeErrorResponse(res) {
+        var _a, _b;
+        const err = typeof (res === null || res === void 0 ? void 0 : res.error) === "object" ? res.error : {};
+        const errorCode = (err === null || err === void 0 ? void 0 : err.code) || (res === null || res === void 0 ? void 0 : res.code) || "unknown_error";
+        const errorMessage = (err === null || err === void 0 ? void 0 : err.message) || (res === null || res === void 0 ? void 0 : res.message) || "Unknown error";
+        const id = (res === null || res === void 0 ? void 0 : res.id) || (res === null || res === void 0 ? void 0 : res.request_id) || "";
+        const created = (_a = res === null || res === void 0 ? void 0 : res.created) !== null && _a !== void 0 ? _a : Math.floor(Date.now() / 1000);
+        return {
+            id,
+            object: "chat.completion",
+            created,
+            model: (_b = res === null || res === void 0 ? void 0 : res.model) !== null && _b !== void 0 ? _b : this.modelName,
+            log_id: id,
+            error: `[${errorCode}] ${errorMessage}`,
+            code: typeof (res === null || res === void 0 ? void 0 : res.code) === "number" ? res.code : -1,
+            choices: [
+                {
+                    index: 0,
+                    message: {
+                        id,
+                        role: "assistant",
+                        type: "error",
+                        content: `[${errorCode}] ${errorMessage}`,
+                        reasoning_content: "",
+                    },
+                    finish_reason: "error",
+                },
+            ],
+            usage: {
+                prompt_tokens: 0,
+                completion_tokens: 0,
+                knowledge_tokens: 0,
+                reasoning_tokens: 0,
+                total_tokens: 0,
+            },
+        };
+    }
     doGenerate(data, options) {
         return __awaiter(this, void 0, void 0, function* () {
             data.model = this.modelName;
             const payload = this.coverModelRequestToQwenInput(data);
             const res = (yield this.modelRequest(payload, options));
+            if (this.isErrorResponse(res)) {
+                return this.normalizeErrorResponse(res);
+            }
             return this.normalizeStandardImageCompletion(res, this.modelName);
         });
     }

package/lib/models/Qwen3VlPlus/index.d.ts CHANGED Viewed

@@ -72,6 +72,8 @@ export declare class Qwen3VlPlus extends SimpleChatModel {
     constructor(req: IAbstractRequest, baseUrl: string, modelName: MultiModalModelName, tokenManager: TokenManager);
     protected modelRequest(data: Qwen3VlPlusAPIInput, options?: ReqOptions): Promise<ReadableStream<Uint8Array> | Promise<unknown>>;
     protected normalizeResponse(response: Qwen3VlPlusResponse): DoGenerateOutput;
+    private normalizeErrorResponse;
+    private isErrorResponse;
     doGenerate(data: ModelRequestOptions, options?: ReqOptions): Promise<DoGenerateOutput>;
     doStream(data: ModelRequestOptions, options?: ReqOptions): Promise<DoStreamOutput>;
     private convertToQwen3VlPlusRequestOptions;

package/lib/models/Qwen3VlPlus/index.js CHANGED Viewed

@@ -77,11 +77,61 @@ class Qwen3VlPlus extends Chat_1.SimpleChatModel {
             },
         };
     }
+    normalizeErrorResponse(res) {
+        var _a, _b;
+        const err = (res === null || res === void 0 ? void 0 : res.error) || {};
+        const errorCode = (err === null || err === void 0 ? void 0 : err.code) || (res === null || res === void 0 ? void 0 : res.code) || "unknown_error";
+        const errorMessage = (err === null || err === void 0 ? void 0 : err.message) || (res === null || res === void 0 ? void 0 : res.message) || "Unknown error";
+        const id = (res === null || res === void 0 ? void 0 : res.id) || (res === null || res === void 0 ? void 0 : res.request_id) || "";
+        const created = (_a = res === null || res === void 0 ? void 0 : res.created) !== null && _a !== void 0 ? _a : Math.floor(Date.now() / 1000);
+        return {
+            id,
+            object: "chat.completion",
+            created,
+            model: (_b = res === null || res === void 0 ? void 0 : res.model) !== null && _b !== void 0 ? _b : this.modelName,
+            log_id: id,
+            error: `[${errorCode}] ${errorMessage}`,
+            code: typeof (res === null || res === void 0 ? void 0 : res.code) === "number" ? res.code : -1,
+            choices: [
+                {
+                    index: 0,
+                    message: {
+                        id,
+                        role: "assistant",
+                        type: "error",
+                        content: `[${errorCode}] ${errorMessage}`,
+                        reasoning_content: "",
+                    },
+                    finish_reason: "error",
+                },
+            ],
+            usage: {
+                prompt_tokens: 0,
+                completion_tokens: 0,
+                knowledge_tokens: 0,
+                reasoning_tokens: 0,
+                total_tokens: 0,
+            },
+        };
+    }
+    isErrorResponse(obj) {
+        if ((obj === null || obj === void 0 ? void 0 : obj.error) && typeof obj.error === "object" && obj.error.code)
+            return true;
+        if ((obj === null || obj === void 0 ? void 0 : obj.error) && typeof obj.error === "string" && obj.error.length > 0 && !obj.choices)
+            return true;
+        if (typeof (obj === null || obj === void 0 ? void 0 : obj.code) === "number" && obj.code !== 0 && !obj.choices)
+            return true;
+        return false;
+    }
     doGenerate(data, options) {
         return __awaiter(this, void 0, void 0, function* () {
             const qwen3VlPlusData = this.convertToQwen3VlPlusRequestOptions(data);
             const requestData = Object.assign(Object.assign({}, qwen3VlPlusData), { stream: false });
             const res = yield this.modelRequest(requestData, options);
+            const resObj = res;
+            if (this.isErrorResponse(resObj)) {
+                return this.normalizeErrorResponse(resObj);
+            }
             return this.normalizeResponse(res);
         });
     }
@@ -92,7 +142,19 @@ class Qwen3VlPlus extends Chat_1.SimpleChatModel {
             const _stream = (yield this.modelRequest(requestData, options));
             const stream = (0, stream_1.toPolyfillReadable)(_stream);
             const standardStream = (0, stream_1.intoStandardStream)(stream);
-            return (0, stream_1.createAsyncIterable)(standardStream);
+            const self = this;
+            const errorNormalizingStream = standardStream.pipeThrough(new stream_1.TransformStream({
+                transform(chunk, controller) {
+                    const raw = chunk;
+                    if (self.isErrorResponse(raw)) {
+                        controller.enqueue(self.normalizeErrorResponse(raw));
+                    }
+                    else {
+                        controller.enqueue(chunk);
+                    }
+                },
+            }));
+            return (0, stream_1.createAsyncIterable)(errorNormalizingStream);
         });
     }
     convertToQwen3VlPlusRequestOptions(data) {
@@ -100,7 +162,9 @@ class Qwen3VlPlus extends Chat_1.SimpleChatModel {
         const clamp = (value, min, max, defaultValue) => value !== undefined ? Math.max(min, Math.min(max, value)) : defaultValue;
         const messages = (data.messages || []).map((msg) => ({
             role: msg.role,
-            content: Array.isArray(msg.content) ? (0, model_type_1.filterContentByTypes)(msg.content, ["text", "image_url"]) : msg.content,
+            content: Array.isArray(msg.content)
+                ? (0, model_type_1.filterContentByTypes)(msg.content, ["text", "image_url"])
+                : msg.content,
         }));
         return {
             model: this.modelName,

package/lib/models/QwenCosyVoiceTTS/index.d.ts ADDED Viewed

@@ -0,0 +1,8 @@
+import type { DoStreamSpeechOutput, TTSRequestOptions } from "../../model-type";
+import type { TokenManager } from "../../tokenManager";
+import { SimpleTTSModel } from "../TTSModel";
+import type { TTSModelName } from "../index";
+export declare class AliyunCosyVoiceTTSModel extends SimpleTTSModel {
+    constructor(tokenManager: TokenManager, modelName: TTSModelName);
+    doStreamSpeech(options: TTSRequestOptions): Promise<DoStreamSpeechOutput>;
+}

package/lib/models/QwenCosyVoiceTTS/index.js ADDED Viewed

@@ -0,0 +1,178 @@
+"use strict";
+var __awaiter = (this && this.__awaiter) || function (thisArg, _arguments, P, generator) {
+    function adopt(value) { return value instanceof P ? value : new P(function (resolve) { resolve(value); }); }
+    return new (P || (P = Promise))(function (resolve, reject) {
+        function fulfilled(value) { try { step(generator.next(value)); } catch (e) { reject(e); } }
+        function rejected(value) { try { step(generator["throw"](value)); } catch (e) { reject(e); } }
+        function step(result) { result.done ? resolve(result.value) : adopt(result.value).then(fulfilled, rejected); }
+        step((generator = generator.apply(thisArg, _arguments || [])).next());
+    });
+};
+var __importDefault = (this && this.__importDefault) || function (mod) {
+    return (mod && mod.__esModule) ? mod : { "default": mod };
+};
+Object.defineProperty(exports, "__esModule", { value: true });
+exports.AliyunCosyVoiceTTSModel = void 0;
+const node_crypto_1 = require("node:crypto");
+const ws_1 = __importDefault(require("ws"));
+const TTSModel_1 = require("../TTSModel");
+const DASHSCOPE_WSS_URL = "wss://dashscope.aliyuncs.com/api-ws/v1/inference/";
+class AliyunCosyVoiceTTSModel extends TTSModel_1.SimpleTTSModel {
+    constructor(tokenManager, modelName) {
+        super(tokenManager, modelName);
+    }
+    doStreamSpeech(options) {
+        return __awaiter(this, void 0, void 0, function* () {
+            console.log("[AliyunCosyVoiceTTS:doStreamSpeech] start, model:", this.modelName, "voice:", options.voice);
+            const token = yield this.getValidToken();
+            console.log("[AliyunCosyVoiceTTS:doStreamSpeech] token obtained:", token ? `${token.slice(0, 8)}...` : "(empty)");
+            const taskId = (0, node_crypto_1.randomUUID)().replace(/-/g, "");
+            console.log("[AliyunCosyVoiceTTS:doStreamSpeech] taskId:", taskId);
+            const modelName = this.modelName;
+            return new Promise((resolve, reject) => {
+                console.log("[AliyunCosyVoiceTTS:doStreamSpeech] connecting to WSS:", DASHSCOPE_WSS_URL);
+                const ws = new ws_1.default(DASHSCOPE_WSS_URL, {
+                    headers: { Authorization: `Bearer ${token}` },
+                });
+                let taskStarted = false;
+                let totalCharacters = 0;
+                let currentSentenceIndex = 0;
+                let currentOriginalText;
+                let pendingEvent = null;
+                const controller = new ReadableStream({
+                    start(streamController) {
+                        ws.on("open", () => {
+                            console.log("[AliyunCosyVoiceTTS] WebSocket opened, sending run-task...");
+                            ws.send(JSON.stringify({
+                                header: {
+                                    action: "run-task",
+                                    task_id: taskId,
+                                    streaming: "duplex",
+                                },
+                                payload: {
+                                    task_group: "audio",
+                                    task: "tts",
+                                    function: "SpeechSynthesizer",
+                                    model: modelName,
+                                    parameters: Object.assign(Object.assign(Object.assign(Object.assign(Object.assign(Object.assign(Object.assign({ text_type: "PlainText", voice: options.voice }, (options.format && { format: options.format })), (options.sampleRate && { sample_rate: options.sampleRate })), (options.volume != null && { volume: options.volume })), (options.rate != null && { rate: options.rate })), (options.pitch != null && { pitch: options.pitch })), (options.instruction && { instruction: options.instruction })), (options.languageHints && { language_hints: options.languageHints })),
+                                    input: {},
+                                },
+                            }));
+                        });
+                        ws.on("message", (data, isBinary) => {
+                            var _a, _b, _c, _d, _e, _f;
+                            console.log("[AliyunCosyVoiceTTS] ws.message received, isBinary:", isBinary, "size:", typeof data === "string" ? data.length : data.length);
+                            if (isBinary) {
+                                const audioBuffer = Buffer.isBuffer(data) ? data : Buffer.from(data);
+                                streamController.enqueue({
+                                    audio: audioBuffer,
+                                    event: pendingEvent !== null && pendingEvent !== void 0 ? pendingEvent : "sentence-synthesis",
+                                    sentence: Object.assign({ index: currentSentenceIndex }, (currentOriginalText && { originalText: currentOriginalText })),
+                                });
+                                pendingEvent = null;
+                                return;
+                            }
+                            const msgStr = typeof data === "string" ? data : data.toString();
+                            let event;
+                            try {
+                                event = JSON.parse(msgStr);
+                            }
+                            catch (_g) {
+                                return;
+                            }
+                            const { header, payload } = event;
+                            console.log("[AliyunCosyVoiceTTS] server event:", header.event, header.error_code ? `error: ${header.error_code}` : "");
+                            switch (header.event) {
+                                case "task-started":
+                                    console.log("[AliyunCosyVoiceTTS] task-started, will send text and finish...");
+                                    taskStarted = true;
+                                    sendTextAndFinish();
+                                    break;
+                                case "result-generated": {
+                                    const outputType = (_a = payload === null || payload === void 0 ? void 0 : payload.output) === null || _a === void 0 ? void 0 : _a.type;
+                                    if (!outputType)
+                                        break;
+                                    if ((_b = payload === null || payload === void 0 ? void 0 : payload.output) === null || _b === void 0 ? void 0 : _b.sentence) {
+                                        currentSentenceIndex = payload.output.sentence.index;
+                                    }
+                                    currentOriginalText = (_c = payload === null || payload === void 0 ? void 0 : payload.output) === null || _c === void 0 ? void 0 : _c.original_text;
+                                    if (outputType === "sentence-synthesis") {
+                                        pendingEvent = "sentence-synthesis";
+                                    }
+                                    else {
+                                        streamController.enqueue({
+                                            audio: Buffer.alloc(0),
+                                            event: outputType,
+                                            sentence: Object.assign({ index: currentSentenceIndex }, (currentOriginalText && { originalText: currentOriginalText })),
+                                        });
+                                    }
+                                    if ((_d = payload === null || payload === void 0 ? void 0 : payload.usage) === null || _d === void 0 ? void 0 : _d.characters) {
+                                        totalCharacters = payload.usage.characters;
+                                    }
+                                    break;
+                                }
+                                case "task-finished":
+                                    console.log("[AliyunCosyVoiceTTS] task-finished, characters:", (_e = payload === null || payload === void 0 ? void 0 : payload.usage) === null || _e === void 0 ? void 0 : _e.characters);
+                                    if ((_f = payload === null || payload === void 0 ? void 0 : payload.usage) === null || _f === void 0 ? void 0 : _f.characters) {
+                                        totalCharacters = payload.usage.characters;
+                                    }
+                                    streamController.close();
+                                    ws.close();
+                                    break;
+                                case "task-failed":
+                                    console.error("[AliyunCosyVoiceTTS] task-failed:", header.error_code, header.error_message);
+                                    streamController.error(new Error(`TTS task failed: [${header.error_code}] ${header.error_message}`));
+                                    ws.close();
+                                    break;
+                            }
+                        });
+                        ws.on("error", (err) => {
+                            console.error("[AliyunCosyVoiceTTS] ws.error:", err.message);
+                            try {
+                                streamController.error(err);
+                            }
+                            catch (_a) {
+                            }
+                        });
+                        ws.on("close", (code, reason) => {
+                            console.log("[AliyunCosyVoiceTTS] ws.close, code:", code, "reason:", reason === null || reason === void 0 ? void 0 : reason.toString());
+                            try {
+                                streamController.close();
+                            }
+                            catch (_a) {
+                            }
+                        });
+                        function sendTextAndFinish() {
+                            if (!taskStarted)
+                                return;
+                            console.log("[AliyunCosyVoiceTTS] sendTextAndFinish, text length:", options.text.length);
+                            ws.send(JSON.stringify({
+                                header: {
+                                    action: "continue-task",
+                                    task_id: taskId,
+                                    streaming: "duplex",
+                                },
+                                payload: {
+                                    input: { text: options.text },
+                                },
+                            }));
+                            ws.send(JSON.stringify({
+                                header: {
+                                    action: "finish-task",
+                                    task_id: taskId,
+                                    streaming: "duplex",
+                                },
+                                payload: {
+                                    input: {},
+                                },
+                            }));
+                        }
+                    },
+                });
+                const asyncIterableStream = this.createAsyncIterable(controller);
+                resolve(asyncIterableStream);
+            });
+        });
+    }
+}
+exports.AliyunCosyVoiceTTSModel = AliyunCosyVoiceTTSModel;

package/lib/models/QwenDocTurbo/adapters/DashScope.d.ts CHANGED Viewed

@@ -21,5 +21,7 @@ export declare class DashScopeApi implements QwenDocTurboApi {
     buildPayload(data: ModelRequestOptions, stream: boolean): QwenDocTurboAPIInput;
     request(payload: QwenDocTurboAPIInput, options?: ReqOptions): Promise<ReadableStream<Uint8Array> | unknown>;
     normalizeResponse(response: QwenDocTurboResponse): DoGenerateOutput;
+    private isErrorResponse;
+    private normalizeErrorResponse;
     normalizeStream(_stream: ReadableStream<Uint8Array>): ReadableStream<BaseDoStreamOutputChunk>;
 }