@amaster.ai/tts-client 1.0.0-alpha.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/LICENSE ADDED
@@ -0,0 +1,21 @@
1
+ MIT License
2
+
3
+ Copyright (c) 2026 Amaster Team
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining a copy
6
+ of this software and associated documentation files (the "Software"), to deal
7
+ in the Software without restriction, including without limitation the rights
8
+ to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9
+ copies of the Software, and to permit persons to whom the Software is
10
+ furnished to do so, subject to the following conditions:
11
+
12
+ The above copyright notice and this permission notice shall be included in all
13
+ copies or substantial portions of the Software.
14
+
15
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
+ IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
+ FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18
+ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
+ LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20
+ OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21
+ SOFTWARE.
package/README.md ADDED
@@ -0,0 +1,270 @@
1
+ # TTS Realtime WebSocket Client SDK
2
+
3
+ 基于 WebSocket 的实时文本转语音(TTS)客户端 SDK,用于对接 `qwen-tts` 实时语音合成服务,支持流式音频返回与自动播放。
4
+
5
+ ---
6
+
7
+ ## 特性
8
+
9
+ - 🔊 WebSocket 实时 TTS
10
+ - 🎵 支持多种音频格式(`pcm` / `mp3` / `wav` / `opus`)
11
+ - ▶️ 支持自动播放或手动播放
12
+ - 📦 支持音频流分片回调
13
+ - 🎧 浏览器原生 `AudioContext` 播放(PCM)
14
+ - 🎭 多种音色可选
15
+
16
+ ---
17
+
18
+ ## 安装
19
+
20
+ ```bash
21
+ # npm
22
+ npm install @amaster.ai/tts-client
23
+
24
+ # pnpm
25
+ pnpm add @amaster.ai/tts-client
26
+
27
+ # yarn
28
+ yarn add @amaster.ai/tts-client
29
+ ```
30
+
31
+ ---
32
+
33
+ ## 快速开始
34
+
35
+ ### 基础用法
36
+
37
+ ```ts
38
+ import { createTTSClient } from "@amaster.ai/tts-client";
39
+
40
+ const tts = createTTSClient({})({ // createTTSClient 是工厂函数:先传入认证配置(可含 getAccessToken),返回的函数再接收客户端配置
41
+ voice: "Cherry",
42
+ autoPlay: true,
43
+ audioFormat: "pcm",
44
+ sampleRate: 24000,
45
+ onReady() {
46
+ console.log("TTS 已就绪");
47
+ },
48
+ onAudioStart() {
49
+ console.log("开始播放");
50
+ },
51
+ onAudioEnd() {
52
+ console.log("播放结束");
53
+ },
54
+ onAudioChunk(chunks) {
55
+ console.log("收到音频片段:", chunks.length);
56
+ },
57
+ onError(err) {
58
+ console.error("TTS 错误:", err);
59
+ },
60
+ });
61
+
62
+ // 建立连接
63
+ await tts.connect();
64
+
65
+ // 合成并播放语音
66
+ await tts.speak("你好,欢迎使用实时语音合成服务。");
67
+
68
+ // 关闭连接
69
+ // tts.close();
70
+ ```
71
+
72
+ ---
73
+
74
+ ### React 完整示例
75
+
76
+ ```tsx
77
+ import { useRef, useState } from "react";
78
+ import { createTTSClient, type TTSClient } from "@amaster.ai/tts-client";
79
+
80
+ const VoiceTypes = {
81
+ Cherry: "Cherry - 甜美女声",
82
+ Serena: "苏瑶 - 温柔小姐姐",
83
+ Ethan: "晨煦 - 标准普通话",
84
+ Chelsie: "千雪 - 二次元虚拟女友",
85
+ Peter: "天津话",
86
+ };
87
+
88
+ function TTSPlayer() {
89
+ const [voice, setVoice] = useState("Cherry");
90
+ const [connected, setConnected] = useState(false);
91
+ const [status, setStatus] = useState("disconnected");
92
+ const [text, setText] = useState("你好,欢迎使用通义千问实时语音合成服务。");
93
+ const clientRef = useRef<TTSClient | null>(null);
94
+
95
+ const connectTTS = () => {
96
+ if (clientRef.current) return;
97
+
98
+ const ttsClient = createTTSClient({})({ // 先传入认证配置(可含 getAccessToken),再传入客户端配置
99
+ voice,
100
+ autoPlay: true,
101
+ audioFormat: "pcm",
102
+ sampleRate: 24000,
103
+ onReady: () => {
104
+ setConnected(true);
105
+ setStatus("connected");
106
+ },
107
+ onAudioStart: () => setStatus("playing"),
108
+ onAudioEnd: () => setStatus("connected"),
109
+ onAudioChunk: (chunks) => {
110
+ console.log("音频片段数:", chunks.length);
111
+ },
112
+ onError: (err) => {
113
+ console.error("TTS Error:", err);
114
+ setStatus("error");
115
+ setConnected(false);
116
+ },
117
+ });
118
+
119
+ ttsClient.connect();
120
+ clientRef.current = ttsClient;
121
+ };
122
+
123
+ const sendTTS = () => {
124
+ if (!text || !clientRef.current) return;
125
+ clientRef.current.speak(text);
126
+ };
127
+
128
+ const disconnectTTS = () => {
129
+ clientRef.current?.close();
130
+ clientRef.current = null;
131
+ setConnected(false);
132
+ setStatus("disconnected");
133
+ };
134
+
135
+ return (
136
+ <div>
137
+ <h3>🔊 实时语音合成(TTS)</h3>
138
+
139
+ <div>状态: {status}</div>
140
+
141
+ <div>
142
+ <label>音色:</label>
143
+ <select value={voice} onChange={(e) => setVoice(e.target.value)}>
144
+ {Object.entries(VoiceTypes).map(([key, label]) => (
145
+ <option key={key} value={key}>
146
+ {label}
147
+ </option>
148
+ ))}
149
+ </select>
150
+ </div>
151
+
152
+ <div>
153
+ <label>合成文本:</label>
154
+ <textarea rows={4} value={text} onChange={(e) => setText(e.target.value)} />
155
+ </div>
156
+
157
+ <div>
158
+ <button onClick={connectTTS} disabled={connected}>
159
+ 1. 连接
160
+ </button>
161
+ <button onClick={sendTTS} disabled={!connected}>
162
+ 2. 合成语音
163
+ </button>
164
+ <button onClick={disconnectTTS} disabled={!connected}>
165
+ 断开
166
+ </button>
167
+ </div>
168
+ </div>
169
+ );
170
+ }
171
+ ```
172
+
173
+ ---
174
+
175
+ ## API 说明
176
+
177
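+ ### `createTTSClient(authConfig)(config)`
178
+
179
+ `createTTSClient(authConfig)` 接收认证配置(仅 `getAccessToken`,可传 `{}`),返回一个工厂函数;再以 `TTSClientConfig` 调用该函数即可创建一个 TTS 客户端实例。两份配置会合并,`config` 中的同名字段优先。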
180
+
181
+ #### `TTSClientConfig`
182
+
183
+ | 参数 | 类型 | 默认值 | 说明 |
184
+ | ---------------- | ----------------------------------- | ---------- | ---------------------------------------------------------------------- |
185
+ | `voice` | `string` | `"Cherry"` | 发音人名称,可选值:`Cherry`, `Serena`, `Ethan`, `Chelsie`, `Peter` 等 |
186
+ | `autoPlay` | `boolean` | `true` | 是否在音频接收完成后自动播放 |
187
+ | `audioFormat` | `"pcm" \| "mp3" \| "wav" \| "opus"` | `"pcm"` | 音频格式,**注意:内置播放仅支持 `pcm`** |
188
+ | `sampleRate` | `number` | `24000` | 采样率 |
189
+ | `getAccessToken` | `() => string \| null` | - | 获取访问令牌(用于 WebSocket 认证) |
190
+ | `onReady` | `() => void` | - | 会话初始化完成回调 |
191
+ | `onAudioStart` | `() => void` | - | 音频开始播放回调 |
192
+ | `onAudioEnd` | `() => void` | - | 音频播放结束回调 |
193
+ | `onAudioChunk` | `(chunks: string[]) => void` | - | 每收到一个音频分片以及音频接收完成时触发,参数为当前已累积的全部 base64 分片 |
194
+ | `onError` | `(error: Error) => void` | - | 错误回调 |
195
+
196
+ #### `TTSClient`
197
+
198
+ ```ts
199
+ interface TTSClient {
200
+ connect(): Promise<void>; // 建立 WebSocket 连接
201
+ speak(text: string): Promise<void>; // 发送文本进行语音合成
202
+ play(): void; // 手动播放(autoPlay=false 时使用)
203
+ close(): void; // 关闭连接并释放资源
204
+ }
205
+ ```
206
+
207
+ ---
208
+
209
+ ## 配合统一客户端使用
210
+
211
+ 推荐与 `@amaster.ai/client` 统一客户端一起使用,自动处理认证:
212
+
213
+ ```tsx
214
+ import { createClient } from "@amaster.ai/client";
215
+
216
+ const client = createClient({
217
+ baseURL: "https://api.amaster.ai",
218
+ });
219
+
220
+ const ttsClient = client.tts({
221
+ voice: "Cherry",
222
+ autoPlay: true,
223
+ onReady() {
224
+ console.log("TTS 已就绪");
225
+ },
226
+ onAudioStart() {
227
+ console.log("开始播放");
228
+ },
229
+ onAudioEnd() {
230
+ console.log("播放结束");
231
+ },
232
+ });
233
+
234
+ await ttsClient.connect();
235
+ await ttsClient.speak("你好,欢迎使用 Amaster AI!");
236
+ ```
237
+
238
+ ---
239
+
240
+ ## 音频说明
241
+
242
+ - 当前内置播放逻辑 **仅支持 `pcm` 格式**
243
+ - `pcm` 数据为 **16-bit little-endian 单声道**
244
+ - 播放基于 `AudioContext`,仅支持浏览器环境
245
+ - 若使用 `mp3 / wav / opus`,需自行实现解码与播放逻辑
246
+
247
+ ---
248
+
249
+ ## 运行环境
250
+
251
+ - 浏览器(Chrome / Edge / Safari)
252
+ - 需支持:
253
+ - WebSocket
254
+ - AudioContext
255
+ - atob
256
+
257
+ ---
258
+
259
+ ## 注意事项
260
+
261
+ - 必须在 `connect()` 成功后才能调用 `speak()`;连接未建立时调用 `speak()` 会抛出 `WebSocket not connected` 错误
262
+ - 多次 `speak()` 会覆盖之前的音频缓存
263
+ - 自动播放依赖浏览器的自动播放策略,部分场景可能需要用户交互触发
264
+ - 建议在组件卸载时调用 `close()` 释放资源
265
+
266
+ ---
267
+
268
+ ## License
269
+
270
+ MIT
package/dist/index.cjs ADDED
@@ -0,0 +1,193 @@
1
+ "use strict";
2
+ var __defProp = Object.defineProperty;
3
+ var __getOwnPropDesc = Object.getOwnPropertyDescriptor;
4
+ var __getOwnPropNames = Object.getOwnPropertyNames;
5
+ var __hasOwnProp = Object.prototype.hasOwnProperty;
6
+ var __export = (target, all) => {
7
+ for (var name in all)
8
+ __defProp(target, name, { get: all[name], enumerable: true });
9
+ };
10
+ var __copyProps = (to, from, except, desc) => {
11
+ if (from && typeof from === "object" || typeof from === "function") {
12
+ for (let key of __getOwnPropNames(from))
13
+ if (!__hasOwnProp.call(to, key) && key !== except)
14
+ __defProp(to, key, { get: () => from[key], enumerable: !(desc = __getOwnPropDesc(from, key)) || desc.enumerable });
15
+ }
16
+ return to;
17
+ };
18
+ var __toCommonJS = (mod) => __copyProps(__defProp({}, "__esModule", { value: true }), mod);
19
+
20
+ // src/index.ts
21
+ var index_exports = {};
22
+ __export(index_exports, {
23
+ createTTSClient: () => tts_client_default
24
+ });
25
+ module.exports = __toCommonJS(index_exports);
26
+
27
+ // src/tts-client.ts
28
var TTS_PATH = "/api/proxy/builtin/platform/qwen-tts/api-ws/v1/realtime";

/**
 * Creates a realtime text-to-speech client on top of a browser WebSocket.
 *
 * The client performs the session handshake (`session.created` ->
 * `session.update` -> `session.updated`), buffers the base64 audio deltas of
 * the current response and can play them through an `AudioContext`.
 * Built-in playback decodes 16-bit little-endian mono PCM only.
 *
 * @param config Client options: `getAccessToken`, `voice` (default "Cherry"),
 *   `autoPlay` (default true), `audioFormat` (default "pcm"), `sampleRate`
 *   (default 24000) and the `onReady` / `onAudioStart` / `onAudioEnd` /
 *   `onAudioChunk` / `onError` callbacks.
 * @returns An object exposing `connect`, `speak`, `play` and `close`.
 */
function createTTSClient(config) {
  const {
    getAccessToken,
    voice = "Cherry",
    autoPlay = true,
    audioFormat = "pcm",
    sampleRate = 24e3,
    onReady,
    onAudioStart,
    onAudioEnd,
    onAudioChunk,
    onError
  } = config;
  let ws = null;
  let audioChunks = [];
  let audioContext = null;

  /** Normalizes anything thrown into an Error so `onError` always receives one. */
  const toError = (value) => value instanceof Error ? value : new Error(String(value));

  /** Decodes one base64 chunk into its raw bytes. */
  const decodeChunk = (chunk) => {
    const binary = atob(chunk);
    const bytes = new Uint8Array(binary.length);
    for (let i = 0; i < binary.length; i++) {
      bytes[i] = binary.charCodeAt(i);
    }
    return bytes;
  };

  /**
   * Opens the WebSocket and negotiates the session.
   *
   * @returns A promise that resolves once the server answers with
   *   `session.updated`, and rejects on a socket error, a server `error`
   *   message, or when the socket closes before the session is ready.
   */
  async function connect() {
    return new Promise((resolve, reject) => {
      let wsUrl = TTS_PATH;
      if (getAccessToken) {
        const token = getAccessToken();
        if (token) {
          const separator = wsUrl.includes("?") ? "&" : "?";
          wsUrl = `${wsUrl}${separator}token=${encodeURIComponent(token)}`;
        }
      }
      // Handlers close over `socket`, not the shared `ws`, so a late event from
      // this socket can never touch a newer connection or a nulled reference.
      const socket = new WebSocket(wsUrl);
      ws = socket;
      let settled = false;
      const fail = (err) => {
        onError?.(err);
        if (!settled) {
          settled = true;
          reject(err);
        }
      };
      socket.onopen = () => {
      };
      socket.onmessage = (event) => {
        let data;
        try {
          data = JSON.parse(event.data);
        } catch (err) {
          // A non-JSON frame must not escape as an uncaught exception.
          onError?.(new Error("Received a malformed message from the TTS service"));
          return;
        }
        if (!data || typeof data !== "object") return;
        switch (data.type) {
          case "session.created":
            socket.send(
              JSON.stringify({
                type: "session.update",
                session: {
                  mode: "server_commit",
                  voice,
                  response_format: audioFormat,
                  sample_rate: sampleRate
                }
              })
            );
            break;
          case "session.updated":
            settled = true;
            onReady?.();
            resolve();
            break;
          case "response.audio.delta":
            if (typeof data.delta === "string") {
              audioChunks.push(data.delta);
              onAudioChunk?.(audioChunks);
            }
            break;
          case "response.audio.done":
            onAudioChunk?.(audioChunks);
            // Only PCM can be decoded by the built-in player; other formats are
            // delivered through onAudioChunk for the caller to decode.
            if (autoPlay && audioFormat === "pcm" && typeof window !== "undefined") {
              playAudio();
            }
            break;
          case "response.done":
            // NOTE(review): this ends the session after the first response, so a
            // later speak() may find the socket closed — confirm against the
            // service protocol.
            socket.send(JSON.stringify({ type: "session.finish" }));
            break;
          case "error":
            fail(new Error(data.error?.message || "Unknown error"));
            break;
          default:
            break;
        }
      };
      socket.onerror = () => {
        fail(new Error("WebSocket connection error"));
      };
      socket.onclose = () => {
        // Do not clobber a newer socket created by a later connect().
        if (ws === socket) {
          ws = null;
        }
        // Without this the promise would stay pending forever when the server
        // (or close()) shuts the socket before the session is ready.
        if (!settled) {
          fail(new Error("WebSocket closed before the session was ready"));
        }
      };
    });
  }

  /**
   * Sends text for synthesis and clears the audio buffered from the previous
   * response.
   *
   * @param text Text to synthesize.
   * @throws Error "WebSocket not connected" when the socket is not open
   *   (surfaced as a rejected promise).
   */
  async function speak(text) {
    const socket = ws;
    if (!socket || socket.readyState !== WebSocket.OPEN) {
      throw new Error("WebSocket not connected");
    }
    audioChunks = [];
    socket.send(
      JSON.stringify({
        type: "input_text_buffer.append",
        text
      })
    );
    setTimeout(() => {
      // The socket may have been closed during the delay; the captured
      // reference plus the state check keeps the timer from throwing.
      if (socket.readyState === WebSocket.OPEN) {
        socket.send(
          JSON.stringify({
            type: "input_text_buffer.commit"
          })
        );
      }
    }, 100);
  }

  /**
   * Plays the buffered chunks as 16-bit little-endian mono PCM.
   * Does nothing outside a browser or when no complete sample is buffered;
   * reports unsupported formats and decoding failures through `onError`.
   */
  function playAudio() {
    const chunks = audioChunks;
    if (typeof window === "undefined") return;
    if (audioFormat !== "pcm") {
      onError?.(new Error(`Built-in playback only supports "pcm" audio, got "${audioFormat}"`));
      return;
    }
    try {
      const parts = chunks.map(decodeChunk);
      const totalBytes = parts.reduce((sum, bytes) => sum + bytes.length, 0);
      // A trailing odd byte cannot form a sample; dropping it avoids reading
      // past the end of the buffer.
      const numSamples = Math.floor(totalBytes / 2);
      if (numSamples === 0) return;
      const combined = new Uint8Array(totalBytes);
      let offset = 0;
      for (const bytes of parts) {
        combined.set(bytes, offset);
        offset += bytes.length;
      }
      if (!audioContext) {
        audioContext = new AudioContext();
      }
      const audioBuffer = audioContext.createBuffer(1, numSamples, sampleRate);
      const channelData = audioBuffer.getChannelData(0);
      const dataView = new DataView(combined.buffer);
      for (let i = 0; i < numSamples; i++) {
        channelData[i] = dataView.getInt16(i * 2, true) / 32768;
      }
      const source = audioContext.createBufferSource();
      source.buffer = audioBuffer;
      source.connect(audioContext.destination);
      source.onended = () => onAudioEnd?.();
      // Announce playback only once decoding succeeded, so every start can be
      // followed by an end.
      onAudioStart?.();
      source.start(0);
    } catch (err) {
      onError?.(toError(err));
    }
  }

  /** Closes the WebSocket and releases the AudioContext, if any. */
  function close() {
    if (ws) {
      ws.close();
      ws = null;
    }
    if (audioContext) {
      const context = audioContext;
      audioContext = null;
      // close() returns a promise; swallow a late rejection instead of leaving
      // it unhandled.
      Promise.resolve(context.close()).catch(() => {
      });
    }
  }
  return {
    connect,
    speak,
    close,
    play: playAudio
  };
}
184
/**
 * Public `createTTSClient` export: binds shared auth settings first and
 * returns a factory that builds a client from per-client options.
 * Per-client options override auth settings that share a key.
 */
var tts_client_default = (authConfig) => (config) => createTTSClient({ ...authConfig, ...config });
189
+ // Annotate the CommonJS export names for ESM import in node:
190
+ 0 && (module.exports = {
191
+ createTTSClient
192
+ });
193
+ //# sourceMappingURL=index.cjs.map
@@ -0,0 +1 @@
1
+ {"version":3,"sources":["../src/index.ts","../src/tts-client.ts"],"sourcesContent":["import type { TTSClient, TTSClientConfig } from \"./tts-client\";\nimport createTTSClient from \"./tts-client\";\nexport { createTTSClient, type TTSClient, type TTSClientConfig };\n","/**\n * TTS Realtime WebSocket Client\n *\n * WebSocket-based real-time text-to-speech synthesis with multiple voice options.\n * Built-in playback only supports PCM format.\n *\n * @example\n * ```typescript\n * const client = createTTSClient({\n * voice: \"Cherry\",\n * autoPlay: true,\n * onReady() {\n * console.log(\"TTS ready\");\n * },\n * onAudioStart() {\n * console.log(\"Playing audio\");\n * },\n * onAudioEnd() {\n * console.log(\"Playback ended\");\n * },\n * });\n *\n * await client.connect();\n * await client.speak(\"Hello, this is a test.\");\n * // client.close();\n * ```\n */\n\nconst TTS_PATH = \"/api/proxy/builtin/platform/qwen-tts/api-ws/v1/realtime\";\n\nexport interface TTSClientConfig {\n /** Get access token for WebSocket authentication */\n getAccessToken?: () => string | null;\n /** Voice name, default 'Cherry' */\n voice?: string;\n /** Auto play audio, default true */\n autoPlay?: boolean;\n /** Audio format, default 'pcm' */\n audioFormat?: \"pcm\" | \"mp3\" | \"wav\" | \"opus\";\n /** Sample rate, default 24000 */\n sampleRate?: number;\n /** Called when connection is ready */\n onReady?: () => void;\n /** Called when audio playback starts */\n onAudioStart?: () => void;\n /** Called when audio playback ends */\n onAudioEnd?: () => void;\n /** Called on each audio chunk received */\n onAudioChunk?: (chunk: string[]) => void;\n /** Called on error */\n onError?: (error: Error) => void;\n}\n\nexport interface TTSClient {\n /** Connect to TTS service */\n connect(): Promise<void>;\n /** Synthesize speech from text */\n speak(text: string): Promise<void>;\n /** Play audio from chunks */\n play(): void;\n /** Close connection */\n close(): void;\n}\n\nfunction 
createTTSClient(config: TTSClientConfig): TTSClient {\n const {\n getAccessToken,\n voice = \"Cherry\",\n autoPlay = true,\n audioFormat = \"pcm\",\n sampleRate = 24000,\n onReady,\n onAudioStart,\n onAudioEnd,\n onAudioChunk,\n onError,\n } = config;\n\n let ws: WebSocket | null = null;\n let audioChunks: string[] = [];\n let audioContext: AudioContext | null = null;\n\n async function connect(): Promise<void> {\n return new Promise((resolve, reject) => {\n // Build WebSocket URL with optional token parameter\n let wsUrl = TTS_PATH;\n if (getAccessToken) {\n const token = getAccessToken();\n if (token) {\n const separator = wsUrl.includes(\"?\") ? \"&\" : \"?\";\n wsUrl = `${wsUrl}${separator}token=${encodeURIComponent(token)}`;\n }\n }\n\n ws = new WebSocket(wsUrl);\n\n ws.onopen = () => {};\n\n ws.onmessage = (event) => {\n const data = JSON.parse(event.data);\n\n if (data.type === \"session.created\") {\n ws!.send(\n JSON.stringify({\n type: \"session.update\",\n session: {\n mode: \"server_commit\",\n voice,\n response_format: audioFormat,\n sample_rate: sampleRate,\n },\n })\n );\n }\n\n if (data.type === \"session.updated\") {\n onReady?.();\n resolve();\n }\n\n if (data.type === \"response.audio.delta\") {\n audioChunks.push(data.delta);\n onAudioChunk?.(audioChunks);\n }\n\n if (data.type === \"response.audio.done\") {\n onAudioChunk?.(audioChunks);\n if (autoPlay && typeof window !== \"undefined\") {\n playAudio();\n }\n }\n\n if (data.type === \"response.done\") {\n ws!.send(JSON.stringify({ type: \"session.finish\" }));\n }\n\n if (data.type === \"error\") {\n const err = new Error(data.error?.message || \"Unknown error\");\n onError?.(err);\n reject(err);\n }\n };\n\n ws.onerror = () => {\n const err = new Error(\"WebSocket connection error\");\n onError?.(err);\n reject(err);\n };\n\n ws.onclose = () => {\n ws = null;\n };\n });\n }\n\n async function speak(text: string): Promise<void> {\n if (!ws || ws.readyState !== WebSocket.OPEN) {\n throw new 
Error(\"WebSocket not connected\");\n }\n\n audioChunks = [];\n\n ws.send(\n JSON.stringify({\n type: \"input_text_buffer.append\",\n text,\n })\n );\n\n setTimeout(() => {\n ws!.send(\n JSON.stringify({\n type: \"input_text_buffer.commit\",\n })\n );\n }, 100);\n }\n\n function playAudio() {\n let chunks: string[] = audioChunks;\n if (typeof window === \"undefined\") return;\n\n try {\n if (!audioContext) {\n audioContext = new AudioContext();\n }\n\n onAudioStart?.();\n\n let totalBytes = 0;\n const allBytes: Uint8Array[] = [];\n\n for (const chunk of chunks) {\n const binaryString = atob(chunk);\n const bytes = new Uint8Array(binaryString.length);\n for (let i = 0; i < binaryString.length; i++) {\n bytes[i] = binaryString.charCodeAt(i);\n }\n allBytes.push(bytes);\n totalBytes += bytes.length;\n }\n\n const combined = new Uint8Array(totalBytes);\n let offset = 0;\n for (const bytes of allBytes) {\n combined.set(bytes, offset);\n offset += bytes.length;\n }\n\n const numSamples = combined.length / 2;\n const audioBuffer = audioContext.createBuffer(1, numSamples, sampleRate);\n const channelData = audioBuffer.getChannelData(0);\n\n const dataView = new DataView(combined.buffer);\n for (let i = 0; i < numSamples; i++) {\n const int16 = dataView.getInt16(i * 2, true);\n channelData[i] = int16 / 32768.0;\n }\n\n const source = audioContext.createBufferSource();\n source.buffer = audioBuffer;\n source.connect(audioContext.destination);\n source.onended = () => onAudioEnd?.();\n source.start(0);\n } catch (err) {\n onError?.(err as Error);\n }\n }\n\n function close() {\n if (ws) {\n ws.close();\n ws = null;\n }\n if (audioContext) {\n audioContext.close();\n audioContext = null;\n }\n }\n\n return {\n connect,\n speak,\n close,\n play: playAudio,\n };\n}\n\nexport default (\n authConfig: Pick<TTSClientConfig, \"getAccessToken\">\n): ((config: TTSClientConfig) => TTSClient) => {\n return (config: TTSClientConfig) => {\n return createTTSClient({ ...authConfig, ...config 
});\n };\n};\n"],"mappings":";;;;;;;;;;;;;;;;;;;;AAAA;AAAA;AAAA;AAAA;AAAA;;;AC4BA,IAAM,WAAW;AAoCjB,SAAS,gBAAgB,QAAoC;AAC3D,QAAM;AAAA,IACJ;AAAA,IACA,QAAQ;AAAA,IACR,WAAW;AAAA,IACX,cAAc;AAAA,IACd,aAAa;AAAA,IACb;AAAA,IACA;AAAA,IACA;AAAA,IACA;AAAA,IACA;AAAA,EACF,IAAI;AAEJ,MAAI,KAAuB;AAC3B,MAAI,cAAwB,CAAC;AAC7B,MAAI,eAAoC;AAExC,iBAAe,UAAyB;AACtC,WAAO,IAAI,QAAQ,CAAC,SAAS,WAAW;AAEtC,UAAI,QAAQ;AACZ,UAAI,gBAAgB;AAClB,cAAM,QAAQ,eAAe;AAC7B,YAAI,OAAO;AACT,gBAAM,YAAY,MAAM,SAAS,GAAG,IAAI,MAAM;AAC9C,kBAAQ,GAAG,KAAK,GAAG,SAAS,SAAS,mBAAmB,KAAK,CAAC;AAAA,QAChE;AAAA,MACF;AAEA,WAAK,IAAI,UAAU,KAAK;AAExB,SAAG,SAAS,MAAM;AAAA,MAAC;AAEnB,SAAG,YAAY,CAAC,UAAU;AACxB,cAAM,OAAO,KAAK,MAAM,MAAM,IAAI;AAElC,YAAI,KAAK,SAAS,mBAAmB;AACnC,aAAI;AAAA,YACF,KAAK,UAAU;AAAA,cACb,MAAM;AAAA,cACN,SAAS;AAAA,gBACP,MAAM;AAAA,gBACN;AAAA,gBACA,iBAAiB;AAAA,gBACjB,aAAa;AAAA,cACf;AAAA,YACF,CAAC;AAAA,UACH;AAAA,QACF;AAEA,YAAI,KAAK,SAAS,mBAAmB;AACnC,oBAAU;AACV,kBAAQ;AAAA,QACV;AAEA,YAAI,KAAK,SAAS,wBAAwB;AACxC,sBAAY,KAAK,KAAK,KAAK;AAC3B,yBAAe,WAAW;AAAA,QAC5B;AAEA,YAAI,KAAK,SAAS,uBAAuB;AACvC,yBAAe,WAAW;AAC1B,cAAI,YAAY,OAAO,WAAW,aAAa;AAC7C,sBAAU;AAAA,UACZ;AAAA,QACF;AAEA,YAAI,KAAK,SAAS,iBAAiB;AACjC,aAAI,KAAK,KAAK,UAAU,EAAE,MAAM,iBAAiB,CAAC,CAAC;AAAA,QACrD;AAEA,YAAI,KAAK,SAAS,SAAS;AACzB,gBAAM,MAAM,IAAI,MAAM,KAAK,OAAO,WAAW,eAAe;AAC5D,oBAAU,GAAG;AACb,iBAAO,GAAG;AAAA,QACZ;AAAA,MACF;AAEA,SAAG,UAAU,MAAM;AACjB,cAAM,MAAM,IAAI,MAAM,4BAA4B;AAClD,kBAAU,GAAG;AACb,eAAO,GAAG;AAAA,MACZ;AAEA,SAAG,UAAU,MAAM;AACjB,aAAK;AAAA,MACP;AAAA,IACF,CAAC;AAAA,EACH;AAEA,iBAAe,MAAM,MAA6B;AAChD,QAAI,CAAC,MAAM,GAAG,eAAe,UAAU,MAAM;AAC3C,YAAM,IAAI,MAAM,yBAAyB;AAAA,IAC3C;AAEA,kBAAc,CAAC;AAEf,OAAG;AAAA,MACD,KAAK,UAAU;AAAA,QACb,MAAM;AAAA,QACN;AAAA,MACF,CAAC;AAAA,IACH;AAEA,eAAW,MAAM;AACf,SAAI;AAAA,QACF,KAAK,UAAU;AAAA,UACb,MAAM;AAAA,QACR,CAAC;AAAA,MACH;AAAA,IACF,GAAG,GAAG;AAAA,EACR;AAEA,WAAS,YAAY;AACnB,QAAI,SAAmB;AACvB,QAAI,OAAO,WAAW,YAAa;AAEnC,QAAI;AACF,UAAI,CAAC,cAAc;AACjB,uBAAe,IAAI,aAAa;AAAA,MAClC;AAEA,qBAAe;AAEf,UAAI,aAAa;AACjB,YAAM,WAAyB,CAAC;AAEhC,iBAAW,SAAS,QA
AQ;AAC1B,cAAM,eAAe,KAAK,KAAK;AAC/B,cAAM,QAAQ,IAAI,WAAW,aAAa,MAAM;AAChD,iBAAS,IAAI,GAAG,IAAI,aAAa,QAAQ,KAAK;AAC5C,gBAAM,CAAC,IAAI,aAAa,WAAW,CAAC;AAAA,QACtC;AACA,iBAAS,KAAK,KAAK;AACnB,sBAAc,MAAM;AAAA,MACtB;AAEA,YAAM,WAAW,IAAI,WAAW,UAAU;AAC1C,UAAI,SAAS;AACb,iBAAW,SAAS,UAAU;AAC5B,iBAAS,IAAI,OAAO,MAAM;AAC1B,kBAAU,MAAM;AAAA,MAClB;AAEA,YAAM,aAAa,SAAS,SAAS;AACrC,YAAM,cAAc,aAAa,aAAa,GAAG,YAAY,UAAU;AACvE,YAAM,cAAc,YAAY,eAAe,CAAC;AAEhD,YAAM,WAAW,IAAI,SAAS,SAAS,MAAM;AAC7C,eAAS,IAAI,GAAG,IAAI,YAAY,KAAK;AACnC,cAAM,QAAQ,SAAS,SAAS,IAAI,GAAG,IAAI;AAC3C,oBAAY,CAAC,IAAI,QAAQ;AAAA,MAC3B;AAEA,YAAM,SAAS,aAAa,mBAAmB;AAC/C,aAAO,SAAS;AAChB,aAAO,QAAQ,aAAa,WAAW;AACvC,aAAO,UAAU,MAAM,aAAa;AACpC,aAAO,MAAM,CAAC;AAAA,IAChB,SAAS,KAAK;AACZ,gBAAU,GAAY;AAAA,IACxB;AAAA,EACF;AAEA,WAAS,QAAQ;AACf,QAAI,IAAI;AACN,SAAG,MAAM;AACT,WAAK;AAAA,IACP;AACA,QAAI,cAAc;AAChB,mBAAa,MAAM;AACnB,qBAAe;AAAA,IACjB;AAAA,EACF;AAEA,SAAO;AAAA,IACL;AAAA,IACA;AAAA,IACA;AAAA,IACA,MAAM;AAAA,EACR;AACF;AAEA,IAAO,qBAAQ,CACb,eAC6C;AAC7C,SAAO,CAAC,WAA4B;AAClC,WAAO,gBAAgB,EAAE,GAAG,YAAY,GAAG,OAAO,CAAC;AAAA,EACrD;AACF;","names":[]}
@@ -0,0 +1,62 @@
1
+ /**
2
+ * TTS Realtime WebSocket Client
3
+ *
4
+ * WebSocket-based real-time text-to-speech synthesis with multiple voice options.
5
+ * Built-in playback only supports PCM format.
6
+ *
7
+ * @example
8
+ * ```typescript
9
+ * const client = createTTSClient({})({
10
+ * voice: "Cherry",
11
+ * autoPlay: true,
12
+ * onReady() {
13
+ * console.log("TTS ready");
14
+ * },
15
+ * onAudioStart() {
16
+ * console.log("Playing audio");
17
+ * },
18
+ * onAudioEnd() {
19
+ * console.log("Playback ended");
20
+ * },
21
+ * });
22
+ *
23
+ * await client.connect();
24
+ * await client.speak("Hello, this is a test.");
25
+ * // client.close();
26
+ * ```
27
+ */
28
+ interface TTSClientConfig {
29
+ /** Returns the token appended as the `token` query parameter of the WebSocket URL; return null to connect without one */
30
+ getAccessToken?: () => string | null;
31
+ /** Voice name sent in the session update, default 'Cherry' */
32
+ voice?: string;
33
+ /** Play automatically (browser only) once the audio of a response is complete, default true */
34
+ autoPlay?: boolean;
35
+ /** Requested response format, default 'pcm'; built-in playback decodes the data as 16-bit little-endian PCM */
36
+ audioFormat?: "pcm" | "mp3" | "wav" | "opus";
37
+ /** Sample rate sent in the session update and used for the playback buffer, default 24000 */
38
+ sampleRate?: number;
39
+ /** Called when the server confirms the session with `session.updated` */
40
+ onReady?: () => void;
41
+ /** Called when built-in playback begins */
42
+ onAudioStart?: () => void;
43
+ /** Called when the playback source reports it has ended */
44
+ onAudioEnd?: () => void;
45
+ /** Called after every received audio delta and once more when the audio is done, with ALL base64 chunks buffered so far */
46
+ onAudioChunk?: (chunk: string[]) => void;
47
+ /** Called for server `error` messages, WebSocket errors and playback failures */
48
+ onError?: (error: Error) => void;
49
+ }
50
+ interface TTSClient {
51
+ /** Open the WebSocket; resolves once the server confirms the session, rejects on a socket or server error */
52
+ connect(): Promise<void>;
53
+ /** Send text for synthesis and reset the buffered audio; rejects with "WebSocket not connected" when the socket is not open */
54
+ speak(text: string): Promise<void>;
55
+ /** Play the audio chunks buffered from the latest response (browser only) */
56
+ play(): void;
57
+ /** Close the WebSocket and the AudioContext, if any */
58
+ close(): void;
59
+ }
60
+ declare const _default: (authConfig: Pick<TTSClientConfig, "getAccessToken">) => ((config: TTSClientConfig) => TTSClient);
61
+
62
+ export { type TTSClient, type TTSClientConfig, _default as createTTSClient };
@@ -0,0 +1,62 @@
1
+ /**
2
+ * TTS Realtime WebSocket Client
3
+ *
4
+ * WebSocket-based real-time text-to-speech synthesis with multiple voice options.
5
+ * Built-in playback only supports PCM format.
6
+ *
7
+ * @example
8
+ * ```typescript
9
+ * const client = createTTSClient({})({
10
+ * voice: "Cherry",
11
+ * autoPlay: true,
12
+ * onReady() {
13
+ * console.log("TTS ready");
14
+ * },
15
+ * onAudioStart() {
16
+ * console.log("Playing audio");
17
+ * },
18
+ * onAudioEnd() {
19
+ * console.log("Playback ended");
20
+ * },
21
+ * });
22
+ *
23
+ * await client.connect();
24
+ * await client.speak("Hello, this is a test.");
25
+ * // client.close();
26
+ * ```
27
+ */
28
+ interface TTSClientConfig {
29
+ /** Returns the token appended as the `token` query parameter of the WebSocket URL; return null to connect without one */
30
+ getAccessToken?: () => string | null;
31
+ /** Voice name sent in the session update, default 'Cherry' */
32
+ voice?: string;
33
+ /** Play automatically (browser only) once the audio of a response is complete, default true */
34
+ autoPlay?: boolean;
35
+ /** Requested response format, default 'pcm'; built-in playback decodes the data as 16-bit little-endian PCM */
36
+ audioFormat?: "pcm" | "mp3" | "wav" | "opus";
37
+ /** Sample rate sent in the session update and used for the playback buffer, default 24000 */
38
+ sampleRate?: number;
39
+ /** Called when the server confirms the session with `session.updated` */
40
+ onReady?: () => void;
41
+ /** Called when built-in playback begins */
42
+ onAudioStart?: () => void;
43
+ /** Called when the playback source reports it has ended */
44
+ onAudioEnd?: () => void;
45
+ /** Called after every received audio delta and once more when the audio is done, with ALL base64 chunks buffered so far */
46
+ onAudioChunk?: (chunk: string[]) => void;
47
+ /** Called for server `error` messages, WebSocket errors and playback failures */
48
+ onError?: (error: Error) => void;
49
+ }
50
+ interface TTSClient {
51
+ /** Open the WebSocket; resolves once the server confirms the session, rejects on a socket or server error */
52
+ connect(): Promise<void>;
53
+ /** Send text for synthesis and reset the buffered audio; rejects with "WebSocket not connected" when the socket is not open */
54
+ speak(text: string): Promise<void>;
55
+ /** Play the audio chunks buffered from the latest response (browser only) */
56
+ play(): void;
57
+ /** Close the WebSocket and the AudioContext, if any */
58
+ close(): void;
59
+ }
60
+ declare const _default: (authConfig: Pick<TTSClientConfig, "getAccessToken">) => ((config: TTSClientConfig) => TTSClient);
61
+
62
+ export { type TTSClient, type TTSClientConfig, _default as createTTSClient };
package/dist/index.js ADDED
@@ -0,0 +1,166 @@
1
+ // src/tts-client.ts
2
var TTS_PATH = "/api/proxy/builtin/platform/qwen-tts/api-ws/v1/realtime";

/**
 * Creates a realtime text-to-speech client on top of a browser WebSocket.
 *
 * The client performs the session handshake (`session.created` ->
 * `session.update` -> `session.updated`), buffers the base64 audio deltas of
 * the current response and can play them through an `AudioContext`.
 * Built-in playback decodes 16-bit little-endian mono PCM only.
 *
 * @param config Client options: `getAccessToken`, `voice` (default "Cherry"),
 *   `autoPlay` (default true), `audioFormat` (default "pcm"), `sampleRate`
 *   (default 24000) and the `onReady` / `onAudioStart` / `onAudioEnd` /
 *   `onAudioChunk` / `onError` callbacks.
 * @returns An object exposing `connect`, `speak`, `play` and `close`.
 */
function createTTSClient(config) {
  const {
    getAccessToken,
    voice = "Cherry",
    autoPlay = true,
    audioFormat = "pcm",
    sampleRate = 24e3,
    onReady,
    onAudioStart,
    onAudioEnd,
    onAudioChunk,
    onError
  } = config;
  let ws = null;
  let audioChunks = [];
  let audioContext = null;

  /** Normalizes anything thrown into an Error so `onError` always receives one. */
  const toError = (value) => value instanceof Error ? value : new Error(String(value));

  /** Decodes one base64 chunk into its raw bytes. */
  const decodeChunk = (chunk) => {
    const binary = atob(chunk);
    const bytes = new Uint8Array(binary.length);
    for (let i = 0; i < binary.length; i++) {
      bytes[i] = binary.charCodeAt(i);
    }
    return bytes;
  };

  /**
   * Opens the WebSocket and negotiates the session.
   *
   * @returns A promise that resolves once the server answers with
   *   `session.updated`, and rejects on a socket error, a server `error`
   *   message, or when the socket closes before the session is ready.
   */
  async function connect() {
    return new Promise((resolve, reject) => {
      let wsUrl = TTS_PATH;
      if (getAccessToken) {
        const token = getAccessToken();
        if (token) {
          const separator = wsUrl.includes("?") ? "&" : "?";
          wsUrl = `${wsUrl}${separator}token=${encodeURIComponent(token)}`;
        }
      }
      // Handlers close over `socket`, not the shared `ws`, so a late event from
      // this socket can never touch a newer connection or a nulled reference.
      const socket = new WebSocket(wsUrl);
      ws = socket;
      let settled = false;
      const fail = (err) => {
        onError?.(err);
        if (!settled) {
          settled = true;
          reject(err);
        }
      };
      socket.onopen = () => {
      };
      socket.onmessage = (event) => {
        let data;
        try {
          data = JSON.parse(event.data);
        } catch (err) {
          // A non-JSON frame must not escape as an uncaught exception.
          onError?.(new Error("Received a malformed message from the TTS service"));
          return;
        }
        if (!data || typeof data !== "object") return;
        switch (data.type) {
          case "session.created":
            socket.send(
              JSON.stringify({
                type: "session.update",
                session: {
                  mode: "server_commit",
                  voice,
                  response_format: audioFormat,
                  sample_rate: sampleRate
                }
              })
            );
            break;
          case "session.updated":
            settled = true;
            onReady?.();
            resolve();
            break;
          case "response.audio.delta":
            if (typeof data.delta === "string") {
              audioChunks.push(data.delta);
              onAudioChunk?.(audioChunks);
            }
            break;
          case "response.audio.done":
            onAudioChunk?.(audioChunks);
            // Only PCM can be decoded by the built-in player; other formats are
            // delivered through onAudioChunk for the caller to decode.
            if (autoPlay && audioFormat === "pcm" && typeof window !== "undefined") {
              playAudio();
            }
            break;
          case "response.done":
            // NOTE(review): this ends the session after the first response, so a
            // later speak() may find the socket closed — confirm against the
            // service protocol.
            socket.send(JSON.stringify({ type: "session.finish" }));
            break;
          case "error":
            fail(new Error(data.error?.message || "Unknown error"));
            break;
          default:
            break;
        }
      };
      socket.onerror = () => {
        fail(new Error("WebSocket connection error"));
      };
      socket.onclose = () => {
        // Do not clobber a newer socket created by a later connect().
        if (ws === socket) {
          ws = null;
        }
        // Without this the promise would stay pending forever when the server
        // (or close()) shuts the socket before the session is ready.
        if (!settled) {
          fail(new Error("WebSocket closed before the session was ready"));
        }
      };
    });
  }

  /**
   * Sends text for synthesis and clears the audio buffered from the previous
   * response.
   *
   * @param text Text to synthesize.
   * @throws Error "WebSocket not connected" when the socket is not open
   *   (surfaced as a rejected promise).
   */
  async function speak(text) {
    const socket = ws;
    if (!socket || socket.readyState !== WebSocket.OPEN) {
      throw new Error("WebSocket not connected");
    }
    audioChunks = [];
    socket.send(
      JSON.stringify({
        type: "input_text_buffer.append",
        text
      })
    );
    setTimeout(() => {
      // The socket may have been closed during the delay; the captured
      // reference plus the state check keeps the timer from throwing.
      if (socket.readyState === WebSocket.OPEN) {
        socket.send(
          JSON.stringify({
            type: "input_text_buffer.commit"
          })
        );
      }
    }, 100);
  }

  /**
   * Plays the buffered chunks as 16-bit little-endian mono PCM.
   * Does nothing outside a browser or when no complete sample is buffered;
   * reports unsupported formats and decoding failures through `onError`.
   */
  function playAudio() {
    const chunks = audioChunks;
    if (typeof window === "undefined") return;
    if (audioFormat !== "pcm") {
      onError?.(new Error(`Built-in playback only supports "pcm" audio, got "${audioFormat}"`));
      return;
    }
    try {
      const parts = chunks.map(decodeChunk);
      const totalBytes = parts.reduce((sum, bytes) => sum + bytes.length, 0);
      // A trailing odd byte cannot form a sample; dropping it avoids reading
      // past the end of the buffer.
      const numSamples = Math.floor(totalBytes / 2);
      if (numSamples === 0) return;
      const combined = new Uint8Array(totalBytes);
      let offset = 0;
      for (const bytes of parts) {
        combined.set(bytes, offset);
        offset += bytes.length;
      }
      if (!audioContext) {
        audioContext = new AudioContext();
      }
      const audioBuffer = audioContext.createBuffer(1, numSamples, sampleRate);
      const channelData = audioBuffer.getChannelData(0);
      const dataView = new DataView(combined.buffer);
      for (let i = 0; i < numSamples; i++) {
        channelData[i] = dataView.getInt16(i * 2, true) / 32768;
      }
      const source = audioContext.createBufferSource();
      source.buffer = audioBuffer;
      source.connect(audioContext.destination);
      source.onended = () => onAudioEnd?.();
      // Announce playback only once decoding succeeded, so every start can be
      // followed by an end.
      onAudioStart?.();
      source.start(0);
    } catch (err) {
      onError?.(toError(err));
    }
  }

  /** Closes the WebSocket and releases the AudioContext, if any. */
  function close() {
    if (ws) {
      ws.close();
      ws = null;
    }
    if (audioContext) {
      const context = audioContext;
      audioContext = null;
      // close() returns a promise; swallow a late rejection instead of leaving
      // it unhandled.
      Promise.resolve(context.close()).catch(() => {
      });
    }
  }
  return {
    connect,
    speak,
    close,
    play: playAudio
  };
}
158
/**
 * Public `createTTSClient` export: binds shared auth settings first and
 * returns a factory that builds a client from per-client options.
 * Per-client options override auth settings that share a key.
 */
var tts_client_default = (authConfig) => (config) => createTTSClient({ ...authConfig, ...config });
163
+ export {
164
+ tts_client_default as createTTSClient
165
+ };
166
+ //# sourceMappingURL=index.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"sources":["../src/tts-client.ts"],"sourcesContent":["/**\n * TTS Realtime WebSocket Client\n *\n * WebSocket-based real-time text-to-speech synthesis with multiple voice options.\n * Built-in playback only supports PCM format.\n *\n * @example\n * ```typescript\n * const client = createTTSClient({\n * voice: \"Cherry\",\n * autoPlay: true,\n * onReady() {\n * console.log(\"TTS ready\");\n * },\n * onAudioStart() {\n * console.log(\"Playing audio\");\n * },\n * onAudioEnd() {\n * console.log(\"Playback ended\");\n * },\n * });\n *\n * await client.connect();\n * await client.speak(\"Hello, this is a test.\");\n * // client.close();\n * ```\n */\n\nconst TTS_PATH = \"/api/proxy/builtin/platform/qwen-tts/api-ws/v1/realtime\";\n\nexport interface TTSClientConfig {\n /** Get access token for WebSocket authentication */\n getAccessToken?: () => string | null;\n /** Voice name, default 'Cherry' */\n voice?: string;\n /** Auto play audio, default true */\n autoPlay?: boolean;\n /** Audio format, default 'pcm' */\n audioFormat?: \"pcm\" | \"mp3\" | \"wav\" | \"opus\";\n /** Sample rate, default 24000 */\n sampleRate?: number;\n /** Called when connection is ready */\n onReady?: () => void;\n /** Called when audio playback starts */\n onAudioStart?: () => void;\n /** Called when audio playback ends */\n onAudioEnd?: () => void;\n /** Called on each audio chunk received */\n onAudioChunk?: (chunk: string[]) => void;\n /** Called on error */\n onError?: (error: Error) => void;\n}\n\nexport interface TTSClient {\n /** Connect to TTS service */\n connect(): Promise<void>;\n /** Synthesize speech from text */\n speak(text: string): Promise<void>;\n /** Play audio from chunks */\n play(): void;\n /** Close connection */\n close(): void;\n}\n\nfunction createTTSClient(config: TTSClientConfig): TTSClient {\n const {\n getAccessToken,\n voice = \"Cherry\",\n autoPlay = true,\n audioFormat = \"pcm\",\n sampleRate = 24000,\n onReady,\n onAudioStart,\n onAudioEnd,\n 
onAudioChunk,\n onError,\n } = config;\n\n let ws: WebSocket | null = null;\n let audioChunks: string[] = [];\n let audioContext: AudioContext | null = null;\n\n async function connect(): Promise<void> {\n return new Promise((resolve, reject) => {\n // Build WebSocket URL with optional token parameter\n let wsUrl = TTS_PATH;\n if (getAccessToken) {\n const token = getAccessToken();\n if (token) {\n const separator = wsUrl.includes(\"?\") ? \"&\" : \"?\";\n wsUrl = `${wsUrl}${separator}token=${encodeURIComponent(token)}`;\n }\n }\n\n ws = new WebSocket(wsUrl);\n\n ws.onopen = () => {};\n\n ws.onmessage = (event) => {\n const data = JSON.parse(event.data);\n\n if (data.type === \"session.created\") {\n ws!.send(\n JSON.stringify({\n type: \"session.update\",\n session: {\n mode: \"server_commit\",\n voice,\n response_format: audioFormat,\n sample_rate: sampleRate,\n },\n })\n );\n }\n\n if (data.type === \"session.updated\") {\n onReady?.();\n resolve();\n }\n\n if (data.type === \"response.audio.delta\") {\n audioChunks.push(data.delta);\n onAudioChunk?.(audioChunks);\n }\n\n if (data.type === \"response.audio.done\") {\n onAudioChunk?.(audioChunks);\n if (autoPlay && typeof window !== \"undefined\") {\n playAudio();\n }\n }\n\n if (data.type === \"response.done\") {\n ws!.send(JSON.stringify({ type: \"session.finish\" }));\n }\n\n if (data.type === \"error\") {\n const err = new Error(data.error?.message || \"Unknown error\");\n onError?.(err);\n reject(err);\n }\n };\n\n ws.onerror = () => {\n const err = new Error(\"WebSocket connection error\");\n onError?.(err);\n reject(err);\n };\n\n ws.onclose = () => {\n ws = null;\n };\n });\n }\n\n async function speak(text: string): Promise<void> {\n if (!ws || ws.readyState !== WebSocket.OPEN) {\n throw new Error(\"WebSocket not connected\");\n }\n\n audioChunks = [];\n\n ws.send(\n JSON.stringify({\n type: \"input_text_buffer.append\",\n text,\n })\n );\n\n setTimeout(() => {\n ws!.send(\n JSON.stringify({\n type: 
\"input_text_buffer.commit\",\n })\n );\n }, 100);\n }\n\n function playAudio() {\n let chunks: string[] = audioChunks;\n if (typeof window === \"undefined\") return;\n\n try {\n if (!audioContext) {\n audioContext = new AudioContext();\n }\n\n onAudioStart?.();\n\n let totalBytes = 0;\n const allBytes: Uint8Array[] = [];\n\n for (const chunk of chunks) {\n const binaryString = atob(chunk);\n const bytes = new Uint8Array(binaryString.length);\n for (let i = 0; i < binaryString.length; i++) {\n bytes[i] = binaryString.charCodeAt(i);\n }\n allBytes.push(bytes);\n totalBytes += bytes.length;\n }\n\n const combined = new Uint8Array(totalBytes);\n let offset = 0;\n for (const bytes of allBytes) {\n combined.set(bytes, offset);\n offset += bytes.length;\n }\n\n const numSamples = combined.length / 2;\n const audioBuffer = audioContext.createBuffer(1, numSamples, sampleRate);\n const channelData = audioBuffer.getChannelData(0);\n\n const dataView = new DataView(combined.buffer);\n for (let i = 0; i < numSamples; i++) {\n const int16 = dataView.getInt16(i * 2, true);\n channelData[i] = int16 / 32768.0;\n }\n\n const source = audioContext.createBufferSource();\n source.buffer = audioBuffer;\n source.connect(audioContext.destination);\n source.onended = () => onAudioEnd?.();\n source.start(0);\n } catch (err) {\n onError?.(err as Error);\n }\n }\n\n function close() {\n if (ws) {\n ws.close();\n ws = null;\n }\n if (audioContext) {\n audioContext.close();\n audioContext = null;\n }\n }\n\n return {\n connect,\n speak,\n close,\n play: playAudio,\n };\n}\n\nexport default (\n authConfig: Pick<TTSClientConfig, \"getAccessToken\">\n): ((config: TTSClientConfig) => TTSClient) => {\n return (config: TTSClientConfig) => {\n return createTTSClient({ ...authConfig, ...config });\n 
};\n};\n"],"mappings":";AA4BA,IAAM,WAAW;AAoCjB,SAAS,gBAAgB,QAAoC;AAC3D,QAAM;AAAA,IACJ;AAAA,IACA,QAAQ;AAAA,IACR,WAAW;AAAA,IACX,cAAc;AAAA,IACd,aAAa;AAAA,IACb;AAAA,IACA;AAAA,IACA;AAAA,IACA;AAAA,IACA;AAAA,EACF,IAAI;AAEJ,MAAI,KAAuB;AAC3B,MAAI,cAAwB,CAAC;AAC7B,MAAI,eAAoC;AAExC,iBAAe,UAAyB;AACtC,WAAO,IAAI,QAAQ,CAAC,SAAS,WAAW;AAEtC,UAAI,QAAQ;AACZ,UAAI,gBAAgB;AAClB,cAAM,QAAQ,eAAe;AAC7B,YAAI,OAAO;AACT,gBAAM,YAAY,MAAM,SAAS,GAAG,IAAI,MAAM;AAC9C,kBAAQ,GAAG,KAAK,GAAG,SAAS,SAAS,mBAAmB,KAAK,CAAC;AAAA,QAChE;AAAA,MACF;AAEA,WAAK,IAAI,UAAU,KAAK;AAExB,SAAG,SAAS,MAAM;AAAA,MAAC;AAEnB,SAAG,YAAY,CAAC,UAAU;AACxB,cAAM,OAAO,KAAK,MAAM,MAAM,IAAI;AAElC,YAAI,KAAK,SAAS,mBAAmB;AACnC,aAAI;AAAA,YACF,KAAK,UAAU;AAAA,cACb,MAAM;AAAA,cACN,SAAS;AAAA,gBACP,MAAM;AAAA,gBACN;AAAA,gBACA,iBAAiB;AAAA,gBACjB,aAAa;AAAA,cACf;AAAA,YACF,CAAC;AAAA,UACH;AAAA,QACF;AAEA,YAAI,KAAK,SAAS,mBAAmB;AACnC,oBAAU;AACV,kBAAQ;AAAA,QACV;AAEA,YAAI,KAAK,SAAS,wBAAwB;AACxC,sBAAY,KAAK,KAAK,KAAK;AAC3B,yBAAe,WAAW;AAAA,QAC5B;AAEA,YAAI,KAAK,SAAS,uBAAuB;AACvC,yBAAe,WAAW;AAC1B,cAAI,YAAY,OAAO,WAAW,aAAa;AAC7C,sBAAU;AAAA,UACZ;AAAA,QACF;AAEA,YAAI,KAAK,SAAS,iBAAiB;AACjC,aAAI,KAAK,KAAK,UAAU,EAAE,MAAM,iBAAiB,CAAC,CAAC;AAAA,QACrD;AAEA,YAAI,KAAK,SAAS,SAAS;AACzB,gBAAM,MAAM,IAAI,MAAM,KAAK,OAAO,WAAW,eAAe;AAC5D,oBAAU,GAAG;AACb,iBAAO,GAAG;AAAA,QACZ;AAAA,MACF;AAEA,SAAG,UAAU,MAAM;AACjB,cAAM,MAAM,IAAI,MAAM,4BAA4B;AAClD,kBAAU,GAAG;AACb,eAAO,GAAG;AAAA,MACZ;AAEA,SAAG,UAAU,MAAM;AACjB,aAAK;AAAA,MACP;AAAA,IACF,CAAC;AAAA,EACH;AAEA,iBAAe,MAAM,MAA6B;AAChD,QAAI,CAAC,MAAM,GAAG,eAAe,UAAU,MAAM;AAC3C,YAAM,IAAI,MAAM,yBAAyB;AAAA,IAC3C;AAEA,kBAAc,CAAC;AAEf,OAAG;AAAA,MACD,KAAK,UAAU;AAAA,QACb,MAAM;AAAA,QACN;AAAA,MACF,CAAC;AAAA,IACH;AAEA,eAAW,MAAM;AACf,SAAI;AAAA,QACF,KAAK,UAAU;AAAA,UACb,MAAM;AAAA,QACR,CAAC;AAAA,MACH;AAAA,IACF,GAAG,GAAG;AAAA,EACR;AAEA,WAAS,YAAY;AACnB,QAAI,SAAmB;AACvB,QAAI,OAAO,WAAW,YAAa;AAEnC,QAAI;AACF,UAAI,CAAC,cAAc;AACjB,uBAAe,IAAI,aAAa;AAAA,MAClC;AAEA,qBAAe;AAEf,UAAI,aAAa;AACjB,YAAM,WAAyB,CAAC;AAEhC,iBAAW,SAAS,QAAQ;AAC1B,cAAM,eAAe,KAAK,KAAK;AAC/B,cAAM,QAAQ,IAAI,WA
AW,aAAa,MAAM;AAChD,iBAAS,IAAI,GAAG,IAAI,aAAa,QAAQ,KAAK;AAC5C,gBAAM,CAAC,IAAI,aAAa,WAAW,CAAC;AAAA,QACtC;AACA,iBAAS,KAAK,KAAK;AACnB,sBAAc,MAAM;AAAA,MACtB;AAEA,YAAM,WAAW,IAAI,WAAW,UAAU;AAC1C,UAAI,SAAS;AACb,iBAAW,SAAS,UAAU;AAC5B,iBAAS,IAAI,OAAO,MAAM;AAC1B,kBAAU,MAAM;AAAA,MAClB;AAEA,YAAM,aAAa,SAAS,SAAS;AACrC,YAAM,cAAc,aAAa,aAAa,GAAG,YAAY,UAAU;AACvE,YAAM,cAAc,YAAY,eAAe,CAAC;AAEhD,YAAM,WAAW,IAAI,SAAS,SAAS,MAAM;AAC7C,eAAS,IAAI,GAAG,IAAI,YAAY,KAAK;AACnC,cAAM,QAAQ,SAAS,SAAS,IAAI,GAAG,IAAI;AAC3C,oBAAY,CAAC,IAAI,QAAQ;AAAA,MAC3B;AAEA,YAAM,SAAS,aAAa,mBAAmB;AAC/C,aAAO,SAAS;AAChB,aAAO,QAAQ,aAAa,WAAW;AACvC,aAAO,UAAU,MAAM,aAAa;AACpC,aAAO,MAAM,CAAC;AAAA,IAChB,SAAS,KAAK;AACZ,gBAAU,GAAY;AAAA,IACxB;AAAA,EACF;AAEA,WAAS,QAAQ;AACf,QAAI,IAAI;AACN,SAAG,MAAM;AACT,WAAK;AAAA,IACP;AACA,QAAI,cAAc;AAChB,mBAAa,MAAM;AACnB,qBAAe;AAAA,IACjB;AAAA,EACF;AAEA,SAAO;AAAA,IACL;AAAA,IACA;AAAA,IACA;AAAA,IACA,MAAM;AAAA,EACR;AACF;AAEA,IAAO,qBAAQ,CACb,eAC6C;AAC7C,SAAO,CAAC,WAA4B;AAClC,WAAO,gBAAgB,EAAE,GAAG,YAAY,GAAG,OAAO,CAAC;AAAA,EACrD;AACF;","names":[]}
package/package.json ADDED
@@ -0,0 +1,45 @@
1
+ {
2
+ "name": "@amaster.ai/tts-client",
3
+ "version": "1.0.0-alpha.2",
4
+ "description": "Qwen TTS Realtime WebSocket client with audio playback",
5
+ "type": "module",
6
+ "main": "./dist/index.cjs",
7
+ "module": "./dist/index.js",
8
+ "types": "./dist/index.d.ts",
9
+ "exports": {
10
+ ".": {
11
+ "types": "./dist/index.d.ts",
12
+ "import": "./dist/index.js",
13
+ "require": "./dist/index.cjs"
14
+ }
15
+ },
16
+ "files": [
17
+ "dist",
18
+ "README.md"
19
+ ],
20
+ "keywords": [
21
+ "tts",
22
+ "text-to-speech",
23
+ "qwen",
24
+ "realtime",
25
+ "websocket",
26
+ "audio",
27
+ "speech-synthesis"
28
+ ],
29
+ "author": "Amaster Team",
30
+ "license": "MIT",
31
+ "publishConfig": {
32
+ "access": "public",
33
+ "registry": "https://registry.npmjs.org/"
34
+ },
35
+ "devDependencies": {
36
+ "tsup": "^8.3.5",
37
+ "typescript": "~5.7.2"
38
+ },
39
+ "scripts": {
40
+ "build": "tsup",
41
+ "dev": "tsup --watch",
42
+ "clean": "rm -rf dist *.tsbuildinfo",
43
+ "type-check": "tsc --noEmit"
44
+ }
45
+ }