@cloudflare/tanstack-ai 0.1.6 → 0.1.7
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +6 -6
- package/dist/adapters/anthropic.cjs +32 -11
- package/dist/adapters/anthropic.cjs.map +1 -1
- package/dist/adapters/anthropic.d.cts +23 -5
- package/dist/adapters/anthropic.d.mts +23 -0
- package/dist/adapters/anthropic.mjs +30 -0
- package/dist/adapters/anthropic.mjs.map +1 -0
- package/dist/adapters/gemini.cjs +83 -20
- package/dist/adapters/gemini.cjs.map +1 -1
- package/dist/adapters/gemini.d.cts +52 -14
- package/dist/adapters/gemini.d.mts +52 -0
- package/dist/adapters/gemini.mjs +76 -0
- package/dist/adapters/gemini.mjs.map +1 -0
- package/dist/adapters/grok.cjs +44 -15
- package/dist/adapters/grok.cjs.map +1 -1
- package/dist/adapters/grok.d.cts +26 -9
- package/dist/adapters/grok.d.mts +26 -0
- package/dist/adapters/grok.mjs +40 -0
- package/dist/adapters/grok.mjs.map +1 -0
- package/dist/adapters/openai.cjs +76 -27
- package/dist/adapters/openai.cjs.map +1 -1
- package/dist/adapters/openai.d.cts +45 -17
- package/dist/adapters/openai.d.mts +45 -0
- package/dist/adapters/openai.mjs +66 -0
- package/dist/adapters/openai.mjs.map +1 -0
- package/dist/adapters/openrouter.cjs +83 -11
- package/dist/adapters/openrouter.cjs.map +1 -1
- package/dist/adapters/openrouter.d.cts +39 -7
- package/dist/adapters/openrouter.d.mts +39 -0
- package/dist/adapters/openrouter.mjs +81 -0
- package/dist/adapters/openrouter.mjs.map +1 -0
- package/dist/adapters/workers-ai-image.cjs +97 -11
- package/dist/adapters/workers-ai-image.cjs.map +1 -1
- package/dist/adapters/workers-ai-image.d.cts +41 -3
- package/dist/adapters/workers-ai-image.d.mts +41 -0
- package/dist/adapters/workers-ai-image.mjs +96 -0
- package/dist/adapters/workers-ai-image.mjs.map +1 -0
- package/dist/adapters/workers-ai-summarize.cjs +86 -10
- package/dist/adapters/workers-ai-summarize.cjs.map +1 -1
- package/dist/adapters/workers-ai-summarize.d.cts +42 -3
- package/dist/adapters/workers-ai-summarize.d.mts +42 -0
- package/dist/adapters/workers-ai-summarize.mjs +85 -0
- package/dist/adapters/workers-ai-summarize.mjs.map +1 -0
- package/dist/adapters/workers-ai-transcription.cjs +200 -11
- package/dist/adapters/workers-ai-transcription.cjs.map +1 -1
- package/dist/adapters/workers-ai-transcription.d.cts +74 -3
- package/dist/adapters/workers-ai-transcription.d.mts +74 -0
- package/dist/adapters/workers-ai-transcription.mjs +199 -0
- package/dist/adapters/workers-ai-transcription.mjs.map +1 -0
- package/dist/adapters/workers-ai-tts.cjs +112 -11
- package/dist/adapters/workers-ai-tts.cjs.map +1 -1
- package/dist/adapters/workers-ai-tts.d.cts +54 -3
- package/dist/adapters/workers-ai-tts.d.mts +54 -0
- package/dist/adapters/workers-ai-tts.mjs +111 -0
- package/dist/adapters/workers-ai-tts.mjs.map +1 -0
- package/dist/adapters/workers-ai.cjs +4 -11
- package/dist/adapters/workers-ai.d.cts +18 -3
- package/dist/adapters/workers-ai.d.mts +18 -0
- package/dist/adapters/workers-ai.mjs +470 -0
- package/dist/adapters/workers-ai.mjs.map +1 -0
- package/dist/binary-C9FAYwZj.cjs +70 -0
- package/dist/binary-C9FAYwZj.cjs.map +1 -0
- package/dist/binary-p4H_N_3M.mjs +59 -0
- package/dist/binary-p4H_N_3M.mjs.map +1 -0
- package/dist/create-fetcher-5iL34e6H.cjs +310 -0
- package/dist/create-fetcher-5iL34e6H.cjs.map +1 -0
- package/dist/create-fetcher-6p6heb85.d.mts +93 -0
- package/dist/create-fetcher-DY7wfYYy.mjs +281 -0
- package/dist/create-fetcher-DY7wfYYy.mjs.map +1 -0
- package/dist/create-fetcher-vAQ8WW-p.d.cts +93 -0
- package/dist/defineProperty-CbyrzcbA.mjs +39 -0
- package/dist/defineProperty-DQoAg20E.cjs +44 -0
- package/dist/index.cjs +50 -97
- package/dist/index.d.cts +12 -64
- package/dist/index.d.mts +12 -0
- package/dist/index.mjs +11 -0
- package/dist/workers-ai-Bm7Up4or.cjs +510 -0
- package/dist/workers-ai-Bm7Up4or.cjs.map +1 -0
- package/dist/workers-ai-rest-CkNCtBwv.cjs +85 -0
- package/dist/workers-ai-rest-CkNCtBwv.cjs.map +1 -0
- package/dist/workers-ai-rest-GKy2r7eG.mjs +74 -0
- package/dist/workers-ai-rest-GKy2r7eG.mjs.map +1 -0
- package/package.json +73 -40
- package/dist/_tsup-dts-rollup.d.cts +0 -837
- package/dist/_tsup-dts-rollup.d.ts +0 -837
- package/dist/adapters/anthropic.d.ts +0 -5
- package/dist/adapters/anthropic.js +0 -13
- package/dist/adapters/anthropic.js.map +0 -1
- package/dist/adapters/gemini.d.ts +0 -14
- package/dist/adapters/gemini.js +0 -22
- package/dist/adapters/gemini.js.map +0 -1
- package/dist/adapters/grok.d.ts +0 -9
- package/dist/adapters/grok.js +0 -17
- package/dist/adapters/grok.js.map +0 -1
- package/dist/adapters/openai.d.ts +0 -17
- package/dist/adapters/openai.js +0 -29
- package/dist/adapters/openai.js.map +0 -1
- package/dist/adapters/openrouter.d.ts +0 -7
- package/dist/adapters/openrouter.js +0 -13
- package/dist/adapters/openrouter.js.map +0 -1
- package/dist/adapters/workers-ai-image.d.ts +0 -3
- package/dist/adapters/workers-ai-image.js +0 -13
- package/dist/adapters/workers-ai-image.js.map +0 -1
- package/dist/adapters/workers-ai-summarize.d.ts +0 -3
- package/dist/adapters/workers-ai-summarize.js +0 -12
- package/dist/adapters/workers-ai-summarize.js.map +0 -1
- package/dist/adapters/workers-ai-transcription.d.ts +0 -3
- package/dist/adapters/workers-ai-transcription.js +0 -13
- package/dist/adapters/workers-ai-transcription.js.map +0 -1
- package/dist/adapters/workers-ai-tts.d.ts +0 -3
- package/dist/adapters/workers-ai-tts.js +0 -13
- package/dist/adapters/workers-ai-tts.js.map +0 -1
- package/dist/adapters/workers-ai.cjs.map +0 -1
- package/dist/adapters/workers-ai.d.ts +0 -3
- package/dist/adapters/workers-ai.js +0 -11
- package/dist/adapters/workers-ai.js.map +0 -1
- package/dist/chunk-2VII5BK2.js +0 -42
- package/dist/chunk-2VII5BK2.js.map +0 -1
- package/dist/chunk-3VQDXJLW.cjs +0 -46
- package/dist/chunk-3VQDXJLW.cjs.map +0 -1
- package/dist/chunk-3WK5ZD57.js +0 -57
- package/dist/chunk-3WK5ZD57.js.map +0 -1
- package/dist/chunk-4DE2IREA.cjs +0 -8
- package/dist/chunk-4DE2IREA.cjs.map +0 -1
- package/dist/chunk-53A2QIXV.js +0 -98
- package/dist/chunk-53A2QIXV.js.map +0 -1
- package/dist/chunk-6MEX2ZSM.cjs +0 -48
- package/dist/chunk-6MEX2ZSM.cjs.map +0 -1
- package/dist/chunk-7HSUHP63.cjs +0 -42
- package/dist/chunk-7HSUHP63.cjs.map +0 -1
- package/dist/chunk-AIAJANLC.js +0 -327
- package/dist/chunk-AIAJANLC.js.map +0 -1
- package/dist/chunk-CB3PSZY2.cjs +0 -218
- package/dist/chunk-CB3PSZY2.cjs.map +0 -1
- package/dist/chunk-FQE2UKUU.cjs +0 -57
- package/dist/chunk-FQE2UKUU.cjs.map +0 -1
- package/dist/chunk-GL3HHR4M.js +0 -523
- package/dist/chunk-GL3HHR4M.js.map +0 -1
- package/dist/chunk-J5DSSZTO.js +0 -71
- package/dist/chunk-J5DSSZTO.js.map +0 -1
- package/dist/chunk-JRFPCMSE.js +0 -57
- package/dist/chunk-JRFPCMSE.js.map +0 -1
- package/dist/chunk-KWYOUT2Y.js +0 -111
- package/dist/chunk-KWYOUT2Y.js.map +0 -1
- package/dist/chunk-MJ45L566.cjs +0 -57
- package/dist/chunk-MJ45L566.cjs.map +0 -1
- package/dist/chunk-N6U27RQW.cjs +0 -111
- package/dist/chunk-N6U27RQW.cjs.map +0 -1
- package/dist/chunk-NH3FF5JC.js +0 -86
- package/dist/chunk-NH3FF5JC.js.map +0 -1
- package/dist/chunk-OFUYHQZE.cjs +0 -31
- package/dist/chunk-OFUYHQZE.cjs.map +0 -1
- package/dist/chunk-OUEAAP25.cjs +0 -523
- package/dist/chunk-OUEAAP25.cjs.map +0 -1
- package/dist/chunk-Q33U5I5S.js +0 -31
- package/dist/chunk-Q33U5I5S.js.map +0 -1
- package/dist/chunk-V4LKHWJA.cjs +0 -71
- package/dist/chunk-V4LKHWJA.cjs.map +0 -1
- package/dist/chunk-V6TY7KAL.js +0 -8
- package/dist/chunk-V6TY7KAL.js.map +0 -1
- package/dist/chunk-WBTQKWFN.cjs +0 -327
- package/dist/chunk-WBTQKWFN.cjs.map +0 -1
- package/dist/chunk-XU7YEPML.js +0 -46
- package/dist/chunk-XU7YEPML.js.map +0 -1
- package/dist/chunk-YCGNMVQZ.js +0 -218
- package/dist/chunk-YCGNMVQZ.js.map +0 -1
- package/dist/chunk-Z5ZC5ZOQ.js +0 -48
- package/dist/chunk-Z5ZC5ZOQ.js.map +0 -1
- package/dist/chunk-ZFB72L57.cjs +0 -86
- package/dist/chunk-ZFB72L57.cjs.map +0 -1
- package/dist/chunk-ZGLSJM26.cjs +0 -98
- package/dist/chunk-ZGLSJM26.cjs.map +0 -1
- package/dist/index.cjs.map +0 -1
- package/dist/index.d.ts +0 -64
- package/dist/index.js +0 -97
- package/dist/index.js.map +0 -1
|
@@ -0,0 +1,199 @@
|
|
|
1
|
+
import { a as validateWorkersAiConfig, i as isDirectCredentialsConfig, r as isDirectBindingConfig, t as createGatewayFetch } from "../create-fetcher-DY7wfYYy.mjs";
|
|
2
|
+
import { t as _defineProperty } from "../defineProperty-CbyrzcbA.mjs";
|
|
3
|
+
import { n as workersAiRestFetchBinary, t as workersAiRestFetch } from "../workers-ai-rest-GKy2r7eG.mjs";
|
|
4
|
+
import { n as uint8ArrayToBase64 } from "../binary-p4H_N_3M.mjs";
|
|
5
|
+
import { BaseTranscriptionAdapter } from "@tanstack/ai/adapters";
|
|
6
|
+
//#region src/adapters/workers-ai-transcription.ts
|
|
7
|
+
/**
 * TanStack AI transcription (speech-to-text) adapter backed by Cloudflare
 * Workers AI.
 *
 * The transport is picked per call from the shape of the config handed to the
 * constructor: a direct binding, direct REST credentials, or — when neither
 * type guard matches — the AI Gateway fetcher.
 */
var WorkersAiTranscriptionAdapter = class extends BaseTranscriptionAdapter {
	/**
	 * @param config Workers AI adapter config; passed through `validateWorkersAiConfig`
	 *   before being stored (presumably throws on an invalid config — confirm in create-fetcher).
	 * @param model Workers AI model id, e.g. "@cf/openai/whisper-large-v3-turbo".
	 */
	constructor(config, model) {
		super({}, model);
		_defineProperty(this, "name", "workers-ai-transcription");
		_defineProperty(this, "adapterConfig", void 0);
		validateWorkersAiConfig(config);
		this.adapterConfig = config;
	}
	/**
	 * Transcribe audio with the configured model.
	 *
	 * `language` and `prompt` are merged on top of `modelOptions` (as `language`
	 * and `initial_prompt`). An AbortSignal can be supplied as `modelOptions.signal`.
	 *
	 * Note: for `@cf/deepgram/nova-3` over REST credentials only the raw audio,
	 * its content type and the signal are sent; the other extra options are not
	 * forwarded by that path.
	 *
	 * @param options TanStack AI transcription options (`audio`, `language`, `prompt`, `modelOptions`).
	 * @returns The normalized transcription result.
	 */
	async transcribe(options) {
		const { audio, language, prompt, modelOptions } = options;
		const audioBytes = await normalizeAudioToBytes(audio);
		const extra = { ...modelOptions };
		if (language) extra.language = language;
		if (prompt) extra.initial_prompt = prompt;
		// Same precedence as before: binding first, then REST credentials, then gateway.
		const useBinding = isDirectBindingConfig(this.adapterConfig);
		const useRest = !useBinding && isDirectCredentialsConfig(this.adapterConfig);
		// Nova-3 over REST takes raw bytes, so skip building (and base64-encoding)
		// a JSON payload that would never be used.
		if (useRest && this.model === "@cf/deepgram/nova-3") return this.transcribeViaRestBinary(audioBytes, audio, extra);
		const audioPayload = this.buildAudioPayload(audioBytes, audio);
		if (useBinding) return this.transcribeViaBinding(audioPayload, extra);
		if (useRest) return this.transcribeViaRest(audioPayload, extra);
		return this.transcribeViaGateway(audioPayload, extra);
	}
	/**
	 * Build the audio field for the request payload, handling model-specific formats.
	 *
	 * - `@cf/deepgram/nova-3`: `{ audio: { body: base64, contentType: "audio/..." } }`
	 * - `@cf/openai/whisper-large-v3-turbo`: `{ audio: base64 }`
	 * - any other model: `{ audio: number[] }` (the raw bytes)
	 *
	 * @param audioBytes Raw audio bytes as a number[].
	 * @param originalAudio The caller's original audio value, used only to detect the content type.
	 * @returns An object with a single `audio` key, ready to spread into the request.
	 */
	buildAudioPayload(audioBytes, originalAudio) {
		if (this.model === "@cf/deepgram/nova-3") return { audio: {
			body: uint8ArrayToBase64(new Uint8Array(audioBytes)),
			contentType: detectAudioContentType(originalAudio)
		} };
		if (this.model === "@cf/openai/whisper-large-v3-turbo") return { audio: uint8ArrayToBase64(new Uint8Array(audioBytes)) };
		return { audio: audioBytes };
	}
	/**
	 * Run the model through the Workers AI binding (`binding.run`).
	 *
	 * @param audioPayload Result of `buildAudioPayload`.
	 * @param options Extra model inputs; a `signal` entry is stripped because it is not a model input.
	 */
	async transcribeViaBinding(audioPayload, options) {
		// The AbortSignal travels inside the options bag; keep it out of the model inputs.
		const { signal: _unusedSignal, ...inputs } = options;
		const result = await this.adapterConfig.binding.run(this.model, {
			...audioPayload,
			...inputs
		});
		return this.normalizeResult(result);
	}
	/**
	 * Run the model through the Workers AI REST helper with a JSON body.
	 *
	 * @param audioPayload Result of `buildAudioPayload`.
	 * @param options Extra model inputs, optionally carrying an AbortSignal as `signal`.
	 */
	async transcribeViaRest(audioPayload, options) {
		// `signal` configures the request; it must not be serialized into the JSON body.
		const { signal, ...inputs } = options;
		const response = await workersAiRestFetch(this.adapterConfig, this.model, {
			...audioPayload,
			...inputs
		}, {
			label: "Workers AI transcription",
			signal
		});
		const data = await response.json();
		// Use the `result` envelope when present, otherwise treat the body as the result itself.
		return this.normalizeResult(data.result ?? data);
	}
	/**
	 * Transcribe via REST using raw binary audio.
	 * Required for models like Deepgram Nova-3 that expect raw audio bytes
	 * with a Content-Type header (e.g. "audio/wav") instead of JSON.
	 *
	 * @param audioBytes Raw audio bytes as a number[].
	 * @param originalAudio The caller's original audio value, used to detect the content type.
	 * @param options Only `options.signal` is read here.
	 */
	async transcribeViaRestBinary(audioBytes, originalAudio, options) {
		const contentType = detectAudioContentType(originalAudio);
		const response = await workersAiRestFetchBinary(this.adapterConfig, this.model, new Uint8Array(audioBytes), contentType, {
			label: "Workers AI transcription",
			signal: options.signal
		});
		const data = await response.json();
		return this.normalizeResult(data.result ?? data);
	}
	/**
	 * Run the model through the AI Gateway fetcher.
	 *
	 * @param audioPayload Result of `buildAudioPayload`.
	 * @param options Extra model inputs, optionally carrying an AbortSignal as `signal`.
	 * @throws {Error} When the gateway responds with a non-OK status.
	 */
	async transcribeViaGateway(audioPayload, options) {
		const { signal, ...inputs } = options;
		const gatewayFetch = createGatewayFetch("workers-ai", this.adapterConfig);
		// NOTE(review): the URL looks like a placeholder — the gateway fetcher is
		// expected to route by the `model` in the body; confirm in create-fetcher.
		const response = await gatewayFetch("https://api.cloudflare.com/v1/audio/transcriptions", {
			method: "POST",
			body: JSON.stringify({
				model: this.model,
				...audioPayload,
				...inputs
			}),
			// NOTE(review): assumes the gateway fetcher honors `init.signal` like a
			// standard fetch — confirm in create-fetcher.
			...(signal ? { signal } : {})
		});
		if (!response.ok) {
			const errorText = await response.text();
			throw new Error(`Workers AI transcription gateway request failed (${response.status}): ${errorText}`);
		}
		const data = await response.json();
		return this.normalizeResult(data);
	}
	/**
	 * Normalize Workers AI transcription results into the standard
	 * TanStack AI TranscriptionResult shape.
	 *
	 * Handles three response formats:
	 * - Whisper: `{ text, words?, vtt? }`
	 * - Whisper v3-turbo: `{ text, segments?, transcription_info? }`
	 * - Deepgram Nova-3: `{ results: { channels: [{ alternatives: [{ transcript, words }] }] } }`
	 *
	 * Missing text/word/segment fields fall back to "" or 0.
	 *
	 * @param raw Parsed model response.
	 * @returns `{ id, model, text }` plus `words`, `segments`, `language`, `duration` when available.
	 */
	normalizeResult(raw) {
		const results = raw.results;
		if (results?.channels) {
			// Deepgram shape: only the first alternative of the first channel is used.
			const alt = results.channels?.[0]?.alternatives?.[0];
			const text = alt?.transcript ?? "";
			const result = {
				id: this.generateId(),
				model: this.model,
				text
			};
			if (alt?.words && Array.isArray(alt.words)) result.words = alt.words.map((w) => ({
				word: w.word ?? "",
				start: w.start ?? 0,
				end: w.end ?? 0
			}));
			return result;
		}
		// Whisper-family shape.
		const result = {
			id: this.generateId(),
			model: this.model,
			text: raw.text ?? ""
		};
		const transcriptionInfo = raw.transcription_info;
		if (transcriptionInfo?.language) result.language = transcriptionInfo.language;
		// `!= null` keeps a legitimate duration of 0.
		if (transcriptionInfo?.duration != null) result.duration = transcriptionInfo.duration;
		if (raw.segments && Array.isArray(raw.segments)) result.segments = raw.segments.map((seg, idx) => ({
			id: idx,
			text: seg.text ?? "",
			start: seg.start ?? 0,
			end: seg.end ?? 0
		}));
		if (raw.words && Array.isArray(raw.words)) result.words = raw.words.map((w) => ({
			word: w.word ?? "",
			start: w.start ?? 0,
			end: w.end ?? 0
		}));
		return result;
	}
};
|
|
141
|
+
/**
 * Factory for a Workers AI speech-to-text adapter.
 *
 * Intended for use with TanStack AI's `generateTranscription()`:
 * ```ts
 * import { generateTranscription } from "@tanstack/ai";
 * import { createWorkersAiTranscription } from "@cloudflare/tanstack-ai";
 *
 * const adapter = createWorkersAiTranscription(
 *   "@cf/openai/whisper-large-v3-turbo",
 *   { binding: env.AI },
 * );
 *
 * const result = await generateTranscription({ adapter, audio: audioData });
 * // result.text — the transcribed text
 * ```
 *
 * The argument order here is `(model, config)`; the adapter class constructor
 * takes them the other way round, `(config, model)`.
 *
 * @param model Workers AI transcription model id.
 * @param config Workers AI adapter config.
 * @returns A new `WorkersAiTranscriptionAdapter`.
 */
function createWorkersAiTranscription(model, config) {
	const adapter = new WorkersAiTranscriptionAdapter(config, model);
	return adapter;
}
|
|
164
|
+
/**
 * Normalize various audio input formats into a number[] (raw bytes).
 *
 * Accepted inputs:
 * - `ArrayBuffer`
 * - any ArrayBuffer view (`Uint8Array`, Node `Buffer`, `DataView`, ...); only
 *   the bytes the view covers are read, not the whole underlying buffer
 * - `Blob` / `File` (`File extends Blob`, so both take the same branch)
 * - base64 string, either bare or as a `data:<mime>;base64,<payload>` URL
 *
 * @param audio The audio input to normalize.
 * @returns The raw bytes, one array entry per byte (0-255).
 * @throws {Error} If `audio` is none of the supported types. A string that is
 *   not valid base64 makes `atob` throw its own error.
 */
async function normalizeAudioToBytes(audio) {
	if (audio instanceof ArrayBuffer) return Array.from(new Uint8Array(audio));
	// Typed arrays / Buffer: respect byteOffset and byteLength so a subarray
	// does not leak the rest of its backing buffer.
	if (ArrayBuffer.isView(audio)) return Array.from(new Uint8Array(audio.buffer, audio.byteOffset, audio.byteLength));
	if (audio instanceof Blob) return Array.from(new Uint8Array(await audio.arrayBuffer()));
	if (typeof audio === "string") {
		// Strip a base64 data-URL header if present; `atob` cannot parse it.
		const header = /^data:[^,]*;base64,/i.exec(audio);
		const base64 = header ? audio.slice(header[0].length) : audio;
		// atob yields a "binary string": every character is one byte (0-255).
		return Array.from(atob(base64), (ch) => ch.charCodeAt(0));
	}
	throw new Error("Unsupported audio format. Expected string, File, Blob, or ArrayBuffer.");
}
|
|
185
|
+
/**
 * Pick the MIME type to send alongside the audio for models that need one
 * (e.g., Deepgram Nova-3).
 *
 * - `File` / `Blob` with a non-empty `.type`: that type is returned as-is
 * - anything else (untyped Blob, `ArrayBuffer`, `string`): "audio/wav"
 *
 * @param audio The original audio input.
 * @returns A MIME type string.
 */
function detectAudioContentType(audio) {
	const declaredType = audio instanceof Blob ? audio.type : "";
	return declaredType ? declaredType : "audio/wav";
}
|
|
196
|
+
//#endregion
|
|
197
|
+
export { WorkersAiTranscriptionAdapter, createWorkersAiTranscription };
|
|
198
|
+
|
|
199
|
+
//# sourceMappingURL=workers-ai-transcription.mjs.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"workers-ai-transcription.mjs","names":[],"sources":["../../src/adapters/workers-ai-transcription.ts"],"sourcesContent":["import { BaseTranscriptionAdapter } from \"@tanstack/ai/adapters\";\nimport type { TranscriptionOptions, TranscriptionResult } from \"@tanstack/ai\";\nimport {\n\ttype WorkersAiAdapterConfig,\n\ttype WorkersAiDirectBindingConfig,\n\ttype WorkersAiDirectCredentialsConfig,\n\ttype AiGatewayAdapterConfig,\n\tcreateGatewayFetch,\n\tisDirectBindingConfig,\n\tisDirectCredentialsConfig,\n\tvalidateWorkersAiConfig,\n} from \"../utils/create-fetcher\";\nimport { workersAiRestFetch, workersAiRestFetchBinary } from \"../utils/workers-ai-rest\";\nimport { uint8ArrayToBase64 } from \"../utils/binary\";\n\n// ---------------------------------------------------------------------------\n// Model types\n// ---------------------------------------------------------------------------\n\n/**\n * Workers AI models that support speech-to-text transcription.\n *\n * Note: the typed `AiModels` interface in `@cloudflare/workers-types` may lag\n * behind what's deployed. We use a string union here that matches the known\n * models including Deepgram partner models.\n *\n * **Nova-3 note:** `@cf/deepgram/nova-3` uses a different input format than the\n * Whisper models. Via binding it accepts `{ audio: { body: base64, contentType } }`.\n * Via REST it requires multipart form data (not JSON). 
The adapter handles both.\n */\nexport type WorkersAiTranscriptionModel =\n\t| \"@cf/openai/whisper\"\n\t| \"@cf/openai/whisper-tiny-en\"\n\t| \"@cf/openai/whisper-large-v3-turbo\"\n\t| \"@cf/deepgram/nova-3\"\n\t| (string & {});\n\n// ---------------------------------------------------------------------------\n// WorkersAiTranscriptionAdapter\n// ---------------------------------------------------------------------------\n\nexport class WorkersAiTranscriptionAdapter extends BaseTranscriptionAdapter<WorkersAiTranscriptionModel> {\n\treadonly name = \"workers-ai-transcription\" as const;\n\tprivate adapterConfig: WorkersAiAdapterConfig;\n\n\tconstructor(config: WorkersAiAdapterConfig, model: WorkersAiTranscriptionModel) {\n\t\tsuper({}, model);\n\t\tvalidateWorkersAiConfig(config);\n\t\tthis.adapterConfig = config;\n\t}\n\n\tasync transcribe(options: TranscriptionOptions): Promise<TranscriptionResult> {\n\t\tconst { audio, language, prompt, modelOptions } = options;\n\n\t\t// Normalize audio to raw bytes\n\t\tconst audioBytes = await normalizeAudioToBytes(audio);\n\n\t\tconst extra: Record<string, unknown> = { ...modelOptions };\n\t\tif (language) extra.language = language;\n\t\tif (prompt) extra.initial_prompt = prompt;\n\n\t\t// Build the model-specific audio payload:\n\t\t// - Deepgram Nova-3 (binding): { audio: { body: base64, contentType: \"audio/...\" } }\n\t\t// - Deepgram Nova-3 (REST): multipart FormData (handled separately)\n\t\t// - Whisper Large v3 Turbo (REST/gateway): { audio: base64string }\n\t\t// - Other Whisper models (binding): { audio: number[] }\n\t\tconst audioPayload = this.buildAudioPayload(audioBytes, audio);\n\n\t\tif (isDirectBindingConfig(this.adapterConfig)) {\n\t\t\treturn this.transcribeViaBinding(audioPayload, extra);\n\t\t}\n\n\t\tif (isDirectCredentialsConfig(this.adapterConfig)) {\n\t\t\t// Nova-3 REST requires raw binary audio, not JSON\n\t\t\tif (this.model === \"@cf/deepgram/nova-3\") {\n\t\t\t\treturn 
this.transcribeViaRestBinary(audioBytes, audio, extra);\n\t\t\t}\n\t\t\treturn this.transcribeViaRest(audioPayload, extra);\n\t\t}\n\n\t\treturn this.transcribeViaGateway(audioPayload, extra);\n\t}\n\n\t/**\n\t * Build the audio field for the request payload, handling model-specific formats.\n\t *\n\t * - `@cf/deepgram/nova-3` requires `{ body: base64, contentType: \"audio/...\" }`\n\t * - `@cf/openai/whisper-large-v3-turbo` REST/gateway accepts a base64 string\n\t * - Other Whisper models accept `number[]` (binding) or base64 (REST)\n\t */\n\tprivate buildAudioPayload(\n\t\taudioBytes: number[],\n\t\toriginalAudio: string | File | Blob | ArrayBuffer,\n\t): Record<string, unknown> {\n\t\tif (this.model === \"@cf/deepgram/nova-3\") {\n\t\t\tconst b64 = uint8ArrayToBase64(new Uint8Array(audioBytes));\n\t\t\tconst contentType = detectAudioContentType(originalAudio);\n\t\t\treturn { audio: { body: b64, contentType } };\n\t\t}\n\n\t\tif (this.model === \"@cf/openai/whisper-large-v3-turbo\") {\n\t\t\treturn { audio: uint8ArrayToBase64(new Uint8Array(audioBytes)) };\n\t\t}\n\n\t\treturn { audio: audioBytes };\n\t}\n\n\tprivate async transcribeViaBinding(\n\t\taudioPayload: Record<string, unknown>,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TranscriptionResult> {\n\t\tconst ai = (this.adapterConfig as WorkersAiDirectBindingConfig).binding;\n\t\tconst result = (await ai.run(this.model, {\n\t\t\t...audioPayload,\n\t\t\t...options,\n\t\t})) as Record<string, unknown>;\n\t\treturn this.normalizeResult(result);\n\t}\n\n\tprivate async transcribeViaRest(\n\t\taudioPayload: Record<string, unknown>,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TranscriptionResult> {\n\t\tconst config = this.adapterConfig as WorkersAiDirectCredentialsConfig;\n\n\t\tconst response = await workersAiRestFetch(\n\t\t\tconfig,\n\t\t\tthis.model,\n\t\t\t{ ...audioPayload, ...options },\n\t\t\t{\n\t\t\t\tlabel: \"Workers AI transcription\",\n\t\t\t\tsignal: (options as { signal?: 
AbortSignal }).signal,\n\t\t\t},\n\t\t);\n\n\t\tconst data = (await response.json()) as {\n\t\t\tresult?: Record<string, unknown>;\n\t\t} & Record<string, unknown>;\n\n\t\t// Cloudflare REST API wraps responses in { success, result: {...} }.\n\t\t// Use `data.result` when present, fall back to `data` for direct responses.\n\t\treturn this.normalizeResult(data.result ?? data);\n\t}\n\n\t/**\n\t * Transcribe via REST using raw binary audio.\n\t * Required for models like Deepgram Nova-3 that expect raw audio bytes\n\t * with a Content-Type header (e.g. \"audio/wav\") instead of JSON.\n\t */\n\tprivate async transcribeViaRestBinary(\n\t\taudioBytes: number[],\n\t\toriginalAudio: string | File | Blob | ArrayBuffer,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TranscriptionResult> {\n\t\tconst config = this.adapterConfig as WorkersAiDirectCredentialsConfig;\n\t\tconst contentType = detectAudioContentType(originalAudio);\n\n\t\tconst response = await workersAiRestFetchBinary(\n\t\t\tconfig,\n\t\t\tthis.model,\n\t\t\tnew Uint8Array(audioBytes),\n\t\t\tcontentType,\n\t\t\t{\n\t\t\t\tlabel: \"Workers AI transcription\",\n\t\t\t\tsignal: (options as { signal?: AbortSignal }).signal,\n\t\t\t},\n\t\t);\n\n\t\tconst data = (await response.json()) as {\n\t\t\tresult?: Record<string, unknown>;\n\t\t} & Record<string, unknown>;\n\n\t\treturn this.normalizeResult(data.result ?? 
data);\n\t}\n\n\tprivate async transcribeViaGateway(\n\t\taudioPayload: Record<string, unknown>,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TranscriptionResult> {\n\t\tconst gatewayConfig = this.adapterConfig as AiGatewayAdapterConfig;\n\t\tconst gatewayFetch = createGatewayFetch(\"workers-ai\", gatewayConfig);\n\n\t\t// The URL here is a placeholder — createGatewayFetch for \"workers-ai\" extracts\n\t\t// the model from the body, sets it as the endpoint, and routes through the gateway.\n\t\t// The actual URL path is not used.\n\t\tconst response = await gatewayFetch(\"https://api.cloudflare.com/v1/audio/transcriptions\", {\n\t\t\tmethod: \"POST\",\n\t\t\tbody: JSON.stringify({\n\t\t\t\tmodel: this.model,\n\t\t\t\t...audioPayload,\n\t\t\t\t...options,\n\t\t\t}),\n\t\t});\n\n\t\tif (!response.ok) {\n\t\t\tconst errorText = await response.text();\n\t\t\tthrow new Error(\n\t\t\t\t`Workers AI transcription gateway request failed (${response.status}): ${errorText}`,\n\t\t\t);\n\t\t}\n\n\t\tconst data = (await response.json()) as Record<string, unknown>;\n\t\treturn this.normalizeResult(data);\n\t}\n\n\t/**\n\t * Normalize Workers AI transcription results into the standard\n\t * TanStack AI TranscriptionResult shape.\n\t *\n\t * Handles three response formats:\n\t * - Whisper: `{ text, words?, vtt? }`\n\t * - Whisper v3-turbo: `{ text, segments?, transcription_info? 
}`\n\t * - Deepgram Nova-3: `{ results: { channels: [{ alternatives: [{ transcript, words }] }] } }`\n\t */\n\tprivate normalizeResult(raw: Record<string, unknown>): TranscriptionResult {\n\t\t// Deepgram Nova-3 format: { results: { channels: [{ alternatives: [{ transcript, words }] }] } }\n\t\tconst results = raw.results as Record<string, unknown> | undefined;\n\t\tif (results?.channels) {\n\t\t\tconst channels = results.channels as Array<{\n\t\t\t\talternatives?: Array<{\n\t\t\t\t\ttranscript?: string;\n\t\t\t\t\tconfidence?: number;\n\t\t\t\t\twords?: Array<{ word: string; start: number; end: number; confidence: number }>;\n\t\t\t\t}>;\n\t\t\t}>;\n\t\t\tconst alt = channels?.[0]?.alternatives?.[0];\n\t\t\tconst text = alt?.transcript ?? \"\";\n\t\t\tconst result: TranscriptionResult = {\n\t\t\t\tid: this.generateId(),\n\t\t\t\tmodel: this.model,\n\t\t\t\ttext,\n\t\t\t};\n\t\t\tif (alt?.words && Array.isArray(alt.words)) {\n\t\t\t\tresult.words = alt.words.map((w) => ({\n\t\t\t\t\tword: w.word ?? \"\",\n\t\t\t\t\tstart: w.start ?? 0,\n\t\t\t\t\tend: w.end ?? 0,\n\t\t\t\t}));\n\t\t\t}\n\t\t\treturn result;\n\t\t}\n\n\t\t// Whisper format: { text, words?, vtt? }\n\t\t// Whisper v3-turbo format: { text, segments?, transcription_info? }\n\t\tconst result: TranscriptionResult = {\n\t\t\tid: this.generateId(),\n\t\t\tmodel: this.model,\n\t\t\ttext: (raw.text as string) ?? 
\"\",\n\t\t};\n\n\t\t// Language from transcription_info (whisper-large-v3-turbo)\n\t\tconst transcriptionInfo = raw.transcription_info as Record<string, unknown> | undefined;\n\t\tif (transcriptionInfo?.language) {\n\t\t\tresult.language = transcriptionInfo.language as string;\n\t\t}\n\n\t\t// Duration\n\t\tif (transcriptionInfo?.duration != null) {\n\t\t\tresult.duration = transcriptionInfo.duration as number;\n\t\t}\n\n\t\t// Segments (whisper-large-v3-turbo returns these)\n\t\tif (raw.segments && Array.isArray(raw.segments)) {\n\t\t\tresult.segments = raw.segments.map((seg: Record<string, unknown>, idx: number) => ({\n\t\t\t\tid: idx,\n\t\t\t\ttext: (seg.text as string) ?? \"\",\n\t\t\t\tstart: (seg.start as number) ?? 0,\n\t\t\t\tend: (seg.end as number) ?? 0,\n\t\t\t}));\n\t\t}\n\n\t\t// Words — basic whisper returns top-level words[], v3-turbo nests them in segments\n\t\tif (raw.words && Array.isArray(raw.words)) {\n\t\t\tresult.words = raw.words.map((w: Record<string, unknown>) => ({\n\t\t\t\tword: (w.word as string) ?? \"\",\n\t\t\t\tstart: (w.start as number) ?? 0,\n\t\t\t\tend: (w.end as number) ?? 
0,\n\t\t\t}));\n\t\t}\n\n\t\treturn result;\n\t}\n}\n\n// ---------------------------------------------------------------------------\n// Factory function\n// ---------------------------------------------------------------------------\n\n/**\n * Creates a Workers AI transcription adapter for speech-to-text.\n *\n * Works with TanStack AI's `generateTranscription()` activity function:\n * ```ts\n * import { generateTranscription } from \"@tanstack/ai\";\n * import { createWorkersAiTranscription } from \"@cloudflare/tanstack-ai\";\n *\n * const adapter = createWorkersAiTranscription(\n * \"@cf/openai/whisper-large-v3-turbo\",\n * { binding: env.AI },\n * );\n *\n * const result = await generateTranscription({ adapter, audio: audioData });\n * // result.text — the transcribed text\n * ```\n *\n * Note: Factory takes `(model, config)` for ergonomics — the class constructor\n * uses `(config, model)` to match TanStack AI's upstream convention.\n */\nexport function createWorkersAiTranscription(\n\tmodel: WorkersAiTranscriptionModel,\n\tconfig: WorkersAiAdapterConfig,\n) {\n\treturn new WorkersAiTranscriptionAdapter(config, model);\n}\n\n// ---------------------------------------------------------------------------\n// Utilities\n// ---------------------------------------------------------------------------\n\n/**\n * Normalize various audio input formats into a number[] (raw bytes).\n *\n * Note: `File extends Blob`, so `File` instances are handled by the\n * `instanceof Blob` branch. 
`Blob.arrayBuffer()` always reads the full\n * contents regardless of any prior reads — there's no cursor to worry about.\n */\nasync function normalizeAudioToBytes(audio: string | File | Blob | ArrayBuffer): Promise<number[]> {\n\tif (audio instanceof ArrayBuffer) {\n\t\treturn Array.from(new Uint8Array(audio));\n\t}\n\n\tif (audio instanceof Blob) {\n\t\t// This also handles `File` (which extends Blob)\n\t\tconst buffer = await audio.arrayBuffer();\n\t\treturn Array.from(new Uint8Array(buffer));\n\t}\n\n\tif (typeof audio === \"string\") {\n\t\t// Assume base64 string — decode to bytes\n\t\tconst binary = atob(audio);\n\t\tconst bytes = new Uint8Array(binary.length);\n\t\tfor (let i = 0; i < binary.length; i++) {\n\t\t\tbytes[i] = binary.charCodeAt(i);\n\t\t}\n\t\treturn Array.from(bytes);\n\t}\n\n\tthrow new Error(\"Unsupported audio format. Expected string, File, Blob, or ArrayBuffer.\");\n}\n\n/**\n * Detect the MIME type of the audio input for models that require it\n * (e.g., Deepgram Nova-3).\n *\n * - `File` / `Blob`: use the `.type` property (e.g., \"audio/wav\")\n * - `ArrayBuffer` / `string`: defaults to \"audio/wav\"\n */\nfunction detectAudioContentType(audio: string | File | Blob | ArrayBuffer): string {\n\t// File and Blob carry their own MIME type\n\tif (audio instanceof Blob && audio.type) {\n\t\treturn audio.type;\n\t}\n\n\t// For raw bytes, default to audio/wav — this is the most common\n\t// format for transcription inputs and what the E2E tests use.\n\treturn 
\"audio/wav\";\n}\n"],"mappings":";;;;;;AAyCA,IAAa,gCAAb,cAAmD,yBAAsD;CAIxG,YAAY,QAAgC,OAAoC;AAC/E,QAAM,EAAE,EAAE,MAAM;wBAJR,QAAO,2BAAoC;wBAC5C,iBAAA,KAAA,EAAsC;AAI7C,0BAAwB,OAAO;AAC/B,OAAK,gBAAgB;;CAGtB,MAAM,WAAW,SAA6D;EAC7E,MAAM,EAAE,OAAO,UAAU,QAAQ,iBAAiB;EAGlD,MAAM,aAAa,MAAM,sBAAsB,MAAM;EAErD,MAAM,QAAiC,EAAE,GAAG,cAAc;AAC1D,MAAI,SAAU,OAAM,WAAW;AAC/B,MAAI,OAAQ,OAAM,iBAAiB;EAOnC,MAAM,eAAe,KAAK,kBAAkB,YAAY,MAAM;AAE9D,MAAI,sBAAsB,KAAK,cAAc,CAC5C,QAAO,KAAK,qBAAqB,cAAc,MAAM;AAGtD,MAAI,0BAA0B,KAAK,cAAc,EAAE;AAElD,OAAI,KAAK,UAAU,sBAClB,QAAO,KAAK,wBAAwB,YAAY,OAAO,MAAM;AAE9D,UAAO,KAAK,kBAAkB,cAAc,MAAM;;AAGnD,SAAO,KAAK,qBAAqB,cAAc,MAAM;;;;;;;;;CAUtD,kBACC,YACA,eAC0B;AAC1B,MAAI,KAAK,UAAU,sBAGlB,QAAO,EAAE,OAAO;GAAE,MAFN,mBAAmB,IAAI,WAAW,WAAW,CAAC;GAE7B,aADT,uBAAuB,cAAc;GACf,EAAE;AAG7C,MAAI,KAAK,UAAU,oCAClB,QAAO,EAAE,OAAO,mBAAmB,IAAI,WAAW,WAAW,CAAC,EAAE;AAGjE,SAAO,EAAE,OAAO,YAAY;;CAG7B,MAAc,qBACb,cACA,SAC+B;EAE/B,MAAM,SAAU,MADJ,KAAK,cAA+C,QACvC,IAAI,KAAK,OAAO;GACxC,GAAG;GACH,GAAG;GACH,CAAC;AACF,SAAO,KAAK,gBAAgB,OAAO;;CAGpC,MAAc,kBACb,cACA,SAC+B;EAC/B,MAAM,SAAS,KAAK;EAYpB,MAAM,OAAQ,OAVG,MAAM,mBACtB,QACA,KAAK,OACL;GAAE,GAAG;GAAc,GAAG;GAAS,EAC/B;GACC,OAAO;GACP,QAAS,QAAqC;GAC9C,CACD,EAE4B,MAAM;AAMnC,SAAO,KAAK,gBAAgB,KAAK,UAAU,KAAK;;;;;;;CAQjD,MAAc,wBACb,YACA,eACA,SAC+B;EAC/B,MAAM,SAAS,KAAK;EACpB,MAAM,cAAc,uBAAuB,cAAc;EAazD,MAAM,OAAQ,OAXG,MAAM,yBACtB,QACA,KAAK,OACL,IAAI,WAAW,WAAW,EAC1B,aACA;GACC,OAAO;GACP,QAAS,QAAqC;GAC9C,CACD,EAE4B,MAAM;AAInC,SAAO,KAAK,gBAAgB,KAAK,UAAU,KAAK;;CAGjD,MAAc,qBACb,cACA,SAC+B;EAC/B,MAAM,gBAAgB,KAAK;EAM3B,MAAM,WAAW,MALI,mBAAmB,cAAc,cAAc,CAKhC,sDAAsD;GACzF,QAAQ;GACR,MAAM,KAAK,UAAU;IACpB,OAAO,KAAK;IACZ,GAAG;IACH,GAAG;IACH,CAAC;GACF,CAAC;AAEF,MAAI,CAAC,SAAS,IAAI;GACjB,MAAM,YAAY,MAAM,SAAS,MAAM;AACvC,SAAM,IAAI,MACT,oDAAoD,SAAS,OAAO,KAAK,YACzE;;EAGF,MAAM,OAAQ,MAAM,SAAS,MAAM;AACnC,SAAO,KAAK,gBAAgB,KAAK;;;;;;;;;;;CAYlC,gBAAwB,KAAmD;EAE1E,MAAM,UAAU,IAAI;AACpB,MAAI,SAAS,UAAU;GAQtB,MAAM,MAPW,QAAQ,WAOF,IAAI,eAAe;GAC1C,MAAM,OAAO,KAAK,cAAc;GAChC,MAAM,SAA8B;IACnC,IAAI,K
AAK,YAAY;IACrB,OAAO,KAAK;IACZ;IACA;AACD,OAAI,KAAK,SAAS,MAAM,QAAQ,IAAI,MAAM,CACzC,QAAO,QAAQ,IAAI,MAAM,KAAK,OAAO;IACpC,MAAM,EAAE,QAAQ;IAChB,OAAO,EAAE,SAAS;IAClB,KAAK,EAAE,OAAO;IACd,EAAE;AAEJ,UAAO;;EAKR,MAAM,SAA8B;GACnC,IAAI,KAAK,YAAY;GACrB,OAAO,KAAK;GACZ,MAAO,IAAI,QAAmB;GAC9B;EAGD,MAAM,oBAAoB,IAAI;AAC9B,MAAI,mBAAmB,SACtB,QAAO,WAAW,kBAAkB;AAIrC,MAAI,mBAAmB,YAAY,KAClC,QAAO,WAAW,kBAAkB;AAIrC,MAAI,IAAI,YAAY,MAAM,QAAQ,IAAI,SAAS,CAC9C,QAAO,WAAW,IAAI,SAAS,KAAK,KAA8B,SAAiB;GAClF,IAAI;GACJ,MAAO,IAAI,QAAmB;GAC9B,OAAQ,IAAI,SAAoB;GAChC,KAAM,IAAI,OAAkB;GAC5B,EAAE;AAIJ,MAAI,IAAI,SAAS,MAAM,QAAQ,IAAI,MAAM,CACxC,QAAO,QAAQ,IAAI,MAAM,KAAK,OAAgC;GAC7D,MAAO,EAAE,QAAmB;GAC5B,OAAQ,EAAE,SAAoB;GAC9B,KAAM,EAAE,OAAkB;GAC1B,EAAE;AAGJ,SAAO;;;;;;;;;;;;;;;;;;;;;;;AA4BT,SAAgB,6BACf,OACA,QACC;AACD,QAAO,IAAI,8BAA8B,QAAQ,MAAM;;;;;;;;;AAcxD,eAAe,sBAAsB,OAA8D;AAClG,KAAI,iBAAiB,YACpB,QAAO,MAAM,KAAK,IAAI,WAAW,MAAM,CAAC;AAGzC,KAAI,iBAAiB,MAAM;EAE1B,MAAM,SAAS,MAAM,MAAM,aAAa;AACxC,SAAO,MAAM,KAAK,IAAI,WAAW,OAAO,CAAC;;AAG1C,KAAI,OAAO,UAAU,UAAU;EAE9B,MAAM,SAAS,KAAK,MAAM;EAC1B,MAAM,QAAQ,IAAI,WAAW,OAAO,OAAO;AAC3C,OAAK,IAAI,IAAI,GAAG,IAAI,OAAO,QAAQ,IAClC,OAAM,KAAK,OAAO,WAAW,EAAE;AAEhC,SAAO,MAAM,KAAK,MAAM;;AAGzB,OAAM,IAAI,MAAM,yEAAyE;;;;;;;;;AAU1F,SAAS,uBAAuB,OAAmD;AAElF,KAAI,iBAAiB,QAAQ,MAAM,KAClC,QAAO,MAAM;AAKd,QAAO"}
|
|
@@ -1,13 +1,114 @@
|
|
|
1
|
-
|
|
1
|
+
Object.defineProperty(exports, Symbol.toStringTag, { value: "Module" });
|
|
2
|
+
require("../workers-ai-Bm7Up4or.cjs");
|
|
3
|
+
const require_create_fetcher = require("../create-fetcher-5iL34e6H.cjs");
|
|
4
|
+
const require_defineProperty = require("../defineProperty-DQoAg20E.cjs");
|
|
5
|
+
const require_workers_ai_rest = require("../workers-ai-rest-CkNCtBwv.cjs");
|
|
6
|
+
const require_binary = require("../binary-C9FAYwZj.cjs");
|
|
7
|
+
let _tanstack_ai_adapters = require("@tanstack/ai/adapters");
|
|
8
|
+
//#region src/adapters/workers-ai-tts.ts
|
|
9
|
+
var WorkersAiTTSAdapter = class extends _tanstack_ai_adapters.BaseTTSAdapter {
|
|
10
|
+
constructor(config, model) {
|
|
11
|
+
super({}, model);
|
|
12
|
+
require_defineProperty._defineProperty(this, "name", "workers-ai-tts");
|
|
13
|
+
require_defineProperty._defineProperty(this, "adapterConfig", void 0);
|
|
14
|
+
require_create_fetcher.validateWorkersAiConfig(config);
|
|
15
|
+
this.adapterConfig = config;
|
|
16
|
+
}
|
|
17
|
+
async generateSpeech(options) {
|
|
18
|
+
const { text, voice, format, speed, modelOptions } = options;
|
|
19
|
+
const extra = { ...modelOptions };
|
|
20
|
+
if (voice) extra.voice = voice;
|
|
21
|
+
if (speed != null) extra.speed = speed;
|
|
22
|
+
if (require_create_fetcher.isDirectBindingConfig(this.adapterConfig)) return this.generateViaBinding(text, format, extra);
|
|
23
|
+
if (require_create_fetcher.isDirectCredentialsConfig(this.adapterConfig)) return this.generateViaRest(text, format, extra);
|
|
24
|
+
return this.generateViaGateway(text, format, extra);
|
|
25
|
+
}
|
|
26
|
+
async generateViaBinding(text, format, options) {
|
|
27
|
+
const result = await this.adapterConfig.binding.run(this.model, {
|
|
28
|
+
text,
|
|
29
|
+
...options
|
|
30
|
+
});
|
|
31
|
+
return this.normalizeResult(result, format);
|
|
32
|
+
}
|
|
33
|
+
async generateViaRest(text, format, options) {
|
|
34
|
+
const config = this.adapterConfig;
|
|
35
|
+
const buffer = await (await require_workers_ai_rest.workersAiRestFetch(config, this.model, {
|
|
36
|
+
text,
|
|
37
|
+
...options
|
|
38
|
+
}, {
|
|
39
|
+
label: "Workers AI TTS",
|
|
40
|
+
signal: options.signal
|
|
41
|
+
})).arrayBuffer();
|
|
42
|
+
return this.wrapAudioResult(new Uint8Array(buffer), format);
|
|
43
|
+
}
|
|
44
|
+
async generateViaGateway(text, format, options) {
|
|
45
|
+
const gatewayConfig = this.adapterConfig;
|
|
46
|
+
const response = await require_create_fetcher.createGatewayFetch("workers-ai", gatewayConfig)("https://api.cloudflare.com/v1/audio/speech", {
|
|
47
|
+
method: "POST",
|
|
48
|
+
body: JSON.stringify({
|
|
49
|
+
model: this.model,
|
|
50
|
+
text,
|
|
51
|
+
...options
|
|
52
|
+
})
|
|
53
|
+
});
|
|
54
|
+
if (!response.ok) {
|
|
55
|
+
const errorText = await response.text();
|
|
56
|
+
throw new Error(`Workers AI TTS gateway request failed (${response.status}): ${errorText}`);
|
|
57
|
+
}
|
|
58
|
+
const buffer = await response.arrayBuffer();
|
|
59
|
+
return this.wrapAudioResult(new Uint8Array(buffer), format);
|
|
60
|
+
}
|
|
61
|
+
/**
|
|
62
|
+
* Normalize binding results. Workers AI TTS can return:
|
|
63
|
+
* - Uint8Array / ArrayBuffer (raw audio bytes)
|
|
64
|
+
* - ReadableStream<Uint8Array> (streamed audio bytes)
|
|
65
|
+
* - { audio: "base64..." } (JSON wrapper)
|
|
66
|
+
*/
|
|
67
|
+
async normalizeResult(result, format) {
|
|
68
|
+
const b64 = await require_binary.binaryToBase64(result, "audio");
|
|
69
|
+
return {
|
|
70
|
+
id: this.generateId(),
|
|
71
|
+
model: this.model,
|
|
72
|
+
audio: b64,
|
|
73
|
+
format: format ?? "mp3",
|
|
74
|
+
contentType: `audio/${format ?? "mp3"}`
|
|
75
|
+
};
|
|
76
|
+
}
|
|
77
|
+
wrapAudioResult(bytes, format) {
|
|
78
|
+
return {
|
|
79
|
+
id: this.generateId(),
|
|
80
|
+
model: this.model,
|
|
81
|
+
audio: require_binary.uint8ArrayToBase64(bytes),
|
|
82
|
+
format: format ?? "mp3",
|
|
83
|
+
contentType: `audio/${format ?? "mp3"}`
|
|
84
|
+
};
|
|
85
|
+
}
|
|
86
|
+
};
|
|
87
|
+
/**
|
|
88
|
+
* Creates a Workers AI text-to-speech adapter.
|
|
89
|
+
*
|
|
90
|
+
* Works with TanStack AI's `generateSpeech()` activity function:
|
|
91
|
+
* ```ts
|
|
92
|
+
* import { generateSpeech } from "@tanstack/ai";
|
|
93
|
+
* import { createWorkersAiTts } from "@cloudflare/tanstack-ai";
|
|
94
|
+
*
|
|
95
|
+
* const adapter = createWorkersAiTts(
|
|
96
|
+
* "@cf/deepgram/aura-1",
|
|
97
|
+
* { binding: env.AI },
|
|
98
|
+
* );
|
|
99
|
+
*
|
|
100
|
+
* const result = await generateSpeech({ adapter, text: "Hello world" });
|
|
101
|
+
* // result.audio — base64-encoded audio
|
|
102
|
+
* ```
|
|
103
|
+
*
|
|
104
|
+
* Note: Factory takes `(model, config)` for ergonomics — the class constructor
|
|
105
|
+
* uses `(config, model)` to match TanStack AI's upstream convention.
|
|
106
|
+
*/
|
|
107
|
+
function createWorkersAiTts(model, config) {
|
|
108
|
+
return new WorkersAiTTSAdapter(config, model);
|
|
109
|
+
}
|
|
110
|
+
//#endregion
|
|
111
|
+
exports.WorkersAiTTSAdapter = WorkersAiTTSAdapter;
|
|
112
|
+
exports.createWorkersAiTts = createWorkersAiTts;
|
|
2
113
|
|
|
3
|
-
|
|
4
|
-
var _chunkN6U27RQWcjs = require('../chunk-N6U27RQW.cjs');
|
|
5
|
-
require('../chunk-3VQDXJLW.cjs');
|
|
6
|
-
require('../chunk-7HSUHP63.cjs');
|
|
7
|
-
require('../chunk-WBTQKWFN.cjs');
|
|
8
|
-
require('../chunk-4DE2IREA.cjs');
|
|
9
|
-
|
|
10
|
-
|
|
11
|
-
|
|
12
|
-
exports.WorkersAiTTSAdapter = _chunkN6U27RQWcjs.WorkersAiTTSAdapter; exports.createWorkersAiTts = _chunkN6U27RQWcjs.createWorkersAiTts;
|
|
13
114
|
//# sourceMappingURL=workers-ai-tts.cjs.map
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"sources":["/
|
|
1
|
+
{"version":3,"file":"workers-ai-tts.cjs","names":["BaseTTSAdapter","isDirectBindingConfig","isDirectCredentialsConfig","workersAiRestFetch","createGatewayFetch","binaryToBase64","uint8ArrayToBase64"],"sources":["../../src/adapters/workers-ai-tts.ts"],"sourcesContent":["import { BaseTTSAdapter } from \"@tanstack/ai/adapters\";\nimport type { TTSOptions, TTSResult } from \"@tanstack/ai\";\nimport {\n\ttype WorkersAiAdapterConfig,\n\ttype WorkersAiDirectBindingConfig,\n\ttype WorkersAiDirectCredentialsConfig,\n\ttype AiGatewayAdapterConfig,\n\tcreateGatewayFetch,\n\tisDirectBindingConfig,\n\tisDirectCredentialsConfig,\n\tvalidateWorkersAiConfig,\n} from \"../utils/create-fetcher\";\nimport { workersAiRestFetch } from \"../utils/workers-ai-rest\";\nimport { binaryToBase64, uint8ArrayToBase64 } from \"../utils/binary\";\n\n// ---------------------------------------------------------------------------\n// Model types\n// ---------------------------------------------------------------------------\n\n/**\n * Workers AI models that support text-to-speech generation.\n *\n * Note: the typed `AiModels` interface in `@cloudflare/workers-types` may lag\n * behind what's deployed. 
We use a string union here that matches the known\n * models including Deepgram partner models.\n */\nexport type WorkersAiTTSModel =\n\t| \"@cf/deepgram/aura-1\"\n\t| \"@cf/deepgram/aura-2-en\"\n\t| \"@cf/deepgram/aura-2-es\"\n\t| (string & {});\n\n// ---------------------------------------------------------------------------\n// WorkersAiTTSAdapter\n// ---------------------------------------------------------------------------\n\nexport class WorkersAiTTSAdapter extends BaseTTSAdapter<WorkersAiTTSModel> {\n\treadonly name = \"workers-ai-tts\" as const;\n\tprivate adapterConfig: WorkersAiAdapterConfig;\n\n\tconstructor(config: WorkersAiAdapterConfig, model: WorkersAiTTSModel) {\n\t\tsuper({}, model);\n\t\tvalidateWorkersAiConfig(config);\n\t\tthis.adapterConfig = config;\n\t}\n\n\tasync generateSpeech(options: TTSOptions): Promise<TTSResult> {\n\t\tconst { text, voice, format, speed, modelOptions } = options;\n\n\t\t// Workers AI TTS models (Deepgram aura-1) accept { text, lang? }\n\t\tconst extra: Record<string, unknown> = { ...modelOptions };\n\t\tif (voice) extra.voice = voice;\n\t\tif (speed != null) extra.speed = speed;\n\n\t\tif (isDirectBindingConfig(this.adapterConfig)) {\n\t\t\treturn this.generateViaBinding(text, format, extra);\n\t\t}\n\n\t\tif (isDirectCredentialsConfig(this.adapterConfig)) {\n\t\t\treturn this.generateViaRest(text, format, extra);\n\t\t}\n\n\t\treturn this.generateViaGateway(text, format, extra);\n\t}\n\n\tprivate async generateViaBinding(\n\t\ttext: string,\n\t\tformat: string | undefined,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TTSResult> {\n\t\tconst ai = (this.adapterConfig as WorkersAiDirectBindingConfig).binding;\n\t\tconst result = await ai.run(this.model, { text, ...options });\n\n\t\treturn this.normalizeResult(result, format);\n\t}\n\n\tprivate async generateViaRest(\n\t\ttext: string,\n\t\tformat: string | undefined,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TTSResult> {\n\t\tconst config = 
this.adapterConfig as WorkersAiDirectCredentialsConfig;\n\t\tconst response = await workersAiRestFetch(\n\t\t\tconfig,\n\t\t\tthis.model,\n\t\t\t{ text, ...options },\n\t\t\t{ label: \"Workers AI TTS\", signal: (options as { signal?: AbortSignal }).signal },\n\t\t);\n\n\t\t// Workers AI TTS returns audio bytes directly\n\t\tconst buffer = await response.arrayBuffer();\n\t\treturn this.wrapAudioResult(new Uint8Array(buffer), format);\n\t}\n\n\tprivate async generateViaGateway(\n\t\ttext: string,\n\t\tformat: string | undefined,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TTSResult> {\n\t\tconst gatewayConfig = this.adapterConfig as AiGatewayAdapterConfig;\n\t\tconst gatewayFetch = createGatewayFetch(\"workers-ai\", gatewayConfig);\n\n\t\t// The URL here is a placeholder — createGatewayFetch for \"workers-ai\" extracts\n\t\t// the model from the body, sets it as the endpoint, and routes through the gateway.\n\t\t// The actual URL path is not used.\n\t\tconst response = await gatewayFetch(\"https://api.cloudflare.com/v1/audio/speech\", {\n\t\t\tmethod: \"POST\",\n\t\t\tbody: JSON.stringify({\n\t\t\t\tmodel: this.model,\n\t\t\t\ttext,\n\t\t\t\t...options,\n\t\t\t}),\n\t\t});\n\n\t\tif (!response.ok) {\n\t\t\tconst errorText = await response.text();\n\t\t\tthrow new Error(\n\t\t\t\t`Workers AI TTS gateway request failed (${response.status}): ${errorText}`,\n\t\t\t);\n\t\t}\n\n\t\tconst buffer = await response.arrayBuffer();\n\t\treturn this.wrapAudioResult(new Uint8Array(buffer), format);\n\t}\n\n\t/**\n\t * Normalize binding results. 
Workers AI TTS can return:\n\t * - Uint8Array / ArrayBuffer (raw audio bytes)\n\t * - ReadableStream<Uint8Array> (streamed audio bytes)\n\t * - { audio: \"base64...\" } (JSON wrapper)\n\t */\n\tprivate async normalizeResult(result: unknown, format: string | undefined): Promise<TTSResult> {\n\t\t// Use the shared binaryToBase64 helper for Uint8Array/ArrayBuffer/ReadableStream\n\t\t// and { audio: \"base64...\" } JSON wrapper\n\t\tconst b64 = await binaryToBase64(result, \"audio\");\n\t\treturn {\n\t\t\tid: this.generateId(),\n\t\t\tmodel: this.model,\n\t\t\taudio: b64,\n\t\t\tformat: format ?? \"mp3\",\n\t\t\tcontentType: `audio/${format ?? \"mp3\"}`,\n\t\t};\n\t}\n\n\tprivate wrapAudioResult(bytes: Uint8Array, format: string | undefined): TTSResult {\n\t\treturn {\n\t\t\tid: this.generateId(),\n\t\t\tmodel: this.model,\n\t\t\taudio: uint8ArrayToBase64(bytes),\n\t\t\tformat: format ?? \"mp3\",\n\t\t\tcontentType: `audio/${format ?? \"mp3\"}`,\n\t\t};\n\t}\n}\n\n// ---------------------------------------------------------------------------\n// Factory function\n// ---------------------------------------------------------------------------\n\n/**\n * Creates a Workers AI text-to-speech adapter.\n *\n * Works with TanStack AI's `generateSpeech()` activity function:\n * ```ts\n * import { generateSpeech } from \"@tanstack/ai\";\n * import { createWorkersAiTts } from \"@cloudflare/tanstack-ai\";\n *\n * const adapter = createWorkersAiTts(\n * \"@cf/deepgram/aura-1\",\n * { binding: env.AI },\n * );\n *\n * const result = await generateSpeech({ adapter, text: \"Hello world\" });\n * // result.audio — base64-encoded audio\n * ```\n *\n * Note: Factory takes `(model, config)` for ergonomics — the class constructor\n * uses `(config, model)` to match TanStack AI's upstream convention.\n */\nexport function createWorkersAiTts(model: WorkersAiTTSModel, config: WorkersAiAdapterConfig) {\n\treturn new WorkersAiTTSAdapter(config, 
model);\n}\n"],"mappings":";;;;;;;;AAoCA,IAAa,sBAAb,cAAyCA,sBAAAA,eAAkC;CAI1E,YAAY,QAAgC,OAA0B;AACrE,QAAM,EAAE,EAAE,MAAM;+CAJR,QAAO,iBAA0B;+CAClC,iBAAA,KAAA,EAAsC;AAI7C,yBAAA,wBAAwB,OAAO;AAC/B,OAAK,gBAAgB;;CAGtB,MAAM,eAAe,SAAyC;EAC7D,MAAM,EAAE,MAAM,OAAO,QAAQ,OAAO,iBAAiB;EAGrD,MAAM,QAAiC,EAAE,GAAG,cAAc;AAC1D,MAAI,MAAO,OAAM,QAAQ;AACzB,MAAI,SAAS,KAAM,OAAM,QAAQ;AAEjC,MAAIC,uBAAAA,sBAAsB,KAAK,cAAc,CAC5C,QAAO,KAAK,mBAAmB,MAAM,QAAQ,MAAM;AAGpD,MAAIC,uBAAAA,0BAA0B,KAAK,cAAc,CAChD,QAAO,KAAK,gBAAgB,MAAM,QAAQ,MAAM;AAGjD,SAAO,KAAK,mBAAmB,MAAM,QAAQ,MAAM;;CAGpD,MAAc,mBACb,MACA,QACA,SACqB;EAErB,MAAM,SAAS,MADH,KAAK,cAA+C,QACxC,IAAI,KAAK,OAAO;GAAE;GAAM,GAAG;GAAS,CAAC;AAE7D,SAAO,KAAK,gBAAgB,QAAQ,OAAO;;CAG5C,MAAc,gBACb,MACA,QACA,SACqB;EACrB,MAAM,SAAS,KAAK;EASpB,MAAM,SAAS,OARE,MAAMC,wBAAAA,mBACtB,QACA,KAAK,OACL;GAAE;GAAM,GAAG;GAAS,EACpB;GAAE,OAAO;GAAkB,QAAS,QAAqC;GAAQ,CACjF,EAG6B,aAAa;AAC3C,SAAO,KAAK,gBAAgB,IAAI,WAAW,OAAO,EAAE,OAAO;;CAG5D,MAAc,mBACb,MACA,QACA,SACqB;EACrB,MAAM,gBAAgB,KAAK;EAM3B,MAAM,WAAW,MALIC,uBAAAA,mBAAmB,cAAc,cAAc,CAKhC,8CAA8C;GACjF,QAAQ;GACR,MAAM,KAAK,UAAU;IACpB,OAAO,KAAK;IACZ;IACA,GAAG;IACH,CAAC;GACF,CAAC;AAEF,MAAI,CAAC,SAAS,IAAI;GACjB,MAAM,YAAY,MAAM,SAAS,MAAM;AACvC,SAAM,IAAI,MACT,0CAA0C,SAAS,OAAO,KAAK,YAC/D;;EAGF,MAAM,SAAS,MAAM,SAAS,aAAa;AAC3C,SAAO,KAAK,gBAAgB,IAAI,WAAW,OAAO,EAAE,OAAO;;;;;;;;CAS5D,MAAc,gBAAgB,QAAiB,QAAgD;EAG9F,MAAM,MAAM,MAAMC,eAAAA,eAAe,QAAQ,QAAQ;AACjD,SAAO;GACN,IAAI,KAAK,YAAY;GACrB,OAAO,KAAK;GACZ,OAAO;GACP,QAAQ,UAAU;GAClB,aAAa,SAAS,UAAU;GAChC;;CAGF,gBAAwB,OAAmB,QAAuC;AACjF,SAAO;GACN,IAAI,KAAK,YAAY;GACrB,OAAO,KAAK;GACZ,OAAOC,eAAAA,mBAAmB,MAAM;GAChC,QAAQ,UAAU;GAClB,aAAa,SAAS,UAAU;GAChC;;;;;;;;;;;;;;;;;;;;;;;AA4BH,SAAgB,mBAAmB,OAA0B,QAAgC;AAC5F,QAAO,IAAI,oBAAoB,QAAQ,MAAM"}
|
|
@@ -1,3 +1,54 @@
|
|
|
1
|
-
|
|
2
|
-
|
|
3
|
-
|
|
1
|
+
import { i as WorkersAiAdapterConfig } from "../create-fetcher-vAQ8WW-p.cjs";
|
|
2
|
+
import { TTSOptions, TTSResult } from "@tanstack/ai";
|
|
3
|
+
import { BaseTTSAdapter } from "@tanstack/ai/adapters";
|
|
4
|
+
|
|
5
|
+
//#region src/adapters/workers-ai-tts.d.ts
|
|
6
|
+
/**
|
|
7
|
+
* Workers AI models that support text-to-speech generation.
|
|
8
|
+
*
|
|
9
|
+
* Note: the typed `AiModels` interface in `@cloudflare/workers-types` may lag
|
|
10
|
+
* behind what's deployed. We use a string union here that matches the known
|
|
11
|
+
* models including Deepgram partner models.
|
|
12
|
+
*/
|
|
13
|
+
type WorkersAiTTSModel = "@cf/deepgram/aura-1" | "@cf/deepgram/aura-2-en" | "@cf/deepgram/aura-2-es" | (string & {});
|
|
14
|
+
declare class WorkersAiTTSAdapter extends BaseTTSAdapter<WorkersAiTTSModel> {
|
|
15
|
+
readonly name: "workers-ai-tts";
|
|
16
|
+
private adapterConfig;
|
|
17
|
+
constructor(config: WorkersAiAdapterConfig, model: WorkersAiTTSModel);
|
|
18
|
+
generateSpeech(options: TTSOptions): Promise<TTSResult>;
|
|
19
|
+
private generateViaBinding;
|
|
20
|
+
private generateViaRest;
|
|
21
|
+
private generateViaGateway;
|
|
22
|
+
/**
|
|
23
|
+
* Normalize binding results. Workers AI TTS can return:
|
|
24
|
+
* - Uint8Array / ArrayBuffer (raw audio bytes)
|
|
25
|
+
* - ReadableStream<Uint8Array> (streamed audio bytes)
|
|
26
|
+
* - { audio: "base64..." } (JSON wrapper)
|
|
27
|
+
*/
|
|
28
|
+
private normalizeResult;
|
|
29
|
+
private wrapAudioResult;
|
|
30
|
+
}
|
|
31
|
+
/**
|
|
32
|
+
* Creates a Workers AI text-to-speech adapter.
|
|
33
|
+
*
|
|
34
|
+
* Works with TanStack AI's `generateSpeech()` activity function:
|
|
35
|
+
* ```ts
|
|
36
|
+
* import { generateSpeech } from "@tanstack/ai";
|
|
37
|
+
* import { createWorkersAiTts } from "@cloudflare/tanstack-ai";
|
|
38
|
+
*
|
|
39
|
+
* const adapter = createWorkersAiTts(
|
|
40
|
+
* "@cf/deepgram/aura-1",
|
|
41
|
+
* { binding: env.AI },
|
|
42
|
+
* );
|
|
43
|
+
*
|
|
44
|
+
* const result = await generateSpeech({ adapter, text: "Hello world" });
|
|
45
|
+
* // result.audio — base64-encoded audio
|
|
46
|
+
* ```
|
|
47
|
+
*
|
|
48
|
+
* Note: Factory takes `(model, config)` for ergonomics — the class constructor
|
|
49
|
+
* uses `(config, model)` to match TanStack AI's upstream convention.
|
|
50
|
+
*/
|
|
51
|
+
declare function createWorkersAiTts(model: WorkersAiTTSModel, config: WorkersAiAdapterConfig): WorkersAiTTSAdapter;
|
|
52
|
+
//#endregion
|
|
53
|
+
export { WorkersAiTTSAdapter, WorkersAiTTSModel, createWorkersAiTts };
|
|
54
|
+
//# sourceMappingURL=workers-ai-tts.d.cts.map
|
|
@@ -0,0 +1,54 @@
|
|
|
1
|
+
import { i as WorkersAiAdapterConfig } from "../create-fetcher-6p6heb85.mjs";
|
|
2
|
+
import { BaseTTSAdapter } from "@tanstack/ai/adapters";
|
|
3
|
+
import { TTSOptions, TTSResult } from "@tanstack/ai";
|
|
4
|
+
|
|
5
|
+
//#region src/adapters/workers-ai-tts.d.ts
|
|
6
|
+
/**
|
|
7
|
+
* Workers AI models that support text-to-speech generation.
|
|
8
|
+
*
|
|
9
|
+
* Note: the typed `AiModels` interface in `@cloudflare/workers-types` may lag
|
|
10
|
+
* behind what's deployed. We use a string union here that matches the known
|
|
11
|
+
* models including Deepgram partner models.
|
|
12
|
+
*/
|
|
13
|
+
type WorkersAiTTSModel = "@cf/deepgram/aura-1" | "@cf/deepgram/aura-2-en" | "@cf/deepgram/aura-2-es" | (string & {});
|
|
14
|
+
declare class WorkersAiTTSAdapter extends BaseTTSAdapter<WorkersAiTTSModel> {
|
|
15
|
+
readonly name: "workers-ai-tts";
|
|
16
|
+
private adapterConfig;
|
|
17
|
+
constructor(config: WorkersAiAdapterConfig, model: WorkersAiTTSModel);
|
|
18
|
+
generateSpeech(options: TTSOptions): Promise<TTSResult>;
|
|
19
|
+
private generateViaBinding;
|
|
20
|
+
private generateViaRest;
|
|
21
|
+
private generateViaGateway;
|
|
22
|
+
/**
|
|
23
|
+
* Normalize binding results. Workers AI TTS can return:
|
|
24
|
+
* - Uint8Array / ArrayBuffer (raw audio bytes)
|
|
25
|
+
* - ReadableStream<Uint8Array> (streamed audio bytes)
|
|
26
|
+
* - { audio: "base64..." } (JSON wrapper)
|
|
27
|
+
*/
|
|
28
|
+
private normalizeResult;
|
|
29
|
+
private wrapAudioResult;
|
|
30
|
+
}
|
|
31
|
+
/**
|
|
32
|
+
* Creates a Workers AI text-to-speech adapter.
|
|
33
|
+
*
|
|
34
|
+
* Works with TanStack AI's `generateSpeech()` activity function:
|
|
35
|
+
* ```ts
|
|
36
|
+
* import { generateSpeech } from "@tanstack/ai";
|
|
37
|
+
* import { createWorkersAiTts } from "@cloudflare/tanstack-ai";
|
|
38
|
+
*
|
|
39
|
+
* const adapter = createWorkersAiTts(
|
|
40
|
+
* "@cf/deepgram/aura-1",
|
|
41
|
+
* { binding: env.AI },
|
|
42
|
+
* );
|
|
43
|
+
*
|
|
44
|
+
* const result = await generateSpeech({ adapter, text: "Hello world" });
|
|
45
|
+
* // result.audio — base64-encoded audio
|
|
46
|
+
* ```
|
|
47
|
+
*
|
|
48
|
+
* Note: Factory takes `(model, config)` for ergonomics — the class constructor
|
|
49
|
+
* uses `(config, model)` to match TanStack AI's upstream convention.
|
|
50
|
+
*/
|
|
51
|
+
declare function createWorkersAiTts(model: WorkersAiTTSModel, config: WorkersAiAdapterConfig): WorkersAiTTSAdapter;
|
|
52
|
+
//#endregion
|
|
53
|
+
export { WorkersAiTTSAdapter, WorkersAiTTSModel, createWorkersAiTts };
|
|
54
|
+
//# sourceMappingURL=workers-ai-tts.d.mts.map
|
|
@@ -0,0 +1,111 @@
|
|
|
1
|
+
import { a as validateWorkersAiConfig, i as isDirectCredentialsConfig, r as isDirectBindingConfig, t as createGatewayFetch } from "../create-fetcher-DY7wfYYy.mjs";
|
|
2
|
+
import { t as _defineProperty } from "../defineProperty-CbyrzcbA.mjs";
|
|
3
|
+
import { t as workersAiRestFetch } from "../workers-ai-rest-GKy2r7eG.mjs";
|
|
4
|
+
import { n as uint8ArrayToBase64, t as binaryToBase64 } from "../binary-p4H_N_3M.mjs";
|
|
5
|
+
import { BaseTTSAdapter } from "@tanstack/ai/adapters";
|
|
6
|
+
//#region src/adapters/workers-ai-tts.ts
|
|
7
|
+
var WorkersAiTTSAdapter = class extends BaseTTSAdapter {
|
|
8
|
+
constructor(config, model) {
|
|
9
|
+
super({}, model);
|
|
10
|
+
_defineProperty(this, "name", "workers-ai-tts");
|
|
11
|
+
_defineProperty(this, "adapterConfig", void 0);
|
|
12
|
+
validateWorkersAiConfig(config);
|
|
13
|
+
this.adapterConfig = config;
|
|
14
|
+
}
|
|
15
|
+
async generateSpeech(options) {
|
|
16
|
+
const { text, voice, format, speed, modelOptions } = options;
|
|
17
|
+
const extra = { ...modelOptions };
|
|
18
|
+
if (voice) extra.voice = voice;
|
|
19
|
+
if (speed != null) extra.speed = speed;
|
|
20
|
+
if (isDirectBindingConfig(this.adapterConfig)) return this.generateViaBinding(text, format, extra);
|
|
21
|
+
if (isDirectCredentialsConfig(this.adapterConfig)) return this.generateViaRest(text, format, extra);
|
|
22
|
+
return this.generateViaGateway(text, format, extra);
|
|
23
|
+
}
|
|
24
|
+
async generateViaBinding(text, format, options) {
|
|
25
|
+
const result = await this.adapterConfig.binding.run(this.model, {
|
|
26
|
+
text,
|
|
27
|
+
...options
|
|
28
|
+
});
|
|
29
|
+
return this.normalizeResult(result, format);
|
|
30
|
+
}
|
|
31
|
+
async generateViaRest(text, format, options) {
|
|
32
|
+
const config = this.adapterConfig;
|
|
33
|
+
const buffer = await (await workersAiRestFetch(config, this.model, {
|
|
34
|
+
text,
|
|
35
|
+
...options
|
|
36
|
+
}, {
|
|
37
|
+
label: "Workers AI TTS",
|
|
38
|
+
signal: options.signal
|
|
39
|
+
})).arrayBuffer();
|
|
40
|
+
return this.wrapAudioResult(new Uint8Array(buffer), format);
|
|
41
|
+
}
|
|
42
|
+
async generateViaGateway(text, format, options) {
|
|
43
|
+
const gatewayConfig = this.adapterConfig;
|
|
44
|
+
const response = await createGatewayFetch("workers-ai", gatewayConfig)("https://api.cloudflare.com/v1/audio/speech", {
|
|
45
|
+
method: "POST",
|
|
46
|
+
body: JSON.stringify({
|
|
47
|
+
model: this.model,
|
|
48
|
+
text,
|
|
49
|
+
...options
|
|
50
|
+
})
|
|
51
|
+
});
|
|
52
|
+
if (!response.ok) {
|
|
53
|
+
const errorText = await response.text();
|
|
54
|
+
throw new Error(`Workers AI TTS gateway request failed (${response.status}): ${errorText}`);
|
|
55
|
+
}
|
|
56
|
+
const buffer = await response.arrayBuffer();
|
|
57
|
+
return this.wrapAudioResult(new Uint8Array(buffer), format);
|
|
58
|
+
}
|
|
59
|
+
/**
|
|
60
|
+
* Normalize binding results. Workers AI TTS can return:
|
|
61
|
+
* - Uint8Array / ArrayBuffer (raw audio bytes)
|
|
62
|
+
* - ReadableStream<Uint8Array> (streamed audio bytes)
|
|
63
|
+
* - { audio: "base64..." } (JSON wrapper)
|
|
64
|
+
*/
|
|
65
|
+
async normalizeResult(result, format) {
|
|
66
|
+
const b64 = await binaryToBase64(result, "audio");
|
|
67
|
+
return {
|
|
68
|
+
id: this.generateId(),
|
|
69
|
+
model: this.model,
|
|
70
|
+
audio: b64,
|
|
71
|
+
format: format ?? "mp3",
|
|
72
|
+
contentType: `audio/${format ?? "mp3"}`
|
|
73
|
+
};
|
|
74
|
+
}
|
|
75
|
+
wrapAudioResult(bytes, format) {
|
|
76
|
+
return {
|
|
77
|
+
id: this.generateId(),
|
|
78
|
+
model: this.model,
|
|
79
|
+
audio: uint8ArrayToBase64(bytes),
|
|
80
|
+
format: format ?? "mp3",
|
|
81
|
+
contentType: `audio/${format ?? "mp3"}`
|
|
82
|
+
};
|
|
83
|
+
}
|
|
84
|
+
};
|
|
85
|
+
/**
|
|
86
|
+
* Creates a Workers AI text-to-speech adapter.
|
|
87
|
+
*
|
|
88
|
+
* Works with TanStack AI's `generateSpeech()` activity function:
|
|
89
|
+
* ```ts
|
|
90
|
+
* import { generateSpeech } from "@tanstack/ai";
|
|
91
|
+
* import { createWorkersAiTts } from "@cloudflare/tanstack-ai";
|
|
92
|
+
*
|
|
93
|
+
* const adapter = createWorkersAiTts(
|
|
94
|
+
* "@cf/deepgram/aura-1",
|
|
95
|
+
* { binding: env.AI },
|
|
96
|
+
* );
|
|
97
|
+
*
|
|
98
|
+
* const result = await generateSpeech({ adapter, text: "Hello world" });
|
|
99
|
+
* // result.audio — base64-encoded audio
|
|
100
|
+
* ```
|
|
101
|
+
*
|
|
102
|
+
* Note: Factory takes `(model, config)` for ergonomics — the class constructor
|
|
103
|
+
* uses `(config, model)` to match TanStack AI's upstream convention.
|
|
104
|
+
*/
|
|
105
|
+
function createWorkersAiTts(model, config) {
|
|
106
|
+
return new WorkersAiTTSAdapter(config, model);
|
|
107
|
+
}
|
|
108
|
+
//#endregion
|
|
109
|
+
export { WorkersAiTTSAdapter, createWorkersAiTts };
|
|
110
|
+
|
|
111
|
+
//# sourceMappingURL=workers-ai-tts.mjs.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"workers-ai-tts.mjs","names":[],"sources":["../../src/adapters/workers-ai-tts.ts"],"sourcesContent":["import { BaseTTSAdapter } from \"@tanstack/ai/adapters\";\nimport type { TTSOptions, TTSResult } from \"@tanstack/ai\";\nimport {\n\ttype WorkersAiAdapterConfig,\n\ttype WorkersAiDirectBindingConfig,\n\ttype WorkersAiDirectCredentialsConfig,\n\ttype AiGatewayAdapterConfig,\n\tcreateGatewayFetch,\n\tisDirectBindingConfig,\n\tisDirectCredentialsConfig,\n\tvalidateWorkersAiConfig,\n} from \"../utils/create-fetcher\";\nimport { workersAiRestFetch } from \"../utils/workers-ai-rest\";\nimport { binaryToBase64, uint8ArrayToBase64 } from \"../utils/binary\";\n\n// ---------------------------------------------------------------------------\n// Model types\n// ---------------------------------------------------------------------------\n\n/**\n * Workers AI models that support text-to-speech generation.\n *\n * Note: the typed `AiModels` interface in `@cloudflare/workers-types` may lag\n * behind what's deployed. 
We use a string union here that matches the known\n * models including Deepgram partner models.\n */\nexport type WorkersAiTTSModel =\n\t| \"@cf/deepgram/aura-1\"\n\t| \"@cf/deepgram/aura-2-en\"\n\t| \"@cf/deepgram/aura-2-es\"\n\t| (string & {});\n\n// ---------------------------------------------------------------------------\n// WorkersAiTTSAdapter\n// ---------------------------------------------------------------------------\n\nexport class WorkersAiTTSAdapter extends BaseTTSAdapter<WorkersAiTTSModel> {\n\treadonly name = \"workers-ai-tts\" as const;\n\tprivate adapterConfig: WorkersAiAdapterConfig;\n\n\tconstructor(config: WorkersAiAdapterConfig, model: WorkersAiTTSModel) {\n\t\tsuper({}, model);\n\t\tvalidateWorkersAiConfig(config);\n\t\tthis.adapterConfig = config;\n\t}\n\n\tasync generateSpeech(options: TTSOptions): Promise<TTSResult> {\n\t\tconst { text, voice, format, speed, modelOptions } = options;\n\n\t\t// Workers AI TTS models (Deepgram aura-1) accept { text, lang? }\n\t\tconst extra: Record<string, unknown> = { ...modelOptions };\n\t\tif (voice) extra.voice = voice;\n\t\tif (speed != null) extra.speed = speed;\n\n\t\tif (isDirectBindingConfig(this.adapterConfig)) {\n\t\t\treturn this.generateViaBinding(text, format, extra);\n\t\t}\n\n\t\tif (isDirectCredentialsConfig(this.adapterConfig)) {\n\t\t\treturn this.generateViaRest(text, format, extra);\n\t\t}\n\n\t\treturn this.generateViaGateway(text, format, extra);\n\t}\n\n\tprivate async generateViaBinding(\n\t\ttext: string,\n\t\tformat: string | undefined,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TTSResult> {\n\t\tconst ai = (this.adapterConfig as WorkersAiDirectBindingConfig).binding;\n\t\tconst result = await ai.run(this.model, { text, ...options });\n\n\t\treturn this.normalizeResult(result, format);\n\t}\n\n\tprivate async generateViaRest(\n\t\ttext: string,\n\t\tformat: string | undefined,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TTSResult> {\n\t\tconst config = 
this.adapterConfig as WorkersAiDirectCredentialsConfig;\n\t\tconst response = await workersAiRestFetch(\n\t\t\tconfig,\n\t\t\tthis.model,\n\t\t\t{ text, ...options },\n\t\t\t{ label: \"Workers AI TTS\", signal: (options as { signal?: AbortSignal }).signal },\n\t\t);\n\n\t\t// Workers AI TTS returns audio bytes directly\n\t\tconst buffer = await response.arrayBuffer();\n\t\treturn this.wrapAudioResult(new Uint8Array(buffer), format);\n\t}\n\n\tprivate async generateViaGateway(\n\t\ttext: string,\n\t\tformat: string | undefined,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TTSResult> {\n\t\tconst gatewayConfig = this.adapterConfig as AiGatewayAdapterConfig;\n\t\tconst gatewayFetch = createGatewayFetch(\"workers-ai\", gatewayConfig);\n\n\t\t// The URL here is a placeholder — createGatewayFetch for \"workers-ai\" extracts\n\t\t// the model from the body, sets it as the endpoint, and routes through the gateway.\n\t\t// The actual URL path is not used.\n\t\tconst response = await gatewayFetch(\"https://api.cloudflare.com/v1/audio/speech\", {\n\t\t\tmethod: \"POST\",\n\t\t\tbody: JSON.stringify({\n\t\t\t\tmodel: this.model,\n\t\t\t\ttext,\n\t\t\t\t...options,\n\t\t\t}),\n\t\t});\n\n\t\tif (!response.ok) {\n\t\t\tconst errorText = await response.text();\n\t\t\tthrow new Error(\n\t\t\t\t`Workers AI TTS gateway request failed (${response.status}): ${errorText}`,\n\t\t\t);\n\t\t}\n\n\t\tconst buffer = await response.arrayBuffer();\n\t\treturn this.wrapAudioResult(new Uint8Array(buffer), format);\n\t}\n\n\t/**\n\t * Normalize binding results. 
Workers AI TTS can return:\n\t * - Uint8Array / ArrayBuffer (raw audio bytes)\n\t * - ReadableStream<Uint8Array> (streamed audio bytes)\n\t * - { audio: \"base64...\" } (JSON wrapper)\n\t */\n\tprivate async normalizeResult(result: unknown, format: string | undefined): Promise<TTSResult> {\n\t\t// Use the shared binaryToBase64 helper for Uint8Array/ArrayBuffer/ReadableStream\n\t\t// and { audio: \"base64...\" } JSON wrapper\n\t\tconst b64 = await binaryToBase64(result, \"audio\");\n\t\treturn {\n\t\t\tid: this.generateId(),\n\t\t\tmodel: this.model,\n\t\t\taudio: b64,\n\t\t\tformat: format ?? \"mp3\",\n\t\t\tcontentType: `audio/${format ?? \"mp3\"}`,\n\t\t};\n\t}\n\n\tprivate wrapAudioResult(bytes: Uint8Array, format: string | undefined): TTSResult {\n\t\treturn {\n\t\t\tid: this.generateId(),\n\t\t\tmodel: this.model,\n\t\t\taudio: uint8ArrayToBase64(bytes),\n\t\t\tformat: format ?? \"mp3\",\n\t\t\tcontentType: `audio/${format ?? \"mp3\"}`,\n\t\t};\n\t}\n}\n\n// ---------------------------------------------------------------------------\n// Factory function\n// ---------------------------------------------------------------------------\n\n/**\n * Creates a Workers AI text-to-speech adapter.\n *\n * Works with TanStack AI's `generateSpeech()` activity function:\n * ```ts\n * import { generateSpeech } from \"@tanstack/ai\";\n * import { createWorkersAiTts } from \"@cloudflare/tanstack-ai\";\n *\n * const adapter = createWorkersAiTts(\n * \"@cf/deepgram/aura-1\",\n * { binding: env.AI },\n * );\n *\n * const result = await generateSpeech({ adapter, text: \"Hello world\" });\n * // result.audio — base64-encoded audio\n * ```\n *\n * Note: Factory takes `(model, config)` for ergonomics — the class constructor\n * uses `(config, model)` to match TanStack AI's upstream convention.\n */\nexport function createWorkersAiTts(model: WorkersAiTTSModel, config: WorkersAiAdapterConfig) {\n\treturn new WorkersAiTTSAdapter(config, 
model);\n}\n"],"mappings":";;;;;;AAoCA,IAAa,sBAAb,cAAyC,eAAkC;CAI1E,YAAY,QAAgC,OAA0B;AACrE,QAAM,EAAE,EAAE,MAAM;wBAJR,QAAO,iBAA0B;wBAClC,iBAAA,KAAA,EAAsC;AAI7C,0BAAwB,OAAO;AAC/B,OAAK,gBAAgB;;CAGtB,MAAM,eAAe,SAAyC;EAC7D,MAAM,EAAE,MAAM,OAAO,QAAQ,OAAO,iBAAiB;EAGrD,MAAM,QAAiC,EAAE,GAAG,cAAc;AAC1D,MAAI,MAAO,OAAM,QAAQ;AACzB,MAAI,SAAS,KAAM,OAAM,QAAQ;AAEjC,MAAI,sBAAsB,KAAK,cAAc,CAC5C,QAAO,KAAK,mBAAmB,MAAM,QAAQ,MAAM;AAGpD,MAAI,0BAA0B,KAAK,cAAc,CAChD,QAAO,KAAK,gBAAgB,MAAM,QAAQ,MAAM;AAGjD,SAAO,KAAK,mBAAmB,MAAM,QAAQ,MAAM;;CAGpD,MAAc,mBACb,MACA,QACA,SACqB;EAErB,MAAM,SAAS,MADH,KAAK,cAA+C,QACxC,IAAI,KAAK,OAAO;GAAE;GAAM,GAAG;GAAS,CAAC;AAE7D,SAAO,KAAK,gBAAgB,QAAQ,OAAO;;CAG5C,MAAc,gBACb,MACA,QACA,SACqB;EACrB,MAAM,SAAS,KAAK;EASpB,MAAM,SAAS,OARE,MAAM,mBACtB,QACA,KAAK,OACL;GAAE;GAAM,GAAG;GAAS,EACpB;GAAE,OAAO;GAAkB,QAAS,QAAqC;GAAQ,CACjF,EAG6B,aAAa;AAC3C,SAAO,KAAK,gBAAgB,IAAI,WAAW,OAAO,EAAE,OAAO;;CAG5D,MAAc,mBACb,MACA,QACA,SACqB;EACrB,MAAM,gBAAgB,KAAK;EAM3B,MAAM,WAAW,MALI,mBAAmB,cAAc,cAAc,CAKhC,8CAA8C;GACjF,QAAQ;GACR,MAAM,KAAK,UAAU;IACpB,OAAO,KAAK;IACZ;IACA,GAAG;IACH,CAAC;GACF,CAAC;AAEF,MAAI,CAAC,SAAS,IAAI;GACjB,MAAM,YAAY,MAAM,SAAS,MAAM;AACvC,SAAM,IAAI,MACT,0CAA0C,SAAS,OAAO,KAAK,YAC/D;;EAGF,MAAM,SAAS,MAAM,SAAS,aAAa;AAC3C,SAAO,KAAK,gBAAgB,IAAI,WAAW,OAAO,EAAE,OAAO;;;;;;;;CAS5D,MAAc,gBAAgB,QAAiB,QAAgD;EAG9F,MAAM,MAAM,MAAM,eAAe,QAAQ,QAAQ;AACjD,SAAO;GACN,IAAI,KAAK,YAAY;GACrB,OAAO,KAAK;GACZ,OAAO;GACP,QAAQ,UAAU;GAClB,aAAa,SAAS,UAAU;GAChC;;CAGF,gBAAwB,OAAmB,QAAuC;AACjF,SAAO;GACN,IAAI,KAAK,YAAY;GACrB,OAAO,KAAK;GACZ,OAAO,mBAAmB,MAAM;GAChC,QAAQ,UAAU;GAClB,aAAa,SAAS,UAAU;GAChC;;;;;;;;;;;;;;;;;;;;;;;AA4BH,SAAgB,mBAAmB,OAA0B,QAAgC;AAC5F,QAAO,IAAI,oBAAoB,QAAQ,MAAM"}
|
|
@@ -1,11 +1,4 @@
|
|
|
1
|
-
|
|
2
|
-
|
|
3
|
-
|
|
4
|
-
|
|
5
|
-
require('../chunk-WBTQKWFN.cjs');
|
|
6
|
-
require('../chunk-4DE2IREA.cjs');
|
|
7
|
-
|
|
8
|
-
|
|
9
|
-
|
|
10
|
-
exports.WorkersAiTextAdapter = _chunkOUEAAP25cjs.WorkersAiTextAdapter; exports.createWorkersAiChat = _chunkOUEAAP25cjs.createWorkersAiChat;
|
|
11
|
-
//# sourceMappingURL=workers-ai.cjs.map
|
|
1
|
+
Object.defineProperty(exports, Symbol.toStringTag, { value: "Module" });
|
|
2
|
+
const require_workers_ai = require("../workers-ai-Bm7Up4or.cjs");
|
|
3
|
+
exports.WorkersAiTextAdapter = require_workers_ai.WorkersAiTextAdapter;
|
|
4
|
+
exports.createWorkersAiChat = require_workers_ai.createWorkersAiChat;
|