@cloudflare/tanstack-ai 0.1.8 → 0.1.10

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (84) hide show
  1. package/README.md +5 -5
  2. package/dist/adapters/anthropic.cjs +2 -3
  3. package/dist/adapters/anthropic.cjs.map +1 -1
  4. package/dist/adapters/anthropic.d.cts +4 -3
  5. package/dist/adapters/anthropic.d.mts +4 -3
  6. package/dist/adapters/anthropic.mjs +3 -3
  7. package/dist/adapters/anthropic.mjs.map +1 -1
  8. package/dist/adapters/gemini.cjs +2 -3
  9. package/dist/adapters/gemini.cjs.map +1 -1
  10. package/dist/adapters/gemini.d.cts +6 -6
  11. package/dist/adapters/gemini.d.mts +6 -6
  12. package/dist/adapters/gemini.mjs +4 -3
  13. package/dist/adapters/gemini.mjs.map +1 -1
  14. package/dist/adapters/grok.cjs +2 -6
  15. package/dist/adapters/grok.cjs.map +1 -1
  16. package/dist/adapters/grok.d.cts +5 -4
  17. package/dist/adapters/grok.d.mts +5 -4
  18. package/dist/adapters/grok.mjs +3 -6
  19. package/dist/adapters/grok.mjs.map +1 -1
  20. package/dist/adapters/openai.cjs +2 -3
  21. package/dist/adapters/openai.cjs.map +1 -1
  22. package/dist/adapters/openai.d.cts +6 -5
  23. package/dist/adapters/openai.d.mts +6 -5
  24. package/dist/adapters/openai.mjs +3 -3
  25. package/dist/adapters/openai.mjs.map +1 -1
  26. package/dist/adapters/openrouter.cjs +3 -17
  27. package/dist/adapters/openrouter.cjs.map +1 -1
  28. package/dist/adapters/openrouter.d.cts +4 -4
  29. package/dist/adapters/openrouter.d.mts +4 -4
  30. package/dist/adapters/openrouter.mjs +4 -17
  31. package/dist/adapters/openrouter.mjs.map +1 -1
  32. package/dist/adapters/workers-ai-image.cjs +5 -6
  33. package/dist/adapters/workers-ai-image.cjs.map +1 -1
  34. package/dist/adapters/workers-ai-image.d.cts +1 -1
  35. package/dist/adapters/workers-ai-image.d.mts +2 -2
  36. package/dist/adapters/workers-ai-image.mjs +5 -5
  37. package/dist/adapters/workers-ai-image.mjs.map +1 -1
  38. package/dist/adapters/workers-ai-summarize.cjs +3 -4
  39. package/dist/adapters/workers-ai-summarize.cjs.map +1 -1
  40. package/dist/adapters/workers-ai-summarize.d.cts +1 -1
  41. package/dist/adapters/workers-ai-summarize.d.mts +2 -2
  42. package/dist/adapters/workers-ai-summarize.mjs +3 -3
  43. package/dist/adapters/workers-ai-summarize.mjs.map +1 -1
  44. package/dist/adapters/workers-ai-transcription.cjs +5 -6
  45. package/dist/adapters/workers-ai-transcription.cjs.map +1 -1
  46. package/dist/adapters/workers-ai-transcription.d.cts +1 -1
  47. package/dist/adapters/workers-ai-transcription.d.mts +2 -2
  48. package/dist/adapters/workers-ai-transcription.mjs +5 -5
  49. package/dist/adapters/workers-ai-transcription.mjs.map +1 -1
  50. package/dist/adapters/workers-ai-tts.cjs +5 -6
  51. package/dist/adapters/workers-ai-tts.cjs.map +1 -1
  52. package/dist/adapters/workers-ai-tts.d.cts +1 -1
  53. package/dist/adapters/workers-ai-tts.d.mts +2 -2
  54. package/dist/adapters/workers-ai-tts.mjs +5 -5
  55. package/dist/adapters/workers-ai-tts.mjs.map +1 -1
  56. package/dist/adapters/workers-ai.cjs +520 -3
  57. package/dist/adapters/workers-ai.cjs.map +1 -0
  58. package/dist/adapters/workers-ai.d.cts +2 -2
  59. package/dist/adapters/workers-ai.d.mts +3 -3
  60. package/dist/adapters/workers-ai.mjs +56 -41
  61. package/dist/adapters/workers-ai.mjs.map +1 -1
  62. package/dist/{binary-p4H_N_3M.mjs → binary-B5YCVsro.mjs} +1 -1
  63. package/dist/{binary-C9FAYwZj.cjs.map → binary-B5YCVsro.mjs.map} +1 -1
  64. package/dist/{binary-C9FAYwZj.cjs → binary-CZhr1_2n.cjs} +1 -1
  65. package/dist/{binary-p4H_N_3M.mjs.map → binary-CZhr1_2n.cjs.map} +1 -1
  66. package/dist/{create-fetcher-CeUOJgrh.mjs → create-fetcher-BnSnCaHf.mjs} +1 -1
  67. package/dist/{create-fetcher-By-hTiT9.cjs.map → create-fetcher-BnSnCaHf.mjs.map} +1 -1
  68. package/dist/{create-fetcher-6p6heb85.d.mts → create-fetcher-Bp5yCNaO.d.cts} +1 -1
  69. package/dist/{create-fetcher-vAQ8WW-p.d.cts → create-fetcher-Bp5yCNaO.d.mts} +1 -1
  70. package/dist/{create-fetcher-By-hTiT9.cjs → create-fetcher-YVxWCTVL.cjs} +1 -1
  71. package/dist/{create-fetcher-CeUOJgrh.mjs.map → create-fetcher-YVxWCTVL.cjs.map} +1 -1
  72. package/dist/{defineProperty-CbyrzcbA.mjs → defineProperty-BC3bEcwq.mjs} +4 -4
  73. package/dist/{defineProperty-DQoAg20E.cjs → defineProperty-In8g9yAD.cjs} +4 -4
  74. package/dist/index.cjs +2 -3
  75. package/dist/index.d.cts +3 -3
  76. package/dist/index.d.mts +3 -3
  77. package/dist/index.mjs +2 -2
  78. package/dist/{workers-ai-rest-GKy2r7eG.mjs → workers-ai-rest-B6_yU35Q.mjs} +1 -1
  79. package/dist/{workers-ai-rest-CkNCtBwv.cjs.map → workers-ai-rest-B6_yU35Q.mjs.map} +1 -1
  80. package/dist/{workers-ai-rest-CkNCtBwv.cjs → workers-ai-rest-_MXOmyDs.cjs} +1 -1
  81. package/dist/{workers-ai-rest-GKy2r7eG.mjs.map → workers-ai-rest-_MXOmyDs.cjs.map} +1 -1
  82. package/package.json +15 -15
  83. package/dist/workers-ai-BOZ5iyhY.cjs +0 -521
  84. package/dist/workers-ai-BOZ5iyhY.cjs.map +0 -1
@@ -1 +1 @@
1
- {"version":3,"file":"workers-ai-transcription.cjs","names":["BaseTranscriptionAdapter","isDirectBindingConfig","isDirectCredentialsConfig","uint8ArrayToBase64","workersAiRestFetch","workersAiRestFetchBinary","createGatewayFetch"],"sources":["../../src/adapters/workers-ai-transcription.ts"],"sourcesContent":["import { BaseTranscriptionAdapter } from \"@tanstack/ai/adapters\";\nimport type { TranscriptionOptions, TranscriptionResult } from \"@tanstack/ai\";\nimport {\n\ttype WorkersAiAdapterConfig,\n\ttype WorkersAiDirectBindingConfig,\n\ttype WorkersAiDirectCredentialsConfig,\n\ttype AiGatewayAdapterConfig,\n\tcreateGatewayFetch,\n\tisDirectBindingConfig,\n\tisDirectCredentialsConfig,\n\tvalidateWorkersAiConfig,\n} from \"../utils/create-fetcher\";\nimport { workersAiRestFetch, workersAiRestFetchBinary } from \"../utils/workers-ai-rest\";\nimport { uint8ArrayToBase64 } from \"../utils/binary\";\n\n// ---------------------------------------------------------------------------\n// Model types\n// ---------------------------------------------------------------------------\n\n/**\n * Workers AI models that support speech-to-text transcription.\n *\n * Note: the typed `AiModels` interface in `@cloudflare/workers-types` may lag\n * behind what's deployed. We use a string union here that matches the known\n * models including Deepgram partner models.\n *\n * **Nova-3 note:** `@cf/deepgram/nova-3` uses a different input format than the\n * Whisper models. Via binding it accepts `{ audio: { body: base64, contentType } }`.\n * Via REST it requires multipart form data (not JSON). The adapter handles both.\n */\nexport type WorkersAiTranscriptionModel =\n\t| \"@cf/openai/whisper\"\n\t| \"@cf/openai/whisper-tiny-en\"\n\t| \"@cf/openai/whisper-large-v3-turbo\"\n\t| \"@cf/deepgram/nova-3\"\n\t| (string & {});\n\n// ---------------------------------------------------------------------------\n// WorkersAiTranscriptionAdapter\n// ---------------------------------------------------------------------------\n\nexport class WorkersAiTranscriptionAdapter extends BaseTranscriptionAdapter<WorkersAiTranscriptionModel> {\n\treadonly name = \"workers-ai-transcription\" as const;\n\tprivate adapterConfig: WorkersAiAdapterConfig;\n\n\tconstructor(config: WorkersAiAdapterConfig, model: WorkersAiTranscriptionModel) {\n\t\tsuper({}, model);\n\t\tvalidateWorkersAiConfig(config);\n\t\tthis.adapterConfig = config;\n\t}\n\n\tasync transcribe(options: TranscriptionOptions): Promise<TranscriptionResult> {\n\t\tconst { audio, language, prompt, modelOptions } = options;\n\n\t\t// Normalize audio to raw bytes\n\t\tconst audioBytes = await normalizeAudioToBytes(audio);\n\n\t\tconst extra: Record<string, unknown> = { ...modelOptions };\n\t\tif (language) extra.language = language;\n\t\tif (prompt) extra.initial_prompt = prompt;\n\n\t\t// Build the model-specific audio payload:\n\t\t// - Deepgram Nova-3 (binding): { audio: { body: base64, contentType: \"audio/...\" } }\n\t\t// - Deepgram Nova-3 (REST): multipart FormData (handled separately)\n\t\t// - Whisper Large v3 Turbo (REST/gateway): { audio: base64string }\n\t\t// - Other Whisper models (binding): { audio: number[] }\n\t\tconst audioPayload = this.buildAudioPayload(audioBytes, audio);\n\n\t\tif (isDirectBindingConfig(this.adapterConfig)) {\n\t\t\treturn this.transcribeViaBinding(audioPayload, extra);\n\t\t}\n\n\t\tif (isDirectCredentialsConfig(this.adapterConfig)) {\n\t\t\t// Nova-3 REST requires raw binary audio, not JSON\n\t\t\tif (this.model === \"@cf/deepgram/nova-3\") {\n\t\t\t\treturn this.transcribeViaRestBinary(audioBytes, audio, extra);\n\t\t\t}\n\t\t\treturn this.transcribeViaRest(audioPayload, extra);\n\t\t}\n\n\t\treturn this.transcribeViaGateway(audioPayload, extra);\n\t}\n\n\t/**\n\t * Build the audio field for the request payload, handling model-specific formats.\n\t *\n\t * - `@cf/deepgram/nova-3` requires `{ body: base64, contentType: \"audio/...\" }`\n\t * - `@cf/openai/whisper-large-v3-turbo` REST/gateway accepts a base64 string\n\t * - Other Whisper models accept `number[]` (binding) or base64 (REST)\n\t */\n\tprivate buildAudioPayload(\n\t\taudioBytes: number[],\n\t\toriginalAudio: string | File | Blob | ArrayBuffer,\n\t): Record<string, unknown> {\n\t\tif (this.model === \"@cf/deepgram/nova-3\") {\n\t\t\tconst b64 = uint8ArrayToBase64(new Uint8Array(audioBytes));\n\t\t\tconst contentType = detectAudioContentType(originalAudio);\n\t\t\treturn { audio: { body: b64, contentType } };\n\t\t}\n\n\t\tif (this.model === \"@cf/openai/whisper-large-v3-turbo\") {\n\t\t\treturn { audio: uint8ArrayToBase64(new Uint8Array(audioBytes)) };\n\t\t}\n\n\t\treturn { audio: audioBytes };\n\t}\n\n\tprivate async transcribeViaBinding(\n\t\taudioPayload: Record<string, unknown>,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TranscriptionResult> {\n\t\tconst ai = (this.adapterConfig as WorkersAiDirectBindingConfig).binding;\n\t\tconst result = (await ai.run(this.model, {\n\t\t\t...audioPayload,\n\t\t\t...options,\n\t\t})) as Record<string, unknown>;\n\t\treturn this.normalizeResult(result);\n\t}\n\n\tprivate async transcribeViaRest(\n\t\taudioPayload: Record<string, unknown>,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TranscriptionResult> {\n\t\tconst config = this.adapterConfig as WorkersAiDirectCredentialsConfig;\n\n\t\tconst response = await workersAiRestFetch(\n\t\t\tconfig,\n\t\t\tthis.model,\n\t\t\t{ ...audioPayload, ...options },\n\t\t\t{\n\t\t\t\tlabel: \"Workers AI transcription\",\n\t\t\t\tsignal: (options as { signal?: AbortSignal }).signal,\n\t\t\t},\n\t\t);\n\n\t\tconst data = (await response.json()) as {\n\t\t\tresult?: Record<string, unknown>;\n\t\t} & Record<string, unknown>;\n\n\t\t// Cloudflare REST API wraps responses in { success, result: {...} }.\n\t\t// Use `data.result` when present, fall back to `data` for direct responses.\n\t\treturn this.normalizeResult(data.result ?? data);\n\t}\n\n\t/**\n\t * Transcribe via REST using raw binary audio.\n\t * Required for models like Deepgram Nova-3 that expect raw audio bytes\n\t * with a Content-Type header (e.g. \"audio/wav\") instead of JSON.\n\t */\n\tprivate async transcribeViaRestBinary(\n\t\taudioBytes: number[],\n\t\toriginalAudio: string | File | Blob | ArrayBuffer,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TranscriptionResult> {\n\t\tconst config = this.adapterConfig as WorkersAiDirectCredentialsConfig;\n\t\tconst contentType = detectAudioContentType(originalAudio);\n\n\t\tconst response = await workersAiRestFetchBinary(\n\t\t\tconfig,\n\t\t\tthis.model,\n\t\t\tnew Uint8Array(audioBytes),\n\t\t\tcontentType,\n\t\t\t{\n\t\t\t\tlabel: \"Workers AI transcription\",\n\t\t\t\tsignal: (options as { signal?: AbortSignal }).signal,\n\t\t\t},\n\t\t);\n\n\t\tconst data = (await response.json()) as {\n\t\t\tresult?: Record<string, unknown>;\n\t\t} & Record<string, unknown>;\n\n\t\treturn this.normalizeResult(data.result ?? data);\n\t}\n\n\tprivate async transcribeViaGateway(\n\t\taudioPayload: Record<string, unknown>,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TranscriptionResult> {\n\t\tconst gatewayConfig = this.adapterConfig as AiGatewayAdapterConfig;\n\t\tconst gatewayFetch = createGatewayFetch(\"workers-ai\", gatewayConfig);\n\n\t\t// The URL here is a placeholder — createGatewayFetch for \"workers-ai\" extracts\n\t\t// the model from the body, sets it as the endpoint, and routes through the gateway.\n\t\t// The actual URL path is not used.\n\t\tconst response = await gatewayFetch(\"https://api.cloudflare.com/v1/audio/transcriptions\", {\n\t\t\tmethod: \"POST\",\n\t\t\tbody: JSON.stringify({\n\t\t\t\tmodel: this.model,\n\t\t\t\t...audioPayload,\n\t\t\t\t...options,\n\t\t\t}),\n\t\t});\n\n\t\tif (!response.ok) {\n\t\t\tconst errorText = await response.text();\n\t\t\tthrow new Error(\n\t\t\t\t`Workers AI transcription gateway request failed (${response.status}): ${errorText}`,\n\t\t\t);\n\t\t}\n\n\t\tconst data = (await response.json()) as Record<string, unknown>;\n\t\treturn this.normalizeResult(data);\n\t}\n\n\t/**\n\t * Normalize Workers AI transcription results into the standard\n\t * TanStack AI TranscriptionResult shape.\n\t *\n\t * Handles three response formats:\n\t * - Whisper: `{ text, words?, vtt? }`\n\t * - Whisper v3-turbo: `{ text, segments?, transcription_info? }`\n\t * - Deepgram Nova-3: `{ results: { channels: [{ alternatives: [{ transcript, words }] }] } }`\n\t */\n\tprivate normalizeResult(raw: Record<string, unknown>): TranscriptionResult {\n\t\t// Deepgram Nova-3 format: { results: { channels: [{ alternatives: [{ transcript, words }] }] } }\n\t\tconst results = raw.results as Record<string, unknown> | undefined;\n\t\tif (results?.channels) {\n\t\t\tconst channels = results.channels as Array<{\n\t\t\t\talternatives?: Array<{\n\t\t\t\t\ttranscript?: string;\n\t\t\t\t\tconfidence?: number;\n\t\t\t\t\twords?: Array<{ word: string; start: number; end: number; confidence: number }>;\n\t\t\t\t}>;\n\t\t\t}>;\n\t\t\tconst alt = channels?.[0]?.alternatives?.[0];\n\t\t\tconst text = alt?.transcript ?? \"\";\n\t\t\tconst result: TranscriptionResult = {\n\t\t\t\tid: this.generateId(),\n\t\t\t\tmodel: this.model,\n\t\t\t\ttext,\n\t\t\t};\n\t\t\tif (alt?.words && Array.isArray(alt.words)) {\n\t\t\t\tresult.words = alt.words.map((w) => ({\n\t\t\t\t\tword: w.word ?? \"\",\n\t\t\t\t\tstart: w.start ?? 0,\n\t\t\t\t\tend: w.end ?? 0,\n\t\t\t\t}));\n\t\t\t}\n\t\t\treturn result;\n\t\t}\n\n\t\t// Whisper format: { text, words?, vtt? }\n\t\t// Whisper v3-turbo format: { text, segments?, transcription_info? }\n\t\tconst result: TranscriptionResult = {\n\t\t\tid: this.generateId(),\n\t\t\tmodel: this.model,\n\t\t\ttext: (raw.text as string) ?? \"\",\n\t\t};\n\n\t\t// Language from transcription_info (whisper-large-v3-turbo)\n\t\tconst transcriptionInfo = raw.transcription_info as Record<string, unknown> | undefined;\n\t\tif (transcriptionInfo?.language) {\n\t\t\tresult.language = transcriptionInfo.language as string;\n\t\t}\n\n\t\t// Duration\n\t\tif (transcriptionInfo?.duration != null) {\n\t\t\tresult.duration = transcriptionInfo.duration as number;\n\t\t}\n\n\t\t// Segments (whisper-large-v3-turbo returns these)\n\t\tif (raw.segments && Array.isArray(raw.segments)) {\n\t\t\tresult.segments = raw.segments.map((seg: Record<string, unknown>, idx: number) => ({\n\t\t\t\tid: idx,\n\t\t\t\ttext: (seg.text as string) ?? \"\",\n\t\t\t\tstart: (seg.start as number) ?? 0,\n\t\t\t\tend: (seg.end as number) ?? 0,\n\t\t\t}));\n\t\t}\n\n\t\t// Words — basic whisper returns top-level words[], v3-turbo nests them in segments\n\t\tif (raw.words && Array.isArray(raw.words)) {\n\t\t\tresult.words = raw.words.map((w: Record<string, unknown>) => ({\n\t\t\t\tword: (w.word as string) ?? \"\",\n\t\t\t\tstart: (w.start as number) ?? 0,\n\t\t\t\tend: (w.end as number) ?? 0,\n\t\t\t}));\n\t\t}\n\n\t\treturn result;\n\t}\n}\n\n// ---------------------------------------------------------------------------\n// Factory function\n// ---------------------------------------------------------------------------\n\n/**\n * Creates a Workers AI transcription adapter for speech-to-text.\n *\n * Works with TanStack AI's `generateTranscription()` activity function:\n * ```ts\n * import { generateTranscription } from \"@tanstack/ai\";\n * import { createWorkersAiTranscription } from \"@cloudflare/tanstack-ai\";\n *\n * const adapter = createWorkersAiTranscription(\n * \"@cf/openai/whisper-large-v3-turbo\",\n * { binding: env.AI },\n * );\n *\n * const result = await generateTranscription({ adapter, audio: audioData });\n * // result.text — the transcribed text\n * ```\n *\n * Note: Factory takes `(model, config)` for ergonomics — the class constructor\n * uses `(config, model)` to match TanStack AI's upstream convention.\n */\nexport function createWorkersAiTranscription(\n\tmodel: WorkersAiTranscriptionModel,\n\tconfig: WorkersAiAdapterConfig,\n) {\n\treturn new WorkersAiTranscriptionAdapter(config, model);\n}\n\n// ---------------------------------------------------------------------------\n// Utilities\n// ---------------------------------------------------------------------------\n\n/**\n * Normalize various audio input formats into a number[] (raw bytes).\n *\n * Note: `File extends Blob`, so `File` instances are handled by the\n * `instanceof Blob` branch. `Blob.arrayBuffer()` always reads the full\n * contents regardless of any prior reads — there's no cursor to worry about.\n */\nasync function normalizeAudioToBytes(audio: string | File | Blob | ArrayBuffer): Promise<number[]> {\n\tif (audio instanceof ArrayBuffer) {\n\t\treturn Array.from(new Uint8Array(audio));\n\t}\n\n\tif (audio instanceof Blob) {\n\t\t// This also handles `File` (which extends Blob)\n\t\tconst buffer = await audio.arrayBuffer();\n\t\treturn Array.from(new Uint8Array(buffer));\n\t}\n\n\tif (typeof audio === \"string\") {\n\t\t// Assume base64 string — decode to bytes\n\t\tconst binary = atob(audio);\n\t\tconst bytes = new Uint8Array(binary.length);\n\t\tfor (let i = 0; i < binary.length; i++) {\n\t\t\tbytes[i] = binary.charCodeAt(i);\n\t\t}\n\t\treturn Array.from(bytes);\n\t}\n\n\tthrow new Error(\"Unsupported audio format. Expected string, File, Blob, or ArrayBuffer.\");\n}\n\n/**\n * Detect the MIME type of the audio input for models that require it\n * (e.g., Deepgram Nova-3).\n *\n * - `File` / `Blob`: use the `.type` property (e.g., \"audio/wav\")\n * - `ArrayBuffer` / `string`: defaults to \"audio/wav\"\n */\nfunction detectAudioContentType(audio: string | File | Blob | ArrayBuffer): string {\n\t// File and Blob carry their own MIME type\n\tif (audio instanceof Blob && audio.type) {\n\t\treturn audio.type;\n\t}\n\n\t// For raw bytes, default to audio/wav — this is the most common\n\t// format for transcription inputs and what the E2E tests use.\n\treturn \"audio/wav\";\n}\n"],"mappings":";;;;;;;;AAyCA,IAAa,gCAAb,cAAmDA,sBAAAA,yBAAsD;CAIxG,YAAY,QAAgC,OAAoC;AAC/E,QAAM,EAAE,EAAE,MAAM;+CAJR,QAAO,2BAAoC;+CAC5C,iBAAA,KAAA,EAAsC;AAI7C,yBAAA,wBAAwB,OAAO;AAC/B,OAAK,gBAAgB;;CAGtB,MAAM,WAAW,SAA6D;EAC7E,MAAM,EAAE,OAAO,UAAU,QAAQ,iBAAiB;EAGlD,MAAM,aAAa,MAAM,sBAAsB,MAAM;EAErD,MAAM,QAAiC,EAAE,GAAG,cAAc;AAC1D,MAAI,SAAU,OAAM,WAAW;AAC/B,MAAI,OAAQ,OAAM,iBAAiB;EAOnC,MAAM,eAAe,KAAK,kBAAkB,YAAY,MAAM;AAE9D,MAAIC,uBAAAA,sBAAsB,KAAK,cAAc,CAC5C,QAAO,KAAK,qBAAqB,cAAc,MAAM;AAGtD,MAAIC,uBAAAA,0BAA0B,KAAK,cAAc,EAAE;AAElD,OAAI,KAAK,UAAU,sBAClB,QAAO,KAAK,wBAAwB,YAAY,OAAO,MAAM;AAE9D,UAAO,KAAK,kBAAkB,cAAc,MAAM;;AAGnD,SAAO,KAAK,qBAAqB,cAAc,MAAM;;;;;;;;;CAUtD,kBACC,YACA,eAC0B;AAC1B,MAAI,KAAK,UAAU,sBAGlB,QAAO,EAAE,OAAO;GAAE,MAFNC,eAAAA,mBAAmB,IAAI,WAAW,WAAW,CAAC;GAE7B,aADT,uBAAuB,cAAc;GACf,EAAE;AAG7C,MAAI,KAAK,UAAU,oCAClB,QAAO,EAAE,OAAOA,eAAAA,mBAAmB,IAAI,WAAW,WAAW,CAAC,EAAE;AAGjE,SAAO,EAAE,OAAO,YAAY;;CAG7B,MAAc,qBACb,cACA,SAC+B;EAE/B,MAAM,SAAU,MADJ,KAAK,cAA+C,QACvC,IAAI,KAAK,OAAO;GACxC,GAAG;GACH,GAAG;GACH,CAAC;AACF,SAAO,KAAK,gBAAgB,OAAO;;CAGpC,MAAc,kBACb,cACA,SAC+B;EAC/B,MAAM,SAAS,KAAK;EAYpB,MAAM,OAAQ,OAVG,MAAMC,wBAAAA,mBACtB,QACA,KAAK,OACL;GAAE,GAAG;GAAc,GAAG;GAAS,EAC/B;GACC,OAAO;GACP,QAAS,QAAqC;GAC9C,CACD,EAE4B,MAAM;AAMnC,SAAO,KAAK,gBAAgB,KAAK,UAAU,KAAK;;;;;;;CAQjD,MAAc,wBACb,YACA,eACA,SAC+B;EAC/B,MAAM,SAAS,KAAK;EACpB,MAAM,cAAc,uBAAuB,cAAc;EAazD,MAAM,OAAQ,OAXG,MAAMC,wBAAAA,yBACtB,QACA,KAAK,OACL,IAAI,WAAW,WAAW,EAC1B,aACA;GACC,OAAO;GACP,QAAS,QAAqC;GAC9C,CACD,EAE4B,MAAM;AAInC,SAAO,KAAK,gBAAgB,KAAK,UAAU,KAAK;;CAGjD,MAAc,qBACb,cACA,SAC+B;EAC/B,MAAM,gBAAgB,KAAK;EAM3B,MAAM,WAAW,MALIC,uBAAAA,mBAAmB,cAAc,cAAc,CAKhC,sDAAsD;GACzF,QAAQ;GACR,MAAM,KAAK,UAAU;IACpB,OAAO,KAAK;IACZ,GAAG;IACH,GAAG;IACH,CAAC;GACF,CAAC;AAEF,MAAI,CAAC,SAAS,IAAI;GACjB,MAAM,YAAY,MAAM,SAAS,MAAM;AACvC,SAAM,IAAI,MACT,oDAAoD,SAAS,OAAO,KAAK,YACzE;;EAGF,MAAM,OAAQ,MAAM,SAAS,MAAM;AACnC,SAAO,KAAK,gBAAgB,KAAK;;;;;;;;;;;CAYlC,gBAAwB,KAAmD;EAE1E,MAAM,UAAU,IAAI;AACpB,MAAI,SAAS,UAAU;GAQtB,MAAM,MAPW,QAAQ,WAOF,IAAI,eAAe;GAC1C,MAAM,OAAO,KAAK,cAAc;GAChC,MAAM,SAA8B;IACnC,IAAI,KAAK,YAAY;IACrB,OAAO,KAAK;IACZ;IACA;AACD,OAAI,KAAK,SAAS,MAAM,QAAQ,IAAI,MAAM,CACzC,QAAO,QAAQ,IAAI,MAAM,KAAK,OAAO;IACpC,MAAM,EAAE,QAAQ;IAChB,OAAO,EAAE,SAAS;IAClB,KAAK,EAAE,OAAO;IACd,EAAE;AAEJ,UAAO;;EAKR,MAAM,SAA8B;GACnC,IAAI,KAAK,YAAY;GACrB,OAAO,KAAK;GACZ,MAAO,IAAI,QAAmB;GAC9B;EAGD,MAAM,oBAAoB,IAAI;AAC9B,MAAI,mBAAmB,SACtB,QAAO,WAAW,kBAAkB;AAIrC,MAAI,mBAAmB,YAAY,KAClC,QAAO,WAAW,kBAAkB;AAIrC,MAAI,IAAI,YAAY,MAAM,QAAQ,IAAI,SAAS,CAC9C,QAAO,WAAW,IAAI,SAAS,KAAK,KAA8B,SAAiB;GAClF,IAAI;GACJ,MAAO,IAAI,QAAmB;GAC9B,OAAQ,IAAI,SAAoB;GAChC,KAAM,IAAI,OAAkB;GAC5B,EAAE;AAIJ,MAAI,IAAI,SAAS,MAAM,QAAQ,IAAI,MAAM,CACxC,QAAO,QAAQ,IAAI,MAAM,KAAK,OAAgC;GAC7D,MAAO,EAAE,QAAmB;GAC5B,OAAQ,EAAE,SAAoB;GAC9B,KAAM,EAAE,OAAkB;GAC1B,EAAE;AAGJ,SAAO;;;;;;;;;;;;;;;;;;;;;;;AA4BT,SAAgB,6BACf,OACA,QACC;AACD,QAAO,IAAI,8BAA8B,QAAQ,MAAM;;;;;;;;;AAcxD,eAAe,sBAAsB,OAA8D;AAClG,KAAI,iBAAiB,YACpB,QAAO,MAAM,KAAK,IAAI,WAAW,MAAM,CAAC;AAGzC,KAAI,iBAAiB,MAAM;EAE1B,MAAM,SAAS,MAAM,MAAM,aAAa;AACxC,SAAO,MAAM,KAAK,IAAI,WAAW,OAAO,CAAC;;AAG1C,KAAI,OAAO,UAAU,UAAU;EAE9B,MAAM,SAAS,KAAK,MAAM;EAC1B,MAAM,QAAQ,IAAI,WAAW,OAAO,OAAO;AAC3C,OAAK,IAAI,IAAI,GAAG,IAAI,OAAO,QAAQ,IAClC,OAAM,KAAK,OAAO,WAAW,EAAE;AAEhC,SAAO,MAAM,KAAK,MAAM;;AAGzB,OAAM,IAAI,MAAM,yEAAyE;;;;;;;;;AAU1F,SAAS,uBAAuB,OAAmD;AAElF,KAAI,iBAAiB,QAAQ,MAAM,KAClC,QAAO,MAAM;AAKd,QAAO"}
1
+ {"version":3,"file":"workers-ai-transcription.cjs","names":["BaseTranscriptionAdapter","isDirectBindingConfig","isDirectCredentialsConfig","uint8ArrayToBase64","workersAiRestFetch","workersAiRestFetchBinary","createGatewayFetch"],"sources":["../../src/adapters/workers-ai-transcription.ts"],"sourcesContent":["import { BaseTranscriptionAdapter } from \"@tanstack/ai/adapters\";\nimport type { TranscriptionOptions, TranscriptionResult } from \"@tanstack/ai\";\nimport {\n\ttype WorkersAiAdapterConfig,\n\ttype WorkersAiDirectBindingConfig,\n\ttype WorkersAiDirectCredentialsConfig,\n\ttype AiGatewayAdapterConfig,\n\tcreateGatewayFetch,\n\tisDirectBindingConfig,\n\tisDirectCredentialsConfig,\n\tvalidateWorkersAiConfig,\n} from \"../utils/create-fetcher\";\nimport { workersAiRestFetch, workersAiRestFetchBinary } from \"../utils/workers-ai-rest\";\nimport { uint8ArrayToBase64 } from \"../utils/binary\";\n\n// ---------------------------------------------------------------------------\n// Model types\n// ---------------------------------------------------------------------------\n\n/**\n * Workers AI models that support speech-to-text transcription.\n *\n * Note: the typed `AiModels` interface in `@cloudflare/workers-types` may lag\n * behind what's deployed. We use a string union here that matches the known\n * models including Deepgram partner models.\n *\n * **Nova-3 note:** `@cf/deepgram/nova-3` uses a different input format than the\n * Whisper models. Via binding it accepts `{ audio: { body: base64, contentType } }`.\n * Via REST it requires multipart form data (not JSON). The adapter handles both.\n */\nexport type WorkersAiTranscriptionModel =\n\t| \"@cf/openai/whisper\"\n\t| \"@cf/openai/whisper-tiny-en\"\n\t| \"@cf/openai/whisper-large-v3-turbo\"\n\t| \"@cf/deepgram/nova-3\"\n\t| (string & {});\n\n// ---------------------------------------------------------------------------\n// WorkersAiTranscriptionAdapter\n// ---------------------------------------------------------------------------\n\nexport class WorkersAiTranscriptionAdapter extends BaseTranscriptionAdapter<WorkersAiTranscriptionModel> {\n\treadonly name = \"workers-ai-transcription\" as const;\n\tprivate adapterConfig: WorkersAiAdapterConfig;\n\n\tconstructor(config: WorkersAiAdapterConfig, model: WorkersAiTranscriptionModel) {\n\t\tsuper(model);\n\t\tvalidateWorkersAiConfig(config);\n\t\tthis.adapterConfig = config;\n\t}\n\n\tasync transcribe(options: TranscriptionOptions): Promise<TranscriptionResult> {\n\t\tconst { audio, language, prompt, modelOptions } = options;\n\n\t\t// Normalize audio to raw bytes\n\t\tconst audioBytes = await normalizeAudioToBytes(audio);\n\n\t\tconst extra: Record<string, unknown> = { ...modelOptions };\n\t\tif (language) extra.language = language;\n\t\tif (prompt) extra.initial_prompt = prompt;\n\n\t\t// Build the model-specific audio payload:\n\t\t// - Deepgram Nova-3 (binding): { audio: { body: base64, contentType: \"audio/...\" } }\n\t\t// - Deepgram Nova-3 (REST): multipart FormData (handled separately)\n\t\t// - Whisper Large v3 Turbo (REST/gateway): { audio: base64string }\n\t\t// - Other Whisper models (binding): { audio: number[] }\n\t\tconst audioPayload = this.buildAudioPayload(audioBytes, audio);\n\n\t\tif (isDirectBindingConfig(this.adapterConfig)) {\n\t\t\treturn this.transcribeViaBinding(audioPayload, extra);\n\t\t}\n\n\t\tif (isDirectCredentialsConfig(this.adapterConfig)) {\n\t\t\t// Nova-3 REST requires raw binary audio, not JSON\n\t\t\tif (this.model === \"@cf/deepgram/nova-3\") {\n\t\t\t\treturn this.transcribeViaRestBinary(audioBytes, audio, extra);\n\t\t\t}\n\t\t\treturn this.transcribeViaRest(audioPayload, extra);\n\t\t}\n\n\t\treturn this.transcribeViaGateway(audioPayload, extra);\n\t}\n\n\t/**\n\t * Build the audio field for the request payload, handling model-specific formats.\n\t *\n\t * - `@cf/deepgram/nova-3` requires `{ body: base64, contentType: \"audio/...\" }`\n\t * - `@cf/openai/whisper-large-v3-turbo` REST/gateway accepts a base64 string\n\t * - Other Whisper models accept `number[]` (binding) or base64 (REST)\n\t */\n\tprivate buildAudioPayload(\n\t\taudioBytes: number[],\n\t\toriginalAudio: string | File | Blob | ArrayBuffer,\n\t): Record<string, unknown> {\n\t\tif (this.model === \"@cf/deepgram/nova-3\") {\n\t\t\tconst b64 = uint8ArrayToBase64(new Uint8Array(audioBytes));\n\t\t\tconst contentType = detectAudioContentType(originalAudio);\n\t\t\treturn { audio: { body: b64, contentType } };\n\t\t}\n\n\t\tif (this.model === \"@cf/openai/whisper-large-v3-turbo\") {\n\t\t\treturn { audio: uint8ArrayToBase64(new Uint8Array(audioBytes)) };\n\t\t}\n\n\t\treturn { audio: audioBytes };\n\t}\n\n\tprivate async transcribeViaBinding(\n\t\taudioPayload: Record<string, unknown>,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TranscriptionResult> {\n\t\tconst ai = (this.adapterConfig as WorkersAiDirectBindingConfig).binding;\n\t\tconst result = (await ai.run(this.model, {\n\t\t\t...audioPayload,\n\t\t\t...options,\n\t\t})) as Record<string, unknown>;\n\t\treturn this.normalizeResult(result);\n\t}\n\n\tprivate async transcribeViaRest(\n\t\taudioPayload: Record<string, unknown>,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TranscriptionResult> {\n\t\tconst config = this.adapterConfig as WorkersAiDirectCredentialsConfig;\n\n\t\tconst response = await workersAiRestFetch(\n\t\t\tconfig,\n\t\t\tthis.model,\n\t\t\t{ ...audioPayload, ...options },\n\t\t\t{\n\t\t\t\tlabel: \"Workers AI transcription\",\n\t\t\t\tsignal: (options as { signal?: AbortSignal }).signal,\n\t\t\t},\n\t\t);\n\n\t\tconst data = (await response.json()) as {\n\t\t\tresult?: Record<string, unknown>;\n\t\t} & Record<string, unknown>;\n\n\t\t// Cloudflare REST API wraps responses in { success, result: {...} }.\n\t\t// Use `data.result` when present, fall back to `data` for direct responses.\n\t\treturn this.normalizeResult(data.result ?? data);\n\t}\n\n\t/**\n\t * Transcribe via REST using raw binary audio.\n\t * Required for models like Deepgram Nova-3 that expect raw audio bytes\n\t * with a Content-Type header (e.g. \"audio/wav\") instead of JSON.\n\t */\n\tprivate async transcribeViaRestBinary(\n\t\taudioBytes: number[],\n\t\toriginalAudio: string | File | Blob | ArrayBuffer,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TranscriptionResult> {\n\t\tconst config = this.adapterConfig as WorkersAiDirectCredentialsConfig;\n\t\tconst contentType = detectAudioContentType(originalAudio);\n\n\t\tconst response = await workersAiRestFetchBinary(\n\t\t\tconfig,\n\t\t\tthis.model,\n\t\t\tnew Uint8Array(audioBytes),\n\t\t\tcontentType,\n\t\t\t{\n\t\t\t\tlabel: \"Workers AI transcription\",\n\t\t\t\tsignal: (options as { signal?: AbortSignal }).signal,\n\t\t\t},\n\t\t);\n\n\t\tconst data = (await response.json()) as {\n\t\t\tresult?: Record<string, unknown>;\n\t\t} & Record<string, unknown>;\n\n\t\treturn this.normalizeResult(data.result ?? data);\n\t}\n\n\tprivate async transcribeViaGateway(\n\t\taudioPayload: Record<string, unknown>,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TranscriptionResult> {\n\t\tconst gatewayConfig = this.adapterConfig as AiGatewayAdapterConfig;\n\t\tconst gatewayFetch = createGatewayFetch(\"workers-ai\", gatewayConfig);\n\n\t\t// The URL here is a placeholder — createGatewayFetch for \"workers-ai\" extracts\n\t\t// the model from the body, sets it as the endpoint, and routes through the gateway.\n\t\t// The actual URL path is not used.\n\t\tconst response = await gatewayFetch(\"https://api.cloudflare.com/v1/audio/transcriptions\", {\n\t\t\tmethod: \"POST\",\n\t\t\tbody: JSON.stringify({\n\t\t\t\tmodel: this.model,\n\t\t\t\t...audioPayload,\n\t\t\t\t...options,\n\t\t\t}),\n\t\t});\n\n\t\tif (!response.ok) {\n\t\t\tconst errorText = await response.text();\n\t\t\tthrow new Error(\n\t\t\t\t`Workers AI transcription gateway request failed (${response.status}): ${errorText}`,\n\t\t\t);\n\t\t}\n\n\t\tconst data = (await response.json()) as Record<string, unknown>;\n\t\treturn this.normalizeResult(data);\n\t}\n\n\t/**\n\t * Normalize Workers AI transcription results into the standard\n\t * TanStack AI TranscriptionResult shape.\n\t *\n\t * Handles three response formats:\n\t * - Whisper: `{ text, words?, vtt? }`\n\t * - Whisper v3-turbo: `{ text, segments?, transcription_info? }`\n\t * - Deepgram Nova-3: `{ results: { channels: [{ alternatives: [{ transcript, words }] }] } }`\n\t */\n\tprivate normalizeResult(raw: Record<string, unknown>): TranscriptionResult {\n\t\t// Deepgram Nova-3 format: { results: { channels: [{ alternatives: [{ transcript, words }] }] } }\n\t\tconst results = raw.results as Record<string, unknown> | undefined;\n\t\tif (results?.channels) {\n\t\t\tconst channels = results.channels as Array<{\n\t\t\t\talternatives?: Array<{\n\t\t\t\t\ttranscript?: string;\n\t\t\t\t\tconfidence?: number;\n\t\t\t\t\twords?: Array<{ word: string; start: number; end: number; confidence: number }>;\n\t\t\t\t}>;\n\t\t\t}>;\n\t\t\tconst alt = channels?.[0]?.alternatives?.[0];\n\t\t\tconst text = alt?.transcript ?? \"\";\n\t\t\tconst result: TranscriptionResult = {\n\t\t\t\tid: this.generateId(),\n\t\t\t\tmodel: this.model,\n\t\t\t\ttext,\n\t\t\t};\n\t\t\tif (alt?.words && Array.isArray(alt.words)) {\n\t\t\t\tresult.words = alt.words.map((w) => ({\n\t\t\t\t\tword: w.word ?? \"\",\n\t\t\t\t\tstart: w.start ?? 0,\n\t\t\t\t\tend: w.end ?? 0,\n\t\t\t\t}));\n\t\t\t}\n\t\t\treturn result;\n\t\t}\n\n\t\t// Whisper format: { text, words?, vtt? }\n\t\t// Whisper v3-turbo format: { text, segments?, transcription_info? }\n\t\tconst result: TranscriptionResult = {\n\t\t\tid: this.generateId(),\n\t\t\tmodel: this.model,\n\t\t\ttext: (raw.text as string) ?? \"\",\n\t\t};\n\n\t\t// Language from transcription_info (whisper-large-v3-turbo)\n\t\tconst transcriptionInfo = raw.transcription_info as Record<string, unknown> | undefined;\n\t\tif (transcriptionInfo?.language) {\n\t\t\tresult.language = transcriptionInfo.language as string;\n\t\t}\n\n\t\t// Duration\n\t\tif (transcriptionInfo?.duration != null) {\n\t\t\tresult.duration = transcriptionInfo.duration as number;\n\t\t}\n\n\t\t// Segments (whisper-large-v3-turbo returns these)\n\t\tif (raw.segments && Array.isArray(raw.segments)) {\n\t\t\tresult.segments = raw.segments.map((seg: Record<string, unknown>, idx: number) => ({\n\t\t\t\tid: idx,\n\t\t\t\ttext: (seg.text as string) ?? \"\",\n\t\t\t\tstart: (seg.start as number) ?? 0,\n\t\t\t\tend: (seg.end as number) ?? 0,\n\t\t\t}));\n\t\t}\n\n\t\t// Words — basic whisper returns top-level words[], v3-turbo nests them in segments\n\t\tif (raw.words && Array.isArray(raw.words)) {\n\t\t\tresult.words = raw.words.map((w: Record<string, unknown>) => ({\n\t\t\t\tword: (w.word as string) ?? \"\",\n\t\t\t\tstart: (w.start as number) ?? 0,\n\t\t\t\tend: (w.end as number) ?? 0,\n\t\t\t}));\n\t\t}\n\n\t\treturn result;\n\t}\n}\n\n// ---------------------------------------------------------------------------\n// Factory function\n// ---------------------------------------------------------------------------\n\n/**\n * Creates a Workers AI transcription adapter for speech-to-text.\n *\n * Works with TanStack AI's `generateTranscription()` activity function:\n * ```ts\n * import { generateTranscription } from \"@tanstack/ai\";\n * import { createWorkersAiTranscription } from \"@cloudflare/tanstack-ai\";\n *\n * const adapter = createWorkersAiTranscription(\n * \"@cf/openai/whisper-large-v3-turbo\",\n * { binding: env.AI },\n * );\n *\n * const result = await generateTranscription({ adapter, audio: audioData });\n * // result.text — the transcribed text\n * ```\n *\n * Note: Factory takes `(model, config)` for ergonomics — the class constructor\n * uses `(config, model)` to match TanStack AI's upstream convention.\n */\nexport function createWorkersAiTranscription(\n\tmodel: WorkersAiTranscriptionModel,\n\tconfig: WorkersAiAdapterConfig,\n) {\n\treturn new WorkersAiTranscriptionAdapter(config, model);\n}\n\n// ---------------------------------------------------------------------------\n// Utilities\n// ---------------------------------------------------------------------------\n\n/**\n * Normalize various audio input formats into a number[] (raw bytes).\n *\n * Note: `File extends Blob`, so `File` instances are handled by the\n * `instanceof Blob` branch. `Blob.arrayBuffer()` always reads the full\n * contents regardless of any prior reads — there's no cursor to worry about.\n */\nasync function normalizeAudioToBytes(audio: string | File | Blob | ArrayBuffer): Promise<number[]> {\n\tif (audio instanceof ArrayBuffer) {\n\t\treturn Array.from(new Uint8Array(audio));\n\t}\n\n\tif (audio instanceof Blob) {\n\t\t// This also handles `File` (which extends Blob)\n\t\tconst buffer = await audio.arrayBuffer();\n\t\treturn Array.from(new Uint8Array(buffer));\n\t}\n\n\tif (typeof audio === \"string\") {\n\t\t// Assume base64 string — decode to bytes\n\t\tconst binary = atob(audio);\n\t\tconst bytes = new Uint8Array(binary.length);\n\t\tfor (let i = 0; i < binary.length; i++) {\n\t\t\tbytes[i] = binary.charCodeAt(i);\n\t\t}\n\t\treturn Array.from(bytes);\n\t}\n\n\tthrow new Error(\"Unsupported audio format. Expected string, File, Blob, or ArrayBuffer.\");\n}\n\n/**\n * Detect the MIME type of the audio input for models that require it\n * (e.g., Deepgram Nova-3).\n *\n * - `File` / `Blob`: use the `.type` property (e.g., \"audio/wav\")\n * - `ArrayBuffer` / `string`: defaults to \"audio/wav\"\n */\nfunction detectAudioContentType(audio: string | File | Blob | ArrayBuffer): string {\n\t// File and Blob carry their own MIME type\n\tif (audio instanceof Blob && audio.type) {\n\t\treturn audio.type;\n\t}\n\n\t// For raw bytes, default to audio/wav — this is the most common\n\t// format for transcription inputs and what the E2E tests use.\n\treturn \"audio/wav\";\n}\n"],"mappings":";;;;;;;AAyCA,IAAa,gCAAb,cAAmDA,sBAAAA,yBAAsD;CAIxG,YAAY,QAAgC,OAAoC;EAC/E,MAAM,KAAK;+CAJH,QAAO,0BAAA;+CACR,iBAAA,KAAA,CAAA;EAIP,uBAAA,wBAAwB,MAAM;EAC9B,KAAK,gBAAgB;CACtB;CAEA,MAAM,WAAW,SAA6D;EAC7E,MAAM,EAAE,OAAO,UAAU,QAAQ,iBAAiB;EAGlD,MAAM,aAAa,MAAM,sBAAsB,KAAK;EAEpD,MAAM,QAAiC,EAAE,GAAG,aAAa;EACzD,IAAI,UAAU,MAAM,WAAW;EAC/B,IAAI,QAAQ,MAAM,iBAAiB;EAOnC,MAAM,eAAe,KAAK,kBAAkB,YAAY,KAAK;EAE7D,IAAIC,uBAAAA,sBAAsB,KAAK,aAAa,GAC3C,OAAO,KAAK,qBAAqB,cAAc,KAAK;EAGrD,IAAIC,uBAAAA,0BAA0B,KAAK,aAAa,GAAG;GAElD,IAAI,KAAK,UAAU,uBAClB,OAAO,KAAK,wBAAwB,YAAY,OAAO,KAAK;GAE7D,OAAO,KAAK,kBAAkB,cAAc,KAAK;EAClD;EAEA,OAAO,KAAK,qBAAqB,cAAc,KAAK;CACrD;;;;;;;;CASA,kBACC,YACA,eAC0B;EAC1B,IAAI,KAAK,UAAU,uBAGlB,OAAO,EAAE,OAAO;GAAE,MAFNC,eAAAA,mBAAmB,IAAI,WAAW,UAAU,CAE9B;GAAG,aADT,uBAAuB,aACJ;EAAE,EAAE;EAG5C,IAAI,KAAK,UAAU,qCAClB,OAAO,EAAE,OAAOA,eAAAA,mBAAmB,IAAI,WAAW,UAAU,CAAC,EAAE;EAGhE,OAAO,EAAE,OAAO,WAAW;CAC5B;CAEA,MAAc,qBACb,cACA,SAC+B;EAE/B,MAAM,SAAU,MADJ,KAAK,cAA+C,QACvC,IAAI,KAAK,OAAO;GACxC,GAAG;GACH,GAAG;EACJ,CAAC;EACD,OAAO,KAAK,gBAAgB,MAAM;CACnC;CAEA,MAAc,kBACb,cACA,SAC+B;EAC/B,MAAM,SAAS,KAAK;EAYpB,MAAM,OAAQ,OAAM,MAVGC,wBAAAA,mBACtB,QACA,KAAK,OACL;GAAE,GAAG;GAAc,GAAG;EAAQ,GAC9B;GACC,OAAO;GACP,QAAS,QAAqC;EAC/C,CACD,EAAA,CAE6B,KAAK;EAMlC,OAAO,KAAK,gBAAgB,KAAK,UAAU,IAAI;CAChD;;;;;;CAOA,MAAc,wBACb,YACA,eACA,SAC+B;EAC/B,MAAM,SAAS,KAAK;EACpB,MAAM,cAAc,uBAAuB,aAAa;EAaxD,MAAM,OAAQ,OAAM,MAXGC,wBAAAA,yBACtB,QACA,KAAK,OACL,IAAI,WAAW,UAAU,GACzB,aACA;GACC,OAAO;GACP,QAAS,QAAqC;EAC/C,CACD,EAAA,CAE6B,KAAK;EAIlC,OAAO,KAAK,gBAAgB,KAAK,UAAU,IAAI;CAChD;CAEA,MAAc,qBACb,cACA,SAC+B;EAC/B,MAAM,gBAAgB,KAAK;EAM3B,MAAM,WAAW,MALIC,uBAAAA,mBAAmB,cAAc,aAKpB,CAAC,CAAC,sDAAsD;GACzF,QAAQ;GACR,MAAM,KAAK,UAAU;IACpB,OAAO,KAAK;IACZ,GAAG;IACH,GAAG;GACJ,CAAC;EACF,CAAC;EAED,IAAI,CAAC,SAAS,IAAI;GACjB,MAAM,YAAY,MAAM,SAAS,KAAK;GACtC,MAAM,IAAI,MACT,oDAAoD,SAAS,OAAO,KAAK,WAC1E;EACD;EAEA,MAAM,OAAQ,MAAM,SAAS,KAAK;EAClC,OAAO,KAAK,gBAAgB,IAAI;CACjC;;;;;;;;;;CAWA,gBAAwB,KAAmD;EAE1E,MAAM,UAAU,IAAI;EACpB,IAAI,SAAS,UAAU;GAQtB,MAAM,MAPW,QAAQ,WAOF,EAAE,EAAE,eAAe;GAC1C,MAAM,OAAO,KAAK,cAAc;GAChC,MAAM,SAA8B;IACnC,IAAI,KAAK,WAAW;IACpB,OAAO,KAAK;IACZ;GACD;GACA,IAAI,KAAK,SAAS,MAAM,QAAQ,IAAI,KAAK,GACxC,OAAO,QAAQ,IAAI,MAAM,KAAK,OAAO;IACpC,MAAM,EAAE,QAAQ;IAChB,OAAO,EAAE,SAAS;IAClB,KAAK,EAAE,OAAO;GACf,EAAE;GAEH,OAAO;EACR;EAIA,MAAM,SAA8B;GACnC,IAAI,KAAK,WAAW;GACpB,OAAO,KAAK;GACZ,MAAO,IAAI,QAAmB;EAC/B;EAGA,MAAM,oBAAoB,IAAI;EAC9B,IAAI,mBAAmB,UACtB,OAAO,WAAW,kBAAkB;EAIrC,IAAI,mBAAmB,YAAY,MAClC,OAAO,WAAW,kBAAkB;EAIrC,IAAI,IAAI,YAAY,MAAM,QAAQ,IAAI,QAAQ,GAC7C,OAAO,WAAW,IAAI,SAAS,KAAK,KAA8B,SAAiB;GAClF,IAAI;GACJ,MAAO,IAAI,QAAmB;GAC9B,OAAQ,IAAI,SAAoB;GAChC,KAAM,IAAI,OAAkB;EAC7B,EAAE;EAIH,IAAI,IAAI,SAAS,MAAM,QAAQ,IAAI,KAAK,GACvC,OAAO,QAAQ,IAAI,MAAM,KAAK,OAAgC;GAC7D,MAAO,EAAE,QAAmB;GAC5B,OAAQ,EAAE,SAAoB;GAC9B,KAAM,EAAE,OAAkB;EAC3B,EAAE;EAGH,OAAO;CACR;AACD;;;;;;;;;;;;;;;;;;;;;AA0BA,SAAgB,6BACf,OACA,QACC;CACD,OAAO,IAAI,8BAA8B,QAAQ,KAAK;AACvD;;;;;;;;AAaA,eAAe,sBAAsB,OAA8D;CAClG,IAAI,iBAAiB,aACpB,OAAO,MAAM,KAAK,IAAI,WAAW,KAAK,CAAC;CAGxC,IAAI,iBAAiB,MAAM;EAE1B,MAAM,SAAS,MAAM,MAAM,YAAY;EACvC,OAAO,MAAM,KAAK,IAAI,WAAW,MAAM,CAAC;CACzC;CAEA,IAAI,OAAO,UAAU,UAAU;EAE9B,MAAM,SAAS,KAAK,KAAK;EACzB,MAAM,QAAQ,IAAI,WAAW,OAAO,MAAM;EAC1C,KAAK,IAAI,IAAI,GAAG,IAAI,OAAO,QAAQ,KAClC,MAAM,KAAK,OAAO,WAAW,CAAC;EAE/B,OAAO,MAAM,KAAK,KAAK;CACxB;CAEA,MAAM,IAAI,MAAM,wEAAwE;AACzF;;;;;;;;AASA,SAAS,uBAAuB,OAAmD;CAElF,IAAI,iBAAiB,QAAQ,MAAM,MAClC,OAAO,MAAM;CAKd,OAAO;AACR"}
@@ -1,4 +1,4 @@
1
- import { i as WorkersAiAdapterConfig } from "../create-fetcher-vAQ8WW-p.cjs";
1
+ import { i as WorkersAiAdapterConfig } from "../create-fetcher-Bp5yCNaO.cjs";
2
2
  import { TranscriptionOptions, TranscriptionResult } from "@tanstack/ai";
3
3
  import { BaseTranscriptionAdapter } from "@tanstack/ai/adapters";
4
4
 
@@ -1,6 +1,6 @@
1
- import { i as WorkersAiAdapterConfig } from "../create-fetcher-6p6heb85.mjs";
2
- import { BaseTranscriptionAdapter } from "@tanstack/ai/adapters";
1
+ import { i as WorkersAiAdapterConfig } from "../create-fetcher-Bp5yCNaO.mjs";
3
2
  import { TranscriptionOptions, TranscriptionResult } from "@tanstack/ai";
3
+ import { BaseTranscriptionAdapter } from "@tanstack/ai/adapters";
4
4
 
5
5
  //#region src/adapters/workers-ai-transcription.d.ts
6
6
  /**
@@ -1,12 +1,12 @@
1
- import { a as validateWorkersAiConfig, i as isDirectCredentialsConfig, r as isDirectBindingConfig, t as createGatewayFetch } from "../create-fetcher-CeUOJgrh.mjs";
2
- import { t as _defineProperty } from "../defineProperty-CbyrzcbA.mjs";
3
- import { n as workersAiRestFetchBinary, t as workersAiRestFetch } from "../workers-ai-rest-GKy2r7eG.mjs";
4
- import { n as uint8ArrayToBase64 } from "../binary-p4H_N_3M.mjs";
1
+ import { a as validateWorkersAiConfig, i as isDirectCredentialsConfig, r as isDirectBindingConfig, t as createGatewayFetch } from "../create-fetcher-BnSnCaHf.mjs";
2
+ import { t as _defineProperty } from "../defineProperty-BC3bEcwq.mjs";
3
+ import { n as workersAiRestFetchBinary, t as workersAiRestFetch } from "../workers-ai-rest-B6_yU35Q.mjs";
4
+ import { n as uint8ArrayToBase64 } from "../binary-B5YCVsro.mjs";
5
5
  import { BaseTranscriptionAdapter } from "@tanstack/ai/adapters";
6
6
  //#region src/adapters/workers-ai-transcription.ts
7
7
  var WorkersAiTranscriptionAdapter = class extends BaseTranscriptionAdapter {
8
8
  constructor(config, model) {
9
- super({}, model);
9
+ super(model);
10
10
  _defineProperty(this, "name", "workers-ai-transcription");
11
11
  _defineProperty(this, "adapterConfig", void 0);
12
12
  validateWorkersAiConfig(config);
@@ -1 +1 @@
1
- {"version":3,"file":"workers-ai-transcription.mjs","names":[],"sources":["../../src/adapters/workers-ai-transcription.ts"],"sourcesContent":["import { BaseTranscriptionAdapter } from \"@tanstack/ai/adapters\";\nimport type { TranscriptionOptions, TranscriptionResult } from \"@tanstack/ai\";\nimport {\n\ttype WorkersAiAdapterConfig,\n\ttype WorkersAiDirectBindingConfig,\n\ttype WorkersAiDirectCredentialsConfig,\n\ttype AiGatewayAdapterConfig,\n\tcreateGatewayFetch,\n\tisDirectBindingConfig,\n\tisDirectCredentialsConfig,\n\tvalidateWorkersAiConfig,\n} from \"../utils/create-fetcher\";\nimport { workersAiRestFetch, workersAiRestFetchBinary } from \"../utils/workers-ai-rest\";\nimport { uint8ArrayToBase64 } from \"../utils/binary\";\n\n// ---------------------------------------------------------------------------\n// Model types\n// ---------------------------------------------------------------------------\n\n/**\n * Workers AI models that support speech-to-text transcription.\n *\n * Note: the typed `AiModels` interface in `@cloudflare/workers-types` may lag\n * behind what's deployed. We use a string union here that matches the known\n * models including Deepgram partner models.\n *\n * **Nova-3 note:** `@cf/deepgram/nova-3` uses a different input format than the\n * Whisper models. Via binding it accepts `{ audio: { body: base64, contentType } }`.\n * Via REST it requires multipart form data (not JSON). The adapter handles both.\n */\nexport type WorkersAiTranscriptionModel =\n\t| \"@cf/openai/whisper\"\n\t| \"@cf/openai/whisper-tiny-en\"\n\t| \"@cf/openai/whisper-large-v3-turbo\"\n\t| \"@cf/deepgram/nova-3\"\n\t| (string & {});\n\n// ---------------------------------------------------------------------------\n// WorkersAiTranscriptionAdapter\n// ---------------------------------------------------------------------------\n\nexport class WorkersAiTranscriptionAdapter extends BaseTranscriptionAdapter<WorkersAiTranscriptionModel> {\n\treadonly name = \"workers-ai-transcription\" as const;\n\tprivate adapterConfig: WorkersAiAdapterConfig;\n\n\tconstructor(config: WorkersAiAdapterConfig, model: WorkersAiTranscriptionModel) {\n\t\tsuper({}, model);\n\t\tvalidateWorkersAiConfig(config);\n\t\tthis.adapterConfig = config;\n\t}\n\n\tasync transcribe(options: TranscriptionOptions): Promise<TranscriptionResult> {\n\t\tconst { audio, language, prompt, modelOptions } = options;\n\n\t\t// Normalize audio to raw bytes\n\t\tconst audioBytes = await normalizeAudioToBytes(audio);\n\n\t\tconst extra: Record<string, unknown> = { ...modelOptions };\n\t\tif (language) extra.language = language;\n\t\tif (prompt) extra.initial_prompt = prompt;\n\n\t\t// Build the model-specific audio payload:\n\t\t// - Deepgram Nova-3 (binding): { audio: { body: base64, contentType: \"audio/...\" } }\n\t\t// - Deepgram Nova-3 (REST): multipart FormData (handled separately)\n\t\t// - Whisper Large v3 Turbo (REST/gateway): { audio: base64string }\n\t\t// - Other Whisper models (binding): { audio: number[] }\n\t\tconst audioPayload = this.buildAudioPayload(audioBytes, audio);\n\n\t\tif (isDirectBindingConfig(this.adapterConfig)) {\n\t\t\treturn this.transcribeViaBinding(audioPayload, extra);\n\t\t}\n\n\t\tif (isDirectCredentialsConfig(this.adapterConfig)) {\n\t\t\t// Nova-3 REST requires raw binary audio, not JSON\n\t\t\tif (this.model === \"@cf/deepgram/nova-3\") {\n\t\t\t\treturn this.transcribeViaRestBinary(audioBytes, audio, extra);\n\t\t\t}\n\t\t\treturn this.transcribeViaRest(audioPayload, extra);\n\t\t}\n\n\t\treturn this.transcribeViaGateway(audioPayload, extra);\n\t}\n\n\t/**\n\t * Build the audio field for the request payload, handling model-specific formats.\n\t *\n\t * - `@cf/deepgram/nova-3` requires `{ body: base64, contentType: \"audio/...\" }`\n\t * - `@cf/openai/whisper-large-v3-turbo` REST/gateway accepts a base64 string\n\t * - Other Whisper models accept `number[]` (binding) or base64 (REST)\n\t */\n\tprivate buildAudioPayload(\n\t\taudioBytes: number[],\n\t\toriginalAudio: string | File | Blob | ArrayBuffer,\n\t): Record<string, unknown> {\n\t\tif (this.model === \"@cf/deepgram/nova-3\") {\n\t\t\tconst b64 = uint8ArrayToBase64(new Uint8Array(audioBytes));\n\t\t\tconst contentType = detectAudioContentType(originalAudio);\n\t\t\treturn { audio: { body: b64, contentType } };\n\t\t}\n\n\t\tif (this.model === \"@cf/openai/whisper-large-v3-turbo\") {\n\t\t\treturn { audio: uint8ArrayToBase64(new Uint8Array(audioBytes)) };\n\t\t}\n\n\t\treturn { audio: audioBytes };\n\t}\n\n\tprivate async transcribeViaBinding(\n\t\taudioPayload: Record<string, unknown>,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TranscriptionResult> {\n\t\tconst ai = (this.adapterConfig as WorkersAiDirectBindingConfig).binding;\n\t\tconst result = (await ai.run(this.model, {\n\t\t\t...audioPayload,\n\t\t\t...options,\n\t\t})) as Record<string, unknown>;\n\t\treturn this.normalizeResult(result);\n\t}\n\n\tprivate async transcribeViaRest(\n\t\taudioPayload: Record<string, unknown>,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TranscriptionResult> {\n\t\tconst config = this.adapterConfig as WorkersAiDirectCredentialsConfig;\n\n\t\tconst response = await workersAiRestFetch(\n\t\t\tconfig,\n\t\t\tthis.model,\n\t\t\t{ ...audioPayload, ...options },\n\t\t\t{\n\t\t\t\tlabel: \"Workers AI transcription\",\n\t\t\t\tsignal: (options as { signal?: AbortSignal }).signal,\n\t\t\t},\n\t\t);\n\n\t\tconst data = (await response.json()) as {\n\t\t\tresult?: Record<string, unknown>;\n\t\t} & Record<string, unknown>;\n\n\t\t// Cloudflare REST API wraps responses in { success, result: {...} }.\n\t\t// Use `data.result` when present, fall back to `data` for direct responses.\n\t\treturn this.normalizeResult(data.result ?? data);\n\t}\n\n\t/**\n\t * Transcribe via REST using raw binary audio.\n\t * Required for models like Deepgram Nova-3 that expect raw audio bytes\n\t * with a Content-Type header (e.g. \"audio/wav\") instead of JSON.\n\t */\n\tprivate async transcribeViaRestBinary(\n\t\taudioBytes: number[],\n\t\toriginalAudio: string | File | Blob | ArrayBuffer,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TranscriptionResult> {\n\t\tconst config = this.adapterConfig as WorkersAiDirectCredentialsConfig;\n\t\tconst contentType = detectAudioContentType(originalAudio);\n\n\t\tconst response = await workersAiRestFetchBinary(\n\t\t\tconfig,\n\t\t\tthis.model,\n\t\t\tnew Uint8Array(audioBytes),\n\t\t\tcontentType,\n\t\t\t{\n\t\t\t\tlabel: \"Workers AI transcription\",\n\t\t\t\tsignal: (options as { signal?: AbortSignal }).signal,\n\t\t\t},\n\t\t);\n\n\t\tconst data = (await response.json()) as {\n\t\t\tresult?: Record<string, unknown>;\n\t\t} & Record<string, unknown>;\n\n\t\treturn this.normalizeResult(data.result ?? data);\n\t}\n\n\tprivate async transcribeViaGateway(\n\t\taudioPayload: Record<string, unknown>,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TranscriptionResult> {\n\t\tconst gatewayConfig = this.adapterConfig as AiGatewayAdapterConfig;\n\t\tconst gatewayFetch = createGatewayFetch(\"workers-ai\", gatewayConfig);\n\n\t\t// The URL here is a placeholder — createGatewayFetch for \"workers-ai\" extracts\n\t\t// the model from the body, sets it as the endpoint, and routes through the gateway.\n\t\t// The actual URL path is not used.\n\t\tconst response = await gatewayFetch(\"https://api.cloudflare.com/v1/audio/transcriptions\", {\n\t\t\tmethod: \"POST\",\n\t\t\tbody: JSON.stringify({\n\t\t\t\tmodel: this.model,\n\t\t\t\t...audioPayload,\n\t\t\t\t...options,\n\t\t\t}),\n\t\t});\n\n\t\tif (!response.ok) {\n\t\t\tconst errorText = await response.text();\n\t\t\tthrow new Error(\n\t\t\t\t`Workers AI transcription gateway request failed (${response.status}): ${errorText}`,\n\t\t\t);\n\t\t}\n\n\t\tconst data = (await response.json()) as Record<string, unknown>;\n\t\treturn this.normalizeResult(data);\n\t}\n\n\t/**\n\t * Normalize Workers AI transcription results into the standard\n\t * TanStack AI TranscriptionResult shape.\n\t *\n\t * Handles three response formats:\n\t * - Whisper: `{ text, words?, vtt? }`\n\t * - Whisper v3-turbo: `{ text, segments?, transcription_info? }`\n\t * - Deepgram Nova-3: `{ results: { channels: [{ alternatives: [{ transcript, words }] }] } }`\n\t */\n\tprivate normalizeResult(raw: Record<string, unknown>): TranscriptionResult {\n\t\t// Deepgram Nova-3 format: { results: { channels: [{ alternatives: [{ transcript, words }] }] } }\n\t\tconst results = raw.results as Record<string, unknown> | undefined;\n\t\tif (results?.channels) {\n\t\t\tconst channels = results.channels as Array<{\n\t\t\t\talternatives?: Array<{\n\t\t\t\t\ttranscript?: string;\n\t\t\t\t\tconfidence?: number;\n\t\t\t\t\twords?: Array<{ word: string; start: number; end: number; confidence: number }>;\n\t\t\t\t}>;\n\t\t\t}>;\n\t\t\tconst alt = channels?.[0]?.alternatives?.[0];\n\t\t\tconst text = alt?.transcript ?? \"\";\n\t\t\tconst result: TranscriptionResult = {\n\t\t\t\tid: this.generateId(),\n\t\t\t\tmodel: this.model,\n\t\t\t\ttext,\n\t\t\t};\n\t\t\tif (alt?.words && Array.isArray(alt.words)) {\n\t\t\t\tresult.words = alt.words.map((w) => ({\n\t\t\t\t\tword: w.word ?? \"\",\n\t\t\t\t\tstart: w.start ?? 0,\n\t\t\t\t\tend: w.end ?? 0,\n\t\t\t\t}));\n\t\t\t}\n\t\t\treturn result;\n\t\t}\n\n\t\t// Whisper format: { text, words?, vtt? }\n\t\t// Whisper v3-turbo format: { text, segments?, transcription_info? }\n\t\tconst result: TranscriptionResult = {\n\t\t\tid: this.generateId(),\n\t\t\tmodel: this.model,\n\t\t\ttext: (raw.text as string) ?? \"\",\n\t\t};\n\n\t\t// Language from transcription_info (whisper-large-v3-turbo)\n\t\tconst transcriptionInfo = raw.transcription_info as Record<string, unknown> | undefined;\n\t\tif (transcriptionInfo?.language) {\n\t\t\tresult.language = transcriptionInfo.language as string;\n\t\t}\n\n\t\t// Duration\n\t\tif (transcriptionInfo?.duration != null) {\n\t\t\tresult.duration = transcriptionInfo.duration as number;\n\t\t}\n\n\t\t// Segments (whisper-large-v3-turbo returns these)\n\t\tif (raw.segments && Array.isArray(raw.segments)) {\n\t\t\tresult.segments = raw.segments.map((seg: Record<string, unknown>, idx: number) => ({\n\t\t\t\tid: idx,\n\t\t\t\ttext: (seg.text as string) ?? \"\",\n\t\t\t\tstart: (seg.start as number) ?? 0,\n\t\t\t\tend: (seg.end as number) ?? 0,\n\t\t\t}));\n\t\t}\n\n\t\t// Words — basic whisper returns top-level words[], v3-turbo nests them in segments\n\t\tif (raw.words && Array.isArray(raw.words)) {\n\t\t\tresult.words = raw.words.map((w: Record<string, unknown>) => ({\n\t\t\t\tword: (w.word as string) ?? \"\",\n\t\t\t\tstart: (w.start as number) ?? 0,\n\t\t\t\tend: (w.end as number) ?? 0,\n\t\t\t}));\n\t\t}\n\n\t\treturn result;\n\t}\n}\n\n// ---------------------------------------------------------------------------\n// Factory function\n// ---------------------------------------------------------------------------\n\n/**\n * Creates a Workers AI transcription adapter for speech-to-text.\n *\n * Works with TanStack AI's `generateTranscription()` activity function:\n * ```ts\n * import { generateTranscription } from \"@tanstack/ai\";\n * import { createWorkersAiTranscription } from \"@cloudflare/tanstack-ai\";\n *\n * const adapter = createWorkersAiTranscription(\n * \"@cf/openai/whisper-large-v3-turbo\",\n * { binding: env.AI },\n * );\n *\n * const result = await generateTranscription({ adapter, audio: audioData });\n * // result.text — the transcribed text\n * ```\n *\n * Note: Factory takes `(model, config)` for ergonomics — the class constructor\n * uses `(config, model)` to match TanStack AI's upstream convention.\n */\nexport function createWorkersAiTranscription(\n\tmodel: WorkersAiTranscriptionModel,\n\tconfig: WorkersAiAdapterConfig,\n) {\n\treturn new WorkersAiTranscriptionAdapter(config, model);\n}\n\n// ---------------------------------------------------------------------------\n// Utilities\n// ---------------------------------------------------------------------------\n\n/**\n * Normalize various audio input formats into a number[] (raw bytes).\n *\n * Note: `File extends Blob`, so `File` instances are handled by the\n * `instanceof Blob` branch. `Blob.arrayBuffer()` always reads the full\n * contents regardless of any prior reads — there's no cursor to worry about.\n */\nasync function normalizeAudioToBytes(audio: string | File | Blob | ArrayBuffer): Promise<number[]> {\n\tif (audio instanceof ArrayBuffer) {\n\t\treturn Array.from(new Uint8Array(audio));\n\t}\n\n\tif (audio instanceof Blob) {\n\t\t// This also handles `File` (which extends Blob)\n\t\tconst buffer = await audio.arrayBuffer();\n\t\treturn Array.from(new Uint8Array(buffer));\n\t}\n\n\tif (typeof audio === \"string\") {\n\t\t// Assume base64 string — decode to bytes\n\t\tconst binary = atob(audio);\n\t\tconst bytes = new Uint8Array(binary.length);\n\t\tfor (let i = 0; i < binary.length; i++) {\n\t\t\tbytes[i] = binary.charCodeAt(i);\n\t\t}\n\t\treturn Array.from(bytes);\n\t}\n\n\tthrow new Error(\"Unsupported audio format. Expected string, File, Blob, or ArrayBuffer.\");\n}\n\n/**\n * Detect the MIME type of the audio input for models that require it\n * (e.g., Deepgram Nova-3).\n *\n * - `File` / `Blob`: use the `.type` property (e.g., \"audio/wav\")\n * - `ArrayBuffer` / `string`: defaults to \"audio/wav\"\n */\nfunction detectAudioContentType(audio: string | File | Blob | ArrayBuffer): string {\n\t// File and Blob carry their own MIME type\n\tif (audio instanceof Blob && audio.type) {\n\t\treturn audio.type;\n\t}\n\n\t// For raw bytes, default to audio/wav — this is the most common\n\t// format for transcription inputs and what the E2E tests use.\n\treturn \"audio/wav\";\n}\n"],"mappings":";;;;;;AAyCA,IAAa,gCAAb,cAAmD,yBAAsD;CAIxG,YAAY,QAAgC,OAAoC;AAC/E,QAAM,EAAE,EAAE,MAAM;wBAJR,QAAO,2BAAoC;wBAC5C,iBAAA,KAAA,EAAsC;AAI7C,0BAAwB,OAAO;AAC/B,OAAK,gBAAgB;;CAGtB,MAAM,WAAW,SAA6D;EAC7E,MAAM,EAAE,OAAO,UAAU,QAAQ,iBAAiB;EAGlD,MAAM,aAAa,MAAM,sBAAsB,MAAM;EAErD,MAAM,QAAiC,EAAE,GAAG,cAAc;AAC1D,MAAI,SAAU,OAAM,WAAW;AAC/B,MAAI,OAAQ,OAAM,iBAAiB;EAOnC,MAAM,eAAe,KAAK,kBAAkB,YAAY,MAAM;AAE9D,MAAI,sBAAsB,KAAK,cAAc,CAC5C,QAAO,KAAK,qBAAqB,cAAc,MAAM;AAGtD,MAAI,0BAA0B,KAAK,cAAc,EAAE;AAElD,OAAI,KAAK,UAAU,sBAClB,QAAO,KAAK,wBAAwB,YAAY,OAAO,MAAM;AAE9D,UAAO,KAAK,kBAAkB,cAAc,MAAM;;AAGnD,SAAO,KAAK,qBAAqB,cAAc,MAAM;;;;;;;;;CAUtD,kBACC,YACA,eAC0B;AAC1B,MAAI,KAAK,UAAU,sBAGlB,QAAO,EAAE,OAAO;GAAE,MAFN,mBAAmB,IAAI,WAAW,WAAW,CAAC;GAE7B,aADT,uBAAuB,cAAc;GACf,EAAE;AAG7C,MAAI,KAAK,UAAU,oCAClB,QAAO,EAAE,OAAO,mBAAmB,IAAI,WAAW,WAAW,CAAC,EAAE;AAGjE,SAAO,EAAE,OAAO,YAAY;;CAG7B,MAAc,qBACb,cACA,SAC+B;EAE/B,MAAM,SAAU,MADJ,KAAK,cAA+C,QACvC,IAAI,KAAK,OAAO;GACxC,GAAG;GACH,GAAG;GACH,CAAC;AACF,SAAO,KAAK,gBAAgB,OAAO;;CAGpC,MAAc,kBACb,cACA,SAC+B;EAC/B,MAAM,SAAS,KAAK;EAYpB,MAAM,OAAQ,OAVG,MAAM,mBACtB,QACA,KAAK,OACL;GAAE,GAAG;GAAc,GAAG;GAAS,EAC/B;GACC,OAAO;GACP,QAAS,QAAqC;GAC9C,CACD,EAE4B,MAAM;AAMnC,SAAO,KAAK,gBAAgB,KAAK,UAAU,KAAK;;;;;;;CAQjD,MAAc,wBACb,YACA,eACA,SAC+B;EAC/B,MAAM,SAAS,KAAK;EACpB,MAAM,cAAc,uBAAuB,cAAc;EAazD,MAAM,OAAQ,OAXG,MAAM,yBACtB,QACA,KAAK,OACL,IAAI,WAAW,WAAW,EAC1B,aACA;GACC,OAAO;GACP,QAAS,QAAqC;GAC9C,CACD,EAE4B,MAAM;AAInC,SAAO,KAAK,gBAAgB,KAAK,UAAU,KAAK;;CAGjD,MAAc,qBACb,cACA,SAC+B;EAC/B,MAAM,gBAAgB,KAAK;EAM3B,MAAM,WAAW,MALI,mBAAmB,cAAc,cAAc,CAKhC,sDAAsD;GACzF,QAAQ;GACR,MAAM,KAAK,UAAU;IACpB,OAAO,KAAK;IACZ,GAAG;IACH,GAAG;IACH,CAAC;GACF,CAAC;AAEF,MAAI,CAAC,SAAS,IAAI;GACjB,MAAM,YAAY,MAAM,SAAS,MAAM;AACvC,SAAM,IAAI,MACT,oDAAoD,SAAS,OAAO,KAAK,YACzE;;EAGF,MAAM,OAAQ,MAAM,SAAS,MAAM;AACnC,SAAO,KAAK,gBAAgB,KAAK;;;;;;;;;;;CAYlC,gBAAwB,KAAmD;EAE1E,MAAM,UAAU,IAAI;AACpB,MAAI,SAAS,UAAU;GAQtB,MAAM,MAPW,QAAQ,WAOF,IAAI,eAAe;GAC1C,MAAM,OAAO,KAAK,cAAc;GAChC,MAAM,SAA8B;IACnC,IAAI,KAAK,YAAY;IACrB,OAAO,KAAK;IACZ;IACA;AACD,OAAI,KAAK,SAAS,MAAM,QAAQ,IAAI,MAAM,CACzC,QAAO,QAAQ,IAAI,MAAM,KAAK,OAAO;IACpC,MAAM,EAAE,QAAQ;IAChB,OAAO,EAAE,SAAS;IAClB,KAAK,EAAE,OAAO;IACd,EAAE;AAEJ,UAAO;;EAKR,MAAM,SAA8B;GACnC,IAAI,KAAK,YAAY;GACrB,OAAO,KAAK;GACZ,MAAO,IAAI,QAAmB;GAC9B;EAGD,MAAM,oBAAoB,IAAI;AAC9B,MAAI,mBAAmB,SACtB,QAAO,WAAW,kBAAkB;AAIrC,MAAI,mBAAmB,YAAY,KAClC,QAAO,WAAW,kBAAkB;AAIrC,MAAI,IAAI,YAAY,MAAM,QAAQ,IAAI,SAAS,CAC9C,QAAO,WAAW,IAAI,SAAS,KAAK,KAA8B,SAAiB;GAClF,IAAI;GACJ,MAAO,IAAI,QAAmB;GAC9B,OAAQ,IAAI,SAAoB;GAChC,KAAM,IAAI,OAAkB;GAC5B,EAAE;AAIJ,MAAI,IAAI,SAAS,MAAM,QAAQ,IAAI,MAAM,CACxC,QAAO,QAAQ,IAAI,MAAM,KAAK,OAAgC;GAC7D,MAAO,EAAE,QAAmB;GAC5B,OAAQ,EAAE,SAAoB;GAC9B,KAAM,EAAE,OAAkB;GAC1B,EAAE;AAGJ,SAAO;;;;;;;;;;;;;;;;;;;;;;;AA4BT,SAAgB,6BACf,OACA,QACC;AACD,QAAO,IAAI,8BAA8B,QAAQ,MAAM;;;;;;;;;AAcxD,eAAe,sBAAsB,OAA8D;AAClG,KAAI,iBAAiB,YACpB,QAAO,MAAM,KAAK,IAAI,WAAW,MAAM,CAAC;AAGzC,KAAI,iBAAiB,MAAM;EAE1B,MAAM,SAAS,MAAM,MAAM,aAAa;AACxC,SAAO,MAAM,KAAK,IAAI,WAAW,OAAO,CAAC;;AAG1C,KAAI,OAAO,UAAU,UAAU;EAE9B,MAAM,SAAS,KAAK,MAAM;EAC1B,MAAM,QAAQ,IAAI,WAAW,OAAO,OAAO;AAC3C,OAAK,IAAI,IAAI,GAAG,IAAI,OAAO,QAAQ,IAClC,OAAM,KAAK,OAAO,WAAW,EAAE;AAEhC,SAAO,MAAM,KAAK,MAAM;;AAGzB,OAAM,IAAI,MAAM,yEAAyE;;;;;;;;;AAU1F,SAAS,uBAAuB,OAAmD;AAElF,KAAI,iBAAiB,QAAQ,MAAM,KAClC,QAAO,MAAM;AAKd,QAAO"}
1
+ {"version":3,"file":"workers-ai-transcription.mjs","names":[],"sources":["../../src/adapters/workers-ai-transcription.ts"],"sourcesContent":["import { BaseTranscriptionAdapter } from \"@tanstack/ai/adapters\";\nimport type { TranscriptionOptions, TranscriptionResult } from \"@tanstack/ai\";\nimport {\n\ttype WorkersAiAdapterConfig,\n\ttype WorkersAiDirectBindingConfig,\n\ttype WorkersAiDirectCredentialsConfig,\n\ttype AiGatewayAdapterConfig,\n\tcreateGatewayFetch,\n\tisDirectBindingConfig,\n\tisDirectCredentialsConfig,\n\tvalidateWorkersAiConfig,\n} from \"../utils/create-fetcher\";\nimport { workersAiRestFetch, workersAiRestFetchBinary } from \"../utils/workers-ai-rest\";\nimport { uint8ArrayToBase64 } from \"../utils/binary\";\n\n// ---------------------------------------------------------------------------\n// Model types\n// ---------------------------------------------------------------------------\n\n/**\n * Workers AI models that support speech-to-text transcription.\n *\n * Note: the typed `AiModels` interface in `@cloudflare/workers-types` may lag\n * behind what's deployed. We use a string union here that matches the known\n * models including Deepgram partner models.\n *\n * **Nova-3 note:** `@cf/deepgram/nova-3` uses a different input format than the\n * Whisper models. Via binding it accepts `{ audio: { body: base64, contentType } }`.\n * Via REST it requires multipart form data (not JSON). The adapter handles both.\n */\nexport type WorkersAiTranscriptionModel =\n\t| \"@cf/openai/whisper\"\n\t| \"@cf/openai/whisper-tiny-en\"\n\t| \"@cf/openai/whisper-large-v3-turbo\"\n\t| \"@cf/deepgram/nova-3\"\n\t| (string & {});\n\n// ---------------------------------------------------------------------------\n// WorkersAiTranscriptionAdapter\n// ---------------------------------------------------------------------------\n\nexport class WorkersAiTranscriptionAdapter extends BaseTranscriptionAdapter<WorkersAiTranscriptionModel> {\n\treadonly name = \"workers-ai-transcription\" as const;\n\tprivate adapterConfig: WorkersAiAdapterConfig;\n\n\tconstructor(config: WorkersAiAdapterConfig, model: WorkersAiTranscriptionModel) {\n\t\tsuper(model);\n\t\tvalidateWorkersAiConfig(config);\n\t\tthis.adapterConfig = config;\n\t}\n\n\tasync transcribe(options: TranscriptionOptions): Promise<TranscriptionResult> {\n\t\tconst { audio, language, prompt, modelOptions } = options;\n\n\t\t// Normalize audio to raw bytes\n\t\tconst audioBytes = await normalizeAudioToBytes(audio);\n\n\t\tconst extra: Record<string, unknown> = { ...modelOptions };\n\t\tif (language) extra.language = language;\n\t\tif (prompt) extra.initial_prompt = prompt;\n\n\t\t// Build the model-specific audio payload:\n\t\t// - Deepgram Nova-3 (binding): { audio: { body: base64, contentType: \"audio/...\" } }\n\t\t// - Deepgram Nova-3 (REST): multipart FormData (handled separately)\n\t\t// - Whisper Large v3 Turbo (REST/gateway): { audio: base64string }\n\t\t// - Other Whisper models (binding): { audio: number[] }\n\t\tconst audioPayload = this.buildAudioPayload(audioBytes, audio);\n\n\t\tif (isDirectBindingConfig(this.adapterConfig)) {\n\t\t\treturn this.transcribeViaBinding(audioPayload, extra);\n\t\t}\n\n\t\tif (isDirectCredentialsConfig(this.adapterConfig)) {\n\t\t\t// Nova-3 REST requires raw binary audio, not JSON\n\t\t\tif (this.model === \"@cf/deepgram/nova-3\") {\n\t\t\t\treturn this.transcribeViaRestBinary(audioBytes, audio, extra);\n\t\t\t}\n\t\t\treturn this.transcribeViaRest(audioPayload, extra);\n\t\t}\n\n\t\treturn this.transcribeViaGateway(audioPayload, extra);\n\t}\n\n\t/**\n\t * Build the audio field for the request payload, handling model-specific formats.\n\t *\n\t * - `@cf/deepgram/nova-3` requires `{ body: base64, contentType: \"audio/...\" }`\n\t * - `@cf/openai/whisper-large-v3-turbo` REST/gateway accepts a base64 string\n\t * - Other Whisper models accept `number[]` (binding) or base64 (REST)\n\t */\n\tprivate buildAudioPayload(\n\t\taudioBytes: number[],\n\t\toriginalAudio: string | File | Blob | ArrayBuffer,\n\t): Record<string, unknown> {\n\t\tif (this.model === \"@cf/deepgram/nova-3\") {\n\t\t\tconst b64 = uint8ArrayToBase64(new Uint8Array(audioBytes));\n\t\t\tconst contentType = detectAudioContentType(originalAudio);\n\t\t\treturn { audio: { body: b64, contentType } };\n\t\t}\n\n\t\tif (this.model === \"@cf/openai/whisper-large-v3-turbo\") {\n\t\t\treturn { audio: uint8ArrayToBase64(new Uint8Array(audioBytes)) };\n\t\t}\n\n\t\treturn { audio: audioBytes };\n\t}\n\n\tprivate async transcribeViaBinding(\n\t\taudioPayload: Record<string, unknown>,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TranscriptionResult> {\n\t\tconst ai = (this.adapterConfig as WorkersAiDirectBindingConfig).binding;\n\t\tconst result = (await ai.run(this.model, {\n\t\t\t...audioPayload,\n\t\t\t...options,\n\t\t})) as Record<string, unknown>;\n\t\treturn this.normalizeResult(result);\n\t}\n\n\tprivate async transcribeViaRest(\n\t\taudioPayload: Record<string, unknown>,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TranscriptionResult> {\n\t\tconst config = this.adapterConfig as WorkersAiDirectCredentialsConfig;\n\n\t\tconst response = await workersAiRestFetch(\n\t\t\tconfig,\n\t\t\tthis.model,\n\t\t\t{ ...audioPayload, ...options },\n\t\t\t{\n\t\t\t\tlabel: \"Workers AI transcription\",\n\t\t\t\tsignal: (options as { signal?: AbortSignal }).signal,\n\t\t\t},\n\t\t);\n\n\t\tconst data = (await response.json()) as {\n\t\t\tresult?: Record<string, unknown>;\n\t\t} & Record<string, unknown>;\n\n\t\t// Cloudflare REST API wraps responses in { success, result: {...} }.\n\t\t// Use `data.result` when present, fall back to `data` for direct responses.\n\t\treturn this.normalizeResult(data.result ?? data);\n\t}\n\n\t/**\n\t * Transcribe via REST using raw binary audio.\n\t * Required for models like Deepgram Nova-3 that expect raw audio bytes\n\t * with a Content-Type header (e.g. \"audio/wav\") instead of JSON.\n\t */\n\tprivate async transcribeViaRestBinary(\n\t\taudioBytes: number[],\n\t\toriginalAudio: string | File | Blob | ArrayBuffer,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TranscriptionResult> {\n\t\tconst config = this.adapterConfig as WorkersAiDirectCredentialsConfig;\n\t\tconst contentType = detectAudioContentType(originalAudio);\n\n\t\tconst response = await workersAiRestFetchBinary(\n\t\t\tconfig,\n\t\t\tthis.model,\n\t\t\tnew Uint8Array(audioBytes),\n\t\t\tcontentType,\n\t\t\t{\n\t\t\t\tlabel: \"Workers AI transcription\",\n\t\t\t\tsignal: (options as { signal?: AbortSignal }).signal,\n\t\t\t},\n\t\t);\n\n\t\tconst data = (await response.json()) as {\n\t\t\tresult?: Record<string, unknown>;\n\t\t} & Record<string, unknown>;\n\n\t\treturn this.normalizeResult(data.result ?? data);\n\t}\n\n\tprivate async transcribeViaGateway(\n\t\taudioPayload: Record<string, unknown>,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TranscriptionResult> {\n\t\tconst gatewayConfig = this.adapterConfig as AiGatewayAdapterConfig;\n\t\tconst gatewayFetch = createGatewayFetch(\"workers-ai\", gatewayConfig);\n\n\t\t// The URL here is a placeholder — createGatewayFetch for \"workers-ai\" extracts\n\t\t// the model from the body, sets it as the endpoint, and routes through the gateway.\n\t\t// The actual URL path is not used.\n\t\tconst response = await gatewayFetch(\"https://api.cloudflare.com/v1/audio/transcriptions\", {\n\t\t\tmethod: \"POST\",\n\t\t\tbody: JSON.stringify({\n\t\t\t\tmodel: this.model,\n\t\t\t\t...audioPayload,\n\t\t\t\t...options,\n\t\t\t}),\n\t\t});\n\n\t\tif (!response.ok) {\n\t\t\tconst errorText = await response.text();\n\t\t\tthrow new Error(\n\t\t\t\t`Workers AI transcription gateway request failed (${response.status}): ${errorText}`,\n\t\t\t);\n\t\t}\n\n\t\tconst data = (await response.json()) as Record<string, unknown>;\n\t\treturn this.normalizeResult(data);\n\t}\n\n\t/**\n\t * Normalize Workers AI transcription results into the standard\n\t * TanStack AI TranscriptionResult shape.\n\t *\n\t * Handles three response formats:\n\t * - Whisper: `{ text, words?, vtt? }`\n\t * - Whisper v3-turbo: `{ text, segments?, transcription_info? }`\n\t * - Deepgram Nova-3: `{ results: { channels: [{ alternatives: [{ transcript, words }] }] } }`\n\t */\n\tprivate normalizeResult(raw: Record<string, unknown>): TranscriptionResult {\n\t\t// Deepgram Nova-3 format: { results: { channels: [{ alternatives: [{ transcript, words }] }] } }\n\t\tconst results = raw.results as Record<string, unknown> | undefined;\n\t\tif (results?.channels) {\n\t\t\tconst channels = results.channels as Array<{\n\t\t\t\talternatives?: Array<{\n\t\t\t\t\ttranscript?: string;\n\t\t\t\t\tconfidence?: number;\n\t\t\t\t\twords?: Array<{ word: string; start: number; end: number; confidence: number }>;\n\t\t\t\t}>;\n\t\t\t}>;\n\t\t\tconst alt = channels?.[0]?.alternatives?.[0];\n\t\t\tconst text = alt?.transcript ?? \"\";\n\t\t\tconst result: TranscriptionResult = {\n\t\t\t\tid: this.generateId(),\n\t\t\t\tmodel: this.model,\n\t\t\t\ttext,\n\t\t\t};\n\t\t\tif (alt?.words && Array.isArray(alt.words)) {\n\t\t\t\tresult.words = alt.words.map((w) => ({\n\t\t\t\t\tword: w.word ?? \"\",\n\t\t\t\t\tstart: w.start ?? 0,\n\t\t\t\t\tend: w.end ?? 0,\n\t\t\t\t}));\n\t\t\t}\n\t\t\treturn result;\n\t\t}\n\n\t\t// Whisper format: { text, words?, vtt? }\n\t\t// Whisper v3-turbo format: { text, segments?, transcription_info? }\n\t\tconst result: TranscriptionResult = {\n\t\t\tid: this.generateId(),\n\t\t\tmodel: this.model,\n\t\t\ttext: (raw.text as string) ?? \"\",\n\t\t};\n\n\t\t// Language from transcription_info (whisper-large-v3-turbo)\n\t\tconst transcriptionInfo = raw.transcription_info as Record<string, unknown> | undefined;\n\t\tif (transcriptionInfo?.language) {\n\t\t\tresult.language = transcriptionInfo.language as string;\n\t\t}\n\n\t\t// Duration\n\t\tif (transcriptionInfo?.duration != null) {\n\t\t\tresult.duration = transcriptionInfo.duration as number;\n\t\t}\n\n\t\t// Segments (whisper-large-v3-turbo returns these)\n\t\tif (raw.segments && Array.isArray(raw.segments)) {\n\t\t\tresult.segments = raw.segments.map((seg: Record<string, unknown>, idx: number) => ({\n\t\t\t\tid: idx,\n\t\t\t\ttext: (seg.text as string) ?? \"\",\n\t\t\t\tstart: (seg.start as number) ?? 0,\n\t\t\t\tend: (seg.end as number) ?? 0,\n\t\t\t}));\n\t\t}\n\n\t\t// Words — basic whisper returns top-level words[], v3-turbo nests them in segments\n\t\tif (raw.words && Array.isArray(raw.words)) {\n\t\t\tresult.words = raw.words.map((w: Record<string, unknown>) => ({\n\t\t\t\tword: (w.word as string) ?? \"\",\n\t\t\t\tstart: (w.start as number) ?? 0,\n\t\t\t\tend: (w.end as number) ?? 0,\n\t\t\t}));\n\t\t}\n\n\t\treturn result;\n\t}\n}\n\n// ---------------------------------------------------------------------------\n// Factory function\n// ---------------------------------------------------------------------------\n\n/**\n * Creates a Workers AI transcription adapter for speech-to-text.\n *\n * Works with TanStack AI's `generateTranscription()` activity function:\n * ```ts\n * import { generateTranscription } from \"@tanstack/ai\";\n * import { createWorkersAiTranscription } from \"@cloudflare/tanstack-ai\";\n *\n * const adapter = createWorkersAiTranscription(\n * \"@cf/openai/whisper-large-v3-turbo\",\n * { binding: env.AI },\n * );\n *\n * const result = await generateTranscription({ adapter, audio: audioData });\n * // result.text — the transcribed text\n * ```\n *\n * Note: Factory takes `(model, config)` for ergonomics — the class constructor\n * uses `(config, model)` to match TanStack AI's upstream convention.\n */\nexport function createWorkersAiTranscription(\n\tmodel: WorkersAiTranscriptionModel,\n\tconfig: WorkersAiAdapterConfig,\n) {\n\treturn new WorkersAiTranscriptionAdapter(config, model);\n}\n\n// ---------------------------------------------------------------------------\n// Utilities\n// ---------------------------------------------------------------------------\n\n/**\n * Normalize various audio input formats into a number[] (raw bytes).\n *\n * Note: `File extends Blob`, so `File` instances are handled by the\n * `instanceof Blob` branch. `Blob.arrayBuffer()` always reads the full\n * contents regardless of any prior reads — there's no cursor to worry about.\n */\nasync function normalizeAudioToBytes(audio: string | File | Blob | ArrayBuffer): Promise<number[]> {\n\tif (audio instanceof ArrayBuffer) {\n\t\treturn Array.from(new Uint8Array(audio));\n\t}\n\n\tif (audio instanceof Blob) {\n\t\t// This also handles `File` (which extends Blob)\n\t\tconst buffer = await audio.arrayBuffer();\n\t\treturn Array.from(new Uint8Array(buffer));\n\t}\n\n\tif (typeof audio === \"string\") {\n\t\t// Assume base64 string — decode to bytes\n\t\tconst binary = atob(audio);\n\t\tconst bytes = new Uint8Array(binary.length);\n\t\tfor (let i = 0; i < binary.length; i++) {\n\t\t\tbytes[i] = binary.charCodeAt(i);\n\t\t}\n\t\treturn Array.from(bytes);\n\t}\n\n\tthrow new Error(\"Unsupported audio format. Expected string, File, Blob, or ArrayBuffer.\");\n}\n\n/**\n * Detect the MIME type of the audio input for models that require it\n * (e.g., Deepgram Nova-3).\n *\n * - `File` / `Blob`: use the `.type` property (e.g., \"audio/wav\")\n * - `ArrayBuffer` / `string`: defaults to \"audio/wav\"\n */\nfunction detectAudioContentType(audio: string | File | Blob | ArrayBuffer): string {\n\t// File and Blob carry their own MIME type\n\tif (audio instanceof Blob && audio.type) {\n\t\treturn audio.type;\n\t}\n\n\t// For raw bytes, default to audio/wav — this is the most common\n\t// format for transcription inputs and what the E2E tests use.\n\treturn \"audio/wav\";\n}\n"],"mappings":";;;;;;AAyCA,IAAa,gCAAb,cAAmD,yBAAsD;CAIxG,YAAY,QAAgC,OAAoC;EAC/E,MAAM,KAAK;wBAJH,QAAO,0BAAA;wBACR,iBAAA,KAAA,CAAA;EAIP,wBAAwB,MAAM;EAC9B,KAAK,gBAAgB;CACtB;CAEA,MAAM,WAAW,SAA6D;EAC7E,MAAM,EAAE,OAAO,UAAU,QAAQ,iBAAiB;EAGlD,MAAM,aAAa,MAAM,sBAAsB,KAAK;EAEpD,MAAM,QAAiC,EAAE,GAAG,aAAa;EACzD,IAAI,UAAU,MAAM,WAAW;EAC/B,IAAI,QAAQ,MAAM,iBAAiB;EAOnC,MAAM,eAAe,KAAK,kBAAkB,YAAY,KAAK;EAE7D,IAAI,sBAAsB,KAAK,aAAa,GAC3C,OAAO,KAAK,qBAAqB,cAAc,KAAK;EAGrD,IAAI,0BAA0B,KAAK,aAAa,GAAG;GAElD,IAAI,KAAK,UAAU,uBAClB,OAAO,KAAK,wBAAwB,YAAY,OAAO,KAAK;GAE7D,OAAO,KAAK,kBAAkB,cAAc,KAAK;EAClD;EAEA,OAAO,KAAK,qBAAqB,cAAc,KAAK;CACrD;;;;;;;;CASA,kBACC,YACA,eAC0B;EAC1B,IAAI,KAAK,UAAU,uBAGlB,OAAO,EAAE,OAAO;GAAE,MAFN,mBAAmB,IAAI,WAAW,UAAU,CAE9B;GAAG,aADT,uBAAuB,aACJ;EAAE,EAAE;EAG5C,IAAI,KAAK,UAAU,qCAClB,OAAO,EAAE,OAAO,mBAAmB,IAAI,WAAW,UAAU,CAAC,EAAE;EAGhE,OAAO,EAAE,OAAO,WAAW;CAC5B;CAEA,MAAc,qBACb,cACA,SAC+B;EAE/B,MAAM,SAAU,MADJ,KAAK,cAA+C,QACvC,IAAI,KAAK,OAAO;GACxC,GAAG;GACH,GAAG;EACJ,CAAC;EACD,OAAO,KAAK,gBAAgB,MAAM;CACnC;CAEA,MAAc,kBACb,cACA,SAC+B;EAC/B,MAAM,SAAS,KAAK;EAYpB,MAAM,OAAQ,OAAM,MAVG,mBACtB,QACA,KAAK,OACL;GAAE,GAAG;GAAc,GAAG;EAAQ,GAC9B;GACC,OAAO;GACP,QAAS,QAAqC;EAC/C,CACD,EAAA,CAE6B,KAAK;EAMlC,OAAO,KAAK,gBAAgB,KAAK,UAAU,IAAI;CAChD;;;;;;CAOA,MAAc,wBACb,YACA,eACA,SAC+B;EAC/B,MAAM,SAAS,KAAK;EACpB,MAAM,cAAc,uBAAuB,aAAa;EAaxD,MAAM,OAAQ,OAAM,MAXG,yBACtB,QACA,KAAK,OACL,IAAI,WAAW,UAAU,GACzB,aACA;GACC,OAAO;GACP,QAAS,QAAqC;EAC/C,CACD,EAAA,CAE6B,KAAK;EAIlC,OAAO,KAAK,gBAAgB,KAAK,UAAU,IAAI;CAChD;CAEA,MAAc,qBACb,cACA,SAC+B;EAC/B,MAAM,gBAAgB,KAAK;EAM3B,MAAM,WAAW,MALI,mBAAmB,cAAc,aAKpB,CAAC,CAAC,sDAAsD;GACzF,QAAQ;GACR,MAAM,KAAK,UAAU;IACpB,OAAO,KAAK;IACZ,GAAG;IACH,GAAG;GACJ,CAAC;EACF,CAAC;EAED,IAAI,CAAC,SAAS,IAAI;GACjB,MAAM,YAAY,MAAM,SAAS,KAAK;GACtC,MAAM,IAAI,MACT,oDAAoD,SAAS,OAAO,KAAK,WAC1E;EACD;EAEA,MAAM,OAAQ,MAAM,SAAS,KAAK;EAClC,OAAO,KAAK,gBAAgB,IAAI;CACjC;;;;;;;;;;CAWA,gBAAwB,KAAmD;EAE1E,MAAM,UAAU,IAAI;EACpB,IAAI,SAAS,UAAU;GAQtB,MAAM,MAPW,QAAQ,WAOF,EAAE,EAAE,eAAe;GAC1C,MAAM,OAAO,KAAK,cAAc;GAChC,MAAM,SAA8B;IACnC,IAAI,KAAK,WAAW;IACpB,OAAO,KAAK;IACZ;GACD;GACA,IAAI,KAAK,SAAS,MAAM,QAAQ,IAAI,KAAK,GACxC,OAAO,QAAQ,IAAI,MAAM,KAAK,OAAO;IACpC,MAAM,EAAE,QAAQ;IAChB,OAAO,EAAE,SAAS;IAClB,KAAK,EAAE,OAAO;GACf,EAAE;GAEH,OAAO;EACR;EAIA,MAAM,SAA8B;GACnC,IAAI,KAAK,WAAW;GACpB,OAAO,KAAK;GACZ,MAAO,IAAI,QAAmB;EAC/B;EAGA,MAAM,oBAAoB,IAAI;EAC9B,IAAI,mBAAmB,UACtB,OAAO,WAAW,kBAAkB;EAIrC,IAAI,mBAAmB,YAAY,MAClC,OAAO,WAAW,kBAAkB;EAIrC,IAAI,IAAI,YAAY,MAAM,QAAQ,IAAI,QAAQ,GAC7C,OAAO,WAAW,IAAI,SAAS,KAAK,KAA8B,SAAiB;GAClF,IAAI;GACJ,MAAO,IAAI,QAAmB;GAC9B,OAAQ,IAAI,SAAoB;GAChC,KAAM,IAAI,OAAkB;EAC7B,EAAE;EAIH,IAAI,IAAI,SAAS,MAAM,QAAQ,IAAI,KAAK,GACvC,OAAO,QAAQ,IAAI,MAAM,KAAK,OAAgC;GAC7D,MAAO,EAAE,QAAmB;GAC5B,OAAQ,EAAE,SAAoB;GAC9B,KAAM,EAAE,OAAkB;EAC3B,EAAE;EAGH,OAAO;CACR;AACD;;;;;;;;;;;;;;;;;;;;;AA0BA,SAAgB,6BACf,OACA,QACC;CACD,OAAO,IAAI,8BAA8B,QAAQ,KAAK;AACvD;;;;;;;;AAaA,eAAe,sBAAsB,OAA8D;CAClG,IAAI,iBAAiB,aACpB,OAAO,MAAM,KAAK,IAAI,WAAW,KAAK,CAAC;CAGxC,IAAI,iBAAiB,MAAM;EAE1B,MAAM,SAAS,MAAM,MAAM,YAAY;EACvC,OAAO,MAAM,KAAK,IAAI,WAAW,MAAM,CAAC;CACzC;CAEA,IAAI,OAAO,UAAU,UAAU;EAE9B,MAAM,SAAS,KAAK,KAAK;EACzB,MAAM,QAAQ,IAAI,WAAW,OAAO,MAAM;EAC1C,KAAK,IAAI,IAAI,GAAG,IAAI,OAAO,QAAQ,KAClC,MAAM,KAAK,OAAO,WAAW,CAAC;EAE/B,OAAO,MAAM,KAAK,KAAK;CACxB;CAEA,MAAM,IAAI,MAAM,wEAAwE;AACzF;;;;;;;;AASA,SAAS,uBAAuB,OAAmD;CAElF,IAAI,iBAAiB,QAAQ,MAAM,MAClC,OAAO,MAAM;CAKd,OAAO;AACR"}
@@ -1,14 +1,13 @@
1
1
  Object.defineProperty(exports, Symbol.toStringTag, { value: "Module" });
2
- require("../workers-ai-BOZ5iyhY.cjs");
3
- const require_create_fetcher = require("../create-fetcher-By-hTiT9.cjs");
4
- const require_defineProperty = require("../defineProperty-DQoAg20E.cjs");
5
- const require_workers_ai_rest = require("../workers-ai-rest-CkNCtBwv.cjs");
6
- const require_binary = require("../binary-C9FAYwZj.cjs");
2
+ const require_create_fetcher = require("../create-fetcher-YVxWCTVL.cjs");
3
+ const require_defineProperty = require("../defineProperty-In8g9yAD.cjs");
4
+ const require_workers_ai_rest = require("../workers-ai-rest-_MXOmyDs.cjs");
5
+ const require_binary = require("../binary-CZhr1_2n.cjs");
7
6
  let _tanstack_ai_adapters = require("@tanstack/ai/adapters");
8
7
  //#region src/adapters/workers-ai-tts.ts
9
8
  var WorkersAiTTSAdapter = class extends _tanstack_ai_adapters.BaseTTSAdapter {
10
9
  constructor(config, model) {
11
- super({}, model);
10
+ super(model);
12
11
  require_defineProperty._defineProperty(this, "name", "workers-ai-tts");
13
12
  require_defineProperty._defineProperty(this, "adapterConfig", void 0);
14
13
  require_create_fetcher.validateWorkersAiConfig(config);
@@ -1 +1 @@
1
- {"version":3,"file":"workers-ai-tts.cjs","names":["BaseTTSAdapter","isDirectBindingConfig","isDirectCredentialsConfig","workersAiRestFetch","createGatewayFetch","binaryToBase64","uint8ArrayToBase64"],"sources":["../../src/adapters/workers-ai-tts.ts"],"sourcesContent":["import { BaseTTSAdapter } from \"@tanstack/ai/adapters\";\nimport type { TTSOptions, TTSResult } from \"@tanstack/ai\";\nimport {\n\ttype WorkersAiAdapterConfig,\n\ttype WorkersAiDirectBindingConfig,\n\ttype WorkersAiDirectCredentialsConfig,\n\ttype AiGatewayAdapterConfig,\n\tcreateGatewayFetch,\n\tisDirectBindingConfig,\n\tisDirectCredentialsConfig,\n\tvalidateWorkersAiConfig,\n} from \"../utils/create-fetcher\";\nimport { workersAiRestFetch } from \"../utils/workers-ai-rest\";\nimport { binaryToBase64, uint8ArrayToBase64 } from \"../utils/binary\";\n\n// ---------------------------------------------------------------------------\n// Model types\n// ---------------------------------------------------------------------------\n\n/**\n * Workers AI models that support text-to-speech generation.\n *\n * Note: the typed `AiModels` interface in `@cloudflare/workers-types` may lag\n * behind what's deployed. We use a string union here that matches the known\n * models including Deepgram partner models.\n */\nexport type WorkersAiTTSModel =\n\t| \"@cf/deepgram/aura-1\"\n\t| \"@cf/deepgram/aura-2-en\"\n\t| \"@cf/deepgram/aura-2-es\"\n\t| (string & {});\n\n// ---------------------------------------------------------------------------\n// WorkersAiTTSAdapter\n// ---------------------------------------------------------------------------\n\nexport class WorkersAiTTSAdapter extends BaseTTSAdapter<WorkersAiTTSModel> {\n\treadonly name = \"workers-ai-tts\" as const;\n\tprivate adapterConfig: WorkersAiAdapterConfig;\n\n\tconstructor(config: WorkersAiAdapterConfig, model: WorkersAiTTSModel) {\n\t\tsuper({}, model);\n\t\tvalidateWorkersAiConfig(config);\n\t\tthis.adapterConfig = config;\n\t}\n\n\tasync generateSpeech(options: TTSOptions): Promise<TTSResult> {\n\t\tconst { text, voice, format, speed, modelOptions } = options;\n\n\t\t// Workers AI TTS models (Deepgram aura-1) accept { text, lang? }\n\t\tconst extra: Record<string, unknown> = { ...modelOptions };\n\t\tif (voice) extra.voice = voice;\n\t\tif (speed != null) extra.speed = speed;\n\n\t\tif (isDirectBindingConfig(this.adapterConfig)) {\n\t\t\treturn this.generateViaBinding(text, format, extra);\n\t\t}\n\n\t\tif (isDirectCredentialsConfig(this.adapterConfig)) {\n\t\t\treturn this.generateViaRest(text, format, extra);\n\t\t}\n\n\t\treturn this.generateViaGateway(text, format, extra);\n\t}\n\n\tprivate async generateViaBinding(\n\t\ttext: string,\n\t\tformat: string | undefined,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TTSResult> {\n\t\tconst ai = (this.adapterConfig as WorkersAiDirectBindingConfig).binding;\n\t\tconst result = await ai.run(this.model, { text, ...options });\n\n\t\treturn this.normalizeResult(result, format);\n\t}\n\n\tprivate async generateViaRest(\n\t\ttext: string,\n\t\tformat: string | undefined,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TTSResult> {\n\t\tconst config = this.adapterConfig as WorkersAiDirectCredentialsConfig;\n\t\tconst response = await workersAiRestFetch(\n\t\t\tconfig,\n\t\t\tthis.model,\n\t\t\t{ text, ...options },\n\t\t\t{ label: \"Workers AI TTS\", signal: (options as { signal?: AbortSignal }).signal },\n\t\t);\n\n\t\t// Workers AI TTS returns audio bytes directly\n\t\tconst buffer = await response.arrayBuffer();\n\t\treturn this.wrapAudioResult(new Uint8Array(buffer), format);\n\t}\n\n\tprivate async generateViaGateway(\n\t\ttext: string,\n\t\tformat: string | undefined,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TTSResult> {\n\t\tconst gatewayConfig = this.adapterConfig as AiGatewayAdapterConfig;\n\t\tconst gatewayFetch = createGatewayFetch(\"workers-ai\", gatewayConfig);\n\n\t\t// The URL here is a placeholder — createGatewayFetch for \"workers-ai\" extracts\n\t\t// the model from the body, sets it as the endpoint, and routes through the gateway.\n\t\t// The actual URL path is not used.\n\t\tconst response = await gatewayFetch(\"https://api.cloudflare.com/v1/audio/speech\", {\n\t\t\tmethod: \"POST\",\n\t\t\tbody: JSON.stringify({\n\t\t\t\tmodel: this.model,\n\t\t\t\ttext,\n\t\t\t\t...options,\n\t\t\t}),\n\t\t});\n\n\t\tif (!response.ok) {\n\t\t\tconst errorText = await response.text();\n\t\t\tthrow new Error(\n\t\t\t\t`Workers AI TTS gateway request failed (${response.status}): ${errorText}`,\n\t\t\t);\n\t\t}\n\n\t\tconst buffer = await response.arrayBuffer();\n\t\treturn this.wrapAudioResult(new Uint8Array(buffer), format);\n\t}\n\n\t/**\n\t * Normalize binding results. Workers AI TTS can return:\n\t * - Uint8Array / ArrayBuffer (raw audio bytes)\n\t * - ReadableStream<Uint8Array> (streamed audio bytes)\n\t * - { audio: \"base64...\" } (JSON wrapper)\n\t */\n\tprivate async normalizeResult(result: unknown, format: string | undefined): Promise<TTSResult> {\n\t\t// Use the shared binaryToBase64 helper for Uint8Array/ArrayBuffer/ReadableStream\n\t\t// and { audio: \"base64...\" } JSON wrapper\n\t\tconst b64 = await binaryToBase64(result, \"audio\");\n\t\treturn {\n\t\t\tid: this.generateId(),\n\t\t\tmodel: this.model,\n\t\t\taudio: b64,\n\t\t\tformat: format ?? \"mp3\",\n\t\t\tcontentType: `audio/${format ?? \"mp3\"}`,\n\t\t};\n\t}\n\n\tprivate wrapAudioResult(bytes: Uint8Array, format: string | undefined): TTSResult {\n\t\treturn {\n\t\t\tid: this.generateId(),\n\t\t\tmodel: this.model,\n\t\t\taudio: uint8ArrayToBase64(bytes),\n\t\t\tformat: format ?? \"mp3\",\n\t\t\tcontentType: `audio/${format ?? \"mp3\"}`,\n\t\t};\n\t}\n}\n\n// ---------------------------------------------------------------------------\n// Factory function\n// ---------------------------------------------------------------------------\n\n/**\n * Creates a Workers AI text-to-speech adapter.\n *\n * Works with TanStack AI's `generateSpeech()` activity function:\n * ```ts\n * import { generateSpeech } from \"@tanstack/ai\";\n * import { createWorkersAiTts } from \"@cloudflare/tanstack-ai\";\n *\n * const adapter = createWorkersAiTts(\n * \"@cf/deepgram/aura-1\",\n * { binding: env.AI },\n * );\n *\n * const result = await generateSpeech({ adapter, text: \"Hello world\" });\n * // result.audio — base64-encoded audio\n * ```\n *\n * Note: Factory takes `(model, config)` for ergonomics — the class constructor\n * uses `(config, model)` to match TanStack AI's upstream convention.\n */\nexport function createWorkersAiTts(model: WorkersAiTTSModel, config: WorkersAiAdapterConfig) {\n\treturn new WorkersAiTTSAdapter(config, model);\n}\n"],"mappings":";;;;;;;;AAoCA,IAAa,sBAAb,cAAyCA,sBAAAA,eAAkC;CAI1E,YAAY,QAAgC,OAA0B;AACrE,QAAM,EAAE,EAAE,MAAM;+CAJR,QAAO,iBAA0B;+CAClC,iBAAA,KAAA,EAAsC;AAI7C,yBAAA,wBAAwB,OAAO;AAC/B,OAAK,gBAAgB;;CAGtB,MAAM,eAAe,SAAyC;EAC7D,MAAM,EAAE,MAAM,OAAO,QAAQ,OAAO,iBAAiB;EAGrD,MAAM,QAAiC,EAAE,GAAG,cAAc;AAC1D,MAAI,MAAO,OAAM,QAAQ;AACzB,MAAI,SAAS,KAAM,OAAM,QAAQ;AAEjC,MAAIC,uBAAAA,sBAAsB,KAAK,cAAc,CAC5C,QAAO,KAAK,mBAAmB,MAAM,QAAQ,MAAM;AAGpD,MAAIC,uBAAAA,0BAA0B,KAAK,cAAc,CAChD,QAAO,KAAK,gBAAgB,MAAM,QAAQ,MAAM;AAGjD,SAAO,KAAK,mBAAmB,MAAM,QAAQ,MAAM;;CAGpD,MAAc,mBACb,MACA,QACA,SACqB;EAErB,MAAM,SAAS,MADH,KAAK,cAA+C,QACxC,IAAI,KAAK,OAAO;GAAE;GAAM,GAAG;GAAS,CAAC;AAE7D,SAAO,KAAK,gBAAgB,QAAQ,OAAO;;CAG5C,MAAc,gBACb,MACA,QACA,SACqB;EACrB,MAAM,SAAS,KAAK;EASpB,MAAM,SAAS,OARE,MAAMC,wBAAAA,mBACtB,QACA,KAAK,OACL;GAAE;GAAM,GAAG;GAAS,EACpB;GAAE,OAAO;GAAkB,QAAS,QAAqC;GAAQ,CACjF,EAG6B,aAAa;AAC3C,SAAO,KAAK,gBAAgB,IAAI,WAAW,OAAO,EAAE,OAAO;;CAG5D,MAAc,mBACb,MACA,QACA,SACqB;EACrB,MAAM,gBAAgB,KAAK;EAM3B,MAAM,WAAW,MALIC,uBAAAA,mBAAmB,cAAc,cAAc,CAKhC,8CAA8C;GACjF,QAAQ;GACR,MAAM,KAAK,UAAU;IACpB,OAAO,KAAK;IACZ;IACA,GAAG;IACH,CAAC;GACF,CAAC;AAEF,MAAI,CAAC,SAAS,IAAI;GACjB,MAAM,YAAY,MAAM,SAAS,MAAM;AACvC,SAAM,IAAI,MACT,0CAA0C,SAAS,OAAO,KAAK,YAC/D;;EAGF,MAAM,SAAS,MAAM,SAAS,aAAa;AAC3C,SAAO,KAAK,gBAAgB,IAAI,WAAW,OAAO,EAAE,OAAO;;;;;;;;CAS5D,MAAc,gBAAgB,QAAiB,QAAgD;EAG9F,MAAM,MAAM,MAAMC,eAAAA,eAAe,QAAQ,QAAQ;AACjD,SAAO;GACN,IAAI,KAAK,YAAY;GACrB,OAAO,KAAK;GACZ,OAAO;GACP,QAAQ,UAAU;GAClB,aAAa,SAAS,UAAU;GAChC;;CAGF,gBAAwB,OAAmB,QAAuC;AACjF,SAAO;GACN,IAAI,KAAK,YAAY;GACrB,OAAO,KAAK;GACZ,OAAOC,eAAAA,mBAAmB,MAAM;GAChC,QAAQ,UAAU;GAClB,aAAa,SAAS,UAAU;GAChC;;;;;;;;;;;;;;;;;;;;;;;AA4BH,SAAgB,mBAAmB,OAA0B,QAAgC;AAC5F,QAAO,IAAI,oBAAoB,QAAQ,MAAM"}
1
+ {"version":3,"file":"workers-ai-tts.cjs","names":["BaseTTSAdapter","isDirectBindingConfig","isDirectCredentialsConfig","workersAiRestFetch","createGatewayFetch","binaryToBase64","uint8ArrayToBase64"],"sources":["../../src/adapters/workers-ai-tts.ts"],"sourcesContent":["import { BaseTTSAdapter } from \"@tanstack/ai/adapters\";\nimport type { TTSOptions, TTSResult } from \"@tanstack/ai\";\nimport {\n\ttype WorkersAiAdapterConfig,\n\ttype WorkersAiDirectBindingConfig,\n\ttype WorkersAiDirectCredentialsConfig,\n\ttype AiGatewayAdapterConfig,\n\tcreateGatewayFetch,\n\tisDirectBindingConfig,\n\tisDirectCredentialsConfig,\n\tvalidateWorkersAiConfig,\n} from \"../utils/create-fetcher\";\nimport { workersAiRestFetch } from \"../utils/workers-ai-rest\";\nimport { binaryToBase64, uint8ArrayToBase64 } from \"../utils/binary\";\n\n// ---------------------------------------------------------------------------\n// Model types\n// ---------------------------------------------------------------------------\n\n/**\n * Workers AI models that support text-to-speech generation.\n *\n * Note: the typed `AiModels` interface in `@cloudflare/workers-types` may lag\n * behind what's deployed. We use a string union here that matches the known\n * models including Deepgram partner models.\n */\nexport type WorkersAiTTSModel =\n\t| \"@cf/deepgram/aura-1\"\n\t| \"@cf/deepgram/aura-2-en\"\n\t| \"@cf/deepgram/aura-2-es\"\n\t| (string & {});\n\n// ---------------------------------------------------------------------------\n// WorkersAiTTSAdapter\n// ---------------------------------------------------------------------------\n\nexport class WorkersAiTTSAdapter extends BaseTTSAdapter<WorkersAiTTSModel> {\n\treadonly name = \"workers-ai-tts\" as const;\n\tprivate adapterConfig: WorkersAiAdapterConfig;\n\n\tconstructor(config: WorkersAiAdapterConfig, model: WorkersAiTTSModel) {\n\t\tsuper(model);\n\t\tvalidateWorkersAiConfig(config);\n\t\tthis.adapterConfig = config;\n\t}\n\n\tasync generateSpeech(options: TTSOptions): Promise<TTSResult> {\n\t\tconst { text, voice, format, speed, modelOptions } = options;\n\n\t\t// Workers AI TTS models (Deepgram aura-1) accept { text, lang? }\n\t\tconst extra: Record<string, unknown> = { ...modelOptions };\n\t\tif (voice) extra.voice = voice;\n\t\tif (speed != null) extra.speed = speed;\n\n\t\tif (isDirectBindingConfig(this.adapterConfig)) {\n\t\t\treturn this.generateViaBinding(text, format, extra);\n\t\t}\n\n\t\tif (isDirectCredentialsConfig(this.adapterConfig)) {\n\t\t\treturn this.generateViaRest(text, format, extra);\n\t\t}\n\n\t\treturn this.generateViaGateway(text, format, extra);\n\t}\n\n\tprivate async generateViaBinding(\n\t\ttext: string,\n\t\tformat: string | undefined,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TTSResult> {\n\t\tconst ai = (this.adapterConfig as WorkersAiDirectBindingConfig).binding;\n\t\tconst result = await ai.run(this.model, { text, ...options });\n\n\t\treturn this.normalizeResult(result, format);\n\t}\n\n\tprivate async generateViaRest(\n\t\ttext: string,\n\t\tformat: string | undefined,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TTSResult> {\n\t\tconst config = this.adapterConfig as WorkersAiDirectCredentialsConfig;\n\t\tconst response = await workersAiRestFetch(\n\t\t\tconfig,\n\t\t\tthis.model,\n\t\t\t{ text, ...options },\n\t\t\t{ label: \"Workers AI TTS\", signal: (options as { signal?: AbortSignal }).signal },\n\t\t);\n\n\t\t// Workers AI TTS returns audio bytes directly\n\t\tconst buffer = await response.arrayBuffer();\n\t\treturn this.wrapAudioResult(new Uint8Array(buffer), format);\n\t}\n\n\tprivate async generateViaGateway(\n\t\ttext: string,\n\t\tformat: string | undefined,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TTSResult> {\n\t\tconst gatewayConfig = this.adapterConfig as AiGatewayAdapterConfig;\n\t\tconst gatewayFetch = createGatewayFetch(\"workers-ai\", gatewayConfig);\n\n\t\t// The URL here is a placeholder — createGatewayFetch for \"workers-ai\" extracts\n\t\t// the model from the body, sets it as the endpoint, and routes through the gateway.\n\t\t// The actual URL path is not used.\n\t\tconst response = await gatewayFetch(\"https://api.cloudflare.com/v1/audio/speech\", {\n\t\t\tmethod: \"POST\",\n\t\t\tbody: JSON.stringify({\n\t\t\t\tmodel: this.model,\n\t\t\t\ttext,\n\t\t\t\t...options,\n\t\t\t}),\n\t\t});\n\n\t\tif (!response.ok) {\n\t\t\tconst errorText = await response.text();\n\t\t\tthrow new Error(\n\t\t\t\t`Workers AI TTS gateway request failed (${response.status}): ${errorText}`,\n\t\t\t);\n\t\t}\n\n\t\tconst buffer = await response.arrayBuffer();\n\t\treturn this.wrapAudioResult(new Uint8Array(buffer), format);\n\t}\n\n\t/**\n\t * Normalize binding results. Workers AI TTS can return:\n\t * - Uint8Array / ArrayBuffer (raw audio bytes)\n\t * - ReadableStream<Uint8Array> (streamed audio bytes)\n\t * - { audio: \"base64...\" } (JSON wrapper)\n\t */\n\tprivate async normalizeResult(result: unknown, format: string | undefined): Promise<TTSResult> {\n\t\t// Use the shared binaryToBase64 helper for Uint8Array/ArrayBuffer/ReadableStream\n\t\t// and { audio: \"base64...\" } JSON wrapper\n\t\tconst b64 = await binaryToBase64(result, \"audio\");\n\t\treturn {\n\t\t\tid: this.generateId(),\n\t\t\tmodel: this.model,\n\t\t\taudio: b64,\n\t\t\tformat: format ?? \"mp3\",\n\t\t\tcontentType: `audio/${format ?? \"mp3\"}`,\n\t\t};\n\t}\n\n\tprivate wrapAudioResult(bytes: Uint8Array, format: string | undefined): TTSResult {\n\t\treturn {\n\t\t\tid: this.generateId(),\n\t\t\tmodel: this.model,\n\t\t\taudio: uint8ArrayToBase64(bytes),\n\t\t\tformat: format ?? \"mp3\",\n\t\t\tcontentType: `audio/${format ?? \"mp3\"}`,\n\t\t};\n\t}\n}\n\n// ---------------------------------------------------------------------------\n// Factory function\n// ---------------------------------------------------------------------------\n\n/**\n * Creates a Workers AI text-to-speech adapter.\n *\n * Works with TanStack AI's `generateSpeech()` activity function:\n * ```ts\n * import { generateSpeech } from \"@tanstack/ai\";\n * import { createWorkersAiTts } from \"@cloudflare/tanstack-ai\";\n *\n * const adapter = createWorkersAiTts(\n * \"@cf/deepgram/aura-1\",\n * { binding: env.AI },\n * );\n *\n * const result = await generateSpeech({ adapter, text: \"Hello world\" });\n * // result.audio — base64-encoded audio\n * ```\n *\n * Note: Factory takes `(model, config)` for ergonomics — the class constructor\n * uses `(config, model)` to match TanStack AI's upstream convention.\n */\nexport function createWorkersAiTts(model: WorkersAiTTSModel, config: WorkersAiAdapterConfig) {\n\treturn new WorkersAiTTSAdapter(config, model);\n}\n"],"mappings":";;;;;;;AAoCA,IAAa,sBAAb,cAAyCA,sBAAAA,eAAkC;CAI1E,YAAY,QAAgC,OAA0B;EACrE,MAAM,KAAK;+CAJH,QAAO,gBAAA;+CACR,iBAAA,KAAA,CAAA;EAIP,uBAAA,wBAAwB,MAAM;EAC9B,KAAK,gBAAgB;CACtB;CAEA,MAAM,eAAe,SAAyC;EAC7D,MAAM,EAAE,MAAM,OAAO,QAAQ,OAAO,iBAAiB;EAGrD,MAAM,QAAiC,EAAE,GAAG,aAAa;EACzD,IAAI,OAAO,MAAM,QAAQ;EACzB,IAAI,SAAS,MAAM,MAAM,QAAQ;EAEjC,IAAIC,uBAAAA,sBAAsB,KAAK,aAAa,GAC3C,OAAO,KAAK,mBAAmB,MAAM,QAAQ,KAAK;EAGnD,IAAIC,uBAAAA,0BAA0B,KAAK,aAAa,GAC/C,OAAO,KAAK,gBAAgB,MAAM,QAAQ,KAAK;EAGhD,OAAO,KAAK,mBAAmB,MAAM,QAAQ,KAAK;CACnD;CAEA,MAAc,mBACb,MACA,QACA,SACqB;EAErB,MAAM,SAAS,MADH,KAAK,cAA+C,QACxC,IAAI,KAAK,OAAO;GAAE;GAAM,GAAG;EAAQ,CAAC;EAE5D,OAAO,KAAK,gBAAgB,QAAQ,MAAM;CAC3C;CAEA,MAAc,gBACb,MACA,QACA,SACqB;EACrB,MAAM,SAAS,KAAK;EASpB,MAAM,SAAS,OAAM,MAREC,wBAAAA,mBACtB,QACA,KAAK,OACL;GAAE;GAAM,GAAG;EAAQ,GACnB;GAAE,OAAO;GAAkB,QAAS,QAAqC;EAAO,CACjF,EAAA,CAG8B,YAAY;EAC1C,OAAO,KAAK,gBAAgB,IAAI,WAAW,MAAM,GAAG,MAAM;CAC3D;CAEA,MAAc,mBACb,MACA,QACA,SACqB;EACrB,MAAM,gBAAgB,KAAK;EAM3B,MAAM,WAAW,MALIC,uBAAAA,mBAAmB,cAAc,aAKpB,CAAC,CAAC,8CAA8C;GACjF,QAAQ;GACR,MAAM,KAAK,UAAU;IACpB,OAAO,KAAK;IACZ;IACA,GAAG;GACJ,CAAC;EACF,CAAC;EAED,IAAI,CAAC,SAAS,IAAI;GACjB,MAAM,YAAY,MAAM,SAAS,KAAK;GACtC,MAAM,IAAI,MACT,0CAA0C,SAAS,OAAO,KAAK,WAChE;EACD;EAEA,MAAM,SAAS,MAAM,SAAS,YAAY;EAC1C,OAAO,KAAK,gBAAgB,IAAI,WAAW,MAAM,GAAG,MAAM;CAC3D;;;;;;;CAQA,MAAc,gBAAgB,QAAiB,QAAgD;EAG9F,MAAM,MAAM,MAAMC,eAAAA,eAAe,QAAQ,OAAO;EAChD,OAAO;GACN,IAAI,KAAK,WAAW;GACpB,OAAO,KAAK;GACZ,OAAO;GACP,QAAQ,UAAU;GAClB,aAAa,SAAS,UAAU;EACjC;CACD;CAEA,gBAAwB,OAAmB,QAAuC;EACjF,OAAO;GACN,IAAI,KAAK,WAAW;GACpB,OAAO,KAAK;GACZ,OAAOC,eAAAA,mBAAmB,KAAK;GAC/B,QAAQ,UAAU;GAClB,aAAa,SAAS,UAAU;EACjC;CACD;AACD;;;;;;;;;;;;;;;;;;;;;AA0BA,SAAgB,mBAAmB,OAA0B,QAAgC;CAC5F,OAAO,IAAI,oBAAoB,QAAQ,KAAK;AAC7C"}
@@ -1,4 +1,4 @@
1
- import { i as WorkersAiAdapterConfig } from "../create-fetcher-vAQ8WW-p.cjs";
1
+ import { i as WorkersAiAdapterConfig } from "../create-fetcher-Bp5yCNaO.cjs";
2
2
  import { TTSOptions, TTSResult } from "@tanstack/ai";
3
3
  import { BaseTTSAdapter } from "@tanstack/ai/adapters";
4
4
 
@@ -1,6 +1,6 @@
1
- import { i as WorkersAiAdapterConfig } from "../create-fetcher-6p6heb85.mjs";
2
- import { BaseTTSAdapter } from "@tanstack/ai/adapters";
1
+ import { i as WorkersAiAdapterConfig } from "../create-fetcher-Bp5yCNaO.mjs";
3
2
  import { TTSOptions, TTSResult } from "@tanstack/ai";
3
+ import { BaseTTSAdapter } from "@tanstack/ai/adapters";
4
4
 
5
5
  //#region src/adapters/workers-ai-tts.d.ts
6
6
  /**
@@ -1,12 +1,12 @@
1
- import { a as validateWorkersAiConfig, i as isDirectCredentialsConfig, r as isDirectBindingConfig, t as createGatewayFetch } from "../create-fetcher-CeUOJgrh.mjs";
2
- import { t as _defineProperty } from "../defineProperty-CbyrzcbA.mjs";
3
- import { t as workersAiRestFetch } from "../workers-ai-rest-GKy2r7eG.mjs";
4
- import { n as uint8ArrayToBase64, t as binaryToBase64 } from "../binary-p4H_N_3M.mjs";
1
+ import { a as validateWorkersAiConfig, i as isDirectCredentialsConfig, r as isDirectBindingConfig, t as createGatewayFetch } from "../create-fetcher-BnSnCaHf.mjs";
2
+ import { t as _defineProperty } from "../defineProperty-BC3bEcwq.mjs";
3
+ import { t as workersAiRestFetch } from "../workers-ai-rest-B6_yU35Q.mjs";
4
+ import { n as uint8ArrayToBase64, t as binaryToBase64 } from "../binary-B5YCVsro.mjs";
5
5
  import { BaseTTSAdapter } from "@tanstack/ai/adapters";
6
6
  //#region src/adapters/workers-ai-tts.ts
7
7
  var WorkersAiTTSAdapter = class extends BaseTTSAdapter {
8
8
  constructor(config, model) {
9
- super({}, model);
9
+ super(model);
10
10
  _defineProperty(this, "name", "workers-ai-tts");
11
11
  _defineProperty(this, "adapterConfig", void 0);
12
12
  validateWorkersAiConfig(config);
@@ -1 +1 @@
1
- {"version":3,"file":"workers-ai-tts.mjs","names":[],"sources":["../../src/adapters/workers-ai-tts.ts"],"sourcesContent":["import { BaseTTSAdapter } from \"@tanstack/ai/adapters\";\nimport type { TTSOptions, TTSResult } from \"@tanstack/ai\";\nimport {\n\ttype WorkersAiAdapterConfig,\n\ttype WorkersAiDirectBindingConfig,\n\ttype WorkersAiDirectCredentialsConfig,\n\ttype AiGatewayAdapterConfig,\n\tcreateGatewayFetch,\n\tisDirectBindingConfig,\n\tisDirectCredentialsConfig,\n\tvalidateWorkersAiConfig,\n} from \"../utils/create-fetcher\";\nimport { workersAiRestFetch } from \"../utils/workers-ai-rest\";\nimport { binaryToBase64, uint8ArrayToBase64 } from \"../utils/binary\";\n\n// ---------------------------------------------------------------------------\n// Model types\n// ---------------------------------------------------------------------------\n\n/**\n * Workers AI models that support text-to-speech generation.\n *\n * Note: the typed `AiModels` interface in `@cloudflare/workers-types` may lag\n * behind what's deployed. We use a string union here that matches the known\n * models including Deepgram partner models.\n */\nexport type WorkersAiTTSModel =\n\t| \"@cf/deepgram/aura-1\"\n\t| \"@cf/deepgram/aura-2-en\"\n\t| \"@cf/deepgram/aura-2-es\"\n\t| (string & {});\n\n// ---------------------------------------------------------------------------\n// WorkersAiTTSAdapter\n// ---------------------------------------------------------------------------\n\nexport class WorkersAiTTSAdapter extends BaseTTSAdapter<WorkersAiTTSModel> {\n\treadonly name = \"workers-ai-tts\" as const;\n\tprivate adapterConfig: WorkersAiAdapterConfig;\n\n\tconstructor(config: WorkersAiAdapterConfig, model: WorkersAiTTSModel) {\n\t\tsuper({}, model);\n\t\tvalidateWorkersAiConfig(config);\n\t\tthis.adapterConfig = config;\n\t}\n\n\tasync generateSpeech(options: TTSOptions): Promise<TTSResult> {\n\t\tconst { text, voice, format, speed, modelOptions } = options;\n\n\t\t// Workers AI TTS models (Deepgram aura-1) accept { text, lang? }\n\t\tconst extra: Record<string, unknown> = { ...modelOptions };\n\t\tif (voice) extra.voice = voice;\n\t\tif (speed != null) extra.speed = speed;\n\n\t\tif (isDirectBindingConfig(this.adapterConfig)) {\n\t\t\treturn this.generateViaBinding(text, format, extra);\n\t\t}\n\n\t\tif (isDirectCredentialsConfig(this.adapterConfig)) {\n\t\t\treturn this.generateViaRest(text, format, extra);\n\t\t}\n\n\t\treturn this.generateViaGateway(text, format, extra);\n\t}\n\n\tprivate async generateViaBinding(\n\t\ttext: string,\n\t\tformat: string | undefined,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TTSResult> {\n\t\tconst ai = (this.adapterConfig as WorkersAiDirectBindingConfig).binding;\n\t\tconst result = await ai.run(this.model, { text, ...options });\n\n\t\treturn this.normalizeResult(result, format);\n\t}\n\n\tprivate async generateViaRest(\n\t\ttext: string,\n\t\tformat: string | undefined,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TTSResult> {\n\t\tconst config = this.adapterConfig as WorkersAiDirectCredentialsConfig;\n\t\tconst response = await workersAiRestFetch(\n\t\t\tconfig,\n\t\t\tthis.model,\n\t\t\t{ text, ...options },\n\t\t\t{ label: \"Workers AI TTS\", signal: (options as { signal?: AbortSignal }).signal },\n\t\t);\n\n\t\t// Workers AI TTS returns audio bytes directly\n\t\tconst buffer = await response.arrayBuffer();\n\t\treturn this.wrapAudioResult(new Uint8Array(buffer), format);\n\t}\n\n\tprivate async generateViaGateway(\n\t\ttext: string,\n\t\tformat: string | undefined,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TTSResult> {\n\t\tconst gatewayConfig = this.adapterConfig as AiGatewayAdapterConfig;\n\t\tconst gatewayFetch = createGatewayFetch(\"workers-ai\", gatewayConfig);\n\n\t\t// The URL here is a placeholder — createGatewayFetch for \"workers-ai\" extracts\n\t\t// the model from the body, sets it as the endpoint, and routes through the gateway.\n\t\t// The actual URL path is not used.\n\t\tconst response = await gatewayFetch(\"https://api.cloudflare.com/v1/audio/speech\", {\n\t\t\tmethod: \"POST\",\n\t\t\tbody: JSON.stringify({\n\t\t\t\tmodel: this.model,\n\t\t\t\ttext,\n\t\t\t\t...options,\n\t\t\t}),\n\t\t});\n\n\t\tif (!response.ok) {\n\t\t\tconst errorText = await response.text();\n\t\t\tthrow new Error(\n\t\t\t\t`Workers AI TTS gateway request failed (${response.status}): ${errorText}`,\n\t\t\t);\n\t\t}\n\n\t\tconst buffer = await response.arrayBuffer();\n\t\treturn this.wrapAudioResult(new Uint8Array(buffer), format);\n\t}\n\n\t/**\n\t * Normalize binding results. Workers AI TTS can return:\n\t * - Uint8Array / ArrayBuffer (raw audio bytes)\n\t * - ReadableStream<Uint8Array> (streamed audio bytes)\n\t * - { audio: \"base64...\" } (JSON wrapper)\n\t */\n\tprivate async normalizeResult(result: unknown, format: string | undefined): Promise<TTSResult> {\n\t\t// Use the shared binaryToBase64 helper for Uint8Array/ArrayBuffer/ReadableStream\n\t\t// and { audio: \"base64...\" } JSON wrapper\n\t\tconst b64 = await binaryToBase64(result, \"audio\");\n\t\treturn {\n\t\t\tid: this.generateId(),\n\t\t\tmodel: this.model,\n\t\t\taudio: b64,\n\t\t\tformat: format ?? \"mp3\",\n\t\t\tcontentType: `audio/${format ?? \"mp3\"}`,\n\t\t};\n\t}\n\n\tprivate wrapAudioResult(bytes: Uint8Array, format: string | undefined): TTSResult {\n\t\treturn {\n\t\t\tid: this.generateId(),\n\t\t\tmodel: this.model,\n\t\t\taudio: uint8ArrayToBase64(bytes),\n\t\t\tformat: format ?? \"mp3\",\n\t\t\tcontentType: `audio/${format ?? \"mp3\"}`,\n\t\t};\n\t}\n}\n\n// ---------------------------------------------------------------------------\n// Factory function\n// ---------------------------------------------------------------------------\n\n/**\n * Creates a Workers AI text-to-speech adapter.\n *\n * Works with TanStack AI's `generateSpeech()` activity function:\n * ```ts\n * import { generateSpeech } from \"@tanstack/ai\";\n * import { createWorkersAiTts } from \"@cloudflare/tanstack-ai\";\n *\n * const adapter = createWorkersAiTts(\n * \"@cf/deepgram/aura-1\",\n * { binding: env.AI },\n * );\n *\n * const result = await generateSpeech({ adapter, text: \"Hello world\" });\n * // result.audio — base64-encoded audio\n * ```\n *\n * Note: Factory takes `(model, config)` for ergonomics — the class constructor\n * uses `(config, model)` to match TanStack AI's upstream convention.\n */\nexport function createWorkersAiTts(model: WorkersAiTTSModel, config: WorkersAiAdapterConfig) {\n\treturn new WorkersAiTTSAdapter(config, model);\n}\n"],"mappings":";;;;;;AAoCA,IAAa,sBAAb,cAAyC,eAAkC;CAI1E,YAAY,QAAgC,OAA0B;AACrE,QAAM,EAAE,EAAE,MAAM;wBAJR,QAAO,iBAA0B;wBAClC,iBAAA,KAAA,EAAsC;AAI7C,0BAAwB,OAAO;AAC/B,OAAK,gBAAgB;;CAGtB,MAAM,eAAe,SAAyC;EAC7D,MAAM,EAAE,MAAM,OAAO,QAAQ,OAAO,iBAAiB;EAGrD,MAAM,QAAiC,EAAE,GAAG,cAAc;AAC1D,MAAI,MAAO,OAAM,QAAQ;AACzB,MAAI,SAAS,KAAM,OAAM,QAAQ;AAEjC,MAAI,sBAAsB,KAAK,cAAc,CAC5C,QAAO,KAAK,mBAAmB,MAAM,QAAQ,MAAM;AAGpD,MAAI,0BAA0B,KAAK,cAAc,CAChD,QAAO,KAAK,gBAAgB,MAAM,QAAQ,MAAM;AAGjD,SAAO,KAAK,mBAAmB,MAAM,QAAQ,MAAM;;CAGpD,MAAc,mBACb,MACA,QACA,SACqB;EAErB,MAAM,SAAS,MADH,KAAK,cAA+C,QACxC,IAAI,KAAK,OAAO;GAAE;GAAM,GAAG;GAAS,CAAC;AAE7D,SAAO,KAAK,gBAAgB,QAAQ,OAAO;;CAG5C,MAAc,gBACb,MACA,QACA,SACqB;EACrB,MAAM,SAAS,KAAK;EASpB,MAAM,SAAS,OARE,MAAM,mBACtB,QACA,KAAK,OACL;GAAE;GAAM,GAAG;GAAS,EACpB;GAAE,OAAO;GAAkB,QAAS,QAAqC;GAAQ,CACjF,EAG6B,aAAa;AAC3C,SAAO,KAAK,gBAAgB,IAAI,WAAW,OAAO,EAAE,OAAO;;CAG5D,MAAc,mBACb,MACA,QACA,SACqB;EACrB,MAAM,gBAAgB,KAAK;EAM3B,MAAM,WAAW,MALI,mBAAmB,cAAc,cAAc,CAKhC,8CAA8C;GACjF,QAAQ;GACR,MAAM,KAAK,UAAU;IACpB,OAAO,KAAK;IACZ;IACA,GAAG;IACH,CAAC;GACF,CAAC;AAEF,MAAI,CAAC,SAAS,IAAI;GACjB,MAAM,YAAY,MAAM,SAAS,MAAM;AACvC,SAAM,IAAI,MACT,0CAA0C,SAAS,OAAO,KAAK,YAC/D;;EAGF,MAAM,SAAS,MAAM,SAAS,aAAa;AAC3C,SAAO,KAAK,gBAAgB,IAAI,WAAW,OAAO,EAAE,OAAO;;;;;;;;CAS5D,MAAc,gBAAgB,QAAiB,QAAgD;EAG9F,MAAM,MAAM,MAAM,eAAe,QAAQ,QAAQ;AACjD,SAAO;GACN,IAAI,KAAK,YAAY;GACrB,OAAO,KAAK;GACZ,OAAO;GACP,QAAQ,UAAU;GAClB,aAAa,SAAS,UAAU;GAChC;;CAGF,gBAAwB,OAAmB,QAAuC;AACjF,SAAO;GACN,IAAI,KAAK,YAAY;GACrB,OAAO,KAAK;GACZ,OAAO,mBAAmB,MAAM;GAChC,QAAQ,UAAU;GAClB,aAAa,SAAS,UAAU;GAChC;;;;;;;;;;;;;;;;;;;;;;;AA4BH,SAAgB,mBAAmB,OAA0B,QAAgC;AAC5F,QAAO,IAAI,oBAAoB,QAAQ,MAAM"}
1
+ {"version":3,"file":"workers-ai-tts.mjs","names":[],"sources":["../../src/adapters/workers-ai-tts.ts"],"sourcesContent":["import { BaseTTSAdapter } from \"@tanstack/ai/adapters\";\nimport type { TTSOptions, TTSResult } from \"@tanstack/ai\";\nimport {\n\ttype WorkersAiAdapterConfig,\n\ttype WorkersAiDirectBindingConfig,\n\ttype WorkersAiDirectCredentialsConfig,\n\ttype AiGatewayAdapterConfig,\n\tcreateGatewayFetch,\n\tisDirectBindingConfig,\n\tisDirectCredentialsConfig,\n\tvalidateWorkersAiConfig,\n} from \"../utils/create-fetcher\";\nimport { workersAiRestFetch } from \"../utils/workers-ai-rest\";\nimport { binaryToBase64, uint8ArrayToBase64 } from \"../utils/binary\";\n\n// ---------------------------------------------------------------------------\n// Model types\n// ---------------------------------------------------------------------------\n\n/**\n * Workers AI models that support text-to-speech generation.\n *\n * Note: the typed `AiModels` interface in `@cloudflare/workers-types` may lag\n * behind what's deployed. We use a string union here that matches the known\n * models including Deepgram partner models.\n */\nexport type WorkersAiTTSModel =\n\t| \"@cf/deepgram/aura-1\"\n\t| \"@cf/deepgram/aura-2-en\"\n\t| \"@cf/deepgram/aura-2-es\"\n\t| (string & {});\n\n// ---------------------------------------------------------------------------\n// WorkersAiTTSAdapter\n// ---------------------------------------------------------------------------\n\nexport class WorkersAiTTSAdapter extends BaseTTSAdapter<WorkersAiTTSModel> {\n\treadonly name = \"workers-ai-tts\" as const;\n\tprivate adapterConfig: WorkersAiAdapterConfig;\n\n\tconstructor(config: WorkersAiAdapterConfig, model: WorkersAiTTSModel) {\n\t\tsuper(model);\n\t\tvalidateWorkersAiConfig(config);\n\t\tthis.adapterConfig = config;\n\t}\n\n\tasync generateSpeech(options: TTSOptions): Promise<TTSResult> {\n\t\tconst { text, voice, format, speed, modelOptions } = options;\n\n\t\t// Workers AI TTS models (Deepgram aura-1) accept { text, lang? }\n\t\tconst extra: Record<string, unknown> = { ...modelOptions };\n\t\tif (voice) extra.voice = voice;\n\t\tif (speed != null) extra.speed = speed;\n\n\t\tif (isDirectBindingConfig(this.adapterConfig)) {\n\t\t\treturn this.generateViaBinding(text, format, extra);\n\t\t}\n\n\t\tif (isDirectCredentialsConfig(this.adapterConfig)) {\n\t\t\treturn this.generateViaRest(text, format, extra);\n\t\t}\n\n\t\treturn this.generateViaGateway(text, format, extra);\n\t}\n\n\tprivate async generateViaBinding(\n\t\ttext: string,\n\t\tformat: string | undefined,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TTSResult> {\n\t\tconst ai = (this.adapterConfig as WorkersAiDirectBindingConfig).binding;\n\t\tconst result = await ai.run(this.model, { text, ...options });\n\n\t\treturn this.normalizeResult(result, format);\n\t}\n\n\tprivate async generateViaRest(\n\t\ttext: string,\n\t\tformat: string | undefined,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TTSResult> {\n\t\tconst config = this.adapterConfig as WorkersAiDirectCredentialsConfig;\n\t\tconst response = await workersAiRestFetch(\n\t\t\tconfig,\n\t\t\tthis.model,\n\t\t\t{ text, ...options },\n\t\t\t{ label: \"Workers AI TTS\", signal: (options as { signal?: AbortSignal }).signal },\n\t\t);\n\n\t\t// Workers AI TTS returns audio bytes directly\n\t\tconst buffer = await response.arrayBuffer();\n\t\treturn this.wrapAudioResult(new Uint8Array(buffer), format);\n\t}\n\n\tprivate async generateViaGateway(\n\t\ttext: string,\n\t\tformat: string | undefined,\n\t\toptions: Record<string, unknown>,\n\t): Promise<TTSResult> {\n\t\tconst gatewayConfig = this.adapterConfig as AiGatewayAdapterConfig;\n\t\tconst gatewayFetch = createGatewayFetch(\"workers-ai\", gatewayConfig);\n\n\t\t// The URL here is a placeholder — createGatewayFetch for \"workers-ai\" extracts\n\t\t// the model from the body, sets it as the endpoint, and routes through the gateway.\n\t\t// The actual URL path is not used.\n\t\tconst response = await gatewayFetch(\"https://api.cloudflare.com/v1/audio/speech\", {\n\t\t\tmethod: \"POST\",\n\t\t\tbody: JSON.stringify({\n\t\t\t\tmodel: this.model,\n\t\t\t\ttext,\n\t\t\t\t...options,\n\t\t\t}),\n\t\t});\n\n\t\tif (!response.ok) {\n\t\t\tconst errorText = await response.text();\n\t\t\tthrow new Error(\n\t\t\t\t`Workers AI TTS gateway request failed (${response.status}): ${errorText}`,\n\t\t\t);\n\t\t}\n\n\t\tconst buffer = await response.arrayBuffer();\n\t\treturn this.wrapAudioResult(new Uint8Array(buffer), format);\n\t}\n\n\t/**\n\t * Normalize binding results. Workers AI TTS can return:\n\t * - Uint8Array / ArrayBuffer (raw audio bytes)\n\t * - ReadableStream<Uint8Array> (streamed audio bytes)\n\t * - { audio: \"base64...\" } (JSON wrapper)\n\t */\n\tprivate async normalizeResult(result: unknown, format: string | undefined): Promise<TTSResult> {\n\t\t// Use the shared binaryToBase64 helper for Uint8Array/ArrayBuffer/ReadableStream\n\t\t// and { audio: \"base64...\" } JSON wrapper\n\t\tconst b64 = await binaryToBase64(result, \"audio\");\n\t\treturn {\n\t\t\tid: this.generateId(),\n\t\t\tmodel: this.model,\n\t\t\taudio: b64,\n\t\t\tformat: format ?? \"mp3\",\n\t\t\tcontentType: `audio/${format ?? \"mp3\"}`,\n\t\t};\n\t}\n\n\tprivate wrapAudioResult(bytes: Uint8Array, format: string | undefined): TTSResult {\n\t\treturn {\n\t\t\tid: this.generateId(),\n\t\t\tmodel: this.model,\n\t\t\taudio: uint8ArrayToBase64(bytes),\n\t\t\tformat: format ?? \"mp3\",\n\t\t\tcontentType: `audio/${format ?? \"mp3\"}`,\n\t\t};\n\t}\n}\n\n// ---------------------------------------------------------------------------\n// Factory function\n// ---------------------------------------------------------------------------\n\n/**\n * Creates a Workers AI text-to-speech adapter.\n *\n * Works with TanStack AI's `generateSpeech()` activity function:\n * ```ts\n * import { generateSpeech } from \"@tanstack/ai\";\n * import { createWorkersAiTts } from \"@cloudflare/tanstack-ai\";\n *\n * const adapter = createWorkersAiTts(\n * \"@cf/deepgram/aura-1\",\n * { binding: env.AI },\n * );\n *\n * const result = await generateSpeech({ adapter, text: \"Hello world\" });\n * // result.audio — base64-encoded audio\n * ```\n *\n * Note: Factory takes `(model, config)` for ergonomics — the class constructor\n * uses `(config, model)` to match TanStack AI's upstream convention.\n */\nexport function createWorkersAiTts(model: WorkersAiTTSModel, config: WorkersAiAdapterConfig) {\n\treturn new WorkersAiTTSAdapter(config, model);\n}\n"],"mappings":";;;;;;AAoCA,IAAa,sBAAb,cAAyC,eAAkC;CAI1E,YAAY,QAAgC,OAA0B;EACrE,MAAM,KAAK;wBAJH,QAAO,gBAAA;wBACR,iBAAA,KAAA,CAAA;EAIP,wBAAwB,MAAM;EAC9B,KAAK,gBAAgB;CACtB;CAEA,MAAM,eAAe,SAAyC;EAC7D,MAAM,EAAE,MAAM,OAAO,QAAQ,OAAO,iBAAiB;EAGrD,MAAM,QAAiC,EAAE,GAAG,aAAa;EACzD,IAAI,OAAO,MAAM,QAAQ;EACzB,IAAI,SAAS,MAAM,MAAM,QAAQ;EAEjC,IAAI,sBAAsB,KAAK,aAAa,GAC3C,OAAO,KAAK,mBAAmB,MAAM,QAAQ,KAAK;EAGnD,IAAI,0BAA0B,KAAK,aAAa,GAC/C,OAAO,KAAK,gBAAgB,MAAM,QAAQ,KAAK;EAGhD,OAAO,KAAK,mBAAmB,MAAM,QAAQ,KAAK;CACnD;CAEA,MAAc,mBACb,MACA,QACA,SACqB;EAErB,MAAM,SAAS,MADH,KAAK,cAA+C,QACxC,IAAI,KAAK,OAAO;GAAE;GAAM,GAAG;EAAQ,CAAC;EAE5D,OAAO,KAAK,gBAAgB,QAAQ,MAAM;CAC3C;CAEA,MAAc,gBACb,MACA,QACA,SACqB;EACrB,MAAM,SAAS,KAAK;EASpB,MAAM,SAAS,OAAM,MARE,mBACtB,QACA,KAAK,OACL;GAAE;GAAM,GAAG;EAAQ,GACnB;GAAE,OAAO;GAAkB,QAAS,QAAqC;EAAO,CACjF,EAAA,CAG8B,YAAY;EAC1C,OAAO,KAAK,gBAAgB,IAAI,WAAW,MAAM,GAAG,MAAM;CAC3D;CAEA,MAAc,mBACb,MACA,QACA,SACqB;EACrB,MAAM,gBAAgB,KAAK;EAM3B,MAAM,WAAW,MALI,mBAAmB,cAAc,aAKpB,CAAC,CAAC,8CAA8C;GACjF,QAAQ;GACR,MAAM,KAAK,UAAU;IACpB,OAAO,KAAK;IACZ;IACA,GAAG;GACJ,CAAC;EACF,CAAC;EAED,IAAI,CAAC,SAAS,IAAI;GACjB,MAAM,YAAY,MAAM,SAAS,KAAK;GACtC,MAAM,IAAI,MACT,0CAA0C,SAAS,OAAO,KAAK,WAChE;EACD;EAEA,MAAM,SAAS,MAAM,SAAS,YAAY;EAC1C,OAAO,KAAK,gBAAgB,IAAI,WAAW,MAAM,GAAG,MAAM;CAC3D;;;;;;;CAQA,MAAc,gBAAgB,QAAiB,QAAgD;EAG9F,MAAM,MAAM,MAAM,eAAe,QAAQ,OAAO;EAChD,OAAO;GACN,IAAI,KAAK,WAAW;GACpB,OAAO,KAAK;GACZ,OAAO;GACP,QAAQ,UAAU;GAClB,aAAa,SAAS,UAAU;EACjC;CACD;CAEA,gBAAwB,OAAmB,QAAuC;EACjF,OAAO;GACN,IAAI,KAAK,WAAW;GACpB,OAAO,KAAK;GACZ,OAAO,mBAAmB,KAAK;GAC/B,QAAQ,UAAU;GAClB,aAAa,SAAS,UAAU;EACjC;CACD;AACD;;;;;;;;;;;;;;;;;;;;;AA0BA,SAAgB,mBAAmB,OAA0B,QAAgC;CAC5F,OAAO,IAAI,oBAAoB,QAAQ,KAAK;AAC7C"}