@elizaos/plugin-edge-tts 2.0.0-alpha.5 → 2.0.0-alpha.8
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
|
@@ -2,9 +2,9 @@
|
|
|
2
2
|
"version": 3,
|
|
3
3
|
"sources": ["../../src/index.browser.ts"],
|
|
4
4
|
"sourcesContent": [
|
|
5
|
-
"/**\n * Browser entry point for @elizaos/plugin-edge-tts\n *\n * Edge TTS is not available in browser environments because it requires\n * Node.js file system access and WebSocket connections that browsers don't support.\n *\n * For browser TTS, use @elizaos/plugin-elevenlabs or @elizaos/plugin-openai instead.\n */\nimport { type Plugin
|
|
5
|
+
"/**\n * Browser entry point for @elizaos/plugin-edge-tts\n *\n * Edge TTS is not available in browser environments because it requires\n * Node.js file system access and WebSocket connections that browsers don't support.\n *\n * For browser TTS, use @elizaos/plugin-elevenlabs or @elizaos/plugin-openai instead.\n */\nimport { logger, type Plugin } from \"@elizaos/core\";\n\nexport const edgeTTSPlugin: Plugin = {\n name: \"edge-tts\",\n description: \"Edge TTS plugin (browser stub - not available in browser environments)\",\n models: {},\n tests: [],\n};\n\n// Log warning when imported in browser\nif (typeof window !== \"undefined\") {\n logger.warn(\n \"[EdgeTTS] Edge TTS is not available in browser environments. \" +\n \"Use @elizaos/plugin-elevenlabs or @elizaos/plugin-openai for browser TTS.\"\n );\n}\n\nexport default edgeTTSPlugin;\n"
|
|
6
6
|
],
|
|
7
|
-
"mappings": "AAQA,
|
|
7
|
+
"mappings": "AAQA,iBAAS,sBAEF,IAAM,EAAwB,CACnC,KAAM,WACN,YAAa,yEACb,OAAQ,CAAC,EACT,MAAO,CAAC,CACV,EAGA,GAAI,OAAO,OAAW,IACpB,EAAO,KACL,wIAEF,EAGF,IAAe",
|
|
8
8
|
"debugId": "A1DF4939E5621A8064756E2164756E21",
|
|
9
9
|
"names": []
|
|
10
10
|
}
|
package/dist/cjs/index.node.cjs
CHANGED
|
@@ -49,11 +49,11 @@ __export(exports_index_node, {
|
|
|
49
49
|
module.exports = __toCommonJS(exports_index_node);
|
|
50
50
|
|
|
51
51
|
// src/index.ts
|
|
52
|
-
var import_core = require("@elizaos/core");
|
|
53
|
-
var import_node_edge_tts = require("node-edge-tts");
|
|
54
52
|
var import_node_fs = require("node:fs");
|
|
55
53
|
var import_node_os = require("node:os");
|
|
56
54
|
var import_node_path = __toESM(require("node:path"));
|
|
55
|
+
var import_core = require("@elizaos/core");
|
|
56
|
+
var import_node_edge_tts = require("node-edge-tts");
|
|
57
57
|
var DEFAULT_VOICE = "en-US-MichelleNeural";
|
|
58
58
|
var DEFAULT_LANG = "en-US";
|
|
59
59
|
var DEFAULT_OUTPUT_FORMAT = "audio-24khz-48kbitrate-mono-mp3";
|
|
@@ -257,4 +257,4 @@ var _test = {
|
|
|
257
257
|
getEdgeTTSSettings
|
|
258
258
|
};
|
|
259
259
|
|
|
260
|
-
//# debugId=
|
|
260
|
+
//# debugId=44DEBD6EBE84FDA064756E2164756E21
|
|
@@ -2,9 +2,9 @@
|
|
|
2
2
|
"version": 3,
|
|
3
3
|
"sources": ["../../src/index.ts"],
|
|
4
4
|
"sourcesContent": [
|
|
5
|
-
"import {\n type IAgentRuntime,\n ModelType,\n type Plugin,\n logger,\n} from \"@elizaos/core\";\nimport { EdgeTTS } from \"node-edge-tts\";\nimport { mkdtempSync, rmSync, readFileSync } from \"node:fs\";\nimport { tmpdir } from \"node:os\";\nimport path from \"node:path\";\n\n/**\n * Edge TTS voice settings configuration\n */\ninterface EdgeTTSSettings {\n voice: string;\n lang: string;\n outputFormat: string;\n rate?: string;\n pitch?: string;\n volume?: string;\n proxy?: string;\n timeoutMs: number;\n}\n\n/**\n * Extended TTS params with Edge-specific options\n */\ninterface EdgeTTSParams {\n text: string;\n voice?: string;\n speed?: number;\n /** Edge TTS specific: language code */\n lang?: string;\n /** Edge TTS specific: output format */\n outputFormat?: string;\n /** Edge TTS specific: rate adjustment (e.g., +10%, -5%) */\n rate?: string;\n /** Edge TTS specific: pitch adjustment (e.g., +5Hz, -10Hz) */\n pitch?: string;\n /** Edge TTS specific: volume adjustment (e.g., +20%, -10%) */\n volume?: string;\n}\n\n// Default voice configurations\nconst DEFAULT_VOICE = \"en-US-MichelleNeural\";\nconst DEFAULT_LANG = \"en-US\";\nconst DEFAULT_OUTPUT_FORMAT = \"audio-24khz-48kbitrate-mono-mp3\";\nconst DEFAULT_TIMEOUT_MS = 30000;\n\n// Voice presets mapping common voice names to Edge TTS voices\nconst VOICE_PRESETS: Record<string, string> = {\n // Generic voices (map to good defaults)\n alloy: \"en-US-GuyNeural\",\n echo: \"en-US-ChristopherNeural\",\n fable: \"en-GB-RyanNeural\",\n onyx: \"en-US-DavisNeural\",\n nova: \"en-US-JennyNeural\",\n shimmer: \"en-US-AriaNeural\",\n // Direct Edge TTS voice names pass through\n};\n\nfunction getSetting(\n runtime: IAgentRuntime,\n key: string,\n fallback?: string,\n): string | undefined {\n const envValue =\n typeof process !== \"undefined\" &&\n (process as { env?: Record<string, string> }).env\n ? (process as { env: Record<string, string> }).env[key]\n : undefined;\n return (\n (runtime.getSetting(key) as string | undefined) ?? envValue ?? fallback\n );\n}\n\nfunction getEdgeTTSSettings(runtime: IAgentRuntime): EdgeTTSSettings {\n const timeoutStr = getSetting(runtime, \"EDGE_TTS_TIMEOUT_MS\");\n return {\n voice:\n getSetting(runtime, \"EDGE_TTS_VOICE\", DEFAULT_VOICE) ?? DEFAULT_VOICE,\n lang: getSetting(runtime, \"EDGE_TTS_LANG\", DEFAULT_LANG) ?? DEFAULT_LANG,\n outputFormat:\n getSetting(runtime, \"EDGE_TTS_OUTPUT_FORMAT\", DEFAULT_OUTPUT_FORMAT) ??\n DEFAULT_OUTPUT_FORMAT,\n rate: getSetting(runtime, \"EDGE_TTS_RATE\"),\n pitch: getSetting(runtime, \"EDGE_TTS_PITCH\"),\n volume: getSetting(runtime, \"EDGE_TTS_VOLUME\"),\n proxy: getSetting(runtime, \"EDGE_TTS_PROXY\"),\n timeoutMs: timeoutStr\n ? Number.parseInt(timeoutStr, 10)\n : DEFAULT_TIMEOUT_MS,\n };\n}\n\n/**\n * Resolve voice name - handles OpenAI-style voice names and Edge TTS voice IDs\n */\nfunction resolveVoice(voice: string | undefined, defaultVoice: string): string {\n if (!voice) return defaultVoice;\n\n // Check if it's a preset name\n const preset = VOICE_PRESETS[voice.toLowerCase()];\n if (preset) return preset;\n\n // Assume it's a direct Edge TTS voice ID\n return voice;\n}\n\n/**\n * Convert speed multiplier to Edge TTS rate string\n * speed: 1.0 = normal, 0.5 = half speed, 2.0 = double speed\n */\nfunction speedToRate(speed: number | undefined): string | undefined {\n if (speed === undefined || speed === 1.0) return undefined;\n const percentage = Math.round((speed - 1) * 100);\n return percentage >= 0 ? `+${percentage}%` : `${percentage}%`;\n}\n\n/**\n * Infer file extension from Edge TTS output format\n */\nfunction inferExtension(outputFormat: string): string {\n const normalized = outputFormat.toLowerCase();\n if (normalized.includes(\"webm\")) return \".webm\";\n if (normalized.includes(\"ogg\")) return \".ogg\";\n if (normalized.includes(\"opus\")) return \".opus\";\n if (\n normalized.includes(\"wav\") ||\n normalized.includes(\"riff\") ||\n normalized.includes(\"pcm\")\n ) {\n return \".wav\";\n }\n return \".mp3\";\n}\n\n/**\n * Generate speech using Microsoft Edge TTS\n */\nasync function generateSpeech(\n settings: EdgeTTSSettings,\n params: EdgeTTSParams,\n): Promise<Buffer> {\n const voice = resolveVoice(params.voice, settings.voice);\n const lang = params.lang ?? settings.lang;\n const outputFormat = params.outputFormat ?? settings.outputFormat;\n const rate = params.rate ?? speedToRate(params.speed) ?? settings.rate;\n const pitch = params.pitch ?? settings.pitch;\n const volume = params.volume ?? settings.volume;\n\n logger.debug(\n `[EdgeTTS] Generating speech with voice: ${voice}, lang: ${lang}`,\n );\n\n const tts = new EdgeTTS({\n voice,\n lang,\n outputFormat,\n saveSubtitles: false,\n proxy: settings.proxy,\n rate,\n pitch,\n volume,\n timeout: settings.timeoutMs,\n });\n\n // Create temp directory for output\n const tempDir = mkdtempSync(path.join(tmpdir(), \"edge-tts-\"));\n const extension = inferExtension(outputFormat);\n const outputPath = path.join(tempDir, `speech${extension}`);\n\n try {\n await tts.ttsPromise(params.text, outputPath);\n const audioBuffer = readFileSync(outputPath);\n return audioBuffer;\n } finally {\n // Cleanup temp directory\n try {\n rmSync(tempDir, { recursive: true, force: true });\n } catch {\n // Ignore cleanup errors\n }\n }\n}\n\n/**\n * Edge TTS Plugin for ElizaOS\n *\n * Provides free text-to-speech synthesis using Microsoft Edge's TTS service.\n * No API key required - uses the same TTS engine as Microsoft Edge browser.\n *\n * Features:\n * - High-quality neural voices\n * - Multiple languages and locales\n * - Adjustable rate, pitch, and volume\n * - No API key or payment required\n *\n * Optional environment variables:\n * - EDGE_TTS_VOICE: Voice ID (default: en-US-MichelleNeural)\n * - EDGE_TTS_LANG: Language code (default: en-US)\n * - EDGE_TTS_OUTPUT_FORMAT: Output format (default: audio-24khz-48kbitrate-mono-mp3)\n * - EDGE_TTS_RATE: Speech rate adjustment (e.g., +10%, -5%)\n * - EDGE_TTS_PITCH: Pitch adjustment (e.g., +5Hz, -10Hz)\n * - EDGE_TTS_VOLUME: Volume adjustment (e.g., +20%, -10%)\n * - EDGE_TTS_PROXY: HTTP proxy URL\n * - EDGE_TTS_TIMEOUT_MS: Request timeout (default: 30000)\n *\n * Popular voices:\n * - en-US-MichelleNeural (female, US English)\n * - en-US-GuyNeural (male, US English)\n * - en-US-JennyNeural (female, US English)\n * - en-US-AriaNeural (female, US English)\n * - en-GB-SoniaNeural (female, UK English)\n * - en-GB-RyanNeural (male, UK English)\n * - de-DE-KatjaNeural (female, German)\n * - fr-FR-DeniseNeural (female, French)\n * - es-ES-ElviraNeural (female, Spanish)\n * - ja-JP-NanamiNeural (female, Japanese)\n * - zh-CN-XiaoxiaoNeural (female, Chinese)\n */\nexport const edgeTTSPlugin: Plugin = {\n name: \"edge-tts\",\n description:\n \"Free text-to-speech synthesis using Microsoft Edge TTS - no API key required, high-quality neural voices\",\n models: {\n [ModelType.TEXT_TO_SPEECH]: async (\n runtime: IAgentRuntime,\n input: string | EdgeTTSParams,\n ): Promise<Buffer | ArrayBuffer | Uint8Array> => {\n const params: EdgeTTSParams =\n typeof input === \"string\" ? { text: input } : input;\n const settings = getEdgeTTSSettings(runtime);\n\n logger.log(\n `[EdgeTTS] Using TEXT_TO_SPEECH with voice: ${settings.voice}`,\n );\n\n if (!params.text || params.text.trim().length === 0) {\n throw new Error(\"TEXT_TO_SPEECH requires non-empty text\");\n }\n\n // Edge TTS has a practical limit around 5000 characters\n if (params.text.length > 5000) {\n throw new Error(\"TEXT_TO_SPEECH text exceeds 5000 character limit\");\n }\n\n try {\n const audioBuffer = await generateSpeech(settings, params);\n return audioBuffer;\n } catch (error: unknown) {\n const msg = error instanceof Error ? error.message : String(error);\n logger.error(`EdgeTTS model error: ${msg}`);\n throw error instanceof Error ? error : new Error(msg);\n }\n },\n },\n tests: [\n {\n name: \"test edge tts\",\n tests: [\n {\n name: \"Edge TTS settings validation\",\n fn: async (runtime: IAgentRuntime) => {\n const settings = getEdgeTTSSettings(runtime);\n\n if (!settings.voice) {\n throw new Error(\"Missing voice configuration\");\n }\n\n if (!settings.lang) {\n throw new Error(\"Missing language configuration\");\n }\n\n if (!settings.outputFormat) {\n throw new Error(\"Missing output format configuration\");\n }\n\n logger.success(\"Edge TTS settings validated successfully\");\n },\n },\n {\n name: \"Edge TTS voice preset mapping\",\n fn: async (_runtime: IAgentRuntime) => {\n // Test that OpenAI-style voice names map correctly\n const testCases = [\n { input: \"alloy\", expected: \"en-US-GuyNeural\" },\n { input: \"nova\", expected: \"en-US-JennyNeural\" },\n { input: \"shimmer\", expected: \"en-US-AriaNeural\" },\n {\n input: \"en-US-MichelleNeural\",\n expected: \"en-US-MichelleNeural\",\n },\n ];\n\n for (const tc of testCases) {\n const result = resolveVoice(tc.input, DEFAULT_VOICE);\n if (result !== tc.expected) {\n throw new Error(\n `Voice preset mapping failed: ${tc.input} -> ${result}, expected ${tc.expected}`,\n );\n }\n }\n\n logger.success(\"Voice preset mapping validated successfully\");\n },\n },\n {\n name: \"Edge TTS speed to rate conversion\",\n fn: async (_runtime: IAgentRuntime) => {\n const testCases = [\n { speed: 1.0, expected: undefined },\n { speed: 1.5, expected: \"+50%\" },\n { speed: 0.75, expected: \"-25%\" },\n { speed: 2.0, expected: \"+100%\" },\n ];\n\n for (const tc of testCases) {\n const result = speedToRate(tc.speed);\n if (result !== tc.expected) {\n throw new Error(\n `Speed conversion failed: ${tc.speed} -> ${result}, expected ${tc.expected}`,\n );\n }\n }\n\n logger.success(\"Speed to rate conversion validated successfully\");\n },\n },\n {\n name: \"Edge TTS generation (live test)\",\n fn: async (runtime: IAgentRuntime) => {\n const testText = \"Hello, this is a test of Edge TTS.\";\n\n try {\n const audioBuffer = (await runtime.useModel(\n ModelType.TEXT_TO_SPEECH,\n testText,\n )) as Buffer | Uint8Array;\n\n if (!audioBuffer || audioBuffer.length === 0) {\n throw new Error(\"Received empty audio buffer\");\n }\n\n logger.success(\n `Edge TTS generation successful: ${audioBuffer.length} bytes`,\n );\n } catch (error: unknown) {\n const msg =\n error instanceof Error ? error.message : String(error);\n // Edge TTS might fail in CI environments without network\n if (msg.includes(\"ENOTFOUND\") || msg.includes(\"network\")) {\n logger.warn(\n `Edge TTS live test skipped (network unavailable): ${msg}`,\n );\n return;\n }\n throw error;\n }\n },\n },\n ],\n },\n ],\n};\n\nexport default edgeTTSPlugin;\n\n// Re-export types\nexport type { EdgeTTSSettings, EdgeTTSParams };\n\n// Export helper functions for testing\nexport const _test = {\n resolveVoice,\n speedToRate,\n inferExtension,\n getEdgeTTSSettings,\n};\n"
|
|
5
|
+
"import { mkdtempSync, readFileSync, rmSync } from \"node:fs\";\nimport { tmpdir } from \"node:os\";\nimport path from \"node:path\";\nimport { type IAgentRuntime, logger, ModelType, type Plugin } from \"@elizaos/core\";\nimport { EdgeTTS } from \"node-edge-tts\";\n\n/**\n * Edge TTS voice settings configuration\n */\ninterface EdgeTTSSettings {\n voice: string;\n lang: string;\n outputFormat: string;\n rate?: string;\n pitch?: string;\n volume?: string;\n proxy?: string;\n timeoutMs: number;\n}\n\n/**\n * Extended TTS params with Edge-specific options\n */\ninterface EdgeTTSParams {\n text: string;\n voice?: string;\n speed?: number;\n /** Edge TTS specific: language code */\n lang?: string;\n /** Edge TTS specific: output format */\n outputFormat?: string;\n /** Edge TTS specific: rate adjustment (e.g., +10%, -5%) */\n rate?: string;\n /** Edge TTS specific: pitch adjustment (e.g., +5Hz, -10Hz) */\n pitch?: string;\n /** Edge TTS specific: volume adjustment (e.g., +20%, -10%) */\n volume?: string;\n}\n\n// Default voice configurations\nconst DEFAULT_VOICE = \"en-US-MichelleNeural\";\nconst DEFAULT_LANG = \"en-US\";\nconst DEFAULT_OUTPUT_FORMAT = \"audio-24khz-48kbitrate-mono-mp3\";\nconst DEFAULT_TIMEOUT_MS = 30000;\n\n// Voice presets mapping common voice names to Edge TTS voices\nconst VOICE_PRESETS: Record<string, string> = {\n // Generic voices (map to good defaults)\n alloy: \"en-US-GuyNeural\",\n echo: \"en-US-ChristopherNeural\",\n fable: \"en-GB-RyanNeural\",\n onyx: \"en-US-DavisNeural\",\n nova: \"en-US-JennyNeural\",\n shimmer: \"en-US-AriaNeural\",\n // Direct Edge TTS voice names pass through\n};\n\nfunction getSetting(runtime: IAgentRuntime, key: string, fallback?: string): string | undefined {\n const envValue =\n typeof process !== \"undefined\" && (process as { env?: Record<string, string> }).env\n ? (process as { env: Record<string, string> }).env[key]\n : undefined;\n return (runtime.getSetting(key) as string | undefined) ?? envValue ?? fallback;\n}\n\nfunction getEdgeTTSSettings(runtime: IAgentRuntime): EdgeTTSSettings {\n const timeoutStr = getSetting(runtime, \"EDGE_TTS_TIMEOUT_MS\");\n return {\n voice: getSetting(runtime, \"EDGE_TTS_VOICE\", DEFAULT_VOICE) ?? DEFAULT_VOICE,\n lang: getSetting(runtime, \"EDGE_TTS_LANG\", DEFAULT_LANG) ?? DEFAULT_LANG,\n outputFormat:\n getSetting(runtime, \"EDGE_TTS_OUTPUT_FORMAT\", DEFAULT_OUTPUT_FORMAT) ?? DEFAULT_OUTPUT_FORMAT,\n rate: getSetting(runtime, \"EDGE_TTS_RATE\"),\n pitch: getSetting(runtime, \"EDGE_TTS_PITCH\"),\n volume: getSetting(runtime, \"EDGE_TTS_VOLUME\"),\n proxy: getSetting(runtime, \"EDGE_TTS_PROXY\"),\n timeoutMs: timeoutStr ? Number.parseInt(timeoutStr, 10) : DEFAULT_TIMEOUT_MS,\n };\n}\n\n/**\n * Resolve voice name - handles OpenAI-style voice names and Edge TTS voice IDs\n */\nfunction resolveVoice(voice: string | undefined, defaultVoice: string): string {\n if (!voice) return defaultVoice;\n\n // Check if it's a preset name\n const preset = VOICE_PRESETS[voice.toLowerCase()];\n if (preset) return preset;\n\n // Assume it's a direct Edge TTS voice ID\n return voice;\n}\n\n/**\n * Convert speed multiplier to Edge TTS rate string\n * speed: 1.0 = normal, 0.5 = half speed, 2.0 = double speed\n */\nfunction speedToRate(speed: number | undefined): string | undefined {\n if (speed === undefined || speed === 1.0) return undefined;\n const percentage = Math.round((speed - 1) * 100);\n return percentage >= 0 ? `+${percentage}%` : `${percentage}%`;\n}\n\n/**\n * Infer file extension from Edge TTS output format\n */\nfunction inferExtension(outputFormat: string): string {\n const normalized = outputFormat.toLowerCase();\n if (normalized.includes(\"webm\")) return \".webm\";\n if (normalized.includes(\"ogg\")) return \".ogg\";\n if (normalized.includes(\"opus\")) return \".opus\";\n if (normalized.includes(\"wav\") || normalized.includes(\"riff\") || normalized.includes(\"pcm\")) {\n return \".wav\";\n }\n return \".mp3\";\n}\n\n/**\n * Generate speech using Microsoft Edge TTS\n */\nasync function generateSpeech(settings: EdgeTTSSettings, params: EdgeTTSParams): Promise<Buffer> {\n const voice = resolveVoice(params.voice, settings.voice);\n const lang = params.lang ?? settings.lang;\n const outputFormat = params.outputFormat ?? settings.outputFormat;\n const rate = params.rate ?? speedToRate(params.speed) ?? settings.rate;\n const pitch = params.pitch ?? settings.pitch;\n const volume = params.volume ?? settings.volume;\n\n logger.debug(`[EdgeTTS] Generating speech with voice: ${voice}, lang: ${lang}`);\n\n const tts = new EdgeTTS({\n voice,\n lang,\n outputFormat,\n saveSubtitles: false,\n proxy: settings.proxy,\n rate,\n pitch,\n volume,\n timeout: settings.timeoutMs,\n });\n\n // Create temp directory for output\n const tempDir = mkdtempSync(path.join(tmpdir(), \"edge-tts-\"));\n const extension = inferExtension(outputFormat);\n const outputPath = path.join(tempDir, `speech${extension}`);\n\n try {\n await tts.ttsPromise(params.text, outputPath);\n const audioBuffer = readFileSync(outputPath);\n return audioBuffer;\n } finally {\n // Cleanup temp directory\n try {\n rmSync(tempDir, { recursive: true, force: true });\n } catch {\n // Ignore cleanup errors\n }\n }\n}\n\n/**\n * Edge TTS Plugin for ElizaOS\n *\n * Provides free text-to-speech synthesis using Microsoft Edge's TTS service.\n * No API key required - uses the same TTS engine as Microsoft Edge browser.\n *\n * Features:\n * - High-quality neural voices\n * - Multiple languages and locales\n * - Adjustable rate, pitch, and volume\n * - No API key or payment required\n *\n * Optional environment variables:\n * - EDGE_TTS_VOICE: Voice ID (default: en-US-MichelleNeural)\n * - EDGE_TTS_LANG: Language code (default: en-US)\n * - EDGE_TTS_OUTPUT_FORMAT: Output format (default: audio-24khz-48kbitrate-mono-mp3)\n * - EDGE_TTS_RATE: Speech rate adjustment (e.g., +10%, -5%)\n * - EDGE_TTS_PITCH: Pitch adjustment (e.g., +5Hz, -10Hz)\n * - EDGE_TTS_VOLUME: Volume adjustment (e.g., +20%, -10%)\n * - EDGE_TTS_PROXY: HTTP proxy URL\n * - EDGE_TTS_TIMEOUT_MS: Request timeout (default: 30000)\n *\n * Popular voices:\n * - en-US-MichelleNeural (female, US English)\n * - en-US-GuyNeural (male, US English)\n * - en-US-JennyNeural (female, US English)\n * - en-US-AriaNeural (female, US English)\n * - en-GB-SoniaNeural (female, UK English)\n * - en-GB-RyanNeural (male, UK English)\n * - de-DE-KatjaNeural (female, German)\n * - fr-FR-DeniseNeural (female, French)\n * - es-ES-ElviraNeural (female, Spanish)\n * - ja-JP-NanamiNeural (female, Japanese)\n * - zh-CN-XiaoxiaoNeural (female, Chinese)\n */\nexport const edgeTTSPlugin: Plugin = {\n name: \"edge-tts\",\n description:\n \"Free text-to-speech synthesis using Microsoft Edge TTS - no API key required, high-quality neural voices\",\n models: {\n [ModelType.TEXT_TO_SPEECH]: async (\n runtime: IAgentRuntime,\n input: string | EdgeTTSParams\n ): Promise<Buffer | ArrayBuffer | Uint8Array> => {\n const params: EdgeTTSParams = typeof input === \"string\" ? { text: input } : input;\n const settings = getEdgeTTSSettings(runtime);\n\n logger.log(`[EdgeTTS] Using TEXT_TO_SPEECH with voice: ${settings.voice}`);\n\n if (!params.text || params.text.trim().length === 0) {\n throw new Error(\"TEXT_TO_SPEECH requires non-empty text\");\n }\n\n // Edge TTS has a practical limit around 5000 characters\n if (params.text.length > 5000) {\n throw new Error(\"TEXT_TO_SPEECH text exceeds 5000 character limit\");\n }\n\n try {\n const audioBuffer = await generateSpeech(settings, params);\n return audioBuffer;\n } catch (error: unknown) {\n const msg = error instanceof Error ? error.message : String(error);\n logger.error(`EdgeTTS model error: ${msg}`);\n throw error instanceof Error ? error : new Error(msg);\n }\n },\n },\n tests: [\n {\n name: \"test edge tts\",\n tests: [\n {\n name: \"Edge TTS settings validation\",\n fn: async (runtime: IAgentRuntime) => {\n const settings = getEdgeTTSSettings(runtime);\n\n if (!settings.voice) {\n throw new Error(\"Missing voice configuration\");\n }\n\n if (!settings.lang) {\n throw new Error(\"Missing language configuration\");\n }\n\n if (!settings.outputFormat) {\n throw new Error(\"Missing output format configuration\");\n }\n\n logger.success(\"Edge TTS settings validated successfully\");\n },\n },\n {\n name: \"Edge TTS voice preset mapping\",\n fn: async (_runtime: IAgentRuntime) => {\n // Test that OpenAI-style voice names map correctly\n const testCases = [\n { input: \"alloy\", expected: \"en-US-GuyNeural\" },\n { input: \"nova\", expected: \"en-US-JennyNeural\" },\n { input: \"shimmer\", expected: \"en-US-AriaNeural\" },\n {\n input: \"en-US-MichelleNeural\",\n expected: \"en-US-MichelleNeural\",\n },\n ];\n\n for (const tc of testCases) {\n const result = resolveVoice(tc.input, DEFAULT_VOICE);\n if (result !== tc.expected) {\n throw new Error(\n `Voice preset mapping failed: ${tc.input} -> ${result}, expected ${tc.expected}`\n );\n }\n }\n\n logger.success(\"Voice preset mapping validated successfully\");\n },\n },\n {\n name: \"Edge TTS speed to rate conversion\",\n fn: async (_runtime: IAgentRuntime) => {\n const testCases = [\n { speed: 1.0, expected: undefined },\n { speed: 1.5, expected: \"+50%\" },\n { speed: 0.75, expected: \"-25%\" },\n { speed: 2.0, expected: \"+100%\" },\n ];\n\n for (const tc of testCases) {\n const result = speedToRate(tc.speed);\n if (result !== tc.expected) {\n throw new Error(\n `Speed conversion failed: ${tc.speed} -> ${result}, expected ${tc.expected}`\n );\n }\n }\n\n logger.success(\"Speed to rate conversion validated successfully\");\n },\n },\n {\n name: \"Edge TTS generation (live test)\",\n fn: async (runtime: IAgentRuntime) => {\n const testText = \"Hello, this is a test of Edge TTS.\";\n\n try {\n const audioBuffer = (await runtime.useModel(ModelType.TEXT_TO_SPEECH, testText)) as\n | Buffer\n | Uint8Array;\n\n if (!audioBuffer || audioBuffer.length === 0) {\n throw new Error(\"Received empty audio buffer\");\n }\n\n logger.success(`Edge TTS generation successful: ${audioBuffer.length} bytes`);\n } catch (error: unknown) {\n const msg = error instanceof Error ? error.message : String(error);\n // Edge TTS might fail in CI environments without network\n if (msg.includes(\"ENOTFOUND\") || msg.includes(\"network\")) {\n logger.warn(`Edge TTS live test skipped (network unavailable): ${msg}`);\n return;\n }\n throw error;\n }\n },\n },\n ],\n },\n ],\n};\n\nexport default edgeTTSPlugin;\n\n// Re-export types\nexport type { EdgeTTSSettings, EdgeTTSParams };\n\n// Export helper functions for testing\nexport const _test = {\n resolveVoice,\n speedToRate,\n inferExtension,\n getEdgeTTSSettings,\n};\n"
|
|
6
6
|
],
|
|
7
|
-
"mappings": ";;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
|
|
8
|
-
"debugId": "
|
|
7
|
+
"mappings": ";;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;AAAkD,IAAlD;AACuB,IAAvB;AACiB,IAAjB;AACmE,IAAnE;AACwB,IAAxB;AAoCA,IAAM,gBAAgB;AACtB,IAAM,eAAe;AACrB,IAAM,wBAAwB;AAC9B,IAAM,qBAAqB;AAG3B,IAAM,gBAAwC;AAAA,EAE5C,OAAO;AAAA,EACP,MAAM;AAAA,EACN,OAAO;AAAA,EACP,MAAM;AAAA,EACN,MAAM;AAAA,EACN,SAAS;AAEX;AAEA,SAAS,UAAU,CAAC,SAAwB,KAAa,UAAuC;AAAA,EAC9F,MAAM,WACJ,OAAO,YAAY,eAAgB,QAA6C,MAC3E,QAA4C,IAAI,OACjD;AAAA,EACN,OAAQ,QAAQ,WAAW,GAAG,KAA4B,YAAY;AAAA;AAGxE,SAAS,kBAAkB,CAAC,SAAyC;AAAA,EACnE,MAAM,aAAa,WAAW,SAAS,qBAAqB;AAAA,EAC5D,OAAO;AAAA,IACL,OAAO,WAAW,SAAS,kBAAkB,aAAa,KAAK;AAAA,IAC/D,MAAM,WAAW,SAAS,iBAAiB,YAAY,KAAK;AAAA,IAC5D,cACE,WAAW,SAAS,0BAA0B,qBAAqB,KAAK;AAAA,IAC1E,MAAM,WAAW,SAAS,eAAe;AAAA,IACzC,OAAO,WAAW,SAAS,gBAAgB;AAAA,IAC3C,QAAQ,WAAW,SAAS,iBAAiB;AAAA,IAC7C,OAAO,WAAW,SAAS,gBAAgB;AAAA,IAC3C,WAAW,aAAa,OAAO,SAAS,YAAY,EAAE,IAAI;AAAA,EAC5D;AAAA;AAMF,SAAS,YAAY,CAAC,OAA2B,cAA8B;AAAA,EAC7E,IAAI,CAAC;AAAA,IAAO,OAAO;AAAA,EAGnB,MAAM,SAAS,cAAc,MAAM,YAAY;AAAA,EAC/C,IAAI;AAAA,IAAQ,OAAO;AAAA,EAGnB,OAAO;AAAA;AAOT,SAAS,WAAW,CAAC,OAA+C;AAAA,EAClE,IAAI,UAAU,aAAa,UAAU;AAAA,IAAK;AAAA,EAC1C,MAAM,aAAa,KAAK,OAAO,QAAQ,KAAK,GAAG;AAAA,EAC/C,OAAO,cAAc,IAAI,IAAI,gBAAgB,GAAG;AAAA;AAMlD,SAAS,cAAc,CAAC,cAA8B;AAAA,EACpD,MAAM,aAAa,aAAa,YAAY;AAAA,EAC5C,IAAI,WAAW,SAAS,MAAM;AAAA,IAAG,OAAO;AAAA,EACxC,IAAI,WAAW,SAAS,KAAK;AAAA,IAAG,OAAO;AAAA,EACvC,IAAI,WAAW,SAAS,MAAM;AAAA,IAAG,OAAO;AAAA,EACxC,IAAI,WAAW,SAAS,KAAK,KAAK,WAAW,SAAS,MAAM,KAAK,WAAW,SAAS,KAAK,GAAG;AAAA,IAC3F,OAAO;AAAA,EACT;AAAA,EACA,OAAO;AAAA;AAMT,eAAe,cAAc,CAAC,UAA2B,QAAwC;AAAA,EAC/F,MAAM,QAAQ,aAAa,OAAO,OAAO,SAAS,KAAK;AAAA,EACvD,MAAM,OAAO,OAAO,QAAQ,SAAS;AAAA,EACrC,MAAM,eAAe,OAAO,gBAAgB,SAAS;AAAA,EACrD,MAAM,OAAO,OAAO,QAAQ,YAAY,OAAO,KAAK,KAAK,SAAS;AAAA,EAClE,MAAM,QAAQ,OAAO,SAAS,SAAS;AAAA,EACvC,MAAM,SAAS,OAAO,UAAU,SAAS;AAAA,EAEzC,mBAAO,MAAM,2CAA2C,gBAAgB,MAAM;AAAA,EAE9E,MAAM,MAAM,IAAI,6BAAQ;AAAA,IACtB;AAAA,IACA;AAAA,IACA;AAAA,IACA,eAAe;AAAA,IACf,OAAO,SAAS;AAAA,IAChB;AAAA,IACA;AAAA,IACA;AAAA,IACA,SAAS,SAAS;AAAA,EACpB,CAAC;AAAA,EAGD,MAAM,UAAU,2BAAY,yBAAK,KAAK,sBAAO,GAAG,WAAW,CAAC;AAAA,EAC5D,MAAM,YAAY,eAAe,YAAY;AAAA,EAC7C,MAAM,aAAa,yBAAK,KAAK,SAAS,SAAS,WAAW;AAAA,EAE1D,IAAI;AAAA,IACF,MAAM,IAAI,WAAW,OAAO,MAAM,UAAU;AAAA,IAC5C,MAAM,cAAc,4BAAa,UAAU;AAAA,IAC3C,OAAO;AAAA,YACP;AAAA,IAEA,IAAI;AAAA,MACF,sBAAO,SAAS,EAAE,WAAW,MAAM,OAAO,KAAK,CAAC;AAAA,MAChD,MAAM;AAAA;AAAA;AAyCL,IAAM,gBAAwB;AAAA,EACnC,MAAM;AAAA,EACN,aACE;AAAA,EACF,QAAQ;AAAA,KACL,sBAAU,iBAAiB,OAC1B,SACA,UAC+C;AAAA,MAC/C,MAAM,SAAwB,OAAO,UAAU,WAAW,EAAE,MAAM,MAAM,IAAI;AAAA,MAC5E,MAAM,WAAW,mBAAmB,OAAO;AAAA,MAE3C,mBAAO,IAAI,8CAA8C,SAAS,OAAO;AAAA,MAEzE,IAAI,CAAC,OAAO,QAAQ,OAAO,KAAK,KAAK,EAAE,WAAW,GAAG;AAAA,QACnD,MAAM,IAAI,MAAM,wCAAwC;AAAA,MAC1D;AAAA,MAGA,IAAI,OAAO,KAAK,SAAS,MAAM;AAAA,QAC7B,MAAM,IAAI,MAAM,kDAAkD;AAAA,MACpE;AAAA,MAEA,IAAI;AAAA,QACF,MAAM,cAAc,MAAM,eAAe,UAAU,MAAM;AAAA,QACzD,OAAO;AAAA,QACP,OAAO,OAAgB;AAAA,QACvB,MAAM,MAAM,iBAAiB,QAAQ,MAAM,UAAU,OAAO,KAAK;AAAA,QACjE,mBAAO,MAAM,wBAAwB,KAAK;AAAA,QAC1C,MAAM,iBAAiB,QAAQ,QAAQ,IAAI,MAAM,GAAG;AAAA;AAAA;AAAA,EAG1D;AAAA,EACA,OAAO;AAAA,IACL;AAAA,MACE,MAAM;AAAA,MACN,OAAO;AAAA,QACL;AAAA,UACE,MAAM;AAAA,UACN,IAAI,OAAO,YAA2B;AAAA,YACpC,MAAM,WAAW,mBAAmB,OAAO;AAAA,YAE3C,IAAI,CAAC,SAAS,OAAO;AAAA,cACnB,MAAM,IAAI,MAAM,6BAA6B;AAAA,YAC/C;AAAA,YAEA,IAAI,CAAC,SAAS,MAAM;AAAA,cAClB,MAAM,IAAI,MAAM,gCAAgC;AAAA,YAClD;AAAA,YAEA,IAAI,CAAC,SAAS,cAAc;AAAA,cAC1B,MAAM,IAAI,MAAM,qCAAqC;AAAA,YACvD;AAAA,YAEA,mBAAO,QAAQ,0CAA0C;AAAA;AAAA,QAE7D;AAAA,QACA;AAAA,UACE,MAAM;AAAA,UACN,IAAI,OAAO,aAA4B;AAAA,YAErC,MAAM,YAAY;AAAA,cAChB,EAAE,OAAO,SAAS,UAAU,kBAAkB;AAAA,cAC9C,EAAE,OAAO,QAAQ,UAAU,oBAAoB;AAAA,cAC/C,EAAE,OAAO,WAAW,UAAU,mBAAmB;AAAA,cACjD;AAAA,gBACE,OAAO;AAAA,gBACP,UAAU;AAAA,cACZ;AAAA,YACF;AAAA,YAEA,WAAW,MAAM,WAAW;AAAA,cAC1B,MAAM,SAAS,aAAa,GAAG,OAAO,aAAa;AAAA,cACnD,IAAI,WAAW,GAAG,UAAU;AAAA,gBAC1B,MAAM,IAAI,MACR,gCAAgC,GAAG,YAAY,oBAAoB,GAAG,UACxE;AAAA,cACF;AAAA,YACF;AAAA,YAEA,mBAAO,QAAQ,6CAA6C;AAAA;AAAA,QAEhE;AAAA,QACA;AAAA,UACE,MAAM;AAAA,UACN,IAAI,OAAO,aAA4B;AAAA,YACrC,MAAM,YAAY;AAAA,cAChB,EAAE,OAAO,GAAK,UAAU,UAAU;AAAA,cAClC,EAAE,OAAO,KAAK,UAAU,OAAO;AAAA,cAC/B,EAAE,OAAO,MAAM,UAAU,OAAO;AAAA,cAChC,EAAE,OAAO,GAAK,UAAU,QAAQ;AAAA,YAClC;AAAA,YAEA,WAAW,MAAM,WAAW;AAAA,cAC1B,MAAM,SAAS,YAAY,GAAG,KAAK;AAAA,cACnC,IAAI,WAAW,GAAG,UAAU;AAAA,gBAC1B,MAAM,IAAI,MACR,4BAA4B,GAAG,YAAY,oBAAoB,GAAG,UACpE;AAAA,cACF;AAAA,YACF;AAAA,YAEA,mBAAO,QAAQ,iDAAiD;AAAA;AAAA,QAEpE;AAAA,QACA;AAAA,UACE,MAAM;AAAA,UACN,IAAI,OAAO,YAA2B;AAAA,YACpC,MAAM,WAAW;AAAA,YAEjB,IAAI;AAAA,cACF,MAAM,cAAe,MAAM,QAAQ,SAAS,sBAAU,gBAAgB,QAAQ;AAAA,cAI9E,IAAI,CAAC,eAAe,YAAY,WAAW,GAAG;AAAA,gBAC5C,MAAM,IAAI,MAAM,6BAA6B;AAAA,cAC/C;AAAA,cAEA,mBAAO,QAAQ,mCAAmC,YAAY,cAAc;AAAA,cAC5E,OAAO,OAAgB;AAAA,cACvB,MAAM,MAAM,iBAAiB,QAAQ,MAAM,UAAU,OAAO,KAAK;AAAA,cAEjE,IAAI,IAAI,SAAS,WAAW,KAAK,IAAI,SAAS,SAAS,GAAG;AAAA,gBACxD,mBAAO,KAAK,qDAAqD,KAAK;AAAA,gBACtE;AAAA,cACF;AAAA,cACA,MAAM;AAAA;AAAA;AAAA,QAGZ;AAAA,MACF;AAAA,IACF;AAAA,EACF;AACF;AAEA,IAAe;AAMR,IAAM,QAAQ;AAAA,EACnB;AAAA,EACA;AAAA,EACA;AAAA,EACA;AACF;",
|
|
8
|
+
"debugId": "44DEBD6EBE84FDA064756E2164756E21",
|
|
9
9
|
"names": []
|
|
10
10
|
}
|
package/dist/index.d.ts
CHANGED
|
@@ -1,90 +1 @@
|
|
|
1
|
-
|
|
2
|
-
/**
|
|
3
|
-
* Edge TTS voice settings configuration
|
|
4
|
-
*/
|
|
5
|
-
interface EdgeTTSSettings {
|
|
6
|
-
voice: string;
|
|
7
|
-
lang: string;
|
|
8
|
-
outputFormat: string;
|
|
9
|
-
rate?: string;
|
|
10
|
-
pitch?: string;
|
|
11
|
-
volume?: string;
|
|
12
|
-
proxy?: string;
|
|
13
|
-
timeoutMs: number;
|
|
14
|
-
}
|
|
15
|
-
/**
|
|
16
|
-
* Extended TTS params with Edge-specific options
|
|
17
|
-
*/
|
|
18
|
-
interface EdgeTTSParams {
|
|
19
|
-
text: string;
|
|
20
|
-
voice?: string;
|
|
21
|
-
speed?: number;
|
|
22
|
-
/** Edge TTS specific: language code */
|
|
23
|
-
lang?: string;
|
|
24
|
-
/** Edge TTS specific: output format */
|
|
25
|
-
outputFormat?: string;
|
|
26
|
-
/** Edge TTS specific: rate adjustment (e.g., +10%, -5%) */
|
|
27
|
-
rate?: string;
|
|
28
|
-
/** Edge TTS specific: pitch adjustment (e.g., +5Hz, -10Hz) */
|
|
29
|
-
pitch?: string;
|
|
30
|
-
/** Edge TTS specific: volume adjustment (e.g., +20%, -10%) */
|
|
31
|
-
volume?: string;
|
|
32
|
-
}
|
|
33
|
-
declare function getEdgeTTSSettings(runtime: IAgentRuntime): EdgeTTSSettings;
|
|
34
|
-
/**
|
|
35
|
-
* Resolve voice name - handles OpenAI-style voice names and Edge TTS voice IDs
|
|
36
|
-
*/
|
|
37
|
-
declare function resolveVoice(voice: string | undefined, defaultVoice: string): string;
|
|
38
|
-
/**
|
|
39
|
-
* Convert speed multiplier to Edge TTS rate string
|
|
40
|
-
* speed: 1.0 = normal, 0.5 = half speed, 2.0 = double speed
|
|
41
|
-
*/
|
|
42
|
-
declare function speedToRate(speed: number | undefined): string | undefined;
|
|
43
|
-
/**
|
|
44
|
-
* Infer file extension from Edge TTS output format
|
|
45
|
-
*/
|
|
46
|
-
declare function inferExtension(outputFormat: string): string;
|
|
47
|
-
/**
|
|
48
|
-
* Edge TTS Plugin for ElizaOS
|
|
49
|
-
*
|
|
50
|
-
* Provides free text-to-speech synthesis using Microsoft Edge's TTS service.
|
|
51
|
-
* No API key required - uses the same TTS engine as Microsoft Edge browser.
|
|
52
|
-
*
|
|
53
|
-
* Features:
|
|
54
|
-
* - High-quality neural voices
|
|
55
|
-
* - Multiple languages and locales
|
|
56
|
-
* - Adjustable rate, pitch, and volume
|
|
57
|
-
* - No API key or payment required
|
|
58
|
-
*
|
|
59
|
-
* Optional environment variables:
|
|
60
|
-
* - EDGE_TTS_VOICE: Voice ID (default: en-US-MichelleNeural)
|
|
61
|
-
* - EDGE_TTS_LANG: Language code (default: en-US)
|
|
62
|
-
* - EDGE_TTS_OUTPUT_FORMAT: Output format (default: audio-24khz-48kbitrate-mono-mp3)
|
|
63
|
-
* - EDGE_TTS_RATE: Speech rate adjustment (e.g., +10%, -5%)
|
|
64
|
-
* - EDGE_TTS_PITCH: Pitch adjustment (e.g., +5Hz, -10Hz)
|
|
65
|
-
* - EDGE_TTS_VOLUME: Volume adjustment (e.g., +20%, -10%)
|
|
66
|
-
* - EDGE_TTS_PROXY: HTTP proxy URL
|
|
67
|
-
* - EDGE_TTS_TIMEOUT_MS: Request timeout (default: 30000)
|
|
68
|
-
*
|
|
69
|
-
* Popular voices:
|
|
70
|
-
* - en-US-MichelleNeural (female, US English)
|
|
71
|
-
* - en-US-GuyNeural (male, US English)
|
|
72
|
-
* - en-US-JennyNeural (female, US English)
|
|
73
|
-
* - en-US-AriaNeural (female, US English)
|
|
74
|
-
* - en-GB-SoniaNeural (female, UK English)
|
|
75
|
-
* - en-GB-RyanNeural (male, UK English)
|
|
76
|
-
* - de-DE-KatjaNeural (female, German)
|
|
77
|
-
* - fr-FR-DeniseNeural (female, French)
|
|
78
|
-
* - es-ES-ElviraNeural (female, Spanish)
|
|
79
|
-
* - ja-JP-NanamiNeural (female, Japanese)
|
|
80
|
-
* - zh-CN-XiaoxiaoNeural (female, Chinese)
|
|
81
|
-
*/
|
|
82
|
-
export declare const edgeTTSPlugin: Plugin;
|
|
83
|
-
export default edgeTTSPlugin;
|
|
84
|
-
export type { EdgeTTSSettings, EdgeTTSParams };
|
|
85
|
-
export declare const _test: {
|
|
86
|
-
resolveVoice: typeof resolveVoice;
|
|
87
|
-
speedToRate: typeof speedToRate;
|
|
88
|
-
inferExtension: typeof inferExtension;
|
|
89
|
-
getEdgeTTSSettings: typeof getEdgeTTSSettings;
|
|
90
|
-
};
|
|
1
|
+
export * from "@elizaos/core";
|
package/dist/node/index.node.js
CHANGED
|
@@ -1,12 +1,9 @@
|
|
|
1
1
|
// src/index.ts
|
|
2
|
-
import {
|
|
3
|
-
ModelType,
|
|
4
|
-
logger
|
|
5
|
-
} from "@elizaos/core";
|
|
6
|
-
import { EdgeTTS } from "node-edge-tts";
|
|
7
|
-
import { mkdtempSync, rmSync, readFileSync } from "node:fs";
|
|
2
|
+
import { mkdtempSync, readFileSync, rmSync } from "node:fs";
|
|
8
3
|
import { tmpdir } from "node:os";
|
|
9
4
|
import path from "node:path";
|
|
5
|
+
import { logger, ModelType } from "@elizaos/core";
|
|
6
|
+
import { EdgeTTS } from "node-edge-tts";
|
|
10
7
|
var DEFAULT_VOICE = "en-US-MichelleNeural";
|
|
11
8
|
var DEFAULT_LANG = "en-US";
|
|
12
9
|
var DEFAULT_OUTPUT_FORMAT = "audio-24khz-48kbitrate-mono-mp3";
|
|
@@ -215,4 +212,4 @@ export {
|
|
|
215
212
|
_test
|
|
216
213
|
};
|
|
217
214
|
|
|
218
|
-
//# debugId=
|
|
215
|
+
//# debugId=72B923D58112D3ED64756E2164756E21
|
|
@@ -2,9 +2,9 @@
|
|
|
2
2
|
"version": 3,
|
|
3
3
|
"sources": ["../../src/index.ts"],
|
|
4
4
|
"sourcesContent": [
|
|
5
|
-
"import {\n type IAgentRuntime,\n ModelType,\n type Plugin,\n logger,\n} from \"@elizaos/core\";\nimport { EdgeTTS } from \"node-edge-tts\";\nimport { mkdtempSync, rmSync, readFileSync } from \"node:fs\";\nimport { tmpdir } from \"node:os\";\nimport path from \"node:path\";\n\n/**\n * Edge TTS voice settings configuration\n */\ninterface EdgeTTSSettings {\n voice: string;\n lang: string;\n outputFormat: string;\n rate?: string;\n pitch?: string;\n volume?: string;\n proxy?: string;\n timeoutMs: number;\n}\n\n/**\n * Extended TTS params with Edge-specific options\n */\ninterface EdgeTTSParams {\n text: string;\n voice?: string;\n speed?: number;\n /** Edge TTS specific: language code */\n lang?: string;\n /** Edge TTS specific: output format */\n outputFormat?: string;\n /** Edge TTS specific: rate adjustment (e.g., +10%, -5%) */\n rate?: string;\n /** Edge TTS specific: pitch adjustment (e.g., +5Hz, -10Hz) */\n pitch?: string;\n /** Edge TTS specific: volume adjustment (e.g., +20%, -10%) */\n volume?: string;\n}\n\n// Default voice configurations\nconst DEFAULT_VOICE = \"en-US-MichelleNeural\";\nconst DEFAULT_LANG = \"en-US\";\nconst DEFAULT_OUTPUT_FORMAT = \"audio-24khz-48kbitrate-mono-mp3\";\nconst DEFAULT_TIMEOUT_MS = 30000;\n\n// Voice presets mapping common voice names to Edge TTS voices\nconst VOICE_PRESETS: Record<string, string> = {\n // Generic voices (map to good defaults)\n alloy: \"en-US-GuyNeural\",\n echo: \"en-US-ChristopherNeural\",\n fable: \"en-GB-RyanNeural\",\n onyx: \"en-US-DavisNeural\",\n nova: \"en-US-JennyNeural\",\n shimmer: \"en-US-AriaNeural\",\n // Direct Edge TTS voice names pass through\n};\n\nfunction getSetting(\n runtime: IAgentRuntime,\n key: string,\n fallback?: string,\n): string | undefined {\n const envValue =\n typeof process !== \"undefined\" &&\n (process as { env?: Record<string, string> }).env\n ? (process as { env: Record<string, string> }).env[key]\n : undefined;\n return (\n (runtime.getSetting(key) as string | undefined) ?? envValue ?? fallback\n );\n}\n\nfunction getEdgeTTSSettings(runtime: IAgentRuntime): EdgeTTSSettings {\n const timeoutStr = getSetting(runtime, \"EDGE_TTS_TIMEOUT_MS\");\n return {\n voice:\n getSetting(runtime, \"EDGE_TTS_VOICE\", DEFAULT_VOICE) ?? DEFAULT_VOICE,\n lang: getSetting(runtime, \"EDGE_TTS_LANG\", DEFAULT_LANG) ?? DEFAULT_LANG,\n outputFormat:\n getSetting(runtime, \"EDGE_TTS_OUTPUT_FORMAT\", DEFAULT_OUTPUT_FORMAT) ??\n DEFAULT_OUTPUT_FORMAT,\n rate: getSetting(runtime, \"EDGE_TTS_RATE\"),\n pitch: getSetting(runtime, \"EDGE_TTS_PITCH\"),\n volume: getSetting(runtime, \"EDGE_TTS_VOLUME\"),\n proxy: getSetting(runtime, \"EDGE_TTS_PROXY\"),\n timeoutMs: timeoutStr\n ? Number.parseInt(timeoutStr, 10)\n : DEFAULT_TIMEOUT_MS,\n };\n}\n\n/**\n * Resolve voice name - handles OpenAI-style voice names and Edge TTS voice IDs\n */\nfunction resolveVoice(voice: string | undefined, defaultVoice: string): string {\n if (!voice) return defaultVoice;\n\n // Check if it's a preset name\n const preset = VOICE_PRESETS[voice.toLowerCase()];\n if (preset) return preset;\n\n // Assume it's a direct Edge TTS voice ID\n return voice;\n}\n\n/**\n * Convert speed multiplier to Edge TTS rate string\n * speed: 1.0 = normal, 0.5 = half speed, 2.0 = double speed\n */\nfunction speedToRate(speed: number | undefined): string | undefined {\n if (speed === undefined || speed === 1.0) return undefined;\n const percentage = Math.round((speed - 1) * 100);\n return percentage >= 0 ? `+${percentage}%` : `${percentage}%`;\n}\n\n/**\n * Infer file extension from Edge TTS output format\n */\nfunction inferExtension(outputFormat: string): string {\n const normalized = outputFormat.toLowerCase();\n if (normalized.includes(\"webm\")) return \".webm\";\n if (normalized.includes(\"ogg\")) return \".ogg\";\n if (normalized.includes(\"opus\")) return \".opus\";\n if (\n normalized.includes(\"wav\") ||\n normalized.includes(\"riff\") ||\n normalized.includes(\"pcm\")\n ) {\n return \".wav\";\n }\n return \".mp3\";\n}\n\n/**\n * Generate speech using Microsoft Edge TTS\n */\nasync function generateSpeech(\n settings: EdgeTTSSettings,\n params: EdgeTTSParams,\n): Promise<Buffer> {\n const voice = resolveVoice(params.voice, settings.voice);\n const lang = params.lang ?? settings.lang;\n const outputFormat = params.outputFormat ?? settings.outputFormat;\n const rate = params.rate ?? speedToRate(params.speed) ?? settings.rate;\n const pitch = params.pitch ?? settings.pitch;\n const volume = params.volume ?? settings.volume;\n\n logger.debug(\n `[EdgeTTS] Generating speech with voice: ${voice}, lang: ${lang}`,\n );\n\n const tts = new EdgeTTS({\n voice,\n lang,\n outputFormat,\n saveSubtitles: false,\n proxy: settings.proxy,\n rate,\n pitch,\n volume,\n timeout: settings.timeoutMs,\n });\n\n // Create temp directory for output\n const tempDir = mkdtempSync(path.join(tmpdir(), \"edge-tts-\"));\n const extension = inferExtension(outputFormat);\n const outputPath = path.join(tempDir, `speech${extension}`);\n\n try {\n await tts.ttsPromise(params.text, outputPath);\n const audioBuffer = readFileSync(outputPath);\n return audioBuffer;\n } finally {\n // Cleanup temp directory\n try {\n rmSync(tempDir, { recursive: true, force: true });\n } catch {\n // Ignore cleanup errors\n }\n }\n}\n\n/**\n * Edge TTS Plugin for ElizaOS\n *\n * Provides free text-to-speech synthesis using Microsoft Edge's TTS service.\n * No API key required - uses the same TTS engine as Microsoft Edge browser.\n *\n * Features:\n * - High-quality neural voices\n * - Multiple languages and locales\n * - Adjustable rate, pitch, and volume\n * - No API key or payment required\n *\n * Optional environment variables:\n * - EDGE_TTS_VOICE: Voice ID (default: en-US-MichelleNeural)\n * - EDGE_TTS_LANG: Language code (default: en-US)\n * - EDGE_TTS_OUTPUT_FORMAT: Output format (default: audio-24khz-48kbitrate-mono-mp3)\n * - EDGE_TTS_RATE: Speech rate adjustment (e.g., +10%, -5%)\n * - EDGE_TTS_PITCH: Pitch adjustment (e.g., +5Hz, -10Hz)\n * - EDGE_TTS_VOLUME: Volume adjustment (e.g., +20%, -10%)\n * - EDGE_TTS_PROXY: HTTP proxy URL\n * - EDGE_TTS_TIMEOUT_MS: Request timeout (default: 30000)\n *\n * Popular voices:\n * - en-US-MichelleNeural (female, US English)\n * - en-US-GuyNeural (male, US English)\n * - en-US-JennyNeural (female, US English)\n * - en-US-AriaNeural (female, US English)\n * - en-GB-SoniaNeural (female, UK English)\n * - en-GB-RyanNeural (male, UK English)\n * - de-DE-KatjaNeural (female, German)\n * - fr-FR-DeniseNeural (female, French)\n * - es-ES-ElviraNeural (female, Spanish)\n * - ja-JP-NanamiNeural (female, Japanese)\n * - zh-CN-XiaoxiaoNeural (female, Chinese)\n */\nexport const edgeTTSPlugin: Plugin = {\n name: \"edge-tts\",\n description:\n \"Free text-to-speech synthesis using Microsoft Edge TTS - no API key required, high-quality neural voices\",\n models: {\n [ModelType.TEXT_TO_SPEECH]: async (\n runtime: IAgentRuntime,\n input: string | EdgeTTSParams,\n ): Promise<Buffer | ArrayBuffer | Uint8Array> => {\n const params: EdgeTTSParams =\n typeof input === \"string\" ? { text: input } : input;\n const settings = getEdgeTTSSettings(runtime);\n\n logger.log(\n `[EdgeTTS] Using TEXT_TO_SPEECH with voice: ${settings.voice}`,\n );\n\n if (!params.text || params.text.trim().length === 0) {\n throw new Error(\"TEXT_TO_SPEECH requires non-empty text\");\n }\n\n // Edge TTS has a practical limit around 5000 characters\n if (params.text.length > 5000) {\n throw new Error(\"TEXT_TO_SPEECH text exceeds 5000 character limit\");\n }\n\n try {\n const audioBuffer = await generateSpeech(settings, params);\n return audioBuffer;\n } catch (error: unknown) {\n const msg = error instanceof Error ? error.message : String(error);\n logger.error(`EdgeTTS model error: ${msg}`);\n throw error instanceof Error ? error : new Error(msg);\n }\n },\n },\n tests: [\n {\n name: \"test edge tts\",\n tests: [\n {\n name: \"Edge TTS settings validation\",\n fn: async (runtime: IAgentRuntime) => {\n const settings = getEdgeTTSSettings(runtime);\n\n if (!settings.voice) {\n throw new Error(\"Missing voice configuration\");\n }\n\n if (!settings.lang) {\n throw new Error(\"Missing language configuration\");\n }\n\n if (!settings.outputFormat) {\n throw new Error(\"Missing output format configuration\");\n }\n\n logger.success(\"Edge TTS settings validated successfully\");\n },\n },\n {\n name: \"Edge TTS voice preset mapping\",\n fn: async (_runtime: IAgentRuntime) => {\n // Test that OpenAI-style voice names map correctly\n const testCases = [\n { input: \"alloy\", expected: \"en-US-GuyNeural\" },\n { input: \"nova\", expected: \"en-US-JennyNeural\" },\n { input: \"shimmer\", expected: \"en-US-AriaNeural\" },\n {\n input: \"en-US-MichelleNeural\",\n expected: \"en-US-MichelleNeural\",\n },\n ];\n\n for (const tc of testCases) {\n const result = resolveVoice(tc.input, DEFAULT_VOICE);\n if (result !== tc.expected) {\n throw new Error(\n `Voice preset mapping failed: ${tc.input} -> ${result}, expected ${tc.expected}`,\n );\n }\n }\n\n logger.success(\"Voice preset mapping validated successfully\");\n },\n },\n {\n name: \"Edge TTS speed to rate conversion\",\n fn: async (_runtime: IAgentRuntime) => {\n const testCases = [\n { speed: 1.0, expected: undefined },\n { speed: 1.5, expected: \"+50%\" },\n { speed: 0.75, expected: \"-25%\" },\n { speed: 2.0, expected: \"+100%\" },\n ];\n\n for (const tc of testCases) {\n const result = speedToRate(tc.speed);\n if (result !== tc.expected) {\n throw new Error(\n `Speed conversion failed: ${tc.speed} -> ${result}, expected ${tc.expected}`,\n );\n }\n }\n\n logger.success(\"Speed to rate conversion validated successfully\");\n },\n },\n {\n name: \"Edge TTS generation (live test)\",\n fn: async (runtime: IAgentRuntime) => {\n const testText = \"Hello, this is a test of Edge TTS.\";\n\n try {\n const audioBuffer = (await runtime.useModel(\n ModelType.TEXT_TO_SPEECH,\n testText,\n )) as Buffer | Uint8Array;\n\n if (!audioBuffer || audioBuffer.length === 0) {\n throw new Error(\"Received empty audio buffer\");\n }\n\n logger.success(\n `Edge TTS generation successful: ${audioBuffer.length} bytes`,\n );\n } catch (error: unknown) {\n const msg =\n error instanceof Error ? error.message : String(error);\n // Edge TTS might fail in CI environments without network\n if (msg.includes(\"ENOTFOUND\") || msg.includes(\"network\")) {\n logger.warn(\n `Edge TTS live test skipped (network unavailable): ${msg}`,\n );\n return;\n }\n throw error;\n }\n },\n },\n ],\n },\n ],\n};\n\nexport default edgeTTSPlugin;\n\n// Re-export types\nexport type { EdgeTTSSettings, EdgeTTSParams };\n\n// Export helper functions for testing\nexport const _test = {\n resolveVoice,\n speedToRate,\n inferExtension,\n getEdgeTTSSettings,\n};\n"
|
|
5
|
+
"import { mkdtempSync, readFileSync, rmSync } from \"node:fs\";\nimport { tmpdir } from \"node:os\";\nimport path from \"node:path\";\nimport { type IAgentRuntime, logger, ModelType, type Plugin } from \"@elizaos/core\";\nimport { EdgeTTS } from \"node-edge-tts\";\n\n/**\n * Edge TTS voice settings configuration\n */\ninterface EdgeTTSSettings {\n voice: string;\n lang: string;\n outputFormat: string;\n rate?: string;\n pitch?: string;\n volume?: string;\n proxy?: string;\n timeoutMs: number;\n}\n\n/**\n * Extended TTS params with Edge-specific options\n */\ninterface EdgeTTSParams {\n text: string;\n voice?: string;\n speed?: number;\n /** Edge TTS specific: language code */\n lang?: string;\n /** Edge TTS specific: output format */\n outputFormat?: string;\n /** Edge TTS specific: rate adjustment (e.g., +10%, -5%) */\n rate?: string;\n /** Edge TTS specific: pitch adjustment (e.g., +5Hz, -10Hz) */\n pitch?: string;\n /** Edge TTS specific: volume adjustment (e.g., +20%, -10%) */\n volume?: string;\n}\n\n// Default voice configurations\nconst DEFAULT_VOICE = \"en-US-MichelleNeural\";\nconst DEFAULT_LANG = \"en-US\";\nconst DEFAULT_OUTPUT_FORMAT = \"audio-24khz-48kbitrate-mono-mp3\";\nconst DEFAULT_TIMEOUT_MS = 30000;\n\n// Voice presets mapping common voice names to Edge TTS voices\nconst VOICE_PRESETS: Record<string, string> = {\n // Generic voices (map to good defaults)\n alloy: \"en-US-GuyNeural\",\n echo: \"en-US-ChristopherNeural\",\n fable: \"en-GB-RyanNeural\",\n onyx: \"en-US-DavisNeural\",\n nova: \"en-US-JennyNeural\",\n shimmer: \"en-US-AriaNeural\",\n // Direct Edge TTS voice names pass through\n};\n\nfunction getSetting(runtime: IAgentRuntime, key: string, fallback?: string): string | undefined {\n const envValue =\n typeof process !== \"undefined\" && (process as { env?: Record<string, string> }).env\n ? (process as { env: Record<string, string> }).env[key]\n : undefined;\n return (runtime.getSetting(key) as string | undefined) ?? envValue ?? fallback;\n}\n\nfunction getEdgeTTSSettings(runtime: IAgentRuntime): EdgeTTSSettings {\n const timeoutStr = getSetting(runtime, \"EDGE_TTS_TIMEOUT_MS\");\n return {\n voice: getSetting(runtime, \"EDGE_TTS_VOICE\", DEFAULT_VOICE) ?? DEFAULT_VOICE,\n lang: getSetting(runtime, \"EDGE_TTS_LANG\", DEFAULT_LANG) ?? DEFAULT_LANG,\n outputFormat:\n getSetting(runtime, \"EDGE_TTS_OUTPUT_FORMAT\", DEFAULT_OUTPUT_FORMAT) ?? DEFAULT_OUTPUT_FORMAT,\n rate: getSetting(runtime, \"EDGE_TTS_RATE\"),\n pitch: getSetting(runtime, \"EDGE_TTS_PITCH\"),\n volume: getSetting(runtime, \"EDGE_TTS_VOLUME\"),\n proxy: getSetting(runtime, \"EDGE_TTS_PROXY\"),\n timeoutMs: timeoutStr ? Number.parseInt(timeoutStr, 10) : DEFAULT_TIMEOUT_MS,\n };\n}\n\n/**\n * Resolve voice name - handles OpenAI-style voice names and Edge TTS voice IDs\n */\nfunction resolveVoice(voice: string | undefined, defaultVoice: string): string {\n if (!voice) return defaultVoice;\n\n // Check if it's a preset name\n const preset = VOICE_PRESETS[voice.toLowerCase()];\n if (preset) return preset;\n\n // Assume it's a direct Edge TTS voice ID\n return voice;\n}\n\n/**\n * Convert speed multiplier to Edge TTS rate string\n * speed: 1.0 = normal, 0.5 = half speed, 2.0 = double speed\n */\nfunction speedToRate(speed: number | undefined): string | undefined {\n if (speed === undefined || speed === 1.0) return undefined;\n const percentage = Math.round((speed - 1) * 100);\n return percentage >= 0 ? `+${percentage}%` : `${percentage}%`;\n}\n\n/**\n * Infer file extension from Edge TTS output format\n */\nfunction inferExtension(outputFormat: string): string {\n const normalized = outputFormat.toLowerCase();\n if (normalized.includes(\"webm\")) return \".webm\";\n if (normalized.includes(\"ogg\")) return \".ogg\";\n if (normalized.includes(\"opus\")) return \".opus\";\n if (normalized.includes(\"wav\") || normalized.includes(\"riff\") || normalized.includes(\"pcm\")) {\n return \".wav\";\n }\n return \".mp3\";\n}\n\n/**\n * Generate speech using Microsoft Edge TTS\n */\nasync function generateSpeech(settings: EdgeTTSSettings, params: EdgeTTSParams): Promise<Buffer> {\n const voice = resolveVoice(params.voice, settings.voice);\n const lang = params.lang ?? settings.lang;\n const outputFormat = params.outputFormat ?? settings.outputFormat;\n const rate = params.rate ?? speedToRate(params.speed) ?? settings.rate;\n const pitch = params.pitch ?? settings.pitch;\n const volume = params.volume ?? settings.volume;\n\n logger.debug(`[EdgeTTS] Generating speech with voice: ${voice}, lang: ${lang}`);\n\n const tts = new EdgeTTS({\n voice,\n lang,\n outputFormat,\n saveSubtitles: false,\n proxy: settings.proxy,\n rate,\n pitch,\n volume,\n timeout: settings.timeoutMs,\n });\n\n // Create temp directory for output\n const tempDir = mkdtempSync(path.join(tmpdir(), \"edge-tts-\"));\n const extension = inferExtension(outputFormat);\n const outputPath = path.join(tempDir, `speech${extension}`);\n\n try {\n await tts.ttsPromise(params.text, outputPath);\n const audioBuffer = readFileSync(outputPath);\n return audioBuffer;\n } finally {\n // Cleanup temp directory\n try {\n rmSync(tempDir, { recursive: true, force: true });\n } catch {\n // Ignore cleanup errors\n }\n }\n}\n\n/**\n * Edge TTS Plugin for ElizaOS\n *\n * Provides free text-to-speech synthesis using Microsoft Edge's TTS service.\n * No API key required - uses the same TTS engine as Microsoft Edge browser.\n *\n * Features:\n * - High-quality neural voices\n * - Multiple languages and locales\n * - Adjustable rate, pitch, and volume\n * - No API key or payment required\n *\n * Optional environment variables:\n * - EDGE_TTS_VOICE: Voice ID (default: en-US-MichelleNeural)\n * - EDGE_TTS_LANG: Language code (default: en-US)\n * - EDGE_TTS_OUTPUT_FORMAT: Output format (default: audio-24khz-48kbitrate-mono-mp3)\n * - EDGE_TTS_RATE: Speech rate adjustment (e.g., +10%, -5%)\n * - EDGE_TTS_PITCH: Pitch adjustment (e.g., +5Hz, -10Hz)\n * - EDGE_TTS_VOLUME: Volume adjustment (e.g., +20%, -10%)\n * - EDGE_TTS_PROXY: HTTP proxy URL\n * - EDGE_TTS_TIMEOUT_MS: Request timeout (default: 30000)\n *\n * Popular voices:\n * - en-US-MichelleNeural (female, US English)\n * - en-US-GuyNeural (male, US English)\n * - en-US-JennyNeural (female, US English)\n * - en-US-AriaNeural (female, US English)\n * - en-GB-SoniaNeural (female, UK English)\n * - en-GB-RyanNeural (male, UK English)\n * - de-DE-KatjaNeural (female, German)\n * - fr-FR-DeniseNeural (female, French)\n * - es-ES-ElviraNeural (female, Spanish)\n * - ja-JP-NanamiNeural (female, Japanese)\n * - zh-CN-XiaoxiaoNeural (female, Chinese)\n */\nexport const edgeTTSPlugin: Plugin = {\n name: \"edge-tts\",\n description:\n \"Free text-to-speech synthesis using Microsoft Edge TTS - no API key required, high-quality neural voices\",\n models: {\n [ModelType.TEXT_TO_SPEECH]: async (\n runtime: IAgentRuntime,\n input: string | EdgeTTSParams\n ): Promise<Buffer | ArrayBuffer | Uint8Array> => {\n const params: EdgeTTSParams = typeof input === \"string\" ? { text: input } : input;\n const settings = getEdgeTTSSettings(runtime);\n\n logger.log(`[EdgeTTS] Using TEXT_TO_SPEECH with voice: ${settings.voice}`);\n\n if (!params.text || params.text.trim().length === 0) {\n throw new Error(\"TEXT_TO_SPEECH requires non-empty text\");\n }\n\n // Edge TTS has a practical limit around 5000 characters\n if (params.text.length > 5000) {\n throw new Error(\"TEXT_TO_SPEECH text exceeds 5000 character limit\");\n }\n\n try {\n const audioBuffer = await generateSpeech(settings, params);\n return audioBuffer;\n } catch (error: unknown) {\n const msg = error instanceof Error ? error.message : String(error);\n logger.error(`EdgeTTS model error: ${msg}`);\n throw error instanceof Error ? error : new Error(msg);\n }\n },\n },\n tests: [\n {\n name: \"test edge tts\",\n tests: [\n {\n name: \"Edge TTS settings validation\",\n fn: async (runtime: IAgentRuntime) => {\n const settings = getEdgeTTSSettings(runtime);\n\n if (!settings.voice) {\n throw new Error(\"Missing voice configuration\");\n }\n\n if (!settings.lang) {\n throw new Error(\"Missing language configuration\");\n }\n\n if (!settings.outputFormat) {\n throw new Error(\"Missing output format configuration\");\n }\n\n logger.success(\"Edge TTS settings validated successfully\");\n },\n },\n {\n name: \"Edge TTS voice preset mapping\",\n fn: async (_runtime: IAgentRuntime) => {\n // Test that OpenAI-style voice names map correctly\n const testCases = [\n { input: \"alloy\", expected: \"en-US-GuyNeural\" },\n { input: \"nova\", expected: \"en-US-JennyNeural\" },\n { input: \"shimmer\", expected: \"en-US-AriaNeural\" },\n {\n input: \"en-US-MichelleNeural\",\n expected: \"en-US-MichelleNeural\",\n },\n ];\n\n for (const tc of testCases) {\n const result = resolveVoice(tc.input, DEFAULT_VOICE);\n if (result !== tc.expected) {\n throw new Error(\n `Voice preset mapping failed: ${tc.input} -> ${result}, expected ${tc.expected}`\n );\n }\n }\n\n logger.success(\"Voice preset mapping validated successfully\");\n },\n },\n {\n name: \"Edge TTS speed to rate conversion\",\n fn: async (_runtime: IAgentRuntime) => {\n const testCases = [\n { speed: 1.0, expected: undefined },\n { speed: 1.5, expected: \"+50%\" },\n { speed: 0.75, expected: \"-25%\" },\n { speed: 2.0, expected: \"+100%\" },\n ];\n\n for (const tc of testCases) {\n const result = speedToRate(tc.speed);\n if (result !== tc.expected) {\n throw new Error(\n `Speed conversion failed: ${tc.speed} -> ${result}, expected ${tc.expected}`\n );\n }\n }\n\n logger.success(\"Speed to rate conversion validated successfully\");\n },\n },\n {\n name: \"Edge TTS generation (live test)\",\n fn: async (runtime: IAgentRuntime) => {\n const testText = \"Hello, this is a test of Edge TTS.\";\n\n try {\n const audioBuffer = (await runtime.useModel(ModelType.TEXT_TO_SPEECH, testText)) as\n | Buffer\n | Uint8Array;\n\n if (!audioBuffer || audioBuffer.length === 0) {\n throw new Error(\"Received empty audio buffer\");\n }\n\n logger.success(`Edge TTS generation successful: ${audioBuffer.length} bytes`);\n } catch (error: unknown) {\n const msg = error instanceof Error ? error.message : String(error);\n // Edge TTS might fail in CI environments without network\n if (msg.includes(\"ENOTFOUND\") || msg.includes(\"network\")) {\n logger.warn(`Edge TTS live test skipped (network unavailable): ${msg}`);\n return;\n }\n throw error;\n }\n },\n },\n ],\n },\n ],\n};\n\nexport default edgeTTSPlugin;\n\n// Re-export types\nexport type { EdgeTTSSettings, EdgeTTSParams };\n\n// Export helper functions for testing\nexport const _test = {\n resolveVoice,\n speedToRate,\n inferExtension,\n getEdgeTTSSettings,\n};\n"
|
|
6
6
|
],
|
|
7
|
-
"mappings": ";AAAA;
|
|
8
|
-
"debugId": "
|
|
7
|
+
"mappings": ";AAAA;AACA;AACA;AACA;AACA;AAoCA,IAAM,gBAAgB;AACtB,IAAM,eAAe;AACrB,IAAM,wBAAwB;AAC9B,IAAM,qBAAqB;AAG3B,IAAM,gBAAwC;AAAA,EAE5C,OAAO;AAAA,EACP,MAAM;AAAA,EACN,OAAO;AAAA,EACP,MAAM;AAAA,EACN,MAAM;AAAA,EACN,SAAS;AAEX;AAEA,SAAS,UAAU,CAAC,SAAwB,KAAa,UAAuC;AAAA,EAC9F,MAAM,WACJ,OAAO,YAAY,eAAgB,QAA6C,MAC3E,QAA4C,IAAI,OACjD;AAAA,EACN,OAAQ,QAAQ,WAAW,GAAG,KAA4B,YAAY;AAAA;AAGxE,SAAS,kBAAkB,CAAC,SAAyC;AAAA,EACnE,MAAM,aAAa,WAAW,SAAS,qBAAqB;AAAA,EAC5D,OAAO;AAAA,IACL,OAAO,WAAW,SAAS,kBAAkB,aAAa,KAAK;AAAA,IAC/D,MAAM,WAAW,SAAS,iBAAiB,YAAY,KAAK;AAAA,IAC5D,cACE,WAAW,SAAS,0BAA0B,qBAAqB,KAAK;AAAA,IAC1E,MAAM,WAAW,SAAS,eAAe;AAAA,IACzC,OAAO,WAAW,SAAS,gBAAgB;AAAA,IAC3C,QAAQ,WAAW,SAAS,iBAAiB;AAAA,IAC7C,OAAO,WAAW,SAAS,gBAAgB;AAAA,IAC3C,WAAW,aAAa,OAAO,SAAS,YAAY,EAAE,IAAI;AAAA,EAC5D;AAAA;AAMF,SAAS,YAAY,CAAC,OAA2B,cAA8B;AAAA,EAC7E,IAAI,CAAC;AAAA,IAAO,OAAO;AAAA,EAGnB,MAAM,SAAS,cAAc,MAAM,YAAY;AAAA,EAC/C,IAAI;AAAA,IAAQ,OAAO;AAAA,EAGnB,OAAO;AAAA;AAOT,SAAS,WAAW,CAAC,OAA+C;AAAA,EAClE,IAAI,UAAU,aAAa,UAAU;AAAA,IAAK;AAAA,EAC1C,MAAM,aAAa,KAAK,OAAO,QAAQ,KAAK,GAAG;AAAA,EAC/C,OAAO,cAAc,IAAI,IAAI,gBAAgB,GAAG;AAAA;AAMlD,SAAS,cAAc,CAAC,cAA8B;AAAA,EACpD,MAAM,aAAa,aAAa,YAAY;AAAA,EAC5C,IAAI,WAAW,SAAS,MAAM;AAAA,IAAG,OAAO;AAAA,EACxC,IAAI,WAAW,SAAS,KAAK;AAAA,IAAG,OAAO;AAAA,EACvC,IAAI,WAAW,SAAS,MAAM;AAAA,IAAG,OAAO;AAAA,EACxC,IAAI,WAAW,SAAS,KAAK,KAAK,WAAW,SAAS,MAAM,KAAK,WAAW,SAAS,KAAK,GAAG;AAAA,IAC3F,OAAO;AAAA,EACT;AAAA,EACA,OAAO;AAAA;AAMT,eAAe,cAAc,CAAC,UAA2B,QAAwC;AAAA,EAC/F,MAAM,QAAQ,aAAa,OAAO,OAAO,SAAS,KAAK;AAAA,EACvD,MAAM,OAAO,OAAO,QAAQ,SAAS;AAAA,EACrC,MAAM,eAAe,OAAO,gBAAgB,SAAS;AAAA,EACrD,MAAM,OAAO,OAAO,QAAQ,YAAY,OAAO,KAAK,KAAK,SAAS;AAAA,EAClE,MAAM,QAAQ,OAAO,SAAS,SAAS;AAAA,EACvC,MAAM,SAAS,OAAO,UAAU,SAAS;AAAA,EAEzC,OAAO,MAAM,2CAA2C,gBAAgB,MAAM;AAAA,EAE9E,MAAM,MAAM,IAAI,QAAQ;AAAA,IACtB;AAAA,IACA;AAAA,IACA;AAAA,IACA,eAAe;AAAA,IACf,OAAO,SAAS;AAAA,IAChB;AAAA,IACA;AAAA,IACA;AAAA,IACA,SAAS,SAAS;AAAA,EACpB,CAAC;AAAA,EAGD,MAAM,UAAU,YAAY,KAAK,KAAK,OAAO,GAAG,WAAW,CAAC;AAAA,EAC5D,MAAM,YAAY,eAAe,YAAY;AAAA,EAC7C,MAAM,aAAa,KAAK,KAAK,SAAS,SAAS,WAAW;AAAA,EAE1D,IAAI;AAAA,IACF,MAAM,IAAI,WAAW,OAAO,MAAM,UAAU;AAAA,IAC5C,MAAM,cAAc,aAAa,UAAU;AAAA,IAC3C,OAAO;AAAA,YACP;AAAA,IAEA,IAAI;AAAA,MACF,OAAO,SAAS,EAAE,WAAW,MAAM,OAAO,KAAK,CAAC;AAAA,MAChD,MAAM;AAAA;AAAA;AAyCL,IAAM,gBAAwB;AAAA,EACnC,MAAM;AAAA,EACN,aACE;AAAA,EACF,QAAQ;AAAA,KACL,UAAU,iBAAiB,OAC1B,SACA,UAC+C;AAAA,MAC/C,MAAM,SAAwB,OAAO,UAAU,WAAW,EAAE,MAAM,MAAM,IAAI;AAAA,MAC5E,MAAM,WAAW,mBAAmB,OAAO;AAAA,MAE3C,OAAO,IAAI,8CAA8C,SAAS,OAAO;AAAA,MAEzE,IAAI,CAAC,OAAO,QAAQ,OAAO,KAAK,KAAK,EAAE,WAAW,GAAG;AAAA,QACnD,MAAM,IAAI,MAAM,wCAAwC;AAAA,MAC1D;AAAA,MAGA,IAAI,OAAO,KAAK,SAAS,MAAM;AAAA,QAC7B,MAAM,IAAI,MAAM,kDAAkD;AAAA,MACpE;AAAA,MAEA,IAAI;AAAA,QACF,MAAM,cAAc,MAAM,eAAe,UAAU,MAAM;AAAA,QACzD,OAAO;AAAA,QACP,OAAO,OAAgB;AAAA,QACvB,MAAM,MAAM,iBAAiB,QAAQ,MAAM,UAAU,OAAO,KAAK;AAAA,QACjE,OAAO,MAAM,wBAAwB,KAAK;AAAA,QAC1C,MAAM,iBAAiB,QAAQ,QAAQ,IAAI,MAAM,GAAG;AAAA;AAAA;AAAA,EAG1D;AAAA,EACA,OAAO;AAAA,IACL;AAAA,MACE,MAAM;AAAA,MACN,OAAO;AAAA,QACL;AAAA,UACE,MAAM;AAAA,UACN,IAAI,OAAO,YAA2B;AAAA,YACpC,MAAM,WAAW,mBAAmB,OAAO;AAAA,YAE3C,IAAI,CAAC,SAAS,OAAO;AAAA,cACnB,MAAM,IAAI,MAAM,6BAA6B;AAAA,YAC/C;AAAA,YAEA,IAAI,CAAC,SAAS,MAAM;AAAA,cAClB,MAAM,IAAI,MAAM,gCAAgC;AAAA,YAClD;AAAA,YAEA,IAAI,CAAC,SAAS,cAAc;AAAA,cAC1B,MAAM,IAAI,MAAM,qCAAqC;AAAA,YACvD;AAAA,YAEA,OAAO,QAAQ,0CAA0C;AAAA;AAAA,QAE7D;AAAA,QACA;AAAA,UACE,MAAM;AAAA,UACN,IAAI,OAAO,aAA4B;AAAA,YAErC,MAAM,YAAY;AAAA,cAChB,EAAE,OAAO,SAAS,UAAU,kBAAkB;AAAA,cAC9C,EAAE,OAAO,QAAQ,UAAU,oBAAoB;AAAA,cAC/C,EAAE,OAAO,WAAW,UAAU,mBAAmB;AAAA,cACjD;AAAA,gBACE,OAAO;AAAA,gBACP,UAAU;AAAA,cACZ;AAAA,YACF;AAAA,YAEA,WAAW,MAAM,WAAW;AAAA,cAC1B,MAAM,SAAS,aAAa,GAAG,OAAO,aAAa;AAAA,cACnD,IAAI,WAAW,GAAG,UAAU;AAAA,gBAC1B,MAAM,IAAI,MACR,gCAAgC,GAAG,YAAY,oBAAoB,GAAG,UACxE;AAAA,cACF;AAAA,YACF;AAAA,YAEA,OAAO,QAAQ,6CAA6C;AAAA;AAAA,QAEhE;AAAA,QACA;AAAA,UACE,MAAM;AAAA,UACN,IAAI,OAAO,aAA4B;AAAA,YACrC,MAAM,YAAY;AAAA,cAChB,EAAE,OAAO,GAAK,UAAU,UAAU;AAAA,cAClC,EAAE,OAAO,KAAK,UAAU,OAAO;AAAA,cAC/B,EAAE,OAAO,MAAM,UAAU,OAAO;AAAA,cAChC,EAAE,OAAO,GAAK,UAAU,QAAQ;AAAA,YAClC;AAAA,YAEA,WAAW,MAAM,WAAW;AAAA,cAC1B,MAAM,SAAS,YAAY,GAAG,KAAK;AAAA,cACnC,IAAI,WAAW,GAAG,UAAU;AAAA,gBAC1B,MAAM,IAAI,MACR,4BAA4B,GAAG,YAAY,oBAAoB,GAAG,UACpE;AAAA,cACF;AAAA,YACF;AAAA,YAEA,OAAO,QAAQ,iDAAiD;AAAA;AAAA,QAEpE;AAAA,QACA;AAAA,UACE,MAAM;AAAA,UACN,IAAI,OAAO,YAA2B;AAAA,YACpC,MAAM,WAAW;AAAA,YAEjB,IAAI;AAAA,cACF,MAAM,cAAe,MAAM,QAAQ,SAAS,UAAU,gBAAgB,QAAQ;AAAA,cAI9E,IAAI,CAAC,eAAe,YAAY,WAAW,GAAG;AAAA,gBAC5C,MAAM,IAAI,MAAM,6BAA6B;AAAA,cAC/C;AAAA,cAEA,OAAO,QAAQ,mCAAmC,YAAY,cAAc;AAAA,cAC5E,OAAO,OAAgB;AAAA,cACvB,MAAM,MAAM,iBAAiB,QAAQ,MAAM,UAAU,OAAO,KAAK;AAAA,cAEjE,IAAI,IAAI,SAAS,WAAW,KAAK,IAAI,SAAS,SAAS,GAAG;AAAA,gBACxD,OAAO,KAAK,qDAAqD,KAAK;AAAA,gBACtE;AAAA,cACF;AAAA,cACA,MAAM;AAAA;AAAA;AAAA,QAGZ;AAAA,MACF;AAAA,IACF;AAAA,EACF;AACF;AAEA,IAAe;AAMR,IAAM,QAAQ;AAAA,EACnB;AAAA,EACA;AAAA,EACA;AAAA,EACA;AACF;",
|
|
8
|
+
"debugId": "72B923D58112D3ED64756E2164756E21",
|
|
9
9
|
"names": []
|
|
10
10
|
}
|
package/package.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "@elizaos/plugin-edge-tts",
|
|
3
|
-
"version": "2.0.0-alpha.
|
|
3
|
+
"version": "2.0.0-alpha.8",
|
|
4
4
|
"type": "module",
|
|
5
5
|
"main": "dist/cjs/index.node.cjs",
|
|
6
6
|
"module": "dist/node/index.node.js",
|
|
@@ -44,7 +44,7 @@
|
|
|
44
44
|
"dist"
|
|
45
45
|
],
|
|
46
46
|
"dependencies": {
|
|
47
|
-
"@elizaos/core": "
|
|
47
|
+
"@elizaos/core": "next",
|
|
48
48
|
"node-edge-tts": "^1.0.7"
|
|
49
49
|
},
|
|
50
50
|
"devDependencies": {
|
|
@@ -56,7 +56,7 @@
|
|
|
56
56
|
"scripts": {
|
|
57
57
|
"build": "bun run build.ts",
|
|
58
58
|
"dev": "bun --hot build.ts",
|
|
59
|
-
"test": "
|
|
59
|
+
"test": "npx -y vitest@4.0.18 run --passWithNoTests",
|
|
60
60
|
"clean": "rm -rf dist .turbo node_modules .turbo-tsconfig.json tsconfig.tsbuildinfo",
|
|
61
61
|
"format": "bunx @biomejs/biome format --write .",
|
|
62
62
|
"format:check": "bunx @biomejs/biome format .",
|
|
@@ -124,7 +124,7 @@
|
|
|
124
124
|
}
|
|
125
125
|
}
|
|
126
126
|
},
|
|
127
|
-
"
|
|
127
|
+
"milady": {
|
|
128
128
|
"platforms": [
|
|
129
129
|
"browser",
|
|
130
130
|
"node"
|