@framers/agentos 0.1.46 → 0.1.47
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +7 -7
- package/dist/cognitive_substrate/IGMI.d.ts +2 -0
- package/dist/cognitive_substrate/IGMI.d.ts.map +1 -1
- package/dist/cognitive_substrate/IGMI.js.map +1 -1
- package/dist/cognitive_substrate/personas/IPersonaDefinition.d.ts +2 -0
- package/dist/cognitive_substrate/personas/IPersonaDefinition.d.ts.map +1 -1
- package/dist/core/audio/AdaptiveVAD.d.ts +147 -0
- package/dist/core/audio/AdaptiveVAD.d.ts.map +1 -0
- package/dist/core/audio/AdaptiveVAD.js +239 -0
- package/dist/core/audio/AdaptiveVAD.js.map +1 -0
- package/dist/core/audio/AudioProcessor.d.ts +121 -0
- package/dist/core/audio/AudioProcessor.d.ts.map +1 -0
- package/dist/core/audio/AudioProcessor.js +299 -0
- package/dist/core/audio/AudioProcessor.js.map +1 -0
- package/dist/core/audio/EnvironmentalCalibrator.d.ts +187 -0
- package/dist/core/audio/EnvironmentalCalibrator.d.ts.map +1 -0
- package/dist/core/audio/EnvironmentalCalibrator.js +360 -0
- package/dist/core/audio/EnvironmentalCalibrator.js.map +1 -0
- package/dist/core/audio/SilenceDetector.d.ts +111 -0
- package/dist/core/audio/SilenceDetector.d.ts.map +1 -0
- package/dist/core/audio/SilenceDetector.js +178 -0
- package/dist/core/audio/SilenceDetector.js.map +1 -0
- package/dist/core/llm/IPromptEngine.d.ts +2 -0
- package/dist/core/llm/IPromptEngine.d.ts.map +1 -1
- package/dist/core/llm/IPromptEngine.js.map +1 -1
- package/dist/core/llm/providers/implementations/OpenAIProvider.d.ts.map +1 -1
- package/dist/core/llm/providers/implementations/OpenAIProvider.js +8 -1
- package/dist/core/llm/providers/implementations/OpenAIProvider.js.map +1 -1
- package/dist/extensions/ExtensionManager.d.ts.map +1 -1
- package/dist/extensions/ExtensionManager.js +9 -1
- package/dist/extensions/ExtensionManager.js.map +1 -1
- package/dist/extensions/types.d.ts +20 -2
- package/dist/extensions/types.d.ts.map +1 -1
- package/dist/extensions/types.js +4 -0
- package/dist/extensions/types.js.map +1 -1
- package/dist/index.d.ts +2 -0
- package/dist/index.d.ts.map +1 -1
- package/dist/index.js +4 -0
- package/dist/index.js.map +1 -1
- package/dist/memory/CognitiveMemoryManager.d.ts +133 -0
- package/dist/memory/CognitiveMemoryManager.d.ts.map +1 -0
- package/dist/memory/CognitiveMemoryManager.js +519 -0
- package/dist/memory/CognitiveMemoryManager.js.map +1 -0
- package/dist/memory/config.d.ts +135 -0
- package/dist/memory/config.d.ts.map +1 -0
- package/dist/memory/config.js +28 -0
- package/dist/memory/config.js.map +1 -0
- package/dist/memory/consolidation/ConsolidationPipeline.d.ts +70 -0
- package/dist/memory/consolidation/ConsolidationPipeline.d.ts.map +1 -0
- package/dist/memory/consolidation/ConsolidationPipeline.js +301 -0
- package/dist/memory/consolidation/ConsolidationPipeline.js.map +1 -0
- package/dist/memory/context/CompactionEngine.d.ts +21 -0
- package/dist/memory/context/CompactionEngine.d.ts.map +1 -0
- package/dist/memory/context/CompactionEngine.js +35 -0
- package/dist/memory/context/CompactionEngine.js.map +1 -0
- package/dist/memory/context/CompactionLog.d.ts +50 -0
- package/dist/memory/context/CompactionLog.d.ts.map +1 -0
- package/dist/memory/context/CompactionLog.js +139 -0
- package/dist/memory/context/CompactionLog.js.map +1 -0
- package/dist/memory/context/ContextWindowManager.d.ts +114 -0
- package/dist/memory/context/ContextWindowManager.d.ts.map +1 -0
- package/dist/memory/context/ContextWindowManager.js +225 -0
- package/dist/memory/context/ContextWindowManager.js.map +1 -0
- package/dist/memory/context/RollingSummaryChain.d.ts +53 -0
- package/dist/memory/context/RollingSummaryChain.d.ts.map +1 -0
- package/dist/memory/context/RollingSummaryChain.js +193 -0
- package/dist/memory/context/RollingSummaryChain.js.map +1 -0
- package/dist/memory/context/index.d.ts +15 -0
- package/dist/memory/context/index.d.ts.map +1 -0
- package/dist/memory/context/index.js +14 -0
- package/dist/memory/context/index.js.map +1 -0
- package/dist/memory/context/strategies/HierarchicalStrategy.d.ts +25 -0
- package/dist/memory/context/strategies/HierarchicalStrategy.d.ts.map +1 -0
- package/dist/memory/context/strategies/HierarchicalStrategy.js +240 -0
- package/dist/memory/context/strategies/HierarchicalStrategy.js.map +1 -0
- package/dist/memory/context/strategies/HybridStrategy.d.ts +26 -0
- package/dist/memory/context/strategies/HybridStrategy.d.ts.map +1 -0
- package/dist/memory/context/strategies/HybridStrategy.js +245 -0
- package/dist/memory/context/strategies/HybridStrategy.js.map +1 -0
- package/dist/memory/context/strategies/SlidingSummaryStrategy.d.ts +22 -0
- package/dist/memory/context/strategies/SlidingSummaryStrategy.d.ts.map +1 -0
- package/dist/memory/context/strategies/SlidingSummaryStrategy.js +203 -0
- package/dist/memory/context/strategies/SlidingSummaryStrategy.js.map +1 -0
- package/dist/memory/context/types.d.ts +120 -0
- package/dist/memory/context/types.d.ts.map +1 -0
- package/dist/memory/context/types.js +17 -0
- package/dist/memory/context/types.js.map +1 -0
- package/dist/memory/decay/DecayModel.d.ts +87 -0
- package/dist/memory/decay/DecayModel.d.ts.map +1 -0
- package/dist/memory/decay/DecayModel.js +117 -0
- package/dist/memory/decay/DecayModel.js.map +1 -0
- package/dist/memory/decay/RetrievalPriorityScorer.d.ts +63 -0
- package/dist/memory/decay/RetrievalPriorityScorer.d.ts.map +1 -0
- package/dist/memory/decay/RetrievalPriorityScorer.js +110 -0
- package/dist/memory/decay/RetrievalPriorityScorer.js.map +1 -0
- package/dist/memory/encoding/ContentFeatureDetector.d.ts +37 -0
- package/dist/memory/encoding/ContentFeatureDetector.d.ts.map +1 -0
- package/dist/memory/encoding/ContentFeatureDetector.js +176 -0
- package/dist/memory/encoding/ContentFeatureDetector.js.map +1 -0
- package/dist/memory/encoding/EncodingModel.d.ts +67 -0
- package/dist/memory/encoding/EncodingModel.d.ts.map +1 -0
- package/dist/memory/encoding/EncodingModel.js +171 -0
- package/dist/memory/encoding/EncodingModel.js.map +1 -0
- package/dist/memory/extension/CognitiveMemoryExtension.d.ts +18 -0
- package/dist/memory/extension/CognitiveMemoryExtension.d.ts.map +1 -0
- package/dist/memory/extension/CognitiveMemoryExtension.js +131 -0
- package/dist/memory/extension/CognitiveMemoryExtension.js.map +1 -0
- package/dist/memory/graph/GraphologyMemoryGraph.d.ts +29 -0
- package/dist/memory/graph/GraphologyMemoryGraph.d.ts.map +1 -0
- package/dist/memory/graph/GraphologyMemoryGraph.js +224 -0
- package/dist/memory/graph/GraphologyMemoryGraph.js.map +1 -0
- package/dist/memory/graph/IMemoryGraph.d.ts +70 -0
- package/dist/memory/graph/IMemoryGraph.d.ts.map +1 -0
- package/dist/memory/graph/IMemoryGraph.js +15 -0
- package/dist/memory/graph/IMemoryGraph.js.map +1 -0
- package/dist/memory/graph/KnowledgeGraphMemoryGraph.d.ts +38 -0
- package/dist/memory/graph/KnowledgeGraphMemoryGraph.d.ts.map +1 -0
- package/dist/memory/graph/KnowledgeGraphMemoryGraph.js +264 -0
- package/dist/memory/graph/KnowledgeGraphMemoryGraph.js.map +1 -0
- package/dist/memory/graph/SpreadingActivation.d.ts +36 -0
- package/dist/memory/graph/SpreadingActivation.d.ts.map +1 -0
- package/dist/memory/graph/SpreadingActivation.js +100 -0
- package/dist/memory/graph/SpreadingActivation.js.map +1 -0
- package/dist/memory/index.d.ts +52 -0
- package/dist/memory/index.d.ts.map +1 -0
- package/dist/memory/index.js +43 -0
- package/dist/memory/index.js.map +1 -0
- package/dist/memory/observation/MemoryObserver.d.ts +59 -0
- package/dist/memory/observation/MemoryObserver.d.ts.map +1 -0
- package/dist/memory/observation/MemoryObserver.js +136 -0
- package/dist/memory/observation/MemoryObserver.js.map +1 -0
- package/dist/memory/observation/MemoryReflector.d.ts +51 -0
- package/dist/memory/observation/MemoryReflector.d.ts.map +1 -0
- package/dist/memory/observation/MemoryReflector.js +184 -0
- package/dist/memory/observation/MemoryReflector.js.map +1 -0
- package/dist/memory/observation/ObservationBuffer.d.ts +51 -0
- package/dist/memory/observation/ObservationBuffer.d.ts.map +1 -0
- package/dist/memory/observation/ObservationBuffer.js +81 -0
- package/dist/memory/observation/ObservationBuffer.js.map +1 -0
- package/dist/memory/prompt/MemoryFormatters.d.ts +22 -0
- package/dist/memory/prompt/MemoryFormatters.d.ts.map +1 -0
- package/dist/memory/prompt/MemoryFormatters.js +113 -0
- package/dist/memory/prompt/MemoryFormatters.js.map +1 -0
- package/dist/memory/prompt/MemoryPromptAssembler.d.ts +40 -0
- package/dist/memory/prompt/MemoryPromptAssembler.d.ts.map +1 -0
- package/dist/memory/prompt/MemoryPromptAssembler.js +180 -0
- package/dist/memory/prompt/MemoryPromptAssembler.js.map +1 -0
- package/dist/memory/prospective/ProspectiveMemoryManager.d.ts +83 -0
- package/dist/memory/prospective/ProspectiveMemoryManager.d.ts.map +1 -0
- package/dist/memory/prospective/ProspectiveMemoryManager.js +128 -0
- package/dist/memory/prospective/ProspectiveMemoryManager.js.map +1 -0
- package/dist/memory/store/MemoryStore.d.ts +76 -0
- package/dist/memory/store/MemoryStore.d.ts.map +1 -0
- package/dist/memory/store/MemoryStore.js +320 -0
- package/dist/memory/store/MemoryStore.js.map +1 -0
- package/dist/memory/types.d.ts +184 -0
- package/dist/memory/types.d.ts.map +1 -0
- package/dist/memory/types.js +14 -0
- package/dist/memory/types.js.map +1 -0
- package/dist/memory/working/CognitiveWorkingMemory.d.ts +87 -0
- package/dist/memory/working/CognitiveWorkingMemory.d.ts.map +1 -0
- package/dist/memory/working/CognitiveWorkingMemory.js +230 -0
- package/dist/memory/working/CognitiveWorkingMemory.js.map +1 -0
- package/dist/rag/EmbeddingManager.d.ts.map +1 -1
- package/dist/rag/EmbeddingManager.js +8 -1
- package/dist/rag/EmbeddingManager.js.map +1 -1
- package/dist/speech/SpeechProviderRegistry.d.ts +17 -0
- package/dist/speech/SpeechProviderRegistry.d.ts.map +1 -0
- package/dist/speech/SpeechProviderRegistry.js +47 -0
- package/dist/speech/SpeechProviderRegistry.js.map +1 -0
- package/dist/speech/SpeechRuntime.d.ts +28 -0
- package/dist/speech/SpeechRuntime.d.ts.map +1 -0
- package/dist/speech/SpeechRuntime.js +138 -0
- package/dist/speech/SpeechRuntime.js.map +1 -0
- package/dist/speech/SpeechSession.d.ts +37 -0
- package/dist/speech/SpeechSession.d.ts.map +1 -0
- package/dist/speech/SpeechSession.js +285 -0
- package/dist/speech/SpeechSession.js.map +1 -0
- package/dist/speech/audio.d.ts +3 -0
- package/dist/speech/audio.d.ts.map +1 -0
- package/dist/speech/audio.js +39 -0
- package/dist/speech/audio.js.map +1 -0
- package/dist/speech/index.d.ts +11 -0
- package/dist/speech/index.d.ts.map +1 -0
- package/dist/speech/index.js +11 -0
- package/dist/speech/index.js.map +1 -0
- package/dist/speech/providerCatalog.d.ts +7 -0
- package/dist/speech/providerCatalog.d.ts.map +1 -0
- package/dist/speech/providerCatalog.js +243 -0
- package/dist/speech/providerCatalog.js.map +1 -0
- package/dist/speech/providers/BuiltInAdaptiveVadProvider.d.ts +20 -0
- package/dist/speech/providers/BuiltInAdaptiveVadProvider.d.ts.map +1 -0
- package/dist/speech/providers/BuiltInAdaptiveVadProvider.js +29 -0
- package/dist/speech/providers/BuiltInAdaptiveVadProvider.js.map +1 -0
- package/dist/speech/providers/ElevenLabsTextToSpeechProvider.d.ts +20 -0
- package/dist/speech/providers/ElevenLabsTextToSpeechProvider.d.ts.map +1 -0
- package/dist/speech/providers/ElevenLabsTextToSpeechProvider.js +95 -0
- package/dist/speech/providers/ElevenLabsTextToSpeechProvider.js.map +1 -0
- package/dist/speech/providers/OpenAITextToSpeechProvider.d.ts +20 -0
- package/dist/speech/providers/OpenAITextToSpeechProvider.d.ts.map +1 -0
- package/dist/speech/providers/OpenAITextToSpeechProvider.js +75 -0
- package/dist/speech/providers/OpenAITextToSpeechProvider.js.map +1 -0
- package/dist/speech/providers/OpenAIWhisperSpeechToTextProvider.d.ts +18 -0
- package/dist/speech/providers/OpenAIWhisperSpeechToTextProvider.d.ts.map +1 -0
- package/dist/speech/providers/OpenAIWhisperSpeechToTextProvider.js +109 -0
- package/dist/speech/providers/OpenAIWhisperSpeechToTextProvider.js.map +1 -0
- package/dist/speech/types.d.ts +270 -0
- package/dist/speech/types.d.ts.map +1 -0
- package/dist/speech/types.js +2 -0
- package/dist/speech/types.js.map +1 -0
- package/package.json +22 -2
|
@@ -0,0 +1,243 @@
|
|
|
1
|
+
export const SPEECH_PROVIDER_CATALOG = [
|
|
2
|
+
{
|
|
3
|
+
id: 'twilio',
|
|
4
|
+
kind: 'telephony',
|
|
5
|
+
label: 'Twilio',
|
|
6
|
+
envVars: ['TWILIO_ACCOUNT_SID', 'TWILIO_AUTH_TOKEN'],
|
|
7
|
+
local: false,
|
|
8
|
+
description: 'Telephony call control via Twilio programmable voice.',
|
|
9
|
+
extensionName: 'voice-twilio',
|
|
10
|
+
features: ['telephony', 'webhooks', 'media-streams'],
|
|
11
|
+
},
|
|
12
|
+
{
|
|
13
|
+
id: 'telnyx',
|
|
14
|
+
kind: 'telephony',
|
|
15
|
+
label: 'Telnyx',
|
|
16
|
+
envVars: ['TELNYX_API_KEY', 'TELNYX_CONNECTION_ID'],
|
|
17
|
+
local: false,
|
|
18
|
+
description: 'Telephony call control via Telnyx Call Control.',
|
|
19
|
+
extensionName: 'voice-telnyx',
|
|
20
|
+
features: ['telephony', 'sip', 'media-streams'],
|
|
21
|
+
},
|
|
22
|
+
{
|
|
23
|
+
id: 'plivo',
|
|
24
|
+
kind: 'telephony',
|
|
25
|
+
label: 'Plivo',
|
|
26
|
+
envVars: ['PLIVO_AUTH_ID', 'PLIVO_AUTH_TOKEN'],
|
|
27
|
+
local: false,
|
|
28
|
+
description: 'Telephony call control via the Plivo Voice API.',
|
|
29
|
+
extensionName: 'voice-plivo',
|
|
30
|
+
features: ['telephony', 'xml'],
|
|
31
|
+
},
|
|
32
|
+
{
|
|
33
|
+
id: 'openai-whisper',
|
|
34
|
+
kind: 'stt',
|
|
35
|
+
label: 'OpenAI Whisper',
|
|
36
|
+
envVars: ['OPENAI_API_KEY'],
|
|
37
|
+
local: false,
|
|
38
|
+
description: 'Hosted Whisper speech-to-text for file and utterance transcription.',
|
|
39
|
+
defaultModel: 'whisper-1',
|
|
40
|
+
streaming: false,
|
|
41
|
+
features: ['cloud', 'timestamps', 'transcription'],
|
|
42
|
+
},
|
|
43
|
+
{
|
|
44
|
+
id: 'deepgram',
|
|
45
|
+
kind: 'stt',
|
|
46
|
+
label: 'Deepgram',
|
|
47
|
+
envVars: ['DEEPGRAM_API_KEY'],
|
|
48
|
+
local: false,
|
|
49
|
+
description: 'Streaming-first speech-to-text for live conversations.',
|
|
50
|
+
streaming: true,
|
|
51
|
+
features: ['cloud', 'streaming'],
|
|
52
|
+
},
|
|
53
|
+
{
|
|
54
|
+
id: 'assemblyai',
|
|
55
|
+
kind: 'stt',
|
|
56
|
+
label: 'AssemblyAI',
|
|
57
|
+
envVars: ['ASSEMBLYAI_API_KEY'],
|
|
58
|
+
local: false,
|
|
59
|
+
description: 'Hosted speech-to-text with diarization and analytics.',
|
|
60
|
+
streaming: true,
|
|
61
|
+
features: ['cloud', 'streaming', 'diarization'],
|
|
62
|
+
},
|
|
63
|
+
{
|
|
64
|
+
id: 'google-cloud-stt',
|
|
65
|
+
kind: 'stt',
|
|
66
|
+
label: 'Google Cloud STT',
|
|
67
|
+
envVars: ['GOOGLE_STT_CREDENTIALS'],
|
|
68
|
+
local: false,
|
|
69
|
+
description: 'Google Cloud speech recognition.',
|
|
70
|
+
streaming: true,
|
|
71
|
+
features: ['cloud', 'streaming'],
|
|
72
|
+
},
|
|
73
|
+
{
|
|
74
|
+
id: 'azure-speech-stt',
|
|
75
|
+
kind: 'stt',
|
|
76
|
+
label: 'Azure Speech STT',
|
|
77
|
+
envVars: ['AZURE_SPEECH_KEY', 'AZURE_SPEECH_REGION'],
|
|
78
|
+
local: false,
|
|
79
|
+
description: 'Azure speech recognition for batch and live transcription.',
|
|
80
|
+
streaming: true,
|
|
81
|
+
features: ['cloud', 'streaming'],
|
|
82
|
+
},
|
|
83
|
+
{
|
|
84
|
+
id: 'whisper-local',
|
|
85
|
+
kind: 'stt',
|
|
86
|
+
label: 'Whisper.cpp',
|
|
87
|
+
envVars: [],
|
|
88
|
+
local: true,
|
|
89
|
+
description: 'Local Whisper.cpp offline transcription.',
|
|
90
|
+
features: ['local', 'offline'],
|
|
91
|
+
},
|
|
92
|
+
{
|
|
93
|
+
id: 'vosk',
|
|
94
|
+
kind: 'stt',
|
|
95
|
+
label: 'Vosk',
|
|
96
|
+
envVars: [],
|
|
97
|
+
local: true,
|
|
98
|
+
description: 'Local streaming speech recognition via Vosk.',
|
|
99
|
+
streaming: true,
|
|
100
|
+
features: ['local', 'offline', 'streaming'],
|
|
101
|
+
},
|
|
102
|
+
{
|
|
103
|
+
id: 'nvidia-nemo',
|
|
104
|
+
kind: 'stt',
|
|
105
|
+
label: 'NVIDIA NeMo',
|
|
106
|
+
envVars: [],
|
|
107
|
+
local: true,
|
|
108
|
+
description: 'Local/offline ASR via NVIDIA NeMo.',
|
|
109
|
+
features: ['local', 'offline'],
|
|
110
|
+
},
|
|
111
|
+
{
|
|
112
|
+
id: 'openai-tts',
|
|
113
|
+
kind: 'tts',
|
|
114
|
+
label: 'OpenAI TTS',
|
|
115
|
+
envVars: ['OPENAI_API_KEY'],
|
|
116
|
+
local: false,
|
|
117
|
+
streaming: true,
|
|
118
|
+
description: 'Hosted speech synthesis via OpenAI speech models.',
|
|
119
|
+
defaultModel: 'tts-1',
|
|
120
|
+
defaultVoice: 'nova',
|
|
121
|
+
features: ['cloud', 'tts'],
|
|
122
|
+
},
|
|
123
|
+
{
|
|
124
|
+
id: 'elevenlabs',
|
|
125
|
+
kind: 'tts',
|
|
126
|
+
label: 'ElevenLabs',
|
|
127
|
+
envVars: ['ELEVENLABS_API_KEY'],
|
|
128
|
+
local: false,
|
|
129
|
+
streaming: true,
|
|
130
|
+
description: 'High-quality neural TTS with voice cloning.',
|
|
131
|
+
extensionName: 'voice-synthesis',
|
|
132
|
+
defaultModel: 'eleven_multilingual_v2',
|
|
133
|
+
features: ['cloud', 'tts', 'voice-cloning'],
|
|
134
|
+
},
|
|
135
|
+
{
|
|
136
|
+
id: 'google-cloud-tts',
|
|
137
|
+
kind: 'tts',
|
|
138
|
+
label: 'Google Cloud TTS',
|
|
139
|
+
envVars: ['GOOGLE_TTS_CREDENTIALS'],
|
|
140
|
+
local: false,
|
|
141
|
+
description: 'Google Cloud neural text-to-speech.',
|
|
142
|
+
features: ['cloud', 'tts'],
|
|
143
|
+
},
|
|
144
|
+
{
|
|
145
|
+
id: 'amazon-polly',
|
|
146
|
+
kind: 'tts',
|
|
147
|
+
label: 'Amazon Polly',
|
|
148
|
+
envVars: ['AWS_ACCESS_KEY_ID', 'AWS_SECRET_ACCESS_KEY'],
|
|
149
|
+
local: false,
|
|
150
|
+
streaming: true,
|
|
151
|
+
description: 'Amazon Polly neural text-to-speech.',
|
|
152
|
+
features: ['cloud', 'tts'],
|
|
153
|
+
},
|
|
154
|
+
{
|
|
155
|
+
id: 'azure-speech-tts',
|
|
156
|
+
kind: 'tts',
|
|
157
|
+
label: 'Azure Speech TTS',
|
|
158
|
+
envVars: ['AZURE_SPEECH_KEY', 'AZURE_SPEECH_REGION'],
|
|
159
|
+
local: false,
|
|
160
|
+
streaming: true,
|
|
161
|
+
description: 'Azure neural text-to-speech.',
|
|
162
|
+
features: ['cloud', 'tts'],
|
|
163
|
+
},
|
|
164
|
+
{
|
|
165
|
+
id: 'piper',
|
|
166
|
+
kind: 'tts',
|
|
167
|
+
label: 'Piper',
|
|
168
|
+
envVars: [],
|
|
169
|
+
local: true,
|
|
170
|
+
description: 'Offline local TTS via Piper.',
|
|
171
|
+
features: ['local', 'offline', 'tts'],
|
|
172
|
+
},
|
|
173
|
+
{
|
|
174
|
+
id: 'coqui',
|
|
175
|
+
kind: 'tts',
|
|
176
|
+
label: 'Coqui XTTS',
|
|
177
|
+
envVars: [],
|
|
178
|
+
local: true,
|
|
179
|
+
streaming: true,
|
|
180
|
+
description: 'Local XTTS / Coqui speech synthesis.',
|
|
181
|
+
features: ['local', 'tts', 'voice-cloning'],
|
|
182
|
+
},
|
|
183
|
+
{
|
|
184
|
+
id: 'bark',
|
|
185
|
+
kind: 'tts',
|
|
186
|
+
label: 'Bark',
|
|
187
|
+
envVars: [],
|
|
188
|
+
local: true,
|
|
189
|
+
description: 'Local Bark expressive speech synthesis.',
|
|
190
|
+
features: ['local', 'tts'],
|
|
191
|
+
},
|
|
192
|
+
{
|
|
193
|
+
id: 'styletts2',
|
|
194
|
+
kind: 'tts',
|
|
195
|
+
label: 'StyleTTS2',
|
|
196
|
+
envVars: [],
|
|
197
|
+
local: true,
|
|
198
|
+
description: 'Local StyleTTS2 expressive speech synthesis.',
|
|
199
|
+
features: ['local', 'tts'],
|
|
200
|
+
},
|
|
201
|
+
{
|
|
202
|
+
id: 'agentos-adaptive-vad',
|
|
203
|
+
kind: 'vad',
|
|
204
|
+
label: 'AgentOS Adaptive VAD',
|
|
205
|
+
envVars: [],
|
|
206
|
+
local: true,
|
|
207
|
+
description: 'Built-in adaptive VAD backed by environmental calibration.',
|
|
208
|
+
features: ['local', 'vad', 'adaptive'],
|
|
209
|
+
},
|
|
210
|
+
{
|
|
211
|
+
id: 'porcupine',
|
|
212
|
+
kind: 'wake-word',
|
|
213
|
+
label: 'Porcupine',
|
|
214
|
+
envVars: ['PICOVOICE_ACCESS_KEY'],
|
|
215
|
+
local: true,
|
|
216
|
+
description: 'Wake-word detection via Picovoice Porcupine.',
|
|
217
|
+
features: ['local', 'wake-word'],
|
|
218
|
+
},
|
|
219
|
+
{
|
|
220
|
+
id: 'openwakeword',
|
|
221
|
+
kind: 'wake-word',
|
|
222
|
+
label: 'OpenWakeWord',
|
|
223
|
+
envVars: [],
|
|
224
|
+
local: true,
|
|
225
|
+
description: 'Wake-word detection via OpenWakeWord.',
|
|
226
|
+
features: ['local', 'wake-word'],
|
|
227
|
+
},
|
|
228
|
+
];
|
|
229
|
+
export function getSpeechProviderCatalog(kind) {
|
|
230
|
+
if (!kind)
|
|
231
|
+
return [...SPEECH_PROVIDER_CATALOG];
|
|
232
|
+
return SPEECH_PROVIDER_CATALOG.filter((entry) => entry.kind === kind);
|
|
233
|
+
}
|
|
234
|
+
export function getSpeechProviderKinds() {
|
|
235
|
+
return ['telephony', 'stt', 'tts', 'vad', 'wake-word'];
|
|
236
|
+
}
|
|
237
|
+
export function findSpeechProviderCatalogEntry(id) {
|
|
238
|
+
return SPEECH_PROVIDER_CATALOG.find((entry) => entry.id === id);
|
|
239
|
+
}
|
|
240
|
+
export function isSpeechProviderConfigured(entry, env = process.env) {
|
|
241
|
+
return entry.local || entry.envVars.every((envVar) => Boolean(env[envVar]));
|
|
242
|
+
}
|
|
243
|
+
//# sourceMappingURL=providerCatalog.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"providerCatalog.js","sourceRoot":"","sources":["../../src/speech/providerCatalog.ts"],"names":[],"mappings":"AAEA,MAAM,CAAC,MAAM,uBAAuB,GAA0C;IAC5E;QACE,EAAE,EAAE,QAAQ;QACZ,IAAI,EAAE,WAAW;QACjB,KAAK,EAAE,QAAQ;QACf,OAAO,EAAE,CAAC,oBAAoB,EAAE,mBAAmB,CAAC;QACpD,KAAK,EAAE,KAAK;QACZ,WAAW,EAAE,uDAAuD;QACpE,aAAa,EAAE,cAAc;QAC7B,QAAQ,EAAE,CAAC,WAAW,EAAE,UAAU,EAAE,eAAe,CAAC;KACrD;IACD;QACE,EAAE,EAAE,QAAQ;QACZ,IAAI,EAAE,WAAW;QACjB,KAAK,EAAE,QAAQ;QACf,OAAO,EAAE,CAAC,gBAAgB,EAAE,sBAAsB,CAAC;QACnD,KAAK,EAAE,KAAK;QACZ,WAAW,EAAE,iDAAiD;QAC9D,aAAa,EAAE,cAAc;QAC7B,QAAQ,EAAE,CAAC,WAAW,EAAE,KAAK,EAAE,eAAe,CAAC;KAChD;IACD;QACE,EAAE,EAAE,OAAO;QACX,IAAI,EAAE,WAAW;QACjB,KAAK,EAAE,OAAO;QACd,OAAO,EAAE,CAAC,eAAe,EAAE,kBAAkB,CAAC;QAC9C,KAAK,EAAE,KAAK;QACZ,WAAW,EAAE,iDAAiD;QAC9D,aAAa,EAAE,aAAa;QAC5B,QAAQ,EAAE,CAAC,WAAW,EAAE,KAAK,CAAC;KAC/B;IACD;QACE,EAAE,EAAE,gBAAgB;QACpB,IAAI,EAAE,KAAK;QACX,KAAK,EAAE,gBAAgB;QACvB,OAAO,EAAE,CAAC,gBAAgB,CAAC;QAC3B,KAAK,EAAE,KAAK;QACZ,WAAW,EAAE,qEAAqE;QAClF,YAAY,EAAE,WAAW;QACzB,SAAS,EAAE,KAAK;QAChB,QAAQ,EAAE,CAAC,OAAO,EAAE,YAAY,EAAE,eAAe,CAAC;KACnD;IACD;QACE,EAAE,EAAE,UAAU;QACd,IAAI,EAAE,KAAK;QACX,KAAK,EAAE,UAAU;QACjB,OAAO,EAAE,CAAC,kBAAkB,CAAC;QAC7B,KAAK,EAAE,KAAK;QACZ,WAAW,EAAE,wDAAwD;QACrE,SAAS,EAAE,IAAI;QACf,QAAQ,EAAE,CAAC,OAAO,EAAE,WAAW,CAAC;KACjC;IACD;QACE,EAAE,EAAE,YAAY;QAChB,IAAI,EAAE,KAAK;QACX,KAAK,EAAE,YAAY;QACnB,OAAO,EAAE,CAAC,oBAAoB,CAAC;QAC/B,KAAK,EAAE,KAAK;QACZ,WAAW,EAAE,uDAAuD;QACpE,SAAS,EAAE,IAAI;QACf,QAAQ,EAAE,CAAC,OAAO,EAAE,WAAW,EAAE,aAAa,CAAC;KAChD;IACD;QACE,EAAE,EAAE,kBAAkB;QACtB,IAAI,EAAE,KAAK;QACX,KAAK,EAAE,kBAAkB;QACzB,OAAO,EAAE,CAAC,wBAAwB,CAAC;QACnC,KAAK,EAAE,KAAK;QACZ,WAAW,EAAE,kCAAkC;QAC/C,SAAS,EAAE,IAAI;QACf,QAAQ,EAAE,CAAC,OAAO,EAAE,WAAW,CAAC;KACjC;IACD;QACE,EAAE,EAAE,kBAAkB;QACtB,IAAI,EAAE,KAAK;QACX,KAAK,EAAE,kBAAkB;QACzB,OAAO,EAAE,CAAC,kBAAkB,EAAE,qBAAqB,CAAC;QACpD,KAAK,EAAE,KAAK;QACZ,WAAW,EAAE,4DAA4D;QACzE,SAAS,EAAE,IAAI;QACf,QAAQ,EAAE,CAAC,OAAO,EAAE,WAAW,CAAC;KACjC;IACD;QACE,EAAE,EAAE,eAAe;QACnB,IAAI,EAAE,KAAK;QACX,KAAK,EAAE,aAAa;QACpB,OAAO,EAAE,EAAE;QACX,KAAK,EAAE,IAAI;QACX,WAAW,EAAE,0CAA0C;QACvD,QAAQ,EAAE,CAAC,OAAO,EAAE,SAAS,CAAC;KAC/B;IACD;QACE,EAAE,EAAE,MAAM;QACV,IAAI,EAAE,KAAK;QACX,KAAK,EAAE,MAAM;QACb,OAAO,EAAE,EAAE;QACX,KAAK,EAAE,IAAI;QACX,WAAW,EAAE,8CAA8C;QAC3D,SAAS,EAAE,IAAI;QACf,QAAQ,EAAE,CAAC,OAAO,EAAE,SAAS,EAAE,WAAW,CAAC;KAC5C;IACD;QACE,EAAE,EAAE,aAAa;QACjB,IAAI,EAAE,KAAK;QACX,KAAK,EAAE,aAAa;QACpB,OAAO,EAAE,EAAE;QACX,KAAK,EAAE,IAAI;QACX,WAAW,EAAE,oCAAoC;QACjD,QAAQ,EAAE,CAAC,OAAO,EAAE,SAAS,CAAC;KAC/B;IACD;QACE,EAAE,EAAE,YAAY;QAChB,IAAI,EAAE,KAAK;QACX,KAAK,EAAE,YAAY;QACnB,OAAO,EAAE,CAAC,gBAAgB,CAAC;QAC3B,KAAK,EAAE,KAAK;QACZ,SAAS,EAAE,IAAI;QACf,WAAW,EAAE,mDAAmD;QAChE,YAAY,EAAE,OAAO;QACrB,YAAY,EAAE,MAAM;QACpB,QAAQ,EAAE,CAAC,OAAO,EAAE,KAAK,CAAC;KAC3B;IACD;QACE,EAAE,EAAE,YAAY;QAChB,IAAI,EAAE,KAAK;QACX,KAAK,EAAE,YAAY;QACnB,OAAO,EAAE,CAAC,oBAAoB,CAAC;QAC/B,KAAK,EAAE,KAAK;QACZ,SAAS,EAAE,IAAI;QACf,WAAW,EAAE,6CAA6C;QAC1D,aAAa,EAAE,iBAAiB;QAChC,YAAY,EAAE,wBAAwB;QACtC,QAAQ,EAAE,CAAC,OAAO,EAAE,KAAK,EAAE,eAAe,CAAC;KAC5C;IACD;QACE,EAAE,EAAE,kBAAkB;QACtB,IAAI,EAAE,KAAK;QACX,KAAK,EAAE,kBAAkB;QACzB,OAAO,EAAE,CAAC,wBAAwB,CAAC;QACnC,KAAK,EAAE,KAAK;QACZ,WAAW,EAAE,qCAAqC;QAClD,QAAQ,EAAE,CAAC,OAAO,EAAE,KAAK,CAAC;KAC3B;IACD;QACE,EAAE,EAAE,cAAc;QAClB,IAAI,EAAE,KAAK;QACX,KAAK,EAAE,cAAc;QACrB,OAAO,EAAE,CAAC,mBAAmB,EAAE,uBAAuB,CAAC;QACvD,KAAK,EAAE,KAAK;QACZ,SAAS,EAAE,IAAI;QACf,WAAW,EAAE,qCAAqC;QAClD,QAAQ,EAAE,CAAC,OAAO,EAAE,KAAK,CAAC;KAC3B;IACD;QACE,EAAE,EAAE,kBAAkB;QACtB,IAAI,EAAE,KAAK;QACX,KAAK,EAAE,kBAAkB;QACzB,OAAO,EAAE,CAAC,kBAAkB,EAAE,qBAAqB,CAAC;QACpD,KAAK,EAAE,KAAK;QACZ,SAAS,EAAE,IAAI;QACf,WAAW,EAAE,8BAA8B;QAC3C,QAAQ,EAAE,CAAC,OAAO,EAAE,KAAK,CAAC;KAC3B;IACD;QACE,EAAE,EAAE,OAAO;QACX,IAAI,EAAE,KAAK;QACX,KAAK,EAAE,OAAO;QACd,OAAO,EAAE,EAAE;QACX,KAAK,EAAE,IAAI;QACX,WAAW,EAAE,8BAA8B;QAC3C,QAAQ,EAAE,CAAC,OAAO,EAAE,SAAS,EAAE,KAAK,CAAC;KACtC;IACD;QACE,EAAE,EAAE,OAAO;QACX,IAAI,EAAE,KAAK;QACX,KAAK,EAAE,YAAY;QACnB,OAAO,EAAE,EAAE;QACX,KAAK,EAAE,IAAI;QACX,SAAS,EAAE,IAAI;QACf,WAAW,EAAE,sCAAsC;QACnD,QAAQ,EAAE,CAAC,OAAO,EAAE,KAAK,EAAE,eAAe,CAAC;KAC5C;IACD;QACE,EAAE,EAAE,MAAM;QACV,IAAI,EAAE,KAAK;QACX,KAAK,EAAE,MAAM;QACb,OAAO,EAAE,EAAE;QACX,KAAK,EAAE,IAAI;QACX,WAAW,EAAE,yCAAyC;QACtD,QAAQ,EAAE,CAAC,OAAO,EAAE,KAAK,CAAC;KAC3B;IACD;QACE,EAAE,EAAE,WAAW;QACf,IAAI,EAAE,KAAK;QACX,KAAK,EAAE,WAAW;QAClB,OAAO,EAAE,EAAE;QACX,KAAK,EAAE,IAAI;QACX,WAAW,EAAE,8CAA8C;QAC3D,QAAQ,EAAE,CAAC,OAAO,EAAE,KAAK,CAAC;KAC3B;IACD;QACE,EAAE,EAAE,sBAAsB;QAC1B,IAAI,EAAE,KAAK;QACX,KAAK,EAAE,sBAAsB;QAC7B,OAAO,EAAE,EAAE;QACX,KAAK,EAAE,IAAI;QACX,WAAW,EAAE,4DAA4D;QACzE,QAAQ,EAAE,CAAC,OAAO,EAAE,KAAK,EAAE,UAAU,CAAC;KACvC;IACD;QACE,EAAE,EAAE,WAAW;QACf,IAAI,EAAE,WAAW;QACjB,KAAK,EAAE,WAAW;QAClB,OAAO,EAAE,CAAC,sBAAsB,CAAC;QACjC,KAAK,EAAE,IAAI;QACX,WAAW,EAAE,8CAA8C;QAC3D,QAAQ,EAAE,CAAC,OAAO,EAAE,WAAW,CAAC;KACjC;IACD;QACE,EAAE,EAAE,cAAc;QAClB,IAAI,EAAE,WAAW;QACjB,KAAK,EAAE,cAAc;QACrB,OAAO,EAAE,EAAE;QACX,KAAK,EAAE,IAAI;QACX,WAAW,EAAE,uCAAuC;QACpD,QAAQ,EAAE,CAAC,OAAO,EAAE,WAAW,CAAC;KACjC;CACO,CAAC;AAEX,MAAM,UAAU,wBAAwB,CACtC,IAAyB;IAEzB,IAAI,CAAC,IAAI;QAAE,OAAO,CAAC,GAAG,uBAAuB,CAAC,CAAC;IAC/C,OAAO,uBAAuB,CAAC,MAAM,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,KAAK,CAAC,IAAI,KAAK,IAAI,CAAC,CAAC;AACxE,CAAC;AAED,MAAM,UAAU,sBAAsB;IACpC,OAAO,CAAC,WAAW,EAAE,KAAK,EAAE,KAAK,EAAE,KAAK,EAAE,WAAW,CAAC,CAAC;AACzD,CAAC;AAED,MAAM,UAAU,8BAA8B,CAC5C,EAAU;IAEV,OAAO,uBAAuB,CAAC,IAAI,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,KAAK,CAAC,EAAE,KAAK,EAAE,CAAC,CAAC;AAClE,CAAC;AAED,MAAM,UAAU,0BAA0B,CACxC,KAAiC,EACjC,MAA0C,OAAO,CAAC,GAAG;IAErD,OAAO,KAAK,CAAC,KAAK,IAAI,KAAK,CAAC,OAAO,CAAC,KAAK,CAAC,CAAC,MAAM,EAAE,EAAE,CAAC,OAAO,CAAC,GAAG,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC;AAC9E,CAAC"}
|
|
@@ -0,0 +1,20 @@
|
|
|
1
|
+
import type { AdaptiveVADConfig } from '../../core/audio/AdaptiveVAD.js';
|
|
2
|
+
import type { CalibrationConfig } from '../../core/audio/EnvironmentalCalibrator.js';
|
|
3
|
+
import type { SpeechVadDecision, SpeechVadProvider } from '../types.js';
|
|
4
|
+
export interface BuiltInAdaptiveVadProviderConfig {
|
|
5
|
+
sampleRate?: number;
|
|
6
|
+
frameDurationMs?: number;
|
|
7
|
+
calibration?: CalibrationConfig;
|
|
8
|
+
vad?: AdaptiveVADConfig;
|
|
9
|
+
}
|
|
10
|
+
export declare class BuiltInAdaptiveVadProvider implements SpeechVadProvider {
|
|
11
|
+
readonly id = "agentos-adaptive-vad";
|
|
12
|
+
readonly displayName = "AgentOS Adaptive VAD";
|
|
13
|
+
private readonly calibrator;
|
|
14
|
+
private readonly vad;
|
|
15
|
+
constructor(config?: BuiltInAdaptiveVadProviderConfig);
|
|
16
|
+
processFrame(frame: Float32Array): SpeechVadDecision;
|
|
17
|
+
reset(): void;
|
|
18
|
+
getNoiseProfile(): import("../../core/audio/EnvironmentalCalibrator.js").NoiseProfile | null;
|
|
19
|
+
}
|
|
20
|
+
//# sourceMappingURL=BuiltInAdaptiveVadProvider.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"BuiltInAdaptiveVadProvider.d.ts","sourceRoot":"","sources":["../../../src/speech/providers/BuiltInAdaptiveVadProvider.ts"],"names":[],"mappings":"AAEA,OAAO,KAAK,EACV,iBAAiB,EAClB,MAAM,iCAAiC,CAAC;AACzC,OAAO,KAAK,EAAE,iBAAiB,EAAE,MAAM,6CAA6C,CAAC;AACrF,OAAO,KAAK,EAAE,iBAAiB,EAAE,iBAAiB,EAAE,MAAM,aAAa,CAAC;AAExE,MAAM,WAAW,gCAAgC;IAC/C,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,eAAe,CAAC,EAAE,MAAM,CAAC;IACzB,WAAW,CAAC,EAAE,iBAAiB,CAAC;IAChC,GAAG,CAAC,EAAE,iBAAiB,CAAC;CACzB;AAED,qBAAa,0BAA2B,YAAW,iBAAiB;IAClE,SAAgB,EAAE,0BAA0B;IAC5C,SAAgB,WAAW,0BAA0B;IACrD,OAAO,CAAC,QAAQ,CAAC,UAAU,CAA0B;IACrD,OAAO,CAAC,QAAQ,CAAC,GAAG,CAAc;gBAEtB,MAAM,GAAE,gCAAqC;IAYzD,YAAY,CAAC,KAAK,EAAE,YAAY,GAAG,iBAAiB;IAUpD,KAAK,IAAI,IAAI;IAIb,eAAe;CAGhB"}
|
|
@@ -0,0 +1,29 @@
|
|
|
1
|
+
import { AdaptiveVAD } from '../../core/audio/AdaptiveVAD.js';
|
|
2
|
+
import { EnvironmentalCalibrator } from '../../core/audio/EnvironmentalCalibrator.js';
|
|
3
|
+
export class BuiltInAdaptiveVadProvider {
|
|
4
|
+
constructor(config = {}) {
|
|
5
|
+
this.id = 'agentos-adaptive-vad';
|
|
6
|
+
this.displayName = 'AgentOS Adaptive VAD';
|
|
7
|
+
this.calibrator = new EnvironmentalCalibrator({
|
|
8
|
+
sampleRate: config.sampleRate ?? 16000,
|
|
9
|
+
...(config.calibration ?? {}),
|
|
10
|
+
});
|
|
11
|
+
this.vad = new AdaptiveVAD(config.vad ?? {}, this.calibrator, config.frameDurationMs ?? 20);
|
|
12
|
+
}
|
|
13
|
+
processFrame(frame) {
|
|
14
|
+
const result = this.vad.processFrame(frame);
|
|
15
|
+
return {
|
|
16
|
+
isSpeech: result.isSpeech,
|
|
17
|
+
confidence: result.confidence,
|
|
18
|
+
result,
|
|
19
|
+
profile: this.calibrator.getCurrentProfile(),
|
|
20
|
+
};
|
|
21
|
+
}
|
|
22
|
+
reset() {
|
|
23
|
+
this.vad.resetState();
|
|
24
|
+
}
|
|
25
|
+
getNoiseProfile() {
|
|
26
|
+
return this.calibrator.getCurrentProfile();
|
|
27
|
+
}
|
|
28
|
+
}
|
|
29
|
+
//# sourceMappingURL=BuiltInAdaptiveVadProvider.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"BuiltInAdaptiveVadProvider.js","sourceRoot":"","sources":["../../../src/speech/providers/BuiltInAdaptiveVadProvider.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,WAAW,EAAE,MAAM,iCAAiC,CAAC;AAC9D,OAAO,EAAE,uBAAuB,EAAE,MAAM,6CAA6C,CAAC;AActF,MAAM,OAAO,0BAA0B;IAMrC,YAAY,SAA2C,EAAE;QALzC,OAAE,GAAG,sBAAsB,CAAC;QAC5B,gBAAW,GAAG,sBAAsB,CAAC;QAKnD,IAAI,CAAC,UAAU,GAAG,IAAI,uBAAuB,CAAC;YAC5C,UAAU,EAAE,MAAM,CAAC,UAAU,IAAI,KAAM;YACvC,GAAG,CAAC,MAAM,CAAC,WAAW,IAAI,EAAE,CAAC;SAC9B,CAAC,CAAC;QACH,IAAI,CAAC,GAAG,GAAG,IAAI,WAAW,CACxB,MAAM,CAAC,GAAG,IAAI,EAAE,EAChB,IAAI,CAAC,UAAU,EACf,MAAM,CAAC,eAAe,IAAI,EAAE,CAC7B,CAAC;IACJ,CAAC;IAED,YAAY,CAAC,KAAmB;QAC9B,MAAM,MAAM,GAAG,IAAI,CAAC,GAAG,CAAC,YAAY,CAAC,KAAK,CAAC,CAAC;QAC5C,OAAO;YACL,QAAQ,EAAE,MAAM,CAAC,QAAQ;YACzB,UAAU,EAAE,MAAM,CAAC,UAAU;YAC7B,MAAM;YACN,OAAO,EAAE,IAAI,CAAC,UAAU,CAAC,iBAAiB,EAAE;SAC7C,CAAC;IACJ,CAAC;IAED,KAAK;QACH,IAAI,CAAC,GAAG,CAAC,UAAU,EAAE,CAAC;IACxB,CAAC;IAED,eAAe;QACb,OAAO,IAAI,CAAC,UAAU,CAAC,iBAAiB,EAAE,CAAC;IAC7C,CAAC;CACF"}
|
|
@@ -0,0 +1,20 @@
|
|
|
1
|
+
import type { SpeechSynthesisOptions, SpeechSynthesisResult, SpeechVoice, TextToSpeechProvider } from '../types.js';
|
|
2
|
+
export interface ElevenLabsTextToSpeechProviderConfig {
|
|
3
|
+
apiKey: string;
|
|
4
|
+
baseUrl?: string;
|
|
5
|
+
voiceId?: string;
|
|
6
|
+
model?: string;
|
|
7
|
+
fetchImpl?: typeof fetch;
|
|
8
|
+
}
|
|
9
|
+
export declare class ElevenLabsTextToSpeechProvider implements TextToSpeechProvider {
|
|
10
|
+
private readonly config;
|
|
11
|
+
readonly id = "elevenlabs";
|
|
12
|
+
readonly displayName = "ElevenLabs";
|
|
13
|
+
readonly supportsStreaming = true;
|
|
14
|
+
private readonly fetchImpl;
|
|
15
|
+
constructor(config: ElevenLabsTextToSpeechProviderConfig);
|
|
16
|
+
getProviderName(): string;
|
|
17
|
+
synthesize(text: string, options?: SpeechSynthesisOptions): Promise<SpeechSynthesisResult>;
|
|
18
|
+
listAvailableVoices(): Promise<SpeechVoice[]>;
|
|
19
|
+
}
|
|
20
|
+
//# sourceMappingURL=ElevenLabsTextToSpeechProvider.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"ElevenLabsTextToSpeechProvider.d.ts","sourceRoot":"","sources":["../../../src/speech/providers/ElevenLabsTextToSpeechProvider.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EACV,sBAAsB,EACtB,qBAAqB,EACrB,WAAW,EACX,oBAAoB,EACrB,MAAM,aAAa,CAAC;AAErB,MAAM,WAAW,oCAAoC;IACnD,MAAM,EAAE,MAAM,CAAC;IACf,OAAO,CAAC,EAAE,MAAM,CAAC;IACjB,OAAO,CAAC,EAAE,MAAM,CAAC;IACjB,KAAK,CAAC,EAAE,MAAM,CAAC;IACf,SAAS,CAAC,EAAE,OAAO,KAAK,CAAC;CAC1B;AAED,qBAAa,8BAA+B,YAAW,oBAAoB;IAM7D,OAAO,CAAC,QAAQ,CAAC,MAAM;IALnC,SAAgB,EAAE,gBAAgB;IAClC,SAAgB,WAAW,gBAAgB;IAC3C,SAAgB,iBAAiB,QAAQ;IACzC,OAAO,CAAC,QAAQ,CAAC,SAAS,CAAe;gBAEZ,MAAM,EAAE,oCAAoC;IAIzE,eAAe,IAAI,MAAM;IAInB,UAAU,CACd,IAAI,EAAE,MAAM,EACZ,OAAO,GAAE,sBAA2B,GACnC,OAAO,CAAC,qBAAqB,CAAC;IA8D3B,mBAAmB,IAAI,OAAO,CAAC,WAAW,EAAE,CAAC;CAwCpD"}
|
|
@@ -0,0 +1,95 @@
|
|
|
1
|
+
export class ElevenLabsTextToSpeechProvider {
|
|
2
|
+
constructor(config) {
|
|
3
|
+
this.config = config;
|
|
4
|
+
this.id = 'elevenlabs';
|
|
5
|
+
this.displayName = 'ElevenLabs';
|
|
6
|
+
this.supportsStreaming = true;
|
|
7
|
+
this.fetchImpl = config.fetchImpl ?? fetch;
|
|
8
|
+
}
|
|
9
|
+
getProviderName() {
|
|
10
|
+
return this.displayName;
|
|
11
|
+
}
|
|
12
|
+
async synthesize(text, options = {}) {
|
|
13
|
+
const voiceId = options.voice ??
|
|
14
|
+
this.config.voiceId ??
|
|
15
|
+
(typeof options.providerSpecificOptions?.voiceId === 'string'
|
|
16
|
+
? options.providerSpecificOptions.voiceId
|
|
17
|
+
: undefined) ??
|
|
18
|
+
'EXAVITQu4vr4xnSDxMaL';
|
|
19
|
+
const model = options.model ?? this.config.model ?? 'eleven_multilingual_v2';
|
|
20
|
+
const response = await this.fetchImpl(`${this.config.baseUrl ?? 'https://api.elevenlabs.io/v1'}/text-to-speech/${voiceId}`, {
|
|
21
|
+
method: 'POST',
|
|
22
|
+
headers: {
|
|
23
|
+
'xi-api-key': this.config.apiKey,
|
|
24
|
+
'Content-Type': 'application/json',
|
|
25
|
+
Accept: 'audio/mpeg',
|
|
26
|
+
},
|
|
27
|
+
body: JSON.stringify({
|
|
28
|
+
text,
|
|
29
|
+
model_id: model,
|
|
30
|
+
voice_settings: {
|
|
31
|
+
stability: typeof options.providerSpecificOptions?.stability === 'number'
|
|
32
|
+
? options.providerSpecificOptions.stability
|
|
33
|
+
: 0.5,
|
|
34
|
+
similarity_boost: typeof options.providerSpecificOptions?.similarityBoost === 'number'
|
|
35
|
+
? options.providerSpecificOptions.similarityBoost
|
|
36
|
+
: 0.75,
|
|
37
|
+
style: typeof options.providerSpecificOptions?.style === 'number'
|
|
38
|
+
? options.providerSpecificOptions.style
|
|
39
|
+
: undefined,
|
|
40
|
+
use_speaker_boost: typeof options.providerSpecificOptions?.useSpeakerBoost === 'boolean'
|
|
41
|
+
? options.providerSpecificOptions.useSpeakerBoost
|
|
42
|
+
: true,
|
|
43
|
+
},
|
|
44
|
+
}),
|
|
45
|
+
});
|
|
46
|
+
if (!response.ok) {
|
|
47
|
+
const message = await response.text();
|
|
48
|
+
throw new Error(`ElevenLabs synthesis failed (${response.status}): ${message}`);
|
|
49
|
+
}
|
|
50
|
+
const audioBuffer = Buffer.from(await response.arrayBuffer());
|
|
51
|
+
return {
|
|
52
|
+
audioBuffer,
|
|
53
|
+
mimeType: 'audio/mpeg',
|
|
54
|
+
cost: 0,
|
|
55
|
+
voiceUsed: voiceId,
|
|
56
|
+
providerName: this.displayName,
|
|
57
|
+
usage: {
|
|
58
|
+
characters: text.length,
|
|
59
|
+
modelUsed: model,
|
|
60
|
+
},
|
|
61
|
+
};
|
|
62
|
+
}
|
|
63
|
+
async listAvailableVoices() {
|
|
64
|
+
const response = await this.fetchImpl(`${this.config.baseUrl ?? 'https://api.elevenlabs.io/v1'}/voices`, {
|
|
65
|
+
method: 'GET',
|
|
66
|
+
headers: {
|
|
67
|
+
'xi-api-key': this.config.apiKey,
|
|
68
|
+
},
|
|
69
|
+
});
|
|
70
|
+
if (!response.ok) {
|
|
71
|
+
return [];
|
|
72
|
+
}
|
|
73
|
+
const payload = (await response.json());
|
|
74
|
+
return (payload.voices ?? [])
|
|
75
|
+
.filter((voice) => typeof voice === 'object' && voice !== null)
|
|
76
|
+
.map((voice) => {
|
|
77
|
+
const labels = typeof voice.labels === 'object' && voice.labels !== null
|
|
78
|
+
? voice.labels
|
|
79
|
+
: {};
|
|
80
|
+
return {
|
|
81
|
+
id: typeof voice.voice_id === 'string' ? voice.voice_id : '',
|
|
82
|
+
name: typeof voice.name === 'string' ? voice.name : 'Unknown',
|
|
83
|
+
lang: typeof labels.accent === 'string'
|
|
84
|
+
? labels.accent
|
|
85
|
+
: typeof labels.language === 'string'
|
|
86
|
+
? labels.language
|
|
87
|
+
: 'various',
|
|
88
|
+
description: typeof voice.description === 'string' ? voice.description : undefined,
|
|
89
|
+
provider: this.id,
|
|
90
|
+
};
|
|
91
|
+
})
|
|
92
|
+
.filter((voice) => voice.id);
|
|
93
|
+
}
|
|
94
|
+
}
|
|
95
|
+
//# sourceMappingURL=ElevenLabsTextToSpeechProvider.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"ElevenLabsTextToSpeechProvider.js","sourceRoot":"","sources":["../../../src/speech/providers/ElevenLabsTextToSpeechProvider.ts"],"names":[],"mappings":"AAeA,MAAM,OAAO,8BAA8B;IAMzC,YAA6B,MAA4C;QAA5C,WAAM,GAAN,MAAM,CAAsC;QALzD,OAAE,GAAG,YAAY,CAAC;QAClB,gBAAW,GAAG,YAAY,CAAC;QAC3B,sBAAiB,GAAG,IAAI,CAAC;QAIvC,IAAI,CAAC,SAAS,GAAG,MAAM,CAAC,SAAS,IAAI,KAAK,CAAC;IAC7C,CAAC;IAED,eAAe;QACb,OAAO,IAAI,CAAC,WAAW,CAAC;IAC1B,CAAC;IAED,KAAK,CAAC,UAAU,CACd,IAAY,EACZ,UAAkC,EAAE;QAEpC,MAAM,OAAO,GACX,OAAO,CAAC,KAAK;YACb,IAAI,CAAC,MAAM,CAAC,OAAO;YACnB,CAAC,OAAO,OAAO,CAAC,uBAAuB,EAAE,OAAO,KAAK,QAAQ;gBAC3D,CAAC,CAAC,OAAO,CAAC,uBAAuB,CAAC,OAAO;gBACzC,CAAC,CAAC,SAAS,CAAC;YACd,sBAAsB,CAAC;QACzB,MAAM,KAAK,GAAG,OAAO,CAAC,KAAK,IAAI,IAAI,CAAC,MAAM,CAAC,KAAK,IAAI,wBAAwB,CAAC;QAC7E,MAAM,QAAQ,GAAG,MAAM,IAAI,CAAC,SAAS,CACnC,GAAG,IAAI,CAAC,MAAM,CAAC,OAAO,IAAI,8BAA8B,mBAAmB,OAAO,EAAE,EACpF;YACE,MAAM,EAAE,MAAM;YACd,OAAO,EAAE;gBACP,YAAY,EAAE,IAAI,CAAC,MAAM,CAAC,MAAM;gBAChC,cAAc,EAAE,kBAAkB;gBAClC,MAAM,EAAE,YAAY;aACrB;YACD,IAAI,EAAE,IAAI,CAAC,SAAS,CAAC;gBACnB,IAAI;gBACJ,QAAQ,EAAE,KAAK;gBACf,cAAc,EAAE;oBACd,SAAS,EACP,OAAO,OAAO,CAAC,uBAAuB,EAAE,SAAS,KAAK,QAAQ;wBAC5D,CAAC,CAAC,OAAO,CAAC,uBAAuB,CAAC,SAAS;wBAC3C,CAAC,CAAC,GAAG;oBACT,gBAAgB,EACd,OAAO,OAAO,CAAC,uBAAuB,EAAE,eAAe,KAAK,QAAQ;wBAClE,CAAC,CAAC,OAAO,CAAC,uBAAuB,CAAC,eAAe;wBACjD,CAAC,CAAC,IAAI;oBACV,KAAK,EACH,OAAO,OAAO,CAAC,uBAAuB,EAAE,KAAK,KAAK,QAAQ;wBACxD,CAAC,CAAC,OAAO,CAAC,uBAAuB,CAAC,KAAK;wBACvC,CAAC,CAAC,SAAS;oBACf,iBAAiB,EACf,OAAO,OAAO,CAAC,uBAAuB,EAAE,eAAe,KAAK,SAAS;wBACnE,CAAC,CAAC,OAAO,CAAC,uBAAuB,CAAC,eAAe;wBACjD,CAAC,CAAC,IAAI;iBACX;aACF,CAAC;SACH,CACF,CAAC;QAEF,IAAI,CAAC,QAAQ,CAAC,EAAE,EAAE,CAAC;YACjB,MAAM,OAAO,GAAG,MAAM,QAAQ,CAAC,IAAI,EAAE,CAAC;YACtC,MAAM,IAAI,KAAK,CAAC,gCAAgC,QAAQ,CAAC,MAAM,MAAM,OAAO,EAAE,CAAC,CAAC;QAClF,CAAC;QAED,MAAM,WAAW,GAAG,MAAM,CAAC,IAAI,CAAC,MAAM,QAAQ,CAAC,WAAW,EAAE,CAAC,CAAC;QAC9D,OAAO;YACL,WAAW;YACX,QAAQ,EAAE,YAAY;YACtB,IAAI,EAAE,CAAC;YACP,SAAS,EAAE,OAAO;YAClB,YAAY,EAAE,IAAI,CAAC,WAAW;YAC9B,KAAK,EAAE;gBACL,UAAU,EAAE,IAAI,CAAC,MAAM;gBACvB,SAAS,EAAE,KAAK;aACjB;SACF,CAAC;IACJ,CAAC;IAED,KAAK,CAAC,mBAAmB;QACvB,MAAM,QAAQ,GAAG,MAAM,IAAI,CAAC,SAAS,CACnC,GAAG,IAAI,CAAC,MAAM,CAAC,OAAO,IAAI,8BAA8B,SAAS,EACjE;YACE,MAAM,EAAE,KAAK;YACb,OAAO,EAAE;gBACP,YAAY,EAAE,IAAI,CAAC,MAAM,CAAC,MAAM;aACjC;SACF,CACF,CAAC;QAEF,IAAI,CAAC,QAAQ,CAAC,EAAE,EAAE,CAAC;YACjB,OAAO,EAAE,CAAC;QACZ,CAAC;QAED,MAAM,OAAO,GAAG,CAAC,MAAM,QAAQ,CAAC,IAAI,EAAE,CAAgD,CAAC;QACvF,OAAO,CAAC,OAAO,CAAC,MAAM,IAAI,EAAE,CAAC;aAC1B,MAAM,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,OAAO,KAAK,KAAK,QAAQ,IAAI,KAAK,KAAK,IAAI,CAAC;aAC9D,GAAG,CAAC,CAAC,KAAK,EAAE,EAAE;YACb,MAAM,MAAM,GACV,OAAO,KAAK,CAAC,MAAM,KAAK,QAAQ,IAAI,KAAK,CAAC,MAAM,KAAK,IAAI;gBACvD,CAAC,CAAE,KAAK,CAAC,MAAkC;gBAC3C,CAAC,CAAC,EAAE,CAAC;YAET,OAAO;gBACL,EAAE,EAAE,OAAO,KAAK,CAAC,QAAQ,KAAK,QAAQ,CAAC,CAAC,CAAC,KAAK,CAAC,QAAQ,CAAC,CAAC,CAAC,EAAE;gBAC5D,IAAI,EAAE,OAAO,KAAK,CAAC,IAAI,KAAK,QAAQ,CAAC,CAAC,CAAC,KAAK,CAAC,IAAI,CAAC,CAAC,CAAC,SAAS;gBAC7D,IAAI,EACF,OAAO,MAAM,CAAC,MAAM,KAAK,QAAQ;oBAC/B,CAAC,CAAC,MAAM,CAAC,MAAM;oBACf,CAAC,CAAC,OAAO,MAAM,CAAC,QAAQ,KAAK,QAAQ;wBACrC,CAAC,CAAC,MAAM,CAAC,QAAQ;wBACjB,CAAC,CAAC,SAAS;gBACf,WAAW,EACT,OAAO,KAAK,CAAC,WAAW,KAAK,QAAQ,CAAC,CAAC,CAAC,KAAK,CAAC,WAAW,CAAC,CAAC,CAAC,SAAS;gBACvE,QAAQ,EAAE,IAAI,CAAC,EAAE;aAClB,CAAC;QACJ,CAAC,CAAC;aACD,MAAM,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,KAAK,CAAC,EAAE,CAAC,CAAC;IACjC,CAAC;CACF"}
|
|
@@ -0,0 +1,20 @@
|
|
|
1
|
+
import type { SpeechSynthesisOptions, SpeechSynthesisResult, SpeechVoice, TextToSpeechProvider } from '../types.js';
|
|
2
|
+
export interface OpenAITextToSpeechProviderConfig {
|
|
3
|
+
apiKey: string;
|
|
4
|
+
baseUrl?: string;
|
|
5
|
+
model?: string;
|
|
6
|
+
voice?: string;
|
|
7
|
+
fetchImpl?: typeof fetch;
|
|
8
|
+
}
|
|
9
|
+
export declare class OpenAITextToSpeechProvider implements TextToSpeechProvider {
|
|
10
|
+
private readonly config;
|
|
11
|
+
readonly id = "openai-tts";
|
|
12
|
+
readonly displayName = "OpenAI TTS";
|
|
13
|
+
readonly supportsStreaming = true;
|
|
14
|
+
private readonly fetchImpl;
|
|
15
|
+
constructor(config: OpenAITextToSpeechProviderConfig);
|
|
16
|
+
getProviderName(): string;
|
|
17
|
+
synthesize(text: string, options?: SpeechSynthesisOptions): Promise<SpeechSynthesisResult>;
|
|
18
|
+
listAvailableVoices(): Promise<SpeechVoice[]>;
|
|
19
|
+
}
|
|
20
|
+
//# sourceMappingURL=OpenAITextToSpeechProvider.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"OpenAITextToSpeechProvider.d.ts","sourceRoot":"","sources":["../../../src/speech/providers/OpenAITextToSpeechProvider.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EACV,sBAAsB,EACtB,qBAAqB,EACrB,WAAW,EACX,oBAAoB,EACrB,MAAM,aAAa,CAAC;AAErB,MAAM,WAAW,gCAAgC;IAC/C,MAAM,EAAE,MAAM,CAAC;IACf,OAAO,CAAC,EAAE,MAAM,CAAC;IACjB,KAAK,CAAC,EAAE,MAAM,CAAC;IACf,KAAK,CAAC,EAAE,MAAM,CAAC;IACf,SAAS,CAAC,EAAE,OAAO,KAAK,CAAC;CAC1B;AA4BD,qBAAa,0BAA2B,YAAW,oBAAoB;IAMzD,OAAO,CAAC,QAAQ,CAAC,MAAM;IALnC,SAAgB,EAAE,gBAAgB;IAClC,SAAgB,WAAW,gBAAgB;IAC3C,SAAgB,iBAAiB,QAAQ;IACzC,OAAO,CAAC,QAAQ,CAAC,SAAS,CAAe;gBAEZ,MAAM,EAAE,gCAAgC;IAIrE,eAAe,IAAI,MAAM;IAInB,UAAU,CACd,IAAI,EAAE,MAAM,EACZ,OAAO,GAAE,sBAA2B,GACnC,OAAO,CAAC,qBAAqB,CAAC;IAyC3B,mBAAmB,IAAI,OAAO,CAAC,WAAW,EAAE,CAAC;CAGpD"}
|
|
@@ -0,0 +1,75 @@
|
|
|
1
|
+
const OPENAI_VOICES = [
|
|
2
|
+
{ id: 'alloy', name: 'Alloy', provider: 'openai-tts', lang: 'various', isDefault: false },
|
|
3
|
+
{ id: 'echo', name: 'Echo', provider: 'openai-tts', lang: 'various', isDefault: false },
|
|
4
|
+
{ id: 'fable', name: 'Fable', provider: 'openai-tts', lang: 'various', isDefault: false },
|
|
5
|
+
{ id: 'onyx', name: 'Onyx', provider: 'openai-tts', lang: 'various', isDefault: false },
|
|
6
|
+
{ id: 'nova', name: 'Nova', provider: 'openai-tts', lang: 'various', isDefault: true },
|
|
7
|
+
{ id: 'shimmer', name: 'Shimmer', provider: 'openai-tts', lang: 'various', isDefault: false },
|
|
8
|
+
];
|
|
9
|
+
function mimeTypeForOutput(format) {
|
|
10
|
+
switch (format) {
|
|
11
|
+
case 'opus':
|
|
12
|
+
return 'audio/opus';
|
|
13
|
+
case 'aac':
|
|
14
|
+
return 'audio/aac';
|
|
15
|
+
case 'flac':
|
|
16
|
+
return 'audio/flac';
|
|
17
|
+
case 'wav':
|
|
18
|
+
return 'audio/wav';
|
|
19
|
+
case 'pcm':
|
|
20
|
+
return 'audio/L16';
|
|
21
|
+
default:
|
|
22
|
+
return 'audio/mpeg';
|
|
23
|
+
}
|
|
24
|
+
}
|
|
25
|
+
export class OpenAITextToSpeechProvider {
|
|
26
|
+
constructor(config) {
|
|
27
|
+
this.config = config;
|
|
28
|
+
this.id = 'openai-tts';
|
|
29
|
+
this.displayName = 'OpenAI TTS';
|
|
30
|
+
this.supportsStreaming = true;
|
|
31
|
+
this.fetchImpl = config.fetchImpl ?? fetch;
|
|
32
|
+
}
|
|
33
|
+
getProviderName() {
|
|
34
|
+
return this.displayName;
|
|
35
|
+
}
|
|
36
|
+
async synthesize(text, options = {}) {
|
|
37
|
+
const model = options.model ?? this.config.model ?? 'tts-1';
|
|
38
|
+
const voice = options.voice ?? this.config.voice ?? 'nova';
|
|
39
|
+
const outputFormat = options.outputFormat ?? 'mp3';
|
|
40
|
+
const response = await this.fetchImpl(`${this.config.baseUrl ?? 'https://api.openai.com/v1'}/audio/speech`, {
|
|
41
|
+
method: 'POST',
|
|
42
|
+
headers: {
|
|
43
|
+
Authorization: `Bearer ${this.config.apiKey}`,
|
|
44
|
+
'Content-Type': 'application/json',
|
|
45
|
+
},
|
|
46
|
+
body: JSON.stringify({
|
|
47
|
+
model,
|
|
48
|
+
voice,
|
|
49
|
+
input: text,
|
|
50
|
+
response_format: outputFormat,
|
|
51
|
+
speed: options.speed,
|
|
52
|
+
}),
|
|
53
|
+
});
|
|
54
|
+
if (!response.ok) {
|
|
55
|
+
const message = await response.text();
|
|
56
|
+
throw new Error(`OpenAI TTS synthesis failed (${response.status}): ${message}`);
|
|
57
|
+
}
|
|
58
|
+
const audioBuffer = Buffer.from(await response.arrayBuffer());
|
|
59
|
+
return {
|
|
60
|
+
audioBuffer,
|
|
61
|
+
mimeType: mimeTypeForOutput(outputFormat),
|
|
62
|
+
cost: 0,
|
|
63
|
+
voiceUsed: voice,
|
|
64
|
+
providerName: this.displayName,
|
|
65
|
+
usage: {
|
|
66
|
+
characters: text.length,
|
|
67
|
+
modelUsed: model,
|
|
68
|
+
},
|
|
69
|
+
};
|
|
70
|
+
}
|
|
71
|
+
async listAvailableVoices() {
|
|
72
|
+
return [...OPENAI_VOICES];
|
|
73
|
+
}
|
|
74
|
+
}
|
|
75
|
+
//# sourceMappingURL=OpenAITextToSpeechProvider.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"OpenAITextToSpeechProvider.js","sourceRoot":"","sources":["../../../src/speech/providers/OpenAITextToSpeechProvider.ts"],"names":[],"mappings":"AAeA,MAAM,aAAa,GAA2B;IAC5C,EAAE,EAAE,EAAE,OAAO,EAAE,IAAI,EAAE,OAAO,EAAE,QAAQ,EAAE,YAAY,EAAE,IAAI,EAAE,SAAS,EAAE,SAAS,EAAE,KAAK,EAAE;IACzF,EAAE,EAAE,EAAE,MAAM,EAAE,IAAI,EAAE,MAAM,EAAE,QAAQ,EAAE,YAAY,EAAE,IAAI,EAAE,SAAS,EAAE,SAAS,EAAE,KAAK,EAAE;IACvF,EAAE,EAAE,EAAE,OAAO,EAAE,IAAI,EAAE,OAAO,EAAE,QAAQ,EAAE,YAAY,EAAE,IAAI,EAAE,SAAS,EAAE,SAAS,EAAE,KAAK,EAAE;IACzF,EAAE,EAAE,EAAE,MAAM,EAAE,IAAI,EAAE,MAAM,EAAE,QAAQ,EAAE,YAAY,EAAE,IAAI,EAAE,SAAS,EAAE,SAAS,EAAE,KAAK,EAAE;IACvF,EAAE,EAAE,EAAE,MAAM,EAAE,IAAI,EAAE,MAAM,EAAE,QAAQ,EAAE,YAAY,EAAE,IAAI,EAAE,SAAS,EAAE,SAAS,EAAE,IAAI,EAAE;IACtF,EAAE,EAAE,EAAE,SAAS,EAAE,IAAI,EAAE,SAAS,EAAE,QAAQ,EAAE,YAAY,EAAE,IAAI,EAAE,SAAS,EAAE,SAAS,EAAE,KAAK,EAAE;CAC9F,CAAC;AAEF,SAAS,iBAAiB,CAAC,MAA0B;IACnD,QAAQ,MAAM,EAAE,CAAC;QACf,KAAK,MAAM;YACT,OAAO,YAAY,CAAC;QACtB,KAAK,KAAK;YACR,OAAO,WAAW,CAAC;QACrB,KAAK,MAAM;YACT,OAAO,YAAY,CAAC;QACtB,KAAK,KAAK;YACR,OAAO,WAAW,CAAC;QACrB,KAAK,KAAK;YACR,OAAO,WAAW,CAAC;QACrB;YACE,OAAO,YAAY,CAAC;IACxB,CAAC;AACH,CAAC;AAED,MAAM,OAAO,0BAA0B;IAMrC,YAA6B,MAAwC;QAAxC,WAAM,GAAN,MAAM,CAAkC;QALrD,OAAE,GAAG,YAAY,CAAC;QAClB,gBAAW,GAAG,YAAY,CAAC;QAC3B,sBAAiB,GAAG,IAAI,CAAC;QAIvC,IAAI,CAAC,SAAS,GAAG,MAAM,CAAC,SAAS,IAAI,KAAK,CAAC;IAC7C,CAAC;IAED,eAAe;QACb,OAAO,IAAI,CAAC,WAAW,CAAC;IAC1B,CAAC;IAED,KAAK,CAAC,UAAU,CACd,IAAY,EACZ,UAAkC,EAAE;QAEpC,MAAM,KAAK,GAAG,OAAO,CAAC,KAAK,IAAI,IAAI,CAAC,MAAM,CAAC,KAAK,IAAI,OAAO,CAAC;QAC5D,MAAM,KAAK,GAAG,OAAO,CAAC,KAAK,IAAI,IAAI,CAAC,MAAM,CAAC,KAAK,IAAI,MAAM,CAAC;QAC3D,MAAM,YAAY,GAAG,OAAO,CAAC,YAAY,IAAI,KAAK,CAAC;QACnD,MAAM,QAAQ,GAAG,MAAM,IAAI,CAAC,SAAS,CACnC,GAAG,IAAI,CAAC,MAAM,CAAC,OAAO,IAAI,2BAA2B,eAAe,EACpE;YACE,MAAM,EAAE,MAAM;YACd,OAAO,EAAE;gBACP,aAAa,EAAE,UAAU,IAAI,CAAC,MAAM,CAAC,MAAM,EAAE;gBAC7C,cAAc,EAAE,kBAAkB;aACnC;YACD,IAAI,EAAE,IAAI,CAAC,SAAS,CAAC;gBACnB,KAAK;gBACL,KAAK;gBACL,KAAK,EAAE,IAAI;gBACX,eAAe,EAAE,YAAY;gBAC7B,KAAK,EAAE,OAAO,CAAC,KAAK;aACrB,CAAC;SACH,CACF,CAAC;QAEF,IAAI,CAAC,QAAQ,CAAC,EAAE,EAAE,CAAC;YACjB,MAAM,OAAO,GAAG,MAAM,QAAQ,CAAC,IAAI,EAAE,CAAC;YACtC,MAAM,IAAI,KAAK,CAAC,gCAAgC,QAAQ,CAAC,MAAM,MAAM,OAAO,EAAE,CAAC,CAAC;QAClF,CAAC;QAED,MAAM,WAAW,GAAG,MAAM,CAAC,IAAI,CAAC,MAAM,QAAQ,CAAC,WAAW,EAAE,CAAC,CAAC;QAC9D,OAAO;YACL,WAAW;YACX,QAAQ,EAAE,iBAAiB,CAAC,YAAY,CAAC;YACzC,IAAI,EAAE,CAAC;YACP,SAAS,EAAE,KAAK;YAChB,YAAY,EAAE,IAAI,CAAC,WAAW;YAC9B,KAAK,EAAE;gBACL,UAAU,EAAE,IAAI,CAAC,MAAM;gBACvB,SAAS,EAAE,KAAK;aACjB;SACF,CAAC;IACJ,CAAC;IAED,KAAK,CAAC,mBAAmB;QACvB,OAAO,CAAC,GAAG,aAAa,CAAC,CAAC;IAC5B,CAAC;CACF"}
|
|
@@ -0,0 +1,18 @@
|
|
|
1
|
+
import type { SpeechAudioInput, SpeechToTextProvider, SpeechTranscriptionOptions, SpeechTranscriptionResult } from '../types.js';
|
|
2
|
+
export interface OpenAIWhisperSpeechToTextProviderConfig {
|
|
3
|
+
apiKey: string;
|
|
4
|
+
baseUrl?: string;
|
|
5
|
+
model?: string;
|
|
6
|
+
fetchImpl?: typeof fetch;
|
|
7
|
+
}
|
|
8
|
+
export declare class OpenAIWhisperSpeechToTextProvider implements SpeechToTextProvider {
|
|
9
|
+
private readonly config;
|
|
10
|
+
readonly id = "openai-whisper";
|
|
11
|
+
readonly displayName = "OpenAI Whisper";
|
|
12
|
+
readonly supportsStreaming = false;
|
|
13
|
+
private readonly fetchImpl;
|
|
14
|
+
constructor(config: OpenAIWhisperSpeechToTextProviderConfig);
|
|
15
|
+
getProviderName(): string;
|
|
16
|
+
transcribe(audio: SpeechAudioInput, options?: SpeechTranscriptionOptions): Promise<SpeechTranscriptionResult>;
|
|
17
|
+
}
|
|
18
|
+
//# sourceMappingURL=OpenAIWhisperSpeechToTextProvider.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"OpenAIWhisperSpeechToTextProvider.d.ts","sourceRoot":"","sources":["../../../src/speech/providers/OpenAIWhisperSpeechToTextProvider.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EACV,gBAAgB,EAEhB,oBAAoB,EACpB,0BAA0B,EAC1B,yBAAyB,EAE1B,MAAM,aAAa,CAAC;AAErB,MAAM,WAAW,uCAAuC;IACtD,MAAM,EAAE,MAAM,CAAC;IACf,OAAO,CAAC,EAAE,MAAM,CAAC;IACjB,KAAK,CAAC,EAAE,MAAM,CAAC;IACf,SAAS,CAAC,EAAE,OAAO,KAAK,CAAC;CAC1B;AA8CD,qBAAa,iCAAkC,YAAW,oBAAoB;IAMhE,OAAO,CAAC,QAAQ,CAAC,MAAM;IALnC,SAAgB,EAAE,oBAAoB;IACtC,SAAgB,WAAW,oBAAoB;IAC/C,SAAgB,iBAAiB,SAAS;IAC1C,OAAO,CAAC,QAAQ,CAAC,SAAS,CAAe;gBAEZ,MAAM,EAAE,uCAAuC;IAI5E,eAAe,IAAI,MAAM;IAInB,UAAU,CACd,KAAK,EAAE,gBAAgB,EACvB,OAAO,GAAE,0BAA+B,GACvC,OAAO,CAAC,yBAAyB,CAAC;CAoEtC"}
|