@getpaseo/server 0.1.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.env.example +20 -0
- package/README.md +107 -0
- package/agent-prompt.md +339 -0
- package/dist/scripts/daemon-runner.js +32 -0
- package/dist/scripts/daemon-runner.js.map +1 -0
- package/dist/scripts/dev-runner.js +19 -0
- package/dist/scripts/dev-runner.js.map +1 -0
- package/dist/scripts/mcp-stdio-socket-bridge-cli.mjs +62 -0
- package/dist/scripts/supervisor.js +95 -0
- package/dist/scripts/supervisor.js.map +1 -0
- package/dist/server/client/daemon-client.d.ts +383 -0
- package/dist/server/client/daemon-client.d.ts.map +1 -0
- package/dist/server/client/daemon-client.js +2443 -0
- package/dist/server/client/daemon-client.js.map +1 -0
- package/dist/server/server/agent/activity-curator.d.ts +8 -0
- package/dist/server/server/agent/activity-curator.d.ts.map +1 -0
- package/dist/server/server/agent/activity-curator.js +228 -0
- package/dist/server/server/agent/activity-curator.js.map +1 -0
- package/dist/server/server/agent/agent-management-mcp.d.ts +34 -0
- package/dist/server/server/agent/agent-management-mcp.d.ts.map +1 -0
- package/dist/server/server/agent/agent-management-mcp.js +619 -0
- package/dist/server/server/agent/agent-management-mcp.js.map +1 -0
- package/dist/server/server/agent/agent-manager.d.ts +182 -0
- package/dist/server/server/agent/agent-manager.d.ts.map +1 -0
- package/dist/server/server/agent/agent-manager.js +1066 -0
- package/dist/server/server/agent/agent-manager.js.map +1 -0
- package/dist/server/server/agent/agent-metadata-generator.d.ts +29 -0
- package/dist/server/server/agent/agent-metadata-generator.d.ts.map +1 -0
- package/dist/server/server/agent/agent-metadata-generator.js +157 -0
- package/dist/server/server/agent/agent-metadata-generator.js.map +1 -0
- package/dist/server/server/agent/agent-projections.d.ts +12 -0
- package/dist/server/server/agent/agent-projections.d.ts.map +1 -0
- package/dist/server/server/agent/agent-projections.js +238 -0
- package/dist/server/server/agent/agent-projections.js.map +1 -0
- package/dist/server/server/agent/agent-response-loop.d.ts +32 -0
- package/dist/server/server/agent/agent-response-loop.d.ts.map +1 -0
- package/dist/server/server/agent/agent-response-loop.js +224 -0
- package/dist/server/server/agent/agent-response-loop.js.map +1 -0
- package/dist/server/server/agent/agent-sdk-types.d.ts +360 -0
- package/dist/server/server/agent/agent-sdk-types.d.ts.map +1 -0
- package/dist/server/server/agent/agent-sdk-types.js +2 -0
- package/dist/server/server/agent/agent-sdk-types.js.map +1 -0
- package/dist/server/server/agent/agent-storage.d.ts +187 -0
- package/dist/server/server/agent/agent-storage.d.ts.map +1 -0
- package/dist/server/server/agent/agent-storage.js +328 -0
- package/dist/server/server/agent/agent-storage.js.map +1 -0
- package/dist/server/server/agent/audio-utils.d.ts +3 -0
- package/dist/server/server/agent/audio-utils.d.ts.map +1 -0
- package/dist/server/server/agent/audio-utils.js +19 -0
- package/dist/server/server/agent/audio-utils.js.map +1 -0
- package/dist/server/server/agent/dictation-debug.d.ts +13 -0
- package/dist/server/server/agent/dictation-debug.d.ts.map +1 -0
- package/dist/server/server/agent/dictation-debug.js +50 -0
- package/dist/server/server/agent/dictation-debug.js.map +1 -0
- package/dist/server/server/agent/llm-openai.d.ts +7 -0
- package/dist/server/server/agent/llm-openai.d.ts.map +1 -0
- package/dist/server/server/agent/llm-openai.js +8 -0
- package/dist/server/server/agent/llm-openai.js.map +1 -0
- package/dist/server/server/agent/mcp-server.d.ts +26 -0
- package/dist/server/server/agent/mcp-server.d.ts.map +1 -0
- package/dist/server/server/agent/mcp-server.js +762 -0
- package/dist/server/server/agent/mcp-server.js.map +1 -0
- package/dist/server/server/agent/model-resolver.d.ts +11 -0
- package/dist/server/server/agent/model-resolver.d.ts.map +1 -0
- package/dist/server/server/agent/model-resolver.js +21 -0
- package/dist/server/server/agent/model-resolver.js.map +1 -0
- package/dist/server/server/agent/orchestrator-instructions.d.ts +7 -0
- package/dist/server/server/agent/orchestrator-instructions.d.ts.map +1 -0
- package/dist/server/server/agent/orchestrator-instructions.js +51 -0
- package/dist/server/server/agent/orchestrator-instructions.js.map +1 -0
- package/dist/server/server/agent/orchestrator.d.ts +12 -0
- package/dist/server/server/agent/orchestrator.d.ts.map +1 -0
- package/dist/server/server/agent/orchestrator.js +12 -0
- package/dist/server/server/agent/orchestrator.js.map +1 -0
- package/dist/server/server/agent/pcm16-resampler.d.ts +14 -0
- package/dist/server/server/agent/pcm16-resampler.d.ts.map +1 -0
- package/dist/server/server/agent/pcm16-resampler.js +63 -0
- package/dist/server/server/agent/pcm16-resampler.js.map +1 -0
- package/dist/server/server/agent/provider-launch-config.d.ts +139 -0
- package/dist/server/server/agent/provider-launch-config.d.ts.map +1 -0
- package/dist/server/server/agent/provider-launch-config.js +83 -0
- package/dist/server/server/agent/provider-launch-config.js.map +1 -0
- package/dist/server/server/agent/provider-manifest.d.ts +20 -0
- package/dist/server/server/agent/provider-manifest.d.ts.map +1 -0
- package/dist/server/server/agent/provider-manifest.js +97 -0
- package/dist/server/server/agent/provider-manifest.js.map +1 -0
- package/dist/server/server/agent/provider-registry.d.ts +18 -0
- package/dist/server/server/agent/provider-registry.d.ts.map +1 -0
- package/dist/server/server/agent/provider-registry.js +45 -0
- package/dist/server/server/agent/provider-registry.js.map +1 -0
- package/dist/server/server/agent/providers/claude/tool-call-detail-parser.d.ts +3 -0
- package/dist/server/server/agent/providers/claude/tool-call-detail-parser.d.ts.map +1 -0
- package/dist/server/server/agent/providers/claude/tool-call-detail-parser.js +42 -0
- package/dist/server/server/agent/providers/claude/tool-call-detail-parser.js.map +1 -0
- package/dist/server/server/agent/providers/claude/tool-call-mapper.d.ts +16 -0
- package/dist/server/server/agent/providers/claude/tool-call-mapper.d.ts.map +1 -0
- package/dist/server/server/agent/providers/claude/tool-call-mapper.js +73 -0
- package/dist/server/server/agent/providers/claude/tool-call-mapper.js.map +1 -0
- package/dist/server/server/agent/providers/claude-agent.d.ts +35 -0
- package/dist/server/server/agent/providers/claude-agent.d.ts.map +1 -0
- package/dist/server/server/agent/providers/claude-agent.js +2056 -0
- package/dist/server/server/agent/providers/claude-agent.js.map +1 -0
- package/dist/server/server/agent/providers/codex/tool-call-detail-parser.d.ts +13 -0
- package/dist/server/server/agent/providers/codex/tool-call-detail-parser.d.ts.map +1 -0
- package/dist/server/server/agent/providers/codex/tool-call-detail-parser.js +67 -0
- package/dist/server/server/agent/providers/codex/tool-call-detail-parser.js.map +1 -0
- package/dist/server/server/agent/providers/codex/tool-call-mapper.d.ts +15 -0
- package/dist/server/server/agent/providers/codex/tool-call-mapper.d.ts.map +1 -0
- package/dist/server/server/agent/providers/codex/tool-call-mapper.js +640 -0
- package/dist/server/server/agent/providers/codex/tool-call-mapper.js.map +1 -0
- package/dist/server/server/agent/providers/codex-app-server-agent.d.ts +34 -0
- package/dist/server/server/agent/providers/codex-app-server-agent.d.ts.map +1 -0
- package/dist/server/server/agent/providers/codex-app-server-agent.js +2476 -0
- package/dist/server/server/agent/providers/codex-app-server-agent.js.map +1 -0
- package/dist/server/server/agent/providers/codex-rollout-timeline.d.ts +9 -0
- package/dist/server/server/agent/providers/codex-rollout-timeline.d.ts.map +1 -0
- package/dist/server/server/agent/providers/codex-rollout-timeline.js +486 -0
- package/dist/server/server/agent/providers/codex-rollout-timeline.js.map +1 -0
- package/dist/server/server/agent/providers/opencode/tool-call-detail-parser.d.ts +3 -0
- package/dist/server/server/agent/providers/opencode/tool-call-detail-parser.d.ts.map +1 -0
- package/dist/server/server/agent/providers/opencode/tool-call-detail-parser.js +33 -0
- package/dist/server/server/agent/providers/opencode/tool-call-detail-parser.js.map +1 -0
- package/dist/server/server/agent/providers/opencode/tool-call-mapper.d.ts +13 -0
- package/dist/server/server/agent/providers/opencode/tool-call-mapper.d.ts.map +1 -0
- package/dist/server/server/agent/providers/opencode/tool-call-mapper.js +75 -0
- package/dist/server/server/agent/providers/opencode/tool-call-mapper.js.map +1 -0
- package/dist/server/server/agent/providers/opencode-agent.d.ts +37 -0
- package/dist/server/server/agent/providers/opencode-agent.d.ts.map +1 -0
- package/dist/server/server/agent/providers/opencode-agent.js +822 -0
- package/dist/server/server/agent/providers/opencode-agent.js.map +1 -0
- package/dist/server/server/agent/providers/tool-call-detail-primitives.d.ts +1363 -0
- package/dist/server/server/agent/providers/tool-call-detail-primitives.d.ts.map +1 -0
- package/dist/server/server/agent/providers/tool-call-detail-primitives.js +534 -0
- package/dist/server/server/agent/providers/tool-call-detail-primitives.js.map +1 -0
- package/dist/server/server/agent/providers/tool-call-mapper-utils.d.ts +18 -0
- package/dist/server/server/agent/providers/tool-call-mapper-utils.d.ts.map +1 -0
- package/dist/server/server/agent/providers/tool-call-mapper-utils.js +119 -0
- package/dist/server/server/agent/providers/tool-call-mapper-utils.js.map +1 -0
- package/dist/server/server/agent/recordings-debug.d.ts +3 -0
- package/dist/server/server/agent/recordings-debug.d.ts.map +1 -0
- package/dist/server/server/agent/recordings-debug.js +19 -0
- package/dist/server/server/agent/recordings-debug.js.map +1 -0
- package/dist/server/server/agent/stt-debug.d.ts +10 -0
- package/dist/server/server/agent/stt-debug.d.ts.map +1 -0
- package/dist/server/server/agent/stt-debug.js +33 -0
- package/dist/server/server/agent/stt-debug.js.map +1 -0
- package/dist/server/server/agent/stt-manager.d.ts +32 -0
- package/dist/server/server/agent/stt-manager.d.ts.map +1 -0
- package/dist/server/server/agent/stt-manager.js +231 -0
- package/dist/server/server/agent/stt-manager.js.map +1 -0
- package/dist/server/server/agent/system-prompt.d.ts +3 -0
- package/dist/server/server/agent/system-prompt.d.ts.map +1 -0
- package/dist/server/server/agent/system-prompt.js +19 -0
- package/dist/server/server/agent/system-prompt.js.map +1 -0
- package/dist/server/server/agent/tool-name-normalization.d.ts +7 -0
- package/dist/server/server/agent/tool-name-normalization.d.ts.map +1 -0
- package/dist/server/server/agent/tool-name-normalization.js +45 -0
- package/dist/server/server/agent/tool-name-normalization.js.map +1 -0
- package/dist/server/server/agent/tts-debug.d.ts +8 -0
- package/dist/server/server/agent/tts-debug.d.ts.map +1 -0
- package/dist/server/server/agent/tts-debug.js +24 -0
- package/dist/server/server/agent/tts-debug.js.map +1 -0
- package/dist/server/server/agent/tts-manager.d.ts +33 -0
- package/dist/server/server/agent/tts-manager.d.ts.map +1 -0
- package/dist/server/server/agent/tts-manager.js +261 -0
- package/dist/server/server/agent/tts-manager.js.map +1 -0
- package/dist/server/server/agent/wait-for-agent-tracker.d.ts +15 -0
- package/dist/server/server/agent/wait-for-agent-tracker.d.ts.map +1 -0
- package/dist/server/server/agent/wait-for-agent-tracker.js +53 -0
- package/dist/server/server/agent/wait-for-agent-tracker.js.map +1 -0
- package/dist/server/server/allowed-hosts.d.ts +13 -0
- package/dist/server/server/allowed-hosts.d.ts.map +1 -0
- package/dist/server/server/allowed-hosts.js +94 -0
- package/dist/server/server/allowed-hosts.js.map +1 -0
- package/dist/server/server/bootstrap.d.ts +49 -0
- package/dist/server/server/bootstrap.d.ts.map +1 -0
- package/dist/server/server/bootstrap.js +483 -0
- package/dist/server/server/bootstrap.js.map +1 -0
- package/dist/server/server/config.d.ts +13 -0
- package/dist/server/server/config.d.ts.map +1 -0
- package/dist/server/server/config.js +84 -0
- package/dist/server/server/config.js.map +1 -0
- package/dist/server/server/connection-offer.d.ts +19 -0
- package/dist/server/server/connection-offer.d.ts.map +1 -0
- package/dist/server/server/connection-offer.js +60 -0
- package/dist/server/server/connection-offer.js.map +1 -0
- package/dist/server/server/daemon-keypair.d.ts +8 -0
- package/dist/server/server/daemon-keypair.d.ts.map +1 -0
- package/dist/server/server/daemon-keypair.js +40 -0
- package/dist/server/server/daemon-keypair.js.map +1 -0
- package/dist/server/server/dictation/dictation-stream-manager.d.ts +76 -0
- package/dist/server/server/dictation/dictation-stream-manager.d.ts.map +1 -0
- package/dist/server/server/dictation/dictation-stream-manager.js +481 -0
- package/dist/server/server/dictation/dictation-stream-manager.js.map +1 -0
- package/dist/server/server/exports.d.ts +11 -0
- package/dist/server/server/exports.d.ts.map +1 -0
- package/dist/server/server/exports.js +11 -0
- package/dist/server/server/exports.js.map +1 -0
- package/dist/server/server/file-download/token-store.d.ts +25 -0
- package/dist/server/server/file-download/token-store.d.ts.map +1 -0
- package/dist/server/server/file-download/token-store.js +40 -0
- package/dist/server/server/file-download/token-store.js.map +1 -0
- package/dist/server/server/file-explorer/service.d.ts +41 -0
- package/dist/server/server/file-explorer/service.d.ts.map +1 -0
- package/dist/server/server/file-explorer/service.js +163 -0
- package/dist/server/server/file-explorer/service.js.map +1 -0
- package/dist/server/server/index.d.ts +2 -0
- package/dist/server/server/index.d.ts.map +1 -0
- package/dist/server/server/index.js +90 -0
- package/dist/server/server/index.js.map +1 -0
- package/dist/server/server/json-utils.d.ts +11 -0
- package/dist/server/server/json-utils.d.ts.map +1 -0
- package/dist/server/server/json-utils.js +45 -0
- package/dist/server/server/json-utils.js.map +1 -0
- package/dist/server/server/logger.d.ts +12 -0
- package/dist/server/server/logger.d.ts.map +1 -0
- package/dist/server/server/logger.js +29 -0
- package/dist/server/server/logger.js.map +1 -0
- package/dist/server/server/messages.d.ts +9 -0
- package/dist/server/server/messages.d.ts.map +1 -0
- package/dist/server/server/messages.js +29 -0
- package/dist/server/server/messages.js.map +1 -0
- package/dist/server/server/pairing-offer.d.ts +16 -0
- package/dist/server/server/pairing-offer.d.ts.map +1 -0
- package/dist/server/server/pairing-offer.js +45 -0
- package/dist/server/server/pairing-offer.js.map +1 -0
- package/dist/server/server/pairing-qr.d.ts +7 -0
- package/dist/server/server/pairing-qr.d.ts.map +1 -0
- package/dist/server/server/pairing-qr.js +45 -0
- package/dist/server/server/pairing-qr.js.map +1 -0
- package/dist/server/server/paseo-home.d.ts +2 -0
- package/dist/server/server/paseo-home.d.ts.map +1 -0
- package/dist/server/server/paseo-home.js +19 -0
- package/dist/server/server/paseo-home.js.map +1 -0
- package/dist/server/server/path-utils.d.ts +3 -0
- package/dist/server/server/path-utils.d.ts.map +1 -0
- package/dist/server/server/path-utils.js +20 -0
- package/dist/server/server/path-utils.js.map +1 -0
- package/dist/server/server/persisted-config.d.ts +500 -0
- package/dist/server/server/persisted-config.d.ts.map +1 -0
- package/dist/server/server/persisted-config.js +212 -0
- package/dist/server/server/persisted-config.js.map +1 -0
- package/dist/server/server/persistence-hooks.d.ts +24 -0
- package/dist/server/server/persistence-hooks.d.ts.map +1 -0
- package/dist/server/server/persistence-hooks.js +60 -0
- package/dist/server/server/persistence-hooks.js.map +1 -0
- package/dist/server/server/pid-lock.d.ts +19 -0
- package/dist/server/server/pid-lock.d.ts.map +1 -0
- package/dist/server/server/pid-lock.js +115 -0
- package/dist/server/server/pid-lock.js.map +1 -0
- package/dist/server/server/push/push-service.d.ts +21 -0
- package/dist/server/server/push/push-service.d.ts.map +1 -0
- package/dist/server/server/push/push-service.js +68 -0
- package/dist/server/server/push/push-service.js.map +1 -0
- package/dist/server/server/push/token-store.d.ts +18 -0
- package/dist/server/server/push/token-store.d.ts.map +1 -0
- package/dist/server/server/push/token-store.js +70 -0
- package/dist/server/server/push/token-store.js.map +1 -0
- package/dist/server/server/relay-transport.d.ts +22 -0
- package/dist/server/server/relay-transport.d.ts.map +1 -0
- package/dist/server/server/relay-transport.js +374 -0
- package/dist/server/server/relay-transport.js.map +1 -0
- package/dist/server/server/server-id.d.ts +17 -0
- package/dist/server/server/server-id.d.ts.map +1 -0
- package/dist/server/server/server-id.js +63 -0
- package/dist/server/server/server-id.js.map +1 -0
- package/dist/server/server/session.d.ts +360 -0
- package/dist/server/server/session.d.ts.map +1 -0
- package/dist/server/server/session.js +4615 -0
- package/dist/server/server/session.js.map +1 -0
- package/dist/server/server/speech/audio.d.ts +10 -0
- package/dist/server/server/speech/audio.d.ts.map +1 -0
- package/dist/server/server/speech/audio.js +101 -0
- package/dist/server/server/speech/audio.js.map +1 -0
- package/dist/server/server/speech/providers/local/config.d.ts +26 -0
- package/dist/server/server/speech/providers/local/config.d.ts.map +1 -0
- package/dist/server/server/speech/providers/local/config.js +93 -0
- package/dist/server/server/speech/providers/local/config.js.map +1 -0
- package/dist/server/server/speech/providers/local/models.d.ts +12 -0
- package/dist/server/server/speech/providers/local/models.d.ts.map +1 -0
- package/dist/server/server/speech/providers/local/models.js +18 -0
- package/dist/server/server/speech/providers/local/models.js.map +1 -0
- package/dist/server/server/speech/providers/local/pocket/pocket-tts-onnx.d.ts +24 -0
- package/dist/server/server/speech/providers/local/pocket/pocket-tts-onnx.d.ts.map +1 -0
- package/dist/server/server/speech/providers/local/pocket/pocket-tts-onnx.js +422 -0
- package/dist/server/server/speech/providers/local/pocket/pocket-tts-onnx.js.map +1 -0
- package/dist/server/server/speech/providers/local/runtime.d.ts +30 -0
- package/dist/server/server/speech/providers/local/runtime.d.ts.map +1 -0
- package/dist/server/server/speech/providers/local/runtime.js +254 -0
- package/dist/server/server/speech/providers/local/runtime.js.map +1 -0
- package/dist/server/server/speech/providers/local/sherpa/model-catalog.d.ts +117 -0
- package/dist/server/server/speech/providers/local/sherpa/model-catalog.d.ts.map +1 -0
- package/dist/server/server/speech/providers/local/sherpa/model-catalog.js +166 -0
- package/dist/server/server/speech/providers/local/sherpa/model-catalog.js.map +1 -0
- package/dist/server/server/speech/providers/local/sherpa/model-downloader.d.ts +17 -0
- package/dist/server/server/speech/providers/local/sherpa/model-downloader.d.ts.map +1 -0
- package/dist/server/server/speech/providers/local/sherpa/model-downloader.js +151 -0
- package/dist/server/server/speech/providers/local/sherpa/model-downloader.js.map +1 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-offline-recognizer.d.ts +28 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-offline-recognizer.d.ts.map +1 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-offline-recognizer.js +68 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-offline-recognizer.js.map +1 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-online-recognizer.d.ts +37 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-online-recognizer.d.ts.map +1 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-online-recognizer.js +79 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-online-recognizer.js.map +1 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-onnx-loader.d.ts +7 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-onnx-loader.d.ts.map +1 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-onnx-loader.js +11 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-onnx-loader.js.map +1 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-onnx-node-loader.d.ts +7 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-onnx-node-loader.d.ts.map +1 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-onnx-node-loader.js +44 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-onnx-node-loader.js.map +1 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-parakeet-realtime-session.d.ts +28 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-parakeet-realtime-session.d.ts.map +1 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-parakeet-realtime-session.js +131 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-parakeet-realtime-session.js.map +1 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-parakeet-stt.d.ts +21 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-parakeet-stt.d.ts.map +1 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-parakeet-stt.js +132 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-parakeet-stt.js.map +1 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-realtime-session.d.ts +23 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-realtime-session.d.ts.map +1 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-realtime-session.js +112 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-realtime-session.js.map +1 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-stt.d.ts +23 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-stt.d.ts.map +1 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-stt.js +140 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-stt.js.map +1 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-tts.d.ts +21 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-tts.d.ts.map +1 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-tts.js +95 -0
- package/dist/server/server/speech/providers/local/sherpa/sherpa-tts.js.map +1 -0
- package/dist/server/server/speech/providers/openai/config.d.ts +22 -0
- package/dist/server/server/speech/providers/openai/config.d.ts.map +1 -0
- package/dist/server/server/speech/providers/openai/config.js +94 -0
- package/dist/server/server/speech/providers/openai/config.js.map +1 -0
- package/dist/server/server/speech/providers/openai/realtime-transcription-session.d.ts +42 -0
- package/dist/server/server/speech/providers/openai/realtime-transcription-session.d.ts.map +1 -0
- package/dist/server/server/speech/providers/openai/realtime-transcription-session.js +165 -0
- package/dist/server/server/speech/providers/openai/realtime-transcription-session.js.map +1 -0
- package/dist/server/server/speech/providers/openai/runtime.d.ts +27 -0
- package/dist/server/server/speech/providers/openai/runtime.d.ts.map +1 -0
- package/dist/server/server/speech/providers/openai/runtime.js +103 -0
- package/dist/server/server/speech/providers/openai/runtime.js.map +1 -0
- package/dist/server/server/speech/providers/openai/stt.d.ts +22 -0
- package/dist/server/server/speech/providers/openai/stt.d.ts.map +1 -0
- package/dist/server/server/speech/providers/openai/stt.js +208 -0
- package/dist/server/server/speech/providers/openai/stt.js.map +1 -0
- package/dist/server/server/speech/providers/openai/tts.d.ts +18 -0
- package/dist/server/server/speech/providers/openai/tts.d.ts.map +1 -0
- package/dist/server/server/speech/providers/openai/tts.js +46 -0
- package/dist/server/server/speech/providers/openai/tts.js.map +1 -0
- package/dist/server/server/speech/speech-config-resolver.d.ts +11 -0
- package/dist/server/server/speech/speech-config-resolver.d.ts.map +1 -0
- package/dist/server/server/speech/speech-config-resolver.js +64 -0
- package/dist/server/server/speech/speech-config-resolver.js.map +1 -0
- package/dist/server/server/speech/speech-provider.d.ts +59 -0
- package/dist/server/server/speech/speech-provider.d.ts.map +1 -0
- package/dist/server/server/speech/speech-provider.js +2 -0
- package/dist/server/server/speech/speech-provider.js.map +1 -0
- package/dist/server/server/speech/speech-runtime.d.ts +20 -0
- package/dist/server/server/speech/speech-runtime.d.ts.map +1 -0
- package/dist/server/server/speech/speech-runtime.js +119 -0
- package/dist/server/server/speech/speech-runtime.js.map +1 -0
- package/dist/server/server/speech/speech-types.d.ts +20 -0
- package/dist/server/server/speech/speech-types.d.ts.map +1 -0
- package/dist/server/server/speech/speech-types.js +7 -0
- package/dist/server/server/speech/speech-types.js.map +1 -0
- package/dist/server/server/terminal-mcp/index.d.ts +4 -0
- package/dist/server/server/terminal-mcp/index.d.ts.map +1 -0
- package/dist/server/server/terminal-mcp/index.js +3 -0
- package/dist/server/server/terminal-mcp/index.js.map +1 -0
- package/dist/server/server/terminal-mcp/server.d.ts +10 -0
- package/dist/server/server/terminal-mcp/server.d.ts.map +1 -0
- package/dist/server/server/terminal-mcp/server.js +217 -0
- package/dist/server/server/terminal-mcp/server.js.map +1 -0
- package/dist/server/server/terminal-mcp/terminal-manager.d.ts +123 -0
- package/dist/server/server/terminal-mcp/terminal-manager.d.ts.map +1 -0
- package/dist/server/server/terminal-mcp/terminal-manager.js +351 -0
- package/dist/server/server/terminal-mcp/terminal-manager.js.map +1 -0
- package/dist/server/server/terminal-mcp/tmux.d.ts +207 -0
- package/dist/server/server/terminal-mcp/tmux.d.ts.map +1 -0
- package/dist/server/server/terminal-mcp/tmux.js +924 -0
- package/dist/server/server/terminal-mcp/tmux.js.map +1 -0
- package/dist/server/server/types.d.ts +5 -0
- package/dist/server/server/types.d.ts.map +1 -0
- package/dist/server/server/types.js +3 -0
- package/dist/server/server/types.js.map +1 -0
- package/dist/server/server/utils/diff-highlighter.d.ts +52 -0
- package/dist/server/server/utils/diff-highlighter.d.ts.map +1 -0
- package/dist/server/server/utils/diff-highlighter.js +244 -0
- package/dist/server/server/utils/diff-highlighter.js.map +1 -0
- package/dist/server/server/utils/syntax-highlighter.d.ts +10 -0
- package/dist/server/server/utils/syntax-highlighter.d.ts.map +1 -0
- package/dist/server/server/utils/syntax-highlighter.js +141 -0
- package/dist/server/server/utils/syntax-highlighter.js.map +1 -0
- package/dist/server/server/voice-config.d.ts +14 -0
- package/dist/server/server/voice-config.d.ts.map +1 -0
- package/dist/server/server/voice-config.js +51 -0
- package/dist/server/server/voice-config.js.map +1 -0
- package/dist/server/server/voice-mcp-bridge-command.d.ts +17 -0
- package/dist/server/server/voice-mcp-bridge-command.d.ts.map +1 -0
- package/dist/server/server/voice-mcp-bridge-command.js +31 -0
- package/dist/server/server/voice-mcp-bridge-command.js.map +1 -0
- package/dist/server/server/voice-mcp-bridge.d.ts +18 -0
- package/dist/server/server/voice-mcp-bridge.d.ts.map +1 -0
- package/dist/server/server/voice-mcp-bridge.js +109 -0
- package/dist/server/server/voice-mcp-bridge.js.map +1 -0
- package/dist/server/server/voice-permission-policy.d.ts +4 -0
- package/dist/server/server/voice-permission-policy.d.ts.map +1 -0
- package/dist/server/server/voice-permission-policy.js +13 -0
- package/dist/server/server/voice-permission-policy.js.map +1 -0
- package/dist/server/server/voice-types.d.ts +17 -0
- package/dist/server/server/voice-types.d.ts.map +1 -0
- package/dist/server/server/voice-types.js +2 -0
- package/dist/server/server/voice-types.js.map +1 -0
- package/dist/server/server/websocket-server.d.ts +80 -0
- package/dist/server/server/websocket-server.d.ts.map +1 -0
- package/dist/server/server/websocket-server.js +447 -0
- package/dist/server/server/websocket-server.js.map +1 -0
- package/dist/server/shared/agent-lifecycle.d.ts +3 -0
- package/dist/server/shared/agent-lifecycle.d.ts.map +1 -0
- package/dist/server/shared/agent-lifecycle.js +8 -0
- package/dist/server/shared/agent-lifecycle.js.map +1 -0
- package/dist/server/shared/connection-offer.d.ts +62 -0
- package/dist/server/shared/connection-offer.d.ts.map +1 -0
- package/dist/server/shared/connection-offer.js +17 -0
- package/dist/server/shared/connection-offer.js.map +1 -0
- package/dist/server/shared/daemon-endpoints.d.ts +19 -0
- package/dist/server/shared/daemon-endpoints.d.ts.map +1 -0
- package/dist/server/shared/daemon-endpoints.js +98 -0
- package/dist/server/shared/daemon-endpoints.js.map +1 -0
- package/dist/server/shared/messages.d.ts +36729 -0
- package/dist/server/shared/messages.d.ts.map +1 -0
- package/dist/server/shared/messages.js +1666 -0
- package/dist/server/shared/messages.js.map +1 -0
- package/dist/server/shared/path-utils.d.ts +2 -0
- package/dist/server/shared/path-utils.d.ts.map +1 -0
- package/dist/server/shared/path-utils.js +16 -0
- package/dist/server/shared/path-utils.js.map +1 -0
- package/dist/server/shared/tool-call-display.d.ts +11 -0
- package/dist/server/shared/tool-call-display.d.ts.map +1 -0
- package/dist/server/shared/tool-call-display.js +82 -0
- package/dist/server/shared/tool-call-display.js.map +1 -0
- package/dist/server/terminal/terminal-manager.d.ts +14 -0
- package/dist/server/terminal/terminal-manager.d.ts.map +1 -0
- package/dist/server/terminal/terminal-manager.js +67 -0
- package/dist/server/terminal/terminal-manager.js.map +1 -0
- package/dist/server/terminal/terminal.d.ts +67 -0
- package/dist/server/terminal/terminal.d.ts.map +1 -0
- package/dist/server/terminal/terminal.js +190 -0
- package/dist/server/terminal/terminal.js.map +1 -0
- package/dist/server/utils/checkout-git.d.ts +138 -0
- package/dist/server/utils/checkout-git.d.ts.map +1 -0
- package/dist/server/utils/checkout-git.js +1079 -0
- package/dist/server/utils/checkout-git.js.map +1 -0
- package/dist/server/utils/path.d.ts +5 -0
- package/dist/server/utils/path.d.ts.map +1 -0
- package/dist/server/utils/path.js +15 -0
- package/dist/server/utils/path.js.map +1 -0
- package/dist/server/utils/project-icon.d.ts +39 -0
- package/dist/server/utils/project-icon.d.ts.map +1 -0
- package/dist/server/utils/project-icon.js +391 -0
- package/dist/server/utils/project-icon.js.map +1 -0
- package/dist/server/utils/worktree-metadata.d.ts +21 -0
- package/dist/server/utils/worktree-metadata.d.ts.map +1 -0
- package/dist/server/utils/worktree-metadata.js +74 -0
- package/dist/server/utils/worktree-metadata.js.map +1 -0
- package/dist/server/utils/worktree.d.ts +95 -0
- package/dist/server/utils/worktree.d.ts.map +1 -0
- package/dist/server/utils/worktree.js +568 -0
- package/dist/server/utils/worktree.js.map +1 -0
- package/package.json +108 -0
|
@@ -0,0 +1,22 @@
|
|
|
1
|
+
import type pino from "pino";
|
|
2
|
+
import type { LogprobToken, SpeechToTextProvider, StreamingTranscriptionSession, TranscriptionResult } from "../../speech-provider.js";
|
|
3
|
+
export type { LogprobToken, TranscriptionResult };
|
|
4
|
+
export interface STTConfig {
|
|
5
|
+
apiKey: string;
|
|
6
|
+
model?: "whisper-1" | "gpt-4o-transcribe" | "gpt-4o-mini-transcribe" | (string & {});
|
|
7
|
+
confidenceThreshold?: number;
|
|
8
|
+
}
|
|
9
|
+
export declare class OpenAISTT implements SpeechToTextProvider {
|
|
10
|
+
private readonly openaiClient;
|
|
11
|
+
private readonly config;
|
|
12
|
+
private readonly logger;
|
|
13
|
+
readonly id: "openai";
|
|
14
|
+
constructor(sttConfig: STTConfig, parentLogger: pino.Logger);
|
|
15
|
+
createSession(params: {
|
|
16
|
+
logger: pino.Logger;
|
|
17
|
+
language?: string;
|
|
18
|
+
prompt?: string;
|
|
19
|
+
}): StreamingTranscriptionSession;
|
|
20
|
+
private transcribeAudioInternal;
|
|
21
|
+
}
|
|
22
|
+
//# sourceMappingURL=stt.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"stt.d.ts","sourceRoot":"","sources":["../../../../../../src/server/speech/providers/openai/stt.ts"],"names":[],"mappings":"AACA,OAAO,KAAK,IAAI,MAAM,MAAM,CAAC;AAO7B,OAAO,KAAK,EACV,YAAY,EACZ,oBAAoB,EACpB,6BAA6B,EAC7B,mBAAmB,EACpB,MAAM,0BAA0B,CAAC;AAElC,YAAY,EAAE,YAAY,EAAE,mBAAmB,EAAE,CAAC;AAElD,MAAM,WAAW,SAAS;IACxB,MAAM,EAAE,MAAM,CAAC;IACf,KAAK,CAAC,EAAE,WAAW,GAAG,mBAAmB,GAAG,wBAAwB,GAAG,CAAC,MAAM,GAAG,EAAE,CAAC,CAAC;IACrF,mBAAmB,CAAC,EAAE,MAAM,CAAC;CAC9B;AA0BD,qBAAa,SAAU,YAAW,oBAAoB;IACpD,OAAO,CAAC,QAAQ,CAAC,YAAY,CAAS;IACtC,OAAO,CAAC,QAAQ,CAAC,MAAM,CAAY;IACnC,OAAO,CAAC,QAAQ,CAAC,MAAM,CAAc;IACrC,SAAgB,EAAE,EAAG,QAAQ,CAAU;gBAE3B,SAAS,EAAE,SAAS,EAAE,YAAY,EAAE,IAAI,CAAC,MAAM;IASpD,aAAa,CAAC,MAAM,EAAE;QAC3B,MAAM,EAAE,IAAI,CAAC,MAAM,CAAC;QACpB,QAAQ,CAAC,EAAE,MAAM,CAAC;QAClB,MAAM,CAAC,EAAE,MAAM,CAAC;KACjB,GAAG,6BAA6B;YAkHnB,uBAAuB;CAwFtC"}
|
|
@@ -0,0 +1,208 @@
|
|
|
1
|
+
import { EventEmitter } from "node:events";
|
|
2
|
+
import OpenAI from "openai";
|
|
3
|
+
import { writeFile, unlink } from "fs/promises";
|
|
4
|
+
import { join } from "path";
|
|
5
|
+
import { tmpdir } from "os";
|
|
6
|
+
import { v4 } from "uuid";
|
|
7
|
+
import { inferAudioExtension } from "../../../agent/audio-utils.js";
|
|
8
|
+
function isObject(value) {
|
|
9
|
+
return typeof value === "object" && value !== null;
|
|
10
|
+
}
|
|
11
|
+
function isLogprobToken(value) {
|
|
12
|
+
if (!isObject(value)) {
|
|
13
|
+
return false;
|
|
14
|
+
}
|
|
15
|
+
if (typeof value.token !== "string") {
|
|
16
|
+
return false;
|
|
17
|
+
}
|
|
18
|
+
if (typeof value.logprob !== "number") {
|
|
19
|
+
return false;
|
|
20
|
+
}
|
|
21
|
+
if (value.bytes === undefined) {
|
|
22
|
+
return true;
|
|
23
|
+
}
|
|
24
|
+
return Array.isArray(value.bytes) && value.bytes.every((entry) => typeof entry === "number");
|
|
25
|
+
}
|
|
26
|
+
function isLogprobTokenArray(value) {
|
|
27
|
+
return Array.isArray(value) && value.every((entry) => isLogprobToken(entry));
|
|
28
|
+
}
|
|
29
|
+
export class OpenAISTT {
|
|
30
|
+
constructor(sttConfig, parentLogger) {
|
|
31
|
+
this.id = "openai";
|
|
32
|
+
this.config = sttConfig;
|
|
33
|
+
this.logger = parentLogger.child({ module: "agent", provider: "openai", component: "stt" });
|
|
34
|
+
this.openaiClient = new OpenAI({
|
|
35
|
+
apiKey: sttConfig.apiKey,
|
|
36
|
+
});
|
|
37
|
+
this.logger.info({ model: sttConfig.model || "whisper-1" }, "STT (OpenAI Whisper) initialized");
|
|
38
|
+
}
|
|
39
|
+
createSession(params) {
|
|
40
|
+
const emitter = new EventEmitter();
|
|
41
|
+
const logger = params.logger.child({ provider: "openai", component: "stt-session" });
|
|
42
|
+
const requiredSampleRate = 24000;
|
|
43
|
+
let connected = false;
|
|
44
|
+
let segmentId = v4();
|
|
45
|
+
let previousSegmentId = null;
|
|
46
|
+
let pcm16 = Buffer.alloc(0);
|
|
47
|
+
const transcribeAudio = this.transcribeAudioInternal.bind(this);
|
|
48
|
+
const convertPCMToWavBuffer = (pcmBuffer) => {
|
|
49
|
+
const headerSize = 44;
|
|
50
|
+
const channels = 1;
|
|
51
|
+
const bitsPerSample = 16;
|
|
52
|
+
const sampleRate = requiredSampleRate;
|
|
53
|
+
const wavBuffer = Buffer.alloc(headerSize + pcmBuffer.length);
|
|
54
|
+
const byteRate = (sampleRate * channels * bitsPerSample) / 8;
|
|
55
|
+
const blockAlign = (channels * bitsPerSample) / 8;
|
|
56
|
+
wavBuffer.write("RIFF", 0);
|
|
57
|
+
wavBuffer.writeUInt32LE(36 + pcmBuffer.length, 4);
|
|
58
|
+
wavBuffer.write("WAVE", 8);
|
|
59
|
+
wavBuffer.write("fmt ", 12);
|
|
60
|
+
wavBuffer.writeUInt32LE(16, 16);
|
|
61
|
+
wavBuffer.writeUInt16LE(1, 20);
|
|
62
|
+
wavBuffer.writeUInt16LE(channels, 22);
|
|
63
|
+
wavBuffer.writeUInt32LE(sampleRate, 24);
|
|
64
|
+
wavBuffer.writeUInt32LE(byteRate, 28);
|
|
65
|
+
wavBuffer.writeUInt16LE(blockAlign, 32);
|
|
66
|
+
wavBuffer.writeUInt16LE(bitsPerSample, 34);
|
|
67
|
+
wavBuffer.write("data", 36);
|
|
68
|
+
wavBuffer.writeUInt32LE(pcmBuffer.length, 40);
|
|
69
|
+
pcmBuffer.copy(wavBuffer, 44);
|
|
70
|
+
return wavBuffer;
|
|
71
|
+
};
|
|
72
|
+
return {
|
|
73
|
+
requiredSampleRate,
|
|
74
|
+
async connect() {
|
|
75
|
+
connected = true;
|
|
76
|
+
},
|
|
77
|
+
appendPcm16(chunk) {
|
|
78
|
+
if (!connected) {
|
|
79
|
+
emitter.emit("error", new Error("STT session not connected"));
|
|
80
|
+
return;
|
|
81
|
+
}
|
|
82
|
+
pcm16 = pcm16.length === 0 ? chunk : Buffer.concat([pcm16, chunk]);
|
|
83
|
+
},
|
|
84
|
+
commit() {
|
|
85
|
+
if (!connected) {
|
|
86
|
+
emitter.emit("error", new Error("STT session not connected"));
|
|
87
|
+
return;
|
|
88
|
+
}
|
|
89
|
+
const committedId = segmentId;
|
|
90
|
+
const prev = previousSegmentId;
|
|
91
|
+
emitter.emit("committed", { segmentId: committedId, previousSegmentId: prev });
|
|
92
|
+
void (async () => {
|
|
93
|
+
try {
|
|
94
|
+
if (pcm16.length === 0) {
|
|
95
|
+
emitter.emit("transcript", {
|
|
96
|
+
segmentId: committedId,
|
|
97
|
+
transcript: "",
|
|
98
|
+
isFinal: true,
|
|
99
|
+
language: params.language,
|
|
100
|
+
isLowConfidence: true,
|
|
101
|
+
});
|
|
102
|
+
return;
|
|
103
|
+
}
|
|
104
|
+
const wav = convertPCMToWavBuffer(pcm16);
|
|
105
|
+
const result = await transcribeAudio(wav, "audio/wav", params.language ?? "en", logger);
|
|
106
|
+
emitter.emit("transcript", {
|
|
107
|
+
segmentId: committedId,
|
|
108
|
+
transcript: result.text,
|
|
109
|
+
isFinal: true,
|
|
110
|
+
language: result.language,
|
|
111
|
+
logprobs: result.logprobs,
|
|
112
|
+
avgLogprob: result.avgLogprob,
|
|
113
|
+
isLowConfidence: result.isLowConfidence,
|
|
114
|
+
});
|
|
115
|
+
}
|
|
116
|
+
catch (err) {
|
|
117
|
+
emitter.emit("error", err);
|
|
118
|
+
}
|
|
119
|
+
finally {
|
|
120
|
+
previousSegmentId = committedId;
|
|
121
|
+
segmentId = v4();
|
|
122
|
+
pcm16 = Buffer.alloc(0);
|
|
123
|
+
}
|
|
124
|
+
})();
|
|
125
|
+
},
|
|
126
|
+
clear() {
|
|
127
|
+
pcm16 = Buffer.alloc(0);
|
|
128
|
+
segmentId = v4();
|
|
129
|
+
},
|
|
130
|
+
close() {
|
|
131
|
+
connected = false;
|
|
132
|
+
pcm16 = Buffer.alloc(0);
|
|
133
|
+
},
|
|
134
|
+
on(event, handler) {
|
|
135
|
+
emitter.on(event, handler);
|
|
136
|
+
return undefined;
|
|
137
|
+
},
|
|
138
|
+
};
|
|
139
|
+
}
|
|
140
|
+
async transcribeAudioInternal(audioBuffer, format, language, logger) {
|
|
141
|
+
const startTime = Date.now();
|
|
142
|
+
let tempFilePath = null;
|
|
143
|
+
try {
|
|
144
|
+
const ext = inferAudioExtension(format);
|
|
145
|
+
tempFilePath = join(tmpdir(), `audio-${v4()}.${ext}`);
|
|
146
|
+
await writeFile(tempFilePath, audioBuffer);
|
|
147
|
+
logger.debug({ tempFilePath, bytes: audioBuffer.length }, "Transcribing audio file");
|
|
148
|
+
const modelToUse = this.config.model ?? "whisper-1";
|
|
149
|
+
const supportsLogprobs = modelToUse === "gpt-4o-transcribe" || modelToUse === "gpt-4o-mini-transcribe";
|
|
150
|
+
const includeLogprobs = ["logprobs"];
|
|
151
|
+
const response = await this.openaiClient.audio.transcriptions.create({
|
|
152
|
+
file: await import("fs").then((fs) => fs.createReadStream(tempFilePath)),
|
|
153
|
+
language,
|
|
154
|
+
model: modelToUse,
|
|
155
|
+
...(supportsLogprobs ? { include: includeLogprobs } : {}),
|
|
156
|
+
response_format: "json",
|
|
157
|
+
});
|
|
158
|
+
const duration = Date.now() - startTime;
|
|
159
|
+
const confidenceThreshold = this.config.confidenceThreshold ?? -3.0;
|
|
160
|
+
let avgLogprob;
|
|
161
|
+
let isLowConfidence = false;
|
|
162
|
+
const logprobs = supportsLogprobs &&
|
|
163
|
+
isObject(response) &&
|
|
164
|
+
isLogprobTokenArray(response.logprobs)
|
|
165
|
+
? response.logprobs
|
|
166
|
+
: undefined;
|
|
167
|
+
if (logprobs && logprobs.length > 0) {
|
|
168
|
+
const totalLogprob = logprobs.reduce((sum, token) => sum + token.logprob, 0);
|
|
169
|
+
avgLogprob = totalLogprob / logprobs.length;
|
|
170
|
+
isLowConfidence = avgLogprob < confidenceThreshold;
|
|
171
|
+
if (isLowConfidence) {
|
|
172
|
+
logger.debug({
|
|
173
|
+
avgLogprob,
|
|
174
|
+
threshold: confidenceThreshold,
|
|
175
|
+
text: response.text,
|
|
176
|
+
tokenLogprobs: logprobs.map((t) => `${t.token}:${t.logprob.toFixed(2)}`).join(", "),
|
|
177
|
+
}, "Low confidence transcription detected");
|
|
178
|
+
}
|
|
179
|
+
}
|
|
180
|
+
logger.debug({ duration, text: response.text, avgLogprob }, "Transcription complete");
|
|
181
|
+
return {
|
|
182
|
+
text: response.text,
|
|
183
|
+
duration: duration,
|
|
184
|
+
logprobs: logprobs,
|
|
185
|
+
avgLogprob: avgLogprob,
|
|
186
|
+
isLowConfidence: isLowConfidence,
|
|
187
|
+
language: isObject(response) && typeof response.language === "string"
|
|
188
|
+
? response.language
|
|
189
|
+
: undefined,
|
|
190
|
+
};
|
|
191
|
+
}
|
|
192
|
+
catch (error) {
|
|
193
|
+
logger.error({ err: error }, "Transcription error");
|
|
194
|
+
throw new Error(`STT transcription failed: ${error.message}`);
|
|
195
|
+
}
|
|
196
|
+
finally {
|
|
197
|
+
if (tempFilePath) {
|
|
198
|
+
try {
|
|
199
|
+
await unlink(tempFilePath);
|
|
200
|
+
}
|
|
201
|
+
catch (cleanupError) {
|
|
202
|
+
logger.warn({ tempFilePath }, "Failed to clean up temp file");
|
|
203
|
+
}
|
|
204
|
+
}
|
|
205
|
+
}
|
|
206
|
+
}
|
|
207
|
+
}
|
|
208
|
+
//# sourceMappingURL=stt.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"stt.js","sourceRoot":"","sources":["../../../../../../src/server/speech/providers/openai/stt.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,YAAY,EAAE,MAAM,aAAa,CAAC;AAE3C,OAAO,MAAM,MAAM,QAAQ,CAAC;AAC5B,OAAO,EAAE,SAAS,EAAE,MAAM,EAAE,MAAM,aAAa,CAAC;AAChD,OAAO,EAAE,IAAI,EAAE,MAAM,MAAM,CAAC;AAC5B,OAAO,EAAE,MAAM,EAAE,MAAM,IAAI,CAAC;AAC5B,OAAO,EAAE,EAAE,EAAE,MAAM,MAAM,CAAC;AAC1B,OAAO,EAAE,mBAAmB,EAAE,MAAM,+BAA+B,CAAC;AAgBpE,SAAS,QAAQ,CAAC,KAAc;IAC9B,OAAO,OAAO,KAAK,KAAK,QAAQ,IAAI,KAAK,KAAK,IAAI,CAAC;AACrD,CAAC;AAED,SAAS,cAAc,CAAC,KAAc;IACpC,IAAI,CAAC,QAAQ,CAAC,KAAK,CAAC,EAAE,CAAC;QACrB,OAAO,KAAK,CAAC;IACf,CAAC;IACD,IAAI,OAAO,KAAK,CAAC,KAAK,KAAK,QAAQ,EAAE,CAAC;QACpC,OAAO,KAAK,CAAC;IACf,CAAC;IACD,IAAI,OAAO,KAAK,CAAC,OAAO,KAAK,QAAQ,EAAE,CAAC;QACtC,OAAO,KAAK,CAAC;IACf,CAAC;IACD,IAAI,KAAK,CAAC,KAAK,KAAK,SAAS,EAAE,CAAC;QAC9B,OAAO,IAAI,CAAC;IACd,CAAC;IACD,OAAO,KAAK,CAAC,OAAO,CAAC,KAAK,CAAC,KAAK,CAAC,IAAI,KAAK,CAAC,KAAK,CAAC,KAAK,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,OAAO,KAAK,KAAK,QAAQ,CAAC,CAAC;AAC/F,CAAC;AAED,SAAS,mBAAmB,CAAC,KAAc;IACzC,OAAO,KAAK,CAAC,OAAO,CAAC,KAAK,CAAC,IAAI,KAAK,CAAC,KAAK,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,cAAc,CAAC,KAAK,CAAC,CAAC,CAAC;AAC/E,CAAC;AAED,MAAM,OAAO,SAAS;IAMpB,YAAY,SAAoB,EAAE,YAAyB;QAF3C,OAAE,GAAG,QAAiB,CAAC;QAGrC,IAAI,CAAC,MAAM,GAAG,SAAS,CAAC;QACxB,IAAI,CAAC,MAAM,GAAG,YAAY,CAAC,KAAK,CAAC,EAAE,MAAM,EAAE,OAAO,EAAE,QAAQ,EAAE,QAAQ,EAAE,SAAS,EAAE,KAAK,EAAE,CAAC,CAAC;QAC5F,IAAI,CAAC,YAAY,GAAG,IAAI,MAAM,CAAC;YAC7B,MAAM,EAAE,SAAS,CAAC,MAAM;SACzB,CAAC,CAAC;QACH,IAAI,CAAC,MAAM,CAAC,IAAI,CAAC,EAAE,KAAK,EAAE,SAAS,CAAC,KAAK,IAAI,WAAW,EAAE,EAAE,kCAAkC,CAAC,CAAC;IAClG,CAAC;IAEM,aAAa,CAAC,MAIpB;QACC,MAAM,OAAO,GAAG,IAAI,YAAY,EAAE,CAAC;QACnC,MAAM,MAAM,GAAG,MAAM,CAAC,MAAM,CAAC,KAAK,CAAC,EAAE,QAAQ,EAAE,QAAQ,EAAE,SAAS,EAAE,aAAa,EAAE,CAAC,CAAC;QACrF,MAAM,kBAAkB,GAAG,KAAK,CAAC;QAEjC,IAAI,SAAS,GAAG,KAAK,CAAC;QACtB,IAAI,SAAS,GAAG,EAAE,EAAE,CAAC;QACrB,IAAI,iBAAiB,GAAkB,IAAI,CAAC;QAC5C,IAAI,KAAK,GAAW,MAAM,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC;QACpC,MAAM,eAAe,GAAG,IAAI,CAAC,uBAAuB,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;QAEhE,MAAM,qBAAqB,GAAG,CAAC,SAAiB,EAAU,EAAE;YAC1D,MAAM,UAAU,GAAG,EAAE,CAAC;YACtB,MAAM,QAAQ,GAAG,CAAC,CAAC;YACnB,MAAM,aAAa,GAAG,EAAE,CAAC;YACzB,MAAM,UAAU,GAAG,kBAAkB,CAAC;YACtC,MAAM,SAAS,GAAG,MAAM,CAAC,KAAK,CAAC,UAAU,GAAG,SAAS,CAAC,MAAM,CAAC,CAAC;YAC9D,MAAM,QAAQ,GAAG,CAAC,UAAU,GAAG,QAAQ,GAAG,aAAa,CAAC,GAAG,CAAC,CAAC;YAC7D,MAAM,UAAU,GAAG,CAAC,QAAQ,GAAG,aAAa,CAAC,GAAG,CAAC,CAAC;YAElD,SAAS,CAAC,KAAK,CAAC,MAAM,EAAE,CAAC,CAAC,CAAC;YAC3B,SAAS,CAAC,aAAa,CAAC,EAAE,GAAG,SAAS,CAAC,MAAM,EAAE,CAAC,CAAC,CAAC;YAClD,SAAS,CAAC,KAAK,CAAC,MAAM,EAAE,CAAC,CAAC,CAAC;YAC3B,SAAS,CAAC,KAAK,CAAC,MAAM,EAAE,EAAE,CAAC,CAAC;YAC5B,SAAS,CAAC,aAAa,CAAC,EAAE,EAAE,EAAE,CAAC,CAAC;YAChC,SAAS,CAAC,aAAa,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC;YAC/B,SAAS,CAAC,aAAa,CAAC,QAAQ,EAAE,EAAE,CAAC,CAAC;YACtC,SAAS,CAAC,aAAa,CAAC,UAAU,EAAE,EAAE,CAAC,CAAC;YACxC,SAAS,CAAC,aAAa,CAAC,QAAQ,EAAE,EAAE,CAAC,CAAC;YACtC,SAAS,CAAC,aAAa,CAAC,UAAU,EAAE,EAAE,CAAC,CAAC;YACxC,SAAS,CAAC,aAAa,CAAC,aAAa,EAAE,EAAE,CAAC,CAAC;YAC3C,SAAS,CAAC,KAAK,CAAC,MAAM,EAAE,EAAE,CAAC,CAAC;YAC5B,SAAS,CAAC,aAAa,CAAC,SAAS,CAAC,MAAM,EAAE,EAAE,CAAC,CAAC;YAC9C,SAAS,CAAC,IAAI,CAAC,SAAS,EAAE,EAAE,CAAC,CAAC;YAE9B,OAAO,SAAS,CAAC;QACnB,CAAC,CAAC;QAEF,OAAO;YACL,kBAAkB;YAClB,KAAK,CAAC,OAAO;gBACX,SAAS,GAAG,IAAI,CAAC;YACnB,CAAC;YACD,WAAW,CAAC,KAAa;gBACvB,IAAI,CAAC,SAAS,EAAE,CAAC;oBACd,OAAe,CAAC,IAAI,CAAC,OAAO,EAAE,IAAI,KAAK,CAAC,2BAA2B,CAAC,CAAC,CAAC;oBACvE,OAAO;gBACT,CAAC;gBACD,KAAK,GAAG,KAAK,CAAC,MAAM,KAAK,CAAC,CAAC,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC,MAAM,CAAC,MAAM,CAAC,CAAC,KAAK,EAAE,KAAK,CAAC,CAAC,CAAC;YACrE,CAAC;YACD,MAAM;gBACJ,IAAI,CAAC,SAAS,EAAE,CAAC;oBACd,OAAe,CAAC,IAAI,CAAC,OAAO,EAAE,IAAI,KAAK,CAAC,2BAA2B,CAAC,CAAC,CAAC;oBACvE,OAAO;gBACT,CAAC;gBAED,MAAM,WAAW,GAAG,SAAS,CAAC;gBAC9B,MAAM,IAAI,GAAG,iBAAiB,CAAC;gBAC9B,OAAe,CAAC,IAAI,CAAC,WAAW,EAAE,EAAE,SAAS,EAAE,WAAW,EAAE,iBAAiB,EAAE,IAAI,EAAE,CAAC,CAAC;gBAExF,KAAK,CAAC,KAAK,IAAI,EAAE;oBACf,IAAI,CAAC;wBACH,IAAI,KAAK,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;4BACtB,OAAe,CAAC,IAAI,CAAC,YAAY,EAAE;gCAClC,SAAS,EAAE,WAAW;gCACtB,UAAU,EAAE,EAAE;gCACd,OAAO,EAAE,IAAI;gCACb,QAAQ,EAAE,MAAM,CAAC,QAAQ;gCACzB,eAAe,EAAE,IAAI;6BACtB,CAAC,CAAC;4BACH,OAAO;wBACT,CAAC;wBAED,MAAM,GAAG,GAAG,qBAAqB,CAAC,KAAK,CAAC,CAAC;wBACzC,MAAM,MAAM,GAAG,MAAM,eAAe,CAClC,GAAG,EACH,WAAW,EACX,MAAM,CAAC,QAAQ,IAAI,IAAI,EACvB,MAAM,CACP,CAAC;wBAED,OAAe,CAAC,IAAI,CAAC,YAAY,EAAE;4BAClC,SAAS,EAAE,WAAW;4BACtB,UAAU,EAAE,MAAM,CAAC,IAAI;4BACvB,OAAO,EAAE,IAAI;4BACb,QAAQ,EAAE,MAAM,CAAC,QAAQ;4BACzB,QAAQ,EAAE,MAAM,CAAC,QAAQ;4BACzB,UAAU,EAAE,MAAM,CAAC,UAAU;4BAC7B,eAAe,EAAE,MAAM,CAAC,eAAe;yBACxC,CAAC,CAAC;oBACL,CAAC;oBAAC,OAAO,GAAG,EAAE,CAAC;wBACZ,OAAe,CAAC,IAAI,CAAC,OAAO,EAAE,GAAG,CAAC,CAAC;oBACtC,CAAC;4BAAS,CAAC;wBACT,iBAAiB,GAAG,WAAW,CAAC;wBAChC,SAAS,GAAG,EAAE,EAAE,CAAC;wBACjB,KAAK,GAAG,MAAM,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC;oBAC1B,CAAC;gBACH,CAAC,CAAC,EAAE,CAAC;YACP,CAAC;YACD,KAAK;gBACH,KAAK,GAAG,MAAM,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC;gBACxB,SAAS,GAAG,EAAE,EAAE,CAAC;YACnB,CAAC;YACD,KAAK;gBACH,SAAS,GAAG,KAAK,CAAC;gBAClB,KAAK,GAAG,MAAM,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC;YAC1B,CAAC;YACD,EAAE,CAAC,KAAU,EAAE,OAAY;gBACzB,OAAO,CAAC,EAAE,CAAC,KAAK,EAAE,OAAO,CAAC,CAAC;gBAC3B,OAAO,SAAS,CAAC;YACnB,CAAC;SACF,CAAC;IACJ,CAAC;IAEO,KAAK,CAAC,uBAAuB,CACnC,WAAmB,EACnB,MAAc,EACd,QAAgB,EAChB,MAAmB;QAEnB,MAAM,SAAS,GAAG,IAAI,CAAC,GAAG,EAAE,CAAC;QAC7B,IAAI,YAAY,GAAkB,IAAI,CAAC;QAEvC,IAAI,CAAC;YACH,MAAM,GAAG,GAAG,mBAAmB,CAAC,MAAM,CAAC,CAAC;YACxC,YAAY,GAAG,IAAI,CAAC,MAAM,EAAE,EAAE,SAAS,EAAE,EAAE,IAAI,GAAG,EAAE,CAAC,CAAC;YACtD,MAAM,SAAS,CAAC,YAAY,EAAE,WAAW,CAAC,CAAC;YAE3C,MAAM,CAAC,KAAK,CACV,EAAE,YAAY,EAAE,KAAK,EAAE,WAAW,CAAC,MAAM,EAAE,EAC3C,yBAAyB,CAC1B,CAAC;YAEF,MAAM,UAAU,GAAG,IAAI,CAAC,MAAM,CAAC,KAAK,IAAI,WAAW,CAAC;YACpD,MAAM,gBAAgB,GACpB,UAAU,KAAK,mBAAmB,IAAI,UAAU,KAAK,wBAAwB,CAAC;YAChF,MAAM,eAAe,GAAiB,CAAC,UAAU,CAAC,CAAC;YAEnD,MAAM,QAAQ,GAAG,MAAM,IAAI,CAAC,YAAY,CAAC,KAAK,CAAC,cAAc,CAAC,MAAM,CAAC;gBACnE,IAAI,EAAE,MAAM,MAAM,CAAC,IAAI,CAAC,CAAC,IAAI,CAAC,CAAC,EAAE,EAAE,EAAE,CAAC,EAAE,CAAC,gBAAgB,CAAC,YAAa,CAAC,CAAC;gBACzE,QAAQ;gBACR,KAAK,EAAE,UAAU;gBACjB,GAAG,CAAC,gBAAgB,CAAC,CAAC,CAAC,EAAE,OAAO,EAAE,eAAe,EAAE,CAAC,CAAC,CAAC,EAAE,CAAC;gBACzD,eAAe,EAAE,MAAM;aACxB,CAAC,CAAC;YAEH,MAAM,QAAQ,GAAG,IAAI,CAAC,GAAG,EAAE,GAAG,SAAS,CAAC;YACxC,MAAM,mBAAmB,GAAG,IAAI,CAAC,MAAM,CAAC,mBAAmB,IAAI,CAAC,GAAG,CAAC;YAEpE,IAAI,UAA8B,CAAC;YACnC,IAAI,eAAe,GAAG,KAAK,CAAC;YAC5B,MAAM,QAAQ,GACZ,gBAAgB;gBAChB,QAAQ,CAAC,QAAQ,CAAC;gBAClB,mBAAmB,CAAC,QAAQ,CAAC,QAAQ,CAAC;gBACpC,CAAC,CAAC,QAAQ,CAAC,QAAQ;gBACnB,CAAC,CAAC,SAAS,CAAC;YAEhB,IAAI,QAAQ,IAAI,QAAQ,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;gBACpC,MAAM,YAAY,GAAG,QAAQ,CAAC,MAAM,CAAC,CAAC,GAAG,EAAE,KAAK,EAAE,EAAE,CAAC,GAAG,GAAG,KAAK,CAAC,OAAO,EAAE,CAAC,CAAC,CAAC;gBAC7E,UAAU,GAAG,YAAY,GAAG,QAAQ,CAAC,MAAM,CAAC;gBAC5C,eAAe,GAAG,UAAU,GAAG,mBAAmB,CAAC;gBAEnD,IAAI,eAAe,EAAE,CAAC;oBACpB,MAAM,CAAC,KAAK,CACV;wBACE,UAAU;wBACV,SAAS,EAAE,mBAAmB;wBAC9B,IAAI,EAAE,QAAQ,CAAC,IAAI;wBACnB,aAAa,EAAE,QAAQ,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,GAAG,CAAC,CAAC,KAAK,IAAI,CAAC,CAAC,OAAO,CAAC,OAAO,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,IAAI,CAAC,IAAI,CAAC;qBACpF,EACD,uCAAuC,CACxC,CAAC;gBACJ,CAAC;YACH,CAAC;YAED,MAAM,CAAC,KAAK,CAAC,EAAE,QAAQ,EAAE,IAAI,EAAE,QAAQ,CAAC,IAAI,EAAE,UAAU,EAAE,EAAE,wBAAwB,CAAC,CAAC;YAEtF,OAAO;gBACL,IAAI,EAAE,QAAQ,CAAC,IAAI;gBACnB,QAAQ,EAAE,QAAQ;gBAClB,QAAQ,EAAE,QAAQ;gBAClB,UAAU,EAAE,UAAU;gBACtB,eAAe,EAAE,eAAe;gBAChC,QAAQ,EACN,QAAQ,CAAC,QAAQ,CAAC,IAAI,OAAO,QAAQ,CAAC,QAAQ,KAAK,QAAQ;oBACzD,CAAC,CAAC,QAAQ,CAAC,QAAQ;oBACnB,CAAC,CAAC,SAAS;aAChB,CAAC;QACJ,CAAC;QAAC,OAAO,KAAU,EAAE,CAAC;YACpB,MAAM,CAAC,KAAK,CAAC,EAAE,GAAG,EAAE,KAAK,EAAE,EAAE,qBAAqB,CAAC,CAAC;YACpD,MAAM,IAAI,KAAK,CAAC,6BAA6B,KAAK,CAAC,OAAO,EAAE,CAAC,CAAC;QAChE,CAAC;gBAAS,CAAC;YACT,IAAI,YAAY,EAAE,CAAC;gBACjB,IAAI,CAAC;oBACH,MAAM,MAAM,CAAC,YAAY,CAAC,CAAC;gBAC7B,CAAC;gBAAC,OAAO,YAAY,EAAE,CAAC;oBACtB,MAAM,CAAC,IAAI,CAAC,EAAE,YAAY,EAAE,EAAE,8BAA8B,CAAC,CAAC;gBAChE,CAAC;YACH,CAAC;QACH,CAAC;IACH,CAAC;CACF"}
|
|
@@ -0,0 +1,18 @@
|
|
|
1
|
+
import type pino from "pino";
|
|
2
|
+
import type { SpeechStreamResult, TextToSpeechProvider } from "../../speech-provider.js";
|
|
3
|
+
export type { SpeechStreamResult };
|
|
4
|
+
export interface TTSConfig {
|
|
5
|
+
apiKey: string;
|
|
6
|
+
model?: "tts-1" | "tts-1-hd";
|
|
7
|
+
voice?: "alloy" | "echo" | "fable" | "onyx" | "nova" | "shimmer";
|
|
8
|
+
responseFormat?: "mp3" | "opus" | "aac" | "flac" | "wav" | "pcm";
|
|
9
|
+
}
|
|
10
|
+
export declare class OpenAITTS implements TextToSpeechProvider {
|
|
11
|
+
private readonly openaiClient;
|
|
12
|
+
private readonly config;
|
|
13
|
+
private readonly logger;
|
|
14
|
+
constructor(ttsConfig: TTSConfig, parentLogger: pino.Logger);
|
|
15
|
+
getConfig(): TTSConfig;
|
|
16
|
+
synthesizeSpeech(text: string): Promise<SpeechStreamResult>;
|
|
17
|
+
}
|
|
18
|
+
//# sourceMappingURL=tts.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"tts.d.ts","sourceRoot":"","sources":["../../../../../../src/server/speech/providers/openai/tts.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,IAAI,MAAM,MAAM,CAAC;AAG7B,OAAO,KAAK,EAAE,kBAAkB,EAAE,oBAAoB,EAAE,MAAM,0BAA0B,CAAC;AAEzF,YAAY,EAAE,kBAAkB,EAAE,CAAC;AAEnC,MAAM,WAAW,SAAS;IACxB,MAAM,EAAE,MAAM,CAAC;IACf,KAAK,CAAC,EAAE,OAAO,GAAG,UAAU,CAAC;IAC7B,KAAK,CAAC,EAAE,OAAO,GAAG,MAAM,GAAG,OAAO,GAAG,MAAM,GAAG,MAAM,GAAG,SAAS,CAAC;IACjE,cAAc,CAAC,EAAE,KAAK,GAAG,MAAM,GAAG,KAAK,GAAG,MAAM,GAAG,KAAK,GAAG,KAAK,CAAC;CAClE;AAED,qBAAa,SAAU,YAAW,oBAAoB;IACpD,OAAO,CAAC,QAAQ,CAAC,YAAY,CAAS;IACtC,OAAO,CAAC,QAAQ,CAAC,MAAM,CAAY;IACnC,OAAO,CAAC,QAAQ,CAAC,MAAM,CAAc;gBAEzB,SAAS,EAAE,SAAS,EAAE,YAAY,EAAE,IAAI,CAAC,MAAM;IAkBpD,SAAS,IAAI,SAAS;IAIhB,gBAAgB,CAAC,IAAI,EAAE,MAAM,GAAG,OAAO,CAAC,kBAAkB,CAAC;CAkCzE"}
|
|
@@ -0,0 +1,46 @@
|
|
|
1
|
+
import OpenAI from "openai";
|
|
2
|
+
export class OpenAITTS {
|
|
3
|
+
constructor(ttsConfig, parentLogger) {
|
|
4
|
+
this.config = {
|
|
5
|
+
model: "tts-1",
|
|
6
|
+
voice: "alloy",
|
|
7
|
+
responseFormat: "pcm",
|
|
8
|
+
...ttsConfig,
|
|
9
|
+
};
|
|
10
|
+
this.logger = parentLogger.child({ module: "agent", provider: "openai", component: "tts" });
|
|
11
|
+
this.openaiClient = new OpenAI({
|
|
12
|
+
apiKey: ttsConfig.apiKey,
|
|
13
|
+
});
|
|
14
|
+
this.logger.info({ voice: this.config.voice, model: this.config.model, format: this.config.responseFormat }, "TTS (OpenAI) initialized");
|
|
15
|
+
}
|
|
16
|
+
getConfig() {
|
|
17
|
+
return this.config;
|
|
18
|
+
}
|
|
19
|
+
async synthesizeSpeech(text) {
|
|
20
|
+
if (!text || text.trim().length === 0) {
|
|
21
|
+
throw new Error("Cannot synthesize empty text");
|
|
22
|
+
}
|
|
23
|
+
const startTime = Date.now();
|
|
24
|
+
try {
|
|
25
|
+
this.logger.debug({ textLength: text.length, preview: text.substring(0, 50) }, "Synthesizing speech");
|
|
26
|
+
const response = await this.openaiClient.audio.speech.create({
|
|
27
|
+
model: this.config.model,
|
|
28
|
+
voice: this.config.voice,
|
|
29
|
+
input: text,
|
|
30
|
+
response_format: this.config.responseFormat,
|
|
31
|
+
});
|
|
32
|
+
const audioStream = response.body;
|
|
33
|
+
const duration = Date.now() - startTime;
|
|
34
|
+
this.logger.debug({ duration }, "Speech synthesis stream ready");
|
|
35
|
+
return {
|
|
36
|
+
stream: audioStream,
|
|
37
|
+
format: this.config.responseFormat || "mp3",
|
|
38
|
+
};
|
|
39
|
+
}
|
|
40
|
+
catch (error) {
|
|
41
|
+
this.logger.error({ err: error }, "Speech synthesis error");
|
|
42
|
+
throw new Error(`TTS synthesis failed: ${error.message}`);
|
|
43
|
+
}
|
|
44
|
+
}
|
|
45
|
+
}
|
|
46
|
+
//# sourceMappingURL=tts.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"tts.js","sourceRoot":"","sources":["../../../../../../src/server/speech/providers/openai/tts.ts"],"names":[],"mappings":"AACA,OAAO,MAAM,MAAM,QAAQ,CAAC;AAa5B,MAAM,OAAO,SAAS;IAKpB,YAAY,SAAoB,EAAE,YAAyB;QACzD,IAAI,CAAC,MAAM,GAAG;YACZ,KAAK,EAAE,OAAO;YACd,KAAK,EAAE,OAAO;YACd,cAAc,EAAE,KAAK;YACrB,GAAG,SAAS;SACb,CAAC;QACF,IAAI,CAAC,MAAM,GAAG,YAAY,CAAC,KAAK,CAAC,EAAE,MAAM,EAAE,OAAO,EAAE,QAAQ,EAAE,QAAQ,EAAE,SAAS,EAAE,KAAK,EAAE,CAAC,CAAC;QAC5F,IAAI,CAAC,YAAY,GAAG,IAAI,MAAM,CAAC;YAC7B,MAAM,EAAE,SAAS,CAAC,MAAM;SACzB,CAAC,CAAC;QAEH,IAAI,CAAC,MAAM,CAAC,IAAI,CACd,EAAE,KAAK,EAAE,IAAI,CAAC,MAAM,CAAC,KAAK,EAAE,KAAK,EAAE,IAAI,CAAC,MAAM,CAAC,KAAK,EAAE,MAAM,EAAE,IAAI,CAAC,MAAM,CAAC,cAAc,EAAE,EAC1F,0BAA0B,CAC3B,CAAC;IACJ,CAAC;IAEM,SAAS;QACd,OAAO,IAAI,CAAC,MAAM,CAAC;IACrB,CAAC;IAEM,KAAK,CAAC,gBAAgB,CAAC,IAAY;QACxC,IAAI,CAAC,IAAI,IAAI,IAAI,CAAC,IAAI,EAAE,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;YACtC,MAAM,IAAI,KAAK,CAAC,8BAA8B,CAAC,CAAC;QAClD,CAAC;QAED,MAAM,SAAS,GAAG,IAAI,CAAC,GAAG,EAAE,CAAC;QAE7B,IAAI,CAAC;YACH,IAAI,CAAC,MAAM,CAAC,KAAK,CACf,EAAE,UAAU,EAAE,IAAI,CAAC,MAAM,EAAE,OAAO,EAAE,IAAI,CAAC,SAAS,CAAC,CAAC,EAAE,EAAE,CAAC,EAAE,EAC3D,qBAAqB,CACtB,CAAC;YAEF,MAAM,QAAQ,GAAG,MAAM,IAAI,CAAC,YAAY,CAAC,KAAK,CAAC,MAAM,CAAC,MAAM,CAAC;gBAC3D,KAAK,EAAE,IAAI,CAAC,MAAM,CAAC,KAAM;gBACzB,KAAK,EAAE,IAAI,CAAC,MAAM,CAAC,KAAM;gBACzB,KAAK,EAAE,IAAI;gBACX,eAAe,EAAE,IAAI,CAAC,MAAM,CAAC,cAAiE;aAC/F,CAAC,CAAC;YAEH,MAAM,WAAW,GAAG,QAAQ,CAAC,IAA2B,CAAC;YAEzD,MAAM,QAAQ,GAAG,IAAI,CAAC,GAAG,EAAE,GAAG,SAAS,CAAC;YACxC,IAAI,CAAC,MAAM,CAAC,KAAK,CAAC,EAAE,QAAQ,EAAE,EAAE,+BAA+B,CAAC,CAAC;YAEjE,OAAO;gBACL,MAAM,EAAE,WAAW;gBACnB,MAAM,EAAE,IAAI,CAAC,MAAM,CAAC,cAAc,IAAI,KAAK;aAC5C,CAAC;QACJ,CAAC;QAAC,OAAO,KAAU,EAAE,CAAC;YACpB,IAAI,CAAC,MAAM,CAAC,KAAK,CAAC,EAAE,GAAG,EAAE,KAAK,EAAE,EAAE,wBAAwB,CAAC,CAAC;YAC5D,MAAM,IAAI,KAAK,CAAC,yBAAyB,KAAK,CAAC,OAAO,EAAE,CAAC,CAAC;QAC5D,CAAC;IACH,CAAC;CACF"}
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
import type { PersistedConfig } from "../persisted-config.js";
|
|
2
|
+
import type { PaseoOpenAIConfig, PaseoSpeechConfig } from "../bootstrap.js";
|
|
3
|
+
export declare function resolveSpeechConfig(params: {
|
|
4
|
+
paseoHome: string;
|
|
5
|
+
env: NodeJS.ProcessEnv;
|
|
6
|
+
persisted: PersistedConfig;
|
|
7
|
+
}): {
|
|
8
|
+
openai: PaseoOpenAIConfig | undefined;
|
|
9
|
+
speech: PaseoSpeechConfig;
|
|
10
|
+
};
|
|
11
|
+
//# sourceMappingURL=speech-config-resolver.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"speech-config-resolver.d.ts","sourceRoot":"","sources":["../../../../src/server/speech/speech-config-resolver.ts"],"names":[],"mappings":"AAEA,OAAO,KAAK,EAAE,eAAe,EAAE,MAAM,wBAAwB,CAAC;AAC9D,OAAO,KAAK,EAAE,iBAAiB,EAAE,iBAAiB,EAAE,MAAM,iBAAiB,CAAC;AAkE5E,wBAAgB,mBAAmB,CAAC,MAAM,EAAE;IAC1C,SAAS,EAAE,MAAM,CAAC;IAClB,GAAG,EAAE,MAAM,CAAC,UAAU,CAAC;IACvB,SAAS,EAAE,eAAe,CAAC;CAC5B,GAAG;IACF,MAAM,EAAE,iBAAiB,GAAG,SAAS,CAAC;IACtC,MAAM,EAAE,iBAAiB,CAAC;CAC3B,CA4BA"}
|
|
@@ -0,0 +1,64 @@
|
|
|
1
|
+
import { z } from "zod";
|
|
2
|
+
import { resolveLocalSpeechConfig } from "./providers/local/config.js";
|
|
3
|
+
import { resolveOpenAiSpeechConfig } from "./providers/openai/config.js";
|
|
4
|
+
import { SpeechProviderIdSchema, } from "./speech-types.js";
|
|
5
|
+
const OptionalSpeechProviderSchema = z
|
|
6
|
+
.string()
|
|
7
|
+
.trim()
|
|
8
|
+
.toLowerCase()
|
|
9
|
+
.pipe(SpeechProviderIdSchema)
|
|
10
|
+
.optional();
|
|
11
|
+
const RequestedSpeechProvidersSchema = z.object({
|
|
12
|
+
dictationStt: OptionalSpeechProviderSchema.default("local"),
|
|
13
|
+
voiceStt: OptionalSpeechProviderSchema.default("local"),
|
|
14
|
+
voiceTts: OptionalSpeechProviderSchema.default("local"),
|
|
15
|
+
});
|
|
16
|
+
function resolveRequestedSpeechProviders(params) {
|
|
17
|
+
const resolveFeatureProvider = (configuredValue, parsedValue) => ({
|
|
18
|
+
provider: parsedValue,
|
|
19
|
+
explicit: configuredValue !== undefined,
|
|
20
|
+
});
|
|
21
|
+
const dictationSttProviderFromConfig = params.env.PASEO_DICTATION_STT_PROVIDER ??
|
|
22
|
+
params.persisted.features?.dictation?.stt?.provider;
|
|
23
|
+
const voiceSttProviderFromConfig = params.env.PASEO_VOICE_STT_PROVIDER ??
|
|
24
|
+
params.persisted.features?.voiceMode?.stt?.provider;
|
|
25
|
+
const voiceTtsProviderFromConfig = params.env.PASEO_VOICE_TTS_PROVIDER ??
|
|
26
|
+
params.persisted.features?.voiceMode?.tts?.provider;
|
|
27
|
+
const parsed = RequestedSpeechProvidersSchema.parse({
|
|
28
|
+
dictationStt: dictationSttProviderFromConfig ?? "local",
|
|
29
|
+
voiceStt: voiceSttProviderFromConfig ?? "local",
|
|
30
|
+
voiceTts: voiceTtsProviderFromConfig ?? "local",
|
|
31
|
+
});
|
|
32
|
+
return {
|
|
33
|
+
dictationStt: resolveFeatureProvider(dictationSttProviderFromConfig, parsed.dictationStt),
|
|
34
|
+
voiceStt: resolveFeatureProvider(voiceSttProviderFromConfig, parsed.voiceStt),
|
|
35
|
+
voiceTts: resolveFeatureProvider(voiceTtsProviderFromConfig, parsed.voiceTts),
|
|
36
|
+
};
|
|
37
|
+
}
|
|
38
|
+
export function resolveSpeechConfig(params) {
|
|
39
|
+
const providers = resolveRequestedSpeechProviders({
|
|
40
|
+
env: params.env,
|
|
41
|
+
persisted: params.persisted,
|
|
42
|
+
});
|
|
43
|
+
const local = resolveLocalSpeechConfig({
|
|
44
|
+
paseoHome: params.paseoHome,
|
|
45
|
+
env: params.env,
|
|
46
|
+
persisted: params.persisted,
|
|
47
|
+
providers,
|
|
48
|
+
});
|
|
49
|
+
const openai = resolveOpenAiSpeechConfig({
|
|
50
|
+
env: params.env,
|
|
51
|
+
persisted: params.persisted,
|
|
52
|
+
providers,
|
|
53
|
+
});
|
|
54
|
+
return {
|
|
55
|
+
openai,
|
|
56
|
+
speech: {
|
|
57
|
+
providers,
|
|
58
|
+
...(local.local
|
|
59
|
+
? { local: local.local }
|
|
60
|
+
: {}),
|
|
61
|
+
},
|
|
62
|
+
};
|
|
63
|
+
}
|
|
64
|
+
//# sourceMappingURL=speech-config-resolver.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"speech-config-resolver.js","sourceRoot":"","sources":["../../../../src/server/speech/speech-config-resolver.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,CAAC,EAAE,MAAM,KAAK,CAAC;AAIxB,OAAO,EAAE,wBAAwB,EAAE,MAAM,6BAA6B,CAAC;AACvE,OAAO,EAAE,yBAAyB,EAAE,MAAM,8BAA8B,CAAC;AACzE,OAAO,EACL,sBAAsB,GAGvB,MAAM,mBAAmB,CAAC;AAE3B,MAAM,4BAA4B,GAAG,CAAC;KACnC,MAAM,EAAE;KACR,IAAI,EAAE;KACN,WAAW,EAAE;KACb,IAAI,CAAC,sBAAsB,CAAC;KAC5B,QAAQ,EAAE,CAAC;AAEd,MAAM,8BAA8B,GAAG,CAAC,CAAC,MAAM,CAAC;IAC9C,YAAY,EAAE,4BAA4B,CAAC,OAAO,CAAC,OAAO,CAAC;IAC3D,QAAQ,EAAE,4BAA4B,CAAC,OAAO,CAAC,OAAO,CAAC;IACvD,QAAQ,EAAE,4BAA4B,CAAC,OAAO,CAAC,OAAO,CAAC;CACxD,CAAC,CAAC;AAEH,SAAS,+BAA+B,CAAC,MAGxC;IACC,MAAM,sBAAsB,GAAG,CAC7B,eAAmC,EACnC,WAAmD,EAC1B,EAAE,CAAC,CAAC;QAC7B,QAAQ,EAAE,WAAW;QACrB,QAAQ,EAAE,eAAe,KAAK,SAAS;KACxC,CAAC,CAAC;IAEH,MAAM,8BAA8B,GAClC,MAAM,CAAC,GAAG,CAAC,4BAA4B;QACvC,MAAM,CAAC,SAAS,CAAC,QAAQ,EAAE,SAAS,EAAE,GAAG,EAAE,QAAQ,CAAC;IACtD,MAAM,0BAA0B,GAC9B,MAAM,CAAC,GAAG,CAAC,wBAAwB;QACnC,MAAM,CAAC,SAAS,CAAC,QAAQ,EAAE,SAAS,EAAE,GAAG,EAAE,QAAQ,CAAC;IACtD,MAAM,0BAA0B,GAC9B,MAAM,CAAC,GAAG,CAAC,wBAAwB;QACnC,MAAM,CAAC,SAAS,CAAC,QAAQ,EAAE,SAAS,EAAE,GAAG,EAAE,QAAQ,CAAC;IAEtD,MAAM,MAAM,GAAG,8BAA8B,CAAC,KAAK,CAAC;QAClD,YAAY,EAAE,8BAA8B,IAAI,OAAO;QACvD,QAAQ,EAAE,0BAA0B,IAAI,OAAO;QAC/C,QAAQ,EAAE,0BAA0B,IAAI,OAAO;KAChD,CAAC,CAAC;IAEH,OAAO;QACL,YAAY,EAAE,sBAAsB,CAClC,8BAA8B,EAC9B,MAAM,CAAC,YAAY,CACpB;QACD,QAAQ,EAAE,sBAAsB,CAC9B,0BAA0B,EAC1B,MAAM,CAAC,QAAQ,CAChB;QACD,QAAQ,EAAE,sBAAsB,CAC9B,0BAA0B,EAC1B,MAAM,CAAC,QAAQ,CAChB;KACF,CAAC;AACJ,CAAC;AAED,MAAM,UAAU,mBAAmB,CAAC,MAInC;IAIC,MAAM,SAAS,GAAG,+BAA+B,CAAC;QAChD,GAAG,EAAE,MAAM,CAAC,GAAG;QACf,SAAS,EAAE,MAAM,CAAC,SAAS;KAC5B,CAAC,CAAC;IAEH,MAAM,KAAK,GAAG,wBAAwB,CAAC;QACrC,SAAS,EAAE,MAAM,CAAC,SAAS;QAC3B,GAAG,EAAE,MAAM,CAAC,GAAG;QACf,SAAS,EAAE,MAAM,CAAC,SAAS;QAC3B,SAAS;KACV,CAAC,CAAC;IAEH,MAAM,MAAM,GAAG,yBAAyB,CAAC;QACvC,GAAG,EAAE,MAAM,CAAC,GAAG;QACf,SAAS,EAAE,MAAM,CAAC,SAAS;QAC3B,SAAS;KACV,CAAC,CAAC;IAEH,OAAO;QACL,MAAM;QACN,MAAM,EAAE;YACN,SAAS;YACT,GAAG,CAAC,KAAK,CAAC,KAAK;gBACb,CAAC,CAAC,EAAE,KAAK,EAAE,KAAK,CAAC,KAAK,EAAE;gBACxB,CAAC,CAAC,EAAE,CAAC;SACR;KACF,CAAC;AACJ,CAAC"}
|
|
@@ -0,0 +1,59 @@
|
|
|
1
|
+
import type pino from "pino";
|
|
2
|
+
import type { Readable } from "node:stream";
|
|
3
|
+
export interface LogprobToken {
|
|
4
|
+
token: string;
|
|
5
|
+
logprob: number;
|
|
6
|
+
bytes?: number[];
|
|
7
|
+
}
|
|
8
|
+
export interface TranscriptionResult {
|
|
9
|
+
text: string;
|
|
10
|
+
language?: string;
|
|
11
|
+
duration?: number;
|
|
12
|
+
logprobs?: LogprobToken[];
|
|
13
|
+
avgLogprob?: number;
|
|
14
|
+
isLowConfidence?: boolean;
|
|
15
|
+
}
|
|
16
|
+
export interface StreamingTranscriptionCommittedEvent {
|
|
17
|
+
segmentId: string;
|
|
18
|
+
previousSegmentId: string | null;
|
|
19
|
+
}
|
|
20
|
+
export interface StreamingTranscriptionEvent {
|
|
21
|
+
segmentId: string;
|
|
22
|
+
transcript: string;
|
|
23
|
+
isFinal: boolean;
|
|
24
|
+
language?: string;
|
|
25
|
+
logprobs?: LogprobToken[];
|
|
26
|
+
avgLogprob?: number;
|
|
27
|
+
isLowConfidence?: boolean;
|
|
28
|
+
}
|
|
29
|
+
export type StreamingTranscriptionSession = {
|
|
30
|
+
/**
|
|
31
|
+
* Required PCM16LE sample rate for `appendPcm16()`.
|
|
32
|
+
* Callers are responsible for resampling before appending.
|
|
33
|
+
*/
|
|
34
|
+
requiredSampleRate: number;
|
|
35
|
+
connect(): Promise<void>;
|
|
36
|
+
appendPcm16(pcm16le: Buffer): void;
|
|
37
|
+
commit(): void;
|
|
38
|
+
clear(): void;
|
|
39
|
+
close(): void;
|
|
40
|
+
on(event: "committed", handler: (payload: StreamingTranscriptionCommittedEvent) => void): unknown;
|
|
41
|
+
on(event: "transcript", handler: (payload: StreamingTranscriptionEvent) => void): unknown;
|
|
42
|
+
on(event: "error", handler: (err: unknown) => void): unknown;
|
|
43
|
+
};
|
|
44
|
+
export interface SpeechToTextProvider {
|
|
45
|
+
id: "openai" | "local" | (string & {});
|
|
46
|
+
createSession(params: {
|
|
47
|
+
logger: pino.Logger;
|
|
48
|
+
language?: string;
|
|
49
|
+
prompt?: string;
|
|
50
|
+
}): StreamingTranscriptionSession;
|
|
51
|
+
}
|
|
52
|
+
export interface SpeechStreamResult {
|
|
53
|
+
stream: Readable;
|
|
54
|
+
format: string;
|
|
55
|
+
}
|
|
56
|
+
export interface TextToSpeechProvider {
|
|
57
|
+
synthesizeSpeech(text: string): Promise<SpeechStreamResult>;
|
|
58
|
+
}
|
|
59
|
+
//# sourceMappingURL=speech-provider.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"speech-provider.d.ts","sourceRoot":"","sources":["../../../../src/server/speech/speech-provider.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,IAAI,MAAM,MAAM,CAAC;AAC7B,OAAO,KAAK,EAAE,QAAQ,EAAE,MAAM,aAAa,CAAC;AAE5C,MAAM,WAAW,YAAY;IAC3B,KAAK,EAAE,MAAM,CAAC;IACd,OAAO,EAAE,MAAM,CAAC;IAChB,KAAK,CAAC,EAAE,MAAM,EAAE,CAAC;CAClB;AAED,MAAM,WAAW,mBAAmB;IAClC,IAAI,EAAE,MAAM,CAAC;IACb,QAAQ,CAAC,EAAE,MAAM,CAAC;IAClB,QAAQ,CAAC,EAAE,MAAM,CAAC;IAClB,QAAQ,CAAC,EAAE,YAAY,EAAE,CAAC;IAC1B,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,eAAe,CAAC,EAAE,OAAO,CAAC;CAC3B;AAED,MAAM,WAAW,oCAAoC;IACnD,SAAS,EAAE,MAAM,CAAC;IAClB,iBAAiB,EAAE,MAAM,GAAG,IAAI,CAAC;CAClC;AAED,MAAM,WAAW,2BAA2B;IAC1C,SAAS,EAAE,MAAM,CAAC;IAClB,UAAU,EAAE,MAAM,CAAC;IACnB,OAAO,EAAE,OAAO,CAAC;IACjB,QAAQ,CAAC,EAAE,MAAM,CAAC;IAClB,QAAQ,CAAC,EAAE,YAAY,EAAE,CAAC;IAC1B,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,eAAe,CAAC,EAAE,OAAO,CAAC;CAC3B;AAED,MAAM,MAAM,6BAA6B,GAAG;IAC1C;;;OAGG;IACH,kBAAkB,EAAE,MAAM,CAAC;IAE3B,OAAO,IAAI,OAAO,CAAC,IAAI,CAAC,CAAC;IACzB,WAAW,CAAC,OAAO,EAAE,MAAM,GAAG,IAAI,CAAC;IACnC,MAAM,IAAI,IAAI,CAAC;IACf,KAAK,IAAI,IAAI,CAAC;IACd,KAAK,IAAI,IAAI,CAAC;IAEd,EAAE,CACA,KAAK,EAAE,WAAW,EAClB,OAAO,EAAE,CAAC,OAAO,EAAE,oCAAoC,KAAK,IAAI,GAC/D,OAAO,CAAC;IACX,EAAE,CACA,KAAK,EAAE,YAAY,EACnB,OAAO,EAAE,CAAC,OAAO,EAAE,2BAA2B,KAAK,IAAI,GACtD,OAAO,CAAC;IACX,EAAE,CAAC,KAAK,EAAE,OAAO,EAAE,OAAO,EAAE,CAAC,GAAG,EAAE,OAAO,KAAK,IAAI,GAAG,OAAO,CAAC;CAC9D,CAAC;AAEF,MAAM,WAAW,oBAAoB;IACnC,EAAE,EAAE,QAAQ,GAAG,OAAO,GAAG,CAAC,MAAM,GAAG,EAAE,CAAC,CAAC;IACvC,aAAa,CAAC,MAAM,EAAE;QACpB,MAAM,EAAE,IAAI,CAAC,MAAM,CAAC;QACpB,QAAQ,CAAC,EAAE,MAAM,CAAC;QAClB,MAAM,CAAC,EAAE,MAAM,CAAC;KACjB,GAAG,6BAA6B,CAAC;CACnC;AAED,MAAM,WAAW,kBAAkB;IACjC,MAAM,EAAE,QAAQ,CAAC;IACjB,MAAM,EAAE,MAAM,CAAC;CAChB;AAED,MAAM,WAAW,oBAAoB;IACnC,gBAAgB,CAAC,IAAI,EAAE,MAAM,GAAG,OAAO,CAAC,kBAAkB,CAAC,CAAC;CAC7D"}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"speech-provider.js","sourceRoot":"","sources":["../../../../src/server/speech/speech-provider.ts"],"names":[],"mappings":""}
|
|
@@ -0,0 +1,20 @@
|
|
|
1
|
+
import type { Logger } from "pino";
|
|
2
|
+
import type { PaseoOpenAIConfig, PaseoSpeechConfig } from "../bootstrap.js";
|
|
3
|
+
import type { LocalSpeechModelId } from "./providers/local/config.js";
|
|
4
|
+
import type { SpeechToTextProvider, TextToSpeechProvider } from "./speech-provider.js";
|
|
5
|
+
export type InitializedSpeechRuntime = {
|
|
6
|
+
sttService: SpeechToTextProvider | null;
|
|
7
|
+
ttsService: TextToSpeechProvider | null;
|
|
8
|
+
dictationSttService: SpeechToTextProvider | null;
|
|
9
|
+
cleanup: () => void;
|
|
10
|
+
localModelConfig: {
|
|
11
|
+
modelsDir: string;
|
|
12
|
+
defaultModelIds: LocalSpeechModelId[];
|
|
13
|
+
} | null;
|
|
14
|
+
};
|
|
15
|
+
export declare function initializeSpeechRuntime(params: {
|
|
16
|
+
logger: Logger;
|
|
17
|
+
openaiConfig?: PaseoOpenAIConfig;
|
|
18
|
+
speechConfig?: PaseoSpeechConfig;
|
|
19
|
+
}): Promise<InitializedSpeechRuntime>;
|
|
20
|
+
//# sourceMappingURL=speech-runtime.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"speech-runtime.d.ts","sourceRoot":"","sources":["../../../../src/server/speech/speech-runtime.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,MAAM,EAAE,MAAM,MAAM,CAAC;AAEnC,OAAO,KAAK,EAAE,iBAAiB,EAAE,iBAAiB,EAAE,MAAM,iBAAiB,CAAC;AAK5E,OAAO,KAAK,EAAE,kBAAkB,EAAE,MAAM,6BAA6B,CAAC;AAMtE,OAAO,KAAK,EAAE,oBAAoB,EAAE,oBAAoB,EAAE,MAAM,sBAAsB,CAAC;AAkBvF,MAAM,MAAM,wBAAwB,GAAG;IACrC,UAAU,EAAE,oBAAoB,GAAG,IAAI,CAAC;IACxC,UAAU,EAAE,oBAAoB,GAAG,IAAI,CAAC;IACxC,mBAAmB,EAAE,oBAAoB,GAAG,IAAI,CAAC;IACjD,OAAO,EAAE,MAAM,IAAI,CAAC;IACpB,gBAAgB,EAAE;QAChB,SAAS,EAAE,MAAM,CAAC;QAClB,eAAe,EAAE,kBAAkB,EAAE,CAAC;KACvC,GAAG,IAAI,CAAC;CACV,CAAC;AAEF,wBAAsB,uBAAuB,CAAC,MAAM,EAAE;IACpD,MAAM,EAAE,MAAM,CAAC;IACf,YAAY,CAAC,EAAE,iBAAiB,CAAC;IACjC,YAAY,CAAC,EAAE,iBAAiB,CAAC;CAClC,GAAG,OAAO,CAAC,wBAAwB,CAAC,CA8HpC"}
|
|
@@ -0,0 +1,119 @@
|
|
|
1
|
+
import { getLocalSpeechAvailability, initializeLocalSpeechServices, } from "./providers/local/runtime.js";
|
|
2
|
+
import { getOpenAiSpeechAvailability, initializeOpenAiSpeechServices, validateOpenAiCredentialRequirements, } from "./providers/openai/runtime.js";
|
|
3
|
+
function resolveRequestedSpeechProviders(speechConfig) {
|
|
4
|
+
const fromConfig = speechConfig?.providers;
|
|
5
|
+
if (fromConfig) {
|
|
6
|
+
return fromConfig;
|
|
7
|
+
}
|
|
8
|
+
return {
|
|
9
|
+
dictationStt: { provider: "local", explicit: false },
|
|
10
|
+
voiceStt: { provider: "local", explicit: false },
|
|
11
|
+
voiceTts: { provider: "local", explicit: false },
|
|
12
|
+
};
|
|
13
|
+
}
|
|
14
|
+
export async function initializeSpeechRuntime(params) {
|
|
15
|
+
const logger = params.logger;
|
|
16
|
+
const speechConfig = params.speechConfig ?? null;
|
|
17
|
+
const openaiConfig = params.openaiConfig;
|
|
18
|
+
const providers = resolveRequestedSpeechProviders(speechConfig);
|
|
19
|
+
validateOpenAiCredentialRequirements({
|
|
20
|
+
providers,
|
|
21
|
+
openaiConfig,
|
|
22
|
+
logger,
|
|
23
|
+
});
|
|
24
|
+
logger.info({
|
|
25
|
+
requestedProviders: {
|
|
26
|
+
dictationStt: providers.dictationStt.provider,
|
|
27
|
+
voiceStt: providers.voiceStt.provider,
|
|
28
|
+
voiceTts: providers.voiceTts.provider,
|
|
29
|
+
},
|
|
30
|
+
availability: {
|
|
31
|
+
openai: getOpenAiSpeechAvailability(openaiConfig),
|
|
32
|
+
local: getLocalSpeechAvailability(speechConfig),
|
|
33
|
+
},
|
|
34
|
+
}, "Speech provider reconciliation started");
|
|
35
|
+
const localSpeech = await initializeLocalSpeechServices({
|
|
36
|
+
providers,
|
|
37
|
+
speechConfig,
|
|
38
|
+
logger,
|
|
39
|
+
});
|
|
40
|
+
const openAiSpeech = initializeOpenAiSpeechServices({
|
|
41
|
+
providers,
|
|
42
|
+
openaiConfig,
|
|
43
|
+
existing: {
|
|
44
|
+
sttService: localSpeech.sttService,
|
|
45
|
+
ttsService: localSpeech.ttsService,
|
|
46
|
+
dictationSttService: localSpeech.dictationSttService,
|
|
47
|
+
},
|
|
48
|
+
logger,
|
|
49
|
+
});
|
|
50
|
+
const effectiveProviders = {
|
|
51
|
+
dictationStt: openAiSpeech.dictationSttService?.id ?? "unavailable",
|
|
52
|
+
voiceStt: openAiSpeech.sttService?.id ?? "unavailable",
|
|
53
|
+
voiceTts: !openAiSpeech.ttsService
|
|
54
|
+
? "unavailable"
|
|
55
|
+
: openAiSpeech.ttsService === localSpeech.localVoiceTtsProvider
|
|
56
|
+
? "local"
|
|
57
|
+
: "openai",
|
|
58
|
+
};
|
|
59
|
+
const unavailableFeatures = [
|
|
60
|
+
!openAiSpeech.dictationSttService ? "dictation.stt" : null,
|
|
61
|
+
!openAiSpeech.sttService ? "voice.stt" : null,
|
|
62
|
+
!openAiSpeech.ttsService ? "voice.tts" : null,
|
|
63
|
+
].filter((feature) => feature !== null);
|
|
64
|
+
const explicitlyConfiguredUnavailableFeatures = unavailableFeatures.filter((feature) => {
|
|
65
|
+
if (feature === "dictation.stt") {
|
|
66
|
+
return providers.dictationStt.explicit;
|
|
67
|
+
}
|
|
68
|
+
if (feature === "voice.stt") {
|
|
69
|
+
return providers.voiceStt.explicit;
|
|
70
|
+
}
|
|
71
|
+
return providers.voiceTts.explicit;
|
|
72
|
+
});
|
|
73
|
+
if (explicitlyConfiguredUnavailableFeatures.length > 0) {
|
|
74
|
+
logger.error({
|
|
75
|
+
requestedProviders: {
|
|
76
|
+
dictationStt: providers.dictationStt.provider,
|
|
77
|
+
voiceStt: providers.voiceStt.provider,
|
|
78
|
+
voiceTts: providers.voiceTts.provider,
|
|
79
|
+
},
|
|
80
|
+
explicitProviders: {
|
|
81
|
+
dictationStt: providers.dictationStt.explicit,
|
|
82
|
+
voiceStt: providers.voiceStt.explicit,
|
|
83
|
+
voiceTts: providers.voiceTts.explicit,
|
|
84
|
+
},
|
|
85
|
+
effectiveProviders,
|
|
86
|
+
unavailableFeatures: explicitlyConfiguredUnavailableFeatures,
|
|
87
|
+
}, "Speech provider reconciliation failed: configured features are unavailable");
|
|
88
|
+
throw new Error(`Configured speech features unavailable: ${explicitlyConfiguredUnavailableFeatures.join(", ")}`);
|
|
89
|
+
}
|
|
90
|
+
if (unavailableFeatures.length > 0) {
|
|
91
|
+
logger.warn({
|
|
92
|
+
requestedProviders: {
|
|
93
|
+
dictationStt: providers.dictationStt.provider,
|
|
94
|
+
voiceStt: providers.voiceStt.provider,
|
|
95
|
+
voiceTts: providers.voiceTts.provider,
|
|
96
|
+
},
|
|
97
|
+
explicitProviders: {
|
|
98
|
+
dictationStt: providers.dictationStt.explicit,
|
|
99
|
+
voiceStt: providers.voiceStt.explicit,
|
|
100
|
+
voiceTts: providers.voiceTts.explicit,
|
|
101
|
+
},
|
|
102
|
+
effectiveProviders,
|
|
103
|
+
unavailableFeatures,
|
|
104
|
+
}, "Speech provider reconciliation completed with unavailable default features");
|
|
105
|
+
}
|
|
106
|
+
else {
|
|
107
|
+
logger.info({
|
|
108
|
+
effectiveProviders,
|
|
109
|
+
}, "Speech provider reconciliation completed");
|
|
110
|
+
}
|
|
111
|
+
return {
|
|
112
|
+
sttService: openAiSpeech.sttService,
|
|
113
|
+
ttsService: openAiSpeech.ttsService,
|
|
114
|
+
dictationSttService: openAiSpeech.dictationSttService,
|
|
115
|
+
cleanup: localSpeech.cleanup,
|
|
116
|
+
localModelConfig: localSpeech.localModelConfig,
|
|
117
|
+
};
|
|
118
|
+
}
|
|
119
|
+
//# sourceMappingURL=speech-runtime.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"speech-runtime.js","sourceRoot":"","sources":["../../../../src/server/speech/speech-runtime.ts"],"names":[],"mappings":"AAGA,OAAO,EACL,0BAA0B,EAC1B,6BAA6B,GAC9B,MAAM,8BAA8B,CAAC;AAEtC,OAAO,EACL,2BAA2B,EAC3B,8BAA8B,EAC9B,oCAAoC,GACrC,MAAM,+BAA+B,CAAC;AAIvC,SAAS,+BAA+B,CACtC,YAAsC;IAEtC,MAAM,UAAU,GAAG,YAAY,EAAE,SAAS,CAAC;IAC3C,IAAI,UAAU,EAAE,CAAC;QACf,OAAO,UAAU,CAAC;IACpB,CAAC;IAED,OAAO;QACL,YAAY,EAAE,EAAE,QAAQ,EAAE,OAAO,EAAE,QAAQ,EAAE,KAAK,EAAE;QACpD,QAAQ,EAAE,EAAE,QAAQ,EAAE,OAAO,EAAE,QAAQ,EAAE,KAAK,EAAE;QAChD,QAAQ,EAAE,EAAE,QAAQ,EAAE,OAAO,EAAE,QAAQ,EAAE,KAAK,EAAE;KACjD,CAAC;AACJ,CAAC;AAaD,MAAM,CAAC,KAAK,UAAU,uBAAuB,CAAC,MAI7C;IACC,MAAM,MAAM,GAAG,MAAM,CAAC,MAAM,CAAC;IAC7B,MAAM,YAAY,GAAG,MAAM,CAAC,YAAY,IAAI,IAAI,CAAC;IACjD,MAAM,YAAY,GAAG,MAAM,CAAC,YAAY,CAAC;IACzC,MAAM,SAAS,GAAG,+BAA+B,CAAC,YAAY,CAAC,CAAC;IAEhE,oCAAoC,CAAC;QACnC,SAAS;QACT,YAAY;QACZ,MAAM;KACP,CAAC,CAAC;IAEH,MAAM,CAAC,IAAI,CACT;QACE,kBAAkB,EAAE;YAClB,YAAY,EAAE,SAAS,CAAC,YAAY,CAAC,QAAQ;YAC7C,QAAQ,EAAE,SAAS,CAAC,QAAQ,CAAC,QAAQ;YACrC,QAAQ,EAAE,SAAS,CAAC,QAAQ,CAAC,QAAQ;SACtC;QACD,YAAY,EAAE;YACZ,MAAM,EAAE,2BAA2B,CAAC,YAAY,CAAC;YACjD,KAAK,EAAE,0BAA0B,CAAC,YAAY,CAAC;SAChD;KACF,EACD,wCAAwC,CACzC,CAAC;IAEF,MAAM,WAAW,GAAG,MAAM,6BAA6B,CAAC;QACtD,SAAS;QACT,YAAY;QACZ,MAAM;KACP,CAAC,CAAC;IAEH,MAAM,YAAY,GAAG,8BAA8B,CAAC;QAClD,SAAS;QACT,YAAY;QACZ,QAAQ,EAAE;YACR,UAAU,EAAE,WAAW,CAAC,UAAU;YAClC,UAAU,EAAE,WAAW,CAAC,UAAU;YAClC,mBAAmB,EAAE,WAAW,CAAC,mBAAmB;SACrD;QACD,MAAM;KACP,CAAC,CAAC;IAEH,MAAM,kBAAkB,GAAG;QACzB,YAAY,EAAE,YAAY,CAAC,mBAAmB,EAAE,EAAE,IAAI,aAAa;QACnE,QAAQ,EAAE,YAAY,CAAC,UAAU,EAAE,EAAE,IAAI,aAAa;QACtD,QAAQ,EACN,CAAC,YAAY,CAAC,UAAU;YACtB,CAAC,CAAC,aAAa;YACf,CAAC,CAAC,YAAY,CAAC,UAAU,KAAK,WAAW,CAAC,qBAAqB;gBAC7D,CAAC,CAAC,OAAO;gBACT,CAAC,CAAC,QAAQ;KACjB,CAAC;IACF,MAAM,mBAAmB,GAAG;QAC1B,CAAC,YAAY,CAAC,mBAAmB,CAAC,CAAC,CAAC,eAAe,CAAC,CAAC,CAAC,IAAI;QAC1D,CAAC,YAAY,CAAC,UAAU,CAAC,CAAC,CAAC,WAAW,CAAC,CAAC,CAAC,IAAI;QAC7C,CAAC,YAAY,CAAC,UAAU,CAAC,CAAC,CAAC,WAAW,CAAC,CAAC,CAAC,IAAI;KAC9C,CAAC,MAAM,CAAC,CAAC,OAAO,EAAqB,EAAE,CAAC,OAAO,KAAK,IAAI,CAAC,CAAC;IAC3D,MAAM,uCAAuC,GAAG,mBAAmB,CAAC,MAAM,CAAC,CAAC,OAAO,EAAE,EAAE;QACrF,IAAI,OAAO,KAAK,eAAe,EAAE,CAAC;YAChC,OAAO,SAAS,CAAC,YAAY,CAAC,QAAQ,CAAC;QACzC,CAAC;QACD,IAAI,OAAO,KAAK,WAAW,EAAE,CAAC;YAC5B,OAAO,SAAS,CAAC,QAAQ,CAAC,QAAQ,CAAC;QACrC,CAAC;QACD,OAAO,SAAS,CAAC,QAAQ,CAAC,QAAQ,CAAC;IACrC,CAAC,CAAC,CAAC;IAEH,IAAI,uCAAuC,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;QACvD,MAAM,CAAC,KAAK,CACV;YACE,kBAAkB,EAAE;gBAClB,YAAY,EAAE,SAAS,CAAC,YAAY,CAAC,QAAQ;gBAC7C,QAAQ,EAAE,SAAS,CAAC,QAAQ,CAAC,QAAQ;gBACrC,QAAQ,EAAE,SAAS,CAAC,QAAQ,CAAC,QAAQ;aACtC;YACD,iBAAiB,EAAE;gBACjB,YAAY,EAAE,SAAS,CAAC,YAAY,CAAC,QAAQ;gBAC7C,QAAQ,EAAE,SAAS,CAAC,QAAQ,CAAC,QAAQ;gBACrC,QAAQ,EAAE,SAAS,CAAC,QAAQ,CAAC,QAAQ;aACtC;YACD,kBAAkB;YAClB,mBAAmB,EAAE,uCAAuC;SAC7D,EACD,4EAA4E,CAC7E,CAAC;QACF,MAAM,IAAI,KAAK,CACb,2CAA2C,uCAAuC,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAChG,CAAC;IACJ,CAAC;IAED,IAAI,mBAAmB,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;QACnC,MAAM,CAAC,IAAI,CACT;YACE,kBAAkB,EAAE;gBAClB,YAAY,EAAE,SAAS,CAAC,YAAY,CAAC,QAAQ;gBAC7C,QAAQ,EAAE,SAAS,CAAC,QAAQ,CAAC,QAAQ;gBACrC,QAAQ,EAAE,SAAS,CAAC,QAAQ,CAAC,QAAQ;aACtC;YACD,iBAAiB,EAAE;gBACjB,YAAY,EAAE,SAAS,CAAC,YAAY,CAAC,QAAQ;gBAC7C,QAAQ,EAAE,SAAS,CAAC,QAAQ,CAAC,QAAQ;gBACrC,QAAQ,EAAE,SAAS,CAAC,QAAQ,CAAC,QAAQ;aACtC;YACD,kBAAkB;YAClB,mBAAmB;SACpB,EACD,4EAA4E,CAC7E,CAAC;IACJ,CAAC;SAAM,CAAC;QACN,MAAM,CAAC,IAAI,CACT;YACE,kBAAkB;SACnB,EACD,0CAA0C,CAC3C,CAAC;IACJ,CAAC;IAED,OAAO;QACL,UAAU,EAAE,YAAY,CAAC,UAAU;QACnC,UAAU,EAAE,YAAY,CAAC,UAAU;QACnC,mBAAmB,EAAE,YAAY,CAAC,mBAAmB;QACrD,OAAO,EAAE,WAAW,CAAC,OAAO;QAC5B,gBAAgB,EAAE,WAAW,CAAC,gBAAgB;KAC/C,CAAC;AACJ,CAAC"}
|