@getpaseo/server 0.1.37 → 0.1.38

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (295) hide show
  1. package/dist/scripts/dev-runner.js +1 -1
  2. package/dist/scripts/dev-runner.js.map +1 -1
  3. package/dist/scripts/{daemon-runner.js → supervisor-entrypoint.js} +7 -9
  4. package/dist/scripts/supervisor-entrypoint.js.map +1 -0
  5. package/dist/scripts/supervisor.js +17 -1
  6. package/dist/scripts/supervisor.js.map +1 -1
  7. package/dist/server/server/bootstrap.d.ts +0 -4
  8. package/dist/server/server/bootstrap.d.ts.map +1 -1
  9. package/dist/server/server/bootstrap.js +8 -22
  10. package/dist/server/server/bootstrap.js.map +1 -1
  11. package/dist/server/server/index.js +0 -4
  12. package/dist/server/server/index.js.map +1 -1
  13. package/dist/server/server/pid-lock.d.ts +7 -2
  14. package/dist/server/server/pid-lock.d.ts.map +1 -1
  15. package/dist/server/server/pid-lock.js +21 -0
  16. package/dist/server/server/pid-lock.js.map +1 -1
  17. package/dist/server/server/session.d.ts.map +1 -1
  18. package/dist/server/server/session.js +2 -2
  19. package/dist/server/server/session.js.map +1 -1
  20. package/dist/src/server/pid-lock.js +21 -0
  21. package/dist/src/server/pid-lock.js.map +1 -1
  22. package/package.json +3 -3
  23. package/dist/scripts/daemon-runner.js.map +0 -1
  24. package/dist/src/server/agent/activity-curator.js +0 -243
  25. package/dist/src/server/agent/activity-curator.js.map +0 -1
  26. package/dist/src/server/agent/agent-manager.js +0 -1855
  27. package/dist/src/server/agent/agent-manager.js.map +0 -1
  28. package/dist/src/server/agent/agent-metadata-generator.js +0 -161
  29. package/dist/src/server/agent/agent-metadata-generator.js.map +0 -1
  30. package/dist/src/server/agent/agent-projections.js +0 -254
  31. package/dist/src/server/agent/agent-projections.js.map +0 -1
  32. package/dist/src/server/agent/agent-response-loop.js +0 -304
  33. package/dist/src/server/agent/agent-response-loop.js.map +0 -1
  34. package/dist/src/server/agent/agent-sdk-types.js +0 -12
  35. package/dist/src/server/agent/agent-sdk-types.js.map +0 -1
  36. package/dist/src/server/agent/agent-storage.js +0 -302
  37. package/dist/src/server/agent/agent-storage.js.map +0 -1
  38. package/dist/src/server/agent/agent-title-limits.js +0 -3
  39. package/dist/src/server/agent/agent-title-limits.js.map +0 -1
  40. package/dist/src/server/agent/audio-utils.js +0 -19
  41. package/dist/src/server/agent/audio-utils.js.map +0 -1
  42. package/dist/src/server/agent/dictation-debug.js +0 -50
  43. package/dist/src/server/agent/dictation-debug.js.map +0 -1
  44. package/dist/src/server/agent/mcp-server.js +0 -754
  45. package/dist/src/server/agent/mcp-server.js.map +0 -1
  46. package/dist/src/server/agent/orchestrator-instructions.js +0 -51
  47. package/dist/src/server/agent/orchestrator-instructions.js.map +0 -1
  48. package/dist/src/server/agent/pcm16-resampler.js +0 -63
  49. package/dist/src/server/agent/pcm16-resampler.js.map +0 -1
  50. package/dist/src/server/agent/provider-launch-config.js +0 -213
  51. package/dist/src/server/agent/provider-launch-config.js.map +0 -1
  52. package/dist/src/server/agent/provider-manifest.js +0 -127
  53. package/dist/src/server/agent/provider-manifest.js.map +0 -1
  54. package/dist/src/server/agent/provider-registry.js +0 -45
  55. package/dist/src/server/agent/provider-registry.js.map +0 -1
  56. package/dist/src/server/agent/providers/claude/partial-json.js +0 -306
  57. package/dist/src/server/agent/providers/claude/partial-json.js.map +0 -1
  58. package/dist/src/server/agent/providers/claude/sdk-model-resolver.js +0 -104
  59. package/dist/src/server/agent/providers/claude/sdk-model-resolver.js.map +0 -1
  60. package/dist/src/server/agent/providers/claude/sidechain-tracker.js +0 -230
  61. package/dist/src/server/agent/providers/claude/sidechain-tracker.js.map +0 -1
  62. package/dist/src/server/agent/providers/claude/task-notification-tool-call.js +0 -267
  63. package/dist/src/server/agent/providers/claude/task-notification-tool-call.js.map +0 -1
  64. package/dist/src/server/agent/providers/claude/tool-call-detail-parser.js +0 -121
  65. package/dist/src/server/agent/providers/claude/tool-call-detail-parser.js.map +0 -1
  66. package/dist/src/server/agent/providers/claude/tool-call-mapper.js +0 -252
  67. package/dist/src/server/agent/providers/claude/tool-call-mapper.js.map +0 -1
  68. package/dist/src/server/agent/providers/claude-agent.js +0 -3166
  69. package/dist/src/server/agent/providers/claude-agent.js.map +0 -1
  70. package/dist/src/server/agent/providers/codex/tool-call-detail-parser.js +0 -104
  71. package/dist/src/server/agent/providers/codex/tool-call-detail-parser.js.map +0 -1
  72. package/dist/src/server/agent/providers/codex/tool-call-mapper.js +0 -758
  73. package/dist/src/server/agent/providers/codex/tool-call-mapper.js.map +0 -1
  74. package/dist/src/server/agent/providers/codex-app-server-agent.js +0 -2949
  75. package/dist/src/server/agent/providers/codex-app-server-agent.js.map +0 -1
  76. package/dist/src/server/agent/providers/codex-rollout-timeline.js +0 -544
  77. package/dist/src/server/agent/providers/codex-rollout-timeline.js.map +0 -1
  78. package/dist/src/server/agent/providers/opencode/tool-call-detail-parser.js +0 -39
  79. package/dist/src/server/agent/providers/opencode/tool-call-detail-parser.js.map +0 -1
  80. package/dist/src/server/agent/providers/opencode/tool-call-mapper.js +0 -144
  81. package/dist/src/server/agent/providers/opencode/tool-call-mapper.js.map +0 -1
  82. package/dist/src/server/agent/providers/opencode-agent.js +0 -1193
  83. package/dist/src/server/agent/providers/opencode-agent.js.map +0 -1
  84. package/dist/src/server/agent/providers/tool-call-detail-primitives.js +0 -686
  85. package/dist/src/server/agent/providers/tool-call-detail-primitives.js.map +0 -1
  86. package/dist/src/server/agent/providers/tool-call-mapper-utils.js +0 -115
  87. package/dist/src/server/agent/providers/tool-call-mapper-utils.js.map +0 -1
  88. package/dist/src/server/agent/recordings-debug.js +0 -19
  89. package/dist/src/server/agent/recordings-debug.js.map +0 -1
  90. package/dist/src/server/agent/stt-debug.js +0 -33
  91. package/dist/src/server/agent/stt-debug.js.map +0 -1
  92. package/dist/src/server/agent/stt-manager.js +0 -232
  93. package/dist/src/server/agent/stt-manager.js.map +0 -1
  94. package/dist/src/server/agent/timeline-append.js +0 -27
  95. package/dist/src/server/agent/timeline-append.js.map +0 -1
  96. package/dist/src/server/agent/timeline-projection.js +0 -215
  97. package/dist/src/server/agent/timeline-projection.js.map +0 -1
  98. package/dist/src/server/agent/tool-name-normalization.js +0 -45
  99. package/dist/src/server/agent/tool-name-normalization.js.map +0 -1
  100. package/dist/src/server/agent/tts-debug.js +0 -24
  101. package/dist/src/server/agent/tts-debug.js.map +0 -1
  102. package/dist/src/server/agent/tts-manager.js +0 -374
  103. package/dist/src/server/agent/tts-manager.js.map +0 -1
  104. package/dist/src/server/agent/wait-for-agent-tracker.js +0 -53
  105. package/dist/src/server/agent/wait-for-agent-tracker.js.map +0 -1
  106. package/dist/src/server/agent-attention-policy.js +0 -40
  107. package/dist/src/server/agent-attention-policy.js.map +0 -1
  108. package/dist/src/server/allowed-hosts.js +0 -94
  109. package/dist/src/server/allowed-hosts.js.map +0 -1
  110. package/dist/src/server/bootstrap.js +0 -620
  111. package/dist/src/server/bootstrap.js.map +0 -1
  112. package/dist/src/server/chat/chat-mentions.js +0 -71
  113. package/dist/src/server/chat/chat-mentions.js.map +0 -1
  114. package/dist/src/server/chat/chat-rpc-schemas.js +0 -103
  115. package/dist/src/server/chat/chat-rpc-schemas.js.map +0 -1
  116. package/dist/src/server/chat/chat-service.js +0 -330
  117. package/dist/src/server/chat/chat-service.js.map +0 -1
  118. package/dist/src/server/chat/chat-types.js +0 -22
  119. package/dist/src/server/chat/chat-types.js.map +0 -1
  120. package/dist/src/server/checkout-diff-manager.js +0 -272
  121. package/dist/src/server/checkout-diff-manager.js.map +0 -1
  122. package/dist/src/server/checkout-git-utils.js +0 -37
  123. package/dist/src/server/checkout-git-utils.js.map +0 -1
  124. package/dist/src/server/client-message-id.js +0 -12
  125. package/dist/src/server/client-message-id.js.map +0 -1
  126. package/dist/src/server/config.js +0 -73
  127. package/dist/src/server/config.js.map +0 -1
  128. package/dist/src/server/connection-offer.js +0 -59
  129. package/dist/src/server/connection-offer.js.map +0 -1
  130. package/dist/src/server/daemon-keypair.js +0 -40
  131. package/dist/src/server/daemon-keypair.js.map +0 -1
  132. package/dist/src/server/daemon-version.js +0 -22
  133. package/dist/src/server/daemon-version.js.map +0 -1
  134. package/dist/src/server/dictation/dictation-stream-manager.js +0 -571
  135. package/dist/src/server/dictation/dictation-stream-manager.js.map +0 -1
  136. package/dist/src/server/file-download/token-store.js +0 -40
  137. package/dist/src/server/file-download/token-store.js.map +0 -1
  138. package/dist/src/server/file-explorer/service.js +0 -180
  139. package/dist/src/server/file-explorer/service.js.map +0 -1
  140. package/dist/src/server/json-utils.js +0 -45
  141. package/dist/src/server/json-utils.js.map +0 -1
  142. package/dist/src/server/loop/rpc-schemas.js +0 -159
  143. package/dist/src/server/loop/rpc-schemas.js.map +0 -1
  144. package/dist/src/server/loop-service.js +0 -741
  145. package/dist/src/server/loop-service.js.map +0 -1
  146. package/dist/src/server/messages.js +0 -29
  147. package/dist/src/server/messages.js.map +0 -1
  148. package/dist/src/server/package-version.js +0 -46
  149. package/dist/src/server/package-version.js.map +0 -1
  150. package/dist/src/server/pairing-offer.js +0 -45
  151. package/dist/src/server/pairing-offer.js.map +0 -1
  152. package/dist/src/server/pairing-qr.js +0 -45
  153. package/dist/src/server/pairing-qr.js.map +0 -1
  154. package/dist/src/server/path-utils.js +0 -20
  155. package/dist/src/server/path-utils.js.map +0 -1
  156. package/dist/src/server/persisted-config.js +0 -265
  157. package/dist/src/server/persisted-config.js.map +0 -1
  158. package/dist/src/server/persistence-hooks.js +0 -60
  159. package/dist/src/server/persistence-hooks.js.map +0 -1
  160. package/dist/src/server/push/push-service.js +0 -68
  161. package/dist/src/server/push/push-service.js.map +0 -1
  162. package/dist/src/server/push/token-store.js +0 -70
  163. package/dist/src/server/push/token-store.js.map +0 -1
  164. package/dist/src/server/relay-transport.js +0 -461
  165. package/dist/src/server/relay-transport.js.map +0 -1
  166. package/dist/src/server/schedule/cron.js +0 -103
  167. package/dist/src/server/schedule/cron.js.map +0 -1
  168. package/dist/src/server/schedule/rpc-schemas.js +0 -112
  169. package/dist/src/server/schedule/rpc-schemas.js.map +0 -1
  170. package/dist/src/server/schedule/service.js +0 -397
  171. package/dist/src/server/schedule/service.js.map +0 -1
  172. package/dist/src/server/schedule/store.js +0 -56
  173. package/dist/src/server/schedule/store.js.map +0 -1
  174. package/dist/src/server/schedule/types.js +0 -73
  175. package/dist/src/server/schedule/types.js.map +0 -1
  176. package/dist/src/server/server-id.js +0 -63
  177. package/dist/src/server/server-id.js.map +0 -1
  178. package/dist/src/server/session.js +0 -6381
  179. package/dist/src/server/session.js.map +0 -1
  180. package/dist/src/server/speech/audio.js +0 -101
  181. package/dist/src/server/speech/audio.js.map +0 -1
  182. package/dist/src/server/speech/provider-resolver.js +0 -7
  183. package/dist/src/server/speech/provider-resolver.js.map +0 -1
  184. package/dist/src/server/speech/providers/local/config.js +0 -74
  185. package/dist/src/server/speech/providers/local/config.js.map +0 -1
  186. package/dist/src/server/speech/providers/local/models.js +0 -17
  187. package/dist/src/server/speech/providers/local/models.js.map +0 -1
  188. package/dist/src/server/speech/providers/local/pocket/pocket-tts-onnx.js +0 -436
  189. package/dist/src/server/speech/providers/local/pocket/pocket-tts-onnx.js.map +0 -1
  190. package/dist/src/server/speech/providers/local/runtime.js +0 -238
  191. package/dist/src/server/speech/providers/local/runtime.js.map +0 -1
  192. package/dist/src/server/speech/providers/local/sherpa/model-catalog.js +0 -166
  193. package/dist/src/server/speech/providers/local/sherpa/model-catalog.js.map +0 -1
  194. package/dist/src/server/speech/providers/local/sherpa/model-downloader.js +0 -165
  195. package/dist/src/server/speech/providers/local/sherpa/model-downloader.js.map +0 -1
  196. package/dist/src/server/speech/providers/local/sherpa/sherpa-offline-recognizer.js +0 -73
  197. package/dist/src/server/speech/providers/local/sherpa/sherpa-offline-recognizer.js.map +0 -1
  198. package/dist/src/server/speech/providers/local/sherpa/sherpa-online-recognizer.js +0 -84
  199. package/dist/src/server/speech/providers/local/sherpa/sherpa-online-recognizer.js.map +0 -1
  200. package/dist/src/server/speech/providers/local/sherpa/sherpa-onnx-loader.js +0 -11
  201. package/dist/src/server/speech/providers/local/sherpa/sherpa-onnx-loader.js.map +0 -1
  202. package/dist/src/server/speech/providers/local/sherpa/sherpa-onnx-node-loader.js +0 -102
  203. package/dist/src/server/speech/providers/local/sherpa/sherpa-onnx-node-loader.js.map +0 -1
  204. package/dist/src/server/speech/providers/local/sherpa/sherpa-parakeet-realtime-session.js +0 -135
  205. package/dist/src/server/speech/providers/local/sherpa/sherpa-parakeet-realtime-session.js.map +0 -1
  206. package/dist/src/server/speech/providers/local/sherpa/sherpa-parakeet-stt.js +0 -130
  207. package/dist/src/server/speech/providers/local/sherpa/sherpa-parakeet-stt.js.map +0 -1
  208. package/dist/src/server/speech/providers/local/sherpa/sherpa-realtime-session.js +0 -110
  209. package/dist/src/server/speech/providers/local/sherpa/sherpa-realtime-session.js.map +0 -1
  210. package/dist/src/server/speech/providers/local/sherpa/sherpa-stt.js +0 -138
  211. package/dist/src/server/speech/providers/local/sherpa/sherpa-stt.js.map +0 -1
  212. package/dist/src/server/speech/providers/local/sherpa/sherpa-tts.js +0 -98
  213. package/dist/src/server/speech/providers/local/sherpa/sherpa-tts.js.map +0 -1
  214. package/dist/src/server/speech/providers/local/sherpa/silero-vad-provider.js +0 -23
  215. package/dist/src/server/speech/providers/local/sherpa/silero-vad-provider.js.map +0 -1
  216. package/dist/src/server/speech/providers/local/sherpa/silero-vad-session.js +0 -107
  217. package/dist/src/server/speech/providers/local/sherpa/silero-vad-session.js.map +0 -1
  218. package/dist/src/server/speech/providers/openai/config.js +0 -80
  219. package/dist/src/server/speech/providers/openai/config.js.map +0 -1
  220. package/dist/src/server/speech/providers/openai/realtime-transcription-session.js +0 -168
  221. package/dist/src/server/speech/providers/openai/realtime-transcription-session.js.map +0 -1
  222. package/dist/src/server/speech/providers/openai/runtime.js +0 -112
  223. package/dist/src/server/speech/providers/openai/runtime.js.map +0 -1
  224. package/dist/src/server/speech/providers/openai/stt.js +0 -206
  225. package/dist/src/server/speech/providers/openai/stt.js.map +0 -1
  226. package/dist/src/server/speech/providers/openai/tts.js +0 -46
  227. package/dist/src/server/speech/providers/openai/tts.js.map +0 -1
  228. package/dist/src/server/speech/speech-config-resolver.js +0 -102
  229. package/dist/src/server/speech/speech-config-resolver.js.map +0 -1
  230. package/dist/src/server/speech/speech-provider.js +0 -2
  231. package/dist/src/server/speech/speech-provider.js.map +0 -1
  232. package/dist/src/server/speech/speech-runtime.js +0 -530
  233. package/dist/src/server/speech/speech-runtime.js.map +0 -1
  234. package/dist/src/server/speech/speech-types.js +0 -8
  235. package/dist/src/server/speech/speech-types.js.map +0 -1
  236. package/dist/src/server/speech/turn-detection-provider.js +0 -2
  237. package/dist/src/server/speech/turn-detection-provider.js.map +0 -1
  238. package/dist/src/server/utils/diff-highlighter.js +0 -257
  239. package/dist/src/server/utils/diff-highlighter.js.map +0 -1
  240. package/dist/src/server/voice/fixed-duration-pcm-ring-buffer.js +0 -35
  241. package/dist/src/server/voice/fixed-duration-pcm-ring-buffer.js.map +0 -1
  242. package/dist/src/server/voice/voice-turn-controller.js +0 -159
  243. package/dist/src/server/voice/voice-turn-controller.js.map +0 -1
  244. package/dist/src/server/voice-config.js +0 -51
  245. package/dist/src/server/voice-config.js.map +0 -1
  246. package/dist/src/server/voice-mcp-bridge-command.js +0 -31
  247. package/dist/src/server/voice-mcp-bridge-command.js.map +0 -1
  248. package/dist/src/server/voice-mcp-bridge.js +0 -109
  249. package/dist/src/server/voice-mcp-bridge.js.map +0 -1
  250. package/dist/src/server/voice-permission-policy.js +0 -13
  251. package/dist/src/server/voice-permission-policy.js.map +0 -1
  252. package/dist/src/server/voice-types.js +0 -2
  253. package/dist/src/server/voice-types.js.map +0 -1
  254. package/dist/src/server/websocket-server.js +0 -1048
  255. package/dist/src/server/websocket-server.js.map +0 -1
  256. package/dist/src/server/workspace-registry-bootstrap.js +0 -98
  257. package/dist/src/server/workspace-registry-bootstrap.js.map +0 -1
  258. package/dist/src/server/workspace-registry-model.js +0 -175
  259. package/dist/src/server/workspace-registry-model.js.map +0 -1
  260. package/dist/src/server/workspace-registry.js +0 -151
  261. package/dist/src/server/workspace-registry.js.map +0 -1
  262. package/dist/src/server/worktree-bootstrap.js +0 -508
  263. package/dist/src/server/worktree-bootstrap.js.map +0 -1
  264. package/dist/src/shared/agent-attention-notification.js +0 -130
  265. package/dist/src/shared/agent-attention-notification.js.map +0 -1
  266. package/dist/src/shared/agent-lifecycle.js +0 -8
  267. package/dist/src/shared/agent-lifecycle.js.map +0 -1
  268. package/dist/src/shared/connection-offer.js +0 -17
  269. package/dist/src/shared/connection-offer.js.map +0 -1
  270. package/dist/src/shared/daemon-endpoints.js +0 -122
  271. package/dist/src/shared/daemon-endpoints.js.map +0 -1
  272. package/dist/src/shared/messages.js +0 -2107
  273. package/dist/src/shared/messages.js.map +0 -1
  274. package/dist/src/shared/path-utils.js +0 -16
  275. package/dist/src/shared/path-utils.js.map +0 -1
  276. package/dist/src/shared/terminal-stream-protocol.js +0 -99
  277. package/dist/src/shared/terminal-stream-protocol.js.map +0 -1
  278. package/dist/src/shared/tool-call-display.js +0 -122
  279. package/dist/src/shared/tool-call-display.js.map +0 -1
  280. package/dist/src/terminal/terminal-manager.js +0 -136
  281. package/dist/src/terminal/terminal-manager.js.map +0 -1
  282. package/dist/src/terminal/terminal.js +0 -333
  283. package/dist/src/terminal/terminal.js.map +0 -1
  284. package/dist/src/utils/checkout-git.js +0 -1518
  285. package/dist/src/utils/checkout-git.js.map +0 -1
  286. package/dist/src/utils/directory-suggestions.js +0 -671
  287. package/dist/src/utils/directory-suggestions.js.map +0 -1
  288. package/dist/src/utils/path.js +0 -15
  289. package/dist/src/utils/path.js.map +0 -1
  290. package/dist/src/utils/project-icon.js +0 -389
  291. package/dist/src/utils/project-icon.js.map +0 -1
  292. package/dist/src/utils/worktree-metadata.js +0 -116
  293. package/dist/src/utils/worktree-metadata.js.map +0 -1
  294. package/dist/src/utils/worktree.js +0 -744
  295. package/dist/src/utils/worktree.js.map +0 -1
@@ -1,110 +0,0 @@
1
- import { EventEmitter } from "node:events";
2
- import { v4 as uuidv4 } from "uuid";
3
- import { pcm16lePeakAbs, pcm16leToFloat32 } from "../../../audio.js";
4
- export class SherpaRealtimeTranscriptionSession extends EventEmitter {
5
- constructor(params) {
6
- super();
7
- this.stream = null;
8
- this.connected = false;
9
- this.currentSegmentId = null;
10
- this.previousSegmentId = null;
11
- this.lastPartialText = "";
12
- this.engine = params.engine;
13
- this.requiredSampleRate = this.engine.sampleRate;
14
- this.tailPaddingMs = params.tailPaddingMs ?? 500;
15
- }
16
- async connect() {
17
- if (this.connected) {
18
- return;
19
- }
20
- this.stream = this.engine.createStream();
21
- this.currentSegmentId = uuidv4();
22
- this.connected = true;
23
- }
24
- appendPcm16(pcm16le) {
25
- if (!this.connected || !this.stream || !this.currentSegmentId) {
26
- this.emit("error", new Error("Sherpa realtime session not connected"));
27
- return;
28
- }
29
- try {
30
- const peak = pcm16lePeakAbs(pcm16le);
31
- const peakFloat = peak / 32768.0;
32
- const targetPeak = 0.6;
33
- const maxGain = 50;
34
- const gain = peakFloat > 0 && peakFloat < targetPeak ? Math.min(maxGain, targetPeak / peakFloat) : 1;
35
- const floatSamples = pcm16leToFloat32(pcm16le, gain);
36
- this.stream.acceptWaveform(this.engine.sampleRate, floatSamples);
37
- while (this.engine.recognizer.isReady(this.stream)) {
38
- this.engine.recognizer.decode(this.stream);
39
- }
40
- const text = String(this.engine.recognizer.getResult(this.stream)?.text ?? "").trim();
41
- if (text !== this.lastPartialText) {
42
- this.lastPartialText = text;
43
- this.emit("transcript", {
44
- segmentId: this.currentSegmentId,
45
- transcript: text,
46
- isFinal: false,
47
- });
48
- }
49
- }
50
- catch (err) {
51
- this.emit("error", err instanceof Error ? err : new Error(String(err)));
52
- }
53
- }
54
- commit() {
55
- if (!this.connected || !this.stream || !this.currentSegmentId) {
56
- this.emit("error", new Error("Sherpa realtime session not connected"));
57
- return;
58
- }
59
- try {
60
- const padSamples = Math.max(0, Math.round((this.engine.sampleRate * this.tailPaddingMs) / 1000));
61
- if (padSamples > 0) {
62
- this.stream.acceptWaveform(this.engine.sampleRate, new Float32Array(padSamples));
63
- }
64
- while (this.engine.recognizer.isReady(this.stream)) {
65
- this.engine.recognizer.decode(this.stream);
66
- }
67
- const finalText = String(this.engine.recognizer.getResult(this.stream)?.text ?? "").trim();
68
- const segmentId = this.currentSegmentId;
69
- const previousSegmentId = this.previousSegmentId;
70
- this.emit("committed", { segmentId, previousSegmentId });
71
- this.emit("transcript", { segmentId, transcript: finalText, isFinal: true });
72
- this.previousSegmentId = segmentId;
73
- this.currentSegmentId = uuidv4();
74
- this.lastPartialText = "";
75
- this.engine.recognizer.reset(this.stream);
76
- }
77
- catch (err) {
78
- this.emit("error", err instanceof Error ? err : new Error(String(err)));
79
- }
80
- }
81
- clear() {
82
- if (!this.connected || !this.stream) {
83
- return;
84
- }
85
- try {
86
- this.engine.recognizer.reset(this.stream);
87
- this.currentSegmentId = uuidv4();
88
- this.lastPartialText = "";
89
- }
90
- catch (err) {
91
- this.emit("error", err instanceof Error ? err : new Error(String(err)));
92
- }
93
- }
94
- close() {
95
- if (!this.stream) {
96
- return;
97
- }
98
- try {
99
- this.stream.free?.();
100
- }
101
- catch {
102
- // ignore
103
- }
104
- finally {
105
- this.stream = null;
106
- this.connected = false;
107
- }
108
- }
109
- }
110
- //# sourceMappingURL=sherpa-realtime-session.js.map
@@ -1 +0,0 @@
1
- {"version":3,"file":"sherpa-realtime-session.js","sourceRoot":"","sources":["../../../../../../../src/server/speech/providers/local/sherpa/sherpa-realtime-session.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,YAAY,EAAE,MAAM,aAAa,CAAC;AAC3C,OAAO,EAAE,EAAE,IAAI,MAAM,EAAE,MAAM,MAAM,CAAC;AAGpC,OAAO,EAAE,cAAc,EAAE,gBAAgB,EAAE,MAAM,mBAAmB,CAAC;AAGrE,MAAM,OAAO,kCACX,SAAQ,YAAY;IAapB,YAAY,MAAwE;QAClF,KAAK,EAAE,CAAC;QAVF,WAAM,GAAe,IAAI,CAAC;QAC1B,cAAS,GAAG,KAAK,CAAC;QAGlB,qBAAgB,GAAkB,IAAI,CAAC;QACvC,sBAAiB,GAAkB,IAAI,CAAC;QACxC,oBAAe,GAAG,EAAE,CAAC;QAK3B,IAAI,CAAC,MAAM,GAAG,MAAM,CAAC,MAAM,CAAC;QAC5B,IAAI,CAAC,kBAAkB,GAAG,IAAI,CAAC,MAAM,CAAC,UAAU,CAAC;QACjD,IAAI,CAAC,aAAa,GAAG,MAAM,CAAC,aAAa,IAAI,GAAG,CAAC;IACnD,CAAC;IAED,KAAK,CAAC,OAAO;QACX,IAAI,IAAI,CAAC,SAAS,EAAE,CAAC;YACnB,OAAO;QACT,CAAC;QACD,IAAI,CAAC,MAAM,GAAG,IAAI,CAAC,MAAM,CAAC,YAAY,EAAE,CAAC;QACzC,IAAI,CAAC,gBAAgB,GAAG,MAAM,EAAE,CAAC;QACjC,IAAI,CAAC,SAAS,GAAG,IAAI,CAAC;IACxB,CAAC;IAED,WAAW,CAAC,OAAe;QACzB,IAAI,CAAC,IAAI,CAAC,SAAS,IAAI,CAAC,IAAI,CAAC,MAAM,IAAI,CAAC,IAAI,CAAC,gBAAgB,EAAE,CAAC;YAC9D,IAAI,CAAC,IAAI,CAAC,OAAO,EAAE,IAAI,KAAK,CAAC,uCAAuC,CAAC,CAAC,CAAC;YACvE,OAAO;QACT,CAAC;QAED,IAAI,CAAC;YACH,MAAM,IAAI,GAAG,cAAc,CAAC,OAAO,CAAC,CAAC;YACrC,MAAM,SAAS,GAAG,IAAI,GAAG,OAAO,CAAC;YACjC,MAAM,UAAU,GAAG,GAAG,CAAC;YACvB,MAAM,OAAO,GAAG,EAAE,CAAC;YACnB,MAAM,IAAI,GACR,SAAS,GAAG,CAAC,IAAI,SAAS,GAAG,UAAU,CAAC,CAAC,CAAC,IAAI,CAAC,GAAG,CAAC,OAAO,EAAE,UAAU,GAAG,SAAS,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;YAC1F,MAAM,YAAY,GAAG,gBAAgB,CAAC,OAAO,EAAE,IAAI,CAAC,CAAC;YACrD,IAAI,CAAC,MAAM,CAAC,cAAc,CAAC,IAAI,CAAC,MAAM,CAAC,UAAU,EAAE,YAAY,CAAC,CAAC;YAEjE,OAAO,IAAI,CAAC,MAAM,CAAC,UAAU,CAAC,OAAO,CAAC,IAAI,CAAC,MAAM,CAAC,EAAE,CAAC;gBACnD,IAAI,CAAC,MAAM,CAAC,UAAU,CAAC,MAAM,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC;YAC7C,CAAC;YAED,MAAM,IAAI,GAAG,MAAM,CAAC,IAAI,CAAC,MAAM,CAAC,UAAU,CAAC,SAAS,CAAC,IAAI,CAAC,MAAM,CAAC,EAAE,IAAI,IAAI,EAAE,CAAC,CAAC,IAAI,EAAE,CAAC;YACtF,IAAI,IAAI,KAAK,IAAI,CAAC,eAAe,EAAE,CAAC;gBAClC,IAAI,CAAC,eAAe,GAAG,IAAI,CAAC;gBAC5B,IAAI,CAAC,IAAI,CAAC,YAAY,EAAE;oBACtB,SAAS,EAAE,IAAI,CAAC,gBAAgB;oBAChC,UAAU,EAAE,IAAI;oBAChB,OAAO,EAAE,KAAK;iBACf,CAAC,CAAC;YACL,CAAC;QACH,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACb,IAAI,CAAC,IAAI,CAAC,OAAO,EAAE,GAAG,YAAY,KAAK,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,IAAI,KAAK,CAAC,MAAM,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;QAC1E,CAAC;IACH,CAAC;IAED,MAAM;QACJ,IAAI,CAAC,IAAI,CAAC,SAAS,IAAI,CAAC,IAAI,CAAC,MAAM,IAAI,CAAC,IAAI,CAAC,gBAAgB,EAAE,CAAC;YAC9D,IAAI,CAAC,IAAI,CAAC,OAAO,EAAE,IAAI,KAAK,CAAC,uCAAuC,CAAC,CAAC,CAAC;YACvE,OAAO;QACT,CAAC;QAED,IAAI,CAAC;YACH,MAAM,UAAU,GAAG,IAAI,CAAC,GAAG,CACzB,CAAC,EACD,IAAI,CAAC,KAAK,CAAC,CAAC,IAAI,CAAC,MAAM,CAAC,UAAU,GAAG,IAAI,CAAC,aAAa,CAAC,GAAG,IAAI,CAAC,CACjE,CAAC;YACF,IAAI,UAAU,GAAG,CAAC,EAAE,CAAC;gBACnB,IAAI,CAAC,MAAM,CAAC,cAAc,CAAC,IAAI,CAAC,MAAM,CAAC,UAAU,EAAE,IAAI,YAAY,CAAC,UAAU,CAAC,CAAC,CAAC;YACnF,CAAC;YAED,OAAO,IAAI,CAAC,MAAM,CAAC,UAAU,CAAC,OAAO,CAAC,IAAI,CAAC,MAAM,CAAC,EAAE,CAAC;gBACnD,IAAI,CAAC,MAAM,CAAC,UAAU,CAAC,MAAM,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC;YAC7C,CAAC;YAED,MAAM,SAAS,GAAG,MAAM,CAAC,IAAI,CAAC,MAAM,CAAC,UAAU,CAAC,SAAS,CAAC,IAAI,CAAC,MAAM,CAAC,EAAE,IAAI,IAAI,EAAE,CAAC,CAAC,IAAI,EAAE,CAAC;YAC3F,MAAM,SAAS,GAAG,IAAI,CAAC,gBAAgB,CAAC;YACxC,MAAM,iBAAiB,GAAG,IAAI,CAAC,iBAAiB,CAAC;YAEjD,IAAI,CAAC,IAAI,CAAC,WAAW,EAAE,EAAE,SAAS,EAAE,iBAAiB,EAAE,CAAC,CAAC;YACzD,IAAI,CAAC,IAAI,CAAC,YAAY,EAAE,EAAE,SAAS,EAAE,UAAU,EAAE,SAAS,EAAE,OAAO,EAAE,IAAI,EAAE,CAAC,CAAC;YAE7E,IAAI,CAAC,iBAAiB,GAAG,SAAS,CAAC;YACnC,IAAI,CAAC,gBAAgB,GAAG,MAAM,EAAE,CAAC;YACjC,IAAI,CAAC,eAAe,GAAG,EAAE,CAAC;YAC1B,IAAI,CAAC,MAAM,CAAC,UAAU,CAAC,KAAK,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC;QAC5C,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACb,IAAI,CAAC,IAAI,CAAC,OAAO,EAAE,GAAG,YAAY,KAAK,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,IAAI,KAAK,CAAC,MAAM,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;QAC1E,CAAC;IACH,CAAC;IAED,KAAK;QACH,IAAI,CAAC,IAAI,CAAC,SAAS,IAAI,CAAC,IAAI,CAAC,MAAM,EAAE,CAAC;YACpC,OAAO;QACT,CAAC;QACD,IAAI,CAAC;YACH,IAAI,CAAC,MAAM,CAAC,UAAU,CAAC,KAAK,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC;YAC1C,IAAI,CAAC,gBAAgB,GAAG,MAAM,EAAE,CAAC;YACjC,IAAI,CAAC,eAAe,GAAG,EAAE,CAAC;QAC5B,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACb,IAAI,CAAC,IAAI,CAAC,OAAO,EAAE,GAAG,YAAY,KAAK,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,IAAI,KAAK,CAAC,MAAM,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;QAC1E,CAAC;IACH,CAAC;IAED,KAAK;QACH,IAAI,CAAC,IAAI,CAAC,MAAM,EAAE,CAAC;YACjB,OAAO;QACT,CAAC;QACD,IAAI,CAAC;YACH,IAAI,CAAC,MAAM,CAAC,IAAI,EAAE,EAAE,CAAC;QACvB,CAAC;QAAC,MAAM,CAAC;YACP,SAAS;QACX,CAAC;gBAAS,CAAC;YACT,IAAI,CAAC,MAAM,GAAG,IAAI,CAAC;YACnB,IAAI,CAAC,SAAS,GAAG,KAAK,CAAC;QACzB,CAAC;IACH,CAAC;CACF"}
@@ -1,138 +0,0 @@
1
- import { EventEmitter } from "node:events";
2
- import { v4 as uuidv4 } from "uuid";
3
- import { Pcm16MonoResampler } from "../../../../agent/pcm16-resampler.js";
4
- import { parsePcm16MonoWav, parsePcmRateFromFormat, pcm16lePeakAbs, pcm16leToFloat32, } from "../../../audio.js";
5
- export class SherpaOnnxSTT {
6
- constructor(config, logger) {
7
- this.id = "local";
8
- this.engine = config.engine;
9
- this.silencePeakThreshold = config.silencePeakThreshold ?? 300;
10
- this.tailPaddingMs = config.tailPaddingMs ?? 500;
11
- this.logger = logger.child({ module: "speech", provider: "local", component: "stt" });
12
- }
13
- createSession(params) {
14
- const emitter = new EventEmitter();
15
- void params;
16
- const requiredSampleRate = this.engine.sampleRate;
17
- let connected = false;
18
- let segmentId = uuidv4();
19
- let previousSegmentId = null;
20
- let pcm16 = Buffer.alloc(0);
21
- return {
22
- requiredSampleRate,
23
- async connect() {
24
- connected = true;
25
- },
26
- appendPcm16(chunk) {
27
- if (!connected) {
28
- emitter.emit("error", new Error("STT session not connected"));
29
- return;
30
- }
31
- pcm16 = pcm16.length === 0 ? chunk : Buffer.concat([pcm16, chunk]);
32
- },
33
- commit: () => {
34
- if (!connected) {
35
- emitter.emit("error", new Error("STT session not connected"));
36
- return;
37
- }
38
- const committedId = segmentId;
39
- const prev = previousSegmentId;
40
- emitter.emit("committed", { segmentId: committedId, previousSegmentId: prev });
41
- void (async () => {
42
- try {
43
- const rt = await this.transcribeAudio(pcm16, `audio/pcm;rate=${requiredSampleRate}`);
44
- emitter.emit("transcript", {
45
- segmentId: committedId,
46
- transcript: rt.text,
47
- isFinal: true,
48
- language: rt.language,
49
- logprobs: rt.logprobs,
50
- avgLogprob: rt.avgLogprob,
51
- isLowConfidence: rt.isLowConfidence,
52
- });
53
- }
54
- catch (err) {
55
- emitter.emit("error", err);
56
- }
57
- finally {
58
- previousSegmentId = committedId;
59
- segmentId = uuidv4();
60
- pcm16 = Buffer.alloc(0);
61
- }
62
- })();
63
- },
64
- clear() {
65
- pcm16 = Buffer.alloc(0);
66
- segmentId = uuidv4();
67
- },
68
- close() {
69
- connected = false;
70
- pcm16 = Buffer.alloc(0);
71
- },
72
- on(event, handler) {
73
- emitter.on(event, handler);
74
- return undefined;
75
- },
76
- };
77
- }
78
- async transcribeAudio(audioBuffer, format) {
79
- const start = Date.now();
80
- let inputRate;
81
- let pcm16;
82
- if (format.toLowerCase().includes("audio/wav")) {
83
- const parsed = parsePcm16MonoWav(audioBuffer);
84
- inputRate = parsed.sampleRate;
85
- pcm16 = parsed.pcm16;
86
- }
87
- else if (format.toLowerCase().includes("audio/pcm")) {
88
- inputRate = parsePcmRateFromFormat(format, this.engine.sampleRate) ?? this.engine.sampleRate;
89
- pcm16 = audioBuffer;
90
- }
91
- else {
92
- throw new Error(`Unsupported audio format for sherpa STT: ${format}`);
93
- }
94
- const peak = pcm16lePeakAbs(pcm16);
95
- if (peak < this.silencePeakThreshold) {
96
- return { text: "", duration: Date.now() - start, isLowConfidence: true };
97
- }
98
- let pcmForModel = pcm16;
99
- if (inputRate !== this.engine.sampleRate) {
100
- const resampler = new Pcm16MonoResampler({ inputRate, outputRate: this.engine.sampleRate });
101
- pcmForModel = resampler.processChunk(pcm16);
102
- inputRate = this.engine.sampleRate;
103
- }
104
- const peakForModel = pcm16lePeakAbs(pcmForModel);
105
- const peakFloat = peakForModel / 32768.0;
106
- const targetPeak = 0.6;
107
- const maxGain = 50;
108
- const gain = peakFloat > 0 && peakFloat < targetPeak ? Math.min(maxGain, targetPeak / peakFloat) : 1;
109
- const stream = this.engine.createStream();
110
- try {
111
- const floatSamples = pcm16leToFloat32(pcmForModel, gain);
112
- stream.acceptWaveform(inputRate, floatSamples);
113
- while (this.engine.recognizer.isReady(stream)) {
114
- this.engine.recognizer.decode(stream);
115
- }
116
- const padSamples = Math.max(0, Math.round((this.engine.sampleRate * this.tailPaddingMs) / 1000));
117
- if (padSamples > 0) {
118
- stream.acceptWaveform(this.engine.sampleRate, new Float32Array(padSamples));
119
- }
120
- while (this.engine.recognizer.isReady(stream)) {
121
- this.engine.recognizer.decode(stream);
122
- }
123
- const text = String(this.engine.recognizer.getResult(stream)?.text ?? "").trim();
124
- const duration = Date.now() - start;
125
- this.logger.debug({ duration, textLength: text.length }, "Sherpa transcription complete");
126
- return { text, duration, ...(text.length === 0 ? { isLowConfidence: true } : {}) };
127
- }
128
- finally {
129
- try {
130
- stream.free?.();
131
- }
132
- catch {
133
- // ignore
134
- }
135
- }
136
- }
137
- }
138
- //# sourceMappingURL=sherpa-stt.js.map
@@ -1 +0,0 @@
1
- {"version":3,"file":"sherpa-stt.js","sourceRoot":"","sources":["../../../../../../../src/server/speech/providers/local/sherpa/sherpa-stt.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,YAAY,EAAE,MAAM,aAAa,CAAC;AAC3C,OAAO,EAAE,EAAE,IAAI,MAAM,EAAE,MAAM,MAAM,CAAC;AAQpC,OAAO,EAAE,kBAAkB,EAAE,MAAM,sCAAsC,CAAC;AAC1E,OAAO,EACL,iBAAiB,EACjB,sBAAsB,EACtB,cAAc,EACd,gBAAgB,GACjB,MAAM,mBAAmB,CAAC;AAS3B,MAAM,OAAO,aAAa;IAOxB,YAAY,MAAuB,EAAE,MAAmB;QAFxC,OAAE,GAAG,OAAgB,CAAC;QAGpC,IAAI,CAAC,MAAM,GAAG,MAAM,CAAC,MAAM,CAAC;QAC5B,IAAI,CAAC,oBAAoB,GAAG,MAAM,CAAC,oBAAoB,IAAI,GAAG,CAAC;QAC/D,IAAI,CAAC,aAAa,GAAG,MAAM,CAAC,aAAa,IAAI,GAAG,CAAC;QACjD,IAAI,CAAC,MAAM,GAAG,MAAM,CAAC,KAAK,CAAC,EAAE,MAAM,EAAE,QAAQ,EAAE,QAAQ,EAAE,OAAO,EAAE,SAAS,EAAE,KAAK,EAAE,CAAC,CAAC;IACxF,CAAC;IAEM,aAAa,CAAC,MAIpB;QACC,MAAM,OAAO,GAAG,IAAI,YAAY,EAAE,CAAC;QACnC,KAAK,MAAM,CAAC;QACZ,MAAM,kBAAkB,GAAG,IAAI,CAAC,MAAM,CAAC,UAAU,CAAC;QAClD,IAAI,SAAS,GAAG,KAAK,CAAC;QACtB,IAAI,SAAS,GAAG,MAAM,EAAE,CAAC;QACzB,IAAI,iBAAiB,GAAkB,IAAI,CAAC;QAC5C,IAAI,KAAK,GAAW,MAAM,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC;QAEpC,OAAO;YACL,kBAAkB;YAClB,KAAK,CAAC,OAAO;gBACX,SAAS,GAAG,IAAI,CAAC;YACnB,CAAC;YACD,WAAW,CAAC,KAAa;gBACvB,IAAI,CAAC,SAAS,EAAE,CAAC;oBACd,OAAe,CAAC,IAAI,CAAC,OAAO,EAAE,IAAI,KAAK,CAAC,2BAA2B,CAAC,CAAC,CAAC;oBACvE,OAAO;gBACT,CAAC;gBACD,KAAK,GAAG,KAAK,CAAC,MAAM,KAAK,CAAC,CAAC,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC,MAAM,CAAC,MAAM,CAAC,CAAC,KAAK,EAAE,KAAK,CAAC,CAAC,CAAC;YACrE,CAAC;YACD,MAAM,EAAE,GAAG,EAAE;gBACX,IAAI,CAAC,SAAS,EAAE,CAAC;oBACd,OAAe,CAAC,IAAI,CAAC,OAAO,EAAE,IAAI,KAAK,CAAC,2BAA2B,CAAC,CAAC,CAAC;oBACvE,OAAO;gBACT,CAAC;gBAED,MAAM,WAAW,GAAG,SAAS,CAAC;gBAC9B,MAAM,IAAI,GAAG,iBAAiB,CAAC;gBAC9B,OAAe,CAAC,IAAI,CAAC,WAAW,EAAE,EAAE,SAAS,EAAE,WAAW,EAAE,iBAAiB,EAAE,IAAI,EAAE,CAAC,CAAC;gBAExF,KAAK,CAAC,KAAK,IAAI,EAAE;oBACf,IAAI,CAAC;wBACH,MAAM,EAAE,GAAG,MAAM,IAAI,CAAC,eAAe,CAAC,KAAK,EAAE,kBAAkB,kBAAkB,EAAE,CAAC,CAAC;wBACpF,OAAe,CAAC,IAAI,CAAC,YAAY,EAAE;4BAClC,SAAS,EAAE,WAAW;4BACtB,UAAU,EAAE,EAAE,CAAC,IAAI;4BACnB,OAAO,EAAE,IAAI;4BACb,QAAQ,EAAE,EAAE,CAAC,QAAQ;4BACrB,QAAQ,EAAE,EAAE,CAAC,QAAQ;4BACrB,UAAU,EAAE,EAAE,CAAC,UAAU;4BACzB,eAAe,EAAE,EAAE,CAAC,eAAe;yBACpC,CAAC,CAAC;oBACL,CAAC;oBAAC,OAAO,GAAG,EAAE,CAAC;wBACZ,OAAe,CAAC,IAAI,CAAC,OAAO,EAAE,GAAG,CAAC,CAAC;oBACtC,CAAC;4BAAS,CAAC;wBACT,iBAAiB,GAAG,WAAW,CAAC;wBAChC,SAAS,GAAG,MAAM,EAAE,CAAC;wBACrB,KAAK,GAAG,MAAM,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC;oBAC1B,CAAC;gBACH,CAAC,CAAC,EAAE,CAAC;YACP,CAAC;YACD,KAAK;gBACH,KAAK,GAAG,MAAM,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC;gBACxB,SAAS,GAAG,MAAM,EAAE,CAAC;YACvB,CAAC;YACD,KAAK;gBACH,SAAS,GAAG,KAAK,CAAC;gBAClB,KAAK,GAAG,MAAM,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC;YAC1B,CAAC;YACD,EAAE,CAAC,KAAU,EAAE,OAAY;gBACzB,OAAO,CAAC,EAAE,CAAC,KAAK,EAAE,OAAO,CAAC,CAAC;gBAC3B,OAAO,SAAS,CAAC;YACnB,CAAC;SACF,CAAC;IACJ,CAAC;IAEM,KAAK,CAAC,eAAe,CAAC,WAAmB,EAAE,MAAc;QAC9D,MAAM,KAAK,GAAG,IAAI,CAAC,GAAG,EAAE,CAAC;QAEzB,IAAI,SAAiB,CAAC;QACtB,IAAI,KAAa,CAAC;QAElB,IAAI,MAAM,CAAC,WAAW,EAAE,CAAC,QAAQ,CAAC,WAAW,CAAC,EAAE,CAAC;YAC/C,MAAM,MAAM,GAAG,iBAAiB,CAAC,WAAW,CAAC,CAAC;YAC9C,SAAS,GAAG,MAAM,CAAC,UAAU,CAAC;YAC9B,KAAK,GAAG,MAAM,CAAC,KAAK,CAAC;QACvB,CAAC;aAAM,IAAI,MAAM,CAAC,WAAW,EAAE,CAAC,QAAQ,CAAC,WAAW,CAAC,EAAE,CAAC;YACtD,SAAS,GAAG,sBAAsB,CAAC,MAAM,EAAE,IAAI,CAAC,MAAM,CAAC,UAAU,CAAC,IAAI,IAAI,CAAC,MAAM,CAAC,UAAU,CAAC;YAC7F,KAAK,GAAG,WAAW,CAAC;QACtB,CAAC;aAAM,CAAC;YACN,MAAM,IAAI,KAAK,CAAC,4CAA4C,MAAM,EAAE,CAAC,CAAC;QACxE,CAAC;QAED,MAAM,IAAI,GAAG,cAAc,CAAC,KAAK,CAAC,CAAC;QACnC,IAAI,IAAI,GAAG,IAAI,CAAC,oBAAoB,EAAE,CAAC;YACrC,OAAO,EAAE,IAAI,EAAE,EAAE,EAAE,QAAQ,EAAE,IAAI,CAAC,GAAG,EAAE,GAAG,KAAK,EAAE,eAAe,EAAE,IAAI,EAAE,CAAC;QAC3E,CAAC;QAED,IAAI,WAAW,GAAG,KAAK,CAAC;QACxB,IAAI,SAAS,KAAK,IAAI,CAAC,MAAM,CAAC,UAAU,EAAE,CAAC;YACzC,MAAM,SAAS,GAAG,IAAI,kBAAkB,CAAC,EAAE,SAAS,EAAE,UAAU,EAAE,IAAI,CAAC,MAAM,CAAC,UAAU,EAAE,CAAC,CAAC;YAC5F,WAAW,GAAG,SAAS,CAAC,YAAY,CAAC,KAAK,CAAC,CAAC;YAC5C,SAAS,GAAG,IAAI,CAAC,MAAM,CAAC,UAAU,CAAC;QACrC,CAAC;QAED,MAAM,YAAY,GAAG,cAAc,CAAC,WAAW,CAAC,CAAC;QACjD,MAAM,SAAS,GAAG,YAAY,GAAG,OAAO,CAAC;QACzC,MAAM,UAAU,GAAG,GAAG,CAAC;QACvB,MAAM,OAAO,GAAG,EAAE,CAAC;QACnB,MAAM,IAAI,GACR,SAAS,GAAG,CAAC,IAAI,SAAS,GAAG,UAAU,CAAC,CAAC,CAAC,IAAI,CAAC,GAAG,CAAC,OAAO,EAAE,UAAU,GAAG,SAAS,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;QAE1F,MAAM,MAAM,GAAG,IAAI,CAAC,MAAM,CAAC,YAAY,EAAE,CAAC;QAC1C,IAAI,CAAC;YACH,MAAM,YAAY,GAAG,gBAAgB,CAAC,WAAW,EAAE,IAAI,CAAC,CAAC;YACzD,MAAM,CAAC,cAAc,CAAC,SAAS,EAAE,YAAY,CAAC,CAAC;YAE/C,OAAO,IAAI,CAAC,MAAM,CAAC,UAAU,CAAC,OAAO,CAAC,MAAM,CAAC,EAAE,CAAC;gBAC9C,IAAI,CAAC,MAAM,CAAC,UAAU,CAAC,MAAM,CAAC,MAAM,CAAC,CAAC;YACxC,CAAC;YAED,MAAM,UAAU,GAAG,IAAI,CAAC,GAAG,CACzB,CAAC,EACD,IAAI,CAAC,KAAK,CAAC,CAAC,IAAI,CAAC,MAAM,CAAC,UAAU,GAAG,IAAI,CAAC,aAAa,CAAC,GAAG,IAAI,CAAC,CACjE,CAAC;YACF,IAAI,UAAU,GAAG,CAAC,EAAE,CAAC;gBACnB,MAAM,CAAC,cAAc,CAAC,IAAI,CAAC,MAAM,CAAC,UAAU,EAAE,IAAI,YAAY,CAAC,UAAU,CAAC,CAAC,CAAC;YAC9E,CAAC;YAED,OAAO,IAAI,CAAC,MAAM,CAAC,UAAU,CAAC,OAAO,CAAC,MAAM,CAAC,EAAE,CAAC;gBAC9C,IAAI,CAAC,MAAM,CAAC,UAAU,CAAC,MAAM,CAAC,MAAM,CAAC,CAAC;YACxC,CAAC;YAED,MAAM,IAAI,GAAG,MAAM,CAAC,IAAI,CAAC,MAAM,CAAC,UAAU,CAAC,SAAS,CAAC,MAAM,CAAC,EAAE,IAAI,IAAI,EAAE,CAAC,CAAC,IAAI,EAAE,CAAC;YACjF,MAAM,QAAQ,GAAG,IAAI,CAAC,GAAG,EAAE,GAAG,KAAK,CAAC;YACpC,IAAI,CAAC,MAAM,CAAC,KAAK,CAAC,EAAE,QAAQ,EAAE,UAAU,EAAE,IAAI,CAAC,MAAM,EAAE,EAAE,+BAA+B,CAAC,CAAC;YAC1F,OAAO,EAAE,IAAI,EAAE,QAAQ,EAAE,GAAG,CAAC,IAAI,CAAC,MAAM,KAAK,CAAC,CAAC,CAAC,CAAC,EAAE,eAAe,EAAE,IAAI,EAAE,CAAC,CAAC,CAAC,EAAE,CAAC,EAAE,CAAC;QACrF,CAAC;gBAAS,CAAC;YACT,IAAI,CAAC;gBACH,MAAM,CAAC,IAAI,EAAE,EAAE,CAAC;YAClB,CAAC;YAAC,MAAM,CAAC;gBACP,SAAS;YACX,CAAC;QACH,CAAC;IACH,CAAC;CACF"}
@@ -1,98 +0,0 @@
1
- import { Readable } from "node:stream";
2
- import { existsSync } from "node:fs";
3
- import { chunkBuffer, float32ToPcm16le } from "../../../audio.js";
4
- import { loadSherpaOnnxNode } from "./sherpa-onnx-node-loader.js";
5
- function assertFileExists(filePath, label) {
6
- if (!existsSync(filePath)) {
7
- throw new Error(`Missing ${label}: ${filePath}`);
8
- }
9
- }
10
- export class SherpaOnnxTTS {
11
- constructor(config, logger) {
12
- if (config.preset !== "kokoro-en-v0_19" && config.preset !== "kitten-nano-en-v0_1-fp16") {
13
- throw new Error(`Unsupported Sherpa TTS preset: ${config.preset}`);
14
- }
15
- this.logger = logger.child({ module: "speech", provider: "local", component: "tts" });
16
- this.speakerId = config.speakerId ?? 0;
17
- this.speed = config.speed ?? 1.0;
18
- const sherpa = loadSherpaOnnxNode();
19
- if (typeof sherpa.OfflineTts !== "function") {
20
- throw new Error("sherpa-onnx-node OfflineTts is unavailable");
21
- }
22
- const modelFile = config.preset === "kokoro-en-v0_19" ? "model.onnx" : "model.fp16.onnx";
23
- const modelPath = `${config.modelDir}/${modelFile}`;
24
- const voicesPath = `${config.modelDir}/voices.bin`;
25
- const tokensPath = `${config.modelDir}/tokens.txt`;
26
- const dataDir = `${config.modelDir}/espeak-ng-data`;
27
- assertFileExists(modelPath, "TTS model");
28
- assertFileExists(voicesPath, "TTS voices");
29
- assertFileExists(tokensPath, "TTS tokens");
30
- assertFileExists(dataDir, "TTS espeak-ng dataDir");
31
- const modelConfig = config.preset === "kokoro-en-v0_19"
32
- ? {
33
- kokoro: {
34
- model: modelPath,
35
- voices: voicesPath,
36
- tokens: tokensPath,
37
- dataDir,
38
- lengthScale: config.lengthScale ?? 1.0,
39
- },
40
- }
41
- : {
42
- kitten: {
43
- model: modelPath,
44
- voices: voicesPath,
45
- tokens: tokensPath,
46
- dataDir,
47
- lengthScale: config.lengthScale ?? 1.0,
48
- },
49
- };
50
- const offlineTtsConfig = {
51
- model: modelConfig,
52
- numThreads: config.numThreads ?? 2,
53
- provider: "cpu",
54
- maxNumSentences: 1,
55
- };
56
- this.tts = new sherpa.OfflineTts(offlineTtsConfig);
57
- this.logger.info({ preset: config.preset, modelDir: config.modelDir }, "Sherpa offline TTS initialized");
58
- }
59
- async synthesizeSpeech(text) {
60
- const trimmed = text.trim();
61
- if (!trimmed) {
62
- throw new Error("Cannot synthesize empty text");
63
- }
64
- const audio = this.tts.generate({ text: trimmed, sid: this.speakerId, speed: this.speed });
65
- const samples = audio && audio.samples instanceof Float32Array
66
- ? audio.samples
67
- : audio && Array.isArray(audio.samples)
68
- ? Float32Array.from(audio.samples)
69
- : null;
70
- const sampleRate = audio &&
71
- typeof audio.sampleRate === "number" &&
72
- Number.isFinite(audio.sampleRate) &&
73
- audio.sampleRate > 0
74
- ? audio.sampleRate
75
- : typeof this.tts.sampleRate === "number"
76
- ? this.tts.sampleRate
77
- : 24000;
78
- if (!samples) {
79
- throw new Error("Unexpected sherpa TTS output: missing Float32 samples");
80
- }
81
- const pcm16 = float32ToPcm16le(samples);
82
- const chunkBytes = Math.max(2, Math.round(sampleRate * 0.05) * 2); // ~50ms
83
- const chunks = chunkBuffer(pcm16, chunkBytes);
84
- return {
85
- stream: Readable.from(chunks),
86
- format: `pcm;rate=${sampleRate}`,
87
- };
88
- }
89
- free() {
90
- try {
91
- this.tts?.free?.();
92
- }
93
- catch {
94
- // ignore
95
- }
96
- }
97
- }
98
- //# sourceMappingURL=sherpa-tts.js.map
@@ -1 +0,0 @@
1
- {"version":3,"file":"sherpa-tts.js","sourceRoot":"","sources":["../../../../../../../src/server/speech/providers/local/sherpa/sherpa-tts.ts"],"names":[],"mappings":"AACA,OAAO,EAAE,QAAQ,EAAE,MAAM,aAAa,CAAC;AACvC,OAAO,EAAE,UAAU,EAAE,MAAM,SAAS,CAAC;AAGrC,OAAO,EAAE,WAAW,EAAE,gBAAgB,EAAE,MAAM,mBAAmB,CAAC;AAClE,OAAO,EAAE,kBAAkB,EAAE,MAAM,8BAA8B,CAAC;AAalE,SAAS,gBAAgB,CAAC,QAAgB,EAAE,KAAa;IACvD,IAAI,CAAC,UAAU,CAAC,QAAQ,CAAC,EAAE,CAAC;QAC1B,MAAM,IAAI,KAAK,CAAC,WAAW,KAAK,KAAK,QAAQ,EAAE,CAAC,CAAC;IACnD,CAAC;AACH,CAAC;AAED,MAAM,OAAO,aAAa;IAMxB,YAAY,MAAuB,EAAE,MAAmB;QACtD,IAAI,MAAM,CAAC,MAAM,KAAK,iBAAiB,IAAI,MAAM,CAAC,MAAM,KAAK,0BAA0B,EAAE,CAAC;YACxF,MAAM,IAAI,KAAK,CAAC,kCAAkC,MAAM,CAAC,MAAM,EAAE,CAAC,CAAC;QACrE,CAAC;QACD,IAAI,CAAC,MAAM,GAAG,MAAM,CAAC,KAAK,CAAC,EAAE,MAAM,EAAE,QAAQ,EAAE,QAAQ,EAAE,OAAO,EAAE,SAAS,EAAE,KAAK,EAAE,CAAC,CAAC;QACtF,IAAI,CAAC,SAAS,GAAG,MAAM,CAAC,SAAS,IAAI,CAAC,CAAC;QACvC,IAAI,CAAC,KAAK,GAAG,MAAM,CAAC,KAAK,IAAI,GAAG,CAAC;QAEjC,MAAM,MAAM,GAAG,kBAAkB,EAAE,CAAC;QACpC,IAAI,OAAO,MAAM,CAAC,UAAU,KAAK,UAAU,EAAE,CAAC;YAC5C,MAAM,IAAI,KAAK,CAAC,4CAA4C,CAAC,CAAC;QAChE,CAAC;QAED,MAAM,SAAS,GAAG,MAAM,CAAC,MAAM,KAAK,iBAAiB,CAAC,CAAC,CAAC,YAAY,CAAC,CAAC,CAAC,iBAAiB,CAAC;QACzF,MAAM,SAAS,GAAG,GAAG,MAAM,CAAC,QAAQ,IAAI,SAAS,EAAE,CAAC;QACpD,MAAM,UAAU,GAAG,GAAG,MAAM,CAAC,QAAQ,aAAa,CAAC;QACnD,MAAM,UAAU,GAAG,GAAG,MAAM,CAAC,QAAQ,aAAa,CAAC;QACnD,MAAM,OAAO,GAAG,GAAG,MAAM,CAAC,QAAQ,iBAAiB,CAAC;QAEpD,gBAAgB,CAAC,SAAS,EAAE,WAAW,CAAC,CAAC;QACzC,gBAAgB,CAAC,UAAU,EAAE,YAAY,CAAC,CAAC;QAC3C,gBAAgB,CAAC,UAAU,EAAE,YAAY,CAAC,CAAC;QAC3C,gBAAgB,CAAC,OAAO,EAAE,uBAAuB,CAAC,CAAC;QAEnD,MAAM,WAAW,GACf,MAAM,CAAC,MAAM,KAAK,iBAAiB;YACjC,CAAC,CAAC;gBACE,MAAM,EAAE;oBACN,KAAK,EAAE,SAAS;oBAChB,MAAM,EAAE,UAAU;oBAClB,MAAM,EAAE,UAAU;oBAClB,OAAO;oBACP,WAAW,EAAE,MAAM,CAAC,WAAW,IAAI,GAAG;iBACvC;aACF;YACH,CAAC,CAAC;gBACE,MAAM,EAAE;oBACN,KAAK,EAAE,SAAS;oBAChB,MAAM,EAAE,UAAU;oBAClB,MAAM,EAAE,UAAU;oBAClB,OAAO;oBACP,WAAW,EAAE,MAAM,CAAC,WAAW,IAAI,GAAG;iBACvC;aACF,CAAC;QAER,MAAM,gBAAgB,GAAG;YACvB,KAAK,EAAE,WAAW;YAClB,UAAU,EAAE,MAAM,CAAC,UAAU,IAAI,CAAC;YAClC,QAAQ,EAAE,KAAK;YACf,eAAe,EAAE,CAAC;SACnB,CAAC;QAEF,IAAI,CAAC,GAAG,GAAG,IAAI,MAAM,CAAC,UAAU,CAAC,gBAAgB,CAAC,CAAC;QACnD,IAAI,CAAC,MAAM,CAAC,IAAI,CACd,EAAE,MAAM,EAAE,MAAM,CAAC,MAAM,EAAE,QAAQ,EAAE,MAAM,CAAC,QAAQ,EAAE,EACpD,gCAAgC,CACjC,CAAC;IACJ,CAAC;IAED,KAAK,CAAC,gBAAgB,CAAC,IAAY;QACjC,MAAM,OAAO,GAAG,IAAI,CAAC,IAAI,EAAE,CAAC;QAC5B,IAAI,CAAC,OAAO,EAAE,CAAC;YACb,MAAM,IAAI,KAAK,CAAC,8BAA8B,CAAC,CAAC;QAClD,CAAC;QAED,MAAM,KAAK,GAAG,IAAI,CAAC,GAAG,CAAC,QAAQ,CAAC,EAAE,IAAI,EAAE,OAAO,EAAE,GAAG,EAAE,IAAI,CAAC,SAAS,EAAE,KAAK,EAAE,IAAI,CAAC,KAAK,EAAE,CAAC,CAAC;QAC3F,MAAM,OAAO,GACX,KAAK,IAAI,KAAK,CAAC,OAAO,YAAY,YAAY;YAC5C,CAAC,CAAC,KAAK,CAAC,OAAO;YACf,CAAC,CAAC,KAAK,IAAI,KAAK,CAAC,OAAO,CAAC,KAAK,CAAC,OAAO,CAAC;gBACrC,CAAC,CAAC,YAAY,CAAC,IAAI,CAAC,KAAK,CAAC,OAAmB,CAAC;gBAC9C,CAAC,CAAC,IAAI,CAAC;QACb,MAAM,UAAU,GACd,KAAK;YACL,OAAO,KAAK,CAAC,UAAU,KAAK,QAAQ;YACpC,MAAM,CAAC,QAAQ,CAAC,KAAK,CAAC,UAAU,CAAC;YACjC,KAAK,CAAC,UAAU,GAAG,CAAC;YAClB,CAAC,CAAC,KAAK,CAAC,UAAU;YAClB,CAAC,CAAC,OAAO,IAAI,CAAC,GAAG,CAAC,UAAU,KAAK,QAAQ;gBACvC,CAAC,CAAC,IAAI,CAAC,GAAG,CAAC,UAAU;gBACrB,CAAC,CAAC,KAAK,CAAC;QAEd,IAAI,CAAC,OAAO,EAAE,CAAC;YACb,MAAM,IAAI,KAAK,CAAC,uDAAuD,CAAC,CAAC;QAC3E,CAAC;QAED,MAAM,KAAK,GAAG,gBAAgB,CAAC,OAAO,CAAC,CAAC;QACxC,MAAM,UAAU,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,KAAK,CAAC,UAAU,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,QAAQ;QAC3E,MAAM,MAAM,GAAG,WAAW,CAAC,KAAK,EAAE,UAAU,CAAC,CAAC;QAE9C,OAAO;YACL,MAAM,EAAE,QAAQ,CAAC,IAAI,CAAC,MAAM,CAAC;YAC7B,MAAM,EAAE,YAAY,UAAU,EAAE;SACjC,CAAC;IACJ,CAAC;IAED,IAAI;QACF,IAAI,CAAC;YACH,IAAI,CAAC,GAAG,EAAE,IAAI,EAAE,EAAE,CAAC;QACrB,CAAC;QAAC,MAAM,CAAC;YACP,SAAS;QACX,CAAC;IACH,CAAC;CACF"}
@@ -1,23 +0,0 @@
1
- import { SherpaSileroVadSession } from "./silero-vad-session.js";
2
- export class SherpaSileroTurnDetectionProvider {
3
- constructor(config, logger) {
4
- this.id = "local";
5
- this.config = config;
6
- this.logger = logger.child({
7
- module: "speech",
8
- provider: "local",
9
- component: "silero-vad",
10
- });
11
- }
12
- createSession(params) {
13
- this.logger.debug({ sampleRate: this.config.sampleRate, modelPath: this.config.modelPath }, "Creating Silero VAD turn-detection session");
14
- return new SherpaSileroVadSession({
15
- logger: params.logger.child({
16
- provider: "local",
17
- component: "silero-vad-session",
18
- }),
19
- config: this.config,
20
- });
21
- }
22
- }
23
- //# sourceMappingURL=silero-vad-provider.js.map
@@ -1 +0,0 @@
1
- {"version":3,"file":"silero-vad-provider.js","sourceRoot":"","sources":["../../../../../../../src/server/speech/providers/local/sherpa/silero-vad-provider.ts"],"names":[],"mappings":"AAMA,OAAO,EAAE,sBAAsB,EAAqC,MAAM,yBAAyB,CAAC;AAEpG,MAAM,OAAO,iCAAiC;IAM5C,YAAY,MAAoC,EAAE,MAAc;QALhD,OAAE,GAAG,OAAgB,CAAC;QAMpC,IAAI,CAAC,MAAM,GAAG,MAAM,CAAC;QACrB,IAAI,CAAC,MAAM,GAAG,MAAM,CAAC,KAAK,CAAC;YACzB,MAAM,EAAE,QAAQ;YAChB,QAAQ,EAAE,OAAO;YACjB,SAAS,EAAE,YAAY;SACxB,CAAC,CAAC;IACL,CAAC;IAED,aAAa,CAAC,MAA0B;QACtC,IAAI,CAAC,MAAM,CAAC,KAAK,CACf,EAAE,UAAU,EAAE,IAAI,CAAC,MAAM,CAAC,UAAU,EAAE,SAAS,EAAE,IAAI,CAAC,MAAM,CAAC,SAAS,EAAE,EACxE,4CAA4C,CAC7C,CAAC;QACF,OAAO,IAAI,sBAAsB,CAAC;YAChC,MAAM,EAAE,MAAM,CAAC,MAAM,CAAC,KAAK,CAAC;gBAC1B,QAAQ,EAAE,OAAO;gBACjB,SAAS,EAAE,oBAAoB;aAChC,CAAC;YACF,MAAM,EAAE,IAAI,CAAC,MAAM;SACpB,CAAC,CAAC;IACL,CAAC;CACF"}
@@ -1,107 +0,0 @@
1
- import { EventEmitter } from "node:events";
2
- import { fileURLToPath } from "node:url";
3
- import { pcm16leToFloat32 } from "../../../audio.js";
4
- import { loadSherpaOnnxNode } from "./sherpa-onnx-node-loader.js";
5
- const DEFAULT_SAMPLE_RATE = 16000;
6
- const DEFAULT_BUFFER_SIZE_SECONDS = 60;
7
- const DEFAULT_SILERO_THRESHOLD = 0.5;
8
- const DEFAULT_MIN_SILENCE_DURATION = 1.2;
9
- const DEFAULT_MIN_SPEECH_DURATION = 0.2;
10
- const DEFAULT_WINDOW_SIZE = 512;
11
- function resolveBundledSileroVadModelPath() {
12
- return fileURLToPath(new URL("./assets/silero_vad.onnx", import.meta.url));
13
- }
14
- export class SherpaSileroVadSession extends EventEmitter {
15
- constructor(params) {
16
- super();
17
- this.connected = false;
18
- this.inSpeech = false;
19
- this.logger = params.logger;
20
- const config = params.config ?? {};
21
- this.requiredSampleRate = config.sampleRate ?? DEFAULT_SAMPLE_RATE;
22
- this.windowSize = config.windowSize ?? DEFAULT_WINDOW_SIZE;
23
- const sherpa = loadSherpaOnnxNode();
24
- this.vad = new sherpa.Vad({
25
- sileroVad: {
26
- model: config.modelPath ?? resolveBundledSileroVadModelPath(),
27
- threshold: config.threshold ?? DEFAULT_SILERO_THRESHOLD,
28
- minSilenceDuration: config.minSilenceDuration ?? DEFAULT_MIN_SILENCE_DURATION,
29
- minSpeechDuration: config.minSpeechDuration ?? DEFAULT_MIN_SPEECH_DURATION,
30
- windowSize: config.windowSize ?? DEFAULT_WINDOW_SIZE,
31
- },
32
- sampleRate: this.requiredSampleRate,
33
- numThreads: 1,
34
- provider: "cpu",
35
- debug: 0,
36
- }, config.bufferSizeInSeconds ?? DEFAULT_BUFFER_SIZE_SECONDS);
37
- this.inputBuffer = new sherpa.CircularBuffer((config.bufferSizeInSeconds ?? DEFAULT_BUFFER_SIZE_SECONDS) * this.requiredSampleRate);
38
- }
39
- async connect() {
40
- this.connected = true;
41
- }
42
- appendPcm16(pcm16le) {
43
- if (!this.connected) {
44
- this.emit("error", new Error("Turn detection session not connected"));
45
- return;
46
- }
47
- if (pcm16le.length === 0) {
48
- return;
49
- }
50
- try {
51
- const samples = pcm16leToFloat32(pcm16le, 1);
52
- this.inputBuffer.push(samples);
53
- while (this.inputBuffer.size() > this.windowSize) {
54
- const window = this.inputBuffer.get(this.inputBuffer.head(), this.windowSize);
55
- this.inputBuffer.pop(this.windowSize);
56
- this.vad.acceptWaveform(window);
57
- this.syncDetectionState();
58
- }
59
- }
60
- catch (error) {
61
- this.emit("error", error instanceof Error ? error : new Error(String(error)));
62
- }
63
- }
64
- flush() {
65
- if (!this.connected) {
66
- return;
67
- }
68
- try {
69
- this.vad.flush();
70
- this.syncDetectionState();
71
- if (this.inSpeech) {
72
- this.inSpeech = false;
73
- this.emit("speech_stopped");
74
- }
75
- }
76
- catch (error) {
77
- this.emit("error", error instanceof Error ? error : new Error(String(error)));
78
- }
79
- }
80
- close() {
81
- try {
82
- this.vad.reset();
83
- this.inputBuffer.reset();
84
- }
85
- catch {
86
- // ignore native cleanup failures
87
- }
88
- finally {
89
- this.connected = false;
90
- this.inSpeech = false;
91
- }
92
- }
93
- syncDetectionState() {
94
- const detected = this.vad.isDetected();
95
- if (detected && !this.inSpeech) {
96
- this.inSpeech = true;
97
- this.emit("speech_started");
98
- return;
99
- }
100
- if (!detected && this.inSpeech && !this.vad.isEmpty()) {
101
- this.logger.debug("Silero VAD marked end of speech");
102
- this.inSpeech = false;
103
- this.emit("speech_stopped");
104
- }
105
- }
106
- }
107
- //# sourceMappingURL=silero-vad-session.js.map
@@ -1 +0,0 @@
1
- {"version":3,"file":"silero-vad-session.js","sourceRoot":"","sources":["../../../../../../../src/server/speech/providers/local/sherpa/silero-vad-session.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,YAAY,EAAE,MAAM,aAAa,CAAC;AAC3C,OAAO,EAAE,aAAa,EAAE,MAAM,UAAU,CAAC;AAEzC,OAAO,EAAE,gBAAgB,EAAE,MAAM,mBAAmB,CAAC;AAErD,OAAO,EAAE,kBAAkB,EAAE,MAAM,8BAA8B,CAAC;AAElE,MAAM,mBAAmB,GAAG,KAAK,CAAC;AAClC,MAAM,2BAA2B,GAAG,EAAE,CAAC;AACvC,MAAM,wBAAwB,GAAG,GAAG,CAAC;AACrC,MAAM,4BAA4B,GAAG,GAAG,CAAC;AACzC,MAAM,2BAA2B,GAAG,GAAG,CAAC;AACxC,MAAM,mBAAmB,GAAG,GAAG,CAAC;AAwBhC,SAAS,gCAAgC;IACvC,OAAO,aAAa,CAAC,IAAI,GAAG,CAAC,0BAA0B,EAAE,MAAM,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC;AAC7E,CAAC;AAYD,MAAM,OAAO,sBAAuB,SAAQ,YAAY;IAUtD,YAAY,MAGX;QACC,KAAK,EAAE,CAAC;QARF,cAAS,GAAG,KAAK,CAAC;QAClB,aAAQ,GAAG,KAAK,CAAC;QAQvB,IAAI,CAAC,MAAM,GAAG,MAAM,CAAC,MAAM,CAAC;QAC5B,MAAM,MAAM,GAAG,MAAM,CAAC,MAAM,IAAI,EAAE,CAAC;QACnC,IAAI,CAAC,kBAAkB,GAAG,MAAM,CAAC,UAAU,IAAI,mBAAmB,CAAC;QACnE,IAAI,CAAC,UAAU,GAAG,MAAM,CAAC,UAAU,IAAI,mBAAmB,CAAC;QAE3D,MAAM,MAAM,GAAG,kBAAkB,EAAgC,CAAC;QAClE,IAAI,CAAC,GAAG,GAAG,IAAI,MAAM,CAAC,GAAG,CACvB;YACE,SAAS,EAAE;gBACT,KAAK,EAAE,MAAM,CAAC,SAAS,IAAI,gCAAgC,EAAE;gBAC7D,SAAS,EAAE,MAAM,CAAC,SAAS,IAAI,wBAAwB;gBACvD,kBAAkB,EAAE,MAAM,CAAC,kBAAkB,IAAI,4BAA4B;gBAC7E,iBAAiB,EAAE,MAAM,CAAC,iBAAiB,IAAI,2BAA2B;gBAC1E,UAAU,EAAE,MAAM,CAAC,UAAU,IAAI,mBAAmB;aACrD;YACD,UAAU,EAAE,IAAI,CAAC,kBAAkB;YACnC,UAAU,EAAE,CAAC;YACb,QAAQ,EAAE,KAAK;YACf,KAAK,EAAE,CAAC;SACT,EACD,MAAM,CAAC,mBAAmB,IAAI,2BAA2B,CAC1D,CAAC;QACF,IAAI,CAAC,WAAW,GAAG,IAAI,MAAM,CAAC,cAAc,CAC1C,CAAC,MAAM,CAAC,mBAAmB,IAAI,2BAA2B,CAAC,GAAG,IAAI,CAAC,kBAAkB,CACtF,CAAC;IACJ,CAAC;IAED,KAAK,CAAC,OAAO;QACX,IAAI,CAAC,SAAS,GAAG,IAAI,CAAC;IACxB,CAAC;IAED,WAAW,CAAC,OAAe;QACzB,IAAI,CAAC,IAAI,CAAC,SAAS,EAAE,CAAC;YACpB,IAAI,CAAC,IAAI,CAAC,OAAO,EAAE,IAAI,KAAK,CAAC,sCAAsC,CAAC,CAAC,CAAC;YACtE,OAAO;QACT,CAAC;QACD,IAAI,OAAO,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;YACzB,OAAO;QACT,CAAC;QAED,IAAI,CAAC;YACH,MAAM,OAAO,GAAG,gBAAgB,CAAC,OAAO,EAAE,CAAC,CAAC,CAAC;YAC7C,IAAI,CAAC,WAAW,CAAC,IAAI,CAAC,OAAO,CAAC,CAAC;YAC/B,OAAO,IAAI,CAAC,WAAW,CAAC,IAAI,EAAE,GAAG,IAAI,CAAC,UAAU,EAAE,CAAC;gBACjD,MAAM,MAAM,GAAG,IAAI,CAAC,WAAW,CAAC,GAAG,CAAC,IAAI,CAAC,WAAW,CAAC,IAAI,EAAE,EAAE,IAAI,CAAC,UAAU,CAAC,CAAC;gBAC9E,IAAI,CAAC,WAAW,CAAC,GAAG,CAAC,IAAI,CAAC,UAAU,CAAC,CAAC;gBACtC,IAAI,CAAC,GAAG,CAAC,cAAc,CAAC,MAAM,CAAC,CAAC;gBAChC,IAAI,CAAC,kBAAkB,EAAE,CAAC;YAC5B,CAAC;QACH,CAAC;QAAC,OAAO,KAAK,EAAE,CAAC;YACf,IAAI,CAAC,IAAI,CAAC,OAAO,EAAE,KAAK,YAAY,KAAK,CAAC,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC,IAAI,KAAK,CAAC,MAAM,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC;QAChF,CAAC;IACH,CAAC;IAED,KAAK;QACH,IAAI,CAAC,IAAI,CAAC,SAAS,EAAE,CAAC;YACpB,OAAO;QACT,CAAC;QAED,IAAI,CAAC;YACH,IAAI,CAAC,GAAG,CAAC,KAAK,EAAE,CAAC;YACjB,IAAI,CAAC,kBAAkB,EAAE,CAAC;YAC1B,IAAI,IAAI,CAAC,QAAQ,EAAE,CAAC;gBAClB,IAAI,CAAC,QAAQ,GAAG,KAAK,CAAC;gBACtB,IAAI,CAAC,IAAI,CAAC,gBAAgB,CAAC,CAAC;YAC9B,CAAC;QACH,CAAC;QAAC,OAAO,KAAK,EAAE,CAAC;YACf,IAAI,CAAC,IAAI,CAAC,OAAO,EAAE,KAAK,YAAY,KAAK,CAAC,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC,IAAI,KAAK,CAAC,MAAM,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC;QAChF,CAAC;IACH,CAAC;IAED,KAAK;QACH,IAAI,CAAC;YACH,IAAI,CAAC,GAAG,CAAC,KAAK,EAAE,CAAC;YACjB,IAAI,CAAC,WAAW,CAAC,KAAK,EAAE,CAAC;QAC3B,CAAC;QAAC,MAAM,CAAC;YACP,iCAAiC;QACnC,CAAC;gBAAS,CAAC;YACT,IAAI,CAAC,SAAS,GAAG,KAAK,CAAC;YACvB,IAAI,CAAC,QAAQ,GAAG,KAAK,CAAC;QACxB,CAAC;IACH,CAAC;IAEO,kBAAkB;QACxB,MAAM,QAAQ,GAAG,IAAI,CAAC,GAAG,CAAC,UAAU,EAAE,CAAC;QACvC,IAAI,QAAQ,IAAI,CAAC,IAAI,CAAC,QAAQ,EAAE,CAAC;YAC/B,IAAI,CAAC,QAAQ,GAAG,IAAI,CAAC;YACrB,IAAI,CAAC,IAAI,CAAC,gBAAgB,CAAC,CAAC;YAC5B,OAAO;QACT,CAAC;QAED,IAAI,CAAC,QAAQ,IAAI,IAAI,CAAC,QAAQ,IAAI,CAAC,IAAI,CAAC,GAAG,CAAC,OAAO,EAAE,EAAE,CAAC;YACtD,IAAI,CAAC,MAAM,CAAC,KAAK,CAAC,iCAAiC,CAAC,CAAC;YACrD,IAAI,CAAC,QAAQ,GAAG,KAAK,CAAC;YACtB,IAAI,CAAC,IAAI,CAAC,gBAAgB,CAAC,CAAC;QAC9B,CAAC;IACH,CAAC;CACF"}
@@ -1,80 +0,0 @@
1
- import { z } from "zod";
2
- export const DEFAULT_OPENAI_REALTIME_TRANSCRIPTION_MODEL = "gpt-4o-transcribe";
3
- export const DEFAULT_OPENAI_TTS_MODEL = "tts-1";
4
- const OpenAiTtsVoiceSchema = z.enum(["alloy", "echo", "fable", "onyx", "nova", "shimmer"]);
5
- const OpenAiTtsModelSchema = z.enum(["tts-1", "tts-1-hd"]);
6
- const NumberLikeSchema = z.union([z.number(), z.string().trim().min(1)]);
7
- const OptionalFiniteNumberSchema = NumberLikeSchema.pipe(z.coerce.number().finite()).optional();
8
- const OptionalTrimmedStringSchema = z
9
- .string()
10
- .trim()
11
- .optional()
12
- .transform((value) => (value && value.length > 0 ? value : undefined));
13
- const OpenAiSpeechResolutionSchema = z.object({
14
- apiKey: OptionalTrimmedStringSchema,
15
- sttConfidenceThreshold: OptionalFiniteNumberSchema,
16
- sttModel: OptionalTrimmedStringSchema,
17
- ttsVoice: z.string().trim().toLowerCase().pipe(OpenAiTtsVoiceSchema).default("alloy"),
18
- ttsModel: z
19
- .string()
20
- .trim()
21
- .toLowerCase()
22
- .pipe(OpenAiTtsModelSchema)
23
- .default(DEFAULT_OPENAI_TTS_MODEL),
24
- realtimeTranscriptionModel: OptionalTrimmedStringSchema.default(DEFAULT_OPENAI_REALTIME_TRANSCRIPTION_MODEL),
25
- });
26
- export function resolveOpenAiSpeechConfig(params) {
27
- const parsed = OpenAiSpeechResolutionSchema.parse({
28
- apiKey: params.env.OPENAI_API_KEY ?? params.persisted.providers?.openai?.apiKey,
29
- sttConfidenceThreshold: params.env.STT_CONFIDENCE_THRESHOLD ??
30
- params.persisted.features?.dictation?.stt?.confidenceThreshold,
31
- sttModel: params.env.STT_MODEL ??
32
- (params.providers.voiceStt.enabled !== false &&
33
- params.providers.voiceStt.provider === "openai"
34
- ? params.persisted.features?.voiceMode?.stt?.model
35
- : undefined) ??
36
- (params.providers.dictationStt.enabled !== false &&
37
- params.providers.dictationStt.provider === "openai"
38
- ? params.persisted.features?.dictation?.stt?.model
39
- : undefined),
40
- ttsVoice: params.env.TTS_VOICE ??
41
- (params.providers.voiceTts.enabled !== false &&
42
- params.providers.voiceTts.provider === "openai"
43
- ? params.persisted.features?.voiceMode?.tts?.voice
44
- : undefined) ??
45
- "alloy",
46
- ttsModel: params.env.TTS_MODEL ??
47
- (params.providers.voiceTts.enabled !== false &&
48
- params.providers.voiceTts.provider === "openai"
49
- ? params.persisted.features?.voiceMode?.tts?.model
50
- : undefined) ??
51
- DEFAULT_OPENAI_TTS_MODEL,
52
- realtimeTranscriptionModel: params.env.OPENAI_REALTIME_TRANSCRIPTION_MODEL ??
53
- (params.providers.dictationStt.enabled !== false &&
54
- params.providers.dictationStt.provider === "openai"
55
- ? params.persisted.features?.dictation?.stt?.model
56
- : undefined) ??
57
- DEFAULT_OPENAI_REALTIME_TRANSCRIPTION_MODEL,
58
- });
59
- if (!parsed.apiKey) {
60
- return undefined;
61
- }
62
- return {
63
- apiKey: parsed.apiKey,
64
- stt: {
65
- apiKey: parsed.apiKey,
66
- ...(parsed.sttConfidenceThreshold !== undefined
67
- ? { confidenceThreshold: parsed.sttConfidenceThreshold }
68
- : {}),
69
- ...(parsed.sttModel ? { model: parsed.sttModel } : {}),
70
- },
71
- tts: {
72
- apiKey: parsed.apiKey,
73
- voice: parsed.ttsVoice,
74
- model: parsed.ttsModel,
75
- responseFormat: "pcm",
76
- },
77
- realtimeTranscriptionModel: parsed.realtimeTranscriptionModel,
78
- };
79
- }
80
- //# sourceMappingURL=config.js.map
@@ -1 +0,0 @@
1
- {"version":3,"file":"config.js","sourceRoot":"","sources":["../../../../../../src/server/speech/providers/openai/config.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,CAAC,EAAE,MAAM,KAAK,CAAC;AAOxB,MAAM,CAAC,MAAM,2CAA2C,GAAG,mBAAmB,CAAC;AAC/E,MAAM,CAAC,MAAM,wBAAwB,GAAG,OAAO,CAAC;AAShD,MAAM,oBAAoB,GAAG,CAAC,CAAC,IAAI,CAAC,CAAC,OAAO,EAAE,MAAM,EAAE,OAAO,EAAE,MAAM,EAAE,MAAM,EAAE,SAAS,CAAC,CAAC,CAAC;AAE3F,MAAM,oBAAoB,GAAG,CAAC,CAAC,IAAI,CAAC,CAAC,OAAO,EAAE,UAAU,CAAC,CAAC,CAAC;AAE3D,MAAM,gBAAgB,GAAG,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC,MAAM,EAAE,EAAE,CAAC,CAAC,MAAM,EAAE,CAAC,IAAI,EAAE,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;AAEzE,MAAM,0BAA0B,GAAG,gBAAgB,CAAC,IAAI,CAAC,CAAC,CAAC,MAAM,CAAC,MAAM,EAAE,CAAC,MAAM,EAAE,CAAC,CAAC,QAAQ,EAAE,CAAC;AAEhG,MAAM,2BAA2B,GAAG,CAAC;KAClC,MAAM,EAAE;KACR,IAAI,EAAE;KACN,QAAQ,EAAE;KACV,SAAS,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,CAAC,KAAK,IAAI,KAAK,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC,SAAS,CAAC,CAAC,CAAC;AAEzE,MAAM,4BAA4B,GAAG,CAAC,CAAC,MAAM,CAAC;IAC5C,MAAM,EAAE,2BAA2B;IACnC,sBAAsB,EAAE,0BAA0B;IAClD,QAAQ,EAAE,2BAA2B;IACrC,QAAQ,EAAE,CAAC,CAAC,MAAM,EAAE,CAAC,IAAI,EAAE,CAAC,WAAW,EAAE,CAAC,IAAI,CAAC,oBAAoB,CAAC,CAAC,OAAO,CAAC,OAAO,CAAC;IACrF,QAAQ,EAAE,CAAC;SACR,MAAM,EAAE;SACR,IAAI,EAAE;SACN,WAAW,EAAE;SACb,IAAI,CAAC,oBAAoB,CAAC;SAC1B,OAAO,CAAC,wBAAwB,CAAC;IACpC,0BAA0B,EAAE,2BAA2B,CAAC,OAAO,CAC7D,2CAA2C,CAC5C;CACF,CAAC,CAAC;AAEH,MAAM,UAAU,yBAAyB,CAAC,MAIzC;IACC,MAAM,MAAM,GAAG,4BAA4B,CAAC,KAAK,CAAC;QAChD,MAAM,EAAE,MAAM,CAAC,GAAG,CAAC,cAAc,IAAI,MAAM,CAAC,SAAS,CAAC,SAAS,EAAE,MAAM,EAAE,MAAM;QAC/E,sBAAsB,EACpB,MAAM,CAAC,GAAG,CAAC,wBAAwB;YACnC,MAAM,CAAC,SAAS,CAAC,QAAQ,EAAE,SAAS,EAAE,GAAG,EAAE,mBAAmB;QAChE,QAAQ,EACN,MAAM,CAAC,GAAG,CAAC,SAAS;YACpB,CAAC,MAAM,CAAC,SAAS,CAAC,QAAQ,CAAC,OAAO,KAAK,KAAK;gBAC5C,MAAM,CAAC,SAAS,CAAC,QAAQ,CAAC,QAAQ,KAAK,QAAQ;gBAC7C,CAAC,CAAC,MAAM,CAAC,SAAS,CAAC,QAAQ,EAAE,SAAS,EAAE,GAAG,EAAE,KAAK;gBAClD,CAAC,CAAC,SAAS,CAAC;YACd,CAAC,MAAM,CAAC,SAAS,CAAC,YAAY,CAAC,OAAO,KAAK,KAAK;gBAChD,MAAM,CAAC,SAAS,CAAC,YAAY,CAAC,QAAQ,KAAK,QAAQ;gBACjD,CAAC,CAAC,MAAM,CAAC,SAAS,CAAC,QAAQ,EAAE,SAAS,EAAE,GAAG,EAAE,KAAK;gBAClD,CAAC,CAAC,SAAS,CAAC;QAChB,QAAQ,EACN,MAAM,CAAC,GAAG,CAAC,SAAS;YACpB,CAAC,MAAM,CAAC,SAAS,CAAC,QAAQ,CAAC,OAAO,KAAK,KAAK;gBAC5C,MAAM,CAAC,SAAS,CAAC,QAAQ,CAAC,QAAQ,KAAK,QAAQ;gBAC7C,CAAC,CAAC,MAAM,CAAC,SAAS,CAAC,QAAQ,EAAE,SAAS,EAAE,GAAG,EAAE,KAAK;gBAClD,CAAC,CAAC,SAAS,CAAC;YACd,OAAO;QACT,QAAQ,EACN,MAAM,CAAC,GAAG,CAAC,SAAS;YACpB,CAAC,MAAM,CAAC,SAAS,CAAC,QAAQ,CAAC,OAAO,KAAK,KAAK;gBAC5C,MAAM,CAAC,SAAS,CAAC,QAAQ,CAAC,QAAQ,KAAK,QAAQ;gBAC7C,CAAC,CAAC,MAAM,CAAC,SAAS,CAAC,QAAQ,EAAE,SAAS,EAAE,GAAG,EAAE,KAAK;gBAClD,CAAC,CAAC,SAAS,CAAC;YACd,wBAAwB;QAC1B,0BAA0B,EACxB,MAAM,CAAC,GAAG,CAAC,mCAAmC;YAC9C,CAAC,MAAM,CAAC,SAAS,CAAC,YAAY,CAAC,OAAO,KAAK,KAAK;gBAChD,MAAM,CAAC,SAAS,CAAC,YAAY,CAAC,QAAQ,KAAK,QAAQ;gBACjD,CAAC,CAAC,MAAM,CAAC,SAAS,CAAC,QAAQ,EAAE,SAAS,EAAE,GAAG,EAAE,KAAK;gBAClD,CAAC,CAAC,SAAS,CAAC;YACd,2CAA2C;KAC9C,CAAC,CAAC;IAEH,IAAI,CAAC,MAAM,CAAC,MAAM,EAAE,CAAC;QACnB,OAAO,SAAS,CAAC;IACnB,CAAC;IAED,OAAO;QACL,MAAM,EAAE,MAAM,CAAC,MAAM;QACrB,GAAG,EAAE;YACH,MAAM,EAAE,MAAM,CAAC,MAAM;YACrB,GAAG,CAAC,MAAM,CAAC,sBAAsB,KAAK,SAAS;gBAC7C,CAAC,CAAC,EAAE,mBAAmB,EAAE,MAAM,CAAC,sBAAsB,EAAE;gBACxD,CAAC,CAAC,EAAE,CAAC;YACP,GAAG,CAAC,MAAM,CAAC,QAAQ,CAAC,CAAC,CAAC,EAAE,KAAK,EAAE,MAAM,CAAC,QAAQ,EAAE,CAAC,CAAC,CAAC,EAAE,CAAC;SACvD;QACD,GAAG,EAAE;YACH,MAAM,EAAE,MAAM,CAAC,MAAM;YACrB,KAAK,EAAE,MAAM,CAAC,QAAQ;YACtB,KAAK,EAAE,MAAM,CAAC,QAAQ;YACtB,cAAc,EAAE,KAAK;SACtB;QACD,0BAA0B,EAAE,MAAM,CAAC,0BAA0B;KAC9D,CAAC;AACJ,CAAC"}