@full-self-developing/fsd 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (1191):
  1. package/.engine/engine-config.json +27 -0
  2. package/CODEBASE_CONTEXT.md +152 -0
  3. package/README.md +111 -0
  4. package/README_zh.md +111 -0
  5. package/UI_SPEC.md +57 -0
  6. package/agents/api-proxy.js +542 -0
  7. package/agents/base.js +280 -0
  8. package/agents/branch-manager.js +135 -0
  9. package/agents/cli-models.json +48 -0
  10. package/agents/coder.js +128 -0
  11. package/agents/core-request.js +174 -0
  12. package/agents/dispatcher.js +491 -0
  13. package/agents/drivers/.atomcode/graph.bin +0 -0
  14. package/agents/drivers/atomcode.js +143 -0
  15. package/agents/drivers/gemini-cli.js +195 -0
  16. package/agents/drivers/index.js +65 -0
  17. package/agents/drivers/openrouter.js +390 -0
  18. package/agents/engine-config.js +444 -0
  19. package/agents/log-fixer.js +72 -0
  20. package/agents/mcp-client-manager.js +159 -0
  21. package/agents/optimizer.js +54 -0
  22. package/agents/path-validator.js +43 -0
  23. package/agents/planner.js +81 -0
  24. package/agents/prompt-manager.js +170 -0
  25. package/agents/skeptic.js +79 -0
  26. package/agents/skills-manager.js +130 -0
  27. package/agents/summarizer.js +34 -0
  28. package/agents/test-runner.js +85 -0
  29. package/bin/cli.js +166 -0
  30. package/client/eslint.config.js +21 -0
  31. package/client/index.html +12 -0
  32. package/client/package-lock.json +3339 -0
  33. package/client/package.json +35 -0
  34. package/client/src/App.jsx +745 -0
  35. package/client/src/api.js +78 -0
  36. package/client/src/components/ChatPanel.jsx +277 -0
  37. package/client/src/components/ConfirmationModal.jsx +61 -0
  38. package/client/src/components/ErrorBoundary.jsx +66 -0
  39. package/client/src/components/FolderPicker.jsx +200 -0
  40. package/client/src/components/LoopPanel.jsx +863 -0
  41. package/client/src/components/NotFound.jsx +52 -0
  42. package/client/src/components/SettingsPanel.jsx +966 -0
  43. package/client/src/components/Sidebar.jsx +318 -0
  44. package/client/src/context/SettingsContext.jsx +353 -0
  45. package/client/src/i18n.js +462 -0
  46. package/client/src/index.css +31 -0
  47. package/client/src/main.jsx +17 -0
  48. package/client/vite.config.js +19 -0
  49. package/design.md +875 -0
  50. package/extensions/alibaba/index.ts +11 -0
  51. package/extensions/alibaba/openclaw.plugin.json +34 -0
  52. package/extensions/alibaba/package.json +15 -0
  53. package/extensions/alibaba/plugin-registration.contract.test.ts +7 -0
  54. package/extensions/alibaba/tsconfig.json +16 -0
  55. package/extensions/alibaba/video-generation-provider.test.ts +92 -0
  56. package/extensions/alibaba/video-generation-provider.ts +83 -0
  57. package/extensions/amazon-bedrock/api.ts +6 -0
  58. package/extensions/amazon-bedrock/aws-credential-refresh.ts +42 -0
  59. package/extensions/amazon-bedrock/config-api.ts +4 -0
  60. package/extensions/amazon-bedrock/config-compat.test.ts +81 -0
  61. package/extensions/amazon-bedrock/config-compat.ts +107 -0
  62. package/extensions/amazon-bedrock/discovery-shared.ts +28 -0
  63. package/extensions/amazon-bedrock/discovery.test.ts +608 -0
  64. package/extensions/amazon-bedrock/discovery.ts +616 -0
  65. package/extensions/amazon-bedrock/embedding-provider.test.ts +109 -0
  66. package/extensions/amazon-bedrock/embedding-provider.ts +470 -0
  67. package/extensions/amazon-bedrock/index.test.ts +1249 -0
  68. package/extensions/amazon-bedrock/index.ts +11 -0
  69. package/extensions/amazon-bedrock/lazy-import.test.ts +56 -0
  70. package/extensions/amazon-bedrock/memory-embedding-adapter.test.ts +105 -0
  71. package/extensions/amazon-bedrock/memory-embedding-adapter.ts +47 -0
  72. package/extensions/amazon-bedrock/npm-shrinkwrap.json +1241 -0
  73. package/extensions/amazon-bedrock/openclaw.plugin.json +80 -0
  74. package/extensions/amazon-bedrock/package.json +41 -0
  75. package/extensions/amazon-bedrock/provider-policy-api.test.ts +46 -0
  76. package/extensions/amazon-bedrock/provider-policy-api.ts +9 -0
  77. package/extensions/amazon-bedrock/register.sync.runtime.ts +659 -0
  78. package/extensions/amazon-bedrock/setup-api.ts +18 -0
  79. package/extensions/amazon-bedrock/thinking-policy.ts +32 -0
  80. package/extensions/amazon-bedrock/tsconfig.json +16 -0
  81. package/extensions/anthropic/api.ts +11 -0
  82. package/extensions/anthropic/claude-model-refs.ts +104 -0
  83. package/extensions/anthropic/cli-auth-seam.ts +13 -0
  84. package/extensions/anthropic/cli-backend-api.ts +6 -0
  85. package/extensions/anthropic/cli-backend.ts +83 -0
  86. package/extensions/anthropic/cli-catalog.ts +42 -0
  87. package/extensions/anthropic/cli-constants.ts +41 -0
  88. package/extensions/anthropic/cli-migration.test.ts +487 -0
  89. package/extensions/anthropic/cli-migration.ts +266 -0
  90. package/extensions/anthropic/cli-shared.test.ts +300 -0
  91. package/extensions/anthropic/cli-shared.ts +248 -0
  92. package/extensions/anthropic/config-defaults.ts +428 -0
  93. package/extensions/anthropic/contract-api.ts +9 -0
  94. package/extensions/anthropic/doctor-contract-api.ts +14 -0
  95. package/extensions/anthropic/index.test.ts +663 -0
  96. package/extensions/anthropic/index.ts +11 -0
  97. package/extensions/anthropic/media-understanding-provider.ts +15 -0
  98. package/extensions/anthropic/openclaw.plugin.json +112 -0
  99. package/extensions/anthropic/package.json +18 -0
  100. package/extensions/anthropic/provider-contract-api.ts +59 -0
  101. package/extensions/anthropic/provider-discovery.ts +35 -0
  102. package/extensions/anthropic/provider-policy-api.test.ts +135 -0
  103. package/extensions/anthropic/provider-policy-api.ts +24 -0
  104. package/extensions/anthropic/provider-runtime.contract.test.ts +3 -0
  105. package/extensions/anthropic/register.runtime.ts +668 -0
  106. package/extensions/anthropic/replay-policy.ts +9 -0
  107. package/extensions/anthropic/setup-api.ts +11 -0
  108. package/extensions/anthropic/stream-wrappers.test.ts +233 -0
  109. package/extensions/anthropic/stream-wrappers.ts +228 -0
  110. package/extensions/anthropic/test-api.ts +3 -0
  111. package/extensions/anthropic/tsconfig.json +16 -0
  112. package/extensions/arcee/api.ts +8 -0
  113. package/extensions/arcee/index.test.ts +195 -0
  114. package/extensions/arcee/index.ts +142 -0
  115. package/extensions/arcee/models.ts +68 -0
  116. package/extensions/arcee/onboard.ts +43 -0
  117. package/extensions/arcee/openclaw.plugin.json +46 -0
  118. package/extensions/arcee/package.json +15 -0
  119. package/extensions/arcee/provider-catalog.ts +54 -0
  120. package/extensions/arcee/tsconfig.json +16 -0
  121. package/extensions/azure-speech/azure-speech.live.test.ts +92 -0
  122. package/extensions/azure-speech/index.ts +11 -0
  123. package/extensions/azure-speech/openclaw.plugin.json +66 -0
  124. package/extensions/azure-speech/package.json +15 -0
  125. package/extensions/azure-speech/speech-provider.test.ts +242 -0
  126. package/extensions/azure-speech/speech-provider.ts +306 -0
  127. package/extensions/azure-speech/tsconfig.json +16 -0
  128. package/extensions/azure-speech/tts.test.ts +127 -0
  129. package/extensions/azure-speech/tts.ts +209 -0
  130. package/extensions/byteplus/api.ts +8 -0
  131. package/extensions/byteplus/index.test.ts +60 -0
  132. package/extensions/byteplus/index.ts +84 -0
  133. package/extensions/byteplus/live.test.ts +60 -0
  134. package/extensions/byteplus/models.ts +35 -0
  135. package/extensions/byteplus/openclaw.plugin.json +165 -0
  136. package/extensions/byteplus/package.json +15 -0
  137. package/extensions/byteplus/plugin-registration.contract.test.ts +8 -0
  138. package/extensions/byteplus/provider-catalog.ts +17 -0
  139. package/extensions/byteplus/provider-discovery.ts +31 -0
  140. package/extensions/byteplus/tsconfig.json +16 -0
  141. package/extensions/byteplus/video-generation-provider.test.ts +223 -0
  142. package/extensions/byteplus/video-generation-provider.ts +389 -0
  143. package/extensions/cerebras/api.ts +7 -0
  144. package/extensions/cerebras/index.ts +41 -0
  145. package/extensions/cerebras/models.ts +25 -0
  146. package/extensions/cerebras/onboard.ts +26 -0
  147. package/extensions/cerebras/openclaw.plugin.json +111 -0
  148. package/extensions/cerebras/package.json +15 -0
  149. package/extensions/cerebras/provider-catalog.ts +10 -0
  150. package/extensions/cerebras/tsconfig.json +16 -0
  151. package/extensions/chutes/api.ts +14 -0
  152. package/extensions/chutes/implicit-provider.test.ts +107 -0
  153. package/extensions/chutes/index.ts +194 -0
  154. package/extensions/chutes/model-discovery-env.ts +5 -0
  155. package/extensions/chutes/models.test.ts +289 -0
  156. package/extensions/chutes/models.ts +632 -0
  157. package/extensions/chutes/oauth.ts +235 -0
  158. package/extensions/chutes/onboard.ts +63 -0
  159. package/extensions/chutes/openclaw.plugin.json +726 -0
  160. package/extensions/chutes/package.json +15 -0
  161. package/extensions/chutes/provider-catalog.ts +29 -0
  162. package/extensions/chutes/tsconfig.json +16 -0
  163. package/extensions/cloudflare-ai-gateway/api.ts +14 -0
  164. package/extensions/cloudflare-ai-gateway/catalog-provider.ts +73 -0
  165. package/extensions/cloudflare-ai-gateway/index.test.ts +60 -0
  166. package/extensions/cloudflare-ai-gateway/index.ts +233 -0
  167. package/extensions/cloudflare-ai-gateway/models.ts +44 -0
  168. package/extensions/cloudflare-ai-gateway/onboard.ts +91 -0
  169. package/extensions/cloudflare-ai-gateway/openclaw.plugin.json +44 -0
  170. package/extensions/cloudflare-ai-gateway/package.json +15 -0
  171. package/extensions/cloudflare-ai-gateway/provider-discovery.contract.test.ts +3 -0
  172. package/extensions/cloudflare-ai-gateway/stream-wrappers.test.ts +160 -0
  173. package/extensions/cloudflare-ai-gateway/stream-wrappers.ts +32 -0
  174. package/extensions/cloudflare-ai-gateway/tsconfig.json +16 -0
  175. package/extensions/codex/doctor-contract-api.test.ts +44 -0
  176. package/extensions/codex/doctor-contract-api.ts +68 -0
  177. package/extensions/codex/harness.ts +85 -0
  178. package/extensions/codex/index.test.ts +230 -0
  179. package/extensions/codex/index.ts +125 -0
  180. package/extensions/codex/media-understanding-provider.test.ts +496 -0
  181. package/extensions/codex/media-understanding-provider.ts +524 -0
  182. package/extensions/codex/npm-shrinkwrap.json +1949 -0
  183. package/extensions/codex/openclaw.plugin.json +403 -0
  184. package/extensions/codex/package.json +41 -0
  185. package/extensions/codex/prompt-overlay-runtime-contract.test.ts +48 -0
  186. package/extensions/codex/prompt-overlay.ts +21 -0
  187. package/extensions/codex/provider-catalog.ts +83 -0
  188. package/extensions/codex/provider-discovery.ts +45 -0
  189. package/extensions/codex/provider.test.ts +384 -0
  190. package/extensions/codex/provider.ts +243 -0
  191. package/extensions/codex/src/app-server/app-inventory-cache.test.ts +176 -0
  192. package/extensions/codex/src/app-server/app-inventory-cache.ts +324 -0
  193. package/extensions/codex/src/app-server/approval-bridge.test.ts +1472 -0
  194. package/extensions/codex/src/app-server/approval-bridge.ts +1211 -0
  195. package/extensions/codex/src/app-server/auth-bridge.test.ts +1449 -0
  196. package/extensions/codex/src/app-server/auth-bridge.ts +614 -0
  197. package/extensions/codex/src/app-server/auth-profile-runtime-contract.test.ts +242 -0
  198. package/extensions/codex/src/app-server/capabilities.ts +27 -0
  199. package/extensions/codex/src/app-server/client-factory.ts +24 -0
  200. package/extensions/codex/src/app-server/client.test.ts +563 -0
  201. package/extensions/codex/src/app-server/client.ts +721 -0
  202. package/extensions/codex/src/app-server/compact.test.ts +1029 -0
  203. package/extensions/codex/src/app-server/compact.ts +662 -0
  204. package/extensions/codex/src/app-server/computer-use.test.ts +788 -0
  205. package/extensions/codex/src/app-server/computer-use.ts +683 -0
  206. package/extensions/codex/src/app-server/config.test.ts +948 -0
  207. package/extensions/codex/src/app-server/config.ts +1093 -0
  208. package/extensions/codex/src/app-server/context-engine-projection.test.ts +252 -0
  209. package/extensions/codex/src/app-server/context-engine-projection.ts +403 -0
  210. package/extensions/codex/src/app-server/delivery-no-reply-runtime-contract.test.ts +80 -0
  211. package/extensions/codex/src/app-server/dynamic-tool-diagnostics.ts +73 -0
  212. package/extensions/codex/src/app-server/dynamic-tool-profile.ts +70 -0
  213. package/extensions/codex/src/app-server/dynamic-tools.test.ts +1357 -0
  214. package/extensions/codex/src/app-server/dynamic-tools.ts +646 -0
  215. package/extensions/codex/src/app-server/elicitation-bridge.test.ts +1281 -0
  216. package/extensions/codex/src/app-server/elicitation-bridge.ts +828 -0
  217. package/extensions/codex/src/app-server/event-projector.test.ts +2885 -0
  218. package/extensions/codex/src/app-server/event-projector.ts +2047 -0
  219. package/extensions/codex/src/app-server/image-payload-sanitizer.test.ts +49 -0
  220. package/extensions/codex/src/app-server/image-payload-sanitizer.ts +195 -0
  221. package/extensions/codex/src/app-server/local-runtime-attribution.ts +39 -0
  222. package/extensions/codex/src/app-server/managed-binary.test.ts +141 -0
  223. package/extensions/codex/src/app-server/managed-binary.ts +193 -0
  224. package/extensions/codex/src/app-server/models.test.ts +246 -0
  225. package/extensions/codex/src/app-server/models.ts +172 -0
  226. package/extensions/codex/src/app-server/native-hook-relay.test.ts +274 -0
  227. package/extensions/codex/src/app-server/native-hook-relay.ts +150 -0
  228. package/extensions/codex/src/app-server/native-subagent-monitor.test.ts +1125 -0
  229. package/extensions/codex/src/app-server/native-subagent-monitor.ts +1061 -0
  230. package/extensions/codex/src/app-server/native-subagent-notification.test.ts +176 -0
  231. package/extensions/codex/src/app-server/native-subagent-notification.ts +222 -0
  232. package/extensions/codex/src/app-server/native-subagent-task-ids.ts +3 -0
  233. package/extensions/codex/src/app-server/native-subagent-task-mirror.test.ts +625 -0
  234. package/extensions/codex/src/app-server/native-subagent-task-mirror.ts +460 -0
  235. package/extensions/codex/src/app-server/notification-correlation.ts +91 -0
  236. package/extensions/codex/src/app-server/openclaw-owned-tool-runtime-contract.test.ts +456 -0
  237. package/extensions/codex/src/app-server/outcome-fallback-runtime-contract.test.ts +404 -0
  238. package/extensions/codex/src/app-server/plugin-activation.test.ts +336 -0
  239. package/extensions/codex/src/app-server/plugin-activation.ts +283 -0
  240. package/extensions/codex/src/app-server/plugin-app-cache-key.ts +74 -0
  241. package/extensions/codex/src/app-server/plugin-approval-roundtrip.ts +122 -0
  242. package/extensions/codex/src/app-server/plugin-inventory.test.ts +355 -0
  243. package/extensions/codex/src/app-server/plugin-inventory.ts +357 -0
  244. package/extensions/codex/src/app-server/plugin-thread-config.test.ts +865 -0
  245. package/extensions/codex/src/app-server/plugin-thread-config.ts +455 -0
  246. package/extensions/codex/src/app-server/protocol-generated/json/DynamicToolCallParams.json +33 -0
  247. package/extensions/codex/src/app-server/protocol-generated/json/v2/ErrorNotification.json +199 -0
  248. package/extensions/codex/src/app-server/protocol-generated/json/v2/GetAccountResponse.json +102 -0
  249. package/extensions/codex/src/app-server/protocol-generated/json/v2/ModelListResponse.json +227 -0
  250. package/extensions/codex/src/app-server/protocol-generated/json/v2/ThreadResumeResponse.json +2630 -0
  251. package/extensions/codex/src/app-server/protocol-generated/json/v2/ThreadStartResponse.json +2630 -0
  252. package/extensions/codex/src/app-server/protocol-generated/json/v2/TurnCompletedNotification.json +1659 -0
  253. package/extensions/codex/src/app-server/protocol-generated/json/v2/TurnStartResponse.json +1655 -0
  254. package/extensions/codex/src/app-server/protocol-validators.test.ts +75 -0
  255. package/extensions/codex/src/app-server/protocol-validators.ts +203 -0
  256. package/extensions/codex/src/app-server/protocol.ts +537 -0
  257. package/extensions/codex/src/app-server/rate-limit-cache.ts +48 -0
  258. package/extensions/codex/src/app-server/rate-limits.test.ts +202 -0
  259. package/extensions/codex/src/app-server/rate-limits.ts +583 -0
  260. package/extensions/codex/src/app-server/request.test.ts +68 -0
  261. package/extensions/codex/src/app-server/request.ts +90 -0
  262. package/extensions/codex/src/app-server/run-attempt-thread-cleanup.test.ts +197 -0
  263. package/extensions/codex/src/app-server/run-attempt.context-engine.test.ts +1246 -0
  264. package/extensions/codex/src/app-server/run-attempt.test.ts +10799 -0
  265. package/extensions/codex/src/app-server/run-attempt.ts +5264 -0
  266. package/extensions/codex/src/app-server/run-attempt.vision-tools.test.ts +35 -0
  267. package/extensions/codex/src/app-server/sandbox-exec-server/filesystem.ts +261 -0
  268. package/extensions/codex/src/app-server/sandbox-exec-server/fs-policy.ts +346 -0
  269. package/extensions/codex/src/app-server/sandbox-exec-server/http.ts +312 -0
  270. package/extensions/codex/src/app-server/sandbox-exec-server/json-rpc.ts +93 -0
  271. package/extensions/codex/src/app-server/sandbox-exec-server/processes.ts +411 -0
  272. package/extensions/codex/src/app-server/sandbox-exec-server/runtime.ts +22 -0
  273. package/extensions/codex/src/app-server/sandbox-exec-server/types.ts +80 -0
  274. package/extensions/codex/src/app-server/sandbox-exec-server.fs.test.ts +527 -0
  275. package/extensions/codex/src/app-server/sandbox-exec-server.http.test.ts +210 -0
  276. package/extensions/codex/src/app-server/sandbox-exec-server.test-helpers.ts +236 -0
  277. package/extensions/codex/src/app-server/sandbox-exec-server.test.ts +460 -0
  278. package/extensions/codex/src/app-server/sandbox-exec-server.ts +355 -0
  279. package/extensions/codex/src/app-server/sandbox-guard.ts +153 -0
  280. package/extensions/codex/src/app-server/schema-normalization-runtime-contract.test.ts +206 -0
  281. package/extensions/codex/src/app-server/session-binding.test.ts +303 -0
  282. package/extensions/codex/src/app-server/session-binding.ts +407 -0
  283. package/extensions/codex/src/app-server/session-history.ts +44 -0
  284. package/extensions/codex/src/app-server/shared-client.test.ts +591 -0
  285. package/extensions/codex/src/app-server/shared-client.ts +289 -0
  286. package/extensions/codex/src/app-server/side-question.test.ts +1243 -0
  287. package/extensions/codex/src/app-server/side-question.ts +1019 -0
  288. package/extensions/codex/src/app-server/test-support.ts +48 -0
  289. package/extensions/codex/src/app-server/thread-lifecycle.test.ts +447 -0
  290. package/extensions/codex/src/app-server/thread-lifecycle.ts +1004 -0
  291. package/extensions/codex/src/app-server/thread-lifecycle.user-mcp-servers.test.ts +442 -0
  292. package/extensions/codex/src/app-server/timeout.ts +9 -0
  293. package/extensions/codex/src/app-server/tool-progress-normalization.ts +77 -0
  294. package/extensions/codex/src/app-server/trajectory.test.ts +205 -0
  295. package/extensions/codex/src/app-server/trajectory.ts +368 -0
  296. package/extensions/codex/src/app-server/transcript-mirror.test.ts +527 -0
  297. package/extensions/codex/src/app-server/transcript-mirror.ts +208 -0
  298. package/extensions/codex/src/app-server/transcript-repair-runtime-contract.test.ts +44 -0
  299. package/extensions/codex/src/app-server/transport-stdio.test.ts +184 -0
  300. package/extensions/codex/src/app-server/transport-stdio.ts +107 -0
  301. package/extensions/codex/src/app-server/transport-websocket.test.ts +71 -0
  302. package/extensions/codex/src/app-server/transport-websocket.ts +90 -0
  303. package/extensions/codex/src/app-server/transport.ts +117 -0
  304. package/extensions/codex/src/app-server/user-input-bridge.test.ts +249 -0
  305. package/extensions/codex/src/app-server/user-input-bridge.ts +316 -0
  306. package/extensions/codex/src/app-server/version.ts +5 -0
  307. package/extensions/codex/src/app-server/vision-tools.ts +12 -0
  308. package/extensions/codex/src/command-account.ts +589 -0
  309. package/extensions/codex/src/command-formatters.ts +426 -0
  310. package/extensions/codex/src/command-handlers.ts +2092 -0
  311. package/extensions/codex/src/command-plugins-management.test.ts +172 -0
  312. package/extensions/codex/src/command-plugins-management.ts +137 -0
  313. package/extensions/codex/src/command-rpc.test.ts +16 -0
  314. package/extensions/codex/src/command-rpc.ts +146 -0
  315. package/extensions/codex/src/commands.test.ts +3737 -0
  316. package/extensions/codex/src/commands.ts +65 -0
  317. package/extensions/codex/src/conversation-binding-data.ts +124 -0
  318. package/extensions/codex/src/conversation-binding.test.ts +697 -0
  319. package/extensions/codex/src/conversation-binding.ts +575 -0
  320. package/extensions/codex/src/conversation-control.test.ts +126 -0
  321. package/extensions/codex/src/conversation-control.ts +303 -0
  322. package/extensions/codex/src/conversation-turn-collector.test.ts +191 -0
  323. package/extensions/codex/src/conversation-turn-collector.ts +190 -0
  324. package/extensions/codex/src/conversation-turn-input.test.ts +141 -0
  325. package/extensions/codex/src/conversation-turn-input.ts +106 -0
  326. package/extensions/codex/src/manifest.test.ts +20 -0
  327. package/extensions/codex/src/migration/apply.ts +501 -0
  328. package/extensions/codex/src/migration/helpers.ts +55 -0
  329. package/extensions/codex/src/migration/plan.ts +461 -0
  330. package/extensions/codex/src/migration/provider.test.ts +1741 -0
  331. package/extensions/codex/src/migration/provider.ts +41 -0
  332. package/extensions/codex/src/migration/source.ts +643 -0
  333. package/extensions/codex/src/migration/targets.ts +25 -0
  334. package/extensions/codex/src/node-cli-sessions.test.ts +180 -0
  335. package/extensions/codex/src/node-cli-sessions.ts +711 -0
  336. package/extensions/codex/test-api.ts +95 -0
  337. package/extensions/codex/tsconfig.json +16 -0
  338. package/extensions/comfy/comfy.live.test.ts +128 -0
  339. package/extensions/comfy/image-generation-provider.test.ts +457 -0
  340. package/extensions/comfy/image-generation-provider.ts +79 -0
  341. package/extensions/comfy/index.test.ts +51 -0
  342. package/extensions/comfy/index.ts +45 -0
  343. package/extensions/comfy/music-generation-provider.test.ts +101 -0
  344. package/extensions/comfy/music-generation-provider.ts +88 -0
  345. package/extensions/comfy/openclaw.plugin.json +268 -0
  346. package/extensions/comfy/package.json +15 -0
  347. package/extensions/comfy/plugin-registration.contract.test.ts +11 -0
  348. package/extensions/comfy/test-helpers.ts +113 -0
  349. package/extensions/comfy/tsconfig.json +16 -0
  350. package/extensions/comfy/video-generation-provider.test.ts +184 -0
  351. package/extensions/comfy/video-generation-provider.ts +104 -0
  352. package/extensions/comfy/workflow-runtime.ts +827 -0
  353. package/extensions/deepgram/audio.live.test.ts +75 -0
  354. package/extensions/deepgram/audio.test.ts +146 -0
  355. package/extensions/deepgram/audio.ts +109 -0
  356. package/extensions/deepgram/index.ts +13 -0
  357. package/extensions/deepgram/media-understanding-provider.ts +10 -0
  358. package/extensions/deepgram/openclaw.plugin.json +30 -0
  359. package/extensions/deepgram/package.json +15 -0
  360. package/extensions/deepgram/realtime-transcription-provider.test.ts +69 -0
  361. package/extensions/deepgram/realtime-transcription-provider.ts +283 -0
  362. package/extensions/deepgram/test-api.ts +2 -0
  363. package/extensions/deepgram/tsconfig.json +16 -0
  364. package/extensions/deepinfra/api.ts +8 -0
  365. package/extensions/deepinfra/embedding-provider.ts +33 -0
  366. package/extensions/deepinfra/image-generation-provider.test.ts +224 -0
  367. package/extensions/deepinfra/image-generation-provider.ts +89 -0
  368. package/extensions/deepinfra/index.test.ts +113 -0
  369. package/extensions/deepinfra/index.ts +84 -0
  370. package/extensions/deepinfra/media-models.ts +50 -0
  371. package/extensions/deepinfra/media-understanding-provider.test.ts +73 -0
  372. package/extensions/deepinfra/media-understanding-provider.ts +37 -0
  373. package/extensions/deepinfra/memory-embedding-adapter.test.ts +31 -0
  374. package/extensions/deepinfra/memory-embedding-adapter.ts +35 -0
  375. package/extensions/deepinfra/onboard.test.ts +172 -0
  376. package/extensions/deepinfra/onboard.ts +36 -0
  377. package/extensions/deepinfra/openclaw.plugin.json +203 -0
  378. package/extensions/deepinfra/package.json +15 -0
  379. package/extensions/deepinfra/provider-catalog.ts +24 -0
  380. package/extensions/deepinfra/provider-models.test.ts +217 -0
  381. package/extensions/deepinfra/provider-models.ts +167 -0
  382. package/extensions/deepinfra/provider-policy-api.test.ts +41 -0
  383. package/extensions/deepinfra/provider-policy-api.ts +21 -0
  384. package/extensions/deepinfra/provider.contract.test.ts +3 -0
  385. package/extensions/deepinfra/speech-provider.test.ts +169 -0
  386. package/extensions/deepinfra/speech-provider.ts +41 -0
  387. package/extensions/deepinfra/tsconfig.json +16 -0
  388. package/extensions/deepinfra/video-generation-provider.test.ts +194 -0
  389. package/extensions/deepinfra/video-generation-provider.ts +262 -0
  390. package/extensions/deepseek/api.ts +7 -0
  391. package/extensions/deepseek/deepseek.live.test.ts +232 -0
  392. package/extensions/deepseek/index.test.ts +488 -0
  393. package/extensions/deepseek/index.ts +58 -0
  394. package/extensions/deepseek/models.ts +33 -0
  395. package/extensions/deepseek/onboard.ts +31 -0
  396. package/extensions/deepseek/openclaw.plugin.json +132 -0
  397. package/extensions/deepseek/package.json +15 -0
  398. package/extensions/deepseek/provider-catalog.ts +14 -0
  399. package/extensions/deepseek/provider-discovery.ts +17 -0
  400. package/extensions/deepseek/provider-policy-api.test.ts +264 -0
  401. package/extensions/deepseek/provider-policy-api.ts +104 -0
  402. package/extensions/deepseek/stream.ts +14 -0
  403. package/extensions/deepseek/thinking.ts +19 -0
  404. package/extensions/deepseek/tsconfig.json +16 -0
  405. package/extensions/elevenlabs/config-api.ts +8 -0
  406. package/extensions/elevenlabs/config-compat.test.ts +75 -0
  407. package/extensions/elevenlabs/config-compat.ts +181 -0
  408. package/extensions/elevenlabs/contract-api.ts +8 -0
  409. package/extensions/elevenlabs/doctor-contract.ts +34 -0
  410. package/extensions/elevenlabs/elevenlabs.live.test.ts +91 -0
  411. package/extensions/elevenlabs/index.ts +15 -0
  412. package/extensions/elevenlabs/media-understanding-provider.test.ts +95 -0
  413. package/extensions/elevenlabs/media-understanding-provider.ts +85 -0
  414. package/extensions/elevenlabs/openclaw.plugin.json +40 -0
  415. package/extensions/elevenlabs/package.json +15 -0
  416. package/extensions/elevenlabs/realtime-transcription-provider.test.ts +60 -0
  417. package/extensions/elevenlabs/realtime-transcription-provider.ts +284 -0
  418. package/extensions/elevenlabs/setup-api.ts +11 -0
  419. package/extensions/elevenlabs/shared.ts +10 -0
  420. package/extensions/elevenlabs/speech-provider.test.ts +124 -0
  421. package/extensions/elevenlabs/speech-provider.ts +594 -0
  422. package/extensions/elevenlabs/test-api.ts +6 -0
  423. package/extensions/elevenlabs/tsconfig.json +16 -0
  424. package/extensions/elevenlabs/tts.test.ts +212 -0
  425. package/extensions/elevenlabs/tts.ts +198 -0
  426. package/extensions/fal/image-generation-provider.test.ts +710 -0
  427. package/extensions/fal/image-generation-provider.ts +463 -0
  428. package/extensions/fal/index.ts +19 -0
  429. package/extensions/fal/music-generation-provider.test.ts +200 -0
  430. package/extensions/fal/music-generation-provider.ts +219 -0
  431. package/extensions/fal/onboard.ts +21 -0
  432. package/extensions/fal/openclaw.plugin.json +42 -0
  433. package/extensions/fal/package.json +15 -0
  434. package/extensions/fal/plugin-registration.contract.test.ts +11 -0
  435. package/extensions/fal/provider-contract-api.ts +31 -0
  436. package/extensions/fal/provider-registration.ts +38 -0
  437. package/extensions/fal/test-api.ts +3 -0
  438. package/extensions/fal/tsconfig.json +16 -0
  439. package/extensions/fal/video-generation-provider.test.ts +566 -0
  440. package/extensions/fal/video-generation-provider.ts +648 -0
  441. package/extensions/fireworks/index.test.ts +181 -0
  442. package/extensions/fireworks/index.ts +85 -0
  443. package/extensions/fireworks/model-id.ts +5 -0
  444. package/extensions/fireworks/onboard.ts +30 -0
  445. package/extensions/fireworks/openclaw.plugin.json +73 -0
  446. package/extensions/fireworks/package.json +18 -0
  447. package/extensions/fireworks/provider-catalog.ts +50 -0
  448. package/extensions/fireworks/provider-policy-api.ts +8 -0
  449. package/extensions/fireworks/stream.test.ts +184 -0
  450. package/extensions/fireworks/stream.ts +39 -0
  451. package/extensions/fireworks/thinking-policy.ts +17 -0
  452. package/extensions/fireworks/tsconfig.json +16 -0
  453. package/extensions/github-copilot/api.ts +1 -0
  454. package/extensions/github-copilot/auth.test.ts +109 -0
  455. package/extensions/github-copilot/auth.ts +65 -0
  456. package/extensions/github-copilot/connection-bound-ids.live.test.ts +231 -0
  457. package/extensions/github-copilot/connection-bound-ids.test.ts +96 -0
  458. package/extensions/github-copilot/connection-bound-ids.ts +81 -0
  459. package/extensions/github-copilot/embeddings.test.ts +287 -0
  460. package/extensions/github-copilot/embeddings.ts +342 -0
  461. package/extensions/github-copilot/index.test.ts +660 -0
  462. package/extensions/github-copilot/index.ts +492 -0
  463. package/extensions/github-copilot/login.ts +323 -0
  464. package/extensions/github-copilot/model-metadata.ts +51 -0
  465. package/extensions/github-copilot/models-defaults.ts +61 -0
  466. package/extensions/github-copilot/models.test.ts +695 -0
  467. package/extensions/github-copilot/models.ts +274 -0
  468. package/extensions/github-copilot/openclaw.plugin.json +270 -0
  469. package/extensions/github-copilot/package.json +19 -0
  470. package/extensions/github-copilot/provider-auth.contract.test.ts +3 -0
  471. package/extensions/github-copilot/provider-discovery.contract.test.ts +7 -0
  472. package/extensions/github-copilot/provider-runtime.contract.test.ts +3 -0
  473. package/extensions/github-copilot/register.runtime.ts +24 -0
  474. package/extensions/github-copilot/replay-policy.ts +9 -0
  475. package/extensions/github-copilot/stream.test.ts +282 -0
  476. package/extensions/github-copilot/stream.ts +157 -0
  477. package/extensions/github-copilot/token.ts +6 -0
  478. package/extensions/github-copilot/tsconfig.json +16 -0
  479. package/extensions/github-copilot/usage.ts +68 -0
  480. package/extensions/google/api.test.ts +249 -0
  481. package/extensions/google/api.ts +91 -0
  482. package/extensions/google/cli-backend.ts +58 -0
  483. package/extensions/google/default-model.test.ts +115 -0
  484. package/extensions/google/doctor-contract-api.ts +18 -0
  485. package/extensions/google/embedding-batch.ts +379 -0
  486. package/extensions/google/embedding-provider.test.ts +264 -0
  487. package/extensions/google/embedding-provider.ts +441 -0
  488. package/extensions/google/gemini-auth.ts +20 -0
  489. package/extensions/google/gemini-cli-provider.ts +145 -0
  490. package/extensions/google/generation-provider-metadata.ts +121 -0
  491. package/extensions/google/google-genai-runtime.ts +8 -0
  492. package/extensions/google/google-shared.test-helpers.ts +99 -0
  493. package/extensions/google/google-shared.test.ts +380 -0
  494. package/extensions/google/google.live.test.ts +179 -0
  495. package/extensions/google/image-generation-provider.test.ts +503 -0
  496. package/extensions/google/image-generation-provider.ts +272 -0
  497. package/extensions/google/index.test.ts +310 -0
  498. package/extensions/google/index.ts +354 -0
  499. package/extensions/google/manifest.test.ts +104 -0
  500. package/extensions/google/media-understanding-provider.ts +164 -0
  501. package/extensions/google/media-understanding-provider.video.test.ts +158 -0
  502. package/extensions/google/memory-embedding-adapter.ts +79 -0
  503. package/extensions/google/model-id.test.ts +42 -0
  504. package/extensions/google/model-id.ts +35 -0
  505. package/extensions/google/music-generation-provider.test.ts +278 -0
  506. package/extensions/google/music-generation-provider.ts +176 -0
  507. package/extensions/google/oauth-token-shared.test.ts +39 -0
  508. package/extensions/google/oauth-token-shared.ts +42 -0
  509. package/extensions/google/oauth.credentials.ts +273 -0
  510. package/extensions/google/oauth.flow.ts +61 -0
  511. package/extensions/google/oauth.http.ts +24 -0
  512. package/extensions/google/oauth.project.ts +232 -0
  513. package/extensions/google/oauth.runtime.ts +1 -0
  514. package/extensions/google/oauth.settings.ts +72 -0
  515. package/extensions/google/oauth.shared.ts +44 -0
  516. package/extensions/google/oauth.test.ts +922 -0
  517. package/extensions/google/oauth.token.ts +138 -0
  518. package/extensions/google/oauth.ts +104 -0
  519. package/extensions/google/onboard.ts +78 -0
  520. package/extensions/google/openclaw.plugin.json +706 -0
  521. package/extensions/google/package.json +19 -0
  522. package/extensions/google/plugin-registration.contract.test.ts +12 -0
  523. package/extensions/google/provider-contract-api.ts +77 -0
  524. package/extensions/google/provider-hooks.ts +18 -0
  525. package/extensions/google/provider-models.test.ts +513 -0
  526. package/extensions/google/provider-models.ts +237 -0
  527. package/extensions/google/provider-policy-api.test.ts +201 -0
  528. package/extensions/google/provider-policy-api.ts +11 -0
  529. package/extensions/google/provider-policy.ts +208 -0
  530. package/extensions/google/provider-registration.ts +72 -0
  531. package/extensions/google/provider-runtime.contract.test.ts +3 -0
  532. package/extensions/google/realtime-voice-provider.test.ts +857 -0
  533. package/extensions/google/realtime-voice-provider.ts +952 -0
  534. package/extensions/google/runtime-api.ts +19 -0
  535. package/extensions/google/setup-api.test.ts +23 -0
  536. package/extensions/google/setup-api.ts +13 -0
  537. package/extensions/google/speech-provider.test.ts +682 -0
  538. package/extensions/google/speech-provider.ts +683 -0
  539. package/extensions/google/src/gemini-web-search-provider.runtime.ts +367 -0
  540. package/extensions/google/src/gemini-web-search-provider.shared.ts +45 -0
  541. package/extensions/google/src/gemini-web-search-provider.ts +151 -0
  542. package/extensions/google/test-api.ts +6 -0
  543. package/extensions/google/thinking-api.ts +14 -0
  544. package/extensions/google/thinking.test.ts +153 -0
  545. package/extensions/google/thinking.ts +14 -0
  546. package/extensions/google/transport-stream.test.ts +1726 -0
  547. package/extensions/google/transport-stream.ts +1396 -0
  548. package/extensions/google/tsconfig.json +16 -0
  549. package/extensions/google/vertex-adc.ts +188 -0
  550. package/extensions/google/video-generation-provider.test.ts +573 -0
  551. package/extensions/google/video-generation-provider.ts +591 -0
  552. package/extensions/google/web-search-contract-api.ts +1 -0
  553. package/extensions/google/web-search-provider.test.ts +548 -0
  554. package/extensions/google/web-search-provider.ts +1 -0
  555. package/extensions/groq/api.ts +60 -0
  556. package/extensions/groq/index.test.ts +90 -0
  557. package/extensions/groq/index.ts +21 -0
  558. package/extensions/groq/media-understanding-provider.ts +21 -0
  559. package/extensions/groq/openclaw.plugin.json +314 -0
  560. package/extensions/groq/package.json +15 -0
  561. package/extensions/groq/test-api.ts +1 -0
  562. package/extensions/groq/tsconfig.json +16 -0
  563. package/extensions/huggingface/api.ts +10 -0
  564. package/extensions/huggingface/index.test.ts +81 -0
  565. package/extensions/huggingface/index.ts +60 -0
  566. package/extensions/huggingface/model-discovery-env.ts +5 -0
  567. package/extensions/huggingface/models.test.ts +98 -0
  568. package/extensions/huggingface/models.ts +218 -0
  569. package/extensions/huggingface/onboard.ts +26 -0
  570. package/extensions/huggingface/openclaw.plugin.json +57 -0
  571. package/extensions/huggingface/package.json +15 -0
  572. package/extensions/huggingface/provider-catalog.ts +22 -0
  573. package/extensions/huggingface/tsconfig.json +16 -0
  574. package/extensions/image-generation-core/api.ts +30 -0
  575. package/extensions/image-generation-core/package.json +10 -0
  576. package/extensions/image-generation-core/runtime-api.ts +6 -0
  577. package/extensions/image-generation-core/src/runtime.test.ts +29 -0
  578. package/extensions/image-generation-core/src/runtime.ts +6 -0
  579. package/extensions/image-generation-core/tsconfig.json +16 -0
  580. package/extensions/kimi-coding/api.ts +8 -0
  581. package/extensions/kimi-coding/implicit-provider.test.ts +116 -0
  582. package/extensions/kimi-coding/index.test.ts +45 -0
  583. package/extensions/kimi-coding/index.ts +113 -0
  584. package/extensions/kimi-coding/onboard.test.ts +44 -0
  585. package/extensions/kimi-coding/onboard.ts +42 -0
  586. package/extensions/kimi-coding/openclaw.plugin.json +64 -0
  587. package/extensions/kimi-coding/package.json +18 -0
  588. package/extensions/kimi-coding/provider-catalog.test.ts +23 -0
  589. package/extensions/kimi-coding/provider-catalog.ts +58 -0
  590. package/extensions/kimi-coding/replay-policy.test.ts +10 -0
  591. package/extensions/kimi-coding/replay-policy.ts +3 -0
  592. package/extensions/kimi-coding/stream.test.ts +603 -0
  593. package/extensions/kimi-coding/stream.ts +399 -0
  594. package/extensions/kimi-coding/tsconfig.json +16 -0
  595. package/extensions/litellm/api.ts +8 -0
  596. package/extensions/litellm/image-generation-provider.test.ts +348 -0
  597. package/extensions/litellm/image-generation-provider.ts +142 -0
  598. package/extensions/litellm/index.test.ts +107 -0
  599. package/extensions/litellm/index.ts +108 -0
  600. package/extensions/litellm/onboard.test.ts +21 -0
  601. package/extensions/litellm/onboard.ts +55 -0
  602. package/extensions/litellm/openclaw.plugin.json +35 -0
  603. package/extensions/litellm/package.json +15 -0
  604. package/extensions/litellm/provider-catalog.ts +10 -0
  605. package/extensions/litellm/tsconfig.json +16 -0
  606. package/extensions/lmstudio/README.md +3 -0
  607. package/extensions/lmstudio/api.ts +36 -0
  608. package/extensions/lmstudio/index.test.ts +207 -0
  609. package/extensions/lmstudio/index.ts +137 -0
  610. package/extensions/lmstudio/memory-embedding-adapter.ts +36 -0
  611. package/extensions/lmstudio/openclaw.plugin.json +53 -0
  612. package/extensions/lmstudio/package.json +15 -0
  613. package/extensions/lmstudio/plugin-registration.contract.test.ts +6 -0
  614. package/extensions/lmstudio/runtime-api.ts +35 -0
  615. package/extensions/lmstudio/src/api.ts +42 -0
  616. package/extensions/lmstudio/src/defaults.ts +14 -0
  617. package/extensions/lmstudio/src/embedding-provider.ts +147 -0
  618. package/extensions/lmstudio/src/models.fetch.ts +277 -0
  619. package/extensions/lmstudio/src/models.test.ts +491 -0
  620. package/extensions/lmstudio/src/models.ts +536 -0
  621. package/extensions/lmstudio/src/plain-text-tool-calls.ts +24 -0
  622. package/extensions/lmstudio/src/provider-auth.ts +59 -0
  623. package/extensions/lmstudio/src/runtime.test.ts +357 -0
  624. package/extensions/lmstudio/src/runtime.ts +276 -0
  625. package/extensions/lmstudio/src/setup.test.ts +1543 -0
  626. package/extensions/lmstudio/src/setup.ts +878 -0
  627. package/extensions/lmstudio/src/stream.test.ts +658 -0
  628. package/extensions/lmstudio/src/stream.ts +493 -0
  629. package/extensions/media-understanding-core/image-ops.ts +137 -0
  630. package/extensions/media-understanding-core/package.json +14 -0
  631. package/extensions/media-understanding-core/runtime-api.ts +9 -0
  632. package/extensions/media-understanding-core/src/runtime.ts +9 -0
  633. package/extensions/media-understanding-core/tsconfig.json +16 -0
  634. package/extensions/microsoft/index.ts +11 -0
  635. package/extensions/microsoft/microsoft.live.test.ts +14 -0
  636. package/extensions/microsoft/openclaw.plugin.json +15 -0
  637. package/extensions/microsoft/package.json +18 -0
  638. package/extensions/microsoft/speech-provider.test.ts +298 -0
  639. package/extensions/microsoft/speech-provider.ts +295 -0
  640. package/extensions/microsoft/test-api.ts +1 -0
  641. package/extensions/microsoft/tsconfig.json +16 -0
  642. package/extensions/microsoft/tts.test.ts +193 -0
  643. package/extensions/microsoft/tts.ts +137 -0
  644. package/extensions/minimax/README.md +37 -0
  645. package/extensions/minimax/api.ts +27 -0
  646. package/extensions/minimax/image-generation-provider.test.ts +313 -0
  647. package/extensions/minimax/image-generation-provider.ts +216 -0
  648. package/extensions/minimax/index.test.ts +408 -0
  649. package/extensions/minimax/index.ts +39 -0
  650. package/extensions/minimax/media-understanding-provider.ts +23 -0
  651. package/extensions/minimax/minimax.live.test.ts +115 -0
  652. package/extensions/minimax/model-definitions.test.ts +101 -0
  653. package/extensions/minimax/model-definitions.ts +91 -0
  654. package/extensions/minimax/music-generation-provider.test.ts +198 -0
  655. package/extensions/minimax/music-generation-provider.ts +259 -0
  656. package/extensions/minimax/oauth.runtime.ts +1 -0
  657. package/extensions/minimax/oauth.ts +233 -0
  658. package/extensions/minimax/onboard.test.ts +126 -0
  659. package/extensions/minimax/onboard.ts +104 -0
  660. package/extensions/minimax/openclaw.plugin.json +133 -0
  661. package/extensions/minimax/package.json +15 -0
  662. package/extensions/minimax/plugin-registration.contract.test.ts +15 -0
  663. package/extensions/minimax/provider-catalog.ts +86 -0
  664. package/extensions/minimax/provider-contract-api.ts +84 -0
  665. package/extensions/minimax/provider-discovery.contract.test.ts +3 -0
  666. package/extensions/minimax/provider-http.test-helpers.ts +142 -0
  667. package/extensions/minimax/provider-models.ts +21 -0
  668. package/extensions/minimax/provider-registration.ts +285 -0
  669. package/extensions/minimax/speech-provider.test.ts +576 -0
  670. package/extensions/minimax/speech-provider.ts +312 -0
  671. package/extensions/minimax/src/minimax-web-search-provider.runtime.ts +270 -0
  672. package/extensions/minimax/src/minimax-web-search-provider.test.ts +177 -0
  673. package/extensions/minimax/src/minimax-web-search-provider.ts +64 -0
  674. package/extensions/minimax/test-api.ts +11 -0
  675. package/extensions/minimax/tsconfig.json +16 -0
  676. package/extensions/minimax/tts.ts +116 -0
  677. package/extensions/minimax/video-generation-provider.test.ts +214 -0
  678. package/extensions/minimax/video-generation-provider.ts +456 -0
  679. package/extensions/minimax/web-search-contract-api.ts +35 -0
  680. package/extensions/minimax/web-search-provider.ts +1 -0
  681. package/extensions/mistral/api.test.ts +195 -0
  682. package/extensions/mistral/api.ts +81 -0
  683. package/extensions/mistral/embedding-provider.ts +52 -0
  684. package/extensions/mistral/index.ts +61 -0
  685. package/extensions/mistral/media-understanding-provider.test.ts +46 -0
  686. package/extensions/mistral/media-understanding-provider.ts +21 -0
  687. package/extensions/mistral/memory-embedding-adapter.ts +35 -0
  688. package/extensions/mistral/mistral.live.test.ts +62 -0
  689. package/extensions/mistral/model-definitions.test.ts +65 -0
  690. package/extensions/mistral/model-definitions.ts +37 -0
  691. package/extensions/mistral/onboard.test.ts +54 -0
  692. package/extensions/mistral/onboard.ts +31 -0
  693. package/extensions/mistral/openclaw.plugin.json +180 -0
  694. package/extensions/mistral/package.json +15 -0
  695. package/extensions/mistral/provider-catalog.ts +10 -0
  696. package/extensions/mistral/provider-compat.ts +62 -0
  697. package/extensions/mistral/realtime-transcription-provider.test.ts +61 -0
  698. package/extensions/mistral/realtime-transcription-provider.ts +280 -0
  699. package/extensions/mistral/test-api.ts +2 -0
  700. package/extensions/mistral/tsconfig.json +16 -0
  701. package/extensions/moonshot/api.ts +9 -0
  702. package/extensions/moonshot/index.test.ts +73 -0
  703. package/extensions/moonshot/index.ts +81 -0
  704. package/extensions/moonshot/media-understanding-provider.test.ts +92 -0
  705. package/extensions/moonshot/media-understanding-provider.ts +85 -0
  706. package/extensions/moonshot/moonshot.live.test.ts +56 -0
  707. package/extensions/moonshot/onboard.ts +38 -0
  708. package/extensions/moonshot/openclaw.plugin.json +209 -0
  709. package/extensions/moonshot/package.json +15 -0
  710. package/extensions/moonshot/provider-catalog.test.ts +84 -0
  711. package/extensions/moonshot/provider-catalog.ts +34 -0
  712. package/extensions/moonshot/provider-contract-api.ts +33 -0
  713. package/extensions/moonshot/provider-discovery.ts +17 -0
  714. package/extensions/moonshot/src/kimi-web-search-provider.runtime.ts +513 -0
  715. package/extensions/moonshot/src/kimi-web-search-provider.test.ts +297 -0
  716. package/extensions/moonshot/src/kimi-web-search-provider.ts +71 -0
  717. package/extensions/moonshot/test-api.ts +2 -0
  718. package/extensions/moonshot/tsconfig.json +16 -0
  719. package/extensions/moonshot/web-search-contract-api.ts +28 -0
  720. package/extensions/moonshot/web-search-provider.ts +1 -0
  721. package/extensions/nvidia/api.ts +6 -0
  722. package/extensions/nvidia/index.test.ts +180 -0
  723. package/extensions/nvidia/index.ts +64 -0
  724. package/extensions/nvidia/onboard.test.ts +49 -0
  725. package/extensions/nvidia/onboard.ts +30 -0
  726. package/extensions/nvidia/openclaw.plugin.json +122 -0
  727. package/extensions/nvidia/package.json +15 -0
  728. package/extensions/nvidia/plugin-registration.contract.test.ts +14 -0
  729. package/extensions/nvidia/provider-catalog.test.ts +21 -0
  730. package/extensions/nvidia/provider-catalog.ts +15 -0
  731. package/extensions/nvidia/tsconfig.json +16 -0
  732. package/extensions/ollama/README.md +3 -0
  733. package/extensions/ollama/api.ts +34 -0
  734. package/extensions/ollama/index.test.ts +979 -0
  735. package/extensions/ollama/index.ts +336 -0
  736. package/extensions/ollama/ollama.live.test.ts +287 -0
  737. package/extensions/ollama/openclaw.plugin.json +67 -0
  738. package/extensions/ollama/package.json +19 -0
  739. package/extensions/ollama/plugin-registration.contract.test.ts +7 -0
  740. package/extensions/ollama/provider-discovery.import-guard.test.ts +29 -0
  741. package/extensions/ollama/provider-discovery.test.ts +657 -0
  742. package/extensions/ollama/provider-discovery.ts +69 -0
  743. package/extensions/ollama/provider-policy-api.test.ts +72 -0
  744. package/extensions/ollama/provider-policy-api.ts +59 -0
  745. package/extensions/ollama/runtime-api.ts +22 -0
  746. package/extensions/ollama/src/defaults.ts +14 -0
  747. package/extensions/ollama/src/discovery-shared.test.ts +41 -0
  748. package/extensions/ollama/src/discovery-shared.ts +322 -0
  749. package/extensions/ollama/src/embedding-provider.test.ts +557 -0
  750. package/extensions/ollama/src/embedding-provider.ts +393 -0
  751. package/extensions/ollama/src/media-understanding-provider.ts +18 -0
  752. package/extensions/ollama/src/memory-embedding-adapter.ts +30 -0
  753. package/extensions/ollama/src/model-id.ts +24 -0
  754. package/extensions/ollama/src/ollama-json.ts +143 -0
  755. package/extensions/ollama/src/provider-base-url.test.ts +44 -0
  756. package/extensions/ollama/src/provider-base-url.ts +23 -0
  757. package/extensions/ollama/src/provider-models.ssrf.test.ts +41 -0
  758. package/extensions/ollama/src/provider-models.test.ts +312 -0
  759. package/extensions/ollama/src/provider-models.ts +327 -0
  760. package/extensions/ollama/src/setup.test.ts +771 -0
  761. package/extensions/ollama/src/setup.ts +743 -0
  762. package/extensions/ollama/src/stream-runtime.test.ts +2218 -0
  763. package/extensions/ollama/src/stream.test.ts +252 -0
  764. package/extensions/ollama/src/stream.ts +1347 -0
  765. package/extensions/ollama/src/web-search-provider.test.ts +488 -0
  766. package/extensions/ollama/src/web-search-provider.ts +350 -0
  767. package/extensions/ollama/src/wsl2-crash-loop-check.test.ts +157 -0
  768. package/extensions/ollama/src/wsl2-crash-loop-check.ts +84 -0
  769. package/extensions/ollama/tsconfig.json +16 -0
  770. package/extensions/ollama/web-search-contract-api.ts +26 -0
  771. package/extensions/ollama/web-search-provider.ts +1 -0
  772. package/extensions/openai/api.ts +16 -0
  773. package/extensions/openai/auth-choice-copy.ts +33 -0
  774. package/extensions/openai/base-url.test.ts +60 -0
  775. package/extensions/openai/base-url.ts +23 -0
  776. package/extensions/openai/default-models.test.ts +36 -0
  777. package/extensions/openai/default-models.ts +40 -0
  778. package/extensions/openai/embedding-batch.test.ts +10 -0
  779. package/extensions/openai/embedding-batch.ts +274 -0
  780. package/extensions/openai/embedding-provider.test.ts +102 -0
  781. package/extensions/openai/embedding-provider.ts +110 -0
  782. package/extensions/openai/image-generation-provider.test.ts +1624 -0
  783. package/extensions/openai/image-generation-provider.ts +903 -0
  784. package/extensions/openai/index.test.ts +630 -0
  785. package/extensions/openai/index.ts +58 -0
  786. package/extensions/openai/media-understanding-provider.test.ts +119 -0
  787. package/extensions/openai/media-understanding-provider.ts +51 -0
  788. package/extensions/openai/memory-embedding-adapter.test.ts +82 -0
  789. package/extensions/openai/memory-embedding-adapter.ts +68 -0
  790. package/extensions/openai/native-web-search.ts +103 -0
  791. package/extensions/openai/openai-codex-auth-identity.test.ts +77 -0
  792. package/extensions/openai/openai-codex-auth-identity.ts +100 -0
  793. package/extensions/openai/openai-codex-catalog.ts +12 -0
  794. package/extensions/openai/openai-codex-device-code.test.ts +248 -0
  795. package/extensions/openai/openai-codex-device-code.ts +309 -0
  796. package/extensions/openai/openai-codex-oauth.runtime.ts +348 -0
  797. package/extensions/openai/openai-codex-provider.runtime.ts +45 -0
  798. package/extensions/openai/openai-codex-provider.test.ts +883 -0
  799. package/extensions/openai/openai-codex-provider.ts +636 -0
  800. package/extensions/openai/openai-codex-shared.ts +3 -0
  801. package/extensions/openai/openai-provider.live.test.ts +196 -0
  802. package/extensions/openai/openai-provider.test.ts +929 -0
  803. package/extensions/openai/openai-provider.ts +325 -0
  804. package/extensions/openai/openai-tts.live.test.ts +44 -0
  805. package/extensions/openai/openai.live.test.ts +493 -0
  806. package/extensions/openai/openclaw.plugin.json +897 -0
  807. package/extensions/openai/openclaw.plugin.test.ts +181 -0
  808. package/extensions/openai/package.json +19 -0
  809. package/extensions/openai/plugin-registration.contract.test.ts +9 -0
  810. package/extensions/openai/prompt-overlay.ts +51 -0
  811. package/extensions/openai/provider-auth.contract.test.ts +12 -0
  812. package/extensions/openai/provider-catalog.contract.test.ts +3 -0
  813. package/extensions/openai/provider-contract-api.ts +83 -0
  814. package/extensions/openai/provider-policy-api.ts +20 -0
  815. package/extensions/openai/provider-runtime.contract.test.ts +3 -0
  816. package/extensions/openai/realtime-provider-shared.ts +168 -0
  817. package/extensions/openai/realtime-transcription-provider.test.ts +356 -0
  818. package/extensions/openai/realtime-transcription-provider.ts +307 -0
  819. package/extensions/openai/realtime-voice-provider.test.ts +1924 -0
  820. package/extensions/openai/realtime-voice-provider.ts +1315 -0
  821. package/extensions/openai/register.runtime.ts +15 -0
  822. package/extensions/openai/replay-policy.ts +32 -0
  823. package/extensions/openai/setup-api.test.ts +29 -0
  824. package/extensions/openai/setup-api.ts +166 -0
  825. package/extensions/openai/shared.ts +131 -0
  826. package/extensions/openai/speech-provider.test.ts +324 -0
  827. package/extensions/openai/speech-provider.ts +347 -0
  828. package/extensions/openai/test-api.ts +9 -0
  829. package/extensions/openai/test-support/provider-catalog.contract-test-support.ts +134 -0
  830. package/extensions/openai/thinking-policy.ts +55 -0
  831. package/extensions/openai/transport-policy.test.ts +128 -0
  832. package/extensions/openai/transport-policy.ts +111 -0
  833. package/extensions/openai/tsconfig.json +16 -0
  834. package/extensions/openai/tts.test.ts +444 -0
  835. package/extensions/openai/tts.ts +184 -0
  836. package/extensions/openai/video-generation-provider.test.ts +254 -0
  837. package/extensions/openai/video-generation-provider.ts +382 -0
  838. package/extensions/opencode/api.ts +9 -0
  839. package/extensions/opencode/index.test.ts +84 -0
  840. package/extensions/opencode/index.ts +74 -0
  841. package/extensions/opencode/media-understanding-provider.test.ts +44 -0
  842. package/extensions/opencode/media-understanding-provider.ts +42 -0
  843. package/extensions/opencode/onboard.test.ts +25 -0
  844. package/extensions/opencode/onboard.ts +29 -0
  845. package/extensions/opencode/openclaw.plugin.json +55 -0
  846. package/extensions/opencode/package.json +15 -0
  847. package/extensions/opencode/plugin-registration.contract.test.ts +8 -0
  848. package/extensions/opencode/provider-policy-api.test.ts +44 -0
  849. package/extensions/opencode/provider-policy-api.ts +5 -0
  850. package/extensions/opencode/tsconfig.json +16 -0
  851. package/extensions/opencode-go/api.ts +27 -0
  852. package/extensions/opencode-go/index.test.ts +305 -0
  853. package/extensions/opencode-go/index.ts +101 -0
  854. package/extensions/opencode-go/media-understanding-provider.test.ts +12 -0
  855. package/extensions/opencode-go/media-understanding-provider.ts +15 -0
  856. package/extensions/opencode-go/onboard.test.ts +28 -0
  857. package/extensions/opencode-go/onboard.ts +17 -0
  858. package/extensions/opencode-go/openclaw.plugin.json +106 -0
  859. package/extensions/opencode-go/package.json +15 -0
  860. package/extensions/opencode-go/plugin-registration.contract.test.ts +8 -0
  861. package/extensions/opencode-go/provider-catalog.ts +135 -0
  862. package/extensions/opencode-go/stream.ts +51 -0
  863. package/extensions/opencode-go/tsconfig.json +16 -0
  864. package/extensions/openrouter/api.ts +12 -0
  865. package/extensions/openrouter/image-generation-provider.test.ts +361 -0
  866. package/extensions/openrouter/image-generation-provider.ts +345 -0
  867. package/extensions/openrouter/index.test.ts +650 -0
  868. package/extensions/openrouter/index.ts +184 -0
  869. package/extensions/openrouter/media-understanding-provider.test.ts +260 -0
  870. package/extensions/openrouter/media-understanding-provider.ts +176 -0
  871. package/extensions/openrouter/models.ts +18 -0
  872. package/extensions/openrouter/music-generation-provider.test.ts +226 -0
  873. package/extensions/openrouter/music-generation-provider.ts +344 -0
  874. package/extensions/openrouter/onboard.test.ts +27 -0
  875. package/extensions/openrouter/onboard.ts +32 -0
  876. package/extensions/openrouter/openclaw.plugin.json +81 -0
  877. package/extensions/openrouter/openrouter.live.test.ts +118 -0
  878. package/extensions/openrouter/package.json +15 -0
  879. package/extensions/openrouter/provider-catalog.ts +88 -0
  880. package/extensions/openrouter/provider-contract-api.ts +27 -0
  881. package/extensions/openrouter/provider-policy-api.ts +5 -0
  882. package/extensions/openrouter/provider-routing.ts +87 -0
  883. package/extensions/openrouter/provider-runtime.contract.test.ts +3 -0
  884. package/extensions/openrouter/speech-provider.test.ts +218 -0
  885. package/extensions/openrouter/speech-provider.ts +46 -0
  886. package/extensions/openrouter/stream.ts +247 -0
  887. package/extensions/openrouter/test-api.ts +4 -0
  888. package/extensions/openrouter/thinking-policy.ts +34 -0
  889. package/extensions/openrouter/tsconfig.json +16 -0
  890. package/extensions/openrouter/video-generation-provider.test.ts +722 -0
  891. package/extensions/openrouter/video-generation-provider.ts +530 -0
  892. package/extensions/openrouter/video-http.ts +48 -0
  893. package/extensions/openrouter/video-model-catalog.ts +299 -0
  894. package/extensions/openshell/index.ts +28 -0
  895. package/extensions/openshell/npm-shrinkwrap.json +24 -0
  896. package/extensions/openshell/openclaw.plugin.json +118 -0
  897. package/extensions/openshell/package.json +37 -0
  898. package/extensions/openshell/src/backend.e2e.test.ts +595 -0
  899. package/extensions/openshell/src/backend.test.ts +40 -0
  900. package/extensions/openshell/src/backend.ts +512 -0
  901. package/extensions/openshell/src/backend.types.ts +11 -0
  902. package/extensions/openshell/src/cli.ts +85 -0
  903. package/extensions/openshell/src/config.test.ts +80 -0
  904. package/extensions/openshell/src/config.ts +194 -0
  905. package/extensions/openshell/src/fs-bridge.ts +370 -0
  906. package/extensions/openshell/src/mirror.test.ts +194 -0
  907. package/extensions/openshell/src/mirror.ts +141 -0
  908. package/extensions/openshell/src/openshell-core.test.ts +529 -0
  909. package/extensions/openshell/tsconfig.json +16 -0
  910. package/extensions/perplexity/index.ts +11 -0
  911. package/extensions/perplexity/openclaw.plugin.json +52 -0
  912. package/extensions/perplexity/package.json +15 -0
  913. package/extensions/perplexity/src/perplexity-web-search-provider.runtime.ts +551 -0
  914. package/extensions/perplexity/src/perplexity-web-search-provider.shared.ts +124 -0
  915. package/extensions/perplexity/src/perplexity-web-search-provider.test.ts +151 -0
  916. package/extensions/perplexity/src/perplexity-web-search-provider.ts +127 -0
  917. package/extensions/perplexity/test-api.ts +1 -0
  918. package/extensions/perplexity/tsconfig.json +16 -0
  919. package/extensions/perplexity/web-search-contract-api.ts +13 -0
  920. package/extensions/perplexity/web-search-provider.ts +1 -0
  921. package/extensions/qianfan/api.ts +6 -0
  922. package/extensions/qianfan/index.test.ts +133 -0
  923. package/extensions/qianfan/index.ts +31 -0
  924. package/extensions/qianfan/onboard.ts +61 -0
  925. package/extensions/qianfan/openclaw.plugin.json +78 -0
  926. package/extensions/qianfan/package.json +15 -0
  927. package/extensions/qianfan/provider-catalog.ts +13 -0
  928. package/extensions/qianfan/tsconfig.json +16 -0
  929. package/extensions/qwen/api.ts +34 -0
  930. package/extensions/qwen/index.test.ts +31 -0
  931. package/extensions/qwen/index.ts +181 -0
  932. package/extensions/qwen/media-understanding-provider.test.ts +76 -0
  933. package/extensions/qwen/media-understanding-provider.ts +88 -0
  934. package/extensions/qwen/model-definitions.ts +20 -0
  935. package/extensions/qwen/models.ts +202 -0
  936. package/extensions/qwen/onboard.ts +73 -0
  937. package/extensions/qwen/openclaw.plugin.json +143 -0
  938. package/extensions/qwen/package.json +15 -0
  939. package/extensions/qwen/plugin-registration.contract.test.ts +10 -0
  940. package/extensions/qwen/provider-catalog.test.ts +62 -0
  941. package/extensions/qwen/provider-catalog.ts +13 -0
  942. package/extensions/qwen/provider-discovery.contract.test.ts +3 -0
  943. package/extensions/qwen/stream.test.ts +171 -0
  944. package/extensions/qwen/stream.ts +87 -0
  945. package/extensions/qwen/test-api.ts +2 -0
  946. package/extensions/qwen/tsconfig.json +16 -0
  947. package/extensions/qwen/video-generation-provider.test.ts +155 -0
  948. package/extensions/qwen/video-generation-provider.ts +111 -0
  949. package/extensions/runway/index.ts +11 -0
  950. package/extensions/runway/openclaw.plugin.json +34 -0
  951. package/extensions/runway/package.json +15 -0
  952. package/extensions/runway/plugin-registration.contract.test.ts +7 -0
  953. package/extensions/runway/tsconfig.json +16 -0
  954. package/extensions/runway/video-generation-provider.test.ts +248 -0
  955. package/extensions/runway/video-generation-provider.ts +462 -0
  956. package/extensions/senseaudio/index.ts +11 -0
  957. package/extensions/senseaudio/media-understanding-provider.test.ts +136 -0
  958. package/extensions/senseaudio/media-understanding-provider.ts +25 -0
  959. package/extensions/senseaudio/openclaw.plugin.json +18 -0
  960. package/extensions/senseaudio/package.json +15 -0
  961. package/extensions/senseaudio/test-api.ts +1 -0
  962. package/extensions/sglang/README.md +3 -0
  963. package/extensions/sglang/api.ts +7 -0
  964. package/extensions/sglang/defaults.ts +4 -0
  965. package/extensions/sglang/index.test.ts +34 -0
  966. package/extensions/sglang/index.ts +95 -0
  967. package/extensions/sglang/models.ts +23 -0
  968. package/extensions/sglang/openclaw.plugin.json +45 -0
  969. package/extensions/sglang/package.json +15 -0
  970. package/extensions/sglang/provider-discovery.contract.test.ts +7 -0
  971. package/extensions/sglang/tsconfig.json +16 -0
  972. package/extensions/skill-workshop/api.ts +3 -0
  973. package/extensions/skill-workshop/index.test.ts +990 -0
  974. package/extensions/skill-workshop/index.ts +170 -0
  975. package/extensions/skill-workshop/openclaw.plugin.json +83 -0
  976. package/extensions/skill-workshop/package.json +18 -0
  977. package/extensions/skill-workshop/src/config.ts +50 -0
  978. package/extensions/skill-workshop/src/prompt.ts +18 -0
  979. package/extensions/skill-workshop/src/reviewer.ts +290 -0
  980. package/extensions/skill-workshop/src/scanner.ts +69 -0
  981. package/extensions/skill-workshop/src/signals.ts +95 -0
  982. package/extensions/skill-workshop/src/skills.ts +186 -0
  983. package/extensions/skill-workshop/src/store.ts +184 -0
  984. package/extensions/skill-workshop/src/text.ts +59 -0
  985. package/extensions/skill-workshop/src/tool.ts +200 -0
  986. package/extensions/skill-workshop/src/types.ts +42 -0
  987. package/extensions/skill-workshop/src/workshop.ts +85 -0
  988. package/extensions/speech-core/api.ts +54 -0
  989. package/extensions/speech-core/package.json +10 -0
  990. package/extensions/speech-core/runtime-api.ts +42 -0
  991. package/extensions/speech-core/src/tts.test.ts +1025 -0
  992. package/extensions/speech-core/src/tts.ts +1929 -0
  993. package/extensions/speech-core/tsconfig.json +16 -0
  994. package/extensions/stepfun/index.ts +252 -0
  995. package/extensions/stepfun/onboard.ts +73 -0
  996. package/extensions/stepfun/openclaw.plugin.json +148 -0
  997. package/extensions/stepfun/package.json +15 -0
  998. package/extensions/stepfun/provider-catalog.ts +40 -0
  999. package/extensions/stepfun/tsconfig.json +16 -0
  1000. package/extensions/tencent/api.ts +7 -0
  1001. package/extensions/tencent/index.ts +64 -0
  1002. package/extensions/tencent/models.ts +25 -0
  1003. package/extensions/tencent/onboard.ts +38 -0
  1004. package/extensions/tencent/openclaw.plugin.json +86 -0
  1005. package/extensions/tencent/package.json +15 -0
  1006. package/extensions/tencent/provider-catalog.ts +14 -0
  1007. package/extensions/tencent/provider-discovery.ts +17 -0
  1008. package/extensions/tencent/tsconfig.json +16 -0
  1009. package/extensions/together/api.ts +7 -0
  1010. package/extensions/together/index.ts +42 -0
  1011. package/extensions/together/models.ts +23 -0
  1012. package/extensions/together/onboard.ts +26 -0
  1013. package/extensions/together/openclaw.plugin.json +160 -0
  1014. package/extensions/together/package.json +15 -0
  1015. package/extensions/together/plugin-registration.contract.test.ts +8 -0
  1016. package/extensions/together/provider-catalog.ts +10 -0
  1017. package/extensions/together/tsconfig.json +16 -0
  1018. package/extensions/together/video-generation-provider.test.ts +130 -0
  1019. package/extensions/together/video-generation-provider.ts +281 -0
  1020. package/extensions/tts-local-cli/index.ts +11 -0
  1021. package/extensions/tts-local-cli/openclaw.plugin.json +15 -0
  1022. package/extensions/tts-local-cli/package.json +15 -0
  1023. package/extensions/tts-local-cli/speech-provider.test.ts +307 -0
  1024. package/extensions/tts-local-cli/speech-provider.ts +455 -0
  1025. package/extensions/venice/api.ts +8 -0
  1026. package/extensions/venice/index.test.ts +109 -0
  1027. package/extensions/venice/index.ts +70 -0
  1028. package/extensions/venice/models.test.ts +291 -0
  1029. package/extensions/venice/models.ts +302 -0
  1030. package/extensions/venice/onboard.ts +27 -0
  1031. package/extensions/venice/openclaw.plugin.json +504 -0
  1032. package/extensions/venice/package.json +15 -0
  1033. package/extensions/venice/provider-catalog.ts +11 -0
  1034. package/extensions/venice/provider-runtime.contract.test.ts +3 -0
  1035. package/extensions/venice/stream.ts +37 -0
  1036. package/extensions/venice/tsconfig.json +16 -0
  1037. package/extensions/vercel-ai-gateway/api.ts +12 -0
  1038. package/extensions/vercel-ai-gateway/index.ts +41 -0
  1039. package/extensions/vercel-ai-gateway/models.ts +226 -0
  1040. package/extensions/vercel-ai-gateway/onboard.ts +32 -0
  1041. package/extensions/vercel-ai-gateway/openclaw.plugin.json +61 -0
  1042. package/extensions/vercel-ai-gateway/package.json +15 -0
  1043. package/extensions/vercel-ai-gateway/provider-catalog.test.ts +96 -0
  1044. package/extensions/vercel-ai-gateway/provider-catalog.ts +22 -0
  1045. package/extensions/vercel-ai-gateway/thinking.test.ts +100 -0
  1046. package/extensions/vercel-ai-gateway/thinking.ts +77 -0
  1047. package/extensions/vercel-ai-gateway/tsconfig.json +16 -0
  1048. package/extensions/vllm/README.md +3 -0
  1049. package/extensions/vllm/api.ts +8 -0
  1050. package/extensions/vllm/defaults.ts +4 -0
  1051. package/extensions/vllm/index.ts +96 -0
  1052. package/extensions/vllm/models.ts +23 -0
  1053. package/extensions/vllm/openclaw.plugin.json +45 -0
  1054. package/extensions/vllm/package.json +15 -0
  1055. package/extensions/vllm/provider-discovery.contract.test.ts +7 -0
  1056. package/extensions/vllm/register.runtime.ts +7 -0
  1057. package/extensions/vllm/stream.test.ts +282 -0
  1058. package/extensions/vllm/stream.ts +164 -0
  1059. package/extensions/vllm/tsconfig.json +16 -0
  1060. package/extensions/volcengine/api.ts +56 -0
  1061. package/extensions/volcengine/index.test.ts +92 -0
  1062. package/extensions/volcengine/index.ts +87 -0
  1063. package/extensions/volcengine/models.ts +28 -0
  1064. package/extensions/volcengine/openclaw.plugin.json +221 -0
  1065. package/extensions/volcengine/package.json +15 -0
  1066. package/extensions/volcengine/provider-catalog.ts +17 -0
  1067. package/extensions/volcengine/provider-discovery.ts +31 -0
  1068. package/extensions/volcengine/speech-provider.ts +229 -0
  1069. package/extensions/volcengine/tsconfig.json +16 -0
  1070. package/extensions/volcengine/tts.live.test.ts +30 -0
  1071. package/extensions/volcengine/tts.test.ts +279 -0
  1072. package/extensions/volcengine/tts.ts +266 -0
  1073. package/extensions/voyage/embedding-batch.ts +315 -0
  1074. package/extensions/voyage/embedding-provider.ts +90 -0
  1075. package/extensions/voyage/index.ts +11 -0
  1076. package/extensions/voyage/memory-embedding-adapter.ts +56 -0
  1077. package/extensions/voyage/openclaw.plugin.json +18 -0
  1078. package/extensions/voyage/package.json +15 -0
  1079. package/extensions/xai/.boundary-stubs/anthropic-vertex-api.d.ts +2 -0
  1080. package/extensions/xai/.boundary-stubs/ollama-api.d.ts +1 -0
  1081. package/extensions/xai/.boundary-stubs/ollama-runtime-api.d.ts +16 -0
  1082. package/extensions/xai/.boundary-stubs/speech-core-runtime-api.d.ts +33 -0
  1083. package/extensions/xai/api.test.ts +51 -0
  1084. package/extensions/xai/api.ts +119 -0
  1085. package/extensions/xai/code-execution.test.ts +262 -0
  1086. package/extensions/xai/code-execution.ts +146 -0
  1087. package/extensions/xai/image-generation-provider.test.ts +293 -0
  1088. package/extensions/xai/image-generation-provider.ts +124 -0
  1089. package/extensions/xai/index.test.ts +263 -0
  1090. package/extensions/xai/index.ts +233 -0
  1091. package/extensions/xai/model-compat.ts +34 -0
  1092. package/extensions/xai/model-definitions.ts +346 -0
  1093. package/extensions/xai/model-id.test.ts +32 -0
  1094. package/extensions/xai/model-id.ts +24 -0
  1095. package/extensions/xai/onboard.test.ts +91 -0
  1096. package/extensions/xai/onboard.ts +56 -0
  1097. package/extensions/xai/openclaw.plugin.json +274 -0
  1098. package/extensions/xai/package.json +20 -0
  1099. package/extensions/xai/plugin-registration.contract.test.ts +11 -0
  1100. package/extensions/xai/provider-catalog.ts +12 -0
  1101. package/extensions/xai/provider-contract-api.ts +22 -0
  1102. package/extensions/xai/provider-discovery.ts +27 -0
  1103. package/extensions/xai/provider-models.ts +45 -0
  1104. package/extensions/xai/provider-policy-api.test.ts +37 -0
  1105. package/extensions/xai/provider-policy-api.ts +18 -0
  1106. package/extensions/xai/realtime-transcription-provider.test.ts +273 -0
  1107. package/extensions/xai/realtime-transcription-provider.ts +306 -0
  1108. package/extensions/xai/runtime-model-compat.test.ts +60 -0
  1109. package/extensions/xai/runtime-model-compat.ts +72 -0
  1110. package/extensions/xai/setup-api.ts +22 -0
  1111. package/extensions/xai/speech-provider.test.ts +184 -0
  1112. package/extensions/xai/speech-provider.ts +275 -0
  1113. package/extensions/xai/src/code-execution-shared.ts +110 -0
  1114. package/extensions/xai/src/responses-tool-shared.test.ts +107 -0
  1115. package/extensions/xai/src/responses-tool-shared.ts +163 -0
  1116. package/extensions/xai/src/tool-auth-shared.test.ts +326 -0
  1117. package/extensions/xai/src/tool-auth-shared.ts +219 -0
  1118. package/extensions/xai/src/tool-config-shared.test.ts +36 -0
  1119. package/extensions/xai/src/tool-config-shared.ts +32 -0
  1120. package/extensions/xai/src/web-search-provider.runtime.ts +429 -0
  1121. package/extensions/xai/src/web-search-response.types.ts +25 -0
  1122. package/extensions/xai/src/web-search-shared.ts +124 -0
  1123. package/extensions/xai/src/x-search-config.ts +78 -0
  1124. package/extensions/xai/src/x-search-shared.ts +146 -0
  1125. package/extensions/xai/src/xai-user-agent.test.ts +59 -0
  1126. package/extensions/xai/src/xai-user-agent.ts +52 -0
  1127. package/extensions/xai/stream.test.ts +410 -0
  1128. package/extensions/xai/stream.ts +359 -0
  1129. package/extensions/xai/stt.test.ts +106 -0
  1130. package/extensions/xai/stt.ts +91 -0
  1131. package/extensions/xai/test-api.ts +1 -0
  1132. package/extensions/xai/test-helpers.ts +73 -0
  1133. package/extensions/xai/tsconfig.json +64 -0
  1134. package/extensions/xai/tts.test.ts +125 -0
  1135. package/extensions/xai/tts.ts +97 -0
  1136. package/extensions/xai/video-generation-provider.test.ts +443 -0
  1137. package/extensions/xai/video-generation-provider.ts +499 -0
  1138. package/extensions/xai/web-search-contract-api.ts +29 -0
  1139. package/extensions/xai/web-search.test.ts +1242 -0
  1140. package/extensions/xai/web-search.ts +68 -0
  1141. package/extensions/xai/x-search-tool-shared.ts +48 -0
  1142. package/extensions/xai/x-search.live.test.ts +76 -0
  1143. package/extensions/xai/x-search.test.ts +484 -0
  1144. package/extensions/xai/x-search.ts +230 -0
  1145. package/extensions/xai/xai-oauth.test.ts +387 -0
  1146. package/extensions/xai/xai-oauth.ts +752 -0
  1147. package/extensions/xai/xai.live.test.ts +323 -0
  1148. package/launcher.js +97 -0
  1149. package/logger.js +87 -0
  1150. package/package.json +21 -0
  1151. package/server.js +1800 -0
  1152. package/skills/ai-error-prevention/SKILL.md +105 -0
  1153. package/skills/api-design/SKILL.md +523 -0
  1154. package/skills/architecture-decision-records/SKILL.md +179 -0
  1155. package/skills/autonomous-loops/SKILL.md +610 -0
  1156. package/skills/backend-patterns/SKILL.md +598 -0
  1157. package/skills/codebase-onboarding/SKILL.md +233 -0
  1158. package/skills/coding-standards/SKILL.md +530 -0
  1159. package/skills/database-migrations/SKILL.md +429 -0
  1160. package/skills/deep-research/SKILL.md +155 -0
  1161. package/skills/error-prevention/SKILL.md +61 -0
  1162. package/skills/exa-search/SKILL.md +103 -0
  1163. package/skills/frontend-slides/SKILL.md +184 -0
  1164. package/skills/frontend-slides/STYLE_PRESETS.md +330 -0
  1165. package/skills/git-workflow/SKILL.md +715 -0
  1166. package/skills/iterative-retrieval/SKILL.md +211 -0
  1167. package/skills/php-security/SKILL.md +70 -0
  1168. package/skills/php-security/rules/thinkphp-security.rules +23 -0
  1169. package/skills/requirement-ears/SKILL.md +31 -0
  1170. package/skills/rules-distill/SKILL.md +264 -0
  1171. package/skills/rules-distill/scripts/scan-rules.sh +58 -0
  1172. package/skills/rules-distill/scripts/scan-skills.sh +129 -0
  1173. package/skills/search-first/SKILL.md +161 -0
  1174. package/skills/security-review/SKILL.md +495 -0
  1175. package/skills/security-review/cloud-infrastructure-security.md +361 -0
  1176. package/skills/security-scan/SKILL.md +68 -0
  1177. package/skills/security-scan/scripts/scan-config.ps1 +31 -0
  1178. package/skills/security-scan/scripts/scan-sqli.ps1 +21 -0
  1179. package/skills/skill-stocktake/SKILL.md +193 -0
  1180. package/skills/skill-stocktake/scripts/quick-diff.sh +87 -0
  1181. package/skills/skill-stocktake/scripts/save-results.sh +56 -0
  1182. package/skills/skill-stocktake/scripts/scan.sh +170 -0
  1183. package/skills/strategic-compact/SKILL.md +131 -0
  1184. package/skills/strategic-compact/suggest-compact.sh +54 -0
  1185. package/skills/tdd-workflow/SKILL.md +90 -0
  1186. package/skills/tdd-workflow/examples/IntegrationTestExample.php +35 -0
  1187. package/skills/tdd-workflow/examples/UnitTestExample.php +39 -0
  1188. package/skills/ui-spec-guider/ui-spec-guider/SKILL.md +37 -0
  1189. package/skills/ui-spec-guider/ui-spec-guider.skill +0 -0
  1190. package/skills/verification-loop/SKILL.md +126 -0
  1191. package/start.bat +29 -0
@@ -0,0 +1,1924 @@
1
+ import { REALTIME_VOICE_AUDIO_FORMAT_PCM16_24KHZ } from "openclaw/plugin-sdk/realtime-voice";
2
+ import { afterEach, beforeEach, describe, expect, it, vi } from "vitest";
3
+ import { buildOpenAIRealtimeVoiceProvider } from "./realtime-voice-provider.js";
4
+
5
// Shared fakes are built inside vi.hoisted so the vi.mock factories in this
// file can reference them.
const {
  FakeWebSocket,
  execFileSyncMock,
  fetchWithSsrFGuardMock,
  isProviderAuthProfileConfiguredMock,
  resolveProviderAuthProfileApiKeyMock,
} = vi.hoisted(() => {
  type Listener = (...args: unknown[]) => void;

  /**
   * Minimal in-memory WebSocket double. It records constructor arguments,
   * every payload passed to `send`, and whether `close`/`terminate` ran, and
   * lets tests trigger events manually through `emit`.
   */
  class MockWebSocket {
    static readonly OPEN = 1;
    static readonly CLOSED = 3;
    /** Every instance constructed so far; tests reset this between cases. */
    static instances: MockWebSocket[] = [];

    readonly listeners = new Map<string, Listener[]>();
    readyState = 0;
    sent: string[] = [];
    closed = false;
    terminated = false;
    args: unknown[];

    constructor(...args: unknown[]) {
      this.args = args;
      MockWebSocket.instances.push(this);
    }

    /** Registers `listener` for `event` and returns the socket for chaining. */
    on(event: string, listener: Listener): this {
      const registered = this.listeners.get(event);
      if (registered) {
        registered.push(listener);
      } else {
        this.listeners.set(event, [listener]);
      }
      return this;
    }

    /** Synchronously invokes each listener registered for `event`. */
    emit(event: string, ...args: unknown[]): void {
      const registered = this.listeners.get(event);
      if (!registered) {
        return;
      }
      for (const notify of registered) {
        notify(...args);
      }
    }

    /** Records the outgoing payload instead of transmitting it. */
    send(payload: string): void {
      this.sent.push(payload);
    }

    /** Marks the socket closed and emits "close" with the code and a Buffer reason. */
    close(code?: number, reason?: string): void {
      this.closed = true;
      this.readyState = MockWebSocket.CLOSED;
      const closeCode = code ?? 1000;
      const closeReason = Buffer.from(reason ?? "");
      this.emit("close", closeCode, closeReason);
    }

    /** Flags the socket as terminated, then closes it with code 1006. */
    terminate(): void {
      this.terminated = true;
      this.close(1006, "terminated");
    }
  }

  const hoisted = {
    FakeWebSocket: MockWebSocket,
    execFileSyncMock: vi.fn(),
    fetchWithSsrFGuardMock: vi.fn(),
    isProviderAuthProfileConfiguredMock: vi.fn(),
    resolveProviderAuthProfileApiKeyMock: vi.fn(),
  };
  return hoisted;
});
68
+
69
// Keep the real child_process exports but replace execFileSync with the mock.
vi.mock("node:child_process", async (importOriginal) => {
  const realChildProcess = await importOriginal<typeof import("node:child_process")>();
  return { ...realChildProcess, execFileSync: execFileSyncMock };
});

// The "ws" default export becomes the fake socket class.
vi.mock("ws", () => {
  return { default: FakeWebSocket };
});

// fetchWithSsrFGuard is replaced by a mock the tests configure and inspect.
vi.mock("openclaw/plugin-sdk/ssrf-runtime", () => {
  return { fetchWithSsrFGuard: fetchWithSsrFGuardMock };
});

// Provider auth-profile lookups are replaced by mocks.
vi.mock("openclaw/plugin-sdk/provider-auth", () => {
  return {
    isProviderAuthProfileConfigured: isProviderAuthProfileConfiguredMock,
    resolveProviderAuthProfileApiKey: resolveProviderAuthProfileApiKeyMock,
  };
});
89
+
90
/** Instance type of the hoisted fake WebSocket class. */
type FakeWebSocketInstance = InstanceType<typeof FakeWebSocket>;

/** `session.audio.input` portion of a sent event. */
type SentSessionAudioInput = {
  format?: Record<string, unknown>;
  noise_reduction?: Record<string, unknown> | null;
  transcription?: Record<string, unknown>;
  turn_detection?: {
    create_response?: boolean;
    interrupt_response?: boolean;
  };
};

/** `session.audio.output` portion of a sent event. */
type SentSessionAudioOutput = {
  format?: Record<string, unknown>;
  voice?: string;
};

/** `session` payload of a sent event. */
type SentSession = {
  type?: string;
  model?: string;
  modalities?: string[];
  instructions?: string;
  voice?: string;
  input_audio_format?: string;
  output_audio_format?: string;
  input_audio_transcription?: Record<string, unknown>;
  turn_detection?: {
    create_response?: boolean;
  };
  output_modalities?: string[];
  audio?: {
    input?: SentSessionAudioInput;
    output?: SentSessionAudioOutput;
  };
  item?: unknown;
};

/** Shape the tests assume for JSON payloads read back from the fake socket's `sent` buffer. */
type SentRealtimeEvent = {
  type: string;
  audio?: string;
  item_id?: string;
  content_index?: number;
  audio_end_ms?: number;
  session?: SentSession;
};
128
+
129
/**
 * Decodes every payload recorded by the fake socket, in send order.
 *
 * @param socket - Fake socket whose `sent` array holds JSON strings.
 * @returns One parsed event per recorded payload.
 */
function parseSent(socket: FakeWebSocketInstance): SentRealtimeEvent[] {
  const events: SentRealtimeEvent[] = [];
  for (const payload of socket.sent) {
    events.push(JSON.parse(payload) as SentRealtimeEvent);
  }
  return events;
}
132
+
133
/**
 * Builds a `Response` whose body is `body` serialized as JSON.
 *
 * @param body - Value passed to `JSON.stringify`.
 * @param init - Optional overrides; `status` falls back to 200 when nullish.
 * @returns A response carrying a `Content-Type: application/json` header.
 */
function createJsonResponse(body: unknown, init?: { status?: number }): Response {
  const payload = JSON.stringify(body);
  const status = init?.status ?? 200;
  const headers = { "Content-Type": "application/json" };
  return new Response(payload, { status, headers });
}
141
+
142
/**
 * Type guard for non-null, non-array values whose `typeof` is "object".
 *
 * @param value - Candidate value.
 * @returns `true` when `value` can be treated as a string-keyed record.
 */
function isRecord(value: unknown): value is Record<string, unknown> {
  if (value === null || Array.isArray(value)) {
    return false;
  }
  return typeof value === "object";
}
145
+
146
/**
 * Asserts that `value` is a record and returns it typed as one.
 *
 * @param value - Candidate value.
 * @param label - Name used in the assertion message.
 * @returns `value`, cast to a string-keyed record.
 */
function requireRecord(value: unknown, label: string): Record<string, unknown> {
  const looksLikeRecord = isRecord(value);
  expect(looksLikeRecord, `${label} must be an object`).toBe(true);
  return value as Record<string, unknown>;
}
150
+
151
/**
 * Walks `path` key by key from `value`, asserting that the root and every
 * intermediate value is a record.
 *
 * @param value - Root value to descend from.
 * @param path - Keys to follow, in order.
 * @param label - Prefix for assertion messages; defaults to the dotted path.
 * @returns The record found at the end of `path`.
 */
function requireNestedRecord(
  value: unknown,
  path: readonly string[],
  label = path.join("."),
): Record<string, unknown> {
  const root = requireRecord(value, label);
  return path.reduce<Record<string, unknown>>(
    (parent, key) => requireRecord(parent[key], `${label}.${key}`),
    root,
  );
}
162
+
163
/**
 * Asserts that `value` is a record and that each key listed in `expected`
 * deep-equals the corresponding expected value. Keys not listed in
 * `expected` are not checked.
 *
 * @param value - Candidate record.
 * @param label - Name used in assertion messages.
 * @param expected - Subset of fields to compare with `toEqual`.
 * @returns The validated record.
 */
function expectRecordFields(
  value: unknown,
  label: string,
  expected: Record<string, unknown>,
): Record<string, unknown> {
  const record = requireRecord(value, label);
  Object.entries(expected).forEach(([key, expectedValue]) => {
    expect(record[key], `${label}.${key}`).toEqual(expectedValue);
  });
  return record;
}
174
+
175
/**
 * Returns the argument list of the first recorded call on a mock.
 *
 * @param mock - Object exposing recorded calls at `mock.calls`.
 * @param label - Name used in the error message.
 * @returns The arguments of the first call.
 * @throws Error when the mock has no recorded first call.
 */
function firstMockCall(
  mock: { mock: { calls: Array<readonly unknown[]> } },
  label: string,
): readonly unknown[] {
  const { calls } = mock.mock;
  const first = calls[0];
  if (first) {
    return first;
  }
  throw new Error(`expected ${label} call`);
}
185
+
186
/**
 * Returns the first argument of a recorded `fetchWithSsrFGuardMock` call,
 * asserting that it is a record.
 *
 * @param callIndex - Which recorded call to inspect (defaults to the first).
 */
function requireFetchRequest(callIndex = 0): Record<string, unknown> {
  const recordedCall = fetchWithSsrFGuardMock.mock.calls[callIndex];
  return requireRecord(recordedCall?.[0], "fetch request");
}
189
+
190
/**
 * Returns the `init` field of a recorded fetch request, asserting that it is
 * a record.
 *
 * @param callIndex - Which recorded call to inspect (defaults to the first).
 */
function requireFetchInit(callIndex = 0): Record<string, unknown> {
  const { init } = requireFetchRequest(callIndex);
  return requireRecord(init, "fetch init");
}
193
+
194
/**
 * Returns the `headers` field of a recorded fetch init, asserting that it is
 * a record.
 *
 * @param callIndex - Which recorded call to inspect (defaults to the first).
 */
function requireFetchHeaders(callIndex = 0): Record<string, unknown> {
  const { headers } = requireFetchInit(callIndex);
  return requireRecord(headers, "fetch headers");
}
197
+
198
/**
 * Parses the `body` of a recorded fetch init as JSON, asserting that the body
 * is a string and that the parsed value is a record.
 *
 * @param callIndex - Which recorded call to inspect (defaults to the first).
 */
function requireFetchJsonBody(callIndex = 0): Record<string, unknown> {
  const { body } = requireFetchInit(callIndex);
  expect(typeof body, "fetch body must be a JSON string").toBe("string");
  const parsed: unknown = JSON.parse(body as string);
  return requireRecord(parsed, "fetch JSON body");
}
203
+
204
/**
 * Returns the `session` payload of the event at `index` among those sent on
 * the fake socket, asserting that it is a record.
 *
 * @param socket - Fake socket to inspect.
 * @param index - Position of the sent event (defaults to the first).
 */
function requireSession(socket: FakeWebSocketInstance, index = 0): Record<string, unknown> {
  const event = parseSent(socket)[index];
  return requireRecord(event?.session, "session");
}
207
+
208
/**
 * Reports whether any event sent on the fake socket has the given `type`.
 *
 * @param socket - Fake socket to inspect.
 * @param type - Event type to look for.
 */
function hasSentEventType(socket: FakeWebSocketInstance, type: string): boolean {
  // All payloads are parsed up front by parseSent before any comparison runs.
  for (const event of parseSent(socket)) {
    if (event.type === type) {
      return true;
    }
  }
  return false;
}
211
+
212
+ describe("buildOpenAIRealtimeVoiceProvider", () => {
213
+ beforeEach(() => {
214
+ FakeWebSocket.instances = [];
215
+ vi.stubEnv("OPENAI_API_KEY", "");
216
+ execFileSyncMock.mockReset();
217
+ fetchWithSsrFGuardMock.mockReset();
218
+ isProviderAuthProfileConfiguredMock.mockReset();
219
+ isProviderAuthProfileConfiguredMock.mockReturnValue(false);
220
+ resolveProviderAuthProfileApiKeyMock.mockReset();
221
+ resolveProviderAuthProfileApiKeyMock.mockResolvedValue(undefined);
222
+ });
223
+
224
+ afterEach(() => {
225
+ vi.useRealTimers();
226
+ vi.unstubAllEnvs();
227
+ });
228
+
229
+ it("declares realtime Talk capabilities for catalog selection", () => {
230
+ const provider = buildOpenAIRealtimeVoiceProvider();
231
+
232
+ expect(provider.defaultModel).toBe("gpt-realtime-2");
233
+ expect(provider.capabilities).toEqual({
234
+ transports: ["webrtc", "gateway-relay"],
235
+ inputAudioFormats: [
236
+ { encoding: "g711_ulaw", sampleRateHz: 8000, channels: 1 },
237
+ { encoding: "pcm16", sampleRateHz: 24000, channels: 1 },
238
+ ],
239
+ outputAudioFormats: [
240
+ { encoding: "g711_ulaw", sampleRateHz: 8000, channels: 1 },
241
+ { encoding: "pcm16", sampleRateHz: 24000, channels: 1 },
242
+ ],
243
+ supportsBrowserSession: true,
244
+ supportsBargeIn: true,
245
+ supportsToolCalls: true,
246
+ });
247
+ });
248
+
249
+ it("advertises continuing realtime tool results", () => {
250
+ const provider = buildOpenAIRealtimeVoiceProvider();
251
+ const bridge = provider.createBridge({
252
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
253
+ onAudio: vi.fn(),
254
+ onClearAudio: vi.fn(),
255
+ });
256
+
257
+ expect(bridge.supportsToolResultContinuation).toBe(true);
258
+ });
259
+
260
+ it("adds OpenClaw attribution headers to native realtime websocket requests", () => {
261
+ vi.stubEnv("OPENCLAW_VERSION", "2026.3.22");
262
+ const provider = buildOpenAIRealtimeVoiceProvider();
263
+ const bridge = provider.createBridge({
264
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
265
+ onAudio: vi.fn(),
266
+ onClearAudio: vi.fn(),
267
+ });
268
+
269
+ void bridge.connect();
270
+ bridge.close();
271
+
272
+ const socket = FakeWebSocket.instances[0];
273
+ const options = socket?.args[1] as { headers?: Record<string, string> } | undefined;
274
+ expectRecordFields(options?.headers, "websocket headers", {
275
+ originator: "openclaw",
276
+ version: "2026.3.22",
277
+ "User-Agent": "openclaw/2026.3.22",
278
+ });
279
+ expect(options?.headers).not.toHaveProperty("OpenAI-Beta");
280
+ });
281
+
282
+ it("mints an ephemeral Realtime secret for native websocket bridges when using Codex OAuth", async () => {
283
+ resolveProviderAuthProfileApiKeyMock.mockResolvedValueOnce("oauth-token");
284
+ fetchWithSsrFGuardMock.mockResolvedValueOnce({
285
+ response: createJsonResponse({
286
+ client_secret: { value: "ephemeral-realtime-secret" },
287
+ }),
288
+ release: vi.fn(async () => undefined),
289
+ });
290
+ const provider = buildOpenAIRealtimeVoiceProvider();
291
+ const bridge = provider.createBridge({
292
+ cfg: {} as never,
293
+ providerConfig: { model: "gpt-realtime-2" },
294
+ onAudio: vi.fn(),
295
+ onClearAudio: vi.fn(),
296
+ });
297
+
298
+ void bridge.connect();
299
+ await vi.waitFor(() => expect(FakeWebSocket.instances.length).toBe(1));
300
+ bridge.close();
301
+
302
+ expect(resolveProviderAuthProfileApiKeyMock).toHaveBeenCalledWith({
303
+ provider: "openai-codex",
304
+ cfg: {},
305
+ });
306
+ const request = requireFetchRequest();
307
+ expectRecordFields(request, "fetch request", {
308
+ url: "https://api.openai.com/v1/realtime/client_secrets",
309
+ auditContext: "openai-realtime-bridge-session",
310
+ });
311
+ expectRecordFields(requireFetchInit(), "fetch init", { method: "POST" });
312
+ expectRecordFields(requireFetchHeaders(), "fetch headers", {
313
+ Authorization: "Bearer oauth-token", // pragma: allowlist secret
314
+ "Content-Type": "application/json",
315
+ });
316
+ const body = requireFetchJsonBody();
317
+ const bodySession = requireRecord(body.session, "fetch session");
318
+ expectRecordFields(bodySession, "fetch session", {
319
+ type: "realtime",
320
+ model: "gpt-realtime-2",
321
+ });
322
+ expectRecordFields(
323
+ requireNestedRecord(bodySession, ["audio", "output"]),
324
+ "fetch session output",
325
+ {
326
+ voice: "alloy",
327
+ },
328
+ );
329
+ const socket = FakeWebSocket.instances[0];
330
+ const options = socket?.args[1] as { headers?: Record<string, string> } | undefined;
331
+ expect(options?.headers?.Authorization).toBe("Bearer ephemeral-realtime-secret");
332
+ expect(options?.headers).not.toHaveProperty("OpenAI-Beta");
333
+ });
334
+
335
+ it("does not fall back to Codex OAuth for custom realtime endpoints", async () => {
336
+ resolveProviderAuthProfileApiKeyMock.mockResolvedValueOnce("oauth-token");
337
+ const provider = buildOpenAIRealtimeVoiceProvider();
338
+ const bridge = provider.createBridge({
339
+ cfg: {} as never,
340
+ providerConfig: {
341
+ azureEndpoint: "https://example.openai.azure.com",
342
+ model: "gpt-realtime-2",
343
+ },
344
+ onAudio: vi.fn(),
345
+ onClearAudio: vi.fn(),
346
+ });
347
+
348
+ await expect(bridge.connect()).rejects.toThrow("OpenAI API key missing");
349
+
350
+ expect(resolveProviderAuthProfileApiKeyMock).not.toHaveBeenCalled();
351
+ expect(fetchWithSsrFGuardMock).not.toHaveBeenCalled();
352
+ expect(FakeWebSocket.instances).toHaveLength(0);
353
+ });
354
+
355
+ it("does not open a native websocket after slow OAuth resolution times out", async () => {
356
+ vi.useFakeTimers();
357
+ resolveProviderAuthProfileApiKeyMock.mockResolvedValueOnce("oauth-token");
358
+ let resolveClientSecret: (value: {
359
+ response: Response;
360
+ release: () => Promise<void>;
361
+ }) => void = () => {};
362
+ fetchWithSsrFGuardMock.mockReturnValueOnce(
363
+ new Promise((resolve) => {
364
+ resolveClientSecret = resolve;
365
+ }),
366
+ );
367
+ const provider = buildOpenAIRealtimeVoiceProvider();
368
+ const bridge = provider.createBridge({
369
+ cfg: {} as never,
370
+ providerConfig: { model: "gpt-realtime-2" },
371
+ onAudio: vi.fn(),
372
+ onClearAudio: vi.fn(),
373
+ });
374
+
375
+ const connecting = expect(bridge.connect()).rejects.toThrow(
376
+ "OpenAI realtime connection timeout",
377
+ );
378
+ await vi.advanceTimersByTimeAsync(10_000);
379
+ await connecting;
380
+
381
+ resolveClientSecret({
382
+ response: createJsonResponse({
383
+ client_secret: { value: "ephemeral-realtime-secret" },
384
+ }),
385
+ release: vi.fn(async () => undefined),
386
+ });
387
+ await vi.runAllTimersAsync();
388
+
389
+ expect(FakeWebSocket.instances).toHaveLength(0);
390
+ bridge.close();
391
+ });
392
+
393
+ it("returns browser-safe OpenClaw attribution headers for native WebRTC offers", async () => {
394
+ vi.stubEnv("OPENCLAW_VERSION", "2026.3.22");
395
+ fetchWithSsrFGuardMock.mockResolvedValueOnce({
396
+ response: createJsonResponse({
397
+ client_secret: { value: "client-secret-123" },
398
+ expires_at: 1_765_000_000,
399
+ }),
400
+ release: vi.fn(async () => undefined),
401
+ });
402
+ const provider = buildOpenAIRealtimeVoiceProvider();
403
+ if (!provider.createBrowserSession) {
404
+ throw new Error("expected OpenAI realtime provider to support browser sessions");
405
+ }
406
+
407
+ const session = await provider.createBrowserSession({
408
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
409
+ instructions: "Be concise.",
410
+ voice: " Marin ",
411
+ });
412
+
413
+ expectRecordFields(requireFetchRequest(), "fetch request", {
414
+ url: "https://api.openai.com/v1/realtime/client_secrets",
415
+ });
416
+ expectRecordFields(requireFetchInit(), "fetch init", { method: "POST" });
417
+ expectRecordFields(requireFetchHeaders(), "fetch headers", {
418
+ Authorization: "Bearer sk-test", // pragma: allowlist secret
419
+ "Content-Type": "application/json",
420
+ originator: "openclaw",
421
+ version: "2026.3.22",
422
+ "User-Agent": "openclaw/2026.3.22",
423
+ });
424
+ const body = requireFetchJsonBody();
425
+ const bodySession = requireRecord(body.session, "fetch session");
426
+ expect(bodySession.model).toBe("gpt-realtime-2");
427
+ expect(requireNestedRecord(bodySession, ["audio", "input"])).toEqual({
428
+ noise_reduction: { type: "near_field" },
429
+ turn_detection: {
430
+ type: "server_vad",
431
+ create_response: true,
432
+ interrupt_response: true,
433
+ },
434
+ transcription: { model: "gpt-4o-mini-transcribe" },
435
+ });
436
+ expect(requireNestedRecord(bodySession, ["audio", "output"])).toEqual({ voice: "marin" });
437
+ expect(bodySession).not.toHaveProperty("temperature");
438
+ expectRecordFields(session, "browser session", {
439
+ provider: "openai",
440
+ transport: "webrtc",
441
+ clientSecret: "client-secret-123",
442
+ offerUrl: "https://api.openai.com/v1/realtime/calls",
443
+ model: "gpt-realtime-2",
444
+ });
445
+ // originator, version, and User-Agent are server-side attribution headers; they
446
+ // must not be forwarded to the browser so that the browser's direct SDP POST to
447
+ // api.openai.com passes the CORS preflight (only authorization,content-type
448
+ // allowed — #76435). All three are filtered, leaving no browser offer headers.
449
+ expect((session as { offerHeaders?: Record<string, string> }).offerHeaders).toBeUndefined();
450
+ });
451
+
452
+ it("resolves keychain OPENAI_API_KEY refs before creating browser sessions", async () => {
453
+ vi.stubEnv("OPENAI_API_KEY", "keychain:openclaw:OPENAI_REALTIME_BROWSER_TEST");
454
+ execFileSyncMock.mockReturnValueOnce("sk-browser-env\n"); // pragma: allowlist secret
455
+ fetchWithSsrFGuardMock.mockResolvedValueOnce({
456
+ response: createJsonResponse({
457
+ client_secret: { value: "client-secret-123" },
458
+ }),
459
+ release: vi.fn(async () => undefined),
460
+ });
461
+ const provider = buildOpenAIRealtimeVoiceProvider();
462
+ if (!provider.createBrowserSession) {
463
+ throw new Error("expected OpenAI realtime provider to support browser sessions");
464
+ }
465
+
466
+ await provider.createBrowserSession({
467
+ providerConfig: {},
468
+ instructions: "Be concise.",
469
+ });
470
+
471
+ const [securityBinary, securityArgs, securityOptions] = firstMockCall(
472
+ execFileSyncMock,
473
+ "security keychain lookup",
474
+ );
475
+ expect(securityBinary).toBe("/usr/bin/security");
476
+ expect(securityArgs).toEqual([
477
+ "find-generic-password",
478
+ "-s",
479
+ "openclaw",
480
+ "-a",
481
+ "OPENAI_REALTIME_BROWSER_TEST",
482
+ "-w",
483
+ ]);
484
+ expectRecordFields(securityOptions, "security command options", {
485
+ encoding: "utf8",
486
+ timeout: 5000,
487
+ });
488
+ expectRecordFields(requireFetchHeaders(), "fetch headers", {
489
+ Authorization: "Bearer sk-browser-env", // pragma: allowlist secret
490
+ });
491
+ });
492
+
493
+ it("resolves and caches keychain OPENAI_API_KEY refs before creating bridges", () => {
494
+ vi.stubEnv("OPENAI_API_KEY", "keychain:openclaw:OPENAI_REALTIME_BRIDGE_TEST");
495
+ execFileSyncMock.mockReturnValue("sk-bridge-env\n"); // pragma: allowlist secret
496
+ const provider = buildOpenAIRealtimeVoiceProvider();
497
+
498
+ const first = provider.createBridge({
499
+ providerConfig: {},
500
+ onAudio: vi.fn(),
501
+ onClearAudio: vi.fn(),
502
+ });
503
+ const second = provider.createBridge({
504
+ providerConfig: {},
505
+ onAudio: vi.fn(),
506
+ onClearAudio: vi.fn(),
507
+ });
508
+ void first.connect();
509
+ void second.connect();
510
+ first.close();
511
+ second.close();
512
+
513
+ expect(execFileSyncMock).toHaveBeenCalledTimes(1);
514
+ for (const socket of FakeWebSocket.instances) {
515
+ const options = socket.args[1] as { headers?: Record<string, string> } | undefined;
516
+ expectRecordFields(options?.headers, "websocket headers", {
517
+ Authorization: "Bearer sk-bridge-env", // pragma: allowlist secret
518
+ });
519
+ }
520
+ });
521
+
522
+ it("does not resolve keychain refs during configured checks", () => {
523
+ vi.stubEnv("OPENAI_API_KEY", "keychain:openclaw:OPENAI_REALTIME_CONFIGURED_TEST");
524
+ const provider = buildOpenAIRealtimeVoiceProvider();
525
+
526
+ expect(provider.isConfigured({ providerConfig: {} })).toBe(true);
527
+ expect(execFileSyncMock).not.toHaveBeenCalled();
528
+ });
529
+
530
+ it("treats OpenAI Codex OAuth profiles as configured for browser realtime sessions", () => {
531
+ isProviderAuthProfileConfiguredMock.mockReturnValue(true);
532
+ const provider = buildOpenAIRealtimeVoiceProvider();
533
+ const cfg = { agents: { defaults: {} } } as never;
534
+
535
+ expect(provider.isConfigured({ cfg, providerConfig: {} })).toBe(true);
536
+ expect(isProviderAuthProfileConfiguredMock).toHaveBeenCalledWith({
537
+ provider: "openai-codex",
538
+ cfg,
539
+ });
540
+ });
541
+
542
+ it("does not use Codex OAuth to configure Azure realtime sessions", () => {
543
+ isProviderAuthProfileConfiguredMock.mockReturnValue(true);
544
+ const provider = buildOpenAIRealtimeVoiceProvider();
545
+ const cfg = { agents: { defaults: {} } } as never;
546
+
547
+ expect(
548
+ provider.isConfigured({
549
+ cfg,
550
+ providerConfig: {
551
+ azureEndpoint: "https://example.openai.azure.com",
552
+ azureDeployment: "realtime",
553
+ },
554
+ }),
555
+ ).toBe(false);
556
+ expect(isProviderAuthProfileConfiguredMock).not.toHaveBeenCalled();
557
+ });
558
+
559
+ it("uses OpenAI Codex OAuth to mint browser realtime client secrets when no API key is set", async () => {
560
+ resolveProviderAuthProfileApiKeyMock.mockResolvedValueOnce("oauth-realtime-token");
561
+ fetchWithSsrFGuardMock.mockResolvedValueOnce({
562
+ response: createJsonResponse({
563
+ client_secret: { value: "client-secret-123" },
564
+ }),
565
+ release: vi.fn(async () => undefined),
566
+ });
567
+ const provider = buildOpenAIRealtimeVoiceProvider();
568
+ if (!provider.createBrowserSession) {
569
+ throw new Error("expected OpenAI realtime provider to support browser sessions");
570
+ }
571
+ const cfg = { agents: { defaults: {} } } as never;
572
+
573
+ await provider.createBrowserSession({
574
+ cfg,
575
+ providerConfig: {},
576
+ instructions: "Be concise.",
577
+ });
578
+
579
+ expect(resolveProviderAuthProfileApiKeyMock).toHaveBeenCalledWith({
580
+ provider: "openai-codex",
581
+ cfg,
582
+ });
583
+ expectRecordFields(requireFetchHeaders(), "fetch headers", {
584
+ Authorization: "Bearer oauth-realtime-token", // pragma: allowlist secret
585
+ });
586
+ });
587
+
588
+ it("fails closed when keychain refs cannot be resolved", async () => {
589
+ vi.stubEnv("OPENAI_API_KEY", "keychain:openclaw:OPENAI_REALTIME_MISSING_TEST");
590
+ execFileSyncMock.mockImplementationOnce(() => {
591
+ throw new Error("keychain unavailable");
592
+ });
593
+ const provider = buildOpenAIRealtimeVoiceProvider();
594
+
595
+ const bridge = provider.createBridge({
596
+ providerConfig: {},
597
+ onAudio: vi.fn(),
598
+ onClearAudio: vi.fn(),
599
+ });
600
+
601
+ await expect(bridge.connect()).rejects.toThrow("OpenAI API key or Codex OAuth missing");
602
+ });
603
+
604
+ it("normalizes provider-owned voice settings from raw provider config", () => {
605
+ const provider = buildOpenAIRealtimeVoiceProvider();
606
+ const resolved = provider.resolveConfig?.({
607
+ cfg: {} as never,
608
+ rawConfig: {
609
+ providers: {
610
+ openai: {
611
+ model: "gpt-realtime-2",
612
+ voice: " Verse ",
613
+ temperature: 0.6,
614
+ silenceDurationMs: 850,
615
+ vadThreshold: 0.35,
616
+ reasoningEffort: "low",
617
+ },
618
+ },
619
+ },
620
+ });
621
+
622
+ expect(resolved).toEqual({
623
+ model: "gpt-realtime-2",
624
+ voice: "verse",
625
+ temperature: 0.6,
626
+ silenceDurationMs: 850,
627
+ vadThreshold: 0.35,
628
+ reasoningEffort: "low",
629
+ });
630
+ });
631
+
632
+ it("waits for session.updated before draining audio and firing onReady", async () => {
633
+ const provider = buildOpenAIRealtimeVoiceProvider();
634
+ const onReady = vi.fn();
635
+ const bridge = provider.createBridge({
636
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
637
+ instructions: "Be helpful.",
638
+ onAudio: vi.fn(),
639
+ onClearAudio: vi.fn(),
640
+ onReady,
641
+ });
642
+ const connecting = bridge.connect();
643
+ let connectResolved = false;
644
+ void connecting.then(() => {
645
+ connectResolved = true;
646
+ });
647
+ const socket = FakeWebSocket.instances[0];
648
+ if (!socket) {
649
+ throw new Error("expected bridge to create a websocket");
650
+ }
651
+
652
+ socket.readyState = FakeWebSocket.OPEN;
653
+ socket.emit("open");
654
+ await Promise.resolve();
655
+
656
+ bridge.sendAudio(Buffer.from("before-ready"));
657
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "session.created" })));
658
+
659
+ expect(connectResolved).toBe(false);
660
+ expect(onReady).not.toHaveBeenCalled();
661
+ expect(parseSent(socket).map((event) => event.type)).toEqual(["session.update"]);
662
+ const session = requireSession(socket);
663
+ expectRecordFields(session, "session", {
664
+ type: "realtime",
665
+ model: "gpt-realtime-2",
666
+ output_modalities: ["audio"],
667
+ });
668
+ const inputAudio = requireNestedRecord(session, ["audio", "input"]);
669
+ expectRecordFields(inputAudio, "session audio input", {
670
+ format: { type: "audio/pcmu" },
671
+ noise_reduction: null,
672
+ transcription: { model: "gpt-4o-mini-transcribe" },
673
+ });
674
+ expect(requireNestedRecord(session, ["audio", "output"])).toEqual({
675
+ format: { type: "audio/pcmu" },
676
+ voice: "alloy",
677
+ });
678
+ expect(session).not.toHaveProperty("temperature");
679
+ expect(bridge.isConnected()).toBe(false);
680
+
681
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "session.updated" })));
682
+ await connecting;
683
+
684
+ expect(connectResolved).toBe(true);
685
+ expect(onReady).toHaveBeenCalledTimes(1);
686
+ expect(parseSent(socket).map((event) => event.type)).toEqual([
687
+ "session.update",
688
+ "input_audio_buffer.append",
689
+ ]);
690
+ expect(bridge.isConnected()).toBe(true);
691
+ });
692
+
693
+ it("keeps Azure deployment bridges on deployment-compatible session payloads", async () => {
694
+ const provider = buildOpenAIRealtimeVoiceProvider();
695
+ const bridge = provider.createBridge({
696
+ providerConfig: {
697
+ apiKey: "sk-test", // pragma: allowlist secret
698
+ azureEndpoint: "https://example.openai.azure.com/",
699
+ azureDeployment: "realtime-prod",
700
+ azureApiVersion: "2024-10-01-preview",
701
+ voice: "verse",
702
+ },
703
+ audioFormat: REALTIME_VOICE_AUDIO_FORMAT_PCM16_24KHZ,
704
+ instructions: "Be helpful.",
705
+ onAudio: vi.fn(),
706
+ onClearAudio: vi.fn(),
707
+ });
708
+ const connecting = bridge.connect();
709
+ const socket = FakeWebSocket.instances[0];
710
+ if (!socket) {
711
+ throw new Error("expected bridge to create a websocket");
712
+ }
713
+
714
+ expect(socket.args[0]).toBe(
715
+ "wss://example.openai.azure.com/openai/realtime?api-version=2024-10-01-preview&deployment=realtime-prod",
716
+ );
717
+
718
+ socket.readyState = FakeWebSocket.OPEN;
719
+ socket.emit("open");
720
+ await Promise.resolve();
721
+
722
+ const session = requireSession(socket);
723
+ expectRecordFields(session, "session", {
724
+ modalities: ["text", "audio"],
725
+ instructions: "Be helpful.",
726
+ voice: "verse",
727
+ input_audio_format: "pcm16",
728
+ output_audio_format: "pcm16",
729
+ input_audio_transcription: { model: "whisper-1" },
730
+ temperature: 0.8,
731
+ });
732
+ expectRecordFields(
733
+ requireRecord(session.turn_detection, "session turn detection"),
734
+ "turn detection",
735
+ {
736
+ create_response: true,
737
+ },
738
+ );
739
+ expect(session).not.toHaveProperty("type");
740
+ expect(session).not.toHaveProperty("audio");
741
+
742
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "session.updated" })));
743
+ await connecting;
744
+ });
745
+
746
+ it("rejects connection when session configuration fails before readiness", async () => {
747
+ const provider = buildOpenAIRealtimeVoiceProvider();
748
+ const bridge = provider.createBridge({
749
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
750
+ onAudio: vi.fn(),
751
+ onClearAudio: vi.fn(),
752
+ });
753
+ const connecting = bridge.connect();
754
+ const socket = FakeWebSocket.instances[0];
755
+ if (!socket) {
756
+ throw new Error("expected bridge to create a websocket");
757
+ }
758
+
759
+ socket.readyState = FakeWebSocket.OPEN;
760
+ socket.emit("open");
761
+ socket.emit(
762
+ "message",
763
+ Buffer.from(
764
+ JSON.stringify({
765
+ type: "error",
766
+ error: { message: "invalid realtime session" },
767
+ }),
768
+ ),
769
+ );
770
+
771
+ await expect(connecting).rejects.toThrow("invalid realtime session");
772
+ expect(bridge.isConnected()).toBe(false);
773
+ });
774
+
775
+ it("treats pre-ready auth errors as a single startup failure", async () => {
776
+ const provider = buildOpenAIRealtimeVoiceProvider();
777
+ const onError = vi.fn();
778
+ const bridge = provider.createBridge({
779
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
780
+ onAudio: vi.fn(),
781
+ onClearAudio: vi.fn(),
782
+ onError,
783
+ });
784
+ const connecting = bridge.connect();
785
+ const socket = FakeWebSocket.instances[0];
786
+ if (!socket) {
787
+ throw new Error("expected bridge to create a websocket");
788
+ }
789
+
790
+ socket.readyState = FakeWebSocket.OPEN;
791
+ socket.emit("open");
792
+ socket.emit(
793
+ "message",
794
+ Buffer.from(
795
+ JSON.stringify({
796
+ type: "error",
797
+ error: { message: "Incorrect API key provided" },
798
+ }),
799
+ ),
800
+ );
801
+ socket.emit(
802
+ "message",
803
+ Buffer.from(
804
+ JSON.stringify({
805
+ type: "error",
806
+ error: { message: "Incorrect API key provided" },
807
+ }),
808
+ ),
809
+ );
810
+
811
+ await expect(connecting).rejects.toThrow("Incorrect API key provided");
812
+ expect(onError).not.toHaveBeenCalled();
813
+ expect(socket.closed).toBe(true);
814
+ expect(bridge.isConnected()).toBe(false);
815
+ });
816
+
817
+ it("rejects connection when the socket closes before session readiness", async () => {
818
+ const provider = buildOpenAIRealtimeVoiceProvider();
819
+ const bridge = provider.createBridge({
820
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
821
+ onAudio: vi.fn(),
822
+ onClearAudio: vi.fn(),
823
+ });
824
+ const connecting = bridge.connect();
825
+ const socket = FakeWebSocket.instances[0];
826
+ if (!socket) {
827
+ throw new Error("expected bridge to create a websocket");
828
+ }
829
+
830
+ socket.readyState = FakeWebSocket.OPEN;
831
+ socket.emit("open");
832
+ socket.close(1006, "session closed");
833
+
834
+ await expect(connecting).rejects.toThrow("OpenAI realtime connection closed before ready");
835
+ expect(bridge.isConnected()).toBe(false);
836
+ });
837
+
838
+ it("can disable automatic audio turn responses for agent-routed voice loops", async () => {
839
+ const provider = buildOpenAIRealtimeVoiceProvider();
840
+ const bridge = provider.createBridge({
841
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
842
+ autoRespondToAudio: false,
843
+ onAudio: vi.fn(),
844
+ onClearAudio: vi.fn(),
845
+ });
846
+ const connecting = bridge.connect();
847
+ const socket = FakeWebSocket.instances[0];
848
+ if (!socket) {
849
+ throw new Error("expected bridge to create a websocket");
850
+ }
851
+
852
+ socket.readyState = FakeWebSocket.OPEN;
853
+ socket.emit("open");
854
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "session.updated" })));
855
+ await connecting;
856
+
857
+ expectRecordFields(
858
+ requireNestedRecord(requireSession(socket), ["audio", "input", "turn_detection"]),
859
+ "turn detection",
860
+ {
861
+ create_response: false,
862
+ interrupt_response: false,
863
+ },
864
+ );
865
+ });
866
+
867
+ it("can disable realtime response interruption while keeping audio responses enabled", async () => {
868
+ const provider = buildOpenAIRealtimeVoiceProvider();
869
+ const bridge = provider.createBridge({
870
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
871
+ autoRespondToAudio: true,
872
+ interruptResponseOnInputAudio: false,
873
+ onAudio: vi.fn(),
874
+ onClearAudio: vi.fn(),
875
+ });
876
+ const connecting = bridge.connect();
877
+ const socket = FakeWebSocket.instances[0];
878
+ if (!socket) {
879
+ throw new Error("expected bridge to create a websocket");
880
+ }
881
+
882
+ socket.readyState = FakeWebSocket.OPEN;
883
+ socket.emit("open");
884
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "session.updated" })));
885
+ await connecting;
886
+
887
+ expectRecordFields(
888
+ requireNestedRecord(requireSession(socket), ["audio", "input", "turn_detection"]),
889
+ "turn detection",
890
+ {
891
+ create_response: true,
892
+ interrupt_response: false,
893
+ },
894
+ );
895
+ });
896
+
897
+ it("does not locally clear playback on speech-start events when input interruption is disabled", async () => {
898
+ const provider = buildOpenAIRealtimeVoiceProvider();
899
+ const onAudio = vi.fn();
900
+ const onClearAudio = vi.fn();
901
+ const bridge = provider.createBridge({
902
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
903
+ autoRespondToAudio: true,
904
+ interruptResponseOnInputAudio: false,
905
+ onAudio,
906
+ onClearAudio,
907
+ });
908
+ const connecting = bridge.connect();
909
+ const socket = FakeWebSocket.instances[0];
910
+ if (!socket) {
911
+ throw new Error("expected bridge to create a websocket");
912
+ }
913
+
914
+ socket.readyState = FakeWebSocket.OPEN;
915
+ socket.emit("open");
916
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "session.updated" })));
917
+ await connecting;
918
+
919
+ socket.emit(
920
+ "message",
921
+ Buffer.from(JSON.stringify({ type: "response.created", response: { id: "resp_1" } })),
922
+ );
923
+ socket.emit(
924
+ "message",
925
+ Buffer.from(
926
+ JSON.stringify({
927
+ type: "response.audio.delta",
928
+ item_id: "item_1",
929
+ delta: Buffer.from("assistant audio").toString("base64"),
930
+ }),
931
+ ),
932
+ );
933
+ socket.emit(
934
+ "message",
935
+ Buffer.from(JSON.stringify({ type: "input_audio_buffer.speech_started" })),
936
+ );
937
+
938
+ expect(onAudio).toHaveBeenCalledTimes(1);
939
+ expect(onClearAudio).not.toHaveBeenCalled();
940
+ expect(hasSentEventType(socket, "response.cancel")).toBe(false);
941
+ expect(hasSentEventType(socket, "conversation.item.truncate")).toBe(false);
942
+ });
943
+
944
+ it("keeps assistant playback active on server VAD when automatic audio responses are disabled", async () => {
945
+ const provider = buildOpenAIRealtimeVoiceProvider();
946
+ const onAudio = vi.fn();
947
+ const onClearAudio = vi.fn();
948
+ const bridge = provider.createBridge({
949
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
950
+ autoRespondToAudio: false,
951
+ onAudio,
952
+ onClearAudio,
953
+ });
954
+ const connecting = bridge.connect();
955
+ const socket = FakeWebSocket.instances[0];
956
+ if (!socket) {
957
+ throw new Error("expected bridge to create a websocket");
958
+ }
959
+
960
+ socket.readyState = FakeWebSocket.OPEN;
961
+ socket.emit("open");
962
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "session.updated" })));
963
+ await connecting;
964
+
965
+ socket.emit(
966
+ "message",
967
+ Buffer.from(JSON.stringify({ type: "response.created", response: { id: "resp_1" } })),
968
+ );
969
+ socket.emit(
970
+ "message",
971
+ Buffer.from(
972
+ JSON.stringify({
973
+ type: "response.audio.delta",
974
+ item_id: "item_1",
975
+ delta: Buffer.from("assistant audio").toString("base64"),
976
+ }),
977
+ ),
978
+ );
979
+ socket.emit(
980
+ "message",
981
+ Buffer.from(JSON.stringify({ type: "input_audio_buffer.speech_started" })),
982
+ );
983
+
984
+ expect(onAudio).toHaveBeenCalledTimes(1);
985
+ expect(onClearAudio).not.toHaveBeenCalled();
986
+ expect(hasSentEventType(socket, "response.cancel")).toBe(false);
987
+ expect(hasSentEventType(socket, "conversation.item.truncate")).toBe(false);
988
+ });
989
+
990
+ it("can request PCM16 24 kHz realtime audio for Chrome command-pair bridges", async () => {
991
+ const provider = buildOpenAIRealtimeVoiceProvider();
992
+ const bridge = provider.createBridge({
993
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
994
+ audioFormat: REALTIME_VOICE_AUDIO_FORMAT_PCM16_24KHZ,
995
+ onAudio: vi.fn(),
996
+ onClearAudio: vi.fn(),
997
+ });
998
+
999
+ const connecting = bridge.connect();
1000
+ const socket = FakeWebSocket.instances[0];
1001
+ if (!socket) {
1002
+ throw new Error("expected bridge to create a websocket");
1003
+ }
1004
+
1005
+ socket.readyState = FakeWebSocket.OPEN;
1006
+ socket.emit("open");
1007
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "session.updated" })));
1008
+ await connecting;
1009
+
1010
+ const session = requireSession(socket);
1011
+ expect(requireNestedRecord(session, ["audio", "input", "format"])).toEqual({
1012
+ type: "audio/pcm",
1013
+ rate: 24000,
1014
+ });
1015
+ expect(requireNestedRecord(session, ["audio", "output", "format"])).toEqual({
1016
+ type: "audio/pcm",
1017
+ rate: 24000,
1018
+ });
1019
+ });
1020
+
1021
+ it("settles cleanly when closed before the websocket opens", async () => {
1022
+ const provider = buildOpenAIRealtimeVoiceProvider();
1023
+ const onClose = vi.fn();
1024
+ const bridge = provider.createBridge({
1025
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
1026
+ onAudio: vi.fn(),
1027
+ onClearAudio: vi.fn(),
1028
+ onClose,
1029
+ });
1030
+ const connecting = bridge.connect();
1031
+ const socket = FakeWebSocket.instances[0];
1032
+ if (!socket) {
1033
+ throw new Error("expected bridge to create a websocket");
1034
+ }
1035
+
1036
+ bridge.close();
1037
+
1038
+ await expect(connecting).resolves.toBeUndefined();
1039
+ expect(socket.closed).toBe(true);
1040
+ expect(socket.terminated).toBe(false);
1041
+ expect(onClose).toHaveBeenCalledWith("completed");
1042
+ });
1043
+
1044
+ it("truncates externally interrupted playback after an immediate mark acknowledgement", async () => {
1045
+ const provider = buildOpenAIRealtimeVoiceProvider();
1046
+ const onAudio = vi.fn();
1047
+ const onClearAudio = vi.fn();
1048
+ let bridge: ReturnType<typeof provider.createBridge>;
1049
+ bridge = provider.createBridge({
1050
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
1051
+ onAudio,
1052
+ onClearAudio,
1053
+ onMark: () => bridge.acknowledgeMark(),
1054
+ });
1055
+ const connecting = bridge.connect();
1056
+ const socket = FakeWebSocket.instances[0];
1057
+ if (!socket) {
1058
+ throw new Error("expected bridge to create a websocket");
1059
+ }
1060
+
1061
+ socket.readyState = FakeWebSocket.OPEN;
1062
+ socket.emit("open");
1063
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "session.updated" })));
1064
+ await connecting;
1065
+
1066
+ bridge.setMediaTimestamp(1000);
1067
+ socket.emit(
1068
+ "message",
1069
+ Buffer.from(JSON.stringify({ type: "response.created", response: { id: "resp_1" } })),
1070
+ );
1071
+ socket.emit(
1072
+ "message",
1073
+ Buffer.from(
1074
+ JSON.stringify({
1075
+ type: "response.audio.delta",
1076
+ item_id: "item_1",
1077
+ delta: Buffer.from("assistant audio").toString("base64"),
1078
+ }),
1079
+ ),
1080
+ );
1081
+ bridge.setMediaTimestamp(1300);
1082
+
1083
+ bridge.handleBargeIn?.({ audioPlaybackActive: true });
1084
+
1085
+ expect(onAudio).toHaveBeenCalledTimes(1);
1086
+ expect(onClearAudio).toHaveBeenCalledTimes(1);
1087
+ expect(parseSent(socket).slice(-2)).toEqual([
1088
+ { type: "response.cancel" },
1089
+ {
1090
+ type: "conversation.item.truncate",
1091
+ item_id: "item_1",
1092
+ content_index: 0,
1093
+ audio_end_ms: 300,
1094
+ },
1095
+ ]);
1096
+ });
1097
+
1098
+ it("forwards current realtime output audio events", async () => {
1099
+ const provider = buildOpenAIRealtimeVoiceProvider();
1100
+ const onAudio = vi.fn();
1101
+ const onTranscript = vi.fn();
1102
+ const bridge = provider.createBridge({
1103
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
1104
+ onAudio,
1105
+ onClearAudio: vi.fn(),
1106
+ onTranscript,
1107
+ });
1108
+ const connecting = bridge.connect();
1109
+ const socket = FakeWebSocket.instances[0];
1110
+ if (!socket) {
1111
+ throw new Error("expected bridge to create a websocket");
1112
+ }
1113
+
1114
+ socket.readyState = FakeWebSocket.OPEN;
1115
+ socket.emit("open");
1116
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "session.updated" })));
1117
+ await connecting;
1118
+
1119
+ const audio = Buffer.from("assistant audio");
1120
+ socket.emit(
1121
+ "message",
1122
+ Buffer.from(
1123
+ JSON.stringify({
1124
+ type: "response.output_audio.delta",
1125
+ item_id: "item_1",
1126
+ delta: audio.toString("base64"),
1127
+ }),
1128
+ ),
1129
+ );
1130
+ socket.emit(
1131
+ "message",
1132
+ Buffer.from(
1133
+ JSON.stringify({
1134
+ type: "response.output_audio_transcript.done",
1135
+ transcript: "hello from current realtime events",
1136
+ }),
1137
+ ),
1138
+ );
1139
+
1140
+ expect(onAudio).toHaveBeenCalledWith(audio);
1141
+ expect(onTranscript).toHaveBeenCalledWith(
1142
+ "assistant",
1143
+ "hello from current realtime events",
1144
+ true,
1145
+ );
1146
+ });
1147
+
1148
+ it("forwards Codex-compatible legacy realtime audio and transcript events", async () => {
1149
+ const provider = buildOpenAIRealtimeVoiceProvider();
1150
+ const onAudio = vi.fn();
1151
+ const onTranscript = vi.fn();
1152
+ const bridge = provider.createBridge({
1153
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
1154
+ onAudio,
1155
+ onClearAudio: vi.fn(),
1156
+ onTranscript,
1157
+ });
1158
+ const connecting = bridge.connect();
1159
+ const socket = FakeWebSocket.instances[0];
1160
+ if (!socket) {
1161
+ throw new Error("expected bridge to create a websocket");
1162
+ }
1163
+
1164
+ socket.readyState = FakeWebSocket.OPEN;
1165
+ socket.emit("open");
1166
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "session.updated" })));
1167
+ await connecting;
1168
+
1169
+ const audio = Buffer.from("legacy assistant audio");
1170
+ socket.emit(
1171
+ "message",
1172
+ Buffer.from(
1173
+ JSON.stringify({
1174
+ type: "conversation.output_audio.delta",
1175
+ data: audio.toString("base64"),
1176
+ sample_rate: 24000,
1177
+ channels: 1,
1178
+ }),
1179
+ ),
1180
+ );
1181
+ socket.emit(
1182
+ "message",
1183
+ Buffer.from(
1184
+ JSON.stringify({
1185
+ type: "conversation.input_transcript.delta",
1186
+ delta: "partial user",
1187
+ }),
1188
+ ),
1189
+ );
1190
+ socket.emit(
1191
+ "message",
1192
+ Buffer.from(
1193
+ JSON.stringify({
1194
+ type: "conversation.output_transcript.delta",
1195
+ delta: "partial assistant",
1196
+ }),
1197
+ ),
1198
+ );
1199
+ socket.emit(
1200
+ "message",
1201
+ Buffer.from(
1202
+ JSON.stringify({
1203
+ type: "response.output_text.done",
1204
+ text: "final assistant text",
1205
+ }),
1206
+ ),
1207
+ );
1208
+
1209
+ expect(onAudio).toHaveBeenCalledWith(audio);
1210
+ expect(onTranscript).toHaveBeenCalledWith("user", "partial user", false);
1211
+ expect(onTranscript).toHaveBeenCalledWith("assistant", "partial assistant", false);
1212
+ expect(onTranscript).toHaveBeenCalledWith("assistant", "final assistant text", true);
1213
+ });
1214
+
1215
+ it("emits tool calls from realtime conversation item done events", async () => {
1216
+ const provider = buildOpenAIRealtimeVoiceProvider();
1217
+ const onToolCall = vi.fn();
1218
+ const onEvent = vi.fn();
1219
+ const bridge = provider.createBridge({
1220
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
1221
+ onAudio: vi.fn(),
1222
+ onClearAudio: vi.fn(),
1223
+ onToolCall,
1224
+ onEvent,
1225
+ });
1226
+ const connecting = bridge.connect();
1227
+ const socket = FakeWebSocket.instances[0];
1228
+ if (!socket) {
1229
+ throw new Error("expected bridge to create a websocket");
1230
+ }
1231
+
1232
+ socket.readyState = FakeWebSocket.OPEN;
1233
+ socket.emit("open");
1234
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "session.updated" })));
1235
+ await connecting;
1236
+
1237
+ socket.emit(
1238
+ "message",
1239
+ Buffer.from(
1240
+ JSON.stringify({
1241
+ type: "conversation.item.done",
1242
+ item: {
1243
+ id: "item_tool_1",
1244
+ type: "function_call",
1245
+ name: "openclaw_agent_consult",
1246
+ call_id: "call_1",
1247
+ arguments: JSON.stringify({ question: "delegate this" }),
1248
+ },
1249
+ }),
1250
+ ),
1251
+ );
1252
+
1253
+ expect(onToolCall).toHaveBeenCalledWith({
1254
+ itemId: "item_tool_1",
1255
+ callId: "call_1",
1256
+ name: "openclaw_agent_consult",
1257
+ args: { question: "delegate this" },
1258
+ });
1259
+ expect(onEvent).toHaveBeenCalledWith({
1260
+ direction: "server",
1261
+ type: "conversation.item.done",
1262
+ detail: "function_call name=openclaw_agent_consult",
1263
+ });
1264
+ });
1265
+
1266
+ it("deduplicates tool calls reported by arguments done and item done events", async () => {
1267
+ const provider = buildOpenAIRealtimeVoiceProvider();
1268
+ const onToolCall = vi.fn();
1269
+ const bridge = provider.createBridge({
1270
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
1271
+ onAudio: vi.fn(),
1272
+ onClearAudio: vi.fn(),
1273
+ onToolCall,
1274
+ });
1275
+ const connecting = bridge.connect();
1276
+ const socket = FakeWebSocket.instances[0];
1277
+ if (!socket) {
1278
+ throw new Error("expected bridge to create a websocket");
1279
+ }
1280
+
1281
+ socket.readyState = FakeWebSocket.OPEN;
1282
+ socket.emit("open");
1283
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "session.updated" })));
1284
+ await connecting;
1285
+
1286
+ socket.emit(
1287
+ "message",
1288
+ Buffer.from(
1289
+ JSON.stringify({
1290
+ type: "response.function_call_arguments.delta",
1291
+ item_id: "item_tool_1",
1292
+ name: "openclaw_agent_consult",
1293
+ call_id: "call_1",
1294
+ delta: JSON.stringify({ question: "delegate this" }),
1295
+ }),
1296
+ ),
1297
+ );
1298
+ socket.emit(
1299
+ "message",
1300
+ Buffer.from(
1301
+ JSON.stringify({
1302
+ type: "response.function_call_arguments.done",
1303
+ item_id: "item_tool_1",
1304
+ name: "openclaw_agent_consult",
1305
+ call_id: "call_1",
1306
+ }),
1307
+ ),
1308
+ );
1309
+ socket.emit(
1310
+ "message",
1311
+ Buffer.from(
1312
+ JSON.stringify({
1313
+ type: "conversation.item.done",
1314
+ item: {
1315
+ id: "item_tool_1",
1316
+ type: "function_call",
1317
+ name: "openclaw_agent_consult",
1318
+ call_id: "call_1",
1319
+ arguments: JSON.stringify({ question: "delegate this" }),
1320
+ },
1321
+ }),
1322
+ ),
1323
+ );
1324
+
1325
+ expect(onToolCall).toHaveBeenCalledTimes(1);
1326
+ expect(onToolCall).toHaveBeenCalledWith({
1327
+ itemId: "item_tool_1",
1328
+ callId: "call_1",
1329
+ name: "openclaw_agent_consult",
1330
+ args: { question: "delegate this" },
1331
+ });
1332
+ });
1333
+
1334
+ it("creates an explicit user item and response for manual speech", async () => {
1335
+ const provider = buildOpenAIRealtimeVoiceProvider();
1336
+ const onEvent = vi.fn();
1337
+ const bridge = provider.createBridge({
1338
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
1339
+ onAudio: vi.fn(),
1340
+ onClearAudio: vi.fn(),
1341
+ onEvent,
1342
+ });
1343
+ const connecting = bridge.connect();
1344
+ const socket = FakeWebSocket.instances[0];
1345
+ if (!socket) {
1346
+ throw new Error("expected bridge to create a websocket");
1347
+ }
1348
+
1349
+ socket.readyState = FakeWebSocket.OPEN;
1350
+ socket.emit("open");
1351
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "session.updated" })));
1352
+ await connecting;
1353
+
1354
+ bridge.triggerGreeting?.("Say exactly: hello from explicit speech.");
1355
+
1356
+ expect(parseSent(socket).slice(-2)).toEqual([
1357
+ {
1358
+ type: "conversation.item.create",
1359
+ item: {
1360
+ type: "message",
1361
+ role: "user",
1362
+ content: [
1363
+ {
1364
+ type: "input_text",
1365
+ text: "Say exactly: hello from explicit speech.",
1366
+ },
1367
+ ],
1368
+ },
1369
+ },
1370
+ {
1371
+ type: "response.create",
1372
+ },
1373
+ ]);
1374
+ expect(JSON.stringify(parseSent(socket).at(-1))).not.toContain("output_modalities");
1375
+ expect(onEvent).toHaveBeenCalledWith({ direction: "client", type: "conversation.item.create" });
1376
+ expect(onEvent).toHaveBeenCalledWith({ direction: "client", type: "response.create" });
1377
+ });
1378
+
1379
+ it("defers manual response.create while a realtime response is active", async () => {
1380
+ const provider = buildOpenAIRealtimeVoiceProvider();
1381
+ const bridge = provider.createBridge({
1382
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
1383
+ onAudio: vi.fn(),
1384
+ onClearAudio: vi.fn(),
1385
+ });
1386
+ const connecting = bridge.connect();
1387
+ const socket = FakeWebSocket.instances[0];
1388
+ if (!socket) {
1389
+ throw new Error("expected bridge to create a websocket");
1390
+ }
1391
+
1392
+ socket.readyState = FakeWebSocket.OPEN;
1393
+ socket.emit("open");
1394
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "session.updated" })));
1395
+ await connecting;
1396
+ socket.emit(
1397
+ "message",
1398
+ Buffer.from(JSON.stringify({ type: "response.created", response: { id: "resp_1" } })),
1399
+ );
1400
+
1401
+ bridge.submitToolResult("call_1", { text: "done" });
1402
+
1403
+ expect(parseSent(socket).slice(-1)).toEqual([
1404
+ {
1405
+ type: "conversation.item.create",
1406
+ item: {
1407
+ type: "function_call_output",
1408
+ call_id: "call_1",
1409
+ output: JSON.stringify({ text: "done" }),
1410
+ },
1411
+ },
1412
+ ]);
1413
+
1414
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "response.done" })));
1415
+
1416
+ expect(parseSent(socket).slice(-1)).toEqual([{ type: "response.create" }]);
1417
+ });
1418
+
1419
+ it("does not request a realtime response for continuing tool results", async () => {
1420
+ const provider = buildOpenAIRealtimeVoiceProvider();
1421
+ const bridge = provider.createBridge({
1422
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
1423
+ onAudio: vi.fn(),
1424
+ onClearAudio: vi.fn(),
1425
+ });
1426
+ const connecting = bridge.connect();
1427
+ const socket = FakeWebSocket.instances[0];
1428
+ if (!socket) {
1429
+ throw new Error("expected bridge to create a websocket");
1430
+ }
1431
+
1432
+ socket.readyState = FakeWebSocket.OPEN;
1433
+ socket.emit("open");
1434
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "session.updated" })));
1435
+ await connecting;
1436
+
1437
+ bridge.submitToolResult("call_1", { status: "working" }, { willContinue: true });
1438
+
1439
+ expect(parseSent(socket).slice(-1)).toEqual([
1440
+ {
1441
+ type: "conversation.item.create",
1442
+ item: {
1443
+ type: "function_call_output",
1444
+ call_id: "call_1",
1445
+ output: JSON.stringify({ status: "working" }),
1446
+ },
1447
+ },
1448
+ ]);
1449
+ expect(hasSentEventType(socket, "response.create")).toBe(false);
1450
+
1451
+ bridge.submitToolResult("call_1", { text: "done" });
1452
+
1453
+ expect(parseSent(socket).slice(-2)).toEqual([
1454
+ {
1455
+ type: "conversation.item.create",
1456
+ item: {
1457
+ type: "function_call_output",
1458
+ call_id: "call_1",
1459
+ output: JSON.stringify({ text: "done" }),
1460
+ },
1461
+ },
1462
+ { type: "response.create" },
1463
+ ]);
1464
+ socket.emit(
1465
+ "message",
1466
+ Buffer.from(JSON.stringify({ type: "response.created", response: { id: "resp_2" } })),
1467
+ );
1468
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "response.done" })));
1469
+
1470
+ expect(parseSent(socket).filter((event) => event.type === "response.create")).toHaveLength(1);
1471
+ });
1472
+
1473
+ it("does not request a realtime response for suppressed tool results", async () => {
1474
+ const provider = buildOpenAIRealtimeVoiceProvider();
1475
+ const bridge = provider.createBridge({
1476
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
1477
+ onAudio: vi.fn(),
1478
+ onClearAudio: vi.fn(),
1479
+ });
1480
+ const connecting = bridge.connect();
1481
+ const socket = FakeWebSocket.instances[0];
1482
+ if (!socket) {
1483
+ throw new Error("expected bridge to create a websocket");
1484
+ }
1485
+
1486
+ socket.readyState = FakeWebSocket.OPEN;
1487
+ socket.emit("open");
1488
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "session.updated" })));
1489
+ await connecting;
1490
+
1491
+ bridge.submitToolResult("call_1", { status: "already_delivered" }, { suppressResponse: true });
1492
+
1493
+ expect(parseSent(socket).slice(-1)).toEqual([
1494
+ {
1495
+ type: "conversation.item.create",
1496
+ item: {
1497
+ type: "function_call_output",
1498
+ call_id: "call_1",
1499
+ output: JSON.stringify({ status: "already_delivered" }),
1500
+ },
1501
+ },
1502
+ ]);
1503
+ expect(hasSentEventType(socket, "response.create")).toBe(false);
1504
+ });
1505
+
1506
+ it("does not flush deferred response.create while a tool result is still continuing", async () => {
1507
+ const provider = buildOpenAIRealtimeVoiceProvider();
1508
+ const onError = vi.fn();
1509
+ const bridge = provider.createBridge({
1510
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
1511
+ onAudio: vi.fn(),
1512
+ onClearAudio: vi.fn(),
1513
+ onError,
1514
+ });
1515
+ const connecting = bridge.connect();
1516
+ const socket = FakeWebSocket.instances[0];
1517
+ if (!socket) {
1518
+ throw new Error("expected bridge to create a websocket");
1519
+ }
1520
+
1521
+ socket.readyState = FakeWebSocket.OPEN;
1522
+ socket.emit("open");
1523
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "session.updated" })));
1524
+ await connecting;
1525
+
1526
+ bridge.submitToolResult("call_1", { status: "working" }, { willContinue: true });
1527
+ socket.emit(
1528
+ "message",
1529
+ Buffer.from(
1530
+ JSON.stringify({
1531
+ type: "error",
1532
+ error: {
1533
+ message: "Conversation already has an active response in progress: resp_1",
1534
+ },
1535
+ }),
1536
+ ),
1537
+ );
1538
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "response.done" })));
1539
+
1540
+ expect(onError).not.toHaveBeenCalled();
1541
+ expect(parseSent(socket).filter((event) => event.type === "response.create")).toEqual([]);
1542
+
1543
+ bridge.submitToolResult("call_1", { text: "done" });
1544
+
1545
+ expect(parseSent(socket).slice(-2)).toEqual([
1546
+ {
1547
+ type: "conversation.item.create",
1548
+ item: {
1549
+ type: "function_call_output",
1550
+ call_id: "call_1",
1551
+ output: JSON.stringify({ text: "done" }),
1552
+ },
1553
+ },
1554
+ { type: "response.create" },
1555
+ ]);
1556
+ });
1557
+
1558
+ it("drains deferred response.create after response.cancelled", async () => {
1559
+ const provider = buildOpenAIRealtimeVoiceProvider();
1560
+ const bridge = provider.createBridge({
1561
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
1562
+ onAudio: vi.fn(),
1563
+ onClearAudio: vi.fn(),
1564
+ });
1565
+ const connecting = bridge.connect();
1566
+ const socket = FakeWebSocket.instances[0];
1567
+ if (!socket) {
1568
+ throw new Error("expected bridge to create a websocket");
1569
+ }
1570
+
1571
+ socket.readyState = FakeWebSocket.OPEN;
1572
+ socket.emit("open");
1573
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "session.updated" })));
1574
+ await connecting;
1575
+ socket.emit(
1576
+ "message",
1577
+ Buffer.from(JSON.stringify({ type: "response.created", response: { id: "resp_1" } })),
1578
+ );
1579
+
1580
+ bridge.submitToolResult("call_1", { text: "done" });
1581
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "response.cancelled" })));
1582
+
1583
+ expect(parseSent(socket).slice(-1)).toEqual([{ type: "response.create" }]);
1584
+ });
1585
+
1586
+ it("does not send duplicate response.cancel while cancellation is pending", async () => {
1587
+ const provider = buildOpenAIRealtimeVoiceProvider();
1588
+ const onEvent = vi.fn();
1589
+ const bridge = provider.createBridge({
1590
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
1591
+ onAudio: vi.fn(),
1592
+ onClearAudio: vi.fn(),
1593
+ onEvent,
1594
+ });
1595
+ const connecting = bridge.connect();
1596
+ const socket = FakeWebSocket.instances[0];
1597
+ if (!socket) {
1598
+ throw new Error("expected bridge to create a websocket");
1599
+ }
1600
+
1601
+ socket.readyState = FakeWebSocket.OPEN;
1602
+ socket.emit("open");
1603
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "session.updated" })));
1604
+ await connecting;
1605
+ socket.emit(
1606
+ "message",
1607
+ Buffer.from(JSON.stringify({ type: "response.created", response: { id: "resp_1" } })),
1608
+ );
1609
+ bridge.setMediaTimestamp(1000);
1610
+ socket.emit(
1611
+ "message",
1612
+ Buffer.from(
1613
+ JSON.stringify({
1614
+ type: "response.audio.delta",
1615
+ item_id: "item_1",
1616
+ delta: Buffer.from("assistant audio").toString("base64"),
1617
+ }),
1618
+ ),
1619
+ );
1620
+ bridge.setMediaTimestamp(1300);
1621
+
1622
+ bridge.handleBargeIn?.({ audioPlaybackActive: true });
1623
+ bridge.handleBargeIn?.({ audioPlaybackActive: true });
1624
+
1625
+ expect(parseSent(socket).filter((event) => event.type === "response.cancel")).toHaveLength(1);
1626
+ expect(onEvent).toHaveBeenCalledWith({
1627
+ direction: "client",
1628
+ type: "response.cancel",
1629
+ detail: "reason=barge-in",
1630
+ });
1631
+ expect(onEvent).toHaveBeenCalledWith({
1632
+ direction: "client",
1633
+ type: "conversation.item.truncate",
1634
+ detail: "reason=barge-in audioEndMs=300",
1635
+ });
1636
+ });
1637
+
1638
+ it("ignores zero-length playback barge-in without clearing audio", async () => {
1639
+ const provider = buildOpenAIRealtimeVoiceProvider();
1640
+ const onClearAudio = vi.fn();
1641
+ const onEvent = vi.fn();
1642
+ const bridge = provider.createBridge({
1643
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
1644
+ onAudio: vi.fn(),
1645
+ onClearAudio,
1646
+ onEvent,
1647
+ });
1648
+ const connecting = bridge.connect();
1649
+ const socket = FakeWebSocket.instances[0];
1650
+ if (!socket) {
1651
+ throw new Error("expected bridge to create a websocket");
1652
+ }
1653
+
1654
+ socket.readyState = FakeWebSocket.OPEN;
1655
+ socket.emit("open");
1656
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "session.updated" })));
1657
+ await connecting;
1658
+ bridge.setMediaTimestamp(1000);
1659
+ socket.emit(
1660
+ "message",
1661
+ Buffer.from(JSON.stringify({ type: "response.created", response: { id: "resp_1" } })),
1662
+ );
1663
+ socket.emit(
1664
+ "message",
1665
+ Buffer.from(
1666
+ JSON.stringify({
1667
+ type: "response.audio.delta",
1668
+ item_id: "item_1",
1669
+ delta: Buffer.from("assistant audio").toString("base64"),
1670
+ }),
1671
+ ),
1672
+ );
1673
+
1674
+ bridge.handleBargeIn?.({ audioPlaybackActive: true });
1675
+
1676
+ expect(onClearAudio).not.toHaveBeenCalled();
1677
+ expect(hasSentEventType(socket, "response.cancel")).toBe(false);
1678
+ expect(parseSent(socket).some((event) => event.type === "conversation.item.truncate")).toBe(
1679
+ false,
1680
+ );
1681
+ expect(onEvent).toHaveBeenCalledWith({
1682
+ direction: "client",
1683
+ type: "conversation.item.truncate.skipped",
1684
+ detail: "reason=barge-in audioEndMs=0 minAudioEndMs=250",
1685
+ });
1686
+ });
1687
+
1688
+ it("force-cancels zero-length playback barge-in for agent handoff fallback", async () => {
1689
+ const provider = buildOpenAIRealtimeVoiceProvider();
1690
+ const onClearAudio = vi.fn();
1691
+ const onEvent = vi.fn();
1692
+ const bridge = provider.createBridge({
1693
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
1694
+ onAudio: vi.fn(),
1695
+ onClearAudio,
1696
+ onEvent,
1697
+ });
1698
+ const connecting = bridge.connect();
1699
+ const socket = FakeWebSocket.instances[0];
1700
+ if (!socket) {
1701
+ throw new Error("expected bridge to create a websocket");
1702
+ }
1703
+
1704
+ socket.readyState = FakeWebSocket.OPEN;
1705
+ socket.emit("open");
1706
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "session.updated" })));
1707
+ await connecting;
1708
+ bridge.setMediaTimestamp(1000);
1709
+ socket.emit(
1710
+ "message",
1711
+ Buffer.from(JSON.stringify({ type: "response.created", response: { id: "resp_1" } })),
1712
+ );
1713
+ socket.emit(
1714
+ "message",
1715
+ Buffer.from(
1716
+ JSON.stringify({
1717
+ type: "response.audio.delta",
1718
+ item_id: "item_1",
1719
+ delta: Buffer.from("assistant audio").toString("base64"),
1720
+ }),
1721
+ ),
1722
+ );
1723
+
1724
+ bridge.handleBargeIn?.({ audioPlaybackActive: true, force: true });
1725
+
1726
+ expect(parseSent(socket).slice(-2)).toEqual([
1727
+ { type: "response.cancel" },
1728
+ {
1729
+ type: "conversation.item.truncate",
1730
+ item_id: "item_1",
1731
+ content_index: 0,
1732
+ audio_end_ms: 0,
1733
+ },
1734
+ ]);
1735
+ expect(onClearAudio).toHaveBeenCalled();
1736
+ expect(
1737
+ onEvent.mock.calls.some(
1738
+ ([event]) => isRecord(event) && event.type === "conversation.item.truncate.skipped",
1739
+ ),
1740
+ ).toBe(false);
1741
+ });
1742
+
1743
+ it("allows immediate playback barge-in when the minimum audio window is zero", async () => {
1744
+ const provider = buildOpenAIRealtimeVoiceProvider();
1745
+ const onClearAudio = vi.fn();
1746
+ const bridge = provider.createBridge({
1747
+ providerConfig: {
1748
+ apiKey: "sk-test", // pragma: allowlist secret
1749
+ minBargeInAudioEndMs: 0,
1750
+ },
1751
+ onAudio: vi.fn(),
1752
+ onClearAudio,
1753
+ });
1754
+ const connecting = bridge.connect();
1755
+ const socket = FakeWebSocket.instances[0];
1756
+ if (!socket) {
1757
+ throw new Error("expected bridge to create a websocket");
1758
+ }
1759
+
1760
+ socket.readyState = FakeWebSocket.OPEN;
1761
+ socket.emit("open");
1762
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "session.updated" })));
1763
+ await connecting;
1764
+ bridge.setMediaTimestamp(1000);
1765
+ socket.emit(
1766
+ "message",
1767
+ Buffer.from(JSON.stringify({ type: "response.created", response: { id: "resp_1" } })),
1768
+ );
1769
+ socket.emit(
1770
+ "message",
1771
+ Buffer.from(
1772
+ JSON.stringify({
1773
+ type: "response.audio.delta",
1774
+ item_id: "item_1",
1775
+ delta: Buffer.from("assistant audio").toString("base64"),
1776
+ }),
1777
+ ),
1778
+ );
1779
+
1780
+ bridge.handleBargeIn?.({ audioPlaybackActive: true });
1781
+
1782
+ expect(onClearAudio).toHaveBeenCalledTimes(1);
1783
+ expect(parseSent(socket).slice(-2)).toEqual([
1784
+ { type: "response.cancel" },
1785
+ {
1786
+ type: "conversation.item.truncate",
1787
+ item_id: "item_1",
1788
+ content_index: 0,
1789
+ audio_end_ms: 0,
1790
+ },
1791
+ ]);
1792
+ });
1793
+
1794
+ it("drains deferred response.create after a no-active-response cancellation error", async () => {
1795
+ const provider = buildOpenAIRealtimeVoiceProvider();
1796
+ const onError = vi.fn();
1797
+ const bridge = provider.createBridge({
1798
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
1799
+ onAudio: vi.fn(),
1800
+ onClearAudio: vi.fn(),
1801
+ onError,
1802
+ });
1803
+ const connecting = bridge.connect();
1804
+ const socket = FakeWebSocket.instances[0];
1805
+ if (!socket) {
1806
+ throw new Error("expected bridge to create a websocket");
1807
+ }
1808
+
1809
+ socket.readyState = FakeWebSocket.OPEN;
1810
+ socket.emit("open");
1811
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "session.updated" })));
1812
+ await connecting;
1813
+ socket.emit(
1814
+ "message",
1815
+ Buffer.from(JSON.stringify({ type: "response.created", response: { id: "resp_1" } })),
1816
+ );
1817
+
1818
+ bridge.submitToolResult("call_1", { text: "done" });
1819
+ bridge.handleBargeIn?.({ audioPlaybackActive: true });
1820
+ socket.emit(
1821
+ "message",
1822
+ Buffer.from(
1823
+ JSON.stringify({
1824
+ type: "error",
1825
+ error: {
1826
+ message: "Cancellation failed: no active response found",
1827
+ },
1828
+ }),
1829
+ ),
1830
+ );
1831
+
1832
+ expect(onError).not.toHaveBeenCalled();
1833
+ expect(parseSent(socket).slice(-1)).toEqual([{ type: "response.create" }]);
1834
+ });
1835
+
1836
+ it("resets deferred response guards after websocket reconnect", async () => {
1837
+ vi.useFakeTimers();
1838
+ const provider = buildOpenAIRealtimeVoiceProvider();
1839
+ const bridge = provider.createBridge({
1840
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
1841
+ onAudio: vi.fn(),
1842
+ onClearAudio: vi.fn(),
1843
+ });
1844
+ const connecting = bridge.connect();
1845
+ const socket = FakeWebSocket.instances[0];
1846
+ if (!socket) {
1847
+ throw new Error("expected bridge to create a websocket");
1848
+ }
1849
+
1850
+ socket.readyState = FakeWebSocket.OPEN;
1851
+ socket.emit("open");
1852
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "session.updated" })));
1853
+ await connecting;
1854
+ socket.emit(
1855
+ "message",
1856
+ Buffer.from(JSON.stringify({ type: "response.created", response: { id: "resp_1" } })),
1857
+ );
1858
+ bridge.submitToolResult("call_1", { text: "done" });
1859
+
1860
+ expect(parseSent(socket).slice(-1)[0]?.type).toBe("conversation.item.create");
1861
+
1862
+ socket.emit("close", 1006, Buffer.from("transient drop"));
1863
+ await vi.advanceTimersByTimeAsync(1000);
1864
+ const reconnectedSocket = FakeWebSocket.instances[1];
1865
+ if (!reconnectedSocket) {
1866
+ throw new Error("expected bridge to reconnect");
1867
+ }
1868
+
1869
+ reconnectedSocket.readyState = FakeWebSocket.OPEN;
1870
+ reconnectedSocket.emit("open");
1871
+ reconnectedSocket.emit("message", Buffer.from(JSON.stringify({ type: "session.updated" })));
1872
+ bridge.sendUserMessage?.("Say hello after reconnect.");
1873
+
1874
+ expect(parseSent(reconnectedSocket).slice(-2)).toEqual([
1875
+ {
1876
+ type: "conversation.item.create",
1877
+ item: {
1878
+ type: "message",
1879
+ role: "user",
1880
+ content: [{ type: "input_text", text: "Say hello after reconnect." }],
1881
+ },
1882
+ },
1883
+ { type: "response.create" },
1884
+ ]);
1885
+ });
1886
+
1887
+ it("turns active-response errors into a deferred response.create retry", async () => {
1888
+ const provider = buildOpenAIRealtimeVoiceProvider();
1889
+ const onError = vi.fn();
1890
+ const bridge = provider.createBridge({
1891
+ providerConfig: { apiKey: "sk-test" }, // pragma: allowlist secret
1892
+ onAudio: vi.fn(),
1893
+ onClearAudio: vi.fn(),
1894
+ onError,
1895
+ });
1896
+ const connecting = bridge.connect();
1897
+ const socket = FakeWebSocket.instances[0];
1898
+ if (!socket) {
1899
+ throw new Error("expected bridge to create a websocket");
1900
+ }
1901
+
1902
+ socket.readyState = FakeWebSocket.OPEN;
1903
+ socket.emit("open");
1904
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "session.updated" })));
1905
+ await connecting;
1906
+
1907
+ bridge.submitToolResult("call_1", { text: "done" });
1908
+ socket.emit(
1909
+ "message",
1910
+ Buffer.from(
1911
+ JSON.stringify({
1912
+ type: "error",
1913
+ error: {
1914
+ message: "Conversation already has an active response in progress: resp_1",
1915
+ },
1916
+ }),
1917
+ ),
1918
+ );
1919
+ socket.emit("message", Buffer.from(JSON.stringify({ type: "response.done" })));
1920
+
1921
+ expect(onError).not.toHaveBeenCalled();
1922
+ expect(parseSent(socket).slice(-1)).toEqual([{ type: "response.create" }]);
1923
+ });
1924
+ });