ruflo 3.10.35 → 3.10.37

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (498) hide show
  1. package/README.md +416 -416
  2. package/bin/ruflo.js +77 -77
  3. package/package.json +113 -113
  4. package/src/chat-ui/Dockerfile +25 -25
  5. package/src/chat-ui/patch-mcp-url-safety.sh +28 -28
  6. package/src/config/config.example.json +76 -76
  7. package/src/mcp-bridge/Dockerfile +45 -45
  8. package/src/mcp-bridge/index.js +1692 -1692
  9. package/src/mcp-bridge/mcp-stdio-kernel.js +159 -159
  10. package/src/mcp-bridge/package.json +17 -17
  11. package/src/mcp-bridge/test-harness.js +470 -470
  12. package/src/nginx/Dockerfile +10 -10
  13. package/src/nginx/nginx.conf +67 -67
  14. package/src/nginx/static/favicon-dark.svg +4 -4
  15. package/src/nginx/static/favicon.svg +4 -4
  16. package/src/nginx/static/icon.svg +5 -5
  17. package/src/nginx/static/logo.svg +9 -9
  18. package/src/nginx/static/manifest.json +22 -22
  19. package/src/nginx/static/welcome.js +184 -184
  20. package/src/ruvocal/.claude/skills/add-model-descriptions/SKILL.md +73 -73
  21. package/src/ruvocal/.devcontainer/Dockerfile +9 -9
  22. package/src/ruvocal/.devcontainer/devcontainer.json +36 -36
  23. package/src/ruvocal/.dockerignore +16 -16
  24. package/src/ruvocal/.eslintignore +13 -13
  25. package/src/ruvocal/.eslintrc.cjs +45 -45
  26. package/src/ruvocal/.gcloudignore +18 -18
  27. package/src/ruvocal/.github/ISSUE_TEMPLATE/bug-report--chat-ui-.md +43 -43
  28. package/src/ruvocal/.github/ISSUE_TEMPLATE/config-support.md +9 -9
  29. package/src/ruvocal/.github/ISSUE_TEMPLATE/feature-request--chat-ui-.md +17 -17
  30. package/src/ruvocal/.github/ISSUE_TEMPLATE/huggingchat.md +11 -11
  31. package/src/ruvocal/.github/release.yml +16 -16
  32. package/src/ruvocal/.github/workflows/build-docs.yml +18 -18
  33. package/src/ruvocal/.github/workflows/build-image.yml +142 -142
  34. package/src/ruvocal/.github/workflows/build-pr-docs.yml +20 -20
  35. package/src/ruvocal/.github/workflows/deploy-dev.yml +63 -63
  36. package/src/ruvocal/.github/workflows/deploy-prod.yml +78 -78
  37. package/src/ruvocal/.github/workflows/lint-and-test.yml +84 -84
  38. package/src/ruvocal/.github/workflows/slugify.yaml +72 -72
  39. package/src/ruvocal/.github/workflows/trufflehog.yml +17 -17
  40. package/src/ruvocal/.github/workflows/upload-pr-documentation.yml +16 -16
  41. package/src/ruvocal/.husky/lint-stage-config.js +4 -4
  42. package/src/ruvocal/.husky/pre-commit +2 -2
  43. package/src/ruvocal/.prettierignore +14 -14
  44. package/src/ruvocal/.prettierrc +7 -7
  45. package/src/ruvocal/CLAUDE.md +126 -126
  46. package/src/ruvocal/Dockerfile +96 -96
  47. package/src/ruvocal/LICENSE +202 -202
  48. package/src/ruvocal/PRIVACY.md +41 -41
  49. package/src/ruvocal/README.md +164 -164
  50. package/src/ruvocal/chart/Chart.yaml +5 -5
  51. package/src/ruvocal/chart/env/dev.yaml +260 -260
  52. package/src/ruvocal/chart/env/prod.yaml +273 -273
  53. package/src/ruvocal/chart/templates/_helpers.tpl +22 -22
  54. package/src/ruvocal/chart/templates/config.yaml +10 -10
  55. package/src/ruvocal/chart/templates/deployment.yaml +81 -81
  56. package/src/ruvocal/chart/templates/hpa.yaml +45 -45
  57. package/src/ruvocal/chart/templates/infisical.yaml +24 -24
  58. package/src/ruvocal/chart/templates/ingress-internal.yaml +32 -32
  59. package/src/ruvocal/chart/templates/ingress.yaml +32 -32
  60. package/src/ruvocal/chart/templates/network-policy.yaml +36 -36
  61. package/src/ruvocal/chart/templates/service-account.yaml +13 -13
  62. package/src/ruvocal/chart/templates/service-monitor.yaml +17 -17
  63. package/src/ruvocal/chart/templates/service.yaml +21 -21
  64. package/src/ruvocal/chart/values.yaml +73 -73
  65. package/src/ruvocal/cloudbuild.yaml +68 -68
  66. package/src/ruvocal/config/branding.env.example +19 -19
  67. package/src/ruvocal/docker-compose.yml +21 -21
  68. package/src/ruvocal/docs/adr/ADR-029-HUGGINGFACE-CHAT-UI-CLOUD-RUN.md +1236 -1236
  69. package/src/ruvocal/docs/adr/ADR-033-RUVECTOR-RUFLO-MCP-INTEGRATION.md +111 -111
  70. package/src/ruvocal/docs/adr/ADR-034-OPTIONAL-MCP-BACKENDS.md +117 -117
  71. package/src/ruvocal/docs/adr/ADR-035-MCP-TOOL-GROUPS.md +186 -186
  72. package/src/ruvocal/docs/adr/ADR-037-AUTOPILOT-CHAT-MODE.md +1500 -1500
  73. package/src/ruvocal/docs/adr/ADR-038-RUVOCAL-FORK.md +286 -286
  74. package/src/ruvocal/docs/source/_toctree.yml +30 -30
  75. package/src/ruvocal/docs/source/configuration/common-issues.md +38 -38
  76. package/src/ruvocal/docs/source/configuration/llm-router.md +105 -105
  77. package/src/ruvocal/docs/source/configuration/mcp-tools.md +84 -84
  78. package/src/ruvocal/docs/source/configuration/metrics.md +9 -9
  79. package/src/ruvocal/docs/source/configuration/open-id.md +57 -57
  80. package/src/ruvocal/docs/source/configuration/overview.md +89 -89
  81. package/src/ruvocal/docs/source/configuration/theming.md +20 -20
  82. package/src/ruvocal/docs/source/developing/architecture.md +48 -48
  83. package/src/ruvocal/docs/source/index.md +53 -53
  84. package/src/ruvocal/docs/source/installation/docker.md +43 -43
  85. package/src/ruvocal/docs/source/installation/helm.md +43 -43
  86. package/src/ruvocal/docs/source/installation/local.md +62 -62
  87. package/src/ruvocal/entrypoint.sh +18 -18
  88. package/src/ruvocal/mcp-bridge/Dockerfile +45 -45
  89. package/src/ruvocal/mcp-bridge/cloudbuild.yaml +49 -49
  90. package/src/ruvocal/mcp-bridge/index.js +1902 -1902
  91. package/src/ruvocal/mcp-bridge/mcp-stdio-kernel.js +159 -159
  92. package/src/ruvocal/mcp-bridge/package-lock.json +762 -762
  93. package/src/ruvocal/mcp-bridge/package.json +17 -17
  94. package/src/ruvocal/mcp-bridge/test-harness.js +470 -470
  95. package/src/ruvocal/package-lock.json +11741 -11741
  96. package/src/ruvocal/package.json +121 -121
  97. package/src/ruvocal/postcss.config.js +6 -6
  98. package/src/ruvocal/rvf.manifest.json +204 -204
  99. package/src/ruvocal/scripts/config.ts +64 -64
  100. package/src/ruvocal/scripts/generate-welcome.mjs +181 -181
  101. package/src/ruvocal/scripts/populate.ts +288 -288
  102. package/src/ruvocal/scripts/samples.txt +194 -194
  103. package/src/ruvocal/scripts/setups/vitest-setup-server.ts +44 -44
  104. package/src/ruvocal/scripts/updateLocalEnv.ts +48 -48
  105. package/src/ruvocal/src/ambient.d.ts +7 -7
  106. package/src/ruvocal/src/app.d.ts +29 -29
  107. package/src/ruvocal/src/app.html +53 -53
  108. package/src/ruvocal/src/hooks.server.ts +32 -32
  109. package/src/ruvocal/src/hooks.ts +6 -6
  110. package/src/ruvocal/src/lib/APIClient.ts +148 -148
  111. package/src/ruvocal/src/lib/actions/clickOutside.ts +18 -18
  112. package/src/ruvocal/src/lib/actions/snapScrollToBottom.ts +346 -346
  113. package/src/ruvocal/src/lib/buildPrompt.ts +33 -33
  114. package/src/ruvocal/src/lib/components/AnnouncementBanner.svelte +20 -20
  115. package/src/ruvocal/src/lib/components/BackgroundGenerationPoller.svelte +168 -168
  116. package/src/ruvocal/src/lib/components/CodeBlock.svelte +73 -73
  117. package/src/ruvocal/src/lib/components/CopyToClipBoardBtn.svelte +92 -92
  118. package/src/ruvocal/src/lib/components/DeleteConversationModal.svelte +75 -75
  119. package/src/ruvocal/src/lib/components/EditConversationModal.svelte +100 -100
  120. package/src/ruvocal/src/lib/components/ExpandNavigation.svelte +22 -22
  121. package/src/ruvocal/src/lib/components/FoundationBackground.svelte +242 -242
  122. package/src/ruvocal/src/lib/components/HoverTooltip.svelte +44 -44
  123. package/src/ruvocal/src/lib/components/HtmlPreviewModal.svelte +143 -143
  124. package/src/ruvocal/src/lib/components/InfiniteScroll.svelte +50 -50
  125. package/src/ruvocal/src/lib/components/MobileNav.svelte +300 -300
  126. package/src/ruvocal/src/lib/components/Modal.svelte +115 -115
  127. package/src/ruvocal/src/lib/components/ModelCardMetadata.svelte +71 -71
  128. package/src/ruvocal/src/lib/components/NavConversationItem.svelte +151 -151
  129. package/src/ruvocal/src/lib/components/NavMenu.svelte +313 -313
  130. package/src/ruvocal/src/lib/components/Pagination.svelte +97 -97
  131. package/src/ruvocal/src/lib/components/PaginationArrow.svelte +27 -27
  132. package/src/ruvocal/src/lib/components/Portal.svelte +24 -24
  133. package/src/ruvocal/src/lib/components/RetryBtn.svelte +18 -18
  134. package/src/ruvocal/src/lib/components/RuFloUniverse.svelte +185 -185
  135. package/src/ruvocal/src/lib/components/RufloHelpModal.svelte +411 -411
  136. package/src/ruvocal/src/lib/components/ScrollToBottomBtn.svelte +47 -47
  137. package/src/ruvocal/src/lib/components/ScrollToPreviousBtn.svelte +77 -77
  138. package/src/ruvocal/src/lib/components/ShareConversationModal.svelte +182 -182
  139. package/src/ruvocal/src/lib/components/StopGeneratingBtn.svelte +69 -69
  140. package/src/ruvocal/src/lib/components/SubscribeModal.svelte +87 -87
  141. package/src/ruvocal/src/lib/components/Switch.svelte +36 -36
  142. package/src/ruvocal/src/lib/components/SystemPromptModal.svelte +44 -44
  143. package/src/ruvocal/src/lib/components/Toast.svelte +27 -27
  144. package/src/ruvocal/src/lib/components/Tooltip.svelte +30 -30
  145. package/src/ruvocal/src/lib/components/WelcomeModal.svelte +46 -46
  146. package/src/ruvocal/src/lib/components/chat/Alternatives.svelte +77 -77
  147. package/src/ruvocal/src/lib/components/chat/BlockWrapper.svelte +72 -72
  148. package/src/ruvocal/src/lib/components/chat/ChatInput.svelte +490 -490
  149. package/src/ruvocal/src/lib/components/chat/ChatIntroduction.svelte +123 -123
  150. package/src/ruvocal/src/lib/components/chat/ChatMessage.svelte +548 -548
  151. package/src/ruvocal/src/lib/components/chat/ChatWindow.svelte +1057 -1057
  152. package/src/ruvocal/src/lib/components/chat/FileDropzone.svelte +92 -92
  153. package/src/ruvocal/src/lib/components/chat/ImageLightbox.svelte +66 -66
  154. package/src/ruvocal/src/lib/components/chat/MarkdownBlock.svelte +23 -23
  155. package/src/ruvocal/src/lib/components/chat/MarkdownRenderer.svelte +69 -69
  156. package/src/ruvocal/src/lib/components/chat/MarkdownRenderer.svelte.test.ts +58 -58
  157. package/src/ruvocal/src/lib/components/chat/MessageAvatar.svelte +103 -103
  158. package/src/ruvocal/src/lib/components/chat/ModelSwitch.svelte +64 -64
  159. package/src/ruvocal/src/lib/components/chat/OpenReasoningResults.svelte +81 -81
  160. package/src/ruvocal/src/lib/components/chat/TaskGroup.svelte +88 -88
  161. package/src/ruvocal/src/lib/components/chat/ToolUpdate.svelte +273 -273
  162. package/src/ruvocal/src/lib/components/chat/UploadedFile.svelte +253 -253
  163. package/src/ruvocal/src/lib/components/chat/UrlFetchModal.svelte +203 -203
  164. package/src/ruvocal/src/lib/components/chat/VoiceRecorder.svelte +214 -214
  165. package/src/ruvocal/src/lib/components/icons/IconBurger.svelte +20 -20
  166. package/src/ruvocal/src/lib/components/icons/IconCheap.svelte +20 -20
  167. package/src/ruvocal/src/lib/components/icons/IconChevron.svelte +24 -24
  168. package/src/ruvocal/src/lib/components/icons/IconDazzled.svelte +40 -40
  169. package/src/ruvocal/src/lib/components/icons/IconFast.svelte +20 -20
  170. package/src/ruvocal/src/lib/components/icons/IconLoading.svelte +22 -22
  171. package/src/ruvocal/src/lib/components/icons/IconMCP.svelte +28 -28
  172. package/src/ruvocal/src/lib/components/icons/IconMoon.svelte +21 -21
  173. package/src/ruvocal/src/lib/components/icons/IconNew.svelte +20 -20
  174. package/src/ruvocal/src/lib/components/icons/IconOmni.svelte +90 -90
  175. package/src/ruvocal/src/lib/components/icons/IconPaperclip.svelte +24 -24
  176. package/src/ruvocal/src/lib/components/icons/IconPro.svelte +37 -37
  177. package/src/ruvocal/src/lib/components/icons/IconShare.svelte +21 -21
  178. package/src/ruvocal/src/lib/components/icons/IconSun.svelte +93 -93
  179. package/src/ruvocal/src/lib/components/icons/Logo.svelte +68 -68
  180. package/src/ruvocal/src/lib/components/icons/LogoHuggingFaceBorderless.svelte +54 -54
  181. package/src/ruvocal/src/lib/components/mcp/AddServerForm.svelte +250 -250
  182. package/src/ruvocal/src/lib/components/mcp/MCPServerManager.svelte +185 -185
  183. package/src/ruvocal/src/lib/components/mcp/ServerCard.svelte +203 -203
  184. package/src/ruvocal/src/lib/components/players/AudioPlayer.svelte +82 -82
  185. package/src/ruvocal/src/lib/components/voice/AudioWaveform.svelte +96 -96
  186. package/src/ruvocal/src/lib/components/wasm/GalleryPanel.svelte +357 -357
  187. package/src/ruvocal/src/lib/constants/mcpExamples.ts +114 -114
  188. package/src/ruvocal/src/lib/constants/mime.ts +11 -11
  189. package/src/ruvocal/src/lib/constants/pagination.ts +1 -1
  190. package/src/ruvocal/src/lib/constants/publicSepToken.ts +1 -1
  191. package/src/ruvocal/src/lib/constants/routerExamples.ts +133 -133
  192. package/src/ruvocal/src/lib/constants/rvagentPresets.ts +206 -206
  193. package/src/ruvocal/src/lib/createShareLink.ts +27 -27
  194. package/src/ruvocal/src/lib/jobs/refresh-conversation-stats.ts +297 -297
  195. package/src/ruvocal/src/lib/migrations/lock.ts +56 -56
  196. package/src/ruvocal/src/lib/migrations/migrations.spec.ts +74 -74
  197. package/src/ruvocal/src/lib/migrations/migrations.ts +109 -109
  198. package/src/ruvocal/src/lib/migrations/routines/01-update-search-assistants.ts +50 -50
  199. package/src/ruvocal/src/lib/migrations/routines/02-update-assistants-models.ts +48 -48
  200. package/src/ruvocal/src/lib/migrations/routines/04-update-message-updates.ts +151 -151
  201. package/src/ruvocal/src/lib/migrations/routines/05-update-message-files.ts +56 -56
  202. package/src/ruvocal/src/lib/migrations/routines/06-trim-message-updates.ts +56 -56
  203. package/src/ruvocal/src/lib/migrations/routines/08-update-featured-to-review.ts +32 -32
  204. package/src/ruvocal/src/lib/migrations/routines/09-delete-empty-conversations.spec.ts +214 -214
  205. package/src/ruvocal/src/lib/migrations/routines/09-delete-empty-conversations.ts +88 -88
  206. package/src/ruvocal/src/lib/migrations/routines/10-update-reports-assistantid.ts +29 -29
  207. package/src/ruvocal/src/lib/migrations/routines/index.ts +15 -15
  208. package/src/ruvocal/src/lib/server/__tests__/conversation-stop-generating.spec.ts +103 -103
  209. package/src/ruvocal/src/lib/server/abortRegistry.ts +57 -57
  210. package/src/ruvocal/src/lib/server/abortedGenerations.ts +43 -43
  211. package/src/ruvocal/src/lib/server/adminToken.ts +62 -62
  212. package/src/ruvocal/src/lib/server/api/__tests__/conversations-id.spec.ts +296 -296
  213. package/src/ruvocal/src/lib/server/api/__tests__/conversations-message.spec.ts +216 -216
  214. package/src/ruvocal/src/lib/server/api/__tests__/conversations.spec.ts +235 -235
  215. package/src/ruvocal/src/lib/server/api/__tests__/misc.spec.ts +72 -72
  216. package/src/ruvocal/src/lib/server/api/__tests__/testHelpers.ts +86 -86
  217. package/src/ruvocal/src/lib/server/api/__tests__/user-reports.spec.ts +78 -78
  218. package/src/ruvocal/src/lib/server/api/__tests__/user.spec.ts +239 -239
  219. package/src/ruvocal/src/lib/server/api/types.ts +37 -37
  220. package/src/ruvocal/src/lib/server/api/utils/requireAuth.ts +22 -22
  221. package/src/ruvocal/src/lib/server/api/utils/resolveConversation.ts +69 -69
  222. package/src/ruvocal/src/lib/server/api/utils/resolveModel.ts +27 -27
  223. package/src/ruvocal/src/lib/server/api/utils/superjsonResponse.ts +15 -15
  224. package/src/ruvocal/src/lib/server/apiToken.ts +11 -11
  225. package/src/ruvocal/src/lib/server/auth.ts +554 -554
  226. package/src/ruvocal/src/lib/server/config.ts +187 -187
  227. package/src/ruvocal/src/lib/server/conversation.ts +83 -83
  228. package/src/ruvocal/src/lib/server/database/__tests__/rvf.spec.ts +709 -709
  229. package/src/ruvocal/src/lib/server/database/postgres.ts +700 -700
  230. package/src/ruvocal/src/lib/server/database/rvf.ts +1078 -1078
  231. package/src/ruvocal/src/lib/server/database.ts +145 -145
  232. package/src/ruvocal/src/lib/server/endpoints/document.ts +68 -68
  233. package/src/ruvocal/src/lib/server/endpoints/endpoints.ts +43 -43
  234. package/src/ruvocal/src/lib/server/endpoints/images.ts +211 -211
  235. package/src/ruvocal/src/lib/server/endpoints/openai/endpointOai.ts +266 -266
  236. package/src/ruvocal/src/lib/server/endpoints/openai/openAIChatToTextGenerationStream.ts +212 -212
  237. package/src/ruvocal/src/lib/server/endpoints/openai/openAICompletionToTextGenerationStream.ts +32 -32
  238. package/src/ruvocal/src/lib/server/endpoints/preprocessMessages.ts +61 -61
  239. package/src/ruvocal/src/lib/server/exitHandler.ts +59 -59
  240. package/src/ruvocal/src/lib/server/files/downloadFile.ts +34 -34
  241. package/src/ruvocal/src/lib/server/files/uploadFile.ts +29 -29
  242. package/src/ruvocal/src/lib/server/findRepoRoot.ts +13 -13
  243. package/src/ruvocal/src/lib/server/generateFromDefaultEndpoint.ts +46 -46
  244. package/src/ruvocal/src/lib/server/hooks/error.ts +37 -37
  245. package/src/ruvocal/src/lib/server/hooks/fetch.ts +22 -22
  246. package/src/ruvocal/src/lib/server/hooks/handle.ts +250 -250
  247. package/src/ruvocal/src/lib/server/hooks/init.ts +51 -51
  248. package/src/ruvocal/src/lib/server/isURLLocal.spec.ts +31 -31
  249. package/src/ruvocal/src/lib/server/isURLLocal.ts +74 -74
  250. package/src/ruvocal/src/lib/server/logger.ts +42 -42
  251. package/src/ruvocal/src/lib/server/mcp/clientPool.spec.ts +175 -175
  252. package/src/ruvocal/src/lib/server/mcp/hf.ts +32 -32
  253. package/src/ruvocal/src/lib/server/mcp/httpClient.ts +122 -122
  254. package/src/ruvocal/src/lib/server/mcp/registry.ts +76 -76
  255. package/src/ruvocal/src/lib/server/mcp/tools.ts +196 -196
  256. package/src/ruvocal/src/lib/server/metrics.ts +255 -255
  257. package/src/ruvocal/src/lib/server/models.ts +518 -518
  258. package/src/ruvocal/src/lib/server/requestContext.ts +55 -55
  259. package/src/ruvocal/src/lib/server/router/arch.ts +230 -230
  260. package/src/ruvocal/src/lib/server/router/endpoint.ts +316 -316
  261. package/src/ruvocal/src/lib/server/router/multimodal.ts +28 -28
  262. package/src/ruvocal/src/lib/server/router/policy.ts +49 -49
  263. package/src/ruvocal/src/lib/server/router/toolsRoute.ts +51 -51
  264. package/src/ruvocal/src/lib/server/router/types.ts +21 -21
  265. package/src/ruvocal/src/lib/server/sendSlack.ts +23 -23
  266. package/src/ruvocal/src/lib/server/textGeneration/generate.ts +258 -258
  267. package/src/ruvocal/src/lib/server/textGeneration/index.ts +96 -96
  268. package/src/ruvocal/src/lib/server/textGeneration/mcp/fileRefs.ts +155 -155
  269. package/src/ruvocal/src/lib/server/textGeneration/mcp/routerResolution.ts +108 -108
  270. package/src/ruvocal/src/lib/server/textGeneration/mcp/runMcpFlow.ts +831 -831
  271. package/src/ruvocal/src/lib/server/textGeneration/mcp/toolInvocation.ts +349 -349
  272. package/src/ruvocal/src/lib/server/textGeneration/mcp/wasmTools.test.ts +633 -633
  273. package/src/ruvocal/src/lib/server/textGeneration/reasoning.ts +23 -23
  274. package/src/ruvocal/src/lib/server/textGeneration/title.ts +83 -83
  275. package/src/ruvocal/src/lib/server/textGeneration/types.ts +28 -28
  276. package/src/ruvocal/src/lib/server/textGeneration/utils/prepareFiles.ts +88 -88
  277. package/src/ruvocal/src/lib/server/textGeneration/utils/routing.ts +21 -21
  278. package/src/ruvocal/src/lib/server/textGeneration/utils/toolPrompt.ts +49 -49
  279. package/src/ruvocal/src/lib/server/urlSafety.ts +77 -77
  280. package/src/ruvocal/src/lib/server/usageLimits.ts +30 -30
  281. package/src/ruvocal/src/lib/stores/autopilotStore.svelte.ts +175 -175
  282. package/src/ruvocal/src/lib/stores/backgroundGenerations.svelte.ts +32 -32
  283. package/src/ruvocal/src/lib/stores/backgroundGenerations.ts +1 -1
  284. package/src/ruvocal/src/lib/stores/errors.ts +9 -9
  285. package/src/ruvocal/src/lib/stores/isAborted.ts +3 -3
  286. package/src/ruvocal/src/lib/stores/isPro.ts +4 -4
  287. package/src/ruvocal/src/lib/stores/loading.ts +3 -3
  288. package/src/ruvocal/src/lib/stores/mcpServers.ts +534 -534
  289. package/src/ruvocal/src/lib/stores/pendingChatInput.ts +3 -3
  290. package/src/ruvocal/src/lib/stores/pendingMessage.ts +9 -9
  291. package/src/ruvocal/src/lib/stores/settings.ts +182 -182
  292. package/src/ruvocal/src/lib/stores/shareModal.ts +13 -13
  293. package/src/ruvocal/src/lib/stores/titleUpdate.ts +8 -8
  294. package/src/ruvocal/src/lib/stores/wasmMcp.ts +472 -472
  295. package/src/ruvocal/src/lib/switchTheme.ts +124 -124
  296. package/src/ruvocal/src/lib/types/AbortedGeneration.ts +8 -8
  297. package/src/ruvocal/src/lib/types/Assistant.ts +31 -31
  298. package/src/ruvocal/src/lib/types/AssistantStats.ts +11 -11
  299. package/src/ruvocal/src/lib/types/ConfigKey.ts +4 -4
  300. package/src/ruvocal/src/lib/types/ConvSidebar.ts +9 -9
  301. package/src/ruvocal/src/lib/types/Conversation.ts +27 -27
  302. package/src/ruvocal/src/lib/types/ConversationStats.ts +13 -13
  303. package/src/ruvocal/src/lib/types/Message.ts +41 -41
  304. package/src/ruvocal/src/lib/types/MessageEvent.ts +10 -10
  305. package/src/ruvocal/src/lib/types/MessageUpdate.ts +139 -139
  306. package/src/ruvocal/src/lib/types/MigrationResult.ts +7 -7
  307. package/src/ruvocal/src/lib/types/Model.ts +23 -23
  308. package/src/ruvocal/src/lib/types/Report.ts +12 -12
  309. package/src/ruvocal/src/lib/types/Review.ts +6 -6
  310. package/src/ruvocal/src/lib/types/Semaphore.ts +19 -19
  311. package/src/ruvocal/src/lib/types/Session.ts +22 -22
  312. package/src/ruvocal/src/lib/types/Settings.ts +93 -93
  313. package/src/ruvocal/src/lib/types/SharedConversation.ts +9 -9
  314. package/src/ruvocal/src/lib/types/Template.ts +6 -6
  315. package/src/ruvocal/src/lib/types/Timestamps.ts +4 -4
  316. package/src/ruvocal/src/lib/types/TokenCache.ts +6 -6
  317. package/src/ruvocal/src/lib/types/Tool.ts +77 -77
  318. package/src/ruvocal/src/lib/types/UrlDependency.ts +5 -5
  319. package/src/ruvocal/src/lib/types/User.ts +14 -14
  320. package/src/ruvocal/src/lib/utils/PublicConfig.svelte.ts +75 -75
  321. package/src/ruvocal/src/lib/utils/auth.ts +17 -17
  322. package/src/ruvocal/src/lib/utils/chunk.ts +33 -33
  323. package/src/ruvocal/src/lib/utils/cookiesAreEnabled.ts +13 -13
  324. package/src/ruvocal/src/lib/utils/debounce.ts +17 -17
  325. package/src/ruvocal/src/lib/utils/deepestChild.ts +6 -6
  326. package/src/ruvocal/src/lib/utils/favicon.ts +21 -21
  327. package/src/ruvocal/src/lib/utils/fetchJSON.ts +23 -23
  328. package/src/ruvocal/src/lib/utils/file2base64.ts +14 -14
  329. package/src/ruvocal/src/lib/utils/formatUserCount.ts +37 -37
  330. package/src/ruvocal/src/lib/utils/generationState.spec.ts +75 -75
  331. package/src/ruvocal/src/lib/utils/generationState.ts +26 -26
  332. package/src/ruvocal/src/lib/utils/getHref.ts +41 -41
  333. package/src/ruvocal/src/lib/utils/getReturnFromGenerator.ts +7 -7
  334. package/src/ruvocal/src/lib/utils/haptics.ts +64 -64
  335. package/src/ruvocal/src/lib/utils/hashConv.ts +12 -12
  336. package/src/ruvocal/src/lib/utils/hf.ts +17 -17
  337. package/src/ruvocal/src/lib/utils/isDesktop.ts +7 -7
  338. package/src/ruvocal/src/lib/utils/isUrl.ts +8 -8
  339. package/src/ruvocal/src/lib/utils/isVirtualKeyboard.ts +16 -16
  340. package/src/ruvocal/src/lib/utils/loadAttachmentsFromUrls.ts +115 -115
  341. package/src/ruvocal/src/lib/utils/marked.spec.ts +96 -96
  342. package/src/ruvocal/src/lib/utils/marked.ts +531 -531
  343. package/src/ruvocal/src/lib/utils/mcpValidation.ts +147 -147
  344. package/src/ruvocal/src/lib/utils/mergeAsyncGenerators.ts +38 -38
  345. package/src/ruvocal/src/lib/utils/messageUpdates.spec.ts +262 -262
  346. package/src/ruvocal/src/lib/utils/messageUpdates.ts +324 -324
  347. package/src/ruvocal/src/lib/utils/mime.ts +56 -56
  348. package/src/ruvocal/src/lib/utils/models.ts +14 -14
  349. package/src/ruvocal/src/lib/utils/parseBlocks.ts +120 -120
  350. package/src/ruvocal/src/lib/utils/parseIncompleteMarkdown.ts +644 -644
  351. package/src/ruvocal/src/lib/utils/parseStringToList.ts +10 -10
  352. package/src/ruvocal/src/lib/utils/randomUuid.ts +14 -14
  353. package/src/ruvocal/src/lib/utils/searchTokens.ts +33 -33
  354. package/src/ruvocal/src/lib/utils/sha256.ts +7 -7
  355. package/src/ruvocal/src/lib/utils/stringifyError.ts +12 -12
  356. package/src/ruvocal/src/lib/utils/sum.ts +3 -3
  357. package/src/ruvocal/src/lib/utils/template.spec.ts +59 -59
  358. package/src/ruvocal/src/lib/utils/template.ts +53 -53
  359. package/src/ruvocal/src/lib/utils/timeout.ts +9 -9
  360. package/src/ruvocal/src/lib/utils/toolProgress.spec.ts +46 -46
  361. package/src/ruvocal/src/lib/utils/toolProgress.ts +11 -11
  362. package/src/ruvocal/src/lib/utils/tree/addChildren.spec.ts +102 -102
  363. package/src/ruvocal/src/lib/utils/tree/addChildren.ts +48 -48
  364. package/src/ruvocal/src/lib/utils/tree/addSibling.spec.ts +81 -81
  365. package/src/ruvocal/src/lib/utils/tree/addSibling.ts +41 -41
  366. package/src/ruvocal/src/lib/utils/tree/buildSubtree.spec.ts +110 -110
  367. package/src/ruvocal/src/lib/utils/tree/buildSubtree.ts +24 -24
  368. package/src/ruvocal/src/lib/utils/tree/convertLegacyConversation.spec.ts +31 -31
  369. package/src/ruvocal/src/lib/utils/tree/convertLegacyConversation.ts +36 -36
  370. package/src/ruvocal/src/lib/utils/tree/isMessageId.spec.ts +15 -15
  371. package/src/ruvocal/src/lib/utils/tree/isMessageId.ts +5 -5
  372. package/src/ruvocal/src/lib/utils/tree/tree.d.ts +14 -14
  373. package/src/ruvocal/src/lib/utils/tree/treeHelpers.spec.ts +167 -167
  374. package/src/ruvocal/src/lib/utils/updates.ts +39 -39
  375. package/src/ruvocal/src/lib/utils/urlParams.ts +13 -13
  376. package/src/ruvocal/src/lib/wasm/idb.ts +438 -438
  377. package/src/ruvocal/src/lib/wasm/index.ts +1213 -1213
  378. package/src/ruvocal/src/lib/wasm/tests/wasm-capabilities.test.ts +565 -565
  379. package/src/ruvocal/src/lib/wasm/wasm.worker.ts +332 -332
  380. package/src/ruvocal/src/lib/wasm/workerClient.ts +166 -166
  381. package/src/ruvocal/src/lib/workers/autopilotWorker.ts +221 -221
  382. package/src/ruvocal/src/lib/workers/detailFetchWorker.ts +100 -100
  383. package/src/ruvocal/src/lib/workers/markdownWorker.ts +61 -61
  384. package/src/ruvocal/src/routes/+error.svelte +20 -20
  385. package/src/ruvocal/src/routes/+layout.svelte +324 -324
  386. package/src/ruvocal/src/routes/+layout.ts +91 -91
  387. package/src/ruvocal/src/routes/+page.svelte +168 -168
  388. package/src/ruvocal/src/routes/.well-known/oauth-cimd/+server.ts +37 -37
  389. package/src/ruvocal/src/routes/__debug/openai/+server.ts +21 -21
  390. package/src/ruvocal/src/routes/admin/export/+server.ts +159 -159
  391. package/src/ruvocal/src/routes/admin/stats/compute/+server.ts +16 -16
  392. package/src/ruvocal/src/routes/api/conversation/[id]/+server.ts +40 -40
  393. package/src/ruvocal/src/routes/api/conversation/[id]/message/[messageId]/+server.ts +42 -42
  394. package/src/ruvocal/src/routes/api/conversations/+server.ts +48 -48
  395. package/src/ruvocal/src/routes/api/fetch-url/+server.ts +147 -147
  396. package/src/ruvocal/src/routes/api/mcp/health/+server.ts +292 -292
  397. package/src/ruvocal/src/routes/api/mcp/servers/+server.ts +32 -32
  398. package/src/ruvocal/src/routes/api/models/+server.ts +25 -25
  399. package/src/ruvocal/src/routes/api/transcribe/+server.ts +104 -104
  400. package/src/ruvocal/src/routes/api/user/+server.ts +15 -15
  401. package/src/ruvocal/src/routes/api/user/validate-token/+server.ts +20 -20
  402. package/src/ruvocal/src/routes/api/v2/conversations/+server.ts +48 -48
  403. package/src/ruvocal/src/routes/api/v2/conversations/[id]/+server.ts +94 -94
  404. package/src/ruvocal/src/routes/api/v2/conversations/[id]/message/[messageId]/+server.ts +43 -43
  405. package/src/ruvocal/src/routes/api/v2/conversations/import-share/+server.ts +23 -23
  406. package/src/ruvocal/src/routes/api/v2/debug/config/+server.ts +16 -16
  407. package/src/ruvocal/src/routes/api/v2/debug/refresh/+server.ts +30 -30
  408. package/src/ruvocal/src/routes/api/v2/export/+server.ts +196 -196
  409. package/src/ruvocal/src/routes/api/v2/feature-flags/+server.ts +14 -14
  410. package/src/ruvocal/src/routes/api/v2/models/+server.ts +38 -38
  411. package/src/ruvocal/src/routes/api/v2/models/[namespace]/+server.ts +8 -8
  412. package/src/ruvocal/src/routes/api/v2/models/[namespace]/[model]/+server.ts +8 -8
  413. package/src/ruvocal/src/routes/api/v2/models/[namespace]/[model]/subscribe/+server.ts +28 -28
  414. package/src/ruvocal/src/routes/api/v2/models/[namespace]/subscribe/+server.ts +28 -28
  415. package/src/ruvocal/src/routes/api/v2/models/old/+server.ts +7 -7
  416. package/src/ruvocal/src/routes/api/v2/models/refresh/+server.ts +33 -33
  417. package/src/ruvocal/src/routes/api/v2/public-config/+server.ts +7 -7
  418. package/src/ruvocal/src/routes/api/v2/user/+server.ts +17 -17
  419. package/src/ruvocal/src/routes/api/v2/user/billing-orgs/+server.ts +73 -73
  420. package/src/ruvocal/src/routes/api/v2/user/reports/+server.ts +17 -17
  421. package/src/ruvocal/src/routes/api/v2/user/settings/+server.ts +110 -110
  422. package/src/ruvocal/src/routes/conversation/+server.ts +115 -115
  423. package/src/ruvocal/src/routes/conversation/[id]/+page.svelte +586 -586
  424. package/src/ruvocal/src/routes/conversation/[id]/+page.ts +60 -60
  425. package/src/ruvocal/src/routes/conversation/[id]/+server.ts +740 -740
  426. package/src/ruvocal/src/routes/conversation/[id]/message/[messageId]/prompt/+server.ts +66 -66
  427. package/src/ruvocal/src/routes/conversation/[id]/share/+server.ts +69 -69
  428. package/src/ruvocal/src/routes/conversation/[id]/stop-generating/+server.ts +35 -35
  429. package/src/ruvocal/src/routes/healthcheck/+server.ts +3 -3
  430. package/src/ruvocal/src/routes/login/+server.ts +5 -5
  431. package/src/ruvocal/src/routes/login/callback/+server.ts +103 -103
  432. package/src/ruvocal/src/routes/login/callback/updateUser.spec.ts +157 -157
  433. package/src/ruvocal/src/routes/login/callback/updateUser.ts +215 -215
  434. package/src/ruvocal/src/routes/logout/+server.ts +18 -18
  435. package/src/ruvocal/src/routes/metrics/+server.ts +18 -18
  436. package/src/ruvocal/src/routes/models/+page.svelte +233 -233
  437. package/src/ruvocal/src/routes/models/[...model]/+page.svelte +161 -161
  438. package/src/ruvocal/src/routes/models/[...model]/+page.ts +14 -14
  439. package/src/ruvocal/src/routes/models/[...model]/thumbnail.png/+server.ts +64 -64
  440. package/src/ruvocal/src/routes/models/[...model]/thumbnail.png/ModelThumbnail.svelte +28 -28
  441. package/src/ruvocal/src/routes/privacy/+page.svelte +11 -11
  442. package/src/ruvocal/src/routes/r/[id]/+page.ts +34 -34
  443. package/src/ruvocal/src/routes/settings/(nav)/+layout.svelte +282 -282
  444. package/src/ruvocal/src/routes/settings/(nav)/+layout.ts +1 -1
  445. package/src/ruvocal/src/routes/settings/(nav)/+server.ts +59 -59
  446. package/src/ruvocal/src/routes/settings/(nav)/[...model]/+page.svelte +464 -464
  447. package/src/ruvocal/src/routes/settings/(nav)/[...model]/+page.ts +14 -14
  448. package/src/ruvocal/src/routes/settings/(nav)/application/+page.svelte +362 -362
  449. package/src/ruvocal/src/routes/settings/+layout.svelte +40 -40
  450. package/src/ruvocal/src/styles/highlight-js.css +195 -195
  451. package/src/ruvocal/src/styles/main.css +144 -144
  452. package/src/ruvocal/static/chatui/favicon-dark.svg +3 -3
  453. package/src/ruvocal/static/chatui/favicon-dev.svg +3 -3
  454. package/src/ruvocal/static/chatui/favicon.svg +3 -3
  455. package/src/ruvocal/static/chatui/icon.svg +3 -3
  456. package/src/ruvocal/static/chatui/logo.svg +7 -7
  457. package/src/ruvocal/static/chatui/manifest.json +54 -54
  458. package/src/ruvocal/static/chatui/welcome.js +184 -184
  459. package/src/ruvocal/static/huggingchat/favicon-dark.svg +4 -4
  460. package/src/ruvocal/static/huggingchat/favicon-dev.svg +4 -4
  461. package/src/ruvocal/static/huggingchat/favicon.svg +4 -4
  462. package/src/ruvocal/static/huggingchat/fulltext-logo.svg +1 -1
  463. package/src/ruvocal/static/huggingchat/icon.svg +4 -4
  464. package/src/ruvocal/static/huggingchat/logo.svg +4 -4
  465. package/src/ruvocal/static/huggingchat/manifest.json +54 -54
  466. package/src/ruvocal/static/huggingchat/routes.chat.json +226 -226
  467. package/src/ruvocal/static/robots.txt +10 -10
  468. package/src/ruvocal/static/wasm/rvagent_wasm.js +1539 -1539
  469. package/src/ruvocal/stub/@reflink/reflink/package.json +5 -5
  470. package/src/ruvocal/svelte.config.js +53 -53
  471. package/src/ruvocal/tailwind.config.cjs +30 -30
  472. package/src/ruvocal/tsconfig.json +19 -19
  473. package/src/ruvocal/vite.config.ts +87 -87
  474. package/src/scripts/deploy.sh +116 -116
  475. package/src/scripts/generate-config.js +245 -245
  476. package/src/scripts/generate-welcome.js +187 -187
  477. package/src/scripts/package-rvf.sh +116 -116
  478. package/src/ruvocal/.claude-flow/daemon-state.json +0 -135
  479. package/src/ruvocal/.claude-flow/data/pending-insights.jsonl +0 -0
  480. package/src/ruvocal/.claude-flow/data/ranked-context.json +0 -5
  481. package/src/ruvocal/.claude-flow/logs/daemon.log +0 -31
  482. package/src/ruvocal/.claude-flow/logs/headless/audit_1777949411822_juxau0_prompt.log +0 -989
  483. package/src/ruvocal/.claude-flow/logs/headless/audit_1777949411822_juxau0_result.log +0 -67
  484. package/src/ruvocal/.claude-flow/logs/headless/audit_1777950042278_jvj5xq_prompt.log +0 -989
  485. package/src/ruvocal/.claude-flow/logs/headless/audit_1777950042278_jvj5xq_result.log +0 -93
  486. package/src/ruvocal/.claude-flow/logs/headless/optimize_1777949531823_yt5yc2_prompt.log +0 -1498
  487. package/src/ruvocal/.claude-flow/logs/headless/optimize_1777949531823_yt5yc2_result.log +0 -93
  488. package/src/ruvocal/.claude-flow/logs/headless/testgaps_1777949771821_elw1j4_prompt.log +0 -1498
  489. package/src/ruvocal/.claude-flow/logs/headless/testgaps_1777949771821_elw1j4_result.log +0 -100
  490. package/src/ruvocal/.claude-flow/metrics/codebase-map.json +0 -11
  491. package/src/ruvocal/.claude-flow/metrics/consolidation.json +0 -6
  492. package/src/ruvocal/.claude-flow/neural/stats.json +0 -6
  493. package/src/ruvocal/.claude-flow/sessions/current.json +0 -13
  494. package/src/ruvocal/.swarm/attestation.db +0 -0
  495. package/src/ruvocal/.swarm/hnsw.index +0 -0
  496. package/src/ruvocal/.swarm/hnsw.metadata.json +0 -1
  497. package/src/ruvocal/.swarm/memory.db +0 -0
  498. package/src/ruvocal/.swarm/schema.sql +0 -305
@@ -1,740 +1,740 @@
1
- import { authCondition } from "$lib/server/auth";
2
- import { collections } from "$lib/server/database";
3
- import { config } from "$lib/server/config";
4
- import { models, validModelIdSchema } from "$lib/server/models";
5
- import { ERROR_MESSAGES } from "$lib/stores/errors";
6
- import type { Message } from "$lib/types/Message";
7
- import { error } from "@sveltejs/kit";
8
- import { ObjectId } from "mongodb";
9
- import { z } from "zod";
10
- import {
11
- MessageUpdateStatus,
12
- MessageUpdateType,
13
- MessageReasoningUpdateType,
14
- type MessageUpdate,
15
- type MessageStreamUpdate,
16
- } from "$lib/types/MessageUpdate";
17
- import { uploadFile } from "$lib/server/files/uploadFile";
18
- import { convertLegacyConversation } from "$lib/utils/tree/convertLegacyConversation";
19
- import { isMessageId } from "$lib/utils/tree/isMessageId";
20
- import { buildSubtree } from "$lib/utils/tree/buildSubtree.js";
21
- import { addChildren } from "$lib/utils/tree/addChildren.js";
22
- import { addSibling } from "$lib/utils/tree/addSibling.js";
23
- import { usageLimits } from "$lib/server/usageLimits";
24
- import { textGeneration } from "$lib/server/textGeneration";
25
- import type { TextGenerationContext } from "$lib/server/textGeneration/types";
26
- import { logger } from "$lib/server/logger.js";
27
- import { AbortRegistry } from "$lib/server/abortRegistry";
28
- import { MetricsServer } from "$lib/server/metrics";
29
-
30
- export async function POST({ request, locals, params, getClientAddress }) {
31
- const id = z.string().parse(params.id);
32
- const convId = new ObjectId(id);
33
- const promptedAt = new Date();
34
-
35
- const userId = locals.user?._id ?? locals.sessionId;
36
-
37
- // check user
38
- if (!userId) {
39
- error(401, "Unauthorized");
40
- }
41
-
42
- // check if the user has access to the conversation
43
- const convBeforeCheck = await collections.conversations.findOne({
44
- _id: convId,
45
- ...authCondition(locals),
46
- });
47
-
48
- if (convBeforeCheck && !convBeforeCheck.rootMessageId) {
49
- const res = await collections.conversations.updateOne(
50
- {
51
- _id: convId,
52
- },
53
- {
54
- $set: {
55
- ...convBeforeCheck,
56
- ...convertLegacyConversation(convBeforeCheck),
57
- },
58
- }
59
- );
60
-
61
- if (!res.acknowledged) {
62
- error(500, "Failed to convert conversation");
63
- }
64
- }
65
-
66
- const conv = await collections.conversations.findOne({
67
- _id: convId,
68
- ...authCondition(locals),
69
- });
70
-
71
- if (!conv) {
72
- error(404, "Conversation not found");
73
- }
74
-
75
- // register the event for ratelimiting
76
- await collections.messageEvents.insertOne({
77
- type: "message",
78
- userId,
79
- createdAt: new Date(),
80
- expiresAt: new Date(Date.now() + 60_000),
81
- ip: getClientAddress(),
82
- });
83
-
84
- if (usageLimits?.messagesPerMinute) {
85
- // check if the user is rate limited
86
- const nEvents = Math.max(
87
- await collections.messageEvents.countDocuments({
88
- userId,
89
- type: "message",
90
- expiresAt: { $gt: new Date() },
91
- }),
92
- await collections.messageEvents.countDocuments({
93
- ip: getClientAddress(),
94
- type: "message",
95
- expiresAt: { $gt: new Date() },
96
- })
97
- );
98
- if (nEvents > usageLimits.messagesPerMinute) {
99
- error(429, ERROR_MESSAGES.rateLimited);
100
- }
101
- }
102
-
103
- if (usageLimits?.messages && conv.messages.length > usageLimits.messages) {
104
- error(
105
- 429,
106
- `This conversation has more than ${usageLimits.messages} messages. Start a new one to continue`
107
- );
108
- }
109
-
110
- // fetch the model
111
- const model = models.find((m) => m.id === conv.model);
112
-
113
- if (!model) {
114
- error(410, "Model not available anymore");
115
- }
116
-
117
- // finally parse the content of the request
118
- const form = await request.formData();
119
-
120
- const json = form.get("data");
121
-
122
- if (!json || typeof json !== "string") {
123
- error(400, "Invalid request");
124
- }
125
-
126
- const {
127
- inputs: newPrompt,
128
- id: messageId,
129
- is_retry: isRetry,
130
- selectedMcpServerNames,
131
- selectedMcpServers,
132
- autopilot,
133
- autopilotMaxSteps,
134
- } = z
135
- .object({
136
- id: z.string().uuid().refine(isMessageId).optional(), // parent message id to append to for a normal message, or the message id for a retry/continue
137
- inputs: z.optional(
138
- z
139
- .string()
140
- .min(1)
141
- .transform((s) => s.replace(/\r\n/g, "\n"))
142
- ),
143
- is_retry: z.optional(z.boolean()),
144
- autopilot: z.optional(z.boolean()),
145
- // User-configurable cap on autopilot tool-call loops. Server clamps to [1, 100].
146
- autopilotMaxSteps: z.optional(z.number().int().min(1).max(100)),
147
- selectedMcpServerNames: z.optional(z.array(z.string())),
148
- selectedMcpServers: z
149
- .optional(
150
- z.array(
151
- z.object({
152
- name: z.string(),
153
- url: z.string(),
154
- headers: z
155
- .optional(z.array(z.object({ key: z.string(), value: z.string() })))
156
- .default([]),
157
- })
158
- )
159
- )
160
- .default([]),
161
- files: z.optional(
162
- z.array(
163
- z.object({
164
- type: z.literal("base64").or(z.literal("hash")),
165
- name: z.string(),
166
- value: z.string(),
167
- mime: z.string(),
168
- })
169
- )
170
- ),
171
- })
172
- .parse(JSON.parse(json));
173
-
174
- // Attach MCP selection to locals so the text generation pipeline can consume it
175
- try {
176
- (locals as unknown as Record<string, unknown>).mcp = {
177
- selectedServerNames: selectedMcpServerNames,
178
- selectedServers: (selectedMcpServers ?? []).map((s) => ({
179
- name: s.name,
180
- url: s.url,
181
- headers:
182
- s.headers && s.headers.length > 0
183
- ? Object.fromEntries(s.headers.map((h) => [h.key, h.value]))
184
- : undefined,
185
- })),
186
- };
187
- } catch {
188
- // ignore attachment errors, pipeline will just use env servers
189
- }
190
-
191
- const inputFiles = await Promise.all(
192
- form
193
- .getAll("files")
194
- .filter((entry): entry is File => entry instanceof File && entry.size > 0)
195
- .map(async (file) => {
196
- const [type, ...name] = file.name.split(";");
197
-
198
- return {
199
- type: z.literal("base64").or(z.literal("hash")).parse(type),
200
- value: await file.text(),
201
- mime: file.type,
202
- name: name.join(";"),
203
- };
204
- })
205
- );
206
-
207
- if (usageLimits?.messageLength && (newPrompt?.length ?? 0) > usageLimits.messageLength) {
208
- error(400, "Message too long.");
209
- }
210
-
211
- // each file is either:
212
- // base64 string requiring upload to the server
213
- // hash pointing to an existing file
214
- const hashFiles = inputFiles?.filter((file) => file.type === "hash") ?? [];
215
- const b64Files =
216
- inputFiles
217
- ?.filter((file) => file.type !== "hash")
218
- .map((file) => {
219
- const blob = Buffer.from(file.value, "base64");
220
- return new File([blob], file.name, { type: file.mime });
221
- }) ?? [];
222
-
223
- // check sizes
224
- // todo: make configurable
225
- if (b64Files.some((file) => file.size > 10 * 1024 * 1024)) {
226
- error(413, "File too large, should be <10MB");
227
- }
228
-
229
- const uploadedFiles = await Promise.all(b64Files.map((file) => uploadFile(file, conv))).then(
230
- (files) => [...files, ...hashFiles]
231
- );
232
-
233
- // we will append tokens to the content of this message
234
- let messageToWriteToId: Message["id"] | undefined = undefined;
235
- // used for building the prompt, subtree of the conversation that goes from the latest message to the root
236
- let messagesForPrompt: Message[] = [];
237
-
238
- if (isRetry && messageId) {
239
- // two cases, if we're retrying a user message with a newPrompt set,
240
- // it means we're editing a user message
241
- // if we're retrying on an assistant message, newPrompt cannot be set
242
- // it means we're retrying the last assistant message for a new answer
243
-
244
- const messageToRetry = conv.messages.find((message) => message.id === messageId);
245
-
246
- if (!messageToRetry) {
247
- error(404, "Message not found");
248
- }
249
-
250
- if (messageToRetry.from === "user" && newPrompt) {
251
- // add a sibling to this message from the user, with the alternative prompt
252
- // add a children to that sibling, where we can write to
253
- const newUserMessageId = addSibling(
254
- conv,
255
- {
256
- from: "user",
257
- content: newPrompt,
258
- files: uploadedFiles,
259
- createdAt: new Date(),
260
- updatedAt: new Date(),
261
- },
262
- messageId
263
- );
264
- messageToWriteToId = addChildren(
265
- conv,
266
- {
267
- from: "assistant",
268
- content: "",
269
- createdAt: new Date(),
270
- updatedAt: new Date(),
271
- },
272
- newUserMessageId
273
- );
274
- messagesForPrompt = buildSubtree(conv, newUserMessageId);
275
- } else if (messageToRetry.from === "assistant") {
276
- // we're retrying an assistant message, to generate a new answer
277
- // just add a sibling to the assistant answer where we can write to
278
- messageToWriteToId = addSibling(
279
- conv,
280
- { from: "assistant", content: "", createdAt: new Date(), updatedAt: new Date() },
281
- messageId
282
- );
283
- messagesForPrompt = buildSubtree(conv, messageId);
284
- messagesForPrompt.pop(); // don't need the latest assistant message in the prompt since we're retrying it
285
- }
286
- } else {
287
- // just a normal linear conversation, so we add the user message
288
- // and the blank assistant message back to back
289
- const newUserMessageId = addChildren(
290
- conv,
291
- {
292
- from: "user",
293
- content: newPrompt ?? "",
294
- files: uploadedFiles,
295
- createdAt: new Date(),
296
- updatedAt: new Date(),
297
- },
298
- messageId
299
- );
300
-
301
- messageToWriteToId = addChildren(
302
- conv,
303
- {
304
- from: "assistant",
305
- content: "",
306
- createdAt: new Date(),
307
- updatedAt: new Date(),
308
- },
309
- newUserMessageId
310
- );
311
- // build the prompt from the user message
312
- messagesForPrompt = buildSubtree(conv, newUserMessageId);
313
- }
314
-
315
- const messageToWriteTo = conv.messages.find((message) => message.id === messageToWriteToId);
316
- if (!messageToWriteTo) {
317
- error(500, "Failed to create message");
318
- }
319
- if (messagesForPrompt.length === 0) {
320
- error(500, "Failed to create prompt");
321
- }
322
-
323
- // update the conversation with the new messages
324
- await collections.conversations.updateOne(
325
- { _id: convId },
326
- { $set: { messages: conv.messages, title: conv.title, updatedAt: new Date() } }
327
- );
328
-
329
- let doneStreaming = false;
330
- let clientDetached = false;
331
-
332
- let lastTokenTimestamp: undefined | Date = undefined;
333
- let firstTokenObserved = false;
334
- const metricsEnabled = MetricsServer.isEnabled();
335
- const metrics = metricsEnabled ? MetricsServer.getMetrics() : undefined;
336
- const metricsModelId = model.id ?? model.name ?? conv.model;
337
- const metricsLabels = { model: metricsModelId };
338
-
339
- const persistConversation = async () => {
340
- const messagesForSave = conv.messages.map((msg) => {
341
- const filteredUpdates =
342
- msg.updates
343
- ?.filter(
344
- (u) =>
345
- !(u.type === MessageUpdateType.Status && u.status === MessageUpdateStatus.KeepAlive)
346
- )
347
- .map((u) => {
348
- if (u.type !== MessageUpdateType.Stream) return u;
349
- // Preserve existing len if already compressed, otherwise compute from token
350
- const len = u.len ?? (u.token ?? "").length;
351
- // store a lightweight marker to preserve ordering without duplicating content
352
- return { type: MessageUpdateType.Stream, token: "", len } satisfies MessageStreamUpdate;
353
- }) ?? [];
354
-
355
- return { ...msg, updates: filteredUpdates };
356
- });
357
-
358
- await collections.conversations.updateOne(
359
- { _id: convId },
360
- { $set: { messages: messagesForSave, title: conv.title, updatedAt: new Date() } }
361
- );
362
- };
363
-
364
- const abortRegistry = AbortRegistry.getInstance();
365
-
366
- // we now build the stream
367
- const stream = new ReadableStream({
368
- async start(controller) {
369
- const conversationKey = convId.toString();
370
- const ctrl = new AbortController();
371
- abortRegistry.register(conversationKey, ctrl);
372
-
373
- let finalAnswerReceived = false;
374
- let abortedByUser = false;
375
- let finishedStatusSent = false;
376
-
377
- messageToWriteTo.updates ??= [];
378
- async function update(event: MessageUpdate) {
379
- if (!messageToWriteTo || !conv) {
380
- throw Error("No message or conversation to write events to");
381
- }
382
-
383
- if (
384
- event.type === MessageUpdateType.Status &&
385
- event.status === MessageUpdateStatus.Finished
386
- ) {
387
- finishedStatusSent = true;
388
- }
389
-
390
- // Add token to content or skip if empty
391
- if (event.type === MessageUpdateType.Stream) {
392
- if (event.token === "") return;
393
- messageToWriteTo.content += event.token;
394
-
395
- if (metricsEnabled && metrics) {
396
- const now = Date.now();
397
- metrics.model.tokenCountTotal.inc(metricsLabels);
398
-
399
- if (!firstTokenObserved) {
400
- metrics.model.timeToFirstToken.observe(metricsLabels, now - promptedAt.getTime());
401
- firstTokenObserved = true;
402
- }
403
-
404
- const previousTimestamp = lastTokenTimestamp
405
- ? lastTokenTimestamp.getTime()
406
- : promptedAt.getTime();
407
- metrics.model.timePerOutputToken.observe(metricsLabels, now - previousTimestamp);
408
- }
409
-
410
- lastTokenTimestamp = new Date();
411
- }
412
-
413
- // Append reasoning stream tokens to message.reasoning (server-side)
414
- else if (
415
- event.type === MessageUpdateType.Reasoning &&
416
- event.subtype === MessageReasoningUpdateType.Stream &&
417
- "token" in event
418
- ) {
419
- messageToWriteTo.reasoning ??= "";
420
- messageToWriteTo.reasoning += event.token;
421
- }
422
-
423
- // Set the title
424
- else if (event.type === MessageUpdateType.Title) {
425
- // Always strip <think> markers from titles when saving
426
- const sanitizedTitle = event.title.replace(/<\/?think>/gi, "").trim();
427
- conv.title = sanitizedTitle;
428
- await collections.conversations.updateOne(
429
- { _id: convId },
430
- { $set: { title: conv?.title, updatedAt: new Date() } }
431
- );
432
- }
433
-
434
- // Set the final text and the interrupted flag
435
- else if (event.type === MessageUpdateType.FinalAnswer) {
436
- messageToWriteTo.interrupted = event.interrupted;
437
- // Default behavior: replace the streamed text with the provider's final text.
438
- // However, when tools (MCP/function calls) were used, providers often stream
439
- // some content (e.g., a story) before triggering tools, then return a
440
- // different follow‑up message afterwards (e.g., an image caption). Our
441
- // previous logic overwrote the pre‑tool content. Preserve it by merging in
442
- // the pre‑tool stream when tool updates occurred and the final text does
443
- // not already include the streamed prefix.
444
- const hadTools = (messageToWriteTo.updates ?? []).some(
445
- (u) => u.type === MessageUpdateType.Tool
446
- );
447
-
448
- if (hadTools) {
449
- const existing = messageToWriteTo.content.slice(initialMessageContent.length);
450
- if (existing && existing.length > 0) {
451
- // A. If we already streamed the same final text, keep as-is.
452
- if (event.text && existing.endsWith(event.text)) {
453
- messageToWriteTo.content = initialMessageContent + existing;
454
- }
455
- // B. If the final text already includes the streamed prefix, use it verbatim.
456
- else if (event.text && event.text.startsWith(existing)) {
457
- messageToWriteTo.content = initialMessageContent + event.text;
458
- }
459
- // C. Otherwise, merge with a paragraph break for readability.
460
- else {
461
- const needsGap = !/\n\n$/.test(existing) && !/^\n/.test(event.text ?? "");
462
- messageToWriteTo.content =
463
- initialMessageContent + existing + (needsGap ? "\n\n" : "") + (event.text ?? "");
464
- }
465
- } else {
466
- messageToWriteTo.content = initialMessageContent + (event.text ?? "");
467
- }
468
- } else {
469
- messageToWriteTo.content = initialMessageContent + event.text;
470
- }
471
- finalAnswerReceived = true;
472
-
473
- if (metricsEnabled && metrics) {
474
- metrics.model.latency.observe(metricsLabels, Date.now() - promptedAt.getTime());
475
- }
476
- }
477
-
478
- // Add file
479
- else if (event.type === MessageUpdateType.File) {
480
- messageToWriteTo.files = [
481
- ...(messageToWriteTo.files ?? []),
482
- { type: "hash", name: event.name, value: event.sha, mime: event.mime },
483
- ];
484
- }
485
-
486
- // Store router metadata (for router models) or provider info (for all models)
487
- else if (event.type === MessageUpdateType.RouterMetadata) {
488
- // Merge metadata updates to preserve existing fields (router may send route/model first, then provider comes later)
489
- if (model?.isRouter) {
490
- messageToWriteTo.routerMetadata = {
491
- route: event.route || messageToWriteTo.routerMetadata?.route || "",
492
- model: event.model || messageToWriteTo.routerMetadata?.model || "",
493
- provider: event.provider || messageToWriteTo.routerMetadata?.provider,
494
- };
495
- }
496
- // Store provider-only metadata for non-router models if available
497
- else if (event.provider) {
498
- messageToWriteTo.routerMetadata = {
499
- route: messageToWriteTo.routerMetadata?.route || "",
500
- model: messageToWriteTo.routerMetadata?.model || "",
501
- provider: event.provider,
502
- };
503
- }
504
- }
505
-
506
- // Append updates for audit/replay (streams too, to preserve ordering)
507
- if (
508
- !(
509
- event.type === MessageUpdateType.Status &&
510
- event.status === MessageUpdateStatus.KeepAlive
511
- )
512
- ) {
513
- messageToWriteTo?.updates?.push(
514
- event.type === MessageUpdateType.Stream ? { ...event } : event
515
- );
516
- }
517
-
518
- // Avoid remote keylogging attack executed by watching packet lengths
519
- // by padding the text with null chars to a fixed length
520
- // https://cdn.arstechnica.net/wp-content/uploads/2024/03/LLM-Side-Channel.pdf
521
- if (event.type === MessageUpdateType.Stream) {
522
- event = { ...event, token: event.token.padEnd(16, "\0") };
523
- }
524
-
525
- messageToWriteTo.updatedAt = new Date();
526
-
527
- const enqueueUpdate = async () => {
528
- if (clientDetached) return;
529
- try {
530
- controller.enqueue(JSON.stringify(event) + "\n");
531
- if (event.type === MessageUpdateType.FinalAnswer) {
532
- controller.enqueue(" ".repeat(4096));
533
- }
534
- } catch (err) {
535
- clientDetached = true;
536
- logger.info(
537
- { conversationId: convId.toString() },
538
- "Client detached during message streaming"
539
- );
540
- }
541
- };
542
-
543
- await enqueueUpdate();
544
-
545
- if (clientDetached) {
546
- await persistConversation();
547
- }
548
- }
549
-
550
- let hasError = false;
551
- const initialMessageContent = messageToWriteTo.content;
552
-
553
- try {
554
- // Fetch user settings once for all overrides and billing org
555
- const userSettings = await collections.settings.findOne(authCondition(locals));
556
-
557
- // Add billing organization to locals for the endpoint to use
558
- locals.billingOrganization = userSettings?.billingOrganization;
559
-
560
- const ctx: TextGenerationContext = {
561
- model,
562
- endpoint: await model.getEndpoint(),
563
- conv,
564
- messages: messagesForPrompt,
565
- assistant: undefined,
566
- promptedAt,
567
- ip: getClientAddress(),
568
- username: locals.user?.username,
569
- // Force-enable multimodal if user settings say so for this model
570
- forceMultimodal: Boolean(userSettings?.multimodalOverrides?.[model.id]),
571
- // Force-enable tools if user settings say so for this model
572
- forceTools: Boolean(userSettings?.toolsOverrides?.[model.id]),
573
- // Inference provider preference (HuggingChat only, skip for router models)
574
- provider:
575
- config.isHuggingChat && !model.isRouter
576
- ? userSettings?.providerOverrides?.[model.id]
577
- : undefined,
578
- locals,
579
- abortController: ctrl,
580
- autopilot: autopilot === true,
581
- autopilotMaxSteps,
582
- };
583
- // run the text generation and send updates to the client
584
- for await (const event of textGeneration(ctx)) await update(event);
585
- if (ctrl.signal.aborted) {
586
- abortedByUser = true;
587
- }
588
- if (abortedByUser && !finalAnswerReceived) {
589
- const partialText = messageToWriteTo.content.slice(initialMessageContent.length);
590
- await update({
591
- type: MessageUpdateType.FinalAnswer,
592
- text: partialText,
593
- interrupted: true,
594
- });
595
- }
596
- } catch (e) {
597
- const err = e as Error;
598
- const isAbortError =
599
- err?.name === "AbortError" ||
600
- err?.name === "APIUserAbortError" ||
601
- err?.message === "Request was aborted.";
602
- if (isAbortError || ctrl.signal.aborted) {
603
- abortedByUser = true;
604
- logger.info({ conversationId: conversationKey }, "Generation aborted by user");
605
- if (!finalAnswerReceived) {
606
- const partialText = messageToWriteTo.content.slice(initialMessageContent.length);
607
- await update({
608
- type: MessageUpdateType.FinalAnswer,
609
- text: partialText,
610
- interrupted: true,
611
- });
612
- }
613
- } else {
614
- hasError = true;
615
- // Extract status code if available from HTTPError or APIError
616
- const errObj = err as unknown as Record<string, unknown>;
617
- const statusCode =
618
- (typeof errObj.statusCode === "number" ? errObj.statusCode : undefined) ||
619
- (typeof errObj.status === "number" ? errObj.status : undefined);
620
- await update({
621
- type: MessageUpdateType.Status,
622
- status: MessageUpdateStatus.Error,
623
- message: err.message,
624
- ...(statusCode && { statusCode }),
625
- });
626
- logger.error(err, "Error in conversation stream");
627
- }
628
- } finally {
629
- // check if no output was generated
630
- if (!hasError && !abortedByUser && messageToWriteTo.content === initialMessageContent) {
631
- hasError = true;
632
- logger.warn(
633
- {
634
- conversationId: conversationKey,
635
- updatesCount: messageToWriteTo.updates?.length ?? 0,
636
- filesCount: messageToWriteTo.files?.length ?? 0,
637
- reasoningLen: messageToWriteTo.reasoning?.length ?? 0,
638
- initialLen: initialMessageContent.length,
639
- finalLen: messageToWriteTo.content.length,
640
- },
641
- "No output generated after streaming; emitting error status"
642
- );
643
- await update({
644
- type: MessageUpdateType.Status,
645
- status: MessageUpdateStatus.Error,
646
- message: "No output was generated. Something went wrong.",
647
- });
648
- }
649
- }
650
-
651
- if (!hasError && !finishedStatusSent) {
652
- await update({
653
- type: MessageUpdateType.Status,
654
- status: MessageUpdateStatus.Finished,
655
- });
656
- }
657
-
658
- await persistConversation();
659
- abortRegistry.unregister(conversationKey, ctrl);
660
-
661
- // used to detect if cancel() is called bc of interrupt or just because the connection closes
662
- doneStreaming = true;
663
- if (!clientDetached) {
664
- controller.close();
665
- }
666
- },
667
- async cancel() {
668
- if (doneStreaming) return;
669
- clientDetached = true;
670
- await persistConversation();
671
- },
672
- });
673
-
674
- if (metricsEnabled && metrics) {
675
- metrics.model.messagesTotal.inc(metricsLabels);
676
- }
677
-
678
- // Todo: maybe we should wait for the message to be saved before ending the response - in case of errors
679
- return new Response(stream, {
680
- headers: {
681
- "Content-Type": "application/jsonl",
682
- },
683
- });
684
- }
685
-
686
- export async function DELETE({ locals, params }) {
687
- const convId = new ObjectId(params.id);
688
-
689
- const conv = await collections.conversations.findOne({
690
- _id: convId,
691
- ...authCondition(locals),
692
- });
693
-
694
- if (!conv) {
695
- error(404, "Conversation not found");
696
- }
697
-
698
- await collections.conversations.deleteOne({ _id: conv._id });
699
-
700
- return new Response();
701
- }
702
-
703
- export async function PATCH({ request, locals, params }) {
704
- const values = z
705
- .object({
706
- title: z.string().trim().min(1).max(100).optional(),
707
- model: validModelIdSchema.optional(),
708
- })
709
- .parse(await request.json());
710
-
711
- const convId = new ObjectId(params.id);
712
-
713
- const conv = await collections.conversations.findOne({
714
- _id: convId,
715
- ...authCondition(locals),
716
- });
717
-
718
- if (!conv) {
719
- error(404, "Conversation not found");
720
- }
721
-
722
- // Only include defined values in the update, with title sanitized
723
- const updateValues = {
724
- ...(values.title !== undefined && {
725
- title: values.title.replace(/<\/?think>/gi, "").trim(),
726
- }),
727
- ...(values.model !== undefined && { model: values.model }),
728
- };
729
-
730
- await collections.conversations.updateOne(
731
- {
732
- _id: convId,
733
- },
734
- {
735
- $set: updateValues,
736
- }
737
- );
738
-
739
- return new Response();
740
- }
1
+ import { authCondition } from "$lib/server/auth";
2
+ import { collections } from "$lib/server/database";
3
+ import { config } from "$lib/server/config";
4
+ import { models, validModelIdSchema } from "$lib/server/models";
5
+ import { ERROR_MESSAGES } from "$lib/stores/errors";
6
+ import type { Message } from "$lib/types/Message";
7
+ import { error } from "@sveltejs/kit";
8
+ import { ObjectId } from "mongodb";
9
+ import { z } from "zod";
10
+ import {
11
+ MessageUpdateStatus,
12
+ MessageUpdateType,
13
+ MessageReasoningUpdateType,
14
+ type MessageUpdate,
15
+ type MessageStreamUpdate,
16
+ } from "$lib/types/MessageUpdate";
17
+ import { uploadFile } from "$lib/server/files/uploadFile";
18
+ import { convertLegacyConversation } from "$lib/utils/tree/convertLegacyConversation";
19
+ import { isMessageId } from "$lib/utils/tree/isMessageId";
20
+ import { buildSubtree } from "$lib/utils/tree/buildSubtree.js";
21
+ import { addChildren } from "$lib/utils/tree/addChildren.js";
22
+ import { addSibling } from "$lib/utils/tree/addSibling.js";
23
+ import { usageLimits } from "$lib/server/usageLimits";
24
+ import { textGeneration } from "$lib/server/textGeneration";
25
+ import type { TextGenerationContext } from "$lib/server/textGeneration/types";
26
+ import { logger } from "$lib/server/logger.js";
27
+ import { AbortRegistry } from "$lib/server/abortRegistry";
28
+ import { MetricsServer } from "$lib/server/metrics";
29
+
30
+ export async function POST({ request, locals, params, getClientAddress }) {
31
+ const id = z.string().parse(params.id);
32
+ const convId = new ObjectId(id);
33
+ const promptedAt = new Date();
34
+
35
+ const userId = locals.user?._id ?? locals.sessionId;
36
+
37
+ // check user
38
+ if (!userId) {
39
+ error(401, "Unauthorized");
40
+ }
41
+
42
+ // check if the user has access to the conversation
43
+ const convBeforeCheck = await collections.conversations.findOne({
44
+ _id: convId,
45
+ ...authCondition(locals),
46
+ });
47
+
48
+ if (convBeforeCheck && !convBeforeCheck.rootMessageId) {
49
+ const res = await collections.conversations.updateOne(
50
+ {
51
+ _id: convId,
52
+ },
53
+ {
54
+ $set: {
55
+ ...convBeforeCheck,
56
+ ...convertLegacyConversation(convBeforeCheck),
57
+ },
58
+ }
59
+ );
60
+
61
+ if (!res.acknowledged) {
62
+ error(500, "Failed to convert conversation");
63
+ }
64
+ }
65
+
66
+ const conv = await collections.conversations.findOne({
67
+ _id: convId,
68
+ ...authCondition(locals),
69
+ });
70
+
71
+ if (!conv) {
72
+ error(404, "Conversation not found");
73
+ }
74
+
75
+ // register the event for ratelimiting
76
+ await collections.messageEvents.insertOne({
77
+ type: "message",
78
+ userId,
79
+ createdAt: new Date(),
80
+ expiresAt: new Date(Date.now() + 60_000),
81
+ ip: getClientAddress(),
82
+ });
83
+
84
+ if (usageLimits?.messagesPerMinute) {
85
+ // check if the user is rate limited
86
+ const nEvents = Math.max(
87
+ await collections.messageEvents.countDocuments({
88
+ userId,
89
+ type: "message",
90
+ expiresAt: { $gt: new Date() },
91
+ }),
92
+ await collections.messageEvents.countDocuments({
93
+ ip: getClientAddress(),
94
+ type: "message",
95
+ expiresAt: { $gt: new Date() },
96
+ })
97
+ );
98
+ if (nEvents > usageLimits.messagesPerMinute) {
99
+ error(429, ERROR_MESSAGES.rateLimited);
100
+ }
101
+ }
102
+
103
+ if (usageLimits?.messages && conv.messages.length > usageLimits.messages) {
104
+ error(
105
+ 429,
106
+ `This conversation has more than ${usageLimits.messages} messages. Start a new one to continue`
107
+ );
108
+ }
109
+
110
+ // fetch the model
111
+ const model = models.find((m) => m.id === conv.model);
112
+
113
+ if (!model) {
114
+ error(410, "Model not available anymore");
115
+ }
116
+
117
+ // finally parse the content of the request
118
+ const form = await request.formData();
119
+
120
+ const json = form.get("data");
121
+
122
+ if (!json || typeof json !== "string") {
123
+ error(400, "Invalid request");
124
+ }
125
+
126
+ const {
127
+ inputs: newPrompt,
128
+ id: messageId,
129
+ is_retry: isRetry,
130
+ selectedMcpServerNames,
131
+ selectedMcpServers,
132
+ autopilot,
133
+ autopilotMaxSteps,
134
+ } = z
135
+ .object({
136
+ id: z.string().uuid().refine(isMessageId).optional(), // parent message id to append to for a normal message, or the message id for a retry/continue
137
+ inputs: z.optional(
138
+ z
139
+ .string()
140
+ .min(1)
141
+ .transform((s) => s.replace(/\r\n/g, "\n"))
142
+ ),
143
+ is_retry: z.optional(z.boolean()),
144
+ autopilot: z.optional(z.boolean()),
145
+ // User-configurable cap on autopilot tool-call loops. Server clamps to [1, 100].
146
+ autopilotMaxSteps: z.optional(z.number().int().min(1).max(100)),
147
+ selectedMcpServerNames: z.optional(z.array(z.string())),
148
+ selectedMcpServers: z
149
+ .optional(
150
+ z.array(
151
+ z.object({
152
+ name: z.string(),
153
+ url: z.string(),
154
+ headers: z
155
+ .optional(z.array(z.object({ key: z.string(), value: z.string() })))
156
+ .default([]),
157
+ })
158
+ )
159
+ )
160
+ .default([]),
161
+ files: z.optional(
162
+ z.array(
163
+ z.object({
164
+ type: z.literal("base64").or(z.literal("hash")),
165
+ name: z.string(),
166
+ value: z.string(),
167
+ mime: z.string(),
168
+ })
169
+ )
170
+ ),
171
+ })
172
+ .parse(JSON.parse(json));
173
+
174
+ // Attach MCP selection to locals so the text generation pipeline can consume it
175
+ try {
176
+ (locals as unknown as Record<string, unknown>).mcp = {
177
+ selectedServerNames: selectedMcpServerNames,
178
+ selectedServers: (selectedMcpServers ?? []).map((s) => ({
179
+ name: s.name,
180
+ url: s.url,
181
+ headers:
182
+ s.headers && s.headers.length > 0
183
+ ? Object.fromEntries(s.headers.map((h) => [h.key, h.value]))
184
+ : undefined,
185
+ })),
186
+ };
187
+ } catch {
188
+ // ignore attachment errors, pipeline will just use env servers
189
+ }
190
+
191
+ const inputFiles = await Promise.all(
192
+ form
193
+ .getAll("files")
194
+ .filter((entry): entry is File => entry instanceof File && entry.size > 0)
195
+ .map(async (file) => {
196
+ const [type, ...name] = file.name.split(";");
197
+
198
+ return {
199
+ type: z.literal("base64").or(z.literal("hash")).parse(type),
200
+ value: await file.text(),
201
+ mime: file.type,
202
+ name: name.join(";"),
203
+ };
204
+ })
205
+ );
206
+
207
+ if (usageLimits?.messageLength && (newPrompt?.length ?? 0) > usageLimits.messageLength) {
208
+ error(400, "Message too long.");
209
+ }
210
+
211
+ // each file is either:
212
+ // base64 string requiring upload to the server
213
+ // hash pointing to an existing file
214
+ const hashFiles = inputFiles?.filter((file) => file.type === "hash") ?? [];
215
+ const b64Files =
216
+ inputFiles
217
+ ?.filter((file) => file.type !== "hash")
218
+ .map((file) => {
219
+ const blob = Buffer.from(file.value, "base64");
220
+ return new File([blob], file.name, { type: file.mime });
221
+ }) ?? [];
222
+
223
+ // check sizes
224
+ // todo: make configurable
225
+ if (b64Files.some((file) => file.size > 10 * 1024 * 1024)) {
226
+ error(413, "File too large, should be <10MB");
227
+ }
228
+
229
+ const uploadedFiles = await Promise.all(b64Files.map((file) => uploadFile(file, conv))).then(
230
+ (files) => [...files, ...hashFiles]
231
+ );
232
+
233
+ // we will append tokens to the content of this message
234
+ let messageToWriteToId: Message["id"] | undefined = undefined;
235
+ // used for building the prompt, subtree of the conversation that goes from the latest message to the root
236
+ let messagesForPrompt: Message[] = [];
237
+
238
+ if (isRetry && messageId) {
239
+ // two cases, if we're retrying a user message with a newPrompt set,
240
+ // it means we're editing a user message
241
+ // if we're retrying on an assistant message, newPrompt cannot be set
242
+ // it means we're retrying the last assistant message for a new answer
243
+
244
+ const messageToRetry = conv.messages.find((message) => message.id === messageId);
245
+
246
+ if (!messageToRetry) {
247
+ error(404, "Message not found");
248
+ }
249
+
250
+ if (messageToRetry.from === "user" && newPrompt) {
251
+ // add a sibling to this message from the user, with the alternative prompt
252
+ // add a children to that sibling, where we can write to
253
+ const newUserMessageId = addSibling(
254
+ conv,
255
+ {
256
+ from: "user",
257
+ content: newPrompt,
258
+ files: uploadedFiles,
259
+ createdAt: new Date(),
260
+ updatedAt: new Date(),
261
+ },
262
+ messageId
263
+ );
264
+ messageToWriteToId = addChildren(
265
+ conv,
266
+ {
267
+ from: "assistant",
268
+ content: "",
269
+ createdAt: new Date(),
270
+ updatedAt: new Date(),
271
+ },
272
+ newUserMessageId
273
+ );
274
+ messagesForPrompt = buildSubtree(conv, newUserMessageId);
275
+ } else if (messageToRetry.from === "assistant") {
276
+ // we're retrying an assistant message, to generate a new answer
277
+ // just add a sibling to the assistant answer where we can write to
278
+ messageToWriteToId = addSibling(
279
+ conv,
280
+ { from: "assistant", content: "", createdAt: new Date(), updatedAt: new Date() },
281
+ messageId
282
+ );
283
+ messagesForPrompt = buildSubtree(conv, messageId);
284
+ messagesForPrompt.pop(); // don't need the latest assistant message in the prompt since we're retrying it
285
+ }
286
+ } else {
287
+ // just a normal linear conversation, so we add the user message
288
+ // and the blank assistant message back to back
289
+ const newUserMessageId = addChildren(
290
+ conv,
291
+ {
292
+ from: "user",
293
+ content: newPrompt ?? "",
294
+ files: uploadedFiles,
295
+ createdAt: new Date(),
296
+ updatedAt: new Date(),
297
+ },
298
+ messageId
299
+ );
300
+
301
+ messageToWriteToId = addChildren(
302
+ conv,
303
+ {
304
+ from: "assistant",
305
+ content: "",
306
+ createdAt: new Date(),
307
+ updatedAt: new Date(),
308
+ },
309
+ newUserMessageId
310
+ );
311
+ // build the prompt from the user message
312
+ messagesForPrompt = buildSubtree(conv, newUserMessageId);
313
+ }
314
+
315
+ const messageToWriteTo = conv.messages.find((message) => message.id === messageToWriteToId);
316
+ if (!messageToWriteTo) {
317
+ error(500, "Failed to create message");
318
+ }
319
+ if (messagesForPrompt.length === 0) {
320
+ error(500, "Failed to create prompt");
321
+ }
322
+
323
+ // update the conversation with the new messages
324
+ await collections.conversations.updateOne(
325
+ { _id: convId },
326
+ { $set: { messages: conv.messages, title: conv.title, updatedAt: new Date() } }
327
+ );
328
+
329
+ let doneStreaming = false;
330
+ let clientDetached = false;
331
+
332
+ let lastTokenTimestamp: undefined | Date = undefined;
333
+ let firstTokenObserved = false;
334
+ const metricsEnabled = MetricsServer.isEnabled();
335
+ const metrics = metricsEnabled ? MetricsServer.getMetrics() : undefined;
336
+ const metricsModelId = model.id ?? model.name ?? conv.model;
337
+ const metricsLabels = { model: metricsModelId };
338
+
339
+ const persistConversation = async () => {
340
+ const messagesForSave = conv.messages.map((msg) => {
341
+ const filteredUpdates =
342
+ msg.updates
343
+ ?.filter(
344
+ (u) =>
345
+ !(u.type === MessageUpdateType.Status && u.status === MessageUpdateStatus.KeepAlive)
346
+ )
347
+ .map((u) => {
348
+ if (u.type !== MessageUpdateType.Stream) return u;
349
+ // Preserve existing len if already compressed, otherwise compute from token
350
+ const len = u.len ?? (u.token ?? "").length;
351
+ // store a lightweight marker to preserve ordering without duplicating content
352
+ return { type: MessageUpdateType.Stream, token: "", len } satisfies MessageStreamUpdate;
353
+ }) ?? [];
354
+
355
+ return { ...msg, updates: filteredUpdates };
356
+ });
357
+
358
+ await collections.conversations.updateOne(
359
+ { _id: convId },
360
+ { $set: { messages: messagesForSave, title: conv.title, updatedAt: new Date() } }
361
+ );
362
+ };
363
+
364
+ const abortRegistry = AbortRegistry.getInstance();
365
+
366
+ // we now build the stream
367
+ const stream = new ReadableStream({
368
+ async start(controller) {
369
+ const conversationKey = convId.toString();
370
+ const ctrl = new AbortController();
371
+ abortRegistry.register(conversationKey, ctrl);
372
+
373
+ let finalAnswerReceived = false;
374
+ let abortedByUser = false;
375
+ let finishedStatusSent = false;
376
+
377
+ messageToWriteTo.updates ??= [];
378
+ async function update(event: MessageUpdate) {
379
+ if (!messageToWriteTo || !conv) {
380
+ throw Error("No message or conversation to write events to");
381
+ }
382
+
383
+ if (
384
+ event.type === MessageUpdateType.Status &&
385
+ event.status === MessageUpdateStatus.Finished
386
+ ) {
387
+ finishedStatusSent = true;
388
+ }
389
+
390
+ // Add token to content or skip if empty
391
+ if (event.type === MessageUpdateType.Stream) {
392
+ if (event.token === "") return;
393
+ messageToWriteTo.content += event.token;
394
+
395
+ if (metricsEnabled && metrics) {
396
+ const now = Date.now();
397
+ metrics.model.tokenCountTotal.inc(metricsLabels);
398
+
399
+ if (!firstTokenObserved) {
400
+ metrics.model.timeToFirstToken.observe(metricsLabels, now - promptedAt.getTime());
401
+ firstTokenObserved = true;
402
+ }
403
+
404
+ const previousTimestamp = lastTokenTimestamp
405
+ ? lastTokenTimestamp.getTime()
406
+ : promptedAt.getTime();
407
+ metrics.model.timePerOutputToken.observe(metricsLabels, now - previousTimestamp);
408
+ }
409
+
410
+ lastTokenTimestamp = new Date();
411
+ }
412
+
413
+ // Append reasoning stream tokens to message.reasoning (server-side)
414
+ else if (
415
+ event.type === MessageUpdateType.Reasoning &&
416
+ event.subtype === MessageReasoningUpdateType.Stream &&
417
+ "token" in event
418
+ ) {
419
+ messageToWriteTo.reasoning ??= "";
420
+ messageToWriteTo.reasoning += event.token;
421
+ }
422
+
423
+ // Set the title
424
+ else if (event.type === MessageUpdateType.Title) {
425
+ // Always strip <think> markers from titles when saving
426
+ const sanitizedTitle = event.title.replace(/<\/?think>/gi, "").trim();
427
+ conv.title = sanitizedTitle;
428
+ await collections.conversations.updateOne(
429
+ { _id: convId },
430
+ { $set: { title: conv?.title, updatedAt: new Date() } }
431
+ );
432
+ }
433
+
434
+ // Set the final text and the interrupted flag
435
+ else if (event.type === MessageUpdateType.FinalAnswer) {
436
+ messageToWriteTo.interrupted = event.interrupted;
437
+ // Default behavior: replace the streamed text with the provider's final text.
438
+ // However, when tools (MCP/function calls) were used, providers often stream
439
+ // some content (e.g., a story) before triggering tools, then return a
440
+ // different follow‑up message afterwards (e.g., an image caption). Our
441
+ // previous logic overwrote the pre‑tool content. Preserve it by merging in
442
+ // the pre‑tool stream when tool updates occurred and the final text does
443
+ // not already include the streamed prefix.
444
+ const hadTools = (messageToWriteTo.updates ?? []).some(
445
+ (u) => u.type === MessageUpdateType.Tool
446
+ );
447
+
448
+ if (hadTools) {
449
+ const existing = messageToWriteTo.content.slice(initialMessageContent.length);
450
+ if (existing && existing.length > 0) {
451
+ // A. If we already streamed the same final text, keep as-is.
452
+ if (event.text && existing.endsWith(event.text)) {
453
+ messageToWriteTo.content = initialMessageContent + existing;
454
+ }
455
+ // B. If the final text already includes the streamed prefix, use it verbatim.
456
+ else if (event.text && event.text.startsWith(existing)) {
457
+ messageToWriteTo.content = initialMessageContent + event.text;
458
+ }
459
+ // C. Otherwise, merge with a paragraph break for readability.
460
+ else {
461
+ const needsGap = !/\n\n$/.test(existing) && !/^\n/.test(event.text ?? "");
462
+ messageToWriteTo.content =
463
+ initialMessageContent + existing + (needsGap ? "\n\n" : "") + (event.text ?? "");
464
+ }
465
+ } else {
466
+ messageToWriteTo.content = initialMessageContent + (event.text ?? "");
467
+ }
468
+ } else {
469
+ messageToWriteTo.content = initialMessageContent + event.text;
470
+ }
471
+ finalAnswerReceived = true;
472
+
473
+ if (metricsEnabled && metrics) {
474
+ metrics.model.latency.observe(metricsLabels, Date.now() - promptedAt.getTime());
475
+ }
476
+ }
477
+
478
+ // Add file
479
+ else if (event.type === MessageUpdateType.File) {
480
+ messageToWriteTo.files = [
481
+ ...(messageToWriteTo.files ?? []),
482
+ { type: "hash", name: event.name, value: event.sha, mime: event.mime },
483
+ ];
484
+ }
485
+
486
+ // Store router metadata (for router models) or provider info (for all models)
487
+ else if (event.type === MessageUpdateType.RouterMetadata) {
488
+ // Merge metadata updates to preserve existing fields (router may send route/model first, then provider comes later)
489
+ if (model?.isRouter) {
490
+ messageToWriteTo.routerMetadata = {
491
+ route: event.route || messageToWriteTo.routerMetadata?.route || "",
492
+ model: event.model || messageToWriteTo.routerMetadata?.model || "",
493
+ provider: event.provider || messageToWriteTo.routerMetadata?.provider,
494
+ };
495
+ }
496
+ // Store provider-only metadata for non-router models if available
497
+ else if (event.provider) {
498
+ messageToWriteTo.routerMetadata = {
499
+ route: messageToWriteTo.routerMetadata?.route || "",
500
+ model: messageToWriteTo.routerMetadata?.model || "",
501
+ provider: event.provider,
502
+ };
503
+ }
504
+ }
505
+
506
+ // Append updates for audit/replay (streams too, to preserve ordering)
507
+ if (
508
+ !(
509
+ event.type === MessageUpdateType.Status &&
510
+ event.status === MessageUpdateStatus.KeepAlive
511
+ )
512
+ ) {
513
+ messageToWriteTo?.updates?.push(
514
+ event.type === MessageUpdateType.Stream ? { ...event } : event
515
+ );
516
+ }
517
+
518
+ // Avoid remote keylogging attack executed by watching packet lengths
519
+ // by padding the text with null chars to a fixed length
520
+ // https://cdn.arstechnica.net/wp-content/uploads/2024/03/LLM-Side-Channel.pdf
521
+ if (event.type === MessageUpdateType.Stream) {
522
+ event = { ...event, token: event.token.padEnd(16, "\0") };
523
+ }
524
+
525
+ messageToWriteTo.updatedAt = new Date();
526
+
527
+ const enqueueUpdate = async () => {
528
+ if (clientDetached) return;
529
+ try {
530
+ controller.enqueue(JSON.stringify(event) + "\n");
531
+ if (event.type === MessageUpdateType.FinalAnswer) {
532
+ controller.enqueue(" ".repeat(4096));
533
+ }
534
+ } catch (err) {
535
+ clientDetached = true;
536
+ logger.info(
537
+ { conversationId: convId.toString() },
538
+ "Client detached during message streaming"
539
+ );
540
+ }
541
+ };
542
+
543
+ await enqueueUpdate();
544
+
545
+ if (clientDetached) {
546
+ await persistConversation();
547
+ }
548
+ }
549
+
550
+ let hasError = false;
551
+ const initialMessageContent = messageToWriteTo.content;
552
+
553
+ try {
554
+ // Fetch user settings once for all overrides and billing org
555
+ const userSettings = await collections.settings.findOne(authCondition(locals));
556
+
557
+ // Add billing organization to locals for the endpoint to use
558
+ locals.billingOrganization = userSettings?.billingOrganization;
559
+
560
+ const ctx: TextGenerationContext = {
561
+ model,
562
+ endpoint: await model.getEndpoint(),
563
+ conv,
564
+ messages: messagesForPrompt,
565
+ assistant: undefined,
566
+ promptedAt,
567
+ ip: getClientAddress(),
568
+ username: locals.user?.username,
569
+ // Force-enable multimodal if user settings say so for this model
570
+ forceMultimodal: Boolean(userSettings?.multimodalOverrides?.[model.id]),
571
+ // Force-enable tools if user settings say so for this model
572
+ forceTools: Boolean(userSettings?.toolsOverrides?.[model.id]),
573
+ // Inference provider preference (HuggingChat only, skip for router models)
574
+ provider:
575
+ config.isHuggingChat && !model.isRouter
576
+ ? userSettings?.providerOverrides?.[model.id]
577
+ : undefined,
578
+ locals,
579
+ abortController: ctrl,
580
+ autopilot: autopilot === true,
581
+ autopilotMaxSteps,
582
+ };
583
+ // run the text generation and send updates to the client
584
+ for await (const event of textGeneration(ctx)) await update(event);
585
+ if (ctrl.signal.aborted) {
586
+ abortedByUser = true;
587
+ }
588
+ if (abortedByUser && !finalAnswerReceived) {
589
+ const partialText = messageToWriteTo.content.slice(initialMessageContent.length);
590
+ await update({
591
+ type: MessageUpdateType.FinalAnswer,
592
+ text: partialText,
593
+ interrupted: true,
594
+ });
595
+ }
596
+ } catch (e) {
597
+ const err = e as Error;
598
+ const isAbortError =
599
+ err?.name === "AbortError" ||
600
+ err?.name === "APIUserAbortError" ||
601
+ err?.message === "Request was aborted.";
602
+ if (isAbortError || ctrl.signal.aborted) {
603
+ abortedByUser = true;
604
+ logger.info({ conversationId: conversationKey }, "Generation aborted by user");
605
+ if (!finalAnswerReceived) {
606
+ const partialText = messageToWriteTo.content.slice(initialMessageContent.length);
607
+ await update({
608
+ type: MessageUpdateType.FinalAnswer,
609
+ text: partialText,
610
+ interrupted: true,
611
+ });
612
+ }
613
+ } else {
614
+ hasError = true;
615
+ // Extract status code if available from HTTPError or APIError
616
+ const errObj = err as unknown as Record<string, unknown>;
617
+ const statusCode =
618
+ (typeof errObj.statusCode === "number" ? errObj.statusCode : undefined) ||
619
+ (typeof errObj.status === "number" ? errObj.status : undefined);
620
+ await update({
621
+ type: MessageUpdateType.Status,
622
+ status: MessageUpdateStatus.Error,
623
+ message: err.message,
624
+ ...(statusCode && { statusCode }),
625
+ });
626
+ logger.error(err, "Error in conversation stream");
627
+ }
628
+ } finally {
629
+ // check if no output was generated
630
+ if (!hasError && !abortedByUser && messageToWriteTo.content === initialMessageContent) {
631
+ hasError = true;
632
+ logger.warn(
633
+ {
634
+ conversationId: conversationKey,
635
+ updatesCount: messageToWriteTo.updates?.length ?? 0,
636
+ filesCount: messageToWriteTo.files?.length ?? 0,
637
+ reasoningLen: messageToWriteTo.reasoning?.length ?? 0,
638
+ initialLen: initialMessageContent.length,
639
+ finalLen: messageToWriteTo.content.length,
640
+ },
641
+ "No output generated after streaming; emitting error status"
642
+ );
643
+ await update({
644
+ type: MessageUpdateType.Status,
645
+ status: MessageUpdateStatus.Error,
646
+ message: "No output was generated. Something went wrong.",
647
+ });
648
+ }
649
+ }
650
+
651
+ if (!hasError && !finishedStatusSent) {
652
+ await update({
653
+ type: MessageUpdateType.Status,
654
+ status: MessageUpdateStatus.Finished,
655
+ });
656
+ }
657
+
658
+ await persistConversation();
659
+ abortRegistry.unregister(conversationKey, ctrl);
660
+
661
+ // used to detect if cancel() is called bc of interrupt or just because the connection closes
662
+ doneStreaming = true;
663
+ if (!clientDetached) {
664
+ controller.close();
665
+ }
666
+ },
667
+ async cancel() {
668
+ if (doneStreaming) return;
669
+ clientDetached = true;
670
+ await persistConversation();
671
+ },
672
+ });
673
+
674
+ if (metricsEnabled && metrics) {
675
+ metrics.model.messagesTotal.inc(metricsLabels);
676
+ }
677
+
678
+ // Todo: maybe we should wait for the message to be saved before ending the response - in case of errors
679
+ return new Response(stream, {
680
+ headers: {
681
+ "Content-Type": "application/jsonl",
682
+ },
683
+ });
684
+ }
685
+
686
/**
 * Delete a single conversation.
 *
 * The conversation is looked up by `params.id` combined with the filter
 * returned by `authCondition(locals)`; it is only deleted when that lookup
 * succeeds.
 *
 * @param locals - request locals, forwarded to `authCondition`
 * @param params - route params; `params.id` is the conversation id
 * @returns an empty `Response` once the conversation has been removed
 * @throws a 404 HTTP error when the id is malformed or no matching conversation exists
 */
export async function DELETE({ locals, params }) {
	// A malformed id can never match a document. Answer 404 instead of letting
	// the ObjectId constructor throw, which would surface as an unhandled 500.
	if (!ObjectId.isValid(params.id)) {
		error(404, "Conversation not found");
	}
	const convId = new ObjectId(params.id);

	const conv = await collections.conversations.findOne({
		_id: convId,
		...authCondition(locals),
	});

	if (!conv) {
		error(404, "Conversation not found");
	}

	// Delete by the _id of the document that passed the lookup above.
	await collections.conversations.deleteOne({ _id: conv._id });

	return new Response();
}
702
+
703
/**
 * Update the title and/or model of a single conversation.
 *
 * The JSON body may contain `title` (trimmed, 1-100 characters) and `model`
 * (validated by `validModelIdSchema`); both are optional. `<think>` / `</think>`
 * markers are stripped from the title before it is stored.
 *
 * @param request - incoming request; its JSON body carries the fields to update
 * @param locals - request locals, forwarded to `authCondition`
 * @param params - route params; `params.id` is the conversation id
 * @returns an empty `Response` on success (also when there was nothing to update)
 * @throws a 400 HTTP error when the title is empty once `<think>` markers are removed
 * @throws a 404 HTTP error when the id is malformed or no matching conversation exists
 * @throws whatever `z.parse` throws when the body does not match the schema
 */
export async function PATCH({ request, locals, params }) {
	const values = z
		.object({
			title: z.string().trim().min(1).max(100).optional(),
			model: validModelIdSchema.optional(),
		})
		.parse(await request.json());

	// The schema's min(1) runs before the <think> markers are stripped, so a title
	// made only of markers (e.g. "<think></think>") would otherwise be stored as "".
	const sanitizedTitle = values.title?.replace(/<\/?think>/gi, "").trim();
	if (values.title !== undefined && !sanitizedTitle) {
		error(400, "Title cannot be empty");
	}

	// A malformed id can never match a document. Answer 404 instead of letting
	// the ObjectId constructor throw, which would surface as an unhandled 500.
	if (!ObjectId.isValid(params.id)) {
		error(404, "Conversation not found");
	}
	const convId = new ObjectId(params.id);

	const conv = await collections.conversations.findOne({
		_id: convId,
		...authCondition(locals),
	});

	if (!conv) {
		error(404, "Conversation not found");
	}

	// Only include the fields the caller actually supplied.
	const updateValues = {
		...(sanitizedTitle !== undefined && { title: sanitizedTitle }),
		...(values.model !== undefined && { model: values.model }),
	};

	// Nothing to change: skip the write. An empty $set is rejected by MongoDB
	// servers older than 5.0 and is a useless round-trip on newer ones.
	if (Object.keys(updateValues).length === 0) {
		return new Response();
	}

	await collections.conversations.updateOne({ _id: convId }, { $set: updateValues });

	return new Response();
}