ruflo 3.10.46 → 3.11.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (498)
  1. package/README.md +412 -412
  2. package/bin/ruflo.js +77 -77
  3. package/package.json +113 -113
  4. package/src/chat-ui/Dockerfile +25 -25
  5. package/src/chat-ui/patch-mcp-url-safety.sh +28 -28
  6. package/src/config/config.example.json +76 -76
  7. package/src/mcp-bridge/Dockerfile +45 -45
  8. package/src/mcp-bridge/index.js +1692 -1692
  9. package/src/mcp-bridge/mcp-stdio-kernel.js +159 -159
  10. package/src/mcp-bridge/package.json +17 -17
  11. package/src/mcp-bridge/test-harness.js +470 -470
  12. package/src/nginx/Dockerfile +10 -10
  13. package/src/nginx/nginx.conf +67 -67
  14. package/src/nginx/static/favicon-dark.svg +4 -4
  15. package/src/nginx/static/favicon.svg +4 -4
  16. package/src/nginx/static/icon.svg +5 -5
  17. package/src/nginx/static/logo.svg +9 -9
  18. package/src/nginx/static/manifest.json +22 -22
  19. package/src/nginx/static/welcome.js +184 -184
  20. package/src/ruvocal/.claude/skills/add-model-descriptions/SKILL.md +73 -73
  21. package/src/ruvocal/.claude-flow/daemon-state.json +135 -0
  22. package/src/ruvocal/.claude-flow/data/pending-insights.jsonl +0 -0
  23. package/src/ruvocal/.claude-flow/data/ranked-context.json +5 -0
  24. package/src/ruvocal/.claude-flow/logs/daemon.log +31 -0
  25. package/src/ruvocal/.claude-flow/logs/headless/audit_1777949411822_juxau0_prompt.log +989 -0
  26. package/src/ruvocal/.claude-flow/logs/headless/audit_1777949411822_juxau0_result.log +67 -0
  27. package/src/ruvocal/.claude-flow/logs/headless/audit_1777950042278_jvj5xq_prompt.log +989 -0
  28. package/src/ruvocal/.claude-flow/logs/headless/audit_1777950042278_jvj5xq_result.log +93 -0
  29. package/src/ruvocal/.claude-flow/logs/headless/optimize_1777949531823_yt5yc2_prompt.log +1498 -0
  30. package/src/ruvocal/.claude-flow/logs/headless/optimize_1777949531823_yt5yc2_result.log +93 -0
  31. package/src/ruvocal/.claude-flow/logs/headless/testgaps_1777949771821_elw1j4_prompt.log +1498 -0
  32. package/src/ruvocal/.claude-flow/logs/headless/testgaps_1777949771821_elw1j4_result.log +100 -0
  33. package/src/ruvocal/.claude-flow/metrics/codebase-map.json +11 -0
  34. package/src/ruvocal/.claude-flow/metrics/consolidation.json +6 -0
  35. package/src/ruvocal/.claude-flow/neural/stats.json +6 -0
  36. package/src/ruvocal/.claude-flow/sessions/current.json +13 -0
  37. package/src/ruvocal/.devcontainer/Dockerfile +9 -9
  38. package/src/ruvocal/.devcontainer/devcontainer.json +36 -36
  39. package/src/ruvocal/.dockerignore +16 -16
  40. package/src/ruvocal/.eslintignore +13 -13
  41. package/src/ruvocal/.eslintrc.cjs +45 -45
  42. package/src/ruvocal/.gcloudignore +18 -18
  43. package/src/ruvocal/.github/ISSUE_TEMPLATE/bug-report--chat-ui-.md +43 -43
  44. package/src/ruvocal/.github/ISSUE_TEMPLATE/config-support.md +9 -9
  45. package/src/ruvocal/.github/ISSUE_TEMPLATE/feature-request--chat-ui-.md +17 -17
  46. package/src/ruvocal/.github/ISSUE_TEMPLATE/huggingchat.md +11 -11
  47. package/src/ruvocal/.github/release.yml +16 -16
  48. package/src/ruvocal/.github/workflows/build-docs.yml +18 -18
  49. package/src/ruvocal/.github/workflows/build-image.yml +142 -142
  50. package/src/ruvocal/.github/workflows/build-pr-docs.yml +20 -20
  51. package/src/ruvocal/.github/workflows/deploy-dev.yml +63 -63
  52. package/src/ruvocal/.github/workflows/deploy-prod.yml +78 -78
  53. package/src/ruvocal/.github/workflows/lint-and-test.yml +84 -84
  54. package/src/ruvocal/.github/workflows/slugify.yaml +72 -72
  55. package/src/ruvocal/.github/workflows/trufflehog.yml +17 -17
  56. package/src/ruvocal/.github/workflows/upload-pr-documentation.yml +16 -16
  57. package/src/ruvocal/.husky/lint-stage-config.js +4 -4
  58. package/src/ruvocal/.husky/pre-commit +2 -2
  59. package/src/ruvocal/.prettierignore +14 -14
  60. package/src/ruvocal/.prettierrc +7 -7
  61. package/src/ruvocal/.swarm/attestation.db +0 -0
  62. package/src/ruvocal/.swarm/hnsw.index +0 -0
  63. package/src/ruvocal/.swarm/hnsw.metadata.json +1 -0
  64. package/src/ruvocal/.swarm/memory.db +0 -0
  65. package/src/ruvocal/.swarm/schema.sql +305 -0
  66. package/src/ruvocal/CLAUDE.md +126 -126
  67. package/src/ruvocal/Dockerfile +96 -96
  68. package/src/ruvocal/LICENSE +202 -202
  69. package/src/ruvocal/PRIVACY.md +41 -41
  70. package/src/ruvocal/README.md +164 -164
  71. package/src/ruvocal/chart/Chart.yaml +5 -5
  72. package/src/ruvocal/chart/env/dev.yaml +260 -260
  73. package/src/ruvocal/chart/env/prod.yaml +273 -273
  74. package/src/ruvocal/chart/templates/_helpers.tpl +22 -22
  75. package/src/ruvocal/chart/templates/config.yaml +10 -10
  76. package/src/ruvocal/chart/templates/deployment.yaml +81 -81
  77. package/src/ruvocal/chart/templates/hpa.yaml +45 -45
  78. package/src/ruvocal/chart/templates/infisical.yaml +24 -24
  79. package/src/ruvocal/chart/templates/ingress-internal.yaml +32 -32
  80. package/src/ruvocal/chart/templates/ingress.yaml +32 -32
  81. package/src/ruvocal/chart/templates/network-policy.yaml +36 -36
  82. package/src/ruvocal/chart/templates/service-account.yaml +13 -13
  83. package/src/ruvocal/chart/templates/service-monitor.yaml +17 -17
  84. package/src/ruvocal/chart/templates/service.yaml +21 -21
  85. package/src/ruvocal/chart/values.yaml +73 -73
  86. package/src/ruvocal/cloudbuild.yaml +68 -68
  87. package/src/ruvocal/config/branding.env.example +19 -19
  88. package/src/ruvocal/docker-compose.yml +21 -21
  89. package/src/ruvocal/docs/adr/ADR-029-HUGGINGFACE-CHAT-UI-CLOUD-RUN.md +1236 -1236
  90. package/src/ruvocal/docs/adr/ADR-033-RUVECTOR-RUFLO-MCP-INTEGRATION.md +111 -111
  91. package/src/ruvocal/docs/adr/ADR-034-OPTIONAL-MCP-BACKENDS.md +117 -117
  92. package/src/ruvocal/docs/adr/ADR-035-MCP-TOOL-GROUPS.md +186 -186
  93. package/src/ruvocal/docs/adr/ADR-037-AUTOPILOT-CHAT-MODE.md +1500 -1500
  94. package/src/ruvocal/docs/adr/ADR-038-RUVOCAL-FORK.md +286 -286
  95. package/src/ruvocal/docs/source/_toctree.yml +30 -30
  96. package/src/ruvocal/docs/source/configuration/common-issues.md +38 -38
  97. package/src/ruvocal/docs/source/configuration/llm-router.md +105 -105
  98. package/src/ruvocal/docs/source/configuration/mcp-tools.md +84 -84
  99. package/src/ruvocal/docs/source/configuration/metrics.md +9 -9
  100. package/src/ruvocal/docs/source/configuration/open-id.md +57 -57
  101. package/src/ruvocal/docs/source/configuration/overview.md +89 -89
  102. package/src/ruvocal/docs/source/configuration/theming.md +20 -20
  103. package/src/ruvocal/docs/source/developing/architecture.md +48 -48
  104. package/src/ruvocal/docs/source/index.md +53 -53
  105. package/src/ruvocal/docs/source/installation/docker.md +43 -43
  106. package/src/ruvocal/docs/source/installation/helm.md +43 -43
  107. package/src/ruvocal/docs/source/installation/local.md +62 -62
  108. package/src/ruvocal/entrypoint.sh +18 -18
  109. package/src/ruvocal/mcp-bridge/Dockerfile +45 -45
  110. package/src/ruvocal/mcp-bridge/cloudbuild.yaml +49 -49
  111. package/src/ruvocal/mcp-bridge/index.js +1902 -1902
  112. package/src/ruvocal/mcp-bridge/mcp-stdio-kernel.js +159 -159
  113. package/src/ruvocal/mcp-bridge/package-lock.json +762 -762
  114. package/src/ruvocal/mcp-bridge/package.json +17 -17
  115. package/src/ruvocal/mcp-bridge/test-harness.js +470 -470
  116. package/src/ruvocal/package-lock.json +11741 -11741
  117. package/src/ruvocal/package.json +121 -121
  118. package/src/ruvocal/postcss.config.js +6 -6
  119. package/src/ruvocal/rvf.manifest.json +204 -204
  120. package/src/ruvocal/scripts/config.ts +64 -64
  121. package/src/ruvocal/scripts/generate-welcome.mjs +181 -181
  122. package/src/ruvocal/scripts/populate.ts +288 -288
  123. package/src/ruvocal/scripts/samples.txt +194 -194
  124. package/src/ruvocal/scripts/setups/vitest-setup-server.ts +44 -44
  125. package/src/ruvocal/scripts/updateLocalEnv.ts +48 -48
  126. package/src/ruvocal/src/ambient.d.ts +7 -7
  127. package/src/ruvocal/src/app.d.ts +29 -29
  128. package/src/ruvocal/src/app.html +53 -53
  129. package/src/ruvocal/src/hooks.server.ts +32 -32
  130. package/src/ruvocal/src/hooks.ts +6 -6
  131. package/src/ruvocal/src/lib/APIClient.ts +148 -148
  132. package/src/ruvocal/src/lib/actions/clickOutside.ts +18 -18
  133. package/src/ruvocal/src/lib/actions/snapScrollToBottom.ts +346 -346
  134. package/src/ruvocal/src/lib/buildPrompt.ts +33 -33
  135. package/src/ruvocal/src/lib/components/AnnouncementBanner.svelte +20 -20
  136. package/src/ruvocal/src/lib/components/BackgroundGenerationPoller.svelte +168 -168
  137. package/src/ruvocal/src/lib/components/CodeBlock.svelte +73 -73
  138. package/src/ruvocal/src/lib/components/CopyToClipBoardBtn.svelte +92 -92
  139. package/src/ruvocal/src/lib/components/DeleteConversationModal.svelte +75 -75
  140. package/src/ruvocal/src/lib/components/EditConversationModal.svelte +100 -100
  141. package/src/ruvocal/src/lib/components/ExpandNavigation.svelte +22 -22
  142. package/src/ruvocal/src/lib/components/FoundationBackground.svelte +242 -242
  143. package/src/ruvocal/src/lib/components/HoverTooltip.svelte +44 -44
  144. package/src/ruvocal/src/lib/components/HtmlPreviewModal.svelte +143 -143
  145. package/src/ruvocal/src/lib/components/InfiniteScroll.svelte +50 -50
  146. package/src/ruvocal/src/lib/components/MobileNav.svelte +300 -300
  147. package/src/ruvocal/src/lib/components/Modal.svelte +115 -115
  148. package/src/ruvocal/src/lib/components/ModelCardMetadata.svelte +71 -71
  149. package/src/ruvocal/src/lib/components/NavConversationItem.svelte +151 -151
  150. package/src/ruvocal/src/lib/components/NavMenu.svelte +313 -313
  151. package/src/ruvocal/src/lib/components/Pagination.svelte +97 -97
  152. package/src/ruvocal/src/lib/components/PaginationArrow.svelte +27 -27
  153. package/src/ruvocal/src/lib/components/Portal.svelte +24 -24
  154. package/src/ruvocal/src/lib/components/RetryBtn.svelte +18 -18
  155. package/src/ruvocal/src/lib/components/RuFloUniverse.svelte +185 -185
  156. package/src/ruvocal/src/lib/components/RufloHelpModal.svelte +411 -411
  157. package/src/ruvocal/src/lib/components/ScrollToBottomBtn.svelte +47 -47
  158. package/src/ruvocal/src/lib/components/ScrollToPreviousBtn.svelte +77 -77
  159. package/src/ruvocal/src/lib/components/ShareConversationModal.svelte +182 -182
  160. package/src/ruvocal/src/lib/components/StopGeneratingBtn.svelte +69 -69
  161. package/src/ruvocal/src/lib/components/SubscribeModal.svelte +87 -87
  162. package/src/ruvocal/src/lib/components/Switch.svelte +36 -36
  163. package/src/ruvocal/src/lib/components/SystemPromptModal.svelte +44 -44
  164. package/src/ruvocal/src/lib/components/Toast.svelte +27 -27
  165. package/src/ruvocal/src/lib/components/Tooltip.svelte +30 -30
  166. package/src/ruvocal/src/lib/components/WelcomeModal.svelte +46 -46
  167. package/src/ruvocal/src/lib/components/chat/Alternatives.svelte +77 -77
  168. package/src/ruvocal/src/lib/components/chat/BlockWrapper.svelte +72 -72
  169. package/src/ruvocal/src/lib/components/chat/ChatInput.svelte +490 -490
  170. package/src/ruvocal/src/lib/components/chat/ChatIntroduction.svelte +123 -123
  171. package/src/ruvocal/src/lib/components/chat/ChatMessage.svelte +548 -548
  172. package/src/ruvocal/src/lib/components/chat/ChatWindow.svelte +1057 -1057
  173. package/src/ruvocal/src/lib/components/chat/FileDropzone.svelte +92 -92
  174. package/src/ruvocal/src/lib/components/chat/ImageLightbox.svelte +66 -66
  175. package/src/ruvocal/src/lib/components/chat/MarkdownBlock.svelte +23 -23
  176. package/src/ruvocal/src/lib/components/chat/MarkdownRenderer.svelte +69 -69
  177. package/src/ruvocal/src/lib/components/chat/MarkdownRenderer.svelte.test.ts +58 -58
  178. package/src/ruvocal/src/lib/components/chat/MessageAvatar.svelte +103 -103
  179. package/src/ruvocal/src/lib/components/chat/ModelSwitch.svelte +64 -64
  180. package/src/ruvocal/src/lib/components/chat/OpenReasoningResults.svelte +81 -81
  181. package/src/ruvocal/src/lib/components/chat/TaskGroup.svelte +88 -88
  182. package/src/ruvocal/src/lib/components/chat/ToolUpdate.svelte +273 -273
  183. package/src/ruvocal/src/lib/components/chat/UploadedFile.svelte +253 -253
  184. package/src/ruvocal/src/lib/components/chat/UrlFetchModal.svelte +203 -203
  185. package/src/ruvocal/src/lib/components/chat/VoiceRecorder.svelte +214 -214
  186. package/src/ruvocal/src/lib/components/icons/IconBurger.svelte +20 -20
  187. package/src/ruvocal/src/lib/components/icons/IconCheap.svelte +20 -20
  188. package/src/ruvocal/src/lib/components/icons/IconChevron.svelte +24 -24
  189. package/src/ruvocal/src/lib/components/icons/IconDazzled.svelte +40 -40
  190. package/src/ruvocal/src/lib/components/icons/IconFast.svelte +20 -20
  191. package/src/ruvocal/src/lib/components/icons/IconLoading.svelte +22 -22
  192. package/src/ruvocal/src/lib/components/icons/IconMCP.svelte +28 -28
  193. package/src/ruvocal/src/lib/components/icons/IconMoon.svelte +21 -21
  194. package/src/ruvocal/src/lib/components/icons/IconNew.svelte +20 -20
  195. package/src/ruvocal/src/lib/components/icons/IconOmni.svelte +90 -90
  196. package/src/ruvocal/src/lib/components/icons/IconPaperclip.svelte +24 -24
  197. package/src/ruvocal/src/lib/components/icons/IconPro.svelte +37 -37
  198. package/src/ruvocal/src/lib/components/icons/IconShare.svelte +21 -21
  199. package/src/ruvocal/src/lib/components/icons/IconSun.svelte +93 -93
  200. package/src/ruvocal/src/lib/components/icons/Logo.svelte +68 -68
  201. package/src/ruvocal/src/lib/components/icons/LogoHuggingFaceBorderless.svelte +54 -54
  202. package/src/ruvocal/src/lib/components/mcp/AddServerForm.svelte +250 -250
  203. package/src/ruvocal/src/lib/components/mcp/MCPServerManager.svelte +185 -185
  204. package/src/ruvocal/src/lib/components/mcp/ServerCard.svelte +203 -203
  205. package/src/ruvocal/src/lib/components/players/AudioPlayer.svelte +82 -82
  206. package/src/ruvocal/src/lib/components/voice/AudioWaveform.svelte +96 -96
  207. package/src/ruvocal/src/lib/components/wasm/GalleryPanel.svelte +357 -357
  208. package/src/ruvocal/src/lib/constants/mcpExamples.ts +114 -114
  209. package/src/ruvocal/src/lib/constants/mime.ts +11 -11
  210. package/src/ruvocal/src/lib/constants/pagination.ts +1 -1
  211. package/src/ruvocal/src/lib/constants/publicSepToken.ts +1 -1
  212. package/src/ruvocal/src/lib/constants/routerExamples.ts +133 -133
  213. package/src/ruvocal/src/lib/constants/rvagentPresets.ts +206 -206
  214. package/src/ruvocal/src/lib/createShareLink.ts +27 -27
  215. package/src/ruvocal/src/lib/jobs/refresh-conversation-stats.ts +297 -297
  216. package/src/ruvocal/src/lib/migrations/lock.ts +56 -56
  217. package/src/ruvocal/src/lib/migrations/migrations.spec.ts +74 -74
  218. package/src/ruvocal/src/lib/migrations/migrations.ts +109 -109
  219. package/src/ruvocal/src/lib/migrations/routines/01-update-search-assistants.ts +50 -50
  220. package/src/ruvocal/src/lib/migrations/routines/02-update-assistants-models.ts +48 -48
  221. package/src/ruvocal/src/lib/migrations/routines/04-update-message-updates.ts +151 -151
  222. package/src/ruvocal/src/lib/migrations/routines/05-update-message-files.ts +56 -56
  223. package/src/ruvocal/src/lib/migrations/routines/06-trim-message-updates.ts +56 -56
  224. package/src/ruvocal/src/lib/migrations/routines/08-update-featured-to-review.ts +32 -32
  225. package/src/ruvocal/src/lib/migrations/routines/09-delete-empty-conversations.spec.ts +214 -214
  226. package/src/ruvocal/src/lib/migrations/routines/09-delete-empty-conversations.ts +88 -88
  227. package/src/ruvocal/src/lib/migrations/routines/10-update-reports-assistantid.ts +29 -29
  228. package/src/ruvocal/src/lib/migrations/routines/index.ts +15 -15
  229. package/src/ruvocal/src/lib/server/__tests__/conversation-stop-generating.spec.ts +103 -103
  230. package/src/ruvocal/src/lib/server/abortRegistry.ts +57 -57
  231. package/src/ruvocal/src/lib/server/abortedGenerations.ts +43 -43
  232. package/src/ruvocal/src/lib/server/adminToken.ts +62 -62
  233. package/src/ruvocal/src/lib/server/api/__tests__/conversations-id.spec.ts +296 -296
  234. package/src/ruvocal/src/lib/server/api/__tests__/conversations-message.spec.ts +216 -216
  235. package/src/ruvocal/src/lib/server/api/__tests__/conversations.spec.ts +235 -235
  236. package/src/ruvocal/src/lib/server/api/__tests__/misc.spec.ts +72 -72
  237. package/src/ruvocal/src/lib/server/api/__tests__/testHelpers.ts +86 -86
  238. package/src/ruvocal/src/lib/server/api/__tests__/user-reports.spec.ts +78 -78
  239. package/src/ruvocal/src/lib/server/api/__tests__/user.spec.ts +239 -239
  240. package/src/ruvocal/src/lib/server/api/types.ts +37 -37
  241. package/src/ruvocal/src/lib/server/api/utils/requireAuth.ts +22 -22
  242. package/src/ruvocal/src/lib/server/api/utils/resolveConversation.ts +69 -69
  243. package/src/ruvocal/src/lib/server/api/utils/resolveModel.ts +27 -27
  244. package/src/ruvocal/src/lib/server/api/utils/superjsonResponse.ts +15 -15
  245. package/src/ruvocal/src/lib/server/apiToken.ts +11 -11
  246. package/src/ruvocal/src/lib/server/auth.ts +554 -554
  247. package/src/ruvocal/src/lib/server/config.ts +187 -187
  248. package/src/ruvocal/src/lib/server/conversation.ts +83 -83
  249. package/src/ruvocal/src/lib/server/database/__tests__/rvf.spec.ts +709 -709
  250. package/src/ruvocal/src/lib/server/database/postgres.ts +700 -700
  251. package/src/ruvocal/src/lib/server/database/rvf.ts +1078 -1078
  252. package/src/ruvocal/src/lib/server/database.ts +145 -145
  253. package/src/ruvocal/src/lib/server/endpoints/document.ts +68 -68
  254. package/src/ruvocal/src/lib/server/endpoints/endpoints.ts +43 -43
  255. package/src/ruvocal/src/lib/server/endpoints/images.ts +211 -211
  256. package/src/ruvocal/src/lib/server/endpoints/openai/endpointOai.ts +266 -266
  257. package/src/ruvocal/src/lib/server/endpoints/openai/openAIChatToTextGenerationStream.ts +212 -212
  258. package/src/ruvocal/src/lib/server/endpoints/openai/openAICompletionToTextGenerationStream.ts +32 -32
  259. package/src/ruvocal/src/lib/server/endpoints/preprocessMessages.ts +61 -61
  260. package/src/ruvocal/src/lib/server/exitHandler.ts +59 -59
  261. package/src/ruvocal/src/lib/server/files/downloadFile.ts +34 -34
  262. package/src/ruvocal/src/lib/server/files/uploadFile.ts +29 -29
  263. package/src/ruvocal/src/lib/server/findRepoRoot.ts +13 -13
  264. package/src/ruvocal/src/lib/server/generateFromDefaultEndpoint.ts +46 -46
  265. package/src/ruvocal/src/lib/server/hooks/error.ts +37 -37
  266. package/src/ruvocal/src/lib/server/hooks/fetch.ts +22 -22
  267. package/src/ruvocal/src/lib/server/hooks/handle.ts +250 -250
  268. package/src/ruvocal/src/lib/server/hooks/init.ts +51 -51
  269. package/src/ruvocal/src/lib/server/isURLLocal.spec.ts +31 -31
  270. package/src/ruvocal/src/lib/server/isURLLocal.ts +74 -74
  271. package/src/ruvocal/src/lib/server/logger.ts +42 -42
  272. package/src/ruvocal/src/lib/server/mcp/clientPool.spec.ts +175 -175
  273. package/src/ruvocal/src/lib/server/mcp/hf.ts +32 -32
  274. package/src/ruvocal/src/lib/server/mcp/httpClient.ts +122 -122
  275. package/src/ruvocal/src/lib/server/mcp/registry.ts +76 -76
  276. package/src/ruvocal/src/lib/server/mcp/tools.ts +196 -196
  277. package/src/ruvocal/src/lib/server/metrics.ts +255 -255
  278. package/src/ruvocal/src/lib/server/models.ts +518 -518
  279. package/src/ruvocal/src/lib/server/requestContext.ts +55 -55
  280. package/src/ruvocal/src/lib/server/router/arch.ts +230 -230
  281. package/src/ruvocal/src/lib/server/router/endpoint.ts +316 -316
  282. package/src/ruvocal/src/lib/server/router/multimodal.ts +28 -28
  283. package/src/ruvocal/src/lib/server/router/policy.ts +49 -49
  284. package/src/ruvocal/src/lib/server/router/toolsRoute.ts +51 -51
  285. package/src/ruvocal/src/lib/server/router/types.ts +21 -21
  286. package/src/ruvocal/src/lib/server/sendSlack.ts +23 -23
  287. package/src/ruvocal/src/lib/server/textGeneration/generate.ts +258 -258
  288. package/src/ruvocal/src/lib/server/textGeneration/index.ts +96 -96
  289. package/src/ruvocal/src/lib/server/textGeneration/mcp/fileRefs.ts +155 -155
  290. package/src/ruvocal/src/lib/server/textGeneration/mcp/routerResolution.ts +108 -108
  291. package/src/ruvocal/src/lib/server/textGeneration/mcp/runMcpFlow.ts +831 -831
  292. package/src/ruvocal/src/lib/server/textGeneration/mcp/toolInvocation.ts +349 -349
  293. package/src/ruvocal/src/lib/server/textGeneration/mcp/wasmTools.test.ts +633 -633
  294. package/src/ruvocal/src/lib/server/textGeneration/reasoning.ts +23 -23
  295. package/src/ruvocal/src/lib/server/textGeneration/title.ts +83 -83
  296. package/src/ruvocal/src/lib/server/textGeneration/types.ts +28 -28
  297. package/src/ruvocal/src/lib/server/textGeneration/utils/prepareFiles.ts +88 -88
  298. package/src/ruvocal/src/lib/server/textGeneration/utils/routing.ts +21 -21
  299. package/src/ruvocal/src/lib/server/textGeneration/utils/toolPrompt.ts +49 -49
  300. package/src/ruvocal/src/lib/server/urlSafety.ts +77 -77
  301. package/src/ruvocal/src/lib/server/usageLimits.ts +30 -30
  302. package/src/ruvocal/src/lib/stores/autopilotStore.svelte.ts +175 -175
  303. package/src/ruvocal/src/lib/stores/backgroundGenerations.svelte.ts +32 -32
  304. package/src/ruvocal/src/lib/stores/backgroundGenerations.ts +1 -1
  305. package/src/ruvocal/src/lib/stores/errors.ts +9 -9
  306. package/src/ruvocal/src/lib/stores/isAborted.ts +3 -3
  307. package/src/ruvocal/src/lib/stores/isPro.ts +4 -4
  308. package/src/ruvocal/src/lib/stores/loading.ts +3 -3
  309. package/src/ruvocal/src/lib/stores/mcpServers.ts +534 -534
  310. package/src/ruvocal/src/lib/stores/pendingChatInput.ts +3 -3
  311. package/src/ruvocal/src/lib/stores/pendingMessage.ts +9 -9
  312. package/src/ruvocal/src/lib/stores/settings.ts +182 -182
  313. package/src/ruvocal/src/lib/stores/shareModal.ts +13 -13
  314. package/src/ruvocal/src/lib/stores/titleUpdate.ts +8 -8
  315. package/src/ruvocal/src/lib/stores/wasmMcp.ts +472 -472
  316. package/src/ruvocal/src/lib/switchTheme.ts +124 -124
  317. package/src/ruvocal/src/lib/types/AbortedGeneration.ts +8 -8
  318. package/src/ruvocal/src/lib/types/Assistant.ts +31 -31
  319. package/src/ruvocal/src/lib/types/AssistantStats.ts +11 -11
  320. package/src/ruvocal/src/lib/types/ConfigKey.ts +4 -4
  321. package/src/ruvocal/src/lib/types/ConvSidebar.ts +9 -9
  322. package/src/ruvocal/src/lib/types/Conversation.ts +27 -27
  323. package/src/ruvocal/src/lib/types/ConversationStats.ts +13 -13
  324. package/src/ruvocal/src/lib/types/Message.ts +41 -41
  325. package/src/ruvocal/src/lib/types/MessageEvent.ts +10 -10
  326. package/src/ruvocal/src/lib/types/MessageUpdate.ts +139 -139
  327. package/src/ruvocal/src/lib/types/MigrationResult.ts +7 -7
  328. package/src/ruvocal/src/lib/types/Model.ts +23 -23
  329. package/src/ruvocal/src/lib/types/Report.ts +12 -12
  330. package/src/ruvocal/src/lib/types/Review.ts +6 -6
  331. package/src/ruvocal/src/lib/types/Semaphore.ts +19 -19
  332. package/src/ruvocal/src/lib/types/Session.ts +22 -22
  333. package/src/ruvocal/src/lib/types/Settings.ts +93 -93
  334. package/src/ruvocal/src/lib/types/SharedConversation.ts +9 -9
  335. package/src/ruvocal/src/lib/types/Template.ts +6 -6
  336. package/src/ruvocal/src/lib/types/Timestamps.ts +4 -4
  337. package/src/ruvocal/src/lib/types/TokenCache.ts +6 -6
  338. package/src/ruvocal/src/lib/types/Tool.ts +77 -77
  339. package/src/ruvocal/src/lib/types/UrlDependency.ts +5 -5
  340. package/src/ruvocal/src/lib/types/User.ts +14 -14
  341. package/src/ruvocal/src/lib/utils/PublicConfig.svelte.ts +75 -75
  342. package/src/ruvocal/src/lib/utils/auth.ts +17 -17
  343. package/src/ruvocal/src/lib/utils/chunk.ts +33 -33
  344. package/src/ruvocal/src/lib/utils/cookiesAreEnabled.ts +13 -13
  345. package/src/ruvocal/src/lib/utils/debounce.ts +17 -17
  346. package/src/ruvocal/src/lib/utils/deepestChild.ts +6 -6
  347. package/src/ruvocal/src/lib/utils/favicon.ts +21 -21
  348. package/src/ruvocal/src/lib/utils/fetchJSON.ts +23 -23
  349. package/src/ruvocal/src/lib/utils/file2base64.ts +14 -14
  350. package/src/ruvocal/src/lib/utils/formatUserCount.ts +37 -37
  351. package/src/ruvocal/src/lib/utils/generationState.spec.ts +75 -75
  352. package/src/ruvocal/src/lib/utils/generationState.ts +26 -26
  353. package/src/ruvocal/src/lib/utils/getHref.ts +41 -41
  354. package/src/ruvocal/src/lib/utils/getReturnFromGenerator.ts +7 -7
  355. package/src/ruvocal/src/lib/utils/haptics.ts +64 -64
  356. package/src/ruvocal/src/lib/utils/hashConv.ts +12 -12
  357. package/src/ruvocal/src/lib/utils/hf.ts +17 -17
  358. package/src/ruvocal/src/lib/utils/isDesktop.ts +7 -7
  359. package/src/ruvocal/src/lib/utils/isUrl.ts +8 -8
  360. package/src/ruvocal/src/lib/utils/isVirtualKeyboard.ts +16 -16
  361. package/src/ruvocal/src/lib/utils/loadAttachmentsFromUrls.ts +115 -115
  362. package/src/ruvocal/src/lib/utils/marked.spec.ts +96 -96
  363. package/src/ruvocal/src/lib/utils/marked.ts +531 -531
  364. package/src/ruvocal/src/lib/utils/mcpValidation.ts +147 -147
  365. package/src/ruvocal/src/lib/utils/mergeAsyncGenerators.ts +38 -38
  366. package/src/ruvocal/src/lib/utils/messageUpdates.spec.ts +262 -262
  367. package/src/ruvocal/src/lib/utils/messageUpdates.ts +324 -324
  368. package/src/ruvocal/src/lib/utils/mime.ts +56 -56
  369. package/src/ruvocal/src/lib/utils/models.ts +14 -14
  370. package/src/ruvocal/src/lib/utils/parseBlocks.ts +120 -120
  371. package/src/ruvocal/src/lib/utils/parseIncompleteMarkdown.ts +644 -644
  372. package/src/ruvocal/src/lib/utils/parseStringToList.ts +10 -10
  373. package/src/ruvocal/src/lib/utils/randomUuid.ts +14 -14
  374. package/src/ruvocal/src/lib/utils/searchTokens.ts +33 -33
  375. package/src/ruvocal/src/lib/utils/sha256.ts +7 -7
  376. package/src/ruvocal/src/lib/utils/stringifyError.ts +12 -12
  377. package/src/ruvocal/src/lib/utils/sum.ts +3 -3
  378. package/src/ruvocal/src/lib/utils/template.spec.ts +59 -59
  379. package/src/ruvocal/src/lib/utils/template.ts +53 -53
  380. package/src/ruvocal/src/lib/utils/timeout.ts +9 -9
  381. package/src/ruvocal/src/lib/utils/toolProgress.spec.ts +46 -46
  382. package/src/ruvocal/src/lib/utils/toolProgress.ts +11 -11
  383. package/src/ruvocal/src/lib/utils/tree/addChildren.spec.ts +102 -102
  384. package/src/ruvocal/src/lib/utils/tree/addChildren.ts +48 -48
  385. package/src/ruvocal/src/lib/utils/tree/addSibling.spec.ts +81 -81
  386. package/src/ruvocal/src/lib/utils/tree/addSibling.ts +41 -41
  387. package/src/ruvocal/src/lib/utils/tree/buildSubtree.spec.ts +110 -110
  388. package/src/ruvocal/src/lib/utils/tree/buildSubtree.ts +24 -24
  389. package/src/ruvocal/src/lib/utils/tree/convertLegacyConversation.spec.ts +31 -31
  390. package/src/ruvocal/src/lib/utils/tree/convertLegacyConversation.ts +36 -36
  391. package/src/ruvocal/src/lib/utils/tree/isMessageId.spec.ts +15 -15
  392. package/src/ruvocal/src/lib/utils/tree/isMessageId.ts +5 -5
  393. package/src/ruvocal/src/lib/utils/tree/tree.d.ts +14 -14
  394. package/src/ruvocal/src/lib/utils/tree/treeHelpers.spec.ts +167 -167
  395. package/src/ruvocal/src/lib/utils/updates.ts +39 -39
  396. package/src/ruvocal/src/lib/utils/urlParams.ts +13 -13
  397. package/src/ruvocal/src/lib/wasm/idb.ts +438 -438
  398. package/src/ruvocal/src/lib/wasm/index.ts +1213 -1213
  399. package/src/ruvocal/src/lib/wasm/tests/wasm-capabilities.test.ts +565 -565
  400. package/src/ruvocal/src/lib/wasm/wasm.worker.ts +332 -332
  401. package/src/ruvocal/src/lib/wasm/workerClient.ts +166 -166
  402. package/src/ruvocal/src/lib/workers/autopilotWorker.ts +221 -221
  403. package/src/ruvocal/src/lib/workers/detailFetchWorker.ts +100 -100
  404. package/src/ruvocal/src/lib/workers/markdownWorker.ts +61 -61
  405. package/src/ruvocal/src/routes/+error.svelte +20 -20
  406. package/src/ruvocal/src/routes/+layout.svelte +324 -324
  407. package/src/ruvocal/src/routes/+layout.ts +91 -91
  408. package/src/ruvocal/src/routes/+page.svelte +168 -168
  409. package/src/ruvocal/src/routes/.well-known/oauth-cimd/+server.ts +37 -37
  410. package/src/ruvocal/src/routes/__debug/openai/+server.ts +21 -21
  411. package/src/ruvocal/src/routes/admin/export/+server.ts +159 -159
  412. package/src/ruvocal/src/routes/admin/stats/compute/+server.ts +16 -16
  413. package/src/ruvocal/src/routes/api/conversation/[id]/+server.ts +40 -40
  414. package/src/ruvocal/src/routes/api/conversation/[id]/message/[messageId]/+server.ts +42 -42
  415. package/src/ruvocal/src/routes/api/conversations/+server.ts +48 -48
  416. package/src/ruvocal/src/routes/api/fetch-url/+server.ts +147 -147
  417. package/src/ruvocal/src/routes/api/mcp/health/+server.ts +292 -292
  418. package/src/ruvocal/src/routes/api/mcp/servers/+server.ts +32 -32
  419. package/src/ruvocal/src/routes/api/models/+server.ts +25 -25
  420. package/src/ruvocal/src/routes/api/transcribe/+server.ts +104 -104
  421. package/src/ruvocal/src/routes/api/user/+server.ts +15 -15
  422. package/src/ruvocal/src/routes/api/user/validate-token/+server.ts +20 -20
  423. package/src/ruvocal/src/routes/api/v2/conversations/+server.ts +48 -48
  424. package/src/ruvocal/src/routes/api/v2/conversations/[id]/+server.ts +94 -94
  425. package/src/ruvocal/src/routes/api/v2/conversations/[id]/message/[messageId]/+server.ts +43 -43
  426. package/src/ruvocal/src/routes/api/v2/conversations/import-share/+server.ts +23 -23
  427. package/src/ruvocal/src/routes/api/v2/debug/config/+server.ts +16 -16
  428. package/src/ruvocal/src/routes/api/v2/debug/refresh/+server.ts +30 -30
  429. package/src/ruvocal/src/routes/api/v2/export/+server.ts +196 -196
  430. package/src/ruvocal/src/routes/api/v2/feature-flags/+server.ts +14 -14
  431. package/src/ruvocal/src/routes/api/v2/models/+server.ts +38 -38
  432. package/src/ruvocal/src/routes/api/v2/models/[namespace]/+server.ts +8 -8
  433. package/src/ruvocal/src/routes/api/v2/models/[namespace]/[model]/+server.ts +8 -8
  434. package/src/ruvocal/src/routes/api/v2/models/[namespace]/[model]/subscribe/+server.ts +28 -28
  435. package/src/ruvocal/src/routes/api/v2/models/[namespace]/subscribe/+server.ts +28 -28
  436. package/src/ruvocal/src/routes/api/v2/models/old/+server.ts +7 -7
  437. package/src/ruvocal/src/routes/api/v2/models/refresh/+server.ts +33 -33
  438. package/src/ruvocal/src/routes/api/v2/public-config/+server.ts +7 -7
  439. package/src/ruvocal/src/routes/api/v2/user/+server.ts +17 -17
  440. package/src/ruvocal/src/routes/api/v2/user/billing-orgs/+server.ts +73 -73
  441. package/src/ruvocal/src/routes/api/v2/user/reports/+server.ts +17 -17
  442. package/src/ruvocal/src/routes/api/v2/user/settings/+server.ts +110 -110
  443. package/src/ruvocal/src/routes/conversation/+server.ts +115 -115
  444. package/src/ruvocal/src/routes/conversation/[id]/+page.svelte +586 -586
  445. package/src/ruvocal/src/routes/conversation/[id]/+page.ts +60 -60
  446. package/src/ruvocal/src/routes/conversation/[id]/+server.ts +740 -740
  447. package/src/ruvocal/src/routes/conversation/[id]/message/[messageId]/prompt/+server.ts +66 -66
  448. package/src/ruvocal/src/routes/conversation/[id]/share/+server.ts +69 -69
  449. package/src/ruvocal/src/routes/conversation/[id]/stop-generating/+server.ts +35 -35
  450. package/src/ruvocal/src/routes/healthcheck/+server.ts +3 -3
  451. package/src/ruvocal/src/routes/login/+server.ts +5 -5
  452. package/src/ruvocal/src/routes/login/callback/+server.ts +103 -103
  453. package/src/ruvocal/src/routes/login/callback/updateUser.spec.ts +157 -157
  454. package/src/ruvocal/src/routes/login/callback/updateUser.ts +215 -215
  455. package/src/ruvocal/src/routes/logout/+server.ts +18 -18
  456. package/src/ruvocal/src/routes/metrics/+server.ts +18 -18
  457. package/src/ruvocal/src/routes/models/+page.svelte +233 -233
  458. package/src/ruvocal/src/routes/models/[...model]/+page.svelte +161 -161
  459. package/src/ruvocal/src/routes/models/[...model]/+page.ts +14 -14
  460. package/src/ruvocal/src/routes/models/[...model]/thumbnail.png/+server.ts +64 -64
  461. package/src/ruvocal/src/routes/models/[...model]/thumbnail.png/ModelThumbnail.svelte +28 -28
  462. package/src/ruvocal/src/routes/privacy/+page.svelte +11 -11
  463. package/src/ruvocal/src/routes/r/[id]/+page.ts +34 -34
  464. package/src/ruvocal/src/routes/settings/(nav)/+layout.svelte +282 -282
  465. package/src/ruvocal/src/routes/settings/(nav)/+layout.ts +1 -1
  466. package/src/ruvocal/src/routes/settings/(nav)/+server.ts +59 -59
  467. package/src/ruvocal/src/routes/settings/(nav)/[...model]/+page.svelte +464 -464
  468. package/src/ruvocal/src/routes/settings/(nav)/[...model]/+page.ts +14 -14
  469. package/src/ruvocal/src/routes/settings/(nav)/application/+page.svelte +362 -362
  470. package/src/ruvocal/src/routes/settings/+layout.svelte +40 -40
  471. package/src/ruvocal/src/styles/highlight-js.css +195 -195
  472. package/src/ruvocal/src/styles/main.css +144 -144
  473. package/src/ruvocal/static/chatui/favicon-dark.svg +3 -3
  474. package/src/ruvocal/static/chatui/favicon-dev.svg +3 -3
  475. package/src/ruvocal/static/chatui/favicon.svg +3 -3
  476. package/src/ruvocal/static/chatui/icon.svg +3 -3
  477. package/src/ruvocal/static/chatui/logo.svg +7 -7
  478. package/src/ruvocal/static/chatui/manifest.json +54 -54
  479. package/src/ruvocal/static/chatui/welcome.js +184 -184
  480. package/src/ruvocal/static/huggingchat/favicon-dark.svg +4 -4
  481. package/src/ruvocal/static/huggingchat/favicon-dev.svg +4 -4
  482. package/src/ruvocal/static/huggingchat/favicon.svg +4 -4
  483. package/src/ruvocal/static/huggingchat/fulltext-logo.svg +1 -1
  484. package/src/ruvocal/static/huggingchat/icon.svg +4 -4
  485. package/src/ruvocal/static/huggingchat/logo.svg +4 -4
  486. package/src/ruvocal/static/huggingchat/manifest.json +54 -54
  487. package/src/ruvocal/static/huggingchat/routes.chat.json +226 -226
  488. package/src/ruvocal/static/robots.txt +10 -10
  489. package/src/ruvocal/static/wasm/rvagent_wasm.js +1539 -1539
  490. package/src/ruvocal/stub/@reflink/reflink/package.json +5 -5
  491. package/src/ruvocal/svelte.config.js +53 -53
  492. package/src/ruvocal/tailwind.config.cjs +30 -30
  493. package/src/ruvocal/tsconfig.json +19 -19
  494. package/src/ruvocal/vite.config.ts +87 -87
  495. package/src/scripts/deploy.sh +116 -116
  496. package/src/scripts/generate-config.js +245 -245
  497. package/src/scripts/generate-welcome.js +187 -187
  498. package/src/scripts/package-rvf.sh +116 -116
@@ -1,740 +1,740 @@
1
- import { authCondition } from "$lib/server/auth";
2
- import { collections } from "$lib/server/database";
3
- import { config } from "$lib/server/config";
4
- import { models, validModelIdSchema } from "$lib/server/models";
5
- import { ERROR_MESSAGES } from "$lib/stores/errors";
6
- import type { Message } from "$lib/types/Message";
7
- import { error } from "@sveltejs/kit";
8
- import { ObjectId } from "mongodb";
9
- import { z } from "zod";
10
- import {
11
- MessageUpdateStatus,
12
- MessageUpdateType,
13
- MessageReasoningUpdateType,
14
- type MessageUpdate,
15
- type MessageStreamUpdate,
16
- } from "$lib/types/MessageUpdate";
17
- import { uploadFile } from "$lib/server/files/uploadFile";
18
- import { convertLegacyConversation } from "$lib/utils/tree/convertLegacyConversation";
19
- import { isMessageId } from "$lib/utils/tree/isMessageId";
20
- import { buildSubtree } from "$lib/utils/tree/buildSubtree.js";
21
- import { addChildren } from "$lib/utils/tree/addChildren.js";
22
- import { addSibling } from "$lib/utils/tree/addSibling.js";
23
- import { usageLimits } from "$lib/server/usageLimits";
24
- import { textGeneration } from "$lib/server/textGeneration";
25
- import type { TextGenerationContext } from "$lib/server/textGeneration/types";
26
- import { logger } from "$lib/server/logger.js";
27
- import { AbortRegistry } from "$lib/server/abortRegistry";
28
- import { MetricsServer } from "$lib/server/metrics";
29
-
30
- export async function POST({ request, locals, params, getClientAddress }) {
31
- const id = z.string().parse(params.id);
32
- const convId = new ObjectId(id);
33
- const promptedAt = new Date();
34
-
35
- const userId = locals.user?._id ?? locals.sessionId;
36
-
37
- // check user
38
- if (!userId) {
39
- error(401, "Unauthorized");
40
- }
41
-
42
- // check if the user has access to the conversation
43
- const convBeforeCheck = await collections.conversations.findOne({
44
- _id: convId,
45
- ...authCondition(locals),
46
- });
47
-
48
- if (convBeforeCheck && !convBeforeCheck.rootMessageId) {
49
- const res = await collections.conversations.updateOne(
50
- {
51
- _id: convId,
52
- },
53
- {
54
- $set: {
55
- ...convBeforeCheck,
56
- ...convertLegacyConversation(convBeforeCheck),
57
- },
58
- }
59
- );
60
-
61
- if (!res.acknowledged) {
62
- error(500, "Failed to convert conversation");
63
- }
64
- }
65
-
66
- const conv = await collections.conversations.findOne({
67
- _id: convId,
68
- ...authCondition(locals),
69
- });
70
-
71
- if (!conv) {
72
- error(404, "Conversation not found");
73
- }
74
-
75
- // register the event for ratelimiting
76
- await collections.messageEvents.insertOne({
77
- type: "message",
78
- userId,
79
- createdAt: new Date(),
80
- expiresAt: new Date(Date.now() + 60_000),
81
- ip: getClientAddress(),
82
- });
83
-
84
- if (usageLimits?.messagesPerMinute) {
85
- // check if the user is rate limited
86
- const nEvents = Math.max(
87
- await collections.messageEvents.countDocuments({
88
- userId,
89
- type: "message",
90
- expiresAt: { $gt: new Date() },
91
- }),
92
- await collections.messageEvents.countDocuments({
93
- ip: getClientAddress(),
94
- type: "message",
95
- expiresAt: { $gt: new Date() },
96
- })
97
- );
98
- if (nEvents > usageLimits.messagesPerMinute) {
99
- error(429, ERROR_MESSAGES.rateLimited);
100
- }
101
- }
102
-
103
- if (usageLimits?.messages && conv.messages.length > usageLimits.messages) {
104
- error(
105
- 429,
106
- `This conversation has more than ${usageLimits.messages} messages. Start a new one to continue`
107
- );
108
- }
109
-
110
- // fetch the model
111
- const model = models.find((m) => m.id === conv.model);
112
-
113
- if (!model) {
114
- error(410, "Model not available anymore");
115
- }
116
-
117
- // finally parse the content of the request
118
- const form = await request.formData();
119
-
120
- const json = form.get("data");
121
-
122
- if (!json || typeof json !== "string") {
123
- error(400, "Invalid request");
124
- }
125
-
126
- const {
127
- inputs: newPrompt,
128
- id: messageId,
129
- is_retry: isRetry,
130
- selectedMcpServerNames,
131
- selectedMcpServers,
132
- autopilot,
133
- autopilotMaxSteps,
134
- } = z
135
- .object({
136
- id: z.string().uuid().refine(isMessageId).optional(), // parent message id to append to for a normal message, or the message id for a retry/continue
137
- inputs: z.optional(
138
- z
139
- .string()
140
- .min(1)
141
- .transform((s) => s.replace(/\r\n/g, "\n"))
142
- ),
143
- is_retry: z.optional(z.boolean()),
144
- autopilot: z.optional(z.boolean()),
145
- // User-configurable cap on autopilot tool-call loops. Server clamps to [1, 100].
146
- autopilotMaxSteps: z.optional(z.number().int().min(1).max(100)),
147
- selectedMcpServerNames: z.optional(z.array(z.string())),
148
- selectedMcpServers: z
149
- .optional(
150
- z.array(
151
- z.object({
152
- name: z.string(),
153
- url: z.string(),
154
- headers: z
155
- .optional(z.array(z.object({ key: z.string(), value: z.string() })))
156
- .default([]),
157
- })
158
- )
159
- )
160
- .default([]),
161
- files: z.optional(
162
- z.array(
163
- z.object({
164
- type: z.literal("base64").or(z.literal("hash")),
165
- name: z.string(),
166
- value: z.string(),
167
- mime: z.string(),
168
- })
169
- )
170
- ),
171
- })
172
- .parse(JSON.parse(json));
173
-
174
- // Attach MCP selection to locals so the text generation pipeline can consume it
175
- try {
176
- (locals as unknown as Record<string, unknown>).mcp = {
177
- selectedServerNames: selectedMcpServerNames,
178
- selectedServers: (selectedMcpServers ?? []).map((s) => ({
179
- name: s.name,
180
- url: s.url,
181
- headers:
182
- s.headers && s.headers.length > 0
183
- ? Object.fromEntries(s.headers.map((h) => [h.key, h.value]))
184
- : undefined,
185
- })),
186
- };
187
- } catch {
188
- // ignore attachment errors, pipeline will just use env servers
189
- }
190
-
191
- const inputFiles = await Promise.all(
192
- form
193
- .getAll("files")
194
- .filter((entry): entry is File => entry instanceof File && entry.size > 0)
195
- .map(async (file) => {
196
- const [type, ...name] = file.name.split(";");
197
-
198
- return {
199
- type: z.literal("base64").or(z.literal("hash")).parse(type),
200
- value: await file.text(),
201
- mime: file.type,
202
- name: name.join(";"),
203
- };
204
- })
205
- );
206
-
207
- if (usageLimits?.messageLength && (newPrompt?.length ?? 0) > usageLimits.messageLength) {
208
- error(400, "Message too long.");
209
- }
210
-
211
- // each file is either:
212
- // base64 string requiring upload to the server
213
- // hash pointing to an existing file
214
- const hashFiles = inputFiles?.filter((file) => file.type === "hash") ?? [];
215
- const b64Files =
216
- inputFiles
217
- ?.filter((file) => file.type !== "hash")
218
- .map((file) => {
219
- const blob = Buffer.from(file.value, "base64");
220
- return new File([blob], file.name, { type: file.mime });
221
- }) ?? [];
222
-
223
- // check sizes
224
- // todo: make configurable
225
- if (b64Files.some((file) => file.size > 10 * 1024 * 1024)) {
226
- error(413, "File too large, should be <10MB");
227
- }
228
-
229
- const uploadedFiles = await Promise.all(b64Files.map((file) => uploadFile(file, conv))).then(
230
- (files) => [...files, ...hashFiles]
231
- );
232
-
233
- // we will append tokens to the content of this message
234
- let messageToWriteToId: Message["id"] | undefined = undefined;
235
- // used for building the prompt, subtree of the conversation that goes from the latest message to the root
236
- let messagesForPrompt: Message[] = [];
237
-
238
- if (isRetry && messageId) {
239
- // two cases, if we're retrying a user message with a newPrompt set,
240
- // it means we're editing a user message
241
- // if we're retrying on an assistant message, newPrompt cannot be set
242
- // it means we're retrying the last assistant message for a new answer
243
-
244
- const messageToRetry = conv.messages.find((message) => message.id === messageId);
245
-
246
- if (!messageToRetry) {
247
- error(404, "Message not found");
248
- }
249
-
250
- if (messageToRetry.from === "user" && newPrompt) {
251
- // add a sibling to this message from the user, with the alternative prompt
252
- // add a children to that sibling, where we can write to
253
- const newUserMessageId = addSibling(
254
- conv,
255
- {
256
- from: "user",
257
- content: newPrompt,
258
- files: uploadedFiles,
259
- createdAt: new Date(),
260
- updatedAt: new Date(),
261
- },
262
- messageId
263
- );
264
- messageToWriteToId = addChildren(
265
- conv,
266
- {
267
- from: "assistant",
268
- content: "",
269
- createdAt: new Date(),
270
- updatedAt: new Date(),
271
- },
272
- newUserMessageId
273
- );
274
- messagesForPrompt = buildSubtree(conv, newUserMessageId);
275
- } else if (messageToRetry.from === "assistant") {
276
- // we're retrying an assistant message, to generate a new answer
277
- // just add a sibling to the assistant answer where we can write to
278
- messageToWriteToId = addSibling(
279
- conv,
280
- { from: "assistant", content: "", createdAt: new Date(), updatedAt: new Date() },
281
- messageId
282
- );
283
- messagesForPrompt = buildSubtree(conv, messageId);
284
- messagesForPrompt.pop(); // don't need the latest assistant message in the prompt since we're retrying it
285
- }
286
- } else {
287
- // just a normal linear conversation, so we add the user message
288
- // and the blank assistant message back to back
289
- const newUserMessageId = addChildren(
290
- conv,
291
- {
292
- from: "user",
293
- content: newPrompt ?? "",
294
- files: uploadedFiles,
295
- createdAt: new Date(),
296
- updatedAt: new Date(),
297
- },
298
- messageId
299
- );
300
-
301
- messageToWriteToId = addChildren(
302
- conv,
303
- {
304
- from: "assistant",
305
- content: "",
306
- createdAt: new Date(),
307
- updatedAt: new Date(),
308
- },
309
- newUserMessageId
310
- );
311
- // build the prompt from the user message
312
- messagesForPrompt = buildSubtree(conv, newUserMessageId);
313
- }
314
-
315
- const messageToWriteTo = conv.messages.find((message) => message.id === messageToWriteToId);
316
- if (!messageToWriteTo) {
317
- error(500, "Failed to create message");
318
- }
319
- if (messagesForPrompt.length === 0) {
320
- error(500, "Failed to create prompt");
321
- }
322
-
323
- // update the conversation with the new messages
324
- await collections.conversations.updateOne(
325
- { _id: convId },
326
- { $set: { messages: conv.messages, title: conv.title, updatedAt: new Date() } }
327
- );
328
-
329
- let doneStreaming = false;
330
- let clientDetached = false;
331
-
332
- let lastTokenTimestamp: undefined | Date = undefined;
333
- let firstTokenObserved = false;
334
- const metricsEnabled = MetricsServer.isEnabled();
335
- const metrics = metricsEnabled ? MetricsServer.getMetrics() : undefined;
336
- const metricsModelId = model.id ?? model.name ?? conv.model;
337
- const metricsLabels = { model: metricsModelId };
338
-
339
- const persistConversation = async () => {
340
- const messagesForSave = conv.messages.map((msg) => {
341
- const filteredUpdates =
342
- msg.updates
343
- ?.filter(
344
- (u) =>
345
- !(u.type === MessageUpdateType.Status && u.status === MessageUpdateStatus.KeepAlive)
346
- )
347
- .map((u) => {
348
- if (u.type !== MessageUpdateType.Stream) return u;
349
- // Preserve existing len if already compressed, otherwise compute from token
350
- const len = u.len ?? (u.token ?? "").length;
351
- // store a lightweight marker to preserve ordering without duplicating content
352
- return { type: MessageUpdateType.Stream, token: "", len } satisfies MessageStreamUpdate;
353
- }) ?? [];
354
-
355
- return { ...msg, updates: filteredUpdates };
356
- });
357
-
358
- await collections.conversations.updateOne(
359
- { _id: convId },
360
- { $set: { messages: messagesForSave, title: conv.title, updatedAt: new Date() } }
361
- );
362
- };
363
-
364
- const abortRegistry = AbortRegistry.getInstance();
365
-
366
- // we now build the stream
367
- const stream = new ReadableStream({
368
- async start(controller) {
369
- const conversationKey = convId.toString();
370
- const ctrl = new AbortController();
371
- abortRegistry.register(conversationKey, ctrl);
372
-
373
- let finalAnswerReceived = false;
374
- let abortedByUser = false;
375
- let finishedStatusSent = false;
376
-
377
- messageToWriteTo.updates ??= [];
378
- async function update(event: MessageUpdate) {
379
- if (!messageToWriteTo || !conv) {
380
- throw Error("No message or conversation to write events to");
381
- }
382
-
383
- if (
384
- event.type === MessageUpdateType.Status &&
385
- event.status === MessageUpdateStatus.Finished
386
- ) {
387
- finishedStatusSent = true;
388
- }
389
-
390
- // Add token to content or skip if empty
391
- if (event.type === MessageUpdateType.Stream) {
392
- if (event.token === "") return;
393
- messageToWriteTo.content += event.token;
394
-
395
- if (metricsEnabled && metrics) {
396
- const now = Date.now();
397
- metrics.model.tokenCountTotal.inc(metricsLabels);
398
-
399
- if (!firstTokenObserved) {
400
- metrics.model.timeToFirstToken.observe(metricsLabels, now - promptedAt.getTime());
401
- firstTokenObserved = true;
402
- }
403
-
404
- const previousTimestamp = lastTokenTimestamp
405
- ? lastTokenTimestamp.getTime()
406
- : promptedAt.getTime();
407
- metrics.model.timePerOutputToken.observe(metricsLabels, now - previousTimestamp);
408
- }
409
-
410
- lastTokenTimestamp = new Date();
411
- }
412
-
413
- // Append reasoning stream tokens to message.reasoning (server-side)
414
- else if (
415
- event.type === MessageUpdateType.Reasoning &&
416
- event.subtype === MessageReasoningUpdateType.Stream &&
417
- "token" in event
418
- ) {
419
- messageToWriteTo.reasoning ??= "";
420
- messageToWriteTo.reasoning += event.token;
421
- }
422
-
423
- // Set the title
424
- else if (event.type === MessageUpdateType.Title) {
425
- // Always strip <think> markers from titles when saving
426
- const sanitizedTitle = event.title.replace(/<\/?think>/gi, "").trim();
427
- conv.title = sanitizedTitle;
428
- await collections.conversations.updateOne(
429
- { _id: convId },
430
- { $set: { title: conv?.title, updatedAt: new Date() } }
431
- );
432
- }
433
-
434
- // Set the final text and the interrupted flag
435
- else if (event.type === MessageUpdateType.FinalAnswer) {
436
- messageToWriteTo.interrupted = event.interrupted;
437
- // Default behavior: replace the streamed text with the provider's final text.
438
- // However, when tools (MCP/function calls) were used, providers often stream
439
- // some content (e.g., a story) before triggering tools, then return a
440
- // different follow‑up message afterwards (e.g., an image caption). Our
441
- // previous logic overwrote the pre‑tool content. Preserve it by merging in
442
- // the pre‑tool stream when tool updates occurred and the final text does
443
- // not already include the streamed prefix.
444
- const hadTools = (messageToWriteTo.updates ?? []).some(
445
- (u) => u.type === MessageUpdateType.Tool
446
- );
447
-
448
- if (hadTools) {
449
- const existing = messageToWriteTo.content.slice(initialMessageContent.length);
450
- if (existing && existing.length > 0) {
451
- // A. If we already streamed the same final text, keep as-is.
452
- if (event.text && existing.endsWith(event.text)) {
453
- messageToWriteTo.content = initialMessageContent + existing;
454
- }
455
- // B. If the final text already includes the streamed prefix, use it verbatim.
456
- else if (event.text && event.text.startsWith(existing)) {
457
- messageToWriteTo.content = initialMessageContent + event.text;
458
- }
459
- // C. Otherwise, merge with a paragraph break for readability.
460
- else {
461
- const needsGap = !/\n\n$/.test(existing) && !/^\n/.test(event.text ?? "");
462
- messageToWriteTo.content =
463
- initialMessageContent + existing + (needsGap ? "\n\n" : "") + (event.text ?? "");
464
- }
465
- } else {
466
- messageToWriteTo.content = initialMessageContent + (event.text ?? "");
467
- }
468
- } else {
469
- messageToWriteTo.content = initialMessageContent + event.text;
470
- }
471
- finalAnswerReceived = true;
472
-
473
- if (metricsEnabled && metrics) {
474
- metrics.model.latency.observe(metricsLabels, Date.now() - promptedAt.getTime());
475
- }
476
- }
477
-
478
- // Add file
479
- else if (event.type === MessageUpdateType.File) {
480
- messageToWriteTo.files = [
481
- ...(messageToWriteTo.files ?? []),
482
- { type: "hash", name: event.name, value: event.sha, mime: event.mime },
483
- ];
484
- }
485
-
486
- // Store router metadata (for router models) or provider info (for all models)
487
- else if (event.type === MessageUpdateType.RouterMetadata) {
488
- // Merge metadata updates to preserve existing fields (router may send route/model first, then provider comes later)
489
- if (model?.isRouter) {
490
- messageToWriteTo.routerMetadata = {
491
- route: event.route || messageToWriteTo.routerMetadata?.route || "",
492
- model: event.model || messageToWriteTo.routerMetadata?.model || "",
493
- provider: event.provider || messageToWriteTo.routerMetadata?.provider,
494
- };
495
- }
496
- // Store provider-only metadata for non-router models if available
497
- else if (event.provider) {
498
- messageToWriteTo.routerMetadata = {
499
- route: messageToWriteTo.routerMetadata?.route || "",
500
- model: messageToWriteTo.routerMetadata?.model || "",
501
- provider: event.provider,
502
- };
503
- }
504
- }
505
-
506
- // Append updates for audit/replay (streams too, to preserve ordering)
507
- if (
508
- !(
509
- event.type === MessageUpdateType.Status &&
510
- event.status === MessageUpdateStatus.KeepAlive
511
- )
512
- ) {
513
- messageToWriteTo?.updates?.push(
514
- event.type === MessageUpdateType.Stream ? { ...event } : event
515
- );
516
- }
517
-
518
- // Avoid remote keylogging attack executed by watching packet lengths
519
- // by padding the text with null chars to a fixed length
520
- // https://cdn.arstechnica.net/wp-content/uploads/2024/03/LLM-Side-Channel.pdf
521
- if (event.type === MessageUpdateType.Stream) {
522
- event = { ...event, token: event.token.padEnd(16, "\0") };
523
- }
524
-
525
- messageToWriteTo.updatedAt = new Date();
526
-
527
- const enqueueUpdate = async () => {
528
- if (clientDetached) return;
529
- try {
530
- controller.enqueue(JSON.stringify(event) + "\n");
531
- if (event.type === MessageUpdateType.FinalAnswer) {
532
- controller.enqueue(" ".repeat(4096));
533
- }
534
- } catch (err) {
535
- clientDetached = true;
536
- logger.info(
537
- { conversationId: convId.toString() },
538
- "Client detached during message streaming"
539
- );
540
- }
541
- };
542
-
543
- await enqueueUpdate();
544
-
545
- if (clientDetached) {
546
- await persistConversation();
547
- }
548
- }
549
-
550
- let hasError = false;
551
- const initialMessageContent = messageToWriteTo.content;
552
-
553
- try {
554
- // Fetch user settings once for all overrides and billing org
555
- const userSettings = await collections.settings.findOne(authCondition(locals));
556
-
557
- // Add billing organization to locals for the endpoint to use
558
- locals.billingOrganization = userSettings?.billingOrganization;
559
-
560
- const ctx: TextGenerationContext = {
561
- model,
562
- endpoint: await model.getEndpoint(),
563
- conv,
564
- messages: messagesForPrompt,
565
- assistant: undefined,
566
- promptedAt,
567
- ip: getClientAddress(),
568
- username: locals.user?.username,
569
- // Force-enable multimodal if user settings say so for this model
570
- forceMultimodal: Boolean(userSettings?.multimodalOverrides?.[model.id]),
571
- // Force-enable tools if user settings say so for this model
572
- forceTools: Boolean(userSettings?.toolsOverrides?.[model.id]),
573
- // Inference provider preference (HuggingChat only, skip for router models)
574
- provider:
575
- config.isHuggingChat && !model.isRouter
576
- ? userSettings?.providerOverrides?.[model.id]
577
- : undefined,
578
- locals,
579
- abortController: ctrl,
580
- autopilot: autopilot === true,
581
- autopilotMaxSteps,
582
- };
583
- // run the text generation and send updates to the client
584
- for await (const event of textGeneration(ctx)) await update(event);
585
- if (ctrl.signal.aborted) {
586
- abortedByUser = true;
587
- }
588
- if (abortedByUser && !finalAnswerReceived) {
589
- const partialText = messageToWriteTo.content.slice(initialMessageContent.length);
590
- await update({
591
- type: MessageUpdateType.FinalAnswer,
592
- text: partialText,
593
- interrupted: true,
594
- });
595
- }
596
- } catch (e) {
597
- const err = e as Error;
598
- const isAbortError =
599
- err?.name === "AbortError" ||
600
- err?.name === "APIUserAbortError" ||
601
- err?.message === "Request was aborted.";
602
- if (isAbortError || ctrl.signal.aborted) {
603
- abortedByUser = true;
604
- logger.info({ conversationId: conversationKey }, "Generation aborted by user");
605
- if (!finalAnswerReceived) {
606
- const partialText = messageToWriteTo.content.slice(initialMessageContent.length);
607
- await update({
608
- type: MessageUpdateType.FinalAnswer,
609
- text: partialText,
610
- interrupted: true,
611
- });
612
- }
613
- } else {
614
- hasError = true;
615
- // Extract status code if available from HTTPError or APIError
616
- const errObj = err as unknown as Record<string, unknown>;
617
- const statusCode =
618
- (typeof errObj.statusCode === "number" ? errObj.statusCode : undefined) ||
619
- (typeof errObj.status === "number" ? errObj.status : undefined);
620
- await update({
621
- type: MessageUpdateType.Status,
622
- status: MessageUpdateStatus.Error,
623
- message: err.message,
624
- ...(statusCode && { statusCode }),
625
- });
626
- logger.error(err, "Error in conversation stream");
627
- }
628
- } finally {
629
- // check if no output was generated
630
- if (!hasError && !abortedByUser && messageToWriteTo.content === initialMessageContent) {
631
- hasError = true;
632
- logger.warn(
633
- {
634
- conversationId: conversationKey,
635
- updatesCount: messageToWriteTo.updates?.length ?? 0,
636
- filesCount: messageToWriteTo.files?.length ?? 0,
637
- reasoningLen: messageToWriteTo.reasoning?.length ?? 0,
638
- initialLen: initialMessageContent.length,
639
- finalLen: messageToWriteTo.content.length,
640
- },
641
- "No output generated after streaming; emitting error status"
642
- );
643
- await update({
644
- type: MessageUpdateType.Status,
645
- status: MessageUpdateStatus.Error,
646
- message: "No output was generated. Something went wrong.",
647
- });
648
- }
649
- }
650
-
651
- if (!hasError && !finishedStatusSent) {
652
- await update({
653
- type: MessageUpdateType.Status,
654
- status: MessageUpdateStatus.Finished,
655
- });
656
- }
657
-
658
- await persistConversation();
659
- abortRegistry.unregister(conversationKey, ctrl);
660
-
661
- // used to detect if cancel() is called bc of interrupt or just because the connection closes
662
- doneStreaming = true;
663
- if (!clientDetached) {
664
- controller.close();
665
- }
666
- },
667
- async cancel() {
668
- if (doneStreaming) return;
669
- clientDetached = true;
670
- await persistConversation();
671
- },
672
- });
673
-
674
- if (metricsEnabled && metrics) {
675
- metrics.model.messagesTotal.inc(metricsLabels);
676
- }
677
-
678
- // Todo: maybe we should wait for the message to be saved before ending the response - in case of errors
679
- return new Response(stream, {
680
- headers: {
681
- "Content-Type": "application/jsonl",
682
- },
683
- });
684
- }
685
-
686
- export async function DELETE({ locals, params }) {
687
- const convId = new ObjectId(params.id);
688
-
689
- const conv = await collections.conversations.findOne({
690
- _id: convId,
691
- ...authCondition(locals),
692
- });
693
-
694
- if (!conv) {
695
- error(404, "Conversation not found");
696
- }
697
-
698
- await collections.conversations.deleteOne({ _id: conv._id });
699
-
700
- return new Response();
701
- }
702
-
703
- export async function PATCH({ request, locals, params }) {
704
- const values = z
705
- .object({
706
- title: z.string().trim().min(1).max(100).optional(),
707
- model: validModelIdSchema.optional(),
708
- })
709
- .parse(await request.json());
710
-
711
- const convId = new ObjectId(params.id);
712
-
713
- const conv = await collections.conversations.findOne({
714
- _id: convId,
715
- ...authCondition(locals),
716
- });
717
-
718
- if (!conv) {
719
- error(404, "Conversation not found");
720
- }
721
-
722
- // Only include defined values in the update, with title sanitized
723
- const updateValues = {
724
- ...(values.title !== undefined && {
725
- title: values.title.replace(/<\/?think>/gi, "").trim(),
726
- }),
727
- ...(values.model !== undefined && { model: values.model }),
728
- };
729
-
730
- await collections.conversations.updateOne(
731
- {
732
- _id: convId,
733
- },
734
- {
735
- $set: updateValues,
736
- }
737
- );
738
-
739
- return new Response();
740
- }
1
+ import { authCondition } from "$lib/server/auth";
2
+ import { collections } from "$lib/server/database";
3
+ import { config } from "$lib/server/config";
4
+ import { models, validModelIdSchema } from "$lib/server/models";
5
+ import { ERROR_MESSAGES } from "$lib/stores/errors";
6
+ import type { Message } from "$lib/types/Message";
7
+ import { error } from "@sveltejs/kit";
8
+ import { ObjectId } from "mongodb";
9
+ import { z } from "zod";
10
+ import {
11
+ MessageUpdateStatus,
12
+ MessageUpdateType,
13
+ MessageReasoningUpdateType,
14
+ type MessageUpdate,
15
+ type MessageStreamUpdate,
16
+ } from "$lib/types/MessageUpdate";
17
+ import { uploadFile } from "$lib/server/files/uploadFile";
18
+ import { convertLegacyConversation } from "$lib/utils/tree/convertLegacyConversation";
19
+ import { isMessageId } from "$lib/utils/tree/isMessageId";
20
+ import { buildSubtree } from "$lib/utils/tree/buildSubtree.js";
21
+ import { addChildren } from "$lib/utils/tree/addChildren.js";
22
+ import { addSibling } from "$lib/utils/tree/addSibling.js";
23
+ import { usageLimits } from "$lib/server/usageLimits";
24
+ import { textGeneration } from "$lib/server/textGeneration";
25
+ import type { TextGenerationContext } from "$lib/server/textGeneration/types";
26
+ import { logger } from "$lib/server/logger.js";
27
+ import { AbortRegistry } from "$lib/server/abortRegistry";
28
+ import { MetricsServer } from "$lib/server/metrics";
29
+
30
+ export async function POST({ request, locals, params, getClientAddress }) {
31
+ const id = z.string().parse(params.id);
32
+ const convId = new ObjectId(id);
33
+ const promptedAt = new Date();
34
+
35
+ const userId = locals.user?._id ?? locals.sessionId;
36
+
37
+ // check user
38
+ if (!userId) {
39
+ error(401, "Unauthorized");
40
+ }
41
+
42
+ // check if the user has access to the conversation
43
+ const convBeforeCheck = await collections.conversations.findOne({
44
+ _id: convId,
45
+ ...authCondition(locals),
46
+ });
47
+
48
+ if (convBeforeCheck && !convBeforeCheck.rootMessageId) {
49
+ const res = await collections.conversations.updateOne(
50
+ {
51
+ _id: convId,
52
+ },
53
+ {
54
+ $set: {
55
+ ...convBeforeCheck,
56
+ ...convertLegacyConversation(convBeforeCheck),
57
+ },
58
+ }
59
+ );
60
+
61
+ if (!res.acknowledged) {
62
+ error(500, "Failed to convert conversation");
63
+ }
64
+ }
65
+
66
+ const conv = await collections.conversations.findOne({
67
+ _id: convId,
68
+ ...authCondition(locals),
69
+ });
70
+
71
+ if (!conv) {
72
+ error(404, "Conversation not found");
73
+ }
74
+
75
+ // register the event for ratelimiting
76
+ await collections.messageEvents.insertOne({
77
+ type: "message",
78
+ userId,
79
+ createdAt: new Date(),
80
+ expiresAt: new Date(Date.now() + 60_000),
81
+ ip: getClientAddress(),
82
+ });
83
+
84
+ if (usageLimits?.messagesPerMinute) {
85
+ // check if the user is rate limited
86
+ const nEvents = Math.max(
87
+ await collections.messageEvents.countDocuments({
88
+ userId,
89
+ type: "message",
90
+ expiresAt: { $gt: new Date() },
91
+ }),
92
+ await collections.messageEvents.countDocuments({
93
+ ip: getClientAddress(),
94
+ type: "message",
95
+ expiresAt: { $gt: new Date() },
96
+ })
97
+ );
98
+ if (nEvents > usageLimits.messagesPerMinute) {
99
+ error(429, ERROR_MESSAGES.rateLimited);
100
+ }
101
+ }
102
+
103
+ if (usageLimits?.messages && conv.messages.length > usageLimits.messages) {
104
+ error(
105
+ 429,
106
+ `This conversation has more than ${usageLimits.messages} messages. Start a new one to continue`
107
+ );
108
+ }
109
+
110
+ // fetch the model
111
+ const model = models.find((m) => m.id === conv.model);
112
+
113
+ if (!model) {
114
+ error(410, "Model not available anymore");
115
+ }
116
+
117
+ // finally parse the content of the request
118
+ const form = await request.formData();
119
+
120
+ const json = form.get("data");
121
+
122
+ if (!json || typeof json !== "string") {
123
+ error(400, "Invalid request");
124
+ }
125
+
126
+ const {
127
+ inputs: newPrompt,
128
+ id: messageId,
129
+ is_retry: isRetry,
130
+ selectedMcpServerNames,
131
+ selectedMcpServers,
132
+ autopilot,
133
+ autopilotMaxSteps,
134
+ } = z
135
+ .object({
136
+ id: z.string().uuid().refine(isMessageId).optional(), // parent message id to append to for a normal message, or the message id for a retry/continue
137
+ inputs: z.optional(
138
+ z
139
+ .string()
140
+ .min(1)
141
+ .transform((s) => s.replace(/\r\n/g, "\n"))
142
+ ),
143
+ is_retry: z.optional(z.boolean()),
144
+ autopilot: z.optional(z.boolean()),
145
+ // User-configurable cap on autopilot tool-call loops. Server clamps to [1, 100].
146
+ autopilotMaxSteps: z.optional(z.number().int().min(1).max(100)),
147
+ selectedMcpServerNames: z.optional(z.array(z.string())),
148
+ selectedMcpServers: z
149
+ .optional(
150
+ z.array(
151
+ z.object({
152
+ name: z.string(),
153
+ url: z.string(),
154
+ headers: z
155
+ .optional(z.array(z.object({ key: z.string(), value: z.string() })))
156
+ .default([]),
157
+ })
158
+ )
159
+ )
160
+ .default([]),
161
+ files: z.optional(
162
+ z.array(
163
+ z.object({
164
+ type: z.literal("base64").or(z.literal("hash")),
165
+ name: z.string(),
166
+ value: z.string(),
167
+ mime: z.string(),
168
+ })
169
+ )
170
+ ),
171
+ })
172
+ .parse(JSON.parse(json));
173
+
174
+ // Attach MCP selection to locals so the text generation pipeline can consume it
175
+ try {
176
+ (locals as unknown as Record<string, unknown>).mcp = {
177
+ selectedServerNames: selectedMcpServerNames,
178
+ selectedServers: (selectedMcpServers ?? []).map((s) => ({
179
+ name: s.name,
180
+ url: s.url,
181
+ headers:
182
+ s.headers && s.headers.length > 0
183
+ ? Object.fromEntries(s.headers.map((h) => [h.key, h.value]))
184
+ : undefined,
185
+ })),
186
+ };
187
+ } catch {
188
+ // ignore attachment errors, pipeline will just use env servers
189
+ }
190
+
191
+ const inputFiles = await Promise.all(
192
+ form
193
+ .getAll("files")
194
+ .filter((entry): entry is File => entry instanceof File && entry.size > 0)
195
+ .map(async (file) => {
196
+ const [type, ...name] = file.name.split(";");
197
+
198
+ return {
199
+ type: z.literal("base64").or(z.literal("hash")).parse(type),
200
+ value: await file.text(),
201
+ mime: file.type,
202
+ name: name.join(";"),
203
+ };
204
+ })
205
+ );
206
+
207
+ if (usageLimits?.messageLength && (newPrompt?.length ?? 0) > usageLimits.messageLength) {
208
+ error(400, "Message too long.");
209
+ }
210
+
211
+ // each file is either:
212
+ // base64 string requiring upload to the server
213
+ // hash pointing to an existing file
214
+ const hashFiles = inputFiles?.filter((file) => file.type === "hash") ?? [];
215
+ const b64Files =
216
+ inputFiles
217
+ ?.filter((file) => file.type !== "hash")
218
+ .map((file) => {
219
+ const blob = Buffer.from(file.value, "base64");
220
+ return new File([blob], file.name, { type: file.mime });
221
+ }) ?? [];
222
+
223
+ // check sizes
224
+ // todo: make configurable
225
+ if (b64Files.some((file) => file.size > 10 * 1024 * 1024)) {
226
+ error(413, "File too large, should be <10MB");
227
+ }
228
+
229
+ const uploadedFiles = await Promise.all(b64Files.map((file) => uploadFile(file, conv))).then(
230
+ (files) => [...files, ...hashFiles]
231
+ );
232
+
233
+ // we will append tokens to the content of this message
234
+ let messageToWriteToId: Message["id"] | undefined = undefined;
235
+ // used for building the prompt, subtree of the conversation that goes from the latest message to the root
236
+ let messagesForPrompt: Message[] = [];
237
+
238
+ if (isRetry && messageId) {
239
+ // two cases, if we're retrying a user message with a newPrompt set,
240
+ // it means we're editing a user message
241
+ // if we're retrying on an assistant message, newPrompt cannot be set
242
+ // it means we're retrying the last assistant message for a new answer
243
+
244
+ const messageToRetry = conv.messages.find((message) => message.id === messageId);
245
+
246
+ if (!messageToRetry) {
247
+ error(404, "Message not found");
248
+ }
249
+
250
+ if (messageToRetry.from === "user" && newPrompt) {
251
+ // add a sibling to this message from the user, with the alternative prompt
252
+ // add a children to that sibling, where we can write to
253
+ const newUserMessageId = addSibling(
254
+ conv,
255
+ {
256
+ from: "user",
257
+ content: newPrompt,
258
+ files: uploadedFiles,
259
+ createdAt: new Date(),
260
+ updatedAt: new Date(),
261
+ },
262
+ messageId
263
+ );
264
+ messageToWriteToId = addChildren(
265
+ conv,
266
+ {
267
+ from: "assistant",
268
+ content: "",
269
+ createdAt: new Date(),
270
+ updatedAt: new Date(),
271
+ },
272
+ newUserMessageId
273
+ );
274
+ messagesForPrompt = buildSubtree(conv, newUserMessageId);
275
+ } else if (messageToRetry.from === "assistant") {
276
+ // we're retrying an assistant message, to generate a new answer
277
+ // just add a sibling to the assistant answer where we can write to
278
+ messageToWriteToId = addSibling(
279
+ conv,
280
+ { from: "assistant", content: "", createdAt: new Date(), updatedAt: new Date() },
281
+ messageId
282
+ );
283
+ messagesForPrompt = buildSubtree(conv, messageId);
284
+ messagesForPrompt.pop(); // don't need the latest assistant message in the prompt since we're retrying it
285
+ }
286
+ } else {
287
+ // just a normal linear conversation, so we add the user message
288
+ // and the blank assistant message back to back
289
+ const newUserMessageId = addChildren(
290
+ conv,
291
+ {
292
+ from: "user",
293
+ content: newPrompt ?? "",
294
+ files: uploadedFiles,
295
+ createdAt: new Date(),
296
+ updatedAt: new Date(),
297
+ },
298
+ messageId
299
+ );
300
+
301
+ messageToWriteToId = addChildren(
302
+ conv,
303
+ {
304
+ from: "assistant",
305
+ content: "",
306
+ createdAt: new Date(),
307
+ updatedAt: new Date(),
308
+ },
309
+ newUserMessageId
310
+ );
311
+ // build the prompt from the user message
312
+ messagesForPrompt = buildSubtree(conv, newUserMessageId);
313
+ }
314
+
315
+ const messageToWriteTo = conv.messages.find((message) => message.id === messageToWriteToId);
316
+ if (!messageToWriteTo) {
317
+ error(500, "Failed to create message");
318
+ }
319
+ if (messagesForPrompt.length === 0) {
320
+ error(500, "Failed to create prompt");
321
+ }
322
+
323
+ // update the conversation with the new messages
324
+ await collections.conversations.updateOne(
325
+ { _id: convId },
326
+ { $set: { messages: conv.messages, title: conv.title, updatedAt: new Date() } }
327
+ );
328
+
329
+ let doneStreaming = false;
330
+ let clientDetached = false;
331
+
332
+ let lastTokenTimestamp: undefined | Date = undefined;
333
+ let firstTokenObserved = false;
334
+ const metricsEnabled = MetricsServer.isEnabled();
335
+ const metrics = metricsEnabled ? MetricsServer.getMetrics() : undefined;
336
+ const metricsModelId = model.id ?? model.name ?? conv.model;
337
+ const metricsLabels = { model: metricsModelId };
338
+
339
+ const persistConversation = async () => {
340
+ const messagesForSave = conv.messages.map((msg) => {
341
+ const filteredUpdates =
342
+ msg.updates
343
+ ?.filter(
344
+ (u) =>
345
+ !(u.type === MessageUpdateType.Status && u.status === MessageUpdateStatus.KeepAlive)
346
+ )
347
+ .map((u) => {
348
+ if (u.type !== MessageUpdateType.Stream) return u;
349
+ // Preserve existing len if already compressed, otherwise compute from token
350
+ const len = u.len ?? (u.token ?? "").length;
351
+ // store a lightweight marker to preserve ordering without duplicating content
352
+ return { type: MessageUpdateType.Stream, token: "", len } satisfies MessageStreamUpdate;
353
+ }) ?? [];
354
+
355
+ return { ...msg, updates: filteredUpdates };
356
+ });
357
+
358
+ await collections.conversations.updateOne(
359
+ { _id: convId },
360
+ { $set: { messages: messagesForSave, title: conv.title, updatedAt: new Date() } }
361
+ );
362
+ };
363
+
364
+ const abortRegistry = AbortRegistry.getInstance();
365
+
366
+ // we now build the stream
367
+ const stream = new ReadableStream({
368
+ async start(controller) {
369
+ const conversationKey = convId.toString();
370
+ const ctrl = new AbortController();
371
+ abortRegistry.register(conversationKey, ctrl);
372
+
373
+ let finalAnswerReceived = false;
374
+ let abortedByUser = false;
375
+ let finishedStatusSent = false;
376
+
377
+ messageToWriteTo.updates ??= [];
378
+ async function update(event: MessageUpdate) {
379
+ if (!messageToWriteTo || !conv) {
380
+ throw Error("No message or conversation to write events to");
381
+ }
382
+
383
+ if (
384
+ event.type === MessageUpdateType.Status &&
385
+ event.status === MessageUpdateStatus.Finished
386
+ ) {
387
+ finishedStatusSent = true;
388
+ }
389
+
390
+ // Add token to content or skip if empty
391
+ if (event.type === MessageUpdateType.Stream) {
392
+ if (event.token === "") return;
393
+ messageToWriteTo.content += event.token;
394
+
395
+ if (metricsEnabled && metrics) {
396
+ const now = Date.now();
397
+ metrics.model.tokenCountTotal.inc(metricsLabels);
398
+
399
+ if (!firstTokenObserved) {
400
+ metrics.model.timeToFirstToken.observe(metricsLabels, now - promptedAt.getTime());
401
+ firstTokenObserved = true;
402
+ }
403
+
404
+ const previousTimestamp = lastTokenTimestamp
405
+ ? lastTokenTimestamp.getTime()
406
+ : promptedAt.getTime();
407
+ metrics.model.timePerOutputToken.observe(metricsLabels, now - previousTimestamp);
408
+ }
409
+
410
+ lastTokenTimestamp = new Date();
411
+ }
412
+
413
+ // Append reasoning stream tokens to message.reasoning (server-side)
414
+ else if (
415
+ event.type === MessageUpdateType.Reasoning &&
416
+ event.subtype === MessageReasoningUpdateType.Stream &&
417
+ "token" in event
418
+ ) {
419
+ messageToWriteTo.reasoning ??= "";
420
+ messageToWriteTo.reasoning += event.token;
421
+ }
422
+
423
+ // Set the title
424
+ else if (event.type === MessageUpdateType.Title) {
425
+ // Always strip <think> markers from titles when saving
426
+ const sanitizedTitle = event.title.replace(/<\/?think>/gi, "").trim();
427
+ conv.title = sanitizedTitle;
428
+ await collections.conversations.updateOne(
429
+ { _id: convId },
430
+ { $set: { title: conv?.title, updatedAt: new Date() } }
431
+ );
432
+ }
433
+
434
+ // Set the final text and the interrupted flag
435
+ else if (event.type === MessageUpdateType.FinalAnswer) {
436
+ messageToWriteTo.interrupted = event.interrupted;
437
+ // Default behavior: replace the streamed text with the provider's final text.
438
+ // However, when tools (MCP/function calls) were used, providers often stream
439
+ // some content (e.g., a story) before triggering tools, then return a
440
+ // different follow‑up message afterwards (e.g., an image caption). Our
441
+ // previous logic overwrote the pre‑tool content. Preserve it by merging in
442
+ // the pre‑tool stream when tool updates occurred and the final text does
443
+ // not already include the streamed prefix.
444
+ const hadTools = (messageToWriteTo.updates ?? []).some(
445
+ (u) => u.type === MessageUpdateType.Tool
446
+ );
447
+
448
+ if (hadTools) {
449
+ const existing = messageToWriteTo.content.slice(initialMessageContent.length);
450
+ if (existing && existing.length > 0) {
451
+ // A. If we already streamed the same final text, keep as-is.
452
+ if (event.text && existing.endsWith(event.text)) {
453
+ messageToWriteTo.content = initialMessageContent + existing;
454
+ }
455
+ // B. If the final text already includes the streamed prefix, use it verbatim.
456
+ else if (event.text && event.text.startsWith(existing)) {
457
+ messageToWriteTo.content = initialMessageContent + event.text;
458
+ }
459
+ // C. Otherwise, merge with a paragraph break for readability.
460
+ else {
461
+ const needsGap = !/\n\n$/.test(existing) && !/^\n/.test(event.text ?? "");
462
+ messageToWriteTo.content =
463
+ initialMessageContent + existing + (needsGap ? "\n\n" : "") + (event.text ?? "");
464
+ }
465
+ } else {
466
+ messageToWriteTo.content = initialMessageContent + (event.text ?? "");
467
+ }
468
+ } else {
469
+ messageToWriteTo.content = initialMessageContent + event.text;
470
+ }
471
+ finalAnswerReceived = true;
472
+
473
+ if (metricsEnabled && metrics) {
474
+ metrics.model.latency.observe(metricsLabels, Date.now() - promptedAt.getTime());
475
+ }
476
+ }
477
+
478
+ // Add file
479
+ else if (event.type === MessageUpdateType.File) {
480
+ messageToWriteTo.files = [
481
+ ...(messageToWriteTo.files ?? []),
482
+ { type: "hash", name: event.name, value: event.sha, mime: event.mime },
483
+ ];
484
+ }
485
+
486
+ // Store router metadata (for router models) or provider info (for all models)
487
+ else if (event.type === MessageUpdateType.RouterMetadata) {
488
+ // Merge metadata updates to preserve existing fields (router may send route/model first, then provider comes later)
489
+ if (model?.isRouter) {
490
+ messageToWriteTo.routerMetadata = {
491
+ route: event.route || messageToWriteTo.routerMetadata?.route || "",
492
+ model: event.model || messageToWriteTo.routerMetadata?.model || "",
493
+ provider: event.provider || messageToWriteTo.routerMetadata?.provider,
494
+ };
495
+ }
496
+ // Store provider-only metadata for non-router models if available
497
+ else if (event.provider) {
498
+ messageToWriteTo.routerMetadata = {
499
+ route: messageToWriteTo.routerMetadata?.route || "",
500
+ model: messageToWriteTo.routerMetadata?.model || "",
501
+ provider: event.provider,
502
+ };
503
+ }
504
+ }
505
+
506
+ // Append updates for audit/replay (streams too, to preserve ordering)
507
+ if (
508
+ !(
509
+ event.type === MessageUpdateType.Status &&
510
+ event.status === MessageUpdateStatus.KeepAlive
511
+ )
512
+ ) {
513
+ messageToWriteTo?.updates?.push(
514
+ event.type === MessageUpdateType.Stream ? { ...event } : event
515
+ );
516
+ }
517
+
518
+ // Avoid remote keylogging attack executed by watching packet lengths
519
+ // by padding the text with null chars to a fixed length
520
+ // https://cdn.arstechnica.net/wp-content/uploads/2024/03/LLM-Side-Channel.pdf
521
+ if (event.type === MessageUpdateType.Stream) {
522
+ event = { ...event, token: event.token.padEnd(16, "\0") };
523
+ }
524
+
525
+ messageToWriteTo.updatedAt = new Date();
526
+
527
+ const enqueueUpdate = async () => {
528
+ if (clientDetached) return;
529
+ try {
530
+ controller.enqueue(JSON.stringify(event) + "\n");
531
+ if (event.type === MessageUpdateType.FinalAnswer) {
532
+ controller.enqueue(" ".repeat(4096));
533
+ }
534
+ } catch (err) {
535
+ clientDetached = true;
536
+ logger.info(
537
+ { conversationId: convId.toString() },
538
+ "Client detached during message streaming"
539
+ );
540
+ }
541
+ };
542
+
543
+ await enqueueUpdate();
544
+
545
+ if (clientDetached) {
546
+ await persistConversation();
547
+ }
548
+ }
549
+
550
+ let hasError = false;
551
+ const initialMessageContent = messageToWriteTo.content;
552
+
553
+ try {
554
+ // Fetch user settings once for all overrides and billing org
555
+ const userSettings = await collections.settings.findOne(authCondition(locals));
556
+
557
+ // Add billing organization to locals for the endpoint to use
558
+ locals.billingOrganization = userSettings?.billingOrganization;
559
+
560
+ const ctx: TextGenerationContext = {
561
+ model,
562
+ endpoint: await model.getEndpoint(),
563
+ conv,
564
+ messages: messagesForPrompt,
565
+ assistant: undefined,
566
+ promptedAt,
567
+ ip: getClientAddress(),
568
+ username: locals.user?.username,
569
+ // Force-enable multimodal if user settings say so for this model
570
+ forceMultimodal: Boolean(userSettings?.multimodalOverrides?.[model.id]),
571
+ // Force-enable tools if user settings say so for this model
572
+ forceTools: Boolean(userSettings?.toolsOverrides?.[model.id]),
573
+ // Inference provider preference (HuggingChat only, skip for router models)
574
+ provider:
575
+ config.isHuggingChat && !model.isRouter
576
+ ? userSettings?.providerOverrides?.[model.id]
577
+ : undefined,
578
+ locals,
579
+ abortController: ctrl,
580
+ autopilot: autopilot === true,
581
+ autopilotMaxSteps,
582
+ };
583
+ // run the text generation and send updates to the client
584
+ for await (const event of textGeneration(ctx)) await update(event);
585
+ if (ctrl.signal.aborted) {
586
+ abortedByUser = true;
587
+ }
588
+ if (abortedByUser && !finalAnswerReceived) {
589
+ const partialText = messageToWriteTo.content.slice(initialMessageContent.length);
590
+ await update({
591
+ type: MessageUpdateType.FinalAnswer,
592
+ text: partialText,
593
+ interrupted: true,
594
+ });
595
+ }
596
+ } catch (e) {
597
+ const err = e as Error;
598
+ const isAbortError =
599
+ err?.name === "AbortError" ||
600
+ err?.name === "APIUserAbortError" ||
601
+ err?.message === "Request was aborted.";
602
+ if (isAbortError || ctrl.signal.aborted) {
603
+ abortedByUser = true;
604
+ logger.info({ conversationId: conversationKey }, "Generation aborted by user");
605
+ if (!finalAnswerReceived) {
606
+ const partialText = messageToWriteTo.content.slice(initialMessageContent.length);
607
+ await update({
608
+ type: MessageUpdateType.FinalAnswer,
609
+ text: partialText,
610
+ interrupted: true,
611
+ });
612
+ }
613
+ } else {
614
+ hasError = true;
615
+ // Extract status code if available from HTTPError or APIError
616
+ const errObj = err as unknown as Record<string, unknown>;
617
+ const statusCode =
618
+ (typeof errObj.statusCode === "number" ? errObj.statusCode : undefined) ||
619
+ (typeof errObj.status === "number" ? errObj.status : undefined);
620
+ await update({
621
+ type: MessageUpdateType.Status,
622
+ status: MessageUpdateStatus.Error,
623
+ message: err.message,
624
+ ...(statusCode && { statusCode }),
625
+ });
626
+ logger.error(err, "Error in conversation stream");
627
+ }
628
+ } finally {
629
+ // check if no output was generated
630
+ if (!hasError && !abortedByUser && messageToWriteTo.content === initialMessageContent) {
631
+ hasError = true;
632
+ logger.warn(
633
+ {
634
+ conversationId: conversationKey,
635
+ updatesCount: messageToWriteTo.updates?.length ?? 0,
636
+ filesCount: messageToWriteTo.files?.length ?? 0,
637
+ reasoningLen: messageToWriteTo.reasoning?.length ?? 0,
638
+ initialLen: initialMessageContent.length,
639
+ finalLen: messageToWriteTo.content.length,
640
+ },
641
+ "No output generated after streaming; emitting error status"
642
+ );
643
+ await update({
644
+ type: MessageUpdateType.Status,
645
+ status: MessageUpdateStatus.Error,
646
+ message: "No output was generated. Something went wrong.",
647
+ });
648
+ }
649
+ }
650
+
651
+ if (!hasError && !finishedStatusSent) {
652
+ await update({
653
+ type: MessageUpdateType.Status,
654
+ status: MessageUpdateStatus.Finished,
655
+ });
656
+ }
657
+
658
+ await persistConversation();
659
+ abortRegistry.unregister(conversationKey, ctrl);
660
+
661
+ // used to detect if cancel() is called bc of interrupt or just because the connection closes
662
+ doneStreaming = true;
663
+ if (!clientDetached) {
664
+ controller.close();
665
+ }
666
+ },
667
+ async cancel() {
668
+ if (doneStreaming) return;
669
+ clientDetached = true;
670
+ await persistConversation();
671
+ },
672
+ });
673
+
674
+ if (metricsEnabled && metrics) {
675
+ metrics.model.messagesTotal.inc(metricsLabels);
676
+ }
677
+
678
+ // Todo: maybe we should wait for the message to be saved before ending the response - in case of errors
679
+ return new Response(stream, {
680
+ headers: {
681
+ "Content-Type": "application/jsonl",
682
+ },
683
+ });
684
+ }
685
+
686
/**
 * Delete a single conversation.
 *
 * The conversation is looked up by the `id` route parameter combined with
 * whatever filter `authCondition(locals)` produces, so only a document
 * matching both is removed.
 *
 * @param event - Request event; only `locals` and `params.id` are read.
 * @returns An empty `Response` once the matching document has been deleted.
 * @throws Whatever `error(404, ...)` raises when the id is malformed or no
 *   matching conversation is found.
 */
export async function DELETE({ locals, params }) {
  // A malformed id can never match a stored document. Reject it up front
  // instead of letting the ObjectId constructor throw, which would surface
  // to the client as an unhandled 500.
  if (!ObjectId.isValid(params.id)) {
    error(404, "Conversation not found");
  }

  const convId = new ObjectId(params.id);

  const conv = await collections.conversations.findOne({
    _id: convId,
    ...authCondition(locals),
  });

  if (!conv) {
    error(404, "Conversation not found");
  }

  await collections.conversations.deleteOne({ _id: conv._id });

  return new Response();
}
702
+
703
/**
 * Update the title and/or model of a single conversation.
 *
 * The JSON request body is validated with a zod schema: `title` is an
 * optional string, trimmed, 1-100 characters; `model` is optional and must
 * satisfy `validModelIdSchema`. `<think>` / `</think>` markers are stripped
 * from the title (case-insensitively) before it is stored.
 *
 * @param event - Request event; `request`, `locals` and `params.id` are read.
 * @returns An empty `Response` on success, including when the body contains
 *   nothing to update.
 * @throws Whatever the schema's `parse` raises for an invalid body, and
 *   whatever `error(...)` raises: 404 when the id is malformed or no matching
 *   conversation is found, 400 when the title is empty after sanitizing.
 */
export async function PATCH({ request, locals, params }) {
  const values = z
    .object({
      title: z.string().trim().min(1).max(100).optional(),
      model: validModelIdSchema.optional(),
    })
    .parse(await request.json());

  // A malformed id can never match a stored document. Reject it up front
  // instead of letting the ObjectId constructor throw (an unhandled 500).
  if (!ObjectId.isValid(params.id)) {
    error(404, "Conversation not found");
  }

  const convId = new ObjectId(params.id);

  const conv = await collections.conversations.findOne({
    _id: convId,
    ...authCondition(locals),
  });

  if (!conv) {
    error(404, "Conversation not found");
  }

  // The schema's min(1) runs before the <think> markers are stripped, so a
  // title made only of markers would otherwise be stored as an empty string.
  const sanitizedTitle = values.title?.replace(/<\/?think>/gi, "").trim();
  if (sanitizedTitle === "") {
    error(400, "Title cannot be empty");
  }

  // Only include defined values in the update
  const updateValues = {
    ...(sanitizedTitle !== undefined && { title: sanitizedTitle }),
    ...(values.model !== undefined && { model: values.model }),
  };

  // Nothing to change: skip the write. An empty `$set` is rejected by
  // MongoDB servers older than 5.0 and is a no-op on newer ones.
  if (Object.keys(updateValues).length === 0) {
    return new Response();
  }

  await collections.conversations.updateOne(
    {
      _id: convId,
    },
    {
      $set: updateValues,
    }
  );

  return new Response();
}