ruflo 3.10.45 → 3.11.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (498)
  1. package/README.md +412 -412
  2. package/bin/ruflo.js +77 -77
  3. package/package.json +113 -113
  4. package/src/chat-ui/Dockerfile +25 -25
  5. package/src/chat-ui/patch-mcp-url-safety.sh +28 -28
  6. package/src/config/config.example.json +76 -76
  7. package/src/mcp-bridge/Dockerfile +45 -45
  8. package/src/mcp-bridge/index.js +1692 -1692
  9. package/src/mcp-bridge/mcp-stdio-kernel.js +159 -159
  10. package/src/mcp-bridge/package.json +17 -17
  11. package/src/mcp-bridge/test-harness.js +470 -470
  12. package/src/nginx/Dockerfile +10 -10
  13. package/src/nginx/nginx.conf +67 -67
  14. package/src/nginx/static/favicon-dark.svg +4 -4
  15. package/src/nginx/static/favicon.svg +4 -4
  16. package/src/nginx/static/icon.svg +5 -5
  17. package/src/nginx/static/logo.svg +9 -9
  18. package/src/nginx/static/manifest.json +22 -22
  19. package/src/nginx/static/welcome.js +184 -184
  20. package/src/ruvocal/.claude/skills/add-model-descriptions/SKILL.md +73 -73
  21. package/src/ruvocal/.claude-flow/daemon-state.json +135 -0
  22. package/src/ruvocal/.claude-flow/data/pending-insights.jsonl +0 -0
  23. package/src/ruvocal/.claude-flow/data/ranked-context.json +5 -0
  24. package/src/ruvocal/.claude-flow/logs/daemon.log +31 -0
  25. package/src/ruvocal/.claude-flow/logs/headless/audit_1777949411822_juxau0_prompt.log +989 -0
  26. package/src/ruvocal/.claude-flow/logs/headless/audit_1777949411822_juxau0_result.log +67 -0
  27. package/src/ruvocal/.claude-flow/logs/headless/audit_1777950042278_jvj5xq_prompt.log +989 -0
  28. package/src/ruvocal/.claude-flow/logs/headless/audit_1777950042278_jvj5xq_result.log +93 -0
  29. package/src/ruvocal/.claude-flow/logs/headless/optimize_1777949531823_yt5yc2_prompt.log +1498 -0
  30. package/src/ruvocal/.claude-flow/logs/headless/optimize_1777949531823_yt5yc2_result.log +93 -0
  31. package/src/ruvocal/.claude-flow/logs/headless/testgaps_1777949771821_elw1j4_prompt.log +1498 -0
  32. package/src/ruvocal/.claude-flow/logs/headless/testgaps_1777949771821_elw1j4_result.log +100 -0
  33. package/src/ruvocal/.claude-flow/metrics/codebase-map.json +11 -0
  34. package/src/ruvocal/.claude-flow/metrics/consolidation.json +6 -0
  35. package/src/ruvocal/.claude-flow/neural/stats.json +6 -0
  36. package/src/ruvocal/.claude-flow/sessions/current.json +13 -0
  37. package/src/ruvocal/.devcontainer/Dockerfile +9 -9
  38. package/src/ruvocal/.devcontainer/devcontainer.json +36 -36
  39. package/src/ruvocal/.dockerignore +16 -16
  40. package/src/ruvocal/.eslintignore +13 -13
  41. package/src/ruvocal/.eslintrc.cjs +45 -45
  42. package/src/ruvocal/.gcloudignore +18 -18
  43. package/src/ruvocal/.github/ISSUE_TEMPLATE/bug-report--chat-ui-.md +43 -43
  44. package/src/ruvocal/.github/ISSUE_TEMPLATE/config-support.md +9 -9
  45. package/src/ruvocal/.github/ISSUE_TEMPLATE/feature-request--chat-ui-.md +17 -17
  46. package/src/ruvocal/.github/ISSUE_TEMPLATE/huggingchat.md +11 -11
  47. package/src/ruvocal/.github/release.yml +16 -16
  48. package/src/ruvocal/.github/workflows/build-docs.yml +18 -18
  49. package/src/ruvocal/.github/workflows/build-image.yml +142 -142
  50. package/src/ruvocal/.github/workflows/build-pr-docs.yml +20 -20
  51. package/src/ruvocal/.github/workflows/deploy-dev.yml +63 -63
  52. package/src/ruvocal/.github/workflows/deploy-prod.yml +78 -78
  53. package/src/ruvocal/.github/workflows/lint-and-test.yml +84 -84
  54. package/src/ruvocal/.github/workflows/slugify.yaml +72 -72
  55. package/src/ruvocal/.github/workflows/trufflehog.yml +17 -17
  56. package/src/ruvocal/.github/workflows/upload-pr-documentation.yml +16 -16
  57. package/src/ruvocal/.husky/lint-stage-config.js +4 -4
  58. package/src/ruvocal/.husky/pre-commit +2 -2
  59. package/src/ruvocal/.prettierignore +14 -14
  60. package/src/ruvocal/.prettierrc +7 -7
  61. package/src/ruvocal/.swarm/attestation.db +0 -0
  62. package/src/ruvocal/.swarm/hnsw.index +0 -0
  63. package/src/ruvocal/.swarm/hnsw.metadata.json +1 -0
  64. package/src/ruvocal/.swarm/memory.db +0 -0
  65. package/src/ruvocal/.swarm/schema.sql +305 -0
  66. package/src/ruvocal/CLAUDE.md +126 -126
  67. package/src/ruvocal/Dockerfile +96 -96
  68. package/src/ruvocal/LICENSE +202 -202
  69. package/src/ruvocal/PRIVACY.md +41 -41
  70. package/src/ruvocal/README.md +164 -164
  71. package/src/ruvocal/chart/Chart.yaml +5 -5
  72. package/src/ruvocal/chart/env/dev.yaml +260 -260
  73. package/src/ruvocal/chart/env/prod.yaml +273 -273
  74. package/src/ruvocal/chart/templates/_helpers.tpl +22 -22
  75. package/src/ruvocal/chart/templates/config.yaml +10 -10
  76. package/src/ruvocal/chart/templates/deployment.yaml +81 -81
  77. package/src/ruvocal/chart/templates/hpa.yaml +45 -45
  78. package/src/ruvocal/chart/templates/infisical.yaml +24 -24
  79. package/src/ruvocal/chart/templates/ingress-internal.yaml +32 -32
  80. package/src/ruvocal/chart/templates/ingress.yaml +32 -32
  81. package/src/ruvocal/chart/templates/network-policy.yaml +36 -36
  82. package/src/ruvocal/chart/templates/service-account.yaml +13 -13
  83. package/src/ruvocal/chart/templates/service-monitor.yaml +17 -17
  84. package/src/ruvocal/chart/templates/service.yaml +21 -21
  85. package/src/ruvocal/chart/values.yaml +73 -73
  86. package/src/ruvocal/cloudbuild.yaml +68 -68
  87. package/src/ruvocal/config/branding.env.example +19 -19
  88. package/src/ruvocal/docker-compose.yml +21 -21
  89. package/src/ruvocal/docs/adr/ADR-029-HUGGINGFACE-CHAT-UI-CLOUD-RUN.md +1236 -1236
  90. package/src/ruvocal/docs/adr/ADR-033-RUVECTOR-RUFLO-MCP-INTEGRATION.md +111 -111
  91. package/src/ruvocal/docs/adr/ADR-034-OPTIONAL-MCP-BACKENDS.md +117 -117
  92. package/src/ruvocal/docs/adr/ADR-035-MCP-TOOL-GROUPS.md +186 -186
  93. package/src/ruvocal/docs/adr/ADR-037-AUTOPILOT-CHAT-MODE.md +1500 -1500
  94. package/src/ruvocal/docs/adr/ADR-038-RUVOCAL-FORK.md +286 -286
  95. package/src/ruvocal/docs/source/_toctree.yml +30 -30
  96. package/src/ruvocal/docs/source/configuration/common-issues.md +38 -38
  97. package/src/ruvocal/docs/source/configuration/llm-router.md +105 -105
  98. package/src/ruvocal/docs/source/configuration/mcp-tools.md +84 -84
  99. package/src/ruvocal/docs/source/configuration/metrics.md +9 -9
  100. package/src/ruvocal/docs/source/configuration/open-id.md +57 -57
  101. package/src/ruvocal/docs/source/configuration/overview.md +89 -89
  102. package/src/ruvocal/docs/source/configuration/theming.md +20 -20
  103. package/src/ruvocal/docs/source/developing/architecture.md +48 -48
  104. package/src/ruvocal/docs/source/index.md +53 -53
  105. package/src/ruvocal/docs/source/installation/docker.md +43 -43
  106. package/src/ruvocal/docs/source/installation/helm.md +43 -43
  107. package/src/ruvocal/docs/source/installation/local.md +62 -62
  108. package/src/ruvocal/entrypoint.sh +18 -18
  109. package/src/ruvocal/mcp-bridge/Dockerfile +45 -45
  110. package/src/ruvocal/mcp-bridge/cloudbuild.yaml +49 -49
  111. package/src/ruvocal/mcp-bridge/index.js +1902 -1902
  112. package/src/ruvocal/mcp-bridge/mcp-stdio-kernel.js +159 -159
  113. package/src/ruvocal/mcp-bridge/package-lock.json +762 -762
  114. package/src/ruvocal/mcp-bridge/package.json +17 -17
  115. package/src/ruvocal/mcp-bridge/test-harness.js +470 -470
  116. package/src/ruvocal/package-lock.json +11741 -11741
  117. package/src/ruvocal/package.json +121 -121
  118. package/src/ruvocal/postcss.config.js +6 -6
  119. package/src/ruvocal/rvf.manifest.json +204 -204
  120. package/src/ruvocal/scripts/config.ts +64 -64
  121. package/src/ruvocal/scripts/generate-welcome.mjs +181 -181
  122. package/src/ruvocal/scripts/populate.ts +288 -288
  123. package/src/ruvocal/scripts/samples.txt +194 -194
  124. package/src/ruvocal/scripts/setups/vitest-setup-server.ts +44 -44
  125. package/src/ruvocal/scripts/updateLocalEnv.ts +48 -48
  126. package/src/ruvocal/src/ambient.d.ts +7 -7
  127. package/src/ruvocal/src/app.d.ts +29 -29
  128. package/src/ruvocal/src/app.html +53 -53
  129. package/src/ruvocal/src/hooks.server.ts +32 -32
  130. package/src/ruvocal/src/hooks.ts +6 -6
  131. package/src/ruvocal/src/lib/APIClient.ts +148 -148
  132. package/src/ruvocal/src/lib/actions/clickOutside.ts +18 -18
  133. package/src/ruvocal/src/lib/actions/snapScrollToBottom.ts +346 -346
  134. package/src/ruvocal/src/lib/buildPrompt.ts +33 -33
  135. package/src/ruvocal/src/lib/components/AnnouncementBanner.svelte +20 -20
  136. package/src/ruvocal/src/lib/components/BackgroundGenerationPoller.svelte +168 -168
  137. package/src/ruvocal/src/lib/components/CodeBlock.svelte +73 -73
  138. package/src/ruvocal/src/lib/components/CopyToClipBoardBtn.svelte +92 -92
  139. package/src/ruvocal/src/lib/components/DeleteConversationModal.svelte +75 -75
  140. package/src/ruvocal/src/lib/components/EditConversationModal.svelte +100 -100
  141. package/src/ruvocal/src/lib/components/ExpandNavigation.svelte +22 -22
  142. package/src/ruvocal/src/lib/components/FoundationBackground.svelte +242 -242
  143. package/src/ruvocal/src/lib/components/HoverTooltip.svelte +44 -44
  144. package/src/ruvocal/src/lib/components/HtmlPreviewModal.svelte +143 -143
  145. package/src/ruvocal/src/lib/components/InfiniteScroll.svelte +50 -50
  146. package/src/ruvocal/src/lib/components/MobileNav.svelte +300 -300
  147. package/src/ruvocal/src/lib/components/Modal.svelte +115 -115
  148. package/src/ruvocal/src/lib/components/ModelCardMetadata.svelte +71 -71
  149. package/src/ruvocal/src/lib/components/NavConversationItem.svelte +151 -151
  150. package/src/ruvocal/src/lib/components/NavMenu.svelte +313 -313
  151. package/src/ruvocal/src/lib/components/Pagination.svelte +97 -97
  152. package/src/ruvocal/src/lib/components/PaginationArrow.svelte +27 -27
  153. package/src/ruvocal/src/lib/components/Portal.svelte +24 -24
  154. package/src/ruvocal/src/lib/components/RetryBtn.svelte +18 -18
  155. package/src/ruvocal/src/lib/components/RuFloUniverse.svelte +185 -185
  156. package/src/ruvocal/src/lib/components/RufloHelpModal.svelte +411 -411
  157. package/src/ruvocal/src/lib/components/ScrollToBottomBtn.svelte +47 -47
  158. package/src/ruvocal/src/lib/components/ScrollToPreviousBtn.svelte +77 -77
  159. package/src/ruvocal/src/lib/components/ShareConversationModal.svelte +182 -182
  160. package/src/ruvocal/src/lib/components/StopGeneratingBtn.svelte +69 -69
  161. package/src/ruvocal/src/lib/components/SubscribeModal.svelte +87 -87
  162. package/src/ruvocal/src/lib/components/Switch.svelte +36 -36
  163. package/src/ruvocal/src/lib/components/SystemPromptModal.svelte +44 -44
  164. package/src/ruvocal/src/lib/components/Toast.svelte +27 -27
  165. package/src/ruvocal/src/lib/components/Tooltip.svelte +30 -30
  166. package/src/ruvocal/src/lib/components/WelcomeModal.svelte +46 -46
  167. package/src/ruvocal/src/lib/components/chat/Alternatives.svelte +77 -77
  168. package/src/ruvocal/src/lib/components/chat/BlockWrapper.svelte +72 -72
  169. package/src/ruvocal/src/lib/components/chat/ChatInput.svelte +490 -490
  170. package/src/ruvocal/src/lib/components/chat/ChatIntroduction.svelte +123 -123
  171. package/src/ruvocal/src/lib/components/chat/ChatMessage.svelte +548 -548
  172. package/src/ruvocal/src/lib/components/chat/ChatWindow.svelte +1057 -1057
  173. package/src/ruvocal/src/lib/components/chat/FileDropzone.svelte +92 -92
  174. package/src/ruvocal/src/lib/components/chat/ImageLightbox.svelte +66 -66
  175. package/src/ruvocal/src/lib/components/chat/MarkdownBlock.svelte +23 -23
  176. package/src/ruvocal/src/lib/components/chat/MarkdownRenderer.svelte +69 -69
  177. package/src/ruvocal/src/lib/components/chat/MarkdownRenderer.svelte.test.ts +58 -58
  178. package/src/ruvocal/src/lib/components/chat/MessageAvatar.svelte +103 -103
  179. package/src/ruvocal/src/lib/components/chat/ModelSwitch.svelte +64 -64
  180. package/src/ruvocal/src/lib/components/chat/OpenReasoningResults.svelte +81 -81
  181. package/src/ruvocal/src/lib/components/chat/TaskGroup.svelte +88 -88
  182. package/src/ruvocal/src/lib/components/chat/ToolUpdate.svelte +273 -273
  183. package/src/ruvocal/src/lib/components/chat/UploadedFile.svelte +253 -253
  184. package/src/ruvocal/src/lib/components/chat/UrlFetchModal.svelte +203 -203
  185. package/src/ruvocal/src/lib/components/chat/VoiceRecorder.svelte +214 -214
  186. package/src/ruvocal/src/lib/components/icons/IconBurger.svelte +20 -20
  187. package/src/ruvocal/src/lib/components/icons/IconCheap.svelte +20 -20
  188. package/src/ruvocal/src/lib/components/icons/IconChevron.svelte +24 -24
  189. package/src/ruvocal/src/lib/components/icons/IconDazzled.svelte +40 -40
  190. package/src/ruvocal/src/lib/components/icons/IconFast.svelte +20 -20
  191. package/src/ruvocal/src/lib/components/icons/IconLoading.svelte +22 -22
  192. package/src/ruvocal/src/lib/components/icons/IconMCP.svelte +28 -28
  193. package/src/ruvocal/src/lib/components/icons/IconMoon.svelte +21 -21
  194. package/src/ruvocal/src/lib/components/icons/IconNew.svelte +20 -20
  195. package/src/ruvocal/src/lib/components/icons/IconOmni.svelte +90 -90
  196. package/src/ruvocal/src/lib/components/icons/IconPaperclip.svelte +24 -24
  197. package/src/ruvocal/src/lib/components/icons/IconPro.svelte +37 -37
  198. package/src/ruvocal/src/lib/components/icons/IconShare.svelte +21 -21
  199. package/src/ruvocal/src/lib/components/icons/IconSun.svelte +93 -93
  200. package/src/ruvocal/src/lib/components/icons/Logo.svelte +68 -68
  201. package/src/ruvocal/src/lib/components/icons/LogoHuggingFaceBorderless.svelte +54 -54
  202. package/src/ruvocal/src/lib/components/mcp/AddServerForm.svelte +250 -250
  203. package/src/ruvocal/src/lib/components/mcp/MCPServerManager.svelte +185 -185
  204. package/src/ruvocal/src/lib/components/mcp/ServerCard.svelte +203 -203
  205. package/src/ruvocal/src/lib/components/players/AudioPlayer.svelte +82 -82
  206. package/src/ruvocal/src/lib/components/voice/AudioWaveform.svelte +96 -96
  207. package/src/ruvocal/src/lib/components/wasm/GalleryPanel.svelte +357 -357
  208. package/src/ruvocal/src/lib/constants/mcpExamples.ts +114 -114
  209. package/src/ruvocal/src/lib/constants/mime.ts +11 -11
  210. package/src/ruvocal/src/lib/constants/pagination.ts +1 -1
  211. package/src/ruvocal/src/lib/constants/publicSepToken.ts +1 -1
  212. package/src/ruvocal/src/lib/constants/routerExamples.ts +133 -133
  213. package/src/ruvocal/src/lib/constants/rvagentPresets.ts +206 -206
  214. package/src/ruvocal/src/lib/createShareLink.ts +27 -27
  215. package/src/ruvocal/src/lib/jobs/refresh-conversation-stats.ts +297 -297
  216. package/src/ruvocal/src/lib/migrations/lock.ts +56 -56
  217. package/src/ruvocal/src/lib/migrations/migrations.spec.ts +74 -74
  218. package/src/ruvocal/src/lib/migrations/migrations.ts +109 -109
  219. package/src/ruvocal/src/lib/migrations/routines/01-update-search-assistants.ts +50 -50
  220. package/src/ruvocal/src/lib/migrations/routines/02-update-assistants-models.ts +48 -48
  221. package/src/ruvocal/src/lib/migrations/routines/04-update-message-updates.ts +151 -151
  222. package/src/ruvocal/src/lib/migrations/routines/05-update-message-files.ts +56 -56
  223. package/src/ruvocal/src/lib/migrations/routines/06-trim-message-updates.ts +56 -56
  224. package/src/ruvocal/src/lib/migrations/routines/08-update-featured-to-review.ts +32 -32
  225. package/src/ruvocal/src/lib/migrations/routines/09-delete-empty-conversations.spec.ts +214 -214
  226. package/src/ruvocal/src/lib/migrations/routines/09-delete-empty-conversations.ts +88 -88
  227. package/src/ruvocal/src/lib/migrations/routines/10-update-reports-assistantid.ts +29 -29
  228. package/src/ruvocal/src/lib/migrations/routines/index.ts +15 -15
  229. package/src/ruvocal/src/lib/server/__tests__/conversation-stop-generating.spec.ts +103 -103
  230. package/src/ruvocal/src/lib/server/abortRegistry.ts +57 -57
  231. package/src/ruvocal/src/lib/server/abortedGenerations.ts +43 -43
  232. package/src/ruvocal/src/lib/server/adminToken.ts +62 -62
  233. package/src/ruvocal/src/lib/server/api/__tests__/conversations-id.spec.ts +296 -296
  234. package/src/ruvocal/src/lib/server/api/__tests__/conversations-message.spec.ts +216 -216
  235. package/src/ruvocal/src/lib/server/api/__tests__/conversations.spec.ts +235 -235
  236. package/src/ruvocal/src/lib/server/api/__tests__/misc.spec.ts +72 -72
  237. package/src/ruvocal/src/lib/server/api/__tests__/testHelpers.ts +86 -86
  238. package/src/ruvocal/src/lib/server/api/__tests__/user-reports.spec.ts +78 -78
  239. package/src/ruvocal/src/lib/server/api/__tests__/user.spec.ts +239 -239
  240. package/src/ruvocal/src/lib/server/api/types.ts +37 -37
  241. package/src/ruvocal/src/lib/server/api/utils/requireAuth.ts +22 -22
  242. package/src/ruvocal/src/lib/server/api/utils/resolveConversation.ts +69 -69
  243. package/src/ruvocal/src/lib/server/api/utils/resolveModel.ts +27 -27
  244. package/src/ruvocal/src/lib/server/api/utils/superjsonResponse.ts +15 -15
  245. package/src/ruvocal/src/lib/server/apiToken.ts +11 -11
  246. package/src/ruvocal/src/lib/server/auth.ts +554 -554
  247. package/src/ruvocal/src/lib/server/config.ts +187 -187
  248. package/src/ruvocal/src/lib/server/conversation.ts +83 -83
  249. package/src/ruvocal/src/lib/server/database/__tests__/rvf.spec.ts +709 -709
  250. package/src/ruvocal/src/lib/server/database/postgres.ts +700 -700
  251. package/src/ruvocal/src/lib/server/database/rvf.ts +1078 -1078
  252. package/src/ruvocal/src/lib/server/database.ts +145 -145
  253. package/src/ruvocal/src/lib/server/endpoints/document.ts +68 -68
  254. package/src/ruvocal/src/lib/server/endpoints/endpoints.ts +43 -43
  255. package/src/ruvocal/src/lib/server/endpoints/images.ts +211 -211
  256. package/src/ruvocal/src/lib/server/endpoints/openai/endpointOai.ts +266 -266
  257. package/src/ruvocal/src/lib/server/endpoints/openai/openAIChatToTextGenerationStream.ts +212 -212
  258. package/src/ruvocal/src/lib/server/endpoints/openai/openAICompletionToTextGenerationStream.ts +32 -32
  259. package/src/ruvocal/src/lib/server/endpoints/preprocessMessages.ts +61 -61
  260. package/src/ruvocal/src/lib/server/exitHandler.ts +59 -59
  261. package/src/ruvocal/src/lib/server/files/downloadFile.ts +34 -34
  262. package/src/ruvocal/src/lib/server/files/uploadFile.ts +29 -29
  263. package/src/ruvocal/src/lib/server/findRepoRoot.ts +13 -13
  264. package/src/ruvocal/src/lib/server/generateFromDefaultEndpoint.ts +46 -46
  265. package/src/ruvocal/src/lib/server/hooks/error.ts +37 -37
  266. package/src/ruvocal/src/lib/server/hooks/fetch.ts +22 -22
  267. package/src/ruvocal/src/lib/server/hooks/handle.ts +250 -250
  268. package/src/ruvocal/src/lib/server/hooks/init.ts +51 -51
  269. package/src/ruvocal/src/lib/server/isURLLocal.spec.ts +31 -31
  270. package/src/ruvocal/src/lib/server/isURLLocal.ts +74 -74
  271. package/src/ruvocal/src/lib/server/logger.ts +42 -42
  272. package/src/ruvocal/src/lib/server/mcp/clientPool.spec.ts +175 -175
  273. package/src/ruvocal/src/lib/server/mcp/hf.ts +32 -32
  274. package/src/ruvocal/src/lib/server/mcp/httpClient.ts +122 -122
  275. package/src/ruvocal/src/lib/server/mcp/registry.ts +76 -76
  276. package/src/ruvocal/src/lib/server/mcp/tools.ts +196 -196
  277. package/src/ruvocal/src/lib/server/metrics.ts +255 -255
  278. package/src/ruvocal/src/lib/server/models.ts +518 -518
  279. package/src/ruvocal/src/lib/server/requestContext.ts +55 -55
  280. package/src/ruvocal/src/lib/server/router/arch.ts +230 -230
  281. package/src/ruvocal/src/lib/server/router/endpoint.ts +316 -316
  282. package/src/ruvocal/src/lib/server/router/multimodal.ts +28 -28
  283. package/src/ruvocal/src/lib/server/router/policy.ts +49 -49
  284. package/src/ruvocal/src/lib/server/router/toolsRoute.ts +51 -51
  285. package/src/ruvocal/src/lib/server/router/types.ts +21 -21
  286. package/src/ruvocal/src/lib/server/sendSlack.ts +23 -23
  287. package/src/ruvocal/src/lib/server/textGeneration/generate.ts +258 -258
  288. package/src/ruvocal/src/lib/server/textGeneration/index.ts +96 -96
  289. package/src/ruvocal/src/lib/server/textGeneration/mcp/fileRefs.ts +155 -155
  290. package/src/ruvocal/src/lib/server/textGeneration/mcp/routerResolution.ts +108 -108
  291. package/src/ruvocal/src/lib/server/textGeneration/mcp/runMcpFlow.ts +831 -831
  292. package/src/ruvocal/src/lib/server/textGeneration/mcp/toolInvocation.ts +349 -349
  293. package/src/ruvocal/src/lib/server/textGeneration/mcp/wasmTools.test.ts +633 -633
  294. package/src/ruvocal/src/lib/server/textGeneration/reasoning.ts +23 -23
  295. package/src/ruvocal/src/lib/server/textGeneration/title.ts +83 -83
  296. package/src/ruvocal/src/lib/server/textGeneration/types.ts +28 -28
  297. package/src/ruvocal/src/lib/server/textGeneration/utils/prepareFiles.ts +88 -88
  298. package/src/ruvocal/src/lib/server/textGeneration/utils/routing.ts +21 -21
  299. package/src/ruvocal/src/lib/server/textGeneration/utils/toolPrompt.ts +49 -49
  300. package/src/ruvocal/src/lib/server/urlSafety.ts +77 -77
  301. package/src/ruvocal/src/lib/server/usageLimits.ts +30 -30
  302. package/src/ruvocal/src/lib/stores/autopilotStore.svelte.ts +175 -175
  303. package/src/ruvocal/src/lib/stores/backgroundGenerations.svelte.ts +32 -32
  304. package/src/ruvocal/src/lib/stores/backgroundGenerations.ts +1 -1
  305. package/src/ruvocal/src/lib/stores/errors.ts +9 -9
  306. package/src/ruvocal/src/lib/stores/isAborted.ts +3 -3
  307. package/src/ruvocal/src/lib/stores/isPro.ts +4 -4
  308. package/src/ruvocal/src/lib/stores/loading.ts +3 -3
  309. package/src/ruvocal/src/lib/stores/mcpServers.ts +534 -534
  310. package/src/ruvocal/src/lib/stores/pendingChatInput.ts +3 -3
  311. package/src/ruvocal/src/lib/stores/pendingMessage.ts +9 -9
  312. package/src/ruvocal/src/lib/stores/settings.ts +182 -182
  313. package/src/ruvocal/src/lib/stores/shareModal.ts +13 -13
  314. package/src/ruvocal/src/lib/stores/titleUpdate.ts +8 -8
  315. package/src/ruvocal/src/lib/stores/wasmMcp.ts +472 -472
  316. package/src/ruvocal/src/lib/switchTheme.ts +124 -124
  317. package/src/ruvocal/src/lib/types/AbortedGeneration.ts +8 -8
  318. package/src/ruvocal/src/lib/types/Assistant.ts +31 -31
  319. package/src/ruvocal/src/lib/types/AssistantStats.ts +11 -11
  320. package/src/ruvocal/src/lib/types/ConfigKey.ts +4 -4
  321. package/src/ruvocal/src/lib/types/ConvSidebar.ts +9 -9
  322. package/src/ruvocal/src/lib/types/Conversation.ts +27 -27
  323. package/src/ruvocal/src/lib/types/ConversationStats.ts +13 -13
  324. package/src/ruvocal/src/lib/types/Message.ts +41 -41
  325. package/src/ruvocal/src/lib/types/MessageEvent.ts +10 -10
  326. package/src/ruvocal/src/lib/types/MessageUpdate.ts +139 -139
  327. package/src/ruvocal/src/lib/types/MigrationResult.ts +7 -7
  328. package/src/ruvocal/src/lib/types/Model.ts +23 -23
  329. package/src/ruvocal/src/lib/types/Report.ts +12 -12
  330. package/src/ruvocal/src/lib/types/Review.ts +6 -6
  331. package/src/ruvocal/src/lib/types/Semaphore.ts +19 -19
  332. package/src/ruvocal/src/lib/types/Session.ts +22 -22
  333. package/src/ruvocal/src/lib/types/Settings.ts +93 -93
  334. package/src/ruvocal/src/lib/types/SharedConversation.ts +9 -9
  335. package/src/ruvocal/src/lib/types/Template.ts +6 -6
  336. package/src/ruvocal/src/lib/types/Timestamps.ts +4 -4
  337. package/src/ruvocal/src/lib/types/TokenCache.ts +6 -6
  338. package/src/ruvocal/src/lib/types/Tool.ts +77 -77
  339. package/src/ruvocal/src/lib/types/UrlDependency.ts +5 -5
  340. package/src/ruvocal/src/lib/types/User.ts +14 -14
  341. package/src/ruvocal/src/lib/utils/PublicConfig.svelte.ts +75 -75
  342. package/src/ruvocal/src/lib/utils/auth.ts +17 -17
  343. package/src/ruvocal/src/lib/utils/chunk.ts +33 -33
  344. package/src/ruvocal/src/lib/utils/cookiesAreEnabled.ts +13 -13
  345. package/src/ruvocal/src/lib/utils/debounce.ts +17 -17
  346. package/src/ruvocal/src/lib/utils/deepestChild.ts +6 -6
  347. package/src/ruvocal/src/lib/utils/favicon.ts +21 -21
  348. package/src/ruvocal/src/lib/utils/fetchJSON.ts +23 -23
  349. package/src/ruvocal/src/lib/utils/file2base64.ts +14 -14
  350. package/src/ruvocal/src/lib/utils/formatUserCount.ts +37 -37
  351. package/src/ruvocal/src/lib/utils/generationState.spec.ts +75 -75
  352. package/src/ruvocal/src/lib/utils/generationState.ts +26 -26
  353. package/src/ruvocal/src/lib/utils/getHref.ts +41 -41
  354. package/src/ruvocal/src/lib/utils/getReturnFromGenerator.ts +7 -7
  355. package/src/ruvocal/src/lib/utils/haptics.ts +64 -64
  356. package/src/ruvocal/src/lib/utils/hashConv.ts +12 -12
  357. package/src/ruvocal/src/lib/utils/hf.ts +17 -17
  358. package/src/ruvocal/src/lib/utils/isDesktop.ts +7 -7
  359. package/src/ruvocal/src/lib/utils/isUrl.ts +8 -8
  360. package/src/ruvocal/src/lib/utils/isVirtualKeyboard.ts +16 -16
  361. package/src/ruvocal/src/lib/utils/loadAttachmentsFromUrls.ts +115 -115
  362. package/src/ruvocal/src/lib/utils/marked.spec.ts +96 -96
  363. package/src/ruvocal/src/lib/utils/marked.ts +531 -531
  364. package/src/ruvocal/src/lib/utils/mcpValidation.ts +147 -147
  365. package/src/ruvocal/src/lib/utils/mergeAsyncGenerators.ts +38 -38
  366. package/src/ruvocal/src/lib/utils/messageUpdates.spec.ts +262 -262
  367. package/src/ruvocal/src/lib/utils/messageUpdates.ts +324 -324
  368. package/src/ruvocal/src/lib/utils/mime.ts +56 -56
  369. package/src/ruvocal/src/lib/utils/models.ts +14 -14
  370. package/src/ruvocal/src/lib/utils/parseBlocks.ts +120 -120
  371. package/src/ruvocal/src/lib/utils/parseIncompleteMarkdown.ts +644 -644
  372. package/src/ruvocal/src/lib/utils/parseStringToList.ts +10 -10
  373. package/src/ruvocal/src/lib/utils/randomUuid.ts +14 -14
  374. package/src/ruvocal/src/lib/utils/searchTokens.ts +33 -33
  375. package/src/ruvocal/src/lib/utils/sha256.ts +7 -7
  376. package/src/ruvocal/src/lib/utils/stringifyError.ts +12 -12
  377. package/src/ruvocal/src/lib/utils/sum.ts +3 -3
  378. package/src/ruvocal/src/lib/utils/template.spec.ts +59 -59
  379. package/src/ruvocal/src/lib/utils/template.ts +53 -53
  380. package/src/ruvocal/src/lib/utils/timeout.ts +9 -9
  381. package/src/ruvocal/src/lib/utils/toolProgress.spec.ts +46 -46
  382. package/src/ruvocal/src/lib/utils/toolProgress.ts +11 -11
  383. package/src/ruvocal/src/lib/utils/tree/addChildren.spec.ts +102 -102
  384. package/src/ruvocal/src/lib/utils/tree/addChildren.ts +48 -48
  385. package/src/ruvocal/src/lib/utils/tree/addSibling.spec.ts +81 -81
  386. package/src/ruvocal/src/lib/utils/tree/addSibling.ts +41 -41
  387. package/src/ruvocal/src/lib/utils/tree/buildSubtree.spec.ts +110 -110
  388. package/src/ruvocal/src/lib/utils/tree/buildSubtree.ts +24 -24
  389. package/src/ruvocal/src/lib/utils/tree/convertLegacyConversation.spec.ts +31 -31
  390. package/src/ruvocal/src/lib/utils/tree/convertLegacyConversation.ts +36 -36
  391. package/src/ruvocal/src/lib/utils/tree/isMessageId.spec.ts +15 -15
  392. package/src/ruvocal/src/lib/utils/tree/isMessageId.ts +5 -5
  393. package/src/ruvocal/src/lib/utils/tree/tree.d.ts +14 -14
  394. package/src/ruvocal/src/lib/utils/tree/treeHelpers.spec.ts +167 -167
  395. package/src/ruvocal/src/lib/utils/updates.ts +39 -39
  396. package/src/ruvocal/src/lib/utils/urlParams.ts +13 -13
  397. package/src/ruvocal/src/lib/wasm/idb.ts +438 -438
  398. package/src/ruvocal/src/lib/wasm/index.ts +1213 -1213
  399. package/src/ruvocal/src/lib/wasm/tests/wasm-capabilities.test.ts +565 -565
  400. package/src/ruvocal/src/lib/wasm/wasm.worker.ts +332 -332
  401. package/src/ruvocal/src/lib/wasm/workerClient.ts +166 -166
  402. package/src/ruvocal/src/lib/workers/autopilotWorker.ts +221 -221
  403. package/src/ruvocal/src/lib/workers/detailFetchWorker.ts +100 -100
  404. package/src/ruvocal/src/lib/workers/markdownWorker.ts +61 -61
  405. package/src/ruvocal/src/routes/+error.svelte +20 -20
  406. package/src/ruvocal/src/routes/+layout.svelte +324 -324
  407. package/src/ruvocal/src/routes/+layout.ts +91 -91
  408. package/src/ruvocal/src/routes/+page.svelte +168 -168
  409. package/src/ruvocal/src/routes/.well-known/oauth-cimd/+server.ts +37 -37
  410. package/src/ruvocal/src/routes/__debug/openai/+server.ts +21 -21
  411. package/src/ruvocal/src/routes/admin/export/+server.ts +159 -159
  412. package/src/ruvocal/src/routes/admin/stats/compute/+server.ts +16 -16
  413. package/src/ruvocal/src/routes/api/conversation/[id]/+server.ts +40 -40
  414. package/src/ruvocal/src/routes/api/conversation/[id]/message/[messageId]/+server.ts +42 -42
  415. package/src/ruvocal/src/routes/api/conversations/+server.ts +48 -48
  416. package/src/ruvocal/src/routes/api/fetch-url/+server.ts +147 -147
  417. package/src/ruvocal/src/routes/api/mcp/health/+server.ts +292 -292
  418. package/src/ruvocal/src/routes/api/mcp/servers/+server.ts +32 -32
  419. package/src/ruvocal/src/routes/api/models/+server.ts +25 -25
  420. package/src/ruvocal/src/routes/api/transcribe/+server.ts +104 -104
  421. package/src/ruvocal/src/routes/api/user/+server.ts +15 -15
  422. package/src/ruvocal/src/routes/api/user/validate-token/+server.ts +20 -20
  423. package/src/ruvocal/src/routes/api/v2/conversations/+server.ts +48 -48
  424. package/src/ruvocal/src/routes/api/v2/conversations/[id]/+server.ts +94 -94
  425. package/src/ruvocal/src/routes/api/v2/conversations/[id]/message/[messageId]/+server.ts +43 -43
  426. package/src/ruvocal/src/routes/api/v2/conversations/import-share/+server.ts +23 -23
  427. package/src/ruvocal/src/routes/api/v2/debug/config/+server.ts +16 -16
  428. package/src/ruvocal/src/routes/api/v2/debug/refresh/+server.ts +30 -30
  429. package/src/ruvocal/src/routes/api/v2/export/+server.ts +196 -196
  430. package/src/ruvocal/src/routes/api/v2/feature-flags/+server.ts +14 -14
  431. package/src/ruvocal/src/routes/api/v2/models/+server.ts +38 -38
  432. package/src/ruvocal/src/routes/api/v2/models/[namespace]/+server.ts +8 -8
  433. package/src/ruvocal/src/routes/api/v2/models/[namespace]/[model]/+server.ts +8 -8
  434. package/src/ruvocal/src/routes/api/v2/models/[namespace]/[model]/subscribe/+server.ts +28 -28
  435. package/src/ruvocal/src/routes/api/v2/models/[namespace]/subscribe/+server.ts +28 -28
  436. package/src/ruvocal/src/routes/api/v2/models/old/+server.ts +7 -7
  437. package/src/ruvocal/src/routes/api/v2/models/refresh/+server.ts +33 -33
  438. package/src/ruvocal/src/routes/api/v2/public-config/+server.ts +7 -7
  439. package/src/ruvocal/src/routes/api/v2/user/+server.ts +17 -17
  440. package/src/ruvocal/src/routes/api/v2/user/billing-orgs/+server.ts +73 -73
  441. package/src/ruvocal/src/routes/api/v2/user/reports/+server.ts +17 -17
  442. package/src/ruvocal/src/routes/api/v2/user/settings/+server.ts +110 -110
  443. package/src/ruvocal/src/routes/conversation/+server.ts +115 -115
  444. package/src/ruvocal/src/routes/conversation/[id]/+page.svelte +586 -586
  445. package/src/ruvocal/src/routes/conversation/[id]/+page.ts +60 -60
  446. package/src/ruvocal/src/routes/conversation/[id]/+server.ts +740 -740
  447. package/src/ruvocal/src/routes/conversation/[id]/message/[messageId]/prompt/+server.ts +66 -66
  448. package/src/ruvocal/src/routes/conversation/[id]/share/+server.ts +69 -69
  449. package/src/ruvocal/src/routes/conversation/[id]/stop-generating/+server.ts +35 -35
  450. package/src/ruvocal/src/routes/healthcheck/+server.ts +3 -3
  451. package/src/ruvocal/src/routes/login/+server.ts +5 -5
  452. package/src/ruvocal/src/routes/login/callback/+server.ts +103 -103
  453. package/src/ruvocal/src/routes/login/callback/updateUser.spec.ts +157 -157
  454. package/src/ruvocal/src/routes/login/callback/updateUser.ts +215 -215
  455. package/src/ruvocal/src/routes/logout/+server.ts +18 -18
  456. package/src/ruvocal/src/routes/metrics/+server.ts +18 -18
  457. package/src/ruvocal/src/routes/models/+page.svelte +233 -233
  458. package/src/ruvocal/src/routes/models/[...model]/+page.svelte +161 -161
  459. package/src/ruvocal/src/routes/models/[...model]/+page.ts +14 -14
  460. package/src/ruvocal/src/routes/models/[...model]/thumbnail.png/+server.ts +64 -64
  461. package/src/ruvocal/src/routes/models/[...model]/thumbnail.png/ModelThumbnail.svelte +28 -28
  462. package/src/ruvocal/src/routes/privacy/+page.svelte +11 -11
  463. package/src/ruvocal/src/routes/r/[id]/+page.ts +34 -34
  464. package/src/ruvocal/src/routes/settings/(nav)/+layout.svelte +282 -282
  465. package/src/ruvocal/src/routes/settings/(nav)/+layout.ts +1 -1
  466. package/src/ruvocal/src/routes/settings/(nav)/+server.ts +59 -59
  467. package/src/ruvocal/src/routes/settings/(nav)/[...model]/+page.svelte +464 -464
  468. package/src/ruvocal/src/routes/settings/(nav)/[...model]/+page.ts +14 -14
  469. package/src/ruvocal/src/routes/settings/(nav)/application/+page.svelte +362 -362
  470. package/src/ruvocal/src/routes/settings/+layout.svelte +40 -40
  471. package/src/ruvocal/src/styles/highlight-js.css +195 -195
  472. package/src/ruvocal/src/styles/main.css +144 -144
  473. package/src/ruvocal/static/chatui/favicon-dark.svg +3 -3
  474. package/src/ruvocal/static/chatui/favicon-dev.svg +3 -3
  475. package/src/ruvocal/static/chatui/favicon.svg +3 -3
  476. package/src/ruvocal/static/chatui/icon.svg +3 -3
  477. package/src/ruvocal/static/chatui/logo.svg +7 -7
  478. package/src/ruvocal/static/chatui/manifest.json +54 -54
  479. package/src/ruvocal/static/chatui/welcome.js +184 -184
  480. package/src/ruvocal/static/huggingchat/favicon-dark.svg +4 -4
  481. package/src/ruvocal/static/huggingchat/favicon-dev.svg +4 -4
  482. package/src/ruvocal/static/huggingchat/favicon.svg +4 -4
  483. package/src/ruvocal/static/huggingchat/fulltext-logo.svg +1 -1
  484. package/src/ruvocal/static/huggingchat/icon.svg +4 -4
  485. package/src/ruvocal/static/huggingchat/logo.svg +4 -4
  486. package/src/ruvocal/static/huggingchat/manifest.json +54 -54
  487. package/src/ruvocal/static/huggingchat/routes.chat.json +226 -226
  488. package/src/ruvocal/static/robots.txt +10 -10
  489. package/src/ruvocal/static/wasm/rvagent_wasm.js +1539 -1539
  490. package/src/ruvocal/stub/@reflink/reflink/package.json +5 -5
  491. package/src/ruvocal/svelte.config.js +53 -53
  492. package/src/ruvocal/tailwind.config.cjs +30 -30
  493. package/src/ruvocal/tsconfig.json +19 -19
  494. package/src/ruvocal/vite.config.ts +87 -87
  495. package/src/scripts/deploy.sh +116 -116
  496. package/src/scripts/generate-config.js +245 -245
  497. package/src/scripts/generate-welcome.js +187 -187
  498. package/src/scripts/package-rvf.sh +116 -116
@@ -1,518 +1,518 @@
1
- import { config } from "$lib/server/config";
2
- import type { ChatTemplateInput } from "$lib/types/Template";
3
- import { z } from "zod";
4
- import endpoints, { endpointSchema, type Endpoint } from "./endpoints/endpoints";
5
-
6
- import JSON5 from "json5";
7
- import { logger } from "$lib/server/logger";
8
- import { makeRouterEndpoint } from "$lib/server/router/endpoint";
9
-
10
- type Optional<T, K extends keyof T> = Pick<Partial<T>, K> & Omit<T, K>;
11
-
12
- const sanitizeJSONEnv = (val: string, fallback: string) => {
13
- const raw = (val ?? "").trim();
14
- const unquoted = raw.startsWith("`") && raw.endsWith("`") ? raw.slice(1, -1) : raw;
15
- return unquoted || fallback;
16
- };
17
-
18
- const modelConfig = z.object({
19
- /** Used as an identifier in DB */
20
- id: z.string().optional(),
21
- /** Used to link to the model page, and for inference */
22
- name: z.string().default(""),
23
- displayName: z.string().min(1).optional(),
24
- description: z.string().min(1).optional(),
25
- logoUrl: z.string().url().optional(),
26
- websiteUrl: z.string().url().optional(),
27
- modelUrl: z.string().url().optional(),
28
- tokenizer: z.never().optional(),
29
- datasetName: z.string().min(1).optional(),
30
- datasetUrl: z.string().url().optional(),
31
- preprompt: z.string().default(""),
32
- prepromptUrl: z.string().url().optional(),
33
- chatPromptTemplate: z.never().optional(),
34
- promptExamples: z
35
- .array(
36
- z.object({
37
- title: z.string().min(1),
38
- prompt: z.string().min(1),
39
- })
40
- )
41
- .optional(),
42
- endpoints: z.array(endpointSchema).optional(),
43
- providers: z.array(z.object({ supports_tools: z.boolean().optional() }).passthrough()).optional(),
44
- parameters: z
45
- .object({
46
- temperature: z.number().min(0).max(2).optional(),
47
- truncate: z.number().int().positive().optional(),
48
- max_tokens: z.number().int().positive().optional(),
49
- stop: z.array(z.string()).optional(),
50
- top_p: z.number().positive().optional(),
51
- top_k: z.number().positive().optional(),
52
- frequency_penalty: z.number().min(-2).max(2).optional(),
53
- presence_penalty: z.number().min(-2).max(2).optional(),
54
- })
55
- .passthrough()
56
- .optional(),
57
- multimodal: z.boolean().default(false),
58
- multimodalAcceptedMimetypes: z.array(z.string()).optional(),
59
- // Aggregated tool-calling capability across providers (HF router)
60
- supportsTools: z.boolean().default(false),
61
- unlisted: z.boolean().default(false),
62
- embeddingModel: z.never().optional(),
63
- /** Used to enable/disable system prompt usage */
64
- systemRoleSupported: z.boolean().default(true),
65
- });
66
-
67
- type ModelConfig = z.infer<typeof modelConfig>;
68
-
69
- const overrideEntrySchema = modelConfig
70
- .partial()
71
- .extend({
72
- id: z.string().optional(),
73
- name: z.string().optional(),
74
- })
75
- .refine((value) => Boolean((value.id ?? value.name)?.trim()), {
76
- message: "Model override entry must provide an id or name",
77
- });
78
-
79
- type ModelOverride = z.infer<typeof overrideEntrySchema>;
80
-
81
- const openaiBaseUrl = config.OPENAI_BASE_URL
82
- ? config.OPENAI_BASE_URL.replace(/\/$/, "")
83
- : undefined;
84
- const isHFRouter = openaiBaseUrl === "https://router.huggingface.co/v1";
85
-
86
- const listSchema = z
87
- .object({
88
- data: z.array(
89
- z.object({
90
- id: z.string(),
91
- description: z.string().optional(),
92
- providers: z
93
- .array(z.object({ supports_tools: z.boolean().optional() }).passthrough())
94
- .optional(),
95
- architecture: z
96
- .object({
97
- input_modalities: z.array(z.string()).optional(),
98
- })
99
- .passthrough()
100
- .optional(),
101
- })
102
- ),
103
- })
104
- .passthrough();
105
-
106
- function getChatPromptRender(_m: ModelConfig): (inputs: ChatTemplateInput) => string {
107
- // Minimal template to support legacy "completions" flow if ever used.
108
- // We avoid any tokenizer/Jinja usage in this build.
109
- return ({ messages, preprompt }) => {
110
- const parts: string[] = [];
111
- if (preprompt) parts.push(`[SYSTEM]\n${preprompt}`);
112
- for (const msg of messages) {
113
- const role = msg.from === "assistant" ? "ASSISTANT" : msg.from.toUpperCase();
114
- parts.push(`[${role}]\n${msg.content}`);
115
- }
116
- parts.push(`[ASSISTANT]`);
117
- return parts.join("\n\n");
118
- };
119
- }
120
-
121
- const processModel = async (m: ModelConfig) => ({
122
- ...m,
123
- chatPromptRender: await getChatPromptRender(m),
124
- id: m.id || m.name,
125
- displayName: m.displayName || m.name,
126
- preprompt: m.prepromptUrl ? await fetch(m.prepromptUrl).then((r) => r.text()) : m.preprompt,
127
- parameters: { ...m.parameters, stop_sequences: m.parameters?.stop },
128
- unlisted: m.unlisted ?? false,
129
- });
130
-
131
- const addEndpoint = (m: Awaited<ReturnType<typeof processModel>>) => ({
132
- ...m,
133
- getEndpoint: async (): Promise<Endpoint> => {
134
- if (!m.endpoints || m.endpoints.length === 0) {
135
- throw new Error("No endpoints configured. This build requires OpenAI-compatible endpoints.");
136
- }
137
- // Only support OpenAI-compatible endpoints in this build
138
- const endpoint = m.endpoints[0];
139
- if (endpoint.type !== "openai") {
140
- throw new Error("Only 'openai' endpoint type is supported in this build");
141
- }
142
- return await endpoints.openai({ ...endpoint, model: m });
143
- },
144
- });
145
-
146
- type InternalProcessedModel = Awaited<ReturnType<typeof addEndpoint>> & {
147
- isRouter: boolean;
148
- hasInferenceAPI: boolean;
149
- };
150
-
151
- const inferenceApiIds: string[] = [];
152
-
153
- const getModelOverrides = (): ModelOverride[] => {
154
- const overridesEnv = (Reflect.get(config, "MODELS") as string | undefined) ?? "";
155
-
156
- if (!overridesEnv.trim()) {
157
- return [];
158
- }
159
-
160
- try {
161
- return z.array(overrideEntrySchema).parse(JSON5.parse(sanitizeJSONEnv(overridesEnv, "[]")));
162
- } catch (error) {
163
- logger.error(error, "[models] Failed to parse MODELS overrides");
164
- return [];
165
- }
166
- };
167
-
168
- export type ModelsRefreshSummary = {
169
- refreshedAt: Date;
170
- durationMs: number;
171
- added: string[];
172
- removed: string[];
173
- changed: string[];
174
- total: number;
175
- };
176
-
177
- export type ProcessedModel = InternalProcessedModel;
178
-
179
- export let models: ProcessedModel[] = [];
180
- export let defaultModel!: ProcessedModel;
181
- export let taskModel!: ProcessedModel;
182
- export let validModelIdSchema: z.ZodType<string> = z.string();
183
- export let lastModelRefresh = new Date(0);
184
- export let lastModelRefreshDurationMs = 0;
185
- export let lastModelRefreshSummary: ModelsRefreshSummary = {
186
- refreshedAt: new Date(0),
187
- durationMs: 0,
188
- added: [],
189
- removed: [],
190
- changed: [],
191
- total: 0,
192
- };
193
-
194
- let inflightRefresh: Promise<ModelsRefreshSummary> | null = null;
195
-
196
- const createValidModelIdSchema = (modelList: ProcessedModel[]): z.ZodType<string> => {
197
- if (modelList.length === 0) {
198
- throw new Error("No models available to build validation schema");
199
- }
200
- const ids = new Set(modelList.map((m) => m.id));
201
- return z.string().refine((value) => ids.has(value), "Invalid model id");
202
- };
203
-
204
- const resolveTaskModel = (modelList: ProcessedModel[]) => {
205
- if (modelList.length === 0) {
206
- throw new Error("No models available to select task model");
207
- }
208
-
209
- if (config.TASK_MODEL) {
210
- const preferred = modelList.find(
211
- (m) => m.name === config.TASK_MODEL || m.id === config.TASK_MODEL
212
- );
213
- if (preferred) {
214
- return preferred;
215
- }
216
- }
217
-
218
- return modelList[0];
219
- };
220
-
221
- const signatureForModel = (model: ProcessedModel) =>
222
- JSON.stringify({
223
- description: model.description,
224
- displayName: model.displayName,
225
- providers: model.providers,
226
- parameters: model.parameters,
227
- preprompt: model.preprompt,
228
- prepromptUrl: model.prepromptUrl,
229
- endpoints:
230
- model.endpoints?.map((endpoint) => {
231
- if (endpoint.type === "openai") {
232
- const { type, baseURL } = endpoint;
233
- return { type, baseURL };
234
- }
235
- return { type: endpoint.type };
236
- }) ?? null,
237
- multimodal: model.multimodal,
238
- multimodalAcceptedMimetypes: model.multimodalAcceptedMimetypes,
239
- supportsTools: (model as unknown as { supportsTools?: boolean }).supportsTools ?? false,
240
- isRouter: model.isRouter,
241
- hasInferenceAPI: model.hasInferenceAPI,
242
- });
243
-
244
- const applyModelState = (newModels: ProcessedModel[], startedAt: number): ModelsRefreshSummary => {
245
- if (newModels.length === 0) {
246
- throw new Error("Failed to load any models from upstream");
247
- }
248
-
249
- const previousIds = new Set(models.map((m) => m.id));
250
- const previousSignatures = new Map(models.map((m) => [m.id, signatureForModel(m)]));
251
- const refreshedAt = new Date();
252
- const durationMs = Date.now() - startedAt;
253
-
254
- models = newModels;
255
- defaultModel = models[0];
256
- taskModel = resolveTaskModel(models);
257
- validModelIdSchema = createValidModelIdSchema(models);
258
- lastModelRefresh = refreshedAt;
259
- lastModelRefreshDurationMs = durationMs;
260
-
261
- const added = newModels.map((m) => m.id).filter((id) => !previousIds.has(id));
262
- const removed = Array.from(previousIds).filter(
263
- (id) => !newModels.some((model) => model.id === id)
264
- );
265
- const changed = newModels
266
- .filter((model) => {
267
- const previousSignature = previousSignatures.get(model.id);
268
- return previousSignature !== undefined && previousSignature !== signatureForModel(model);
269
- })
270
- .map((model) => model.id);
271
-
272
- const summary: ModelsRefreshSummary = {
273
- refreshedAt,
274
- durationMs,
275
- added,
276
- removed,
277
- changed,
278
- total: models.length,
279
- };
280
-
281
- lastModelRefreshSummary = summary;
282
-
283
- logger.info(
284
- {
285
- total: summary.total,
286
- added: summary.added,
287
- removed: summary.removed,
288
- changed: summary.changed,
289
- durationMs: summary.durationMs,
290
- },
291
- "[models] Model cache refreshed"
292
- );
293
-
294
- return summary;
295
- };
296
-
297
- const buildModels = async (): Promise<ProcessedModel[]> => {
298
- if (!openaiBaseUrl) {
299
- logger.error(
300
- "OPENAI_BASE_URL is required. Set it to an OpenAI-compatible base (e.g., https://router.huggingface.co/v1)."
301
- );
302
- throw new Error("OPENAI_BASE_URL not set");
303
- }
304
-
305
- try {
306
- const baseURL = openaiBaseUrl;
307
- logger.info({ baseURL }, "[models] Using OpenAI-compatible base URL");
308
-
309
- // Canonical auth token is OPENAI_API_KEY; keep HF_TOKEN as legacy alias
310
- const authToken = config.OPENAI_API_KEY || config.HF_TOKEN;
311
-
312
- // Use auth token from the start if available to avoid rate limiting issues
313
- // Some APIs rate-limit unauthenticated requests more aggressively
314
- const response = await fetch(`${baseURL}/models`, {
315
- headers: authToken ? { Authorization: `Bearer ${authToken}` } : undefined,
316
- });
317
- logger.info({ status: response.status }, "[models] First fetch status");
318
- if (!response.ok && response.status === 401 && !authToken) {
319
- // If we get 401 and didn't have a token, there's nothing we can do
320
- throw new Error(
321
- `Failed to fetch ${baseURL}/models: ${response.status} ${response.statusText} (no auth token available)`
322
- );
323
- }
324
- if (!response.ok) {
325
- throw new Error(
326
- `Failed to fetch ${baseURL}/models: ${response.status} ${response.statusText}`
327
- );
328
- }
329
- const json = await response.json();
330
- logger.info({ keys: Object.keys(json || {}) }, "[models] Response keys");
331
-
332
- const parsed = listSchema.parse(json);
333
- logger.info({ count: parsed.data.length }, "[models] Parsed models count");
334
-
335
- let modelsRaw = parsed.data.map((m) => {
336
- let logoUrl: string | undefined = undefined;
337
- if (isHFRouter && m.id.includes("/")) {
338
- const org = m.id.split("/")[0];
339
- logoUrl = `https://huggingface.co/api/avatars/${encodeURIComponent(org)}`;
340
- }
341
-
342
- const inputModalities = (m.architecture?.input_modalities ?? []).map((modality) =>
343
- modality.toLowerCase()
344
- );
345
- const supportsImageInput =
346
- inputModalities.includes("image") || inputModalities.includes("vision");
347
-
348
- // If any provider supports tools, consider the model as supporting tools
349
- const supportsTools = Boolean((m.providers ?? []).some((p) => p?.supports_tools === true));
350
- return {
351
- id: m.id,
352
- name: m.id,
353
- displayName: m.id,
354
- description: m.description,
355
- logoUrl,
356
- providers: m.providers,
357
- multimodal: supportsImageInput,
358
- multimodalAcceptedMimetypes: supportsImageInput ? ["image/*"] : undefined,
359
- supportsTools,
360
- endpoints: [
361
- {
362
- type: "openai" as const,
363
- baseURL,
364
- // apiKey will be taken from OPENAI_API_KEY or HF_TOKEN automatically
365
- },
366
- ],
367
- } as ModelConfig;
368
- }) as ModelConfig[];
369
-
370
- const overrides = getModelOverrides();
371
-
372
- if (overrides.length) {
373
- const overrideMap = new Map<string, ModelOverride>();
374
- for (const override of overrides) {
375
- for (const key of [override.id, override.name]) {
376
- const trimmed = key?.trim();
377
- if (trimmed) overrideMap.set(trimmed, override);
378
- }
379
- }
380
-
381
- // Filter to only configured models and apply overrides, preserving MODELS order
382
- const filteredAndOrdered: ModelConfig[] = [];
383
- for (const override of overrides) {
384
- const matchKey = override.name?.trim() || override.id?.trim() || "";
385
- const found = modelsRaw.find(
386
- (model) => model.id === matchKey || model.name === matchKey
387
- );
388
- if (found) {
389
- const { id, name, ...rest } = override;
390
- void id;
391
- void name;
392
- filteredAndOrdered.push({ ...found, ...rest });
393
- }
394
- }
395
-
396
- // If we matched at least one, use filtered list; otherwise fall back to all models with overrides
397
- if (filteredAndOrdered.length > 0) {
398
- modelsRaw = filteredAndOrdered;
399
- } else {
400
- modelsRaw = modelsRaw.map((model) => {
401
- const override = overrideMap.get(model.id ?? "") ?? overrideMap.get(model.name ?? "");
402
- if (!override) return model;
403
-
404
- const { id, name, ...rest } = override;
405
- void id;
406
- void name;
407
-
408
- return {
409
- ...model,
410
- ...rest,
411
- };
412
- });
413
- }
414
- }
415
-
416
- const builtModels = await Promise.all(
417
- modelsRaw.map((e) =>
418
- processModel(e)
419
- .then(addEndpoint)
420
- .then(async (m) => ({
421
- ...m,
422
- hasInferenceAPI: inferenceApiIds.includes(m.id ?? m.name),
423
- // router decoration added later
424
- isRouter: false as boolean,
425
- }))
426
- )
427
- );
428
-
429
- const archBase = (config.LLM_ROUTER_ARCH_BASE_URL || "").trim();
430
- const routerLabel = (config.PUBLIC_LLM_ROUTER_DISPLAY_NAME || "Omni").trim() || "Omni";
431
- const routerLogo = (config.PUBLIC_LLM_ROUTER_LOGO_URL || "").trim();
432
- const routerAliasId = (config.PUBLIC_LLM_ROUTER_ALIAS_ID || "omni").trim() || "omni";
433
- const routerMultimodalEnabled =
434
- (config.LLM_ROUTER_ENABLE_MULTIMODAL || "").toLowerCase() === "true";
435
- const routerToolsEnabled = (config.LLM_ROUTER_ENABLE_TOOLS || "").toLowerCase() === "true";
436
-
437
- let decorated = builtModels as ProcessedModel[];
438
-
439
- if (archBase) {
440
- // Build a minimal model config for the alias
441
- const aliasRaw = {
442
- id: routerAliasId,
443
- name: routerAliasId,
444
- displayName: routerLabel,
445
- description: "Automatically routes your messages to the best model for your request.",
446
- logoUrl: routerLogo || undefined,
447
- preprompt: "",
448
- endpoints: [
449
- {
450
- type: "openai" as const,
451
- baseURL: openaiBaseUrl,
452
- },
453
- ],
454
- // Keep the alias visible
455
- unlisted: false,
456
- } as ModelConfig;
457
-
458
- if (routerMultimodalEnabled) {
459
- aliasRaw.multimodal = true;
460
- aliasRaw.multimodalAcceptedMimetypes = ["image/*"];
461
- }
462
-
463
- if (routerToolsEnabled) {
464
- aliasRaw.supportsTools = true;
465
- }
466
-
467
- const aliasBase = await processModel(aliasRaw);
468
- // Create a self-referential ProcessedModel for the router endpoint
469
- const aliasModel: ProcessedModel = {
470
- ...aliasBase,
471
- isRouter: true,
472
- hasInferenceAPI: false,
473
- // getEndpoint uses the router wrapper regardless of the endpoints array
474
- getEndpoint: async (): Promise<Endpoint> => makeRouterEndpoint(aliasModel),
475
- } as ProcessedModel;
476
-
477
- // Put alias first
478
- decorated = [aliasModel, ...decorated];
479
- }
480
-
481
- return decorated;
482
- } catch (e) {
483
- logger.error(e, "Failed to load models from OpenAI base URL");
484
- throw e;
485
- }
486
- };
487
-
488
- const rebuildModels = async (): Promise<ModelsRefreshSummary> => {
489
- const startedAt = Date.now();
490
- const newModels = await buildModels();
491
- return applyModelState(newModels, startedAt);
492
- };
493
-
494
- await rebuildModels();
495
-
496
- export const refreshModels = async (): Promise<ModelsRefreshSummary> => {
497
- if (inflightRefresh) {
498
- return inflightRefresh;
499
- }
500
-
501
- inflightRefresh = rebuildModels().finally(() => {
502
- inflightRefresh = null;
503
- });
504
-
505
- return inflightRefresh;
506
- };
507
-
508
- export const validateModel = (_models: BackendModel[]) => {
509
- // Zod enum function requires 2 parameters
510
- return z.enum([_models[0].id, ..._models.slice(1).map((m) => m.id)]);
511
- };
512
-
513
- // if `TASK_MODEL` is string & name of a model in `MODELS`, then we use `MODELS[TASK_MODEL]`, else we try to parse `TASK_MODEL` as a model config itself
514
-
515
- export type BackendModel = Optional<
516
- typeof defaultModel,
517
- "preprompt" | "parameters" | "multimodal" | "unlisted" | "hasInferenceAPI"
518
- >;
1
+ import { config } from "$lib/server/config";
2
+ import type { ChatTemplateInput } from "$lib/types/Template";
3
+ import { z } from "zod";
4
+ import endpoints, { endpointSchema, type Endpoint } from "./endpoints/endpoints";
5
+
6
+ import JSON5 from "json5";
7
+ import { logger } from "$lib/server/logger";
8
+ import { makeRouterEndpoint } from "$lib/server/router/endpoint";
9
+
10
+ type Optional<T, K extends keyof T> = Pick<Partial<T>, K> & Omit<T, K>;
11
+
12
+ const sanitizeJSONEnv = (val: string, fallback: string) => {
13
+ const raw = (val ?? "").trim();
14
+ const unquoted = raw.startsWith("`") && raw.endsWith("`") ? raw.slice(1, -1) : raw;
15
+ return unquoted || fallback;
16
+ };
17
+
18
+ const modelConfig = z.object({
19
+ /** Used as an identifier in DB */
20
+ id: z.string().optional(),
21
+ /** Used to link to the model page, and for inference */
22
+ name: z.string().default(""),
23
+ displayName: z.string().min(1).optional(),
24
+ description: z.string().min(1).optional(),
25
+ logoUrl: z.string().url().optional(),
26
+ websiteUrl: z.string().url().optional(),
27
+ modelUrl: z.string().url().optional(),
28
+ tokenizer: z.never().optional(),
29
+ datasetName: z.string().min(1).optional(),
30
+ datasetUrl: z.string().url().optional(),
31
+ preprompt: z.string().default(""),
32
+ prepromptUrl: z.string().url().optional(),
33
+ chatPromptTemplate: z.never().optional(),
34
+ promptExamples: z
35
+ .array(
36
+ z.object({
37
+ title: z.string().min(1),
38
+ prompt: z.string().min(1),
39
+ })
40
+ )
41
+ .optional(),
42
+ endpoints: z.array(endpointSchema).optional(),
43
+ providers: z.array(z.object({ supports_tools: z.boolean().optional() }).passthrough()).optional(),
44
+ parameters: z
45
+ .object({
46
+ temperature: z.number().min(0).max(2).optional(),
47
+ truncate: z.number().int().positive().optional(),
48
+ max_tokens: z.number().int().positive().optional(),
49
+ stop: z.array(z.string()).optional(),
50
+ top_p: z.number().positive().optional(),
51
+ top_k: z.number().positive().optional(),
52
+ frequency_penalty: z.number().min(-2).max(2).optional(),
53
+ presence_penalty: z.number().min(-2).max(2).optional(),
54
+ })
55
+ .passthrough()
56
+ .optional(),
57
+ multimodal: z.boolean().default(false),
58
+ multimodalAcceptedMimetypes: z.array(z.string()).optional(),
59
+ // Aggregated tool-calling capability across providers (HF router)
60
+ supportsTools: z.boolean().default(false),
61
+ unlisted: z.boolean().default(false),
62
+ embeddingModel: z.never().optional(),
63
+ /** Used to enable/disable system prompt usage */
64
+ systemRoleSupported: z.boolean().default(true),
65
+ });
66
+
67
+ type ModelConfig = z.infer<typeof modelConfig>;
68
+
69
+ const overrideEntrySchema = modelConfig
70
+ .partial()
71
+ .extend({
72
+ id: z.string().optional(),
73
+ name: z.string().optional(),
74
+ })
75
+ .refine((value) => Boolean((value.id ?? value.name)?.trim()), {
76
+ message: "Model override entry must provide an id or name",
77
+ });
78
+
79
+ type ModelOverride = z.infer<typeof overrideEntrySchema>;
80
+
81
+ const openaiBaseUrl = config.OPENAI_BASE_URL
82
+ ? config.OPENAI_BASE_URL.replace(/\/$/, "")
83
+ : undefined;
84
+ const isHFRouter = openaiBaseUrl === "https://router.huggingface.co/v1";
85
+
86
+ const listSchema = z
87
+ .object({
88
+ data: z.array(
89
+ z.object({
90
+ id: z.string(),
91
+ description: z.string().optional(),
92
+ providers: z
93
+ .array(z.object({ supports_tools: z.boolean().optional() }).passthrough())
94
+ .optional(),
95
+ architecture: z
96
+ .object({
97
+ input_modalities: z.array(z.string()).optional(),
98
+ })
99
+ .passthrough()
100
+ .optional(),
101
+ })
102
+ ),
103
+ })
104
+ .passthrough();
105
+
106
+ function getChatPromptRender(_m: ModelConfig): (inputs: ChatTemplateInput) => string {
107
+ // Minimal template to support legacy "completions" flow if ever used.
108
+ // We avoid any tokenizer/Jinja usage in this build.
109
+ return ({ messages, preprompt }) => {
110
+ const parts: string[] = [];
111
+ if (preprompt) parts.push(`[SYSTEM]\n${preprompt}`);
112
+ for (const msg of messages) {
113
+ const role = msg.from === "assistant" ? "ASSISTANT" : msg.from.toUpperCase();
114
+ parts.push(`[${role}]\n${msg.content}`);
115
+ }
116
+ parts.push(`[ASSISTANT]`);
117
+ return parts.join("\n\n");
118
+ };
119
+ }
120
+
121
+ const processModel = async (m: ModelConfig) => ({
122
+ ...m,
123
+ chatPromptRender: await getChatPromptRender(m),
124
+ id: m.id || m.name,
125
+ displayName: m.displayName || m.name,
126
+ preprompt: m.prepromptUrl ? await fetch(m.prepromptUrl).then((r) => r.text()) : m.preprompt,
127
+ parameters: { ...m.parameters, stop_sequences: m.parameters?.stop },
128
+ unlisted: m.unlisted ?? false,
129
+ });
130
+
131
+ const addEndpoint = (m: Awaited<ReturnType<typeof processModel>>) => ({
132
+ ...m,
133
+ getEndpoint: async (): Promise<Endpoint> => {
134
+ if (!m.endpoints || m.endpoints.length === 0) {
135
+ throw new Error("No endpoints configured. This build requires OpenAI-compatible endpoints.");
136
+ }
137
+ // Only support OpenAI-compatible endpoints in this build
138
+ const endpoint = m.endpoints[0];
139
+ if (endpoint.type !== "openai") {
140
+ throw new Error("Only 'openai' endpoint type is supported in this build");
141
+ }
142
+ return await endpoints.openai({ ...endpoint, model: m });
143
+ },
144
+ });
145
+
146
+ type InternalProcessedModel = Awaited<ReturnType<typeof addEndpoint>> & {
147
+ isRouter: boolean;
148
+ hasInferenceAPI: boolean;
149
+ };
150
+
151
+ const inferenceApiIds: string[] = [];
152
+
153
+ const getModelOverrides = (): ModelOverride[] => {
154
+ const overridesEnv = (Reflect.get(config, "MODELS") as string | undefined) ?? "";
155
+
156
+ if (!overridesEnv.trim()) {
157
+ return [];
158
+ }
159
+
160
+ try {
161
+ return z.array(overrideEntrySchema).parse(JSON5.parse(sanitizeJSONEnv(overridesEnv, "[]")));
162
+ } catch (error) {
163
+ logger.error(error, "[models] Failed to parse MODELS overrides");
164
+ return [];
165
+ }
166
+ };
167
+
168
+ export type ModelsRefreshSummary = {
169
+ refreshedAt: Date;
170
+ durationMs: number;
171
+ added: string[];
172
+ removed: string[];
173
+ changed: string[];
174
+ total: number;
175
+ };
176
+
177
+ export type ProcessedModel = InternalProcessedModel;
178
+
179
+ export let models: ProcessedModel[] = [];
180
+ export let defaultModel!: ProcessedModel;
181
+ export let taskModel!: ProcessedModel;
182
+ export let validModelIdSchema: z.ZodType<string> = z.string();
183
+ export let lastModelRefresh = new Date(0);
184
+ export let lastModelRefreshDurationMs = 0;
185
+ export let lastModelRefreshSummary: ModelsRefreshSummary = {
186
+ refreshedAt: new Date(0),
187
+ durationMs: 0,
188
+ added: [],
189
+ removed: [],
190
+ changed: [],
191
+ total: 0,
192
+ };
193
+
194
+ let inflightRefresh: Promise<ModelsRefreshSummary> | null = null;
195
+
196
+ const createValidModelIdSchema = (modelList: ProcessedModel[]): z.ZodType<string> => {
197
+ if (modelList.length === 0) {
198
+ throw new Error("No models available to build validation schema");
199
+ }
200
+ const ids = new Set(modelList.map((m) => m.id));
201
+ return z.string().refine((value) => ids.has(value), "Invalid model id");
202
+ };
203
+
204
+ const resolveTaskModel = (modelList: ProcessedModel[]) => {
205
+ if (modelList.length === 0) {
206
+ throw new Error("No models available to select task model");
207
+ }
208
+
209
+ if (config.TASK_MODEL) {
210
+ const preferred = modelList.find(
211
+ (m) => m.name === config.TASK_MODEL || m.id === config.TASK_MODEL
212
+ );
213
+ if (preferred) {
214
+ return preferred;
215
+ }
216
+ }
217
+
218
+ return modelList[0];
219
+ };
220
+
221
+ const signatureForModel = (model: ProcessedModel) =>
222
+ JSON.stringify({
223
+ description: model.description,
224
+ displayName: model.displayName,
225
+ providers: model.providers,
226
+ parameters: model.parameters,
227
+ preprompt: model.preprompt,
228
+ prepromptUrl: model.prepromptUrl,
229
+ endpoints:
230
+ model.endpoints?.map((endpoint) => {
231
+ if (endpoint.type === "openai") {
232
+ const { type, baseURL } = endpoint;
233
+ return { type, baseURL };
234
+ }
235
+ return { type: endpoint.type };
236
+ }) ?? null,
237
+ multimodal: model.multimodal,
238
+ multimodalAcceptedMimetypes: model.multimodalAcceptedMimetypes,
239
+ supportsTools: (model as unknown as { supportsTools?: boolean }).supportsTools ?? false,
240
+ isRouter: model.isRouter,
241
+ hasInferenceAPI: model.hasInferenceAPI,
242
+ });
243
+
244
+ const applyModelState = (newModels: ProcessedModel[], startedAt: number): ModelsRefreshSummary => {
245
+ if (newModels.length === 0) {
246
+ throw new Error("Failed to load any models from upstream");
247
+ }
248
+
249
+ const previousIds = new Set(models.map((m) => m.id));
250
+ const previousSignatures = new Map(models.map((m) => [m.id, signatureForModel(m)]));
251
+ const refreshedAt = new Date();
252
+ const durationMs = Date.now() - startedAt;
253
+
254
+ models = newModels;
255
+ defaultModel = models[0];
256
+ taskModel = resolveTaskModel(models);
257
+ validModelIdSchema = createValidModelIdSchema(models);
258
+ lastModelRefresh = refreshedAt;
259
+ lastModelRefreshDurationMs = durationMs;
260
+
261
+ const added = newModels.map((m) => m.id).filter((id) => !previousIds.has(id));
262
+ const removed = Array.from(previousIds).filter(
263
+ (id) => !newModels.some((model) => model.id === id)
264
+ );
265
+ const changed = newModels
266
+ .filter((model) => {
267
+ const previousSignature = previousSignatures.get(model.id);
268
+ return previousSignature !== undefined && previousSignature !== signatureForModel(model);
269
+ })
270
+ .map((model) => model.id);
271
+
272
+ const summary: ModelsRefreshSummary = {
273
+ refreshedAt,
274
+ durationMs,
275
+ added,
276
+ removed,
277
+ changed,
278
+ total: models.length,
279
+ };
280
+
281
+ lastModelRefreshSummary = summary;
282
+
283
+ logger.info(
284
+ {
285
+ total: summary.total,
286
+ added: summary.added,
287
+ removed: summary.removed,
288
+ changed: summary.changed,
289
+ durationMs: summary.durationMs,
290
+ },
291
+ "[models] Model cache refreshed"
292
+ );
293
+
294
+ return summary;
295
+ };
296
+
297
+ const buildModels = async (): Promise<ProcessedModel[]> => {
298
+ if (!openaiBaseUrl) {
299
+ logger.error(
300
+ "OPENAI_BASE_URL is required. Set it to an OpenAI-compatible base (e.g., https://router.huggingface.co/v1)."
301
+ );
302
+ throw new Error("OPENAI_BASE_URL not set");
303
+ }
304
+
305
+ try {
306
+ const baseURL = openaiBaseUrl;
307
+ logger.info({ baseURL }, "[models] Using OpenAI-compatible base URL");
308
+
309
+ // Canonical auth token is OPENAI_API_KEY; keep HF_TOKEN as legacy alias
310
+ const authToken = config.OPENAI_API_KEY || config.HF_TOKEN;
311
+
312
+ // Use auth token from the start if available to avoid rate limiting issues
313
+ // Some APIs rate-limit unauthenticated requests more aggressively
314
+ const response = await fetch(`${baseURL}/models`, {
315
+ headers: authToken ? { Authorization: `Bearer ${authToken}` } : undefined,
316
+ });
317
+ logger.info({ status: response.status }, "[models] First fetch status");
318
+ if (!response.ok && response.status === 401 && !authToken) {
319
+ // If we get 401 and didn't have a token, there's nothing we can do
320
+ throw new Error(
321
+ `Failed to fetch ${baseURL}/models: ${response.status} ${response.statusText} (no auth token available)`
322
+ );
323
+ }
324
+ if (!response.ok) {
325
+ throw new Error(
326
+ `Failed to fetch ${baseURL}/models: ${response.status} ${response.statusText}`
327
+ );
328
+ }
329
+ const json = await response.json();
330
+ logger.info({ keys: Object.keys(json || {}) }, "[models] Response keys");
331
+
332
+ const parsed = listSchema.parse(json);
333
+ logger.info({ count: parsed.data.length }, "[models] Parsed models count");
334
+
335
+ let modelsRaw = parsed.data.map((m) => {
336
+ let logoUrl: string | undefined = undefined;
337
+ if (isHFRouter && m.id.includes("/")) {
338
+ const org = m.id.split("/")[0];
339
+ logoUrl = `https://huggingface.co/api/avatars/${encodeURIComponent(org)}`;
340
+ }
341
+
342
+ const inputModalities = (m.architecture?.input_modalities ?? []).map((modality) =>
343
+ modality.toLowerCase()
344
+ );
345
+ const supportsImageInput =
346
+ inputModalities.includes("image") || inputModalities.includes("vision");
347
+
348
+ // If any provider supports tools, consider the model as supporting tools
349
+ const supportsTools = Boolean((m.providers ?? []).some((p) => p?.supports_tools === true));
350
+ return {
351
+ id: m.id,
352
+ name: m.id,
353
+ displayName: m.id,
354
+ description: m.description,
355
+ logoUrl,
356
+ providers: m.providers,
357
+ multimodal: supportsImageInput,
358
+ multimodalAcceptedMimetypes: supportsImageInput ? ["image/*"] : undefined,
359
+ supportsTools,
360
+ endpoints: [
361
+ {
362
+ type: "openai" as const,
363
+ baseURL,
364
+ // apiKey will be taken from OPENAI_API_KEY or HF_TOKEN automatically
365
+ },
366
+ ],
367
+ } as ModelConfig;
368
+ }) as ModelConfig[];
369
+
370
+ const overrides = getModelOverrides();
371
+
372
+ if (overrides.length) {
373
+ const overrideMap = new Map<string, ModelOverride>();
374
+ for (const override of overrides) {
375
+ for (const key of [override.id, override.name]) {
376
+ const trimmed = key?.trim();
377
+ if (trimmed) overrideMap.set(trimmed, override);
378
+ }
379
+ }
380
+
381
+ // Filter to only configured models and apply overrides, preserving MODELS order
382
+ const filteredAndOrdered: ModelConfig[] = [];
383
+ for (const override of overrides) {
384
+ const matchKey = override.name?.trim() || override.id?.trim() || "";
385
+ const found = modelsRaw.find(
386
+ (model) => model.id === matchKey || model.name === matchKey
387
+ );
388
+ if (found) {
389
+ const { id, name, ...rest } = override;
390
+ void id;
391
+ void name;
392
+ filteredAndOrdered.push({ ...found, ...rest });
393
+ }
394
+ }
395
+
396
+ // If we matched at least one, use filtered list; otherwise fall back to all models with overrides
397
+ if (filteredAndOrdered.length > 0) {
398
+ modelsRaw = filteredAndOrdered;
399
+ } else {
400
+ modelsRaw = modelsRaw.map((model) => {
401
+ const override = overrideMap.get(model.id ?? "") ?? overrideMap.get(model.name ?? "");
402
+ if (!override) return model;
403
+
404
+ const { id, name, ...rest } = override;
405
+ void id;
406
+ void name;
407
+
408
+ return {
409
+ ...model,
410
+ ...rest,
411
+ };
412
+ });
413
+ }
414
+ }
415
+
416
+ const builtModels = await Promise.all(
417
+ modelsRaw.map((e) =>
418
+ processModel(e)
419
+ .then(addEndpoint)
420
+ .then(async (m) => ({
421
+ ...m,
422
+ hasInferenceAPI: inferenceApiIds.includes(m.id ?? m.name),
423
+ // router decoration added later
424
+ isRouter: false as boolean,
425
+ }))
426
+ )
427
+ );
428
+
429
+ const archBase = (config.LLM_ROUTER_ARCH_BASE_URL || "").trim();
430
+ const routerLabel = (config.PUBLIC_LLM_ROUTER_DISPLAY_NAME || "Omni").trim() || "Omni";
431
+ const routerLogo = (config.PUBLIC_LLM_ROUTER_LOGO_URL || "").trim();
432
+ const routerAliasId = (config.PUBLIC_LLM_ROUTER_ALIAS_ID || "omni").trim() || "omni";
433
+ const routerMultimodalEnabled =
434
+ (config.LLM_ROUTER_ENABLE_MULTIMODAL || "").toLowerCase() === "true";
435
+ const routerToolsEnabled = (config.LLM_ROUTER_ENABLE_TOOLS || "").toLowerCase() === "true";
436
+
437
+ let decorated = builtModels as ProcessedModel[];
438
+
439
+ if (archBase) {
440
+ // Build a minimal model config for the alias
441
+ const aliasRaw = {
442
+ id: routerAliasId,
443
+ name: routerAliasId,
444
+ displayName: routerLabel,
445
+ description: "Automatically routes your messages to the best model for your request.",
446
+ logoUrl: routerLogo || undefined,
447
+ preprompt: "",
448
+ endpoints: [
449
+ {
450
+ type: "openai" as const,
451
+ baseURL: openaiBaseUrl,
452
+ },
453
+ ],
454
+ // Keep the alias visible
455
+ unlisted: false,
456
+ } as ModelConfig;
457
+
458
+ if (routerMultimodalEnabled) {
459
+ aliasRaw.multimodal = true;
460
+ aliasRaw.multimodalAcceptedMimetypes = ["image/*"];
461
+ }
462
+
463
+ if (routerToolsEnabled) {
464
+ aliasRaw.supportsTools = true;
465
+ }
466
+
467
+ const aliasBase = await processModel(aliasRaw);
468
+ // Create a self-referential ProcessedModel for the router endpoint
469
+ const aliasModel: ProcessedModel = {
470
+ ...aliasBase,
471
+ isRouter: true,
472
+ hasInferenceAPI: false,
473
+ // getEndpoint uses the router wrapper regardless of the endpoints array
474
+ getEndpoint: async (): Promise<Endpoint> => makeRouterEndpoint(aliasModel),
475
+ } as ProcessedModel;
476
+
477
+ // Put alias first
478
+ decorated = [aliasModel, ...decorated];
479
+ }
480
+
481
+ return decorated;
482
+ } catch (e) {
483
+ logger.error(e, "Failed to load models from OpenAI base URL");
484
+ throw e;
485
+ }
486
+ };
487
+
488
/**
 * Runs one complete model rebuild.
 *
 * Records the time the rebuild started, awaits `buildModels()`, and passes the
 * resulting models together with that timestamp to `applyModelState`.
 * A rejection from `buildModels()` propagates to the caller unchanged.
 *
 * @returns Whatever summary `applyModelState` produces for this rebuild.
 */
const rebuildModels = async (): Promise<ModelsRefreshSummary> => {
	// Taken before the build so the timestamp marks the start of the rebuild.
	const refreshStart = Date.now();
	const freshModels = await buildModels();
	return applyModelState(freshModels, refreshStart);
};

// Perform the initial build once, when this module is evaluated.
await rebuildModels();
495
+
496
/**
 * Rebuilds the models, sharing a single pending rebuild between concurrent callers.
 *
 * If a rebuild is already pending, its promise is reused instead of starting a
 * second one. The `inflightRefresh` slot is reset to `null` once the rebuild
 * settles (fulfilled or rejected), so the next call starts a fresh rebuild.
 *
 * @returns The summary of the rebuild this call joined or started.
 */
export const refreshModels = async (): Promise<ModelsRefreshSummary> => {
	if (!inflightRefresh) {
		// No rebuild pending: start one and clear the slot when it settles.
		inflightRefresh = rebuildModels().finally(() => {
			inflightRefresh = null;
		});
	}

	return inflightRefresh;
};
507
+
508
/**
 * Builds a Zod enum schema that accepts exactly the ids of the given models.
 *
 * @param _models - Models whose `id` values become the allowed enum members.
 *   Must contain at least one model.
 * @returns A `z.enum` schema over the model ids, in the order given.
 * @throws Error when `_models` is empty, because an enum needs at least one member.
 */
export const validateModel = (_models: BackendModel[]) => {
	const [first, ...rest] = _models;
	if (!first) {
		// Previously this case failed with an opaque TypeError on `_models[0].id`.
		throw new Error("validateModel requires at least one model");
	}

	// z.enum is typed over a non-empty tuple, so the first id is passed separately.
	return z.enum([first.id, ...rest.map((m) => m.id)]);
};
512
+
513
+ // If `TASK_MODEL` is a string that names a model in `MODELS`, we use `MODELS[TASK_MODEL]`; otherwise we try to parse `TASK_MODEL` as a model config itself.
514
+
515
/** Keys of `defaultModel` that are handed to `Optional` when deriving `BackendModel`. */
type BackendModelOptionalKey =
	| "preprompt"
	| "parameters"
	| "multimodal"
	| "unlisted"
	| "hasInferenceAPI";

/**
 * Model shape derived from the type of `defaultModel`, with the keys in
 * `BackendModelOptionalKey` passed through the `Optional` helper.
 * NOTE(review): presumably `Optional<T, K>` makes the listed keys optional — confirm
 * against its declaration.
 */
export type BackendModel = Optional<typeof defaultModel, BackendModelOptionalKey>;