ruflo 3.6.30 → 3.7.0-alpha.10

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (500)
  1. package/README.md +393 -45
  2. package/bin/ruflo.js +57 -57
  3. package/package.json +3 -2
  4. package/src/chat-ui/Dockerfile +25 -25
  5. package/src/chat-ui/patch-mcp-url-safety.sh +28 -28
  6. package/src/config/config.example.json +76 -76
  7. package/src/mcp-bridge/Dockerfile +45 -45
  8. package/src/mcp-bridge/index.js +1668 -1668
  9. package/src/mcp-bridge/mcp-stdio-kernel.js +159 -159
  10. package/src/mcp-bridge/package.json +17 -17
  11. package/src/mcp-bridge/test-harness.js +470 -470
  12. package/src/nginx/Dockerfile +10 -10
  13. package/src/nginx/nginx.conf +67 -67
  14. package/src/nginx/static/favicon-dark.svg +4 -4
  15. package/src/nginx/static/favicon.svg +4 -4
  16. package/src/nginx/static/icon.svg +5 -5
  17. package/src/nginx/static/logo.svg +9 -9
  18. package/src/nginx/static/manifest.json +22 -22
  19. package/src/nginx/static/welcome.js +184 -184
  20. package/src/ruvocal/.claude/skills/add-model-descriptions/SKILL.md +73 -73
  21. package/src/ruvocal/.devcontainer/Dockerfile +9 -9
  22. package/src/ruvocal/.devcontainer/devcontainer.json +36 -36
  23. package/src/ruvocal/.dockerignore +16 -16
  24. package/src/ruvocal/.eslintignore +13 -13
  25. package/src/ruvocal/.eslintrc.cjs +45 -45
  26. package/src/ruvocal/.gcloudignore +18 -18
  27. package/src/ruvocal/.github/ISSUE_TEMPLATE/bug-report--chat-ui-.md +43 -43
  28. package/src/ruvocal/.github/ISSUE_TEMPLATE/config-support.md +9 -9
  29. package/src/ruvocal/.github/ISSUE_TEMPLATE/feature-request--chat-ui-.md +17 -17
  30. package/src/ruvocal/.github/ISSUE_TEMPLATE/huggingchat.md +11 -11
  31. package/src/ruvocal/.github/release.yml +16 -16
  32. package/src/ruvocal/.github/workflows/build-docs.yml +18 -18
  33. package/src/ruvocal/.github/workflows/build-image.yml +142 -142
  34. package/src/ruvocal/.github/workflows/build-pr-docs.yml +20 -20
  35. package/src/ruvocal/.github/workflows/deploy-dev.yml +63 -63
  36. package/src/ruvocal/.github/workflows/deploy-prod.yml +78 -78
  37. package/src/ruvocal/.github/workflows/lint-and-test.yml +84 -84
  38. package/src/ruvocal/.github/workflows/slugify.yaml +72 -72
  39. package/src/ruvocal/.github/workflows/trufflehog.yml +17 -17
  40. package/src/ruvocal/.github/workflows/upload-pr-documentation.yml +16 -16
  41. package/src/ruvocal/.husky/lint-stage-config.js +4 -4
  42. package/src/ruvocal/.husky/pre-commit +2 -2
  43. package/src/ruvocal/.prettierignore +14 -14
  44. package/src/ruvocal/.prettierrc +7 -7
  45. package/src/ruvocal/CLAUDE.md +126 -126
  46. package/src/ruvocal/Dockerfile +96 -96
  47. package/src/ruvocal/LICENSE +202 -202
  48. package/src/ruvocal/PRIVACY.md +41 -41
  49. package/src/ruvocal/README.md +164 -164
  50. package/src/ruvocal/chart/Chart.yaml +5 -5
  51. package/src/ruvocal/chart/env/dev.yaml +260 -260
  52. package/src/ruvocal/chart/env/prod.yaml +273 -273
  53. package/src/ruvocal/chart/templates/_helpers.tpl +22 -22
  54. package/src/ruvocal/chart/templates/config.yaml +10 -10
  55. package/src/ruvocal/chart/templates/deployment.yaml +81 -81
  56. package/src/ruvocal/chart/templates/hpa.yaml +45 -45
  57. package/src/ruvocal/chart/templates/infisical.yaml +24 -24
  58. package/src/ruvocal/chart/templates/ingress-internal.yaml +32 -32
  59. package/src/ruvocal/chart/templates/ingress.yaml +32 -32
  60. package/src/ruvocal/chart/templates/network-policy.yaml +36 -36
  61. package/src/ruvocal/chart/templates/service-account.yaml +13 -13
  62. package/src/ruvocal/chart/templates/service-monitor.yaml +17 -17
  63. package/src/ruvocal/chart/templates/service.yaml +21 -21
  64. package/src/ruvocal/chart/values.yaml +73 -73
  65. package/src/ruvocal/cloudbuild.yaml +68 -68
  66. package/src/ruvocal/config/branding.env.example +19 -19
  67. package/src/ruvocal/docker-compose.yml +21 -21
  68. package/src/ruvocal/docs/adr/ADR-029-HUGGINGFACE-CHAT-UI-CLOUD-RUN.md +1236 -1236
  69. package/src/ruvocal/docs/adr/ADR-033-RUVECTOR-RUFLO-MCP-INTEGRATION.md +111 -111
  70. package/src/ruvocal/docs/adr/ADR-034-OPTIONAL-MCP-BACKENDS.md +117 -117
  71. package/src/ruvocal/docs/adr/ADR-035-MCP-TOOL-GROUPS.md +186 -186
  72. package/src/ruvocal/docs/adr/ADR-037-AUTOPILOT-CHAT-MODE.md +1500 -1500
  73. package/src/ruvocal/docs/adr/ADR-038-RUVOCAL-FORK.md +286 -286
  74. package/src/ruvocal/docs/source/_toctree.yml +30 -30
  75. package/src/ruvocal/docs/source/configuration/common-issues.md +38 -38
  76. package/src/ruvocal/docs/source/configuration/llm-router.md +105 -105
  77. package/src/ruvocal/docs/source/configuration/mcp-tools.md +84 -84
  78. package/src/ruvocal/docs/source/configuration/metrics.md +9 -9
  79. package/src/ruvocal/docs/source/configuration/open-id.md +57 -57
  80. package/src/ruvocal/docs/source/configuration/overview.md +89 -89
  81. package/src/ruvocal/docs/source/configuration/theming.md +20 -20
  82. package/src/ruvocal/docs/source/developing/architecture.md +48 -48
  83. package/src/ruvocal/docs/source/index.md +53 -53
  84. package/src/ruvocal/docs/source/installation/docker.md +43 -43
  85. package/src/ruvocal/docs/source/installation/helm.md +43 -43
  86. package/src/ruvocal/docs/source/installation/local.md +62 -62
  87. package/src/ruvocal/entrypoint.sh +18 -18
  88. package/src/ruvocal/mcp-bridge/Dockerfile +45 -45
  89. package/src/ruvocal/mcp-bridge/cloudbuild.yaml +49 -49
  90. package/src/ruvocal/mcp-bridge/index.js +1878 -1878
  91. package/src/ruvocal/mcp-bridge/mcp-stdio-kernel.js +159 -159
  92. package/src/ruvocal/mcp-bridge/package-lock.json +762 -762
  93. package/src/ruvocal/mcp-bridge/package.json +17 -17
  94. package/src/ruvocal/mcp-bridge/test-harness.js +470 -470
  95. package/src/ruvocal/package-lock.json +11741 -11741
  96. package/src/ruvocal/package.json +121 -121
  97. package/src/ruvocal/postcss.config.js +6 -6
  98. package/src/ruvocal/rvf.manifest.json +204 -204
  99. package/src/ruvocal/scripts/config.ts +64 -64
  100. package/src/ruvocal/scripts/generate-welcome.mjs +181 -181
  101. package/src/ruvocal/scripts/populate.ts +288 -288
  102. package/src/ruvocal/scripts/samples.txt +194 -194
  103. package/src/ruvocal/scripts/setups/vitest-setup-server.ts +44 -44
  104. package/src/ruvocal/scripts/updateLocalEnv.ts +48 -48
  105. package/src/ruvocal/src/ambient.d.ts +7 -7
  106. package/src/ruvocal/src/app.d.ts +29 -29
  107. package/src/ruvocal/src/app.html +53 -53
  108. package/src/ruvocal/src/hooks.server.ts +32 -32
  109. package/src/ruvocal/src/hooks.ts +6 -6
  110. package/src/ruvocal/src/lib/APIClient.ts +148 -148
  111. package/src/ruvocal/src/lib/actions/clickOutside.ts +18 -18
  112. package/src/ruvocal/src/lib/actions/snapScrollToBottom.ts +346 -346
  113. package/src/ruvocal/src/lib/buildPrompt.ts +33 -33
  114. package/src/ruvocal/src/lib/components/AnnouncementBanner.svelte +20 -20
  115. package/src/ruvocal/src/lib/components/BackgroundGenerationPoller.svelte +168 -168
  116. package/src/ruvocal/src/lib/components/CodeBlock.svelte +73 -73
  117. package/src/ruvocal/src/lib/components/CopyToClipBoardBtn.svelte +92 -92
  118. package/src/ruvocal/src/lib/components/DeleteConversationModal.svelte +75 -75
  119. package/src/ruvocal/src/lib/components/EditConversationModal.svelte +100 -100
  120. package/src/ruvocal/src/lib/components/ExpandNavigation.svelte +22 -22
  121. package/src/ruvocal/src/lib/components/FoundationBackground.svelte +242 -242
  122. package/src/ruvocal/src/lib/components/HoverTooltip.svelte +44 -44
  123. package/src/ruvocal/src/lib/components/HtmlPreviewModal.svelte +143 -143
  124. package/src/ruvocal/src/lib/components/InfiniteScroll.svelte +50 -50
  125. package/src/ruvocal/src/lib/components/MobileNav.svelte +300 -300
  126. package/src/ruvocal/src/lib/components/Modal.svelte +115 -115
  127. package/src/ruvocal/src/lib/components/ModelCardMetadata.svelte +71 -71
  128. package/src/ruvocal/src/lib/components/NavConversationItem.svelte +151 -151
  129. package/src/ruvocal/src/lib/components/NavMenu.svelte +313 -313
  130. package/src/ruvocal/src/lib/components/Pagination.svelte +97 -97
  131. package/src/ruvocal/src/lib/components/PaginationArrow.svelte +27 -27
  132. package/src/ruvocal/src/lib/components/Portal.svelte +24 -24
  133. package/src/ruvocal/src/lib/components/RetryBtn.svelte +18 -18
  134. package/src/ruvocal/src/lib/components/RuFloUniverse.svelte +185 -185
  135. package/src/ruvocal/src/lib/components/RufloHelpModal.svelte +411 -411
  136. package/src/ruvocal/src/lib/components/ScrollToBottomBtn.svelte +47 -47
  137. package/src/ruvocal/src/lib/components/ScrollToPreviousBtn.svelte +77 -77
  138. package/src/ruvocal/src/lib/components/ShareConversationModal.svelte +182 -182
  139. package/src/ruvocal/src/lib/components/StopGeneratingBtn.svelte +69 -69
  140. package/src/ruvocal/src/lib/components/SubscribeModal.svelte +87 -87
  141. package/src/ruvocal/src/lib/components/Switch.svelte +36 -36
  142. package/src/ruvocal/src/lib/components/SystemPromptModal.svelte +44 -44
  143. package/src/ruvocal/src/lib/components/Toast.svelte +27 -27
  144. package/src/ruvocal/src/lib/components/Tooltip.svelte +30 -30
  145. package/src/ruvocal/src/lib/components/WelcomeModal.svelte +46 -46
  146. package/src/ruvocal/src/lib/components/chat/Alternatives.svelte +77 -77
  147. package/src/ruvocal/src/lib/components/chat/BlockWrapper.svelte +72 -72
  148. package/src/ruvocal/src/lib/components/chat/ChatInput.svelte +490 -490
  149. package/src/ruvocal/src/lib/components/chat/ChatIntroduction.svelte +123 -123
  150. package/src/ruvocal/src/lib/components/chat/ChatMessage.svelte +548 -548
  151. package/src/ruvocal/src/lib/components/chat/ChatWindow.svelte +1057 -1057
  152. package/src/ruvocal/src/lib/components/chat/FileDropzone.svelte +92 -92
  153. package/src/ruvocal/src/lib/components/chat/ImageLightbox.svelte +66 -66
  154. package/src/ruvocal/src/lib/components/chat/MarkdownBlock.svelte +23 -23
  155. package/src/ruvocal/src/lib/components/chat/MarkdownRenderer.svelte +69 -69
  156. package/src/ruvocal/src/lib/components/chat/MarkdownRenderer.svelte.test.ts +58 -58
  157. package/src/ruvocal/src/lib/components/chat/MessageAvatar.svelte +103 -103
  158. package/src/ruvocal/src/lib/components/chat/ModelSwitch.svelte +64 -64
  159. package/src/ruvocal/src/lib/components/chat/OpenReasoningResults.svelte +81 -81
  160. package/src/ruvocal/src/lib/components/chat/TaskGroup.svelte +88 -88
  161. package/src/ruvocal/src/lib/components/chat/ToolUpdate.svelte +273 -273
  162. package/src/ruvocal/src/lib/components/chat/UploadedFile.svelte +253 -253
  163. package/src/ruvocal/src/lib/components/chat/UrlFetchModal.svelte +203 -203
  164. package/src/ruvocal/src/lib/components/chat/VoiceRecorder.svelte +214 -214
  165. package/src/ruvocal/src/lib/components/icons/IconBurger.svelte +20 -20
  166. package/src/ruvocal/src/lib/components/icons/IconCheap.svelte +20 -20
  167. package/src/ruvocal/src/lib/components/icons/IconChevron.svelte +24 -24
  168. package/src/ruvocal/src/lib/components/icons/IconDazzled.svelte +40 -40
  169. package/src/ruvocal/src/lib/components/icons/IconFast.svelte +20 -20
  170. package/src/ruvocal/src/lib/components/icons/IconLoading.svelte +22 -22
  171. package/src/ruvocal/src/lib/components/icons/IconMCP.svelte +28 -28
  172. package/src/ruvocal/src/lib/components/icons/IconMoon.svelte +21 -21
  173. package/src/ruvocal/src/lib/components/icons/IconNew.svelte +20 -20
  174. package/src/ruvocal/src/lib/components/icons/IconOmni.svelte +90 -90
  175. package/src/ruvocal/src/lib/components/icons/IconPaperclip.svelte +24 -24
  176. package/src/ruvocal/src/lib/components/icons/IconPro.svelte +37 -37
  177. package/src/ruvocal/src/lib/components/icons/IconShare.svelte +21 -21
  178. package/src/ruvocal/src/lib/components/icons/IconSun.svelte +93 -93
  179. package/src/ruvocal/src/lib/components/icons/Logo.svelte +68 -68
  180. package/src/ruvocal/src/lib/components/icons/LogoHuggingFaceBorderless.svelte +54 -54
  181. package/src/ruvocal/src/lib/components/mcp/AddServerForm.svelte +250 -250
  182. package/src/ruvocal/src/lib/components/mcp/MCPServerManager.svelte +185 -185
  183. package/src/ruvocal/src/lib/components/mcp/ServerCard.svelte +203 -203
  184. package/src/ruvocal/src/lib/components/players/AudioPlayer.svelte +82 -82
  185. package/src/ruvocal/src/lib/components/voice/AudioWaveform.svelte +96 -96
  186. package/src/ruvocal/src/lib/components/wasm/GalleryPanel.svelte +357 -357
  187. package/src/ruvocal/src/lib/constants/mcpExamples.ts +114 -114
  188. package/src/ruvocal/src/lib/constants/mime.ts +11 -11
  189. package/src/ruvocal/src/lib/constants/pagination.ts +1 -1
  190. package/src/ruvocal/src/lib/constants/publicSepToken.ts +1 -1
  191. package/src/ruvocal/src/lib/constants/routerExamples.ts +133 -133
  192. package/src/ruvocal/src/lib/constants/rvagentPresets.ts +206 -206
  193. package/src/ruvocal/src/lib/createShareLink.ts +27 -27
  194. package/src/ruvocal/src/lib/jobs/refresh-conversation-stats.ts +297 -297
  195. package/src/ruvocal/src/lib/migrations/lock.ts +56 -56
  196. package/src/ruvocal/src/lib/migrations/migrations.spec.ts +74 -74
  197. package/src/ruvocal/src/lib/migrations/migrations.ts +109 -109
  198. package/src/ruvocal/src/lib/migrations/routines/01-update-search-assistants.ts +50 -50
  199. package/src/ruvocal/src/lib/migrations/routines/02-update-assistants-models.ts +48 -48
  200. package/src/ruvocal/src/lib/migrations/routines/04-update-message-updates.ts +151 -151
  201. package/src/ruvocal/src/lib/migrations/routines/05-update-message-files.ts +56 -56
  202. package/src/ruvocal/src/lib/migrations/routines/06-trim-message-updates.ts +56 -56
  203. package/src/ruvocal/src/lib/migrations/routines/08-update-featured-to-review.ts +32 -32
  204. package/src/ruvocal/src/lib/migrations/routines/09-delete-empty-conversations.spec.ts +214 -214
  205. package/src/ruvocal/src/lib/migrations/routines/09-delete-empty-conversations.ts +88 -88
  206. package/src/ruvocal/src/lib/migrations/routines/10-update-reports-assistantid.ts +29 -29
  207. package/src/ruvocal/src/lib/migrations/routines/index.ts +15 -15
  208. package/src/ruvocal/src/lib/server/__tests__/conversation-stop-generating.spec.ts +103 -103
  209. package/src/ruvocal/src/lib/server/abortRegistry.ts +57 -57
  210. package/src/ruvocal/src/lib/server/abortedGenerations.ts +43 -43
  211. package/src/ruvocal/src/lib/server/adminToken.ts +62 -62
  212. package/src/ruvocal/src/lib/server/api/__tests__/conversations-id.spec.ts +296 -296
  213. package/src/ruvocal/src/lib/server/api/__tests__/conversations-message.spec.ts +216 -216
  214. package/src/ruvocal/src/lib/server/api/__tests__/conversations.spec.ts +235 -235
  215. package/src/ruvocal/src/lib/server/api/__tests__/misc.spec.ts +72 -72
  216. package/src/ruvocal/src/lib/server/api/__tests__/testHelpers.ts +86 -86
  217. package/src/ruvocal/src/lib/server/api/__tests__/user-reports.spec.ts +78 -78
  218. package/src/ruvocal/src/lib/server/api/__tests__/user.spec.ts +239 -239
  219. package/src/ruvocal/src/lib/server/api/types.ts +37 -37
  220. package/src/ruvocal/src/lib/server/api/utils/requireAuth.ts +22 -22
  221. package/src/ruvocal/src/lib/server/api/utils/resolveConversation.ts +69 -69
  222. package/src/ruvocal/src/lib/server/api/utils/resolveModel.ts +27 -27
  223. package/src/ruvocal/src/lib/server/api/utils/superjsonResponse.ts +15 -15
  224. package/src/ruvocal/src/lib/server/apiToken.ts +11 -11
  225. package/src/ruvocal/src/lib/server/auth.ts +554 -554
  226. package/src/ruvocal/src/lib/server/config.ts +187 -187
  227. package/src/ruvocal/src/lib/server/conversation.ts +83 -83
  228. package/src/ruvocal/src/lib/server/database/__tests__/rvf.spec.ts +709 -709
  229. package/src/ruvocal/src/lib/server/database/postgres.ts +700 -700
  230. package/src/ruvocal/src/lib/server/database/rvf.ts +1078 -1078
  231. package/src/ruvocal/src/lib/server/database.ts +145 -145
  232. package/src/ruvocal/src/lib/server/endpoints/document.ts +68 -68
  233. package/src/ruvocal/src/lib/server/endpoints/endpoints.ts +43 -43
  234. package/src/ruvocal/src/lib/server/endpoints/images.ts +211 -211
  235. package/src/ruvocal/src/lib/server/endpoints/openai/endpointOai.ts +266 -266
  236. package/src/ruvocal/src/lib/server/endpoints/openai/openAIChatToTextGenerationStream.ts +212 -212
  237. package/src/ruvocal/src/lib/server/endpoints/openai/openAICompletionToTextGenerationStream.ts +32 -32
  238. package/src/ruvocal/src/lib/server/endpoints/preprocessMessages.ts +61 -61
  239. package/src/ruvocal/src/lib/server/exitHandler.ts +59 -59
  240. package/src/ruvocal/src/lib/server/files/downloadFile.ts +34 -34
  241. package/src/ruvocal/src/lib/server/files/uploadFile.ts +29 -29
  242. package/src/ruvocal/src/lib/server/findRepoRoot.ts +13 -13
  243. package/src/ruvocal/src/lib/server/generateFromDefaultEndpoint.ts +46 -46
  244. package/src/ruvocal/src/lib/server/hooks/error.ts +37 -37
  245. package/src/ruvocal/src/lib/server/hooks/fetch.ts +22 -22
  246. package/src/ruvocal/src/lib/server/hooks/handle.ts +250 -250
  247. package/src/ruvocal/src/lib/server/hooks/init.ts +51 -51
  248. package/src/ruvocal/src/lib/server/isURLLocal.spec.ts +31 -31
  249. package/src/ruvocal/src/lib/server/isURLLocal.ts +74 -74
  250. package/src/ruvocal/src/lib/server/logger.ts +42 -42
  251. package/src/ruvocal/src/lib/server/mcp/clientPool.spec.ts +175 -175
  252. package/src/ruvocal/src/lib/server/mcp/hf.ts +32 -32
  253. package/src/ruvocal/src/lib/server/mcp/httpClient.ts +122 -122
  254. package/src/ruvocal/src/lib/server/mcp/registry.ts +76 -76
  255. package/src/ruvocal/src/lib/server/mcp/tools.ts +196 -196
  256. package/src/ruvocal/src/lib/server/metrics.ts +255 -255
  257. package/src/ruvocal/src/lib/server/models.ts +518 -518
  258. package/src/ruvocal/src/lib/server/requestContext.ts +55 -55
  259. package/src/ruvocal/src/lib/server/router/arch.ts +230 -230
  260. package/src/ruvocal/src/lib/server/router/endpoint.ts +316 -316
  261. package/src/ruvocal/src/lib/server/router/multimodal.ts +28 -28
  262. package/src/ruvocal/src/lib/server/router/policy.ts +49 -49
  263. package/src/ruvocal/src/lib/server/router/toolsRoute.ts +51 -51
  264. package/src/ruvocal/src/lib/server/router/types.ts +21 -21
  265. package/src/ruvocal/src/lib/server/sendSlack.ts +23 -23
  266. package/src/ruvocal/src/lib/server/textGeneration/generate.ts +258 -258
  267. package/src/ruvocal/src/lib/server/textGeneration/index.ts +96 -96
  268. package/src/ruvocal/src/lib/server/textGeneration/mcp/fileRefs.ts +155 -155
  269. package/src/ruvocal/src/lib/server/textGeneration/mcp/routerResolution.ts +108 -108
  270. package/src/ruvocal/src/lib/server/textGeneration/mcp/runMcpFlow.ts +831 -831
  271. package/src/ruvocal/src/lib/server/textGeneration/mcp/toolInvocation.ts +349 -349
  272. package/src/ruvocal/src/lib/server/textGeneration/mcp/wasmTools.test.ts +633 -633
  273. package/src/ruvocal/src/lib/server/textGeneration/reasoning.ts +23 -23
  274. package/src/ruvocal/src/lib/server/textGeneration/title.ts +83 -83
  275. package/src/ruvocal/src/lib/server/textGeneration/types.ts +28 -28
  276. package/src/ruvocal/src/lib/server/textGeneration/utils/prepareFiles.ts +88 -88
  277. package/src/ruvocal/src/lib/server/textGeneration/utils/routing.ts +21 -21
  278. package/src/ruvocal/src/lib/server/textGeneration/utils/toolPrompt.ts +49 -49
  279. package/src/ruvocal/src/lib/server/urlSafety.ts +77 -77
  280. package/src/ruvocal/src/lib/server/usageLimits.ts +30 -30
  281. package/src/ruvocal/src/lib/stores/autopilotStore.svelte.ts +175 -175
  282. package/src/ruvocal/src/lib/stores/backgroundGenerations.svelte.ts +32 -32
  283. package/src/ruvocal/src/lib/stores/backgroundGenerations.ts +1 -1
  284. package/src/ruvocal/src/lib/stores/errors.ts +9 -9
  285. package/src/ruvocal/src/lib/stores/isAborted.ts +3 -3
  286. package/src/ruvocal/src/lib/stores/isPro.ts +4 -4
  287. package/src/ruvocal/src/lib/stores/loading.ts +3 -3
  288. package/src/ruvocal/src/lib/stores/mcpServers.ts +534 -534
  289. package/src/ruvocal/src/lib/stores/pendingChatInput.ts +3 -3
  290. package/src/ruvocal/src/lib/stores/pendingMessage.ts +9 -9
  291. package/src/ruvocal/src/lib/stores/settings.ts +182 -182
  292. package/src/ruvocal/src/lib/stores/shareModal.ts +13 -13
  293. package/src/ruvocal/src/lib/stores/titleUpdate.ts +8 -8
  294. package/src/ruvocal/src/lib/stores/wasmMcp.ts +472 -472
  295. package/src/ruvocal/src/lib/switchTheme.ts +124 -124
  296. package/src/ruvocal/src/lib/types/AbortedGeneration.ts +8 -8
  297. package/src/ruvocal/src/lib/types/Assistant.ts +31 -31
  298. package/src/ruvocal/src/lib/types/AssistantStats.ts +11 -11
  299. package/src/ruvocal/src/lib/types/ConfigKey.ts +4 -4
  300. package/src/ruvocal/src/lib/types/ConvSidebar.ts +9 -9
  301. package/src/ruvocal/src/lib/types/Conversation.ts +27 -27
  302. package/src/ruvocal/src/lib/types/ConversationStats.ts +13 -13
  303. package/src/ruvocal/src/lib/types/Message.ts +41 -41
  304. package/src/ruvocal/src/lib/types/MessageEvent.ts +10 -10
  305. package/src/ruvocal/src/lib/types/MessageUpdate.ts +139 -139
  306. package/src/ruvocal/src/lib/types/MigrationResult.ts +7 -7
  307. package/src/ruvocal/src/lib/types/Model.ts +23 -23
  308. package/src/ruvocal/src/lib/types/Report.ts +12 -12
  309. package/src/ruvocal/src/lib/types/Review.ts +6 -6
  310. package/src/ruvocal/src/lib/types/Semaphore.ts +19 -19
  311. package/src/ruvocal/src/lib/types/Session.ts +22 -22
  312. package/src/ruvocal/src/lib/types/Settings.ts +93 -93
  313. package/src/ruvocal/src/lib/types/SharedConversation.ts +9 -9
  314. package/src/ruvocal/src/lib/types/Template.ts +6 -6
  315. package/src/ruvocal/src/lib/types/Timestamps.ts +4 -4
  316. package/src/ruvocal/src/lib/types/TokenCache.ts +6 -6
  317. package/src/ruvocal/src/lib/types/Tool.ts +77 -77
  318. package/src/ruvocal/src/lib/types/UrlDependency.ts +5 -5
  319. package/src/ruvocal/src/lib/types/User.ts +14 -14
  320. package/src/ruvocal/src/lib/utils/PublicConfig.svelte.ts +75 -75
  321. package/src/ruvocal/src/lib/utils/auth.ts +17 -17
  322. package/src/ruvocal/src/lib/utils/chunk.ts +33 -33
  323. package/src/ruvocal/src/lib/utils/cookiesAreEnabled.ts +13 -13
  324. package/src/ruvocal/src/lib/utils/debounce.ts +17 -17
  325. package/src/ruvocal/src/lib/utils/deepestChild.ts +6 -6
  326. package/src/ruvocal/src/lib/utils/favicon.ts +21 -21
  327. package/src/ruvocal/src/lib/utils/fetchJSON.ts +23 -23
  328. package/src/ruvocal/src/lib/utils/file2base64.ts +14 -14
  329. package/src/ruvocal/src/lib/utils/formatUserCount.ts +37 -37
  330. package/src/ruvocal/src/lib/utils/generationState.spec.ts +75 -75
  331. package/src/ruvocal/src/lib/utils/generationState.ts +26 -26
  332. package/src/ruvocal/src/lib/utils/getHref.ts +41 -41
  333. package/src/ruvocal/src/lib/utils/getReturnFromGenerator.ts +7 -7
  334. package/src/ruvocal/src/lib/utils/haptics.ts +64 -64
  335. package/src/ruvocal/src/lib/utils/hashConv.ts +12 -12
  336. package/src/ruvocal/src/lib/utils/hf.ts +17 -17
  337. package/src/ruvocal/src/lib/utils/isDesktop.ts +7 -7
  338. package/src/ruvocal/src/lib/utils/isUrl.ts +8 -8
  339. package/src/ruvocal/src/lib/utils/isVirtualKeyboard.ts +16 -16
  340. package/src/ruvocal/src/lib/utils/loadAttachmentsFromUrls.ts +115 -115
  341. package/src/ruvocal/src/lib/utils/marked.spec.ts +96 -96
  342. package/src/ruvocal/src/lib/utils/marked.ts +531 -531
  343. package/src/ruvocal/src/lib/utils/mcpValidation.ts +147 -147
  344. package/src/ruvocal/src/lib/utils/mergeAsyncGenerators.ts +38 -38
  345. package/src/ruvocal/src/lib/utils/messageUpdates.spec.ts +262 -262
  346. package/src/ruvocal/src/lib/utils/messageUpdates.ts +324 -324
  347. package/src/ruvocal/src/lib/utils/mime.ts +56 -56
  348. package/src/ruvocal/src/lib/utils/models.ts +14 -14
  349. package/src/ruvocal/src/lib/utils/parseBlocks.ts +120 -120
  350. package/src/ruvocal/src/lib/utils/parseIncompleteMarkdown.ts +644 -644
  351. package/src/ruvocal/src/lib/utils/parseStringToList.ts +10 -10
  352. package/src/ruvocal/src/lib/utils/randomUuid.ts +14 -14
  353. package/src/ruvocal/src/lib/utils/searchTokens.ts +33 -33
  354. package/src/ruvocal/src/lib/utils/sha256.ts +7 -7
  355. package/src/ruvocal/src/lib/utils/stringifyError.ts +12 -12
  356. package/src/ruvocal/src/lib/utils/sum.ts +3 -3
  357. package/src/ruvocal/src/lib/utils/template.spec.ts +59 -59
  358. package/src/ruvocal/src/lib/utils/template.ts +53 -53
  359. package/src/ruvocal/src/lib/utils/timeout.ts +9 -9
  360. package/src/ruvocal/src/lib/utils/toolProgress.spec.ts +46 -46
  361. package/src/ruvocal/src/lib/utils/toolProgress.ts +11 -11
  362. package/src/ruvocal/src/lib/utils/tree/addChildren.spec.ts +102 -102
  363. package/src/ruvocal/src/lib/utils/tree/addChildren.ts +48 -48
  364. package/src/ruvocal/src/lib/utils/tree/addSibling.spec.ts +81 -81
  365. package/src/ruvocal/src/lib/utils/tree/addSibling.ts +41 -41
  366. package/src/ruvocal/src/lib/utils/tree/buildSubtree.spec.ts +110 -110
  367. package/src/ruvocal/src/lib/utils/tree/buildSubtree.ts +24 -24
  368. package/src/ruvocal/src/lib/utils/tree/convertLegacyConversation.spec.ts +31 -31
  369. package/src/ruvocal/src/lib/utils/tree/convertLegacyConversation.ts +36 -36
  370. package/src/ruvocal/src/lib/utils/tree/isMessageId.spec.ts +15 -15
  371. package/src/ruvocal/src/lib/utils/tree/isMessageId.ts +5 -5
  372. package/src/ruvocal/src/lib/utils/tree/tree.d.ts +14 -14
  373. package/src/ruvocal/src/lib/utils/tree/treeHelpers.spec.ts +167 -167
  374. package/src/ruvocal/src/lib/utils/updates.ts +39 -39
  375. package/src/ruvocal/src/lib/utils/urlParams.ts +13 -13
  376. package/src/ruvocal/src/lib/wasm/idb.ts +438 -438
  377. package/src/ruvocal/src/lib/wasm/index.ts +1213 -1213
  378. package/src/ruvocal/src/lib/wasm/tests/wasm-capabilities.test.ts +565 -565
  379. package/src/ruvocal/src/lib/wasm/wasm.worker.ts +332 -332
  380. package/src/ruvocal/src/lib/wasm/workerClient.ts +166 -166
  381. package/src/ruvocal/src/lib/workers/autopilotWorker.ts +221 -221
  382. package/src/ruvocal/src/lib/workers/detailFetchWorker.ts +100 -100
  383. package/src/ruvocal/src/lib/workers/markdownWorker.ts +61 -61
  384. package/src/ruvocal/src/routes/+error.svelte +20 -20
  385. package/src/ruvocal/src/routes/+layout.svelte +324 -324
  386. package/src/ruvocal/src/routes/+layout.ts +91 -91
  387. package/src/ruvocal/src/routes/+page.svelte +168 -168
  388. package/src/ruvocal/src/routes/.well-known/oauth-cimd/+server.ts +37 -37
  389. package/src/ruvocal/src/routes/__debug/openai/+server.ts +21 -21
  390. package/src/ruvocal/src/routes/admin/export/+server.ts +159 -159
  391. package/src/ruvocal/src/routes/admin/stats/compute/+server.ts +16 -16
  392. package/src/ruvocal/src/routes/api/conversation/[id]/+server.ts +40 -40
  393. package/src/ruvocal/src/routes/api/conversation/[id]/message/[messageId]/+server.ts +42 -42
  394. package/src/ruvocal/src/routes/api/conversations/+server.ts +48 -48
  395. package/src/ruvocal/src/routes/api/fetch-url/+server.ts +147 -147
  396. package/src/ruvocal/src/routes/api/mcp/health/+server.ts +292 -292
  397. package/src/ruvocal/src/routes/api/mcp/servers/+server.ts +32 -32
  398. package/src/ruvocal/src/routes/api/models/+server.ts +25 -25
  399. package/src/ruvocal/src/routes/api/transcribe/+server.ts +104 -104
  400. package/src/ruvocal/src/routes/api/user/+server.ts +15 -15
  401. package/src/ruvocal/src/routes/api/user/validate-token/+server.ts +20 -20
  402. package/src/ruvocal/src/routes/api/v2/conversations/+server.ts +48 -48
  403. package/src/ruvocal/src/routes/api/v2/conversations/[id]/+server.ts +94 -94
  404. package/src/ruvocal/src/routes/api/v2/conversations/[id]/message/[messageId]/+server.ts +43 -43
  405. package/src/ruvocal/src/routes/api/v2/conversations/import-share/+server.ts +23 -23
  406. package/src/ruvocal/src/routes/api/v2/debug/config/+server.ts +16 -16
  407. package/src/ruvocal/src/routes/api/v2/debug/refresh/+server.ts +30 -30
  408. package/src/ruvocal/src/routes/api/v2/export/+server.ts +196 -196
  409. package/src/ruvocal/src/routes/api/v2/feature-flags/+server.ts +14 -14
  410. package/src/ruvocal/src/routes/api/v2/models/+server.ts +38 -38
  411. package/src/ruvocal/src/routes/api/v2/models/[namespace]/+server.ts +8 -8
  412. package/src/ruvocal/src/routes/api/v2/models/[namespace]/[model]/+server.ts +8 -8
  413. package/src/ruvocal/src/routes/api/v2/models/[namespace]/[model]/subscribe/+server.ts +28 -28
  414. package/src/ruvocal/src/routes/api/v2/models/[namespace]/subscribe/+server.ts +28 -28
  415. package/src/ruvocal/src/routes/api/v2/models/old/+server.ts +7 -7
  416. package/src/ruvocal/src/routes/api/v2/models/refresh/+server.ts +33 -33
  417. package/src/ruvocal/src/routes/api/v2/public-config/+server.ts +7 -7
  418. package/src/ruvocal/src/routes/api/v2/user/+server.ts +17 -17
  419. package/src/ruvocal/src/routes/api/v2/user/billing-orgs/+server.ts +73 -73
  420. package/src/ruvocal/src/routes/api/v2/user/reports/+server.ts +17 -17
  421. package/src/ruvocal/src/routes/api/v2/user/settings/+server.ts +110 -110
  422. package/src/ruvocal/src/routes/conversation/+server.ts +115 -115
  423. package/src/ruvocal/src/routes/conversation/[id]/+page.svelte +586 -586
  424. package/src/ruvocal/src/routes/conversation/[id]/+page.ts +60 -60
  425. package/src/ruvocal/src/routes/conversation/[id]/+server.ts +740 -740
  426. package/src/ruvocal/src/routes/conversation/[id]/message/[messageId]/prompt/+server.ts +66 -66
  427. package/src/ruvocal/src/routes/conversation/[id]/share/+server.ts +69 -69
  428. package/src/ruvocal/src/routes/conversation/[id]/stop-generating/+server.ts +35 -35
  429. package/src/ruvocal/src/routes/healthcheck/+server.ts +3 -3
  430. package/src/ruvocal/src/routes/login/+server.ts +5 -5
  431. package/src/ruvocal/src/routes/login/callback/+server.ts +103 -103
  432. package/src/ruvocal/src/routes/login/callback/updateUser.spec.ts +157 -157
  433. package/src/ruvocal/src/routes/login/callback/updateUser.ts +215 -215
  434. package/src/ruvocal/src/routes/logout/+server.ts +18 -18
  435. package/src/ruvocal/src/routes/metrics/+server.ts +18 -18
  436. package/src/ruvocal/src/routes/models/+page.svelte +233 -233
  437. package/src/ruvocal/src/routes/models/[...model]/+page.svelte +161 -161
  438. package/src/ruvocal/src/routes/models/[...model]/+page.ts +14 -14
  439. package/src/ruvocal/src/routes/models/[...model]/thumbnail.png/+server.ts +64 -64
  440. package/src/ruvocal/src/routes/models/[...model]/thumbnail.png/ModelThumbnail.svelte +28 -28
  441. package/src/ruvocal/src/routes/privacy/+page.svelte +11 -11
  442. package/src/ruvocal/src/routes/r/[id]/+page.ts +34 -34
  443. package/src/ruvocal/src/routes/settings/(nav)/+layout.svelte +282 -282
  444. package/src/ruvocal/src/routes/settings/(nav)/+layout.ts +1 -1
  445. package/src/ruvocal/src/routes/settings/(nav)/+server.ts +59 -59
  446. package/src/ruvocal/src/routes/settings/(nav)/[...model]/+page.svelte +464 -464
  447. package/src/ruvocal/src/routes/settings/(nav)/[...model]/+page.ts +14 -14
  448. package/src/ruvocal/src/routes/settings/(nav)/application/+page.svelte +362 -362
  449. package/src/ruvocal/src/routes/settings/+layout.svelte +40 -40
  450. package/src/ruvocal/src/styles/highlight-js.css +195 -195
  451. package/src/ruvocal/src/styles/main.css +144 -144
  452. package/src/ruvocal/static/chatui/favicon-dark.svg +3 -3
  453. package/src/ruvocal/static/chatui/favicon-dev.svg +3 -3
  454. package/src/ruvocal/static/chatui/favicon.svg +3 -3
  455. package/src/ruvocal/static/chatui/icon.svg +3 -3
  456. package/src/ruvocal/static/chatui/logo.svg +7 -7
  457. package/src/ruvocal/static/chatui/manifest.json +54 -54
  458. package/src/ruvocal/static/chatui/welcome.js +184 -184
  459. package/src/ruvocal/static/huggingchat/favicon-dark.svg +4 -4
  460. package/src/ruvocal/static/huggingchat/favicon-dev.svg +4 -4
  461. package/src/ruvocal/static/huggingchat/favicon.svg +4 -4
  462. package/src/ruvocal/static/huggingchat/fulltext-logo.svg +1 -1
  463. package/src/ruvocal/static/huggingchat/icon.svg +4 -4
  464. package/src/ruvocal/static/huggingchat/logo.svg +4 -4
  465. package/src/ruvocal/static/huggingchat/manifest.json +54 -54
  466. package/src/ruvocal/static/huggingchat/routes.chat.json +226 -226
  467. package/src/ruvocal/static/robots.txt +10 -10
  468. package/src/ruvocal/static/wasm/rvagent_wasm.js +1539 -1539
  469. package/src/ruvocal/stub/@reflink/reflink/package.json +5 -5
  470. package/src/ruvocal/svelte.config.js +53 -53
  471. package/src/ruvocal/tailwind.config.cjs +30 -30
  472. package/src/ruvocal/tsconfig.json +19 -19
  473. package/src/ruvocal/vite.config.ts +87 -87
  474. package/src/scripts/deploy.sh +116 -116
  475. package/src/scripts/generate-config.js +245 -245
  476. package/src/scripts/generate-welcome.js +187 -187
  477. package/src/scripts/package-rvf.sh +116 -116
  478. package/src/ruvocal/.claude-flow/daemon-state.json +0 -135
  479. package/src/ruvocal/.claude-flow/data/pending-insights.jsonl +0 -0
  480. package/src/ruvocal/.claude-flow/data/ranked-context.json +0 -5
  481. package/src/ruvocal/.claude-flow/logs/daemon.log +0 -31
  482. package/src/ruvocal/.claude-flow/logs/headless/audit_1777949411822_juxau0_prompt.log +0 -989
  483. package/src/ruvocal/.claude-flow/logs/headless/audit_1777949411822_juxau0_result.log +0 -67
  484. package/src/ruvocal/.claude-flow/logs/headless/audit_1777950042278_jvj5xq_prompt.log +0 -989
  485. package/src/ruvocal/.claude-flow/logs/headless/audit_1777950042278_jvj5xq_result.log +0 -93
  486. package/src/ruvocal/.claude-flow/logs/headless/optimize_1777949531823_yt5yc2_prompt.log +0 -1498
  487. package/src/ruvocal/.claude-flow/logs/headless/optimize_1777949531823_yt5yc2_result.log +0 -93
  488. package/src/ruvocal/.claude-flow/logs/headless/testgaps_1777949771821_elw1j4_prompt.log +0 -1498
  489. package/src/ruvocal/.claude-flow/logs/headless/testgaps_1777949771821_elw1j4_result.log +0 -100
  490. package/src/ruvocal/.claude-flow/metrics/codebase-map.json +0 -11
  491. package/src/ruvocal/.claude-flow/metrics/consolidation.json +0 -6
  492. package/src/ruvocal/.claude-flow/neural/stats.json +0 -6
  493. package/src/ruvocal/.claude-flow/sessions/current.json +0 -13
  494. package/src/ruvocal/.env +0 -194
  495. package/src/ruvocal/.env.ci +0 -1
  496. package/src/ruvocal/.swarm/attestation.db +0 -0
  497. package/src/ruvocal/.swarm/hnsw.index +0 -0
  498. package/src/ruvocal/.swarm/hnsw.metadata.json +0 -1
  499. package/src/ruvocal/.swarm/memory.db +0 -0
  500. package/src/ruvocal/.swarm/schema.sql +0 -305
@@ -1,518 +1,518 @@
1
- import { config } from "$lib/server/config";
2
- import type { ChatTemplateInput } from "$lib/types/Template";
3
- import { z } from "zod";
4
- import endpoints, { endpointSchema, type Endpoint } from "./endpoints/endpoints";
5
-
6
- import JSON5 from "json5";
7
- import { logger } from "$lib/server/logger";
8
- import { makeRouterEndpoint } from "$lib/server/router/endpoint";
9
-
10
- type Optional<T, K extends keyof T> = Pick<Partial<T>, K> & Omit<T, K>;
11
-
12
- const sanitizeJSONEnv = (val: string, fallback: string) => {
13
- const raw = (val ?? "").trim();
14
- const unquoted = raw.startsWith("`") && raw.endsWith("`") ? raw.slice(1, -1) : raw;
15
- return unquoted || fallback;
16
- };
17
-
18
- const modelConfig = z.object({
19
- /** Used as an identifier in DB */
20
- id: z.string().optional(),
21
- /** Used to link to the model page, and for inference */
22
- name: z.string().default(""),
23
- displayName: z.string().min(1).optional(),
24
- description: z.string().min(1).optional(),
25
- logoUrl: z.string().url().optional(),
26
- websiteUrl: z.string().url().optional(),
27
- modelUrl: z.string().url().optional(),
28
- tokenizer: z.never().optional(),
29
- datasetName: z.string().min(1).optional(),
30
- datasetUrl: z.string().url().optional(),
31
- preprompt: z.string().default(""),
32
- prepromptUrl: z.string().url().optional(),
33
- chatPromptTemplate: z.never().optional(),
34
- promptExamples: z
35
- .array(
36
- z.object({
37
- title: z.string().min(1),
38
- prompt: z.string().min(1),
39
- })
40
- )
41
- .optional(),
42
- endpoints: z.array(endpointSchema).optional(),
43
- providers: z.array(z.object({ supports_tools: z.boolean().optional() }).passthrough()).optional(),
44
- parameters: z
45
- .object({
46
- temperature: z.number().min(0).max(2).optional(),
47
- truncate: z.number().int().positive().optional(),
48
- max_tokens: z.number().int().positive().optional(),
49
- stop: z.array(z.string()).optional(),
50
- top_p: z.number().positive().optional(),
51
- top_k: z.number().positive().optional(),
52
- frequency_penalty: z.number().min(-2).max(2).optional(),
53
- presence_penalty: z.number().min(-2).max(2).optional(),
54
- })
55
- .passthrough()
56
- .optional(),
57
- multimodal: z.boolean().default(false),
58
- multimodalAcceptedMimetypes: z.array(z.string()).optional(),
59
- // Aggregated tool-calling capability across providers (HF router)
60
- supportsTools: z.boolean().default(false),
61
- unlisted: z.boolean().default(false),
62
- embeddingModel: z.never().optional(),
63
- /** Used to enable/disable system prompt usage */
64
- systemRoleSupported: z.boolean().default(true),
65
- });
66
-
67
- type ModelConfig = z.infer<typeof modelConfig>;
68
-
69
- const overrideEntrySchema = modelConfig
70
- .partial()
71
- .extend({
72
- id: z.string().optional(),
73
- name: z.string().optional(),
74
- })
75
- .refine((value) => Boolean((value.id ?? value.name)?.trim()), {
76
- message: "Model override entry must provide an id or name",
77
- });
78
-
79
- type ModelOverride = z.infer<typeof overrideEntrySchema>;
80
-
81
- const openaiBaseUrl = config.OPENAI_BASE_URL
82
- ? config.OPENAI_BASE_URL.replace(/\/$/, "")
83
- : undefined;
84
- const isHFRouter = openaiBaseUrl === "https://router.huggingface.co/v1";
85
-
86
- const listSchema = z
87
- .object({
88
- data: z.array(
89
- z.object({
90
- id: z.string(),
91
- description: z.string().optional(),
92
- providers: z
93
- .array(z.object({ supports_tools: z.boolean().optional() }).passthrough())
94
- .optional(),
95
- architecture: z
96
- .object({
97
- input_modalities: z.array(z.string()).optional(),
98
- })
99
- .passthrough()
100
- .optional(),
101
- })
102
- ),
103
- })
104
- .passthrough();
105
-
106
- function getChatPromptRender(_m: ModelConfig): (inputs: ChatTemplateInput) => string {
107
- // Minimal template to support legacy "completions" flow if ever used.
108
- // We avoid any tokenizer/Jinja usage in this build.
109
- return ({ messages, preprompt }) => {
110
- const parts: string[] = [];
111
- if (preprompt) parts.push(`[SYSTEM]\n${preprompt}`);
112
- for (const msg of messages) {
113
- const role = msg.from === "assistant" ? "ASSISTANT" : msg.from.toUpperCase();
114
- parts.push(`[${role}]\n${msg.content}`);
115
- }
116
- parts.push(`[ASSISTANT]`);
117
- return parts.join("\n\n");
118
- };
119
- }
120
-
121
- const processModel = async (m: ModelConfig) => ({
122
- ...m,
123
- chatPromptRender: await getChatPromptRender(m),
124
- id: m.id || m.name,
125
- displayName: m.displayName || m.name,
126
- preprompt: m.prepromptUrl ? await fetch(m.prepromptUrl).then((r) => r.text()) : m.preprompt,
127
- parameters: { ...m.parameters, stop_sequences: m.parameters?.stop },
128
- unlisted: m.unlisted ?? false,
129
- });
130
-
131
- const addEndpoint = (m: Awaited<ReturnType<typeof processModel>>) => ({
132
- ...m,
133
- getEndpoint: async (): Promise<Endpoint> => {
134
- if (!m.endpoints || m.endpoints.length === 0) {
135
- throw new Error("No endpoints configured. This build requires OpenAI-compatible endpoints.");
136
- }
137
- // Only support OpenAI-compatible endpoints in this build
138
- const endpoint = m.endpoints[0];
139
- if (endpoint.type !== "openai") {
140
- throw new Error("Only 'openai' endpoint type is supported in this build");
141
- }
142
- return await endpoints.openai({ ...endpoint, model: m });
143
- },
144
- });
145
-
146
- type InternalProcessedModel = Awaited<ReturnType<typeof addEndpoint>> & {
147
- isRouter: boolean;
148
- hasInferenceAPI: boolean;
149
- };
150
-
151
- const inferenceApiIds: string[] = [];
152
-
153
- const getModelOverrides = (): ModelOverride[] => {
154
- const overridesEnv = (Reflect.get(config, "MODELS") as string | undefined) ?? "";
155
-
156
- if (!overridesEnv.trim()) {
157
- return [];
158
- }
159
-
160
- try {
161
- return z.array(overrideEntrySchema).parse(JSON5.parse(sanitizeJSONEnv(overridesEnv, "[]")));
162
- } catch (error) {
163
- logger.error(error, "[models] Failed to parse MODELS overrides");
164
- return [];
165
- }
166
- };
167
-
168
- export type ModelsRefreshSummary = {
169
- refreshedAt: Date;
170
- durationMs: number;
171
- added: string[];
172
- removed: string[];
173
- changed: string[];
174
- total: number;
175
- };
176
-
177
- export type ProcessedModel = InternalProcessedModel;
178
-
179
- export let models: ProcessedModel[] = [];
180
- export let defaultModel!: ProcessedModel;
181
- export let taskModel!: ProcessedModel;
182
- export let validModelIdSchema: z.ZodType<string> = z.string();
183
- export let lastModelRefresh = new Date(0);
184
- export let lastModelRefreshDurationMs = 0;
185
- export let lastModelRefreshSummary: ModelsRefreshSummary = {
186
- refreshedAt: new Date(0),
187
- durationMs: 0,
188
- added: [],
189
- removed: [],
190
- changed: [],
191
- total: 0,
192
- };
193
-
194
- let inflightRefresh: Promise<ModelsRefreshSummary> | null = null;
195
-
196
- const createValidModelIdSchema = (modelList: ProcessedModel[]): z.ZodType<string> => {
197
- if (modelList.length === 0) {
198
- throw new Error("No models available to build validation schema");
199
- }
200
- const ids = new Set(modelList.map((m) => m.id));
201
- return z.string().refine((value) => ids.has(value), "Invalid model id");
202
- };
203
-
204
- const resolveTaskModel = (modelList: ProcessedModel[]) => {
205
- if (modelList.length === 0) {
206
- throw new Error("No models available to select task model");
207
- }
208
-
209
- if (config.TASK_MODEL) {
210
- const preferred = modelList.find(
211
- (m) => m.name === config.TASK_MODEL || m.id === config.TASK_MODEL
212
- );
213
- if (preferred) {
214
- return preferred;
215
- }
216
- }
217
-
218
- return modelList[0];
219
- };
220
-
221
- const signatureForModel = (model: ProcessedModel) =>
222
- JSON.stringify({
223
- description: model.description,
224
- displayName: model.displayName,
225
- providers: model.providers,
226
- parameters: model.parameters,
227
- preprompt: model.preprompt,
228
- prepromptUrl: model.prepromptUrl,
229
- endpoints:
230
- model.endpoints?.map((endpoint) => {
231
- if (endpoint.type === "openai") {
232
- const { type, baseURL } = endpoint;
233
- return { type, baseURL };
234
- }
235
- return { type: endpoint.type };
236
- }) ?? null,
237
- multimodal: model.multimodal,
238
- multimodalAcceptedMimetypes: model.multimodalAcceptedMimetypes,
239
- supportsTools: (model as unknown as { supportsTools?: boolean }).supportsTools ?? false,
240
- isRouter: model.isRouter,
241
- hasInferenceAPI: model.hasInferenceAPI,
242
- });
243
-
244
- const applyModelState = (newModels: ProcessedModel[], startedAt: number): ModelsRefreshSummary => {
245
- if (newModels.length === 0) {
246
- throw new Error("Failed to load any models from upstream");
247
- }
248
-
249
- const previousIds = new Set(models.map((m) => m.id));
250
- const previousSignatures = new Map(models.map((m) => [m.id, signatureForModel(m)]));
251
- const refreshedAt = new Date();
252
- const durationMs = Date.now() - startedAt;
253
-
254
- models = newModels;
255
- defaultModel = models[0];
256
- taskModel = resolveTaskModel(models);
257
- validModelIdSchema = createValidModelIdSchema(models);
258
- lastModelRefresh = refreshedAt;
259
- lastModelRefreshDurationMs = durationMs;
260
-
261
- const added = newModels.map((m) => m.id).filter((id) => !previousIds.has(id));
262
- const removed = Array.from(previousIds).filter(
263
- (id) => !newModels.some((model) => model.id === id)
264
- );
265
- const changed = newModels
266
- .filter((model) => {
267
- const previousSignature = previousSignatures.get(model.id);
268
- return previousSignature !== undefined && previousSignature !== signatureForModel(model);
269
- })
270
- .map((model) => model.id);
271
-
272
- const summary: ModelsRefreshSummary = {
273
- refreshedAt,
274
- durationMs,
275
- added,
276
- removed,
277
- changed,
278
- total: models.length,
279
- };
280
-
281
- lastModelRefreshSummary = summary;
282
-
283
- logger.info(
284
- {
285
- total: summary.total,
286
- added: summary.added,
287
- removed: summary.removed,
288
- changed: summary.changed,
289
- durationMs: summary.durationMs,
290
- },
291
- "[models] Model cache refreshed"
292
- );
293
-
294
- return summary;
295
- };
296
-
297
- const buildModels = async (): Promise<ProcessedModel[]> => {
298
- if (!openaiBaseUrl) {
299
- logger.error(
300
- "OPENAI_BASE_URL is required. Set it to an OpenAI-compatible base (e.g., https://router.huggingface.co/v1)."
301
- );
302
- throw new Error("OPENAI_BASE_URL not set");
303
- }
304
-
305
- try {
306
- const baseURL = openaiBaseUrl;
307
- logger.info({ baseURL }, "[models] Using OpenAI-compatible base URL");
308
-
309
- // Canonical auth token is OPENAI_API_KEY; keep HF_TOKEN as legacy alias
310
- const authToken = config.OPENAI_API_KEY || config.HF_TOKEN;
311
-
312
- // Use auth token from the start if available to avoid rate limiting issues
313
- // Some APIs rate-limit unauthenticated requests more aggressively
314
- const response = await fetch(`${baseURL}/models`, {
315
- headers: authToken ? { Authorization: `Bearer ${authToken}` } : undefined,
316
- });
317
- logger.info({ status: response.status }, "[models] First fetch status");
318
- if (!response.ok && response.status === 401 && !authToken) {
319
- // If we get 401 and didn't have a token, there's nothing we can do
320
- throw new Error(
321
- `Failed to fetch ${baseURL}/models: ${response.status} ${response.statusText} (no auth token available)`
322
- );
323
- }
324
- if (!response.ok) {
325
- throw new Error(
326
- `Failed to fetch ${baseURL}/models: ${response.status} ${response.statusText}`
327
- );
328
- }
329
- const json = await response.json();
330
- logger.info({ keys: Object.keys(json || {}) }, "[models] Response keys");
331
-
332
- const parsed = listSchema.parse(json);
333
- logger.info({ count: parsed.data.length }, "[models] Parsed models count");
334
-
335
- let modelsRaw = parsed.data.map((m) => {
336
- let logoUrl: string | undefined = undefined;
337
- if (isHFRouter && m.id.includes("/")) {
338
- const org = m.id.split("/")[0];
339
- logoUrl = `https://huggingface.co/api/avatars/${encodeURIComponent(org)}`;
340
- }
341
-
342
- const inputModalities = (m.architecture?.input_modalities ?? []).map((modality) =>
343
- modality.toLowerCase()
344
- );
345
- const supportsImageInput =
346
- inputModalities.includes("image") || inputModalities.includes("vision");
347
-
348
- // If any provider supports tools, consider the model as supporting tools
349
- const supportsTools = Boolean((m.providers ?? []).some((p) => p?.supports_tools === true));
350
- return {
351
- id: m.id,
352
- name: m.id,
353
- displayName: m.id,
354
- description: m.description,
355
- logoUrl,
356
- providers: m.providers,
357
- multimodal: supportsImageInput,
358
- multimodalAcceptedMimetypes: supportsImageInput ? ["image/*"] : undefined,
359
- supportsTools,
360
- endpoints: [
361
- {
362
- type: "openai" as const,
363
- baseURL,
364
- // apiKey will be taken from OPENAI_API_KEY or HF_TOKEN automatically
365
- },
366
- ],
367
- } as ModelConfig;
368
- }) as ModelConfig[];
369
-
370
- const overrides = getModelOverrides();
371
-
372
- if (overrides.length) {
373
- const overrideMap = new Map<string, ModelOverride>();
374
- for (const override of overrides) {
375
- for (const key of [override.id, override.name]) {
376
- const trimmed = key?.trim();
377
- if (trimmed) overrideMap.set(trimmed, override);
378
- }
379
- }
380
-
381
- // Filter to only configured models and apply overrides, preserving MODELS order
382
- const filteredAndOrdered: ModelConfig[] = [];
383
- for (const override of overrides) {
384
- const matchKey = override.name?.trim() || override.id?.trim() || "";
385
- const found = modelsRaw.find(
386
- (model) => model.id === matchKey || model.name === matchKey
387
- );
388
- if (found) {
389
- const { id, name, ...rest } = override;
390
- void id;
391
- void name;
392
- filteredAndOrdered.push({ ...found, ...rest });
393
- }
394
- }
395
-
396
- // If we matched at least one, use filtered list; otherwise fall back to all models with overrides
397
- if (filteredAndOrdered.length > 0) {
398
- modelsRaw = filteredAndOrdered;
399
- } else {
400
- modelsRaw = modelsRaw.map((model) => {
401
- const override = overrideMap.get(model.id ?? "") ?? overrideMap.get(model.name ?? "");
402
- if (!override) return model;
403
-
404
- const { id, name, ...rest } = override;
405
- void id;
406
- void name;
407
-
408
- return {
409
- ...model,
410
- ...rest,
411
- };
412
- });
413
- }
414
- }
415
-
416
- const builtModels = await Promise.all(
417
- modelsRaw.map((e) =>
418
- processModel(e)
419
- .then(addEndpoint)
420
- .then(async (m) => ({
421
- ...m,
422
- hasInferenceAPI: inferenceApiIds.includes(m.id ?? m.name),
423
- // router decoration added later
424
- isRouter: false as boolean,
425
- }))
426
- )
427
- );
428
-
429
- const archBase = (config.LLM_ROUTER_ARCH_BASE_URL || "").trim();
430
- const routerLabel = (config.PUBLIC_LLM_ROUTER_DISPLAY_NAME || "Omni").trim() || "Omni";
431
- const routerLogo = (config.PUBLIC_LLM_ROUTER_LOGO_URL || "").trim();
432
- const routerAliasId = (config.PUBLIC_LLM_ROUTER_ALIAS_ID || "omni").trim() || "omni";
433
- const routerMultimodalEnabled =
434
- (config.LLM_ROUTER_ENABLE_MULTIMODAL || "").toLowerCase() === "true";
435
- const routerToolsEnabled = (config.LLM_ROUTER_ENABLE_TOOLS || "").toLowerCase() === "true";
436
-
437
- let decorated = builtModels as ProcessedModel[];
438
-
439
- if (archBase) {
440
- // Build a minimal model config for the alias
441
- const aliasRaw = {
442
- id: routerAliasId,
443
- name: routerAliasId,
444
- displayName: routerLabel,
445
- description: "Automatically routes your messages to the best model for your request.",
446
- logoUrl: routerLogo || undefined,
447
- preprompt: "",
448
- endpoints: [
449
- {
450
- type: "openai" as const,
451
- baseURL: openaiBaseUrl,
452
- },
453
- ],
454
- // Keep the alias visible
455
- unlisted: false,
456
- } as ModelConfig;
457
-
458
- if (routerMultimodalEnabled) {
459
- aliasRaw.multimodal = true;
460
- aliasRaw.multimodalAcceptedMimetypes = ["image/*"];
461
- }
462
-
463
- if (routerToolsEnabled) {
464
- aliasRaw.supportsTools = true;
465
- }
466
-
467
- const aliasBase = await processModel(aliasRaw);
468
- // Create a self-referential ProcessedModel for the router endpoint
469
- const aliasModel: ProcessedModel = {
470
- ...aliasBase,
471
- isRouter: true,
472
- hasInferenceAPI: false,
473
- // getEndpoint uses the router wrapper regardless of the endpoints array
474
- getEndpoint: async (): Promise<Endpoint> => makeRouterEndpoint(aliasModel),
475
- } as ProcessedModel;
476
-
477
- // Put alias first
478
- decorated = [aliasModel, ...decorated];
479
- }
480
-
481
- return decorated;
482
- } catch (e) {
483
- logger.error(e, "Failed to load models from OpenAI base URL");
484
- throw e;
485
- }
486
- };
487
-
488
- const rebuildModels = async (): Promise<ModelsRefreshSummary> => {
489
- const startedAt = Date.now();
490
- const newModels = await buildModels();
491
- return applyModelState(newModels, startedAt);
492
- };
493
-
494
- await rebuildModels();
495
-
496
- export const refreshModels = async (): Promise<ModelsRefreshSummary> => {
497
- if (inflightRefresh) {
498
- return inflightRefresh;
499
- }
500
-
501
- inflightRefresh = rebuildModels().finally(() => {
502
- inflightRefresh = null;
503
- });
504
-
505
- return inflightRefresh;
506
- };
507
-
508
- export const validateModel = (_models: BackendModel[]) => {
509
- // Zod enum function requires 2 parameters
510
- return z.enum([_models[0].id, ..._models.slice(1).map((m) => m.id)]);
511
- };
512
-
513
- // if `TASK_MODEL` is string & name of a model in `MODELS`, then we use `MODELS[TASK_MODEL]`, else we try to parse `TASK_MODEL` as a model config itself
514
-
515
- export type BackendModel = Optional<
516
- typeof defaultModel,
517
- "preprompt" | "parameters" | "multimodal" | "unlisted" | "hasInferenceAPI"
518
- >;
1
+ import { config } from "$lib/server/config";
2
+ import type { ChatTemplateInput } from "$lib/types/Template";
3
+ import { z } from "zod";
4
+ import endpoints, { endpointSchema, type Endpoint } from "./endpoints/endpoints";
5
+
6
+ import JSON5 from "json5";
7
+ import { logger } from "$lib/server/logger";
8
+ import { makeRouterEndpoint } from "$lib/server/router/endpoint";
9
+
10
+ type Optional<T, K extends keyof T> = Pick<Partial<T>, K> & Omit<T, K>;
11
+
12
+ const sanitizeJSONEnv = (val: string, fallback: string) => {
13
+ const raw = (val ?? "").trim();
14
+ const unquoted = raw.startsWith("`") && raw.endsWith("`") ? raw.slice(1, -1) : raw;
15
+ return unquoted || fallback;
16
+ };
17
+
18
+ const modelConfig = z.object({
19
+ /** Used as an identifier in DB */
20
+ id: z.string().optional(),
21
+ /** Used to link to the model page, and for inference */
22
+ name: z.string().default(""),
23
+ displayName: z.string().min(1).optional(),
24
+ description: z.string().min(1).optional(),
25
+ logoUrl: z.string().url().optional(),
26
+ websiteUrl: z.string().url().optional(),
27
+ modelUrl: z.string().url().optional(),
28
+ tokenizer: z.never().optional(),
29
+ datasetName: z.string().min(1).optional(),
30
+ datasetUrl: z.string().url().optional(),
31
+ preprompt: z.string().default(""),
32
+ prepromptUrl: z.string().url().optional(),
33
+ chatPromptTemplate: z.never().optional(),
34
+ promptExamples: z
35
+ .array(
36
+ z.object({
37
+ title: z.string().min(1),
38
+ prompt: z.string().min(1),
39
+ })
40
+ )
41
+ .optional(),
42
+ endpoints: z.array(endpointSchema).optional(),
43
+ providers: z.array(z.object({ supports_tools: z.boolean().optional() }).passthrough()).optional(),
44
+ parameters: z
45
+ .object({
46
+ temperature: z.number().min(0).max(2).optional(),
47
+ truncate: z.number().int().positive().optional(),
48
+ max_tokens: z.number().int().positive().optional(),
49
+ stop: z.array(z.string()).optional(),
50
+ top_p: z.number().positive().optional(),
51
+ top_k: z.number().positive().optional(),
52
+ frequency_penalty: z.number().min(-2).max(2).optional(),
53
+ presence_penalty: z.number().min(-2).max(2).optional(),
54
+ })
55
+ .passthrough()
56
+ .optional(),
57
+ multimodal: z.boolean().default(false),
58
+ multimodalAcceptedMimetypes: z.array(z.string()).optional(),
59
+ // Aggregated tool-calling capability across providers (HF router)
60
+ supportsTools: z.boolean().default(false),
61
+ unlisted: z.boolean().default(false),
62
+ embeddingModel: z.never().optional(),
63
+ /** Used to enable/disable system prompt usage */
64
+ systemRoleSupported: z.boolean().default(true),
65
+ });
66
+
67
+ type ModelConfig = z.infer<typeof modelConfig>;
68
+
69
+ const overrideEntrySchema = modelConfig
70
+ .partial()
71
+ .extend({
72
+ id: z.string().optional(),
73
+ name: z.string().optional(),
74
+ })
75
+ .refine((value) => Boolean((value.id ?? value.name)?.trim()), {
76
+ message: "Model override entry must provide an id or name",
77
+ });
78
+
79
+ type ModelOverride = z.infer<typeof overrideEntrySchema>;
80
+
81
+ const openaiBaseUrl = config.OPENAI_BASE_URL
82
+ ? config.OPENAI_BASE_URL.replace(/\/$/, "")
83
+ : undefined;
84
+ const isHFRouter = openaiBaseUrl === "https://router.huggingface.co/v1";
85
+
86
+ const listSchema = z
87
+ .object({
88
+ data: z.array(
89
+ z.object({
90
+ id: z.string(),
91
+ description: z.string().optional(),
92
+ providers: z
93
+ .array(z.object({ supports_tools: z.boolean().optional() }).passthrough())
94
+ .optional(),
95
+ architecture: z
96
+ .object({
97
+ input_modalities: z.array(z.string()).optional(),
98
+ })
99
+ .passthrough()
100
+ .optional(),
101
+ })
102
+ ),
103
+ })
104
+ .passthrough();
105
+
106
+ function getChatPromptRender(_m: ModelConfig): (inputs: ChatTemplateInput) => string {
107
+ // Minimal template to support legacy "completions" flow if ever used.
108
+ // We avoid any tokenizer/Jinja usage in this build.
109
+ return ({ messages, preprompt }) => {
110
+ const parts: string[] = [];
111
+ if (preprompt) parts.push(`[SYSTEM]\n${preprompt}`);
112
+ for (const msg of messages) {
113
+ const role = msg.from === "assistant" ? "ASSISTANT" : msg.from.toUpperCase();
114
+ parts.push(`[${role}]\n${msg.content}`);
115
+ }
116
+ parts.push(`[ASSISTANT]`);
117
+ return parts.join("\n\n");
118
+ };
119
+ }
120
+
121
+ const processModel = async (m: ModelConfig) => ({
122
+ ...m,
123
+ chatPromptRender: await getChatPromptRender(m),
124
+ id: m.id || m.name,
125
+ displayName: m.displayName || m.name,
126
+ preprompt: m.prepromptUrl ? await fetch(m.prepromptUrl).then((r) => r.text()) : m.preprompt,
127
+ parameters: { ...m.parameters, stop_sequences: m.parameters?.stop },
128
+ unlisted: m.unlisted ?? false,
129
+ });
130
+
131
+ const addEndpoint = (m: Awaited<ReturnType<typeof processModel>>) => ({
132
+ ...m,
133
+ getEndpoint: async (): Promise<Endpoint> => {
134
+ if (!m.endpoints || m.endpoints.length === 0) {
135
+ throw new Error("No endpoints configured. This build requires OpenAI-compatible endpoints.");
136
+ }
137
+ // Only support OpenAI-compatible endpoints in this build
138
+ const endpoint = m.endpoints[0];
139
+ if (endpoint.type !== "openai") {
140
+ throw new Error("Only 'openai' endpoint type is supported in this build");
141
+ }
142
+ return await endpoints.openai({ ...endpoint, model: m });
143
+ },
144
+ });
145
+
146
+ type InternalProcessedModel = Awaited<ReturnType<typeof addEndpoint>> & {
147
+ isRouter: boolean;
148
+ hasInferenceAPI: boolean;
149
+ };
150
+
151
+ const inferenceApiIds: string[] = [];
152
+
153
+ const getModelOverrides = (): ModelOverride[] => {
154
+ const overridesEnv = (Reflect.get(config, "MODELS") as string | undefined) ?? "";
155
+
156
+ if (!overridesEnv.trim()) {
157
+ return [];
158
+ }
159
+
160
+ try {
161
+ return z.array(overrideEntrySchema).parse(JSON5.parse(sanitizeJSONEnv(overridesEnv, "[]")));
162
+ } catch (error) {
163
+ logger.error(error, "[models] Failed to parse MODELS overrides");
164
+ return [];
165
+ }
166
+ };
167
+
168
+ export type ModelsRefreshSummary = {
169
+ refreshedAt: Date;
170
+ durationMs: number;
171
+ added: string[];
172
+ removed: string[];
173
+ changed: string[];
174
+ total: number;
175
+ };
176
+
177
+ export type ProcessedModel = InternalProcessedModel;
178
+
179
+ export let models: ProcessedModel[] = [];
180
+ export let defaultModel!: ProcessedModel;
181
+ export let taskModel!: ProcessedModel;
182
+ export let validModelIdSchema: z.ZodType<string> = z.string();
183
+ export let lastModelRefresh = new Date(0);
184
+ export let lastModelRefreshDurationMs = 0;
185
+ export let lastModelRefreshSummary: ModelsRefreshSummary = {
186
+ refreshedAt: new Date(0),
187
+ durationMs: 0,
188
+ added: [],
189
+ removed: [],
190
+ changed: [],
191
+ total: 0,
192
+ };
193
+
194
+ let inflightRefresh: Promise<ModelsRefreshSummary> | null = null;
195
+
196
+ const createValidModelIdSchema = (modelList: ProcessedModel[]): z.ZodType<string> => {
197
+ if (modelList.length === 0) {
198
+ throw new Error("No models available to build validation schema");
199
+ }
200
+ const ids = new Set(modelList.map((m) => m.id));
201
+ return z.string().refine((value) => ids.has(value), "Invalid model id");
202
+ };
203
+
204
+ const resolveTaskModel = (modelList: ProcessedModel[]) => {
205
+ if (modelList.length === 0) {
206
+ throw new Error("No models available to select task model");
207
+ }
208
+
209
+ if (config.TASK_MODEL) {
210
+ const preferred = modelList.find(
211
+ (m) => m.name === config.TASK_MODEL || m.id === config.TASK_MODEL
212
+ );
213
+ if (preferred) {
214
+ return preferred;
215
+ }
216
+ }
217
+
218
+ return modelList[0];
219
+ };
220
+
221
+ const signatureForModel = (model: ProcessedModel) =>
222
+ JSON.stringify({
223
+ description: model.description,
224
+ displayName: model.displayName,
225
+ providers: model.providers,
226
+ parameters: model.parameters,
227
+ preprompt: model.preprompt,
228
+ prepromptUrl: model.prepromptUrl,
229
+ endpoints:
230
+ model.endpoints?.map((endpoint) => {
231
+ if (endpoint.type === "openai") {
232
+ const { type, baseURL } = endpoint;
233
+ return { type, baseURL };
234
+ }
235
+ return { type: endpoint.type };
236
+ }) ?? null,
237
+ multimodal: model.multimodal,
238
+ multimodalAcceptedMimetypes: model.multimodalAcceptedMimetypes,
239
+ supportsTools: (model as unknown as { supportsTools?: boolean }).supportsTools ?? false,
240
+ isRouter: model.isRouter,
241
+ hasInferenceAPI: model.hasInferenceAPI,
242
+ });
243
+
244
+ const applyModelState = (newModels: ProcessedModel[], startedAt: number): ModelsRefreshSummary => {
245
+ if (newModels.length === 0) {
246
+ throw new Error("Failed to load any models from upstream");
247
+ }
248
+
249
+ const previousIds = new Set(models.map((m) => m.id));
250
+ const previousSignatures = new Map(models.map((m) => [m.id, signatureForModel(m)]));
251
+ const refreshedAt = new Date();
252
+ const durationMs = Date.now() - startedAt;
253
+
254
+ models = newModels;
255
+ defaultModel = models[0];
256
+ taskModel = resolveTaskModel(models);
257
+ validModelIdSchema = createValidModelIdSchema(models);
258
+ lastModelRefresh = refreshedAt;
259
+ lastModelRefreshDurationMs = durationMs;
260
+
261
+ const added = newModels.map((m) => m.id).filter((id) => !previousIds.has(id));
262
+ const removed = Array.from(previousIds).filter(
263
+ (id) => !newModels.some((model) => model.id === id)
264
+ );
265
+ const changed = newModels
266
+ .filter((model) => {
267
+ const previousSignature = previousSignatures.get(model.id);
268
+ return previousSignature !== undefined && previousSignature !== signatureForModel(model);
269
+ })
270
+ .map((model) => model.id);
271
+
272
+ const summary: ModelsRefreshSummary = {
273
+ refreshedAt,
274
+ durationMs,
275
+ added,
276
+ removed,
277
+ changed,
278
+ total: models.length,
279
+ };
280
+
281
+ lastModelRefreshSummary = summary;
282
+
283
+ logger.info(
284
+ {
285
+ total: summary.total,
286
+ added: summary.added,
287
+ removed: summary.removed,
288
+ changed: summary.changed,
289
+ durationMs: summary.durationMs,
290
+ },
291
+ "[models] Model cache refreshed"
292
+ );
293
+
294
+ return summary;
295
+ };
296
+
297
+ const buildModels = async (): Promise<ProcessedModel[]> => {
298
+ if (!openaiBaseUrl) {
299
+ logger.error(
300
+ "OPENAI_BASE_URL is required. Set it to an OpenAI-compatible base (e.g., https://router.huggingface.co/v1)."
301
+ );
302
+ throw new Error("OPENAI_BASE_URL not set");
303
+ }
304
+
305
+ try {
306
+ const baseURL = openaiBaseUrl;
307
+ logger.info({ baseURL }, "[models] Using OpenAI-compatible base URL");
308
+
309
+ // Canonical auth token is OPENAI_API_KEY; keep HF_TOKEN as legacy alias
310
+ const authToken = config.OPENAI_API_KEY || config.HF_TOKEN;
311
+
312
+ // Use auth token from the start if available to avoid rate limiting issues
313
+ // Some APIs rate-limit unauthenticated requests more aggressively
314
+ const response = await fetch(`${baseURL}/models`, {
315
+ headers: authToken ? { Authorization: `Bearer ${authToken}` } : undefined,
316
+ });
317
+ logger.info({ status: response.status }, "[models] First fetch status");
318
+ if (!response.ok && response.status === 401 && !authToken) {
319
+ // If we get 401 and didn't have a token, there's nothing we can do
320
+ throw new Error(
321
+ `Failed to fetch ${baseURL}/models: ${response.status} ${response.statusText} (no auth token available)`
322
+ );
323
+ }
324
+ if (!response.ok) {
325
+ throw new Error(
326
+ `Failed to fetch ${baseURL}/models: ${response.status} ${response.statusText}`
327
+ );
328
+ }
329
+ const json = await response.json();
330
+ logger.info({ keys: Object.keys(json || {}) }, "[models] Response keys");
331
+
332
+ const parsed = listSchema.parse(json);
333
+ logger.info({ count: parsed.data.length }, "[models] Parsed models count");
334
+
335
+ let modelsRaw = parsed.data.map((m) => {
336
+ let logoUrl: string | undefined = undefined;
337
+ if (isHFRouter && m.id.includes("/")) {
338
+ const org = m.id.split("/")[0];
339
+ logoUrl = `https://huggingface.co/api/avatars/${encodeURIComponent(org)}`;
340
+ }
341
+
342
+ const inputModalities = (m.architecture?.input_modalities ?? []).map((modality) =>
343
+ modality.toLowerCase()
344
+ );
345
+ const supportsImageInput =
346
+ inputModalities.includes("image") || inputModalities.includes("vision");
347
+
348
+ // If any provider supports tools, consider the model as supporting tools
349
+ const supportsTools = Boolean((m.providers ?? []).some((p) => p?.supports_tools === true));
350
+ return {
351
+ id: m.id,
352
+ name: m.id,
353
+ displayName: m.id,
354
+ description: m.description,
355
+ logoUrl,
356
+ providers: m.providers,
357
+ multimodal: supportsImageInput,
358
+ multimodalAcceptedMimetypes: supportsImageInput ? ["image/*"] : undefined,
359
+ supportsTools,
360
+ endpoints: [
361
+ {
362
+ type: "openai" as const,
363
+ baseURL,
364
+ // apiKey will be taken from OPENAI_API_KEY or HF_TOKEN automatically
365
+ },
366
+ ],
367
+ } as ModelConfig;
368
+ }) as ModelConfig[];
369
+
370
+ const overrides = getModelOverrides();
371
+
372
+ if (overrides.length) {
373
+ const overrideMap = new Map<string, ModelOverride>();
374
+ for (const override of overrides) {
375
+ for (const key of [override.id, override.name]) {
376
+ const trimmed = key?.trim();
377
+ if (trimmed) overrideMap.set(trimmed, override);
378
+ }
379
+ }
380
+
381
+ // Filter to only configured models and apply overrides, preserving MODELS order
382
+ const filteredAndOrdered: ModelConfig[] = [];
383
+ for (const override of overrides) {
384
+ const matchKey = override.name?.trim() || override.id?.trim() || "";
385
+ const found = modelsRaw.find(
386
+ (model) => model.id === matchKey || model.name === matchKey
387
+ );
388
+ if (found) {
389
+ const { id, name, ...rest } = override;
390
+ void id;
391
+ void name;
392
+ filteredAndOrdered.push({ ...found, ...rest });
393
+ }
394
+ }
395
+
396
+ // If we matched at least one, use filtered list; otherwise fall back to all models with overrides
397
+ if (filteredAndOrdered.length > 0) {
398
+ modelsRaw = filteredAndOrdered;
399
+ } else {
400
+ modelsRaw = modelsRaw.map((model) => {
401
+ const override = overrideMap.get(model.id ?? "") ?? overrideMap.get(model.name ?? "");
402
+ if (!override) return model;
403
+
404
+ const { id, name, ...rest } = override;
405
+ void id;
406
+ void name;
407
+
408
+ return {
409
+ ...model,
410
+ ...rest,
411
+ };
412
+ });
413
+ }
414
+ }
415
+
416
+ const builtModels = await Promise.all(
417
+ modelsRaw.map((e) =>
418
+ processModel(e)
419
+ .then(addEndpoint)
420
+ .then(async (m) => ({
421
+ ...m,
422
+ hasInferenceAPI: inferenceApiIds.includes(m.id ?? m.name),
423
+ // router decoration added later
424
+ isRouter: false as boolean,
425
+ }))
426
+ )
427
+ );
428
+
429
+ const archBase = (config.LLM_ROUTER_ARCH_BASE_URL || "").trim();
430
+ const routerLabel = (config.PUBLIC_LLM_ROUTER_DISPLAY_NAME || "Omni").trim() || "Omni";
431
+ const routerLogo = (config.PUBLIC_LLM_ROUTER_LOGO_URL || "").trim();
432
+ const routerAliasId = (config.PUBLIC_LLM_ROUTER_ALIAS_ID || "omni").trim() || "omni";
433
+ const routerMultimodalEnabled =
434
+ (config.LLM_ROUTER_ENABLE_MULTIMODAL || "").toLowerCase() === "true";
435
+ const routerToolsEnabled = (config.LLM_ROUTER_ENABLE_TOOLS || "").toLowerCase() === "true";
436
+
437
+ let decorated = builtModels as ProcessedModel[];
438
+
439
+ if (archBase) {
440
+ // Build a minimal model config for the alias
441
+ const aliasRaw = {
442
+ id: routerAliasId,
443
+ name: routerAliasId,
444
+ displayName: routerLabel,
445
+ description: "Automatically routes your messages to the best model for your request.",
446
+ logoUrl: routerLogo || undefined,
447
+ preprompt: "",
448
+ endpoints: [
449
+ {
450
+ type: "openai" as const,
451
+ baseURL: openaiBaseUrl,
452
+ },
453
+ ],
454
+ // Keep the alias visible
455
+ unlisted: false,
456
+ } as ModelConfig;
457
+
458
+ if (routerMultimodalEnabled) {
459
+ aliasRaw.multimodal = true;
460
+ aliasRaw.multimodalAcceptedMimetypes = ["image/*"];
461
+ }
462
+
463
+ if (routerToolsEnabled) {
464
+ aliasRaw.supportsTools = true;
465
+ }
466
+
467
+ const aliasBase = await processModel(aliasRaw);
468
+ // Create a self-referential ProcessedModel for the router endpoint
469
+ const aliasModel: ProcessedModel = {
470
+ ...aliasBase,
471
+ isRouter: true,
472
+ hasInferenceAPI: false,
473
+ // getEndpoint uses the router wrapper regardless of the endpoints array
474
+ getEndpoint: async (): Promise<Endpoint> => makeRouterEndpoint(aliasModel),
475
+ } as ProcessedModel;
476
+
477
+ // Put alias first
478
+ decorated = [aliasModel, ...decorated];
479
+ }
480
+
481
+ return decorated;
482
+ } catch (e) {
483
+ logger.error(e, "Failed to load models from OpenAI base URL");
484
+ throw e;
485
+ }
486
+ };
487
+
488
/**
 * Runs one complete rebuild of the model list.
 *
 * A timestamp is taken first, then `buildModels` is awaited, and the resulting
 * list is handed to `applyModelState` together with that timestamp.
 *
 * @returns Whatever `applyModelState` returns for the freshly built list.
 */
const rebuildModels = async (): Promise<ModelsRefreshSummary> => {
	// Taken before the build starts, so the value passed on predates all async work.
	const refreshStart = Date.now();
	return applyModelState(await buildModels(), refreshStart);
};

// Initial build: awaited at module top level, so evaluation of this module
// does not continue past this point until the first rebuild has settled.
await rebuildModels();
495
+
496
/**
 * Rebuilds the model list, sharing a single in-flight rebuild between callers.
 *
 * If a rebuild is already running, its promise is returned instead of starting
 * another one. Otherwise a new rebuild is started and remembered in
 * `inflightRefresh` until it settles (fulfilled or rejected), after which the
 * slot is reset to `null` so the next call starts a fresh rebuild.
 *
 * @returns The summary of the rebuild this call started or joined.
 */
export const refreshModels = async (): Promise<ModelsRefreshSummary> => {
	if (!inflightRefresh) {
		// `finally` clears the slot on success and on failure alike.
		const pending = rebuildModels().finally(() => {
			inflightRefresh = null;
		});
		inflightRefresh = pending;
		return pending;
	}

	return inflightRefresh;
};
507
+
508
/**
 * Builds a Zod enum schema whose allowed values are the ids of the given models.
 *
 * @param _models - Models whose `id` values become the enum members; must contain
 *   at least one entry.
 * @returns A Zod enum schema over the model ids, in the order given.
 * @throws {TypeError} If `_models` is empty. Previously this surfaced as an opaque
 *   "Cannot read properties of undefined" TypeError from indexing `_models[0]`.
 */
export const validateModel = (_models: BackendModel[]) => {
	const [first, ...rest] = _models;
	if (first === undefined) {
		throw new TypeError("validateModel requires at least one model");
	}

	// z.enum is typed over a non-empty tuple, so the first id is passed explicitly
	// and the remaining ids are spread after it.
	return z.enum([first.id, ...rest.map((m) => m.id)]);
};
512
+
513
+ // if `TASK_MODEL` is string & name of a model in `MODELS`, then we use `MODELS[TASK_MODEL]`, else we try to parse `TASK_MODEL` as a model config itself
514
+
515
/**
 * Model shape consumed by backend code.
 *
 * Derived from the type of `defaultModel` by applying the project's `Optional`
 * helper to the keys listed below.
 * NOTE(review): `Optional` is declared outside this section — presumably it makes
 * exactly these keys optional and leaves the rest untouched; confirm against its definition.
 */
export type BackendModel = Optional<
	typeof defaultModel,
	"hasInferenceAPI" | "multimodal" | "parameters" | "preprompt" | "unlisted"
>;