onbuzz 4.9.13 → 4.10.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/node_modules/glob/README.md +31 -5
- package/node_modules/glob/dist/commonjs/glob.d.ts +8 -0
- package/node_modules/glob/dist/commonjs/glob.d.ts.map +1 -1
- package/node_modules/glob/dist/commonjs/glob.js +2 -1
- package/node_modules/glob/dist/commonjs/glob.js.map +1 -1
- package/node_modules/glob/dist/commonjs/index.min.js +3 -3
- package/node_modules/glob/dist/commonjs/index.min.js.map +4 -4
- package/node_modules/glob/dist/commonjs/pattern.d.ts +3 -0
- package/node_modules/glob/dist/commonjs/pattern.d.ts.map +1 -1
- package/node_modules/glob/dist/commonjs/pattern.js +4 -0
- package/node_modules/glob/dist/commonjs/pattern.js.map +1 -1
- package/node_modules/glob/dist/esm/glob.d.ts +8 -0
- package/node_modules/glob/dist/esm/glob.d.ts.map +1 -1
- package/node_modules/glob/dist/esm/glob.js +2 -1
- package/node_modules/glob/dist/esm/glob.js.map +1 -1
- package/node_modules/glob/dist/esm/index.min.js +3 -3
- package/node_modules/glob/dist/esm/index.min.js.map +4 -4
- package/node_modules/glob/dist/esm/pattern.d.ts +3 -0
- package/node_modules/glob/dist/esm/pattern.d.ts.map +1 -1
- package/node_modules/glob/dist/esm/pattern.js +4 -0
- package/node_modules/glob/dist/esm/pattern.js.map +1 -1
- package/node_modules/{@isaacs → glob/node_modules}/balanced-match/README.md +7 -10
- package/node_modules/{@isaacs → glob/node_modules}/balanced-match/package.json +7 -18
- package/node_modules/{@isaacs → glob/node_modules}/brace-expansion/README.md +3 -6
- package/node_modules/{@isaacs → glob/node_modules}/brace-expansion/dist/commonjs/index.js +6 -4
- package/node_modules/glob/node_modules/brace-expansion/dist/commonjs/index.js.map +1 -0
- package/node_modules/{@isaacs → glob/node_modules}/brace-expansion/dist/esm/index.js +6 -4
- package/node_modules/glob/node_modules/brace-expansion/dist/esm/index.js.map +1 -0
- package/node_modules/{@isaacs → glob/node_modules}/brace-expansion/package.json +11 -7
- package/node_modules/glob/node_modules/minimatch/README.md +76 -1
- package/node_modules/glob/node_modules/minimatch/dist/commonjs/assert-valid-pattern.d.ts +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/commonjs/assert-valid-pattern.d.ts.map +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/commonjs/assert-valid-pattern.js.map +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/commonjs/ast.d.ts +4 -2
- package/node_modules/glob/node_modules/minimatch/dist/commonjs/ast.d.ts.map +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/commonjs/ast.js +309 -55
- package/node_modules/glob/node_modules/minimatch/dist/commonjs/ast.js.map +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/commonjs/brace-expressions.d.ts.map +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/commonjs/brace-expressions.js +2 -4
- package/node_modules/glob/node_modules/minimatch/dist/commonjs/brace-expressions.js.map +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/commonjs/escape.d.ts +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/commonjs/escape.d.ts.map +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/commonjs/escape.js +4 -4
- package/node_modules/glob/node_modules/minimatch/dist/commonjs/escape.js.map +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/commonjs/index.d.ts +81 -1
- package/node_modules/glob/node_modules/minimatch/dist/commonjs/index.d.ts.map +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/commonjs/index.js +232 -134
- package/node_modules/glob/node_modules/minimatch/dist/commonjs/index.js.map +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/commonjs/unescape.d.ts +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/commonjs/unescape.d.ts.map +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/commonjs/unescape.js +8 -8
- package/node_modules/glob/node_modules/minimatch/dist/commonjs/unescape.js.map +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/esm/assert-valid-pattern.d.ts +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/esm/assert-valid-pattern.d.ts.map +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/esm/assert-valid-pattern.js.map +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/esm/ast.d.ts +4 -2
- package/node_modules/glob/node_modules/minimatch/dist/esm/ast.d.ts.map +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/esm/ast.js +309 -55
- package/node_modules/glob/node_modules/minimatch/dist/esm/ast.js.map +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/esm/brace-expressions.d.ts.map +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/esm/brace-expressions.js +2 -4
- package/node_modules/glob/node_modules/minimatch/dist/esm/brace-expressions.js.map +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/esm/escape.d.ts +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/esm/escape.d.ts.map +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/esm/escape.js +4 -4
- package/node_modules/glob/node_modules/minimatch/dist/esm/escape.js.map +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/esm/index.d.ts +81 -1
- package/node_modules/glob/node_modules/minimatch/dist/esm/index.d.ts.map +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/esm/index.js +232 -134
- package/node_modules/glob/node_modules/minimatch/dist/esm/index.js.map +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/esm/unescape.d.ts +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/esm/unescape.d.ts.map +1 -1
- package/node_modules/glob/node_modules/minimatch/dist/esm/unescape.js +8 -8
- package/node_modules/glob/node_modules/minimatch/dist/esm/unescape.js.map +1 -1
- package/node_modules/glob/node_modules/minimatch/package.json +17 -11
- package/node_modules/glob/package.json +10 -13
- package/node_modules/minipass/LICENSE.md +55 -0
- package/node_modules/minipass/dist/commonjs/index.d.ts +12 -16
- package/node_modules/minipass/dist/commonjs/index.d.ts.map +1 -1
- package/node_modules/minipass/dist/commonjs/index.js +13 -3
- package/node_modules/minipass/dist/commonjs/index.js.map +1 -1
- package/node_modules/minipass/dist/esm/index.d.ts +12 -16
- package/node_modules/minipass/dist/esm/index.d.ts.map +1 -1
- package/node_modules/minipass/dist/esm/index.js +3 -1
- package/node_modules/minipass/dist/esm/index.js.map +1 -1
- package/node_modules/minipass/package.json +9 -14
- package/node_modules/path-scurry/node_modules/lru-cache/README.md +96 -10
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/browser/diagnostics-channel-browser.d.ts.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/browser/diagnostics-channel-browser.js.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/browser/diagnostics-channel.d.ts +5 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/browser/diagnostics-channel.js +7 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/browser/index.d.ts +1400 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/browser/index.d.ts.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/browser/index.js +1726 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/browser/index.js.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/browser/index.min.js +2 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/browser/index.min.js.map +7 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/browser/perf.d.ts +12 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/browser/perf.d.ts.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/browser/perf.js +10 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/browser/perf.js.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/diagnostics-channel-cjs.cjs.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/diagnostics-channel-cjs.d.cts.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/diagnostics-channel.d.ts +5 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/diagnostics-channel.js +7 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/index.d.ts +109 -32
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/index.d.ts.map +1 -1
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/index.js +334 -197
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/index.js.map +1 -1
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/index.min.js +1 -1
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/index.min.js.map +4 -4
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/node/diagnostics-channel-node.d.ts.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/node/diagnostics-channel-node.js.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/node/diagnostics-channel.d.ts +5 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/node/diagnostics-channel.js +9 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/node/index.d.ts +1400 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/node/index.d.ts.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/node/index.js +1726 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/node/index.js.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/node/index.min.js +2 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/node/index.min.js.map +7 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/node/perf.d.ts +12 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/node/perf.d.ts.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/node/perf.js +10 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/node/perf.js.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/perf.d.ts +12 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/perf.d.ts.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/perf.js +10 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/commonjs/perf.js.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/browser/diagnostics-channel-browser.d.ts.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/browser/diagnostics-channel-browser.js.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/browser/diagnostics-channel.d.ts +5 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/browser/diagnostics-channel.js +4 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/browser/index.d.ts +1400 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/browser/index.d.ts.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/browser/index.js +1722 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/browser/index.js.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/browser/index.min.js +2 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/browser/index.min.js.map +7 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/browser/perf.d.ts +12 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/browser/perf.d.ts.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/browser/perf.js +7 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/browser/perf.js.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/diagnostics-channel-esm.d.mts.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/diagnostics-channel-esm.mjs.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/diagnostics-channel.d.ts +5 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/diagnostics-channel.js +19 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/index.d.ts +109 -32
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/index.d.ts.map +1 -1
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/index.js +333 -196
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/index.js.map +1 -1
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/index.min.js +1 -1
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/index.min.js.map +4 -4
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/node/diagnostics-channel-node.d.ts.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/node/diagnostics-channel-node.js.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/node/diagnostics-channel.d.ts +5 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/node/diagnostics-channel.js +6 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/node/index.d.ts +1400 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/node/index.d.ts.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/node/index.js +1722 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/node/index.js.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/node/index.min.js +2 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/node/index.min.js.map +7 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/node/perf.d.ts +12 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/node/perf.d.ts.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/node/perf.js +7 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/node/perf.js.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/perf.d.ts +12 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/perf.d.ts.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/perf.js +7 -0
- package/node_modules/path-scurry/node_modules/lru-cache/dist/esm/perf.js.map +1 -0
- package/node_modules/path-scurry/node_modules/lru-cache/package.json +71 -18
- package/node_modules/path-scurry/package.json +8 -24
- package/package.json +1 -1
- package/scripts/debug-balance-probe.mjs +35 -35
- package/scripts/push-image.sh +43 -43
- package/scripts/setup-acr.sh +65 -65
- package/scripts/verify-optional-deps.js +96 -1
- package/src/__tests__/composioCliFlags.test.js +239 -239
- package/src/analyzers/CSSAnalyzer.js +298 -297
- package/src/analyzers/ConfigValidator.js +691 -690
- package/src/analyzers/ESLintAnalyzer.js +320 -320
- package/src/analyzers/JavaScriptAnalyzer.js +260 -261
- package/src/analyzers/PrettierFormatter.js +246 -247
- package/src/analyzers/PythonAnalyzer.js +283 -283
- package/src/analyzers/SecurityAnalyzer.js +729 -729
- package/src/analyzers/SparrowAnalyzer.js +341 -341
- package/src/analyzers/TypeScriptAnalyzer.js +247 -247
- package/src/analyzers/__tests__/CSSAnalyzer.test.js +41 -41
- package/src/analyzers/__tests__/ConfigValidator.test.js +362 -362
- package/src/analyzers/__tests__/JavaScriptAnalyzer.test.js +40 -40
- package/src/analyzers/__tests__/PythonAnalyzer.test.js +205 -208
- package/src/analyzers/__tests__/SecurityAnalyzer.test.js +303 -303
- package/src/analyzers/__tests__/TypeScriptAnalyzer.test.js +187 -187
- package/src/analyzers/codeCloneDetector/analyzer.js +344 -344
- package/src/analyzers/codeCloneDetector/detector.js +250 -250
- package/src/analyzers/codeCloneDetector/index.js +194 -192
- package/src/analyzers/codeCloneDetector/parser.js +199 -199
- package/src/core/__tests__/agentPool.test.js +866 -866
- package/src/core/__tests__/agentPoolAutoResume.test.js +209 -209
- package/src/core/__tests__/agentPoolWakeOnMessage.test.js +315 -315
- package/src/core/__tests__/agentScheduler.emptyResponseChatStall.test.js +213 -213
- package/src/core/__tests__/agentScheduler.errorCategorisation.test.js +246 -246
- package/src/core/__tests__/agentScheduler.firstChunkTimeout.test.js +138 -138
- package/src/core/__tests__/agentScheduler.modeTransitions.test.js +233 -233
- package/src/core/__tests__/agentScheduler.nativePromptPick.test.js +319 -319
- package/src/core/__tests__/agentScheduler.taskLifecycleInstruction.test.js +78 -78
- package/src/core/__tests__/agentScheduler.visualizer.test.js +258 -258
- package/src/core/__tests__/flowCheckpointStore.test.js +140 -140
- package/src/core/__tests__/flowEndToEnd.test.js +565 -565
- package/src/core/__tests__/flowFieldMapping.test.js +188 -189
- package/src/core/__tests__/flowLintClientMirror.test.js +96 -98
- package/src/core/__tests__/flowSavePayload.test.js +170 -169
- package/src/core/__tests__/flowTemplates.test.js +311 -311
- package/src/core/__tests__/flowVersionStore.test.js +123 -123
- package/src/core/__tests__/messageProcessor.test.js +669 -669
- package/src/core/__tests__/stateManager.test.js +0 -1
- package/src/core/agentPool.js +2474 -2475
- package/src/core/agentScheduler.js +1 -4
- package/src/core/contextManager.js +708 -708
- package/src/core/flowExecutor.js +1510 -1510
- package/src/core/flowFieldMapping.js +136 -138
- package/src/core/messageProcessor.js +953 -954
- package/src/core/orchestrator.js +593 -595
- package/src/core/stateManager.js +1765 -1752
- package/src/index.js +1221 -1221
- package/src/interfaces/__tests__/archivedAgentDelete.test.js +207 -207
- package/src/interfaces/__tests__/bulkAgentRoute.test.js +361 -361
- package/src/interfaces/__tests__/imageServing.test.js +228 -228
- package/src/interfaces/__tests__/remoteSessionAuth.test.js +308 -308
- package/src/interfaces/__tests__/videoJobsRoutes.test.js +178 -179
- package/src/interfaces/__tests__/webServer.marketplace.test.js +629 -629
- package/src/interfaces/schedulerRoutes.js +50 -50
- package/src/interfaces/terminal/__tests__/smoke/connection.test.js +341 -350
- package/src/interfaces/terminal/__tests__/smoke/enhancements.test.js +156 -156
- package/src/interfaces/terminal/__tests__/smoke/imports.test.js +325 -330
- package/src/interfaces/terminal/__tests__/smoke/tools.test.js +385 -388
- package/src/interfaces/terminal/api/session.js +265 -266
- package/src/interfaces/terminal/api/websocket.js +496 -497
- package/src/interfaces/terminal/components/AgentCreator.js +691 -705
- package/src/interfaces/terminal/components/AgentEditor.js +676 -678
- package/src/interfaces/terminal/components/AgentSwitcher.js +331 -330
- package/src/interfaces/terminal/components/ErrorPanel.js +263 -264
- package/src/interfaces/terminal/components/Header.js +28 -28
- package/src/interfaces/terminal/components/Layout.js +598 -603
- package/src/interfaces/terminal/components/MessageList.js +280 -281
- package/src/interfaces/terminal/components/SettingsPanel.js +410 -415
- package/src/interfaces/terminal/components/StatusBar.js +2 -0
- package/src/interfaces/terminal/index.js +168 -168
- package/src/interfaces/terminal/state/useAgentControl.js +496 -496
- package/src/interfaces/terminal/state/useAgents.js +537 -537
- package/src/interfaces/terminal/state/useMessages.js +629 -630
- package/src/interfaces/terminal/state/useTools.js +554 -554
- package/src/interfaces/terminal/utils/debugLogger.js +44 -44
- package/src/interfaces/terminal/utils/settingsStorage.js +232 -232
- package/src/interfaces/webServer.js +7578 -7579
- package/src/interfaces/webServer.js.bak +7046 -7046
- package/src/modules/fileExplorer/__tests__/zipDownload.test.js +237 -237
- package/src/modules/fileExplorer/controller.js +470 -469
- package/src/modules/fileExplorer/routes.js +285 -286
- package/src/modules/widget/__tests__/isDisabled.test.js +41 -41
- package/src/modules/widget/__tests__/routes.test.js +677 -678
- package/src/modules/widget/__tests__/runtime.test.js +401 -401
- package/src/modules/widget/__tests__/versioning.test.js +309 -309
- package/src/modules/widget/__tests__/webComponentRuntime.test.js +565 -565
- package/src/modules/widget/__tests__/widgetTool.test.js +316 -316
- package/src/modules/widget/routes.js +435 -435
- package/src/modules/widget/runtime/bundle.js +640 -640
- package/src/modules/widget/runtime/webComponentBundle.js +470 -470
- package/src/modules/widget/schema.js +182 -181
- package/src/modules/widget/widgetTool.js +1389 -1389
- package/src/services/__tests__/agentActivityService.test.js +401 -402
- package/src/services/__tests__/benchmarkService.test.js +184 -184
- package/src/services/__tests__/contextInjectionService.test.js +246 -246
- package/src/services/__tests__/conversationQuery.test.js +721 -723
- package/src/services/__tests__/credentialVault.test.js +469 -469
- package/src/services/__tests__/discordService.integration.test.js +638 -639
- package/src/services/__tests__/flowContextService.test.js +590 -590
- package/src/services/__tests__/memoryService.test.js +1 -1
- package/src/services/__tests__/messageSource.test.js +380 -380
- package/src/services/__tests__/modelRouterNaming.test.js +111 -111
- package/src/services/__tests__/projectDetector.test.js +34 -34
- package/src/services/__tests__/promptService.test.js +242 -242
- package/src/services/__tests__/telegramService.test.js +941 -941
- package/src/services/__tests__/tokenCountingService.test.js +48 -48
- package/src/services/agentActivityService.js +419 -420
- package/src/services/aiService.js +2997 -3001
- package/src/services/apiKeyManager.js +359 -359
- package/src/services/benchmarkService.js +196 -196
- package/src/services/codebaseKnowledgeService.js +2 -2
- package/src/services/composioService.js +738 -738
- package/src/services/conversationCompactionService.js +1258 -1257
- package/src/services/credentialVault.js +685 -685
- package/src/services/discordService.js +792 -793
- package/src/services/embeddings/__tests__/azureCustomProvider.test.js +232 -232
- package/src/services/embeddings/__tests__/embeddingService.test.js +417 -417
- package/src/services/embeddings/__tests__/localProvider.test.js +263 -263
- package/src/services/embeddings/autoRecall.js +218 -219
- package/src/services/embeddings/indexers/__tests__/agentIndexer.test.js +232 -232
- package/src/services/embeddings/indexers/__tests__/memoryIndexer.test.js +418 -418
- package/src/services/embeddings/indexers/__tests__/reminisceIndexer.test.js +356 -357
- package/src/services/embeddings/indexers/__tests__/skillsIndexer.test.js +145 -145
- package/src/services/embeddings/indexers/__tests__/taskIndexer.test.js +146 -146
- package/src/services/embeddings/indexers/composioIndexer.js +279 -279
- package/src/services/embeddings/providerInterface.js +206 -206
- package/src/services/embeddings/providers/localProvider.js +11 -7
- package/src/services/embeddings/providers/openaiProvider.js +101 -101
- package/src/services/embeddings/vectorStore/inMemoryJsonStore.js +356 -356
- package/src/services/errorHandler.js +809 -809
- package/src/services/flowContextService.js +586 -586
- package/src/services/grounding/MockAdapter.js +125 -125
- package/src/services/modelRouterService.js +26 -31
- package/src/services/modelsService.js +322 -322
- package/src/services/ollamaService.js +452 -452
- package/src/services/projectDetector.js +403 -404
- package/src/services/promptService.js +418 -418
- package/src/services/qualityInspector.js +795 -795
- package/src/services/scheduleService.js +726 -726
- package/src/services/serviceRegistry.js +386 -386
- package/src/services/telegrafBot.js +174 -174
- package/src/services/telegramService.js +1972 -1972
- package/src/services/visualEditorBridge.js +1033 -1033
- package/src/services/visualEditorServer.js +1769 -1774
- package/src/services/whatsappService.js +667 -668
- package/src/tools/__tests__/agentCommunicationTool.findAgent.test.js +226 -226
- package/src/tools/__tests__/agentCommunicationTool.test.js +3 -3
- package/src/tools/__tests__/agentDelayTool.test.js +342 -342
- package/src/tools/__tests__/baseTool.test.js +3 -3
- package/src/tools/__tests__/codeMapTool.test.js +915 -915
- package/src/tools/__tests__/fileContentReplaceTool.test.js +309 -309
- package/src/tools/__tests__/fileTreeTool.test.js +274 -274
- package/src/tools/__tests__/filesystemTool.test.js +815 -815
- package/src/tools/__tests__/foundryWebSearchTool.test.js +252 -252
- package/src/tools/__tests__/imageTool.validator.test.js +194 -194
- package/src/tools/__tests__/jobDoneTool.test.js +580 -581
- package/src/tools/__tests__/memoryTool.forgetStale.test.js +272 -272
- package/src/tools/__tests__/memoryTool.reminisce.test.js +2 -2
- package/src/tools/__tests__/memoryTool.reminisceSemanticSearch.test.js +301 -301
- package/src/tools/__tests__/memoryTool.semanticSearch.test.js +405 -405
- package/src/tools/__tests__/memoryTool.teamPool.test.js +293 -293
- package/src/tools/__tests__/memoryTool.test.js +1 -1
- package/src/tools/__tests__/seekTool.test.js +282 -282
- package/src/tools/__tests__/skillsTool.search.test.js +164 -164
- package/src/tools/__tests__/skillsTool.test.js +226 -226
- package/src/tools/__tests__/staticAnalysisTool.test.js +509 -509
- package/src/tools/__tests__/taskManagerTool.discipline.test.js +137 -137
- package/src/tools/__tests__/taskManagerTool.search.test.js +143 -143
- package/src/tools/__tests__/taskManagerTool.test.js +866 -866
- package/src/tools/__tests__/terminalTool.test.js +448 -448
- package/src/tools/__tests__/toolShapeForgiveness.test.js +259 -260
- package/src/tools/__tests__/userPromptTool.test.js +297 -297
- package/src/tools/__tests__/videoTool.jobs.test.js +147 -147
- package/src/tools/__tests__/webTool.e2e.test.js +609 -603
- package/src/tools/__tests__/webTool.unit.test.js +195 -195
- package/src/tools/__tests__/webTool.visionModel.test.js +75 -75
- package/src/tools/agentCommunicationTool.js +8 -10
- package/src/tools/agentDelayTool.js +496 -497
- package/src/tools/asyncToolManager.js +602 -603
- package/src/tools/baseTool.js +12 -11
- package/src/tools/cloneDetectionTool.js +576 -581
- package/src/tools/codeMapTool.js +0 -6
- package/src/tools/composioTool.js +617 -617
- package/src/tools/dependencyResolverTool.js +1211 -1212
- package/src/tools/desktop/DesktopTool.js +629 -638
- package/src/tools/desktop/__tests__/DesktopTool.e2e.test.js +306 -306
- package/src/tools/desktop/__tests__/DesktopTool.test.js +507 -507
- package/src/tools/desktop/__tests__/osController.test.js +364 -364
- package/src/tools/desktop/osController.js +491 -491
- package/src/tools/docxTool.js +623 -623
- package/src/tools/excelTool.js +636 -636
- package/src/tools/fileContentReplaceTool.js +5 -7
- package/src/tools/fileSystemTool.js +12 -19
- package/src/tools/fileTreeTool.js +840 -840
- package/src/tools/foundryWebSearchTool.js +273 -273
- package/src/tools/helpTool.js +198 -198
- package/src/tools/imageTool.js +1397 -1397
- package/src/tools/importAnalyzerTool.js +1056 -1056
- package/src/tools/jobDoneTool.js +495 -495
- package/src/tools/memoryTool.js +1 -1
- package/src/tools/office/pres/__tests__/presSystem.test.js +365 -365
- package/src/tools/office/pres/archetypes/agenda.js +61 -61
- package/src/tools/office/pres/archetypes/bentoGrid.js +218 -219
- package/src/tools/office/pres/archetypes/bigStat.js +140 -142
- package/src/tools/office/pres/archetypes/closing.js +70 -70
- package/src/tools/office/pres/archetypes/hero.js +70 -70
- package/src/tools/office/pres/archetypes/productHero.js +93 -94
- package/src/tools/office/pres/archetypes/table.js +73 -74
- package/src/tools/office/pres/backgrounds/orb.js +66 -66
- package/src/tools/office/pres/components.js +422 -423
- package/src/tools/officeTool.js +441 -441
- package/src/tools/pdfTool.js +625 -627
- package/src/tools/platformControlTool.js +1081 -1081
- package/src/tools/seekTool.js +917 -918
- package/src/tools/skillsTool.js +1 -1
- package/src/tools/staticAnalysisTool.js +2143 -2146
- package/src/tools/taskManagerTool.js +3324 -3324
- package/src/tools/terminalTool.js +2615 -2618
- package/src/tools/videoTool.js +1303 -1303
- package/src/tools/visionTool.js +508 -508
- package/src/tools/visualEditorTool.js +1289 -1290
- package/src/tools/webTool.js +3368 -3368
- package/src/tools/whatsappTool.js +464 -464
- package/src/types/__tests__/agent.test.js +499 -499
- package/src/types/__tests__/contextReference.test.js +606 -606
- package/src/types/__tests__/conversation.test.js +555 -555
- package/src/types/__tests__/toolCommand.test.js +584 -584
- package/src/types/contextReference.js +974 -971
- package/src/types/conversation.js +729 -729
- package/src/types/toolCommand.js +746 -746
- package/src/utilities/__tests__/attachmentValidator.test.js +80 -80
- package/src/utilities/__tests__/auditReport.test.js +328 -328
- package/src/utilities/__tests__/directoryAccessManager.test.js +388 -388
- package/src/utilities/__tests__/jsonRepair.test.js +103 -104
- package/src/utilities/__tests__/modeTransitionReasons.test.js +105 -105
- package/src/utilities/__tests__/platformUtils.test.js +80 -87
- package/src/utilities/__tests__/structuredFileValidator.test.js +261 -263
- package/src/utilities/__tests__/toolConstants.test.js +92 -94
- package/src/utilities/__tests__/useIsTouchDevice.detect.test.js +114 -114
- package/src/utilities/__tests__/webUiUtilSync.test.js +117 -117
- package/src/utilities/attachmentValidator.js +284 -288
- package/src/utilities/authCache.js.backup-1779570472481 +121 -121
- package/src/utilities/browserStealth.js +631 -630
- package/src/utilities/configManager.js +616 -617
- package/src/utilities/directoryAccessManager.js +564 -565
- package/src/utilities/fileProcessor.js +308 -307
- package/src/utilities/humanBehavior.js +454 -453
- package/src/utilities/logger.js +479 -479
- package/src/utilities/structuredFileValidator.js +696 -699
- package/src/utilities/tagParser.js +5 -10
- package/src/utilities/userDataDir.js +308 -308
- package/node_modules/@isaacs/brace-expansion/dist/commonjs/index.js.map +0 -1
- package/node_modules/@isaacs/brace-expansion/dist/esm/index.js.map +0 -1
- package/node_modules/minipass/LICENSE +0 -15
- /package/node_modules/{@isaacs → glob/node_modules}/balanced-match/LICENSE.md +0 -0
- /package/node_modules/{@isaacs → glob/node_modules}/balanced-match/dist/commonjs/index.d.ts +0 -0
- /package/node_modules/{@isaacs → glob/node_modules}/balanced-match/dist/commonjs/index.d.ts.map +0 -0
- /package/node_modules/{@isaacs → glob/node_modules}/balanced-match/dist/commonjs/index.js +0 -0
- /package/node_modules/{@isaacs → glob/node_modules}/balanced-match/dist/commonjs/index.js.map +0 -0
- /package/node_modules/{@isaacs → glob/node_modules}/balanced-match/dist/commonjs/package.json +0 -0
- /package/node_modules/{@isaacs → glob/node_modules}/balanced-match/dist/esm/index.d.ts +0 -0
- /package/node_modules/{@isaacs → glob/node_modules}/balanced-match/dist/esm/index.d.ts.map +0 -0
- /package/node_modules/{@isaacs → glob/node_modules}/balanced-match/dist/esm/index.js +0 -0
- /package/node_modules/{@isaacs → glob/node_modules}/balanced-match/dist/esm/index.js.map +0 -0
- /package/node_modules/{@isaacs → glob/node_modules}/balanced-match/dist/esm/package.json +0 -0
- /package/node_modules/{@isaacs → glob/node_modules}/brace-expansion/LICENSE +0 -0
- /package/node_modules/{@isaacs → glob/node_modules}/brace-expansion/dist/commonjs/index.d.ts +0 -0
- /package/node_modules/{@isaacs → glob/node_modules}/brace-expansion/dist/commonjs/index.d.ts.map +0 -0
- /package/node_modules/{@isaacs → glob/node_modules}/brace-expansion/dist/commonjs/package.json +0 -0
- /package/node_modules/{@isaacs → glob/node_modules}/brace-expansion/dist/esm/index.d.ts +0 -0
- /package/node_modules/{@isaacs → glob/node_modules}/brace-expansion/dist/esm/index.d.ts.map +0 -0
- /package/node_modules/{@isaacs → glob/node_modules}/brace-expansion/dist/esm/package.json +0 -0
package/src/tools/visionTool.js
CHANGED
|
@@ -1,508 +1,508 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* Vision Tool — Image analysis for agents
|
|
3
|
-
*
|
|
4
|
-
* Purpose:
|
|
5
|
-
* - Analyze images from disk with natural language questions
|
|
6
|
-
* - Session-based: first call uploads image, subsequent calls reuse it
|
|
7
|
-
* - Uses the best available vision model as ranked by the model catalog (no hardcoded model names)
|
|
8
|
-
* - Returns structured answers only (no filler text)
|
|
9
|
-
*
|
|
10
|
-
* Actions:
|
|
11
|
-
* - analyze: Send an image + question, get a structured answer + session ID
|
|
12
|
-
* - ask: Ask a follow-up question about an image in an existing session
|
|
13
|
-
* - list-sessions: List active vision sessions
|
|
14
|
-
* - close-session: Close a vision session to free memory
|
|
15
|
-
*/
|
|
16
|
-
|
|
17
|
-
import { BaseTool } from './baseTool.js';
|
|
18
|
-
import { promises as fs } from 'fs';
|
|
19
|
-
import path from 'path';
|
|
20
|
-
|
|
21
|
-
// Vision model selection uses catalog tags + recommended_for fields.
|
|
22
|
-
// No hardcoded model names — the catalog determines which models are best for vision.
|
|
23
|
-
|
|
24
|
-
const MAX_IMAGE_SIZE_BYTES = 20 * 1024 * 1024; // 20MB: largest image that _analyze accepts before rejecting with "Image too large"
|
|
25
|
-
const SESSION_TIMEOUT_MS = 30 * 60 * 1000; // 30 minutes: idle time (since lastActivity) after which the cleanup sweep drops a session
|
|
26
|
-
const CLEANUP_INTERVAL_MS = 5 * 60 * 1000; // 5 minutes: period of the setInterval sweep started by _ensureCleanup
|
|
27
|
-
|
|
28
|
-
/**
 * Agent tool that answers natural-language questions about image files.
 *
 * "analyze" reads an image from disk, sends it together with a question to a
 * vision-capable model and keeps the base64-encoded image in an in-memory
 * session, so that "ask" can pose follow-up questions without re-reading the
 * file. Sessions idle for longer than SESSION_TIMEOUT_MS are dropped by a
 * background sweep (see _ensureCleanup).
 */
class VisionTool extends BaseTool {
  /**
   * @param {object} [config] - Tool configuration, forwarded to BaseTool.
   * @param {object|null} [logger] - Optional logger, forwarded to BaseTool.
   */
  constructor(config = {}, logger = null) {
    super(config, logger);

    this.aiService = null;
    this.modelsService = null;
    this.requiresProject = false;
    this.isAsync = false;
    this.timeout = 120000; // 2 minutes (vision can be slow)

    // Session storage: sessionId → { imageBase64, mimeType, imagePath, history, createdAt, lastActivity }
    this.sessions = new Map();
    this.cleanupTimer = null;

    // Name of the model chosen by the most recent _selectVisionModel() call.
    this._selectedModel = null;
  }

  // --- Dependency Injection ---

  /** @param {object} aiService - Service exposing `backendUrl` and `apiKeyManager`. */
  setAIService(aiService) { this.aiService = aiService; }

  /** @param {object} modelsService - Service whose `getModels()` lists the model catalog. */
  setModelsService(modelsService) { this.modelsService = modelsService; }

  /** @param {object} agentPool - Stored on the instance; not read anywhere in this class. */
  setAgentPool(agentPool) { this.agentPool = agentPool; }

  /**
   * Usage text for this tool (actions, JSON examples, limits).
   * @returns {string}
   */
  getDescription() {
    return `Vision Tool: Analyze images with AI vision models.

Send an image file + a question and receive a structured answer. Supports follow-up questions on the same image without re-uploading.

ACTIONS:

1. ANALYZE — Send image + question (creates a session):
\`\`\`json
{ "toolId": "vision", "action": "analyze", "imagePath": "/path/to/image.png", "question": "What objects are in this image?" }
\`\`\`
Returns: { answer, sessionId, model }

2. ASK — Follow-up question on an existing session:
\`\`\`json
{ "toolId": "vision", "action": "ask", "sessionId": "vs-...", "question": "What color is the largest object?" }
\`\`\`
Returns: { answer, sessionId, model }

3. LIST-SESSIONS — Show active vision sessions:
\`\`\`json
{ "toolId": "vision", "action": "list-sessions" }
\`\`\`

4. CLOSE-SESSION — Free a session:
\`\`\`json
{ "toolId": "vision", "action": "close-session", "sessionId": "vs-..." }
\`\`\`

SUPPORTED FORMATS: JPEG, PNG, GIF, WebP, BMP (max 20MB)
MODEL: Automatically selects the best available vision model from the model catalog.
ANSWERS: Structured, direct answers only — no filler text.`;
  }

  /**
   * Parameters arrive already structured, so they are passed through untouched.
   * @param {object} content
   * @returns {object} The same object.
   */
  parseParameters(content) {
    return content;
  }

  /** @returns {string[]} Parameters every call must provide. */
  getRequiredParameters() {
    return ['action'];
  }

  /** @returns {string[]} Action names accepted by execute(). */
  getSupportedActions() {
    return ['analyze', 'ask', 'list-sessions', 'close-session'];
  }

  /**
   * Checks that every supplied parameter is a string.
   * @param {object} params
   * @returns {string[]} One message per wrongly-typed parameter (empty when valid).
   */
  validateParameterTypes(params) {
    const errors = [];
    if (params.action && typeof params.action !== 'string') errors.push('action must be a string');
    if (params.imagePath !== undefined && typeof params.imagePath !== 'string') errors.push('imagePath must be a string');
    if (params.question !== undefined && typeof params.question !== 'string') errors.push('question must be a string');
    if (params.sessionId !== undefined && typeof params.sessionId !== 'string') errors.push('sessionId must be a string');
    return errors;
  }

  /**
   * Checks that the action is supported and that its required fields are present.
   * @param {object} params
   * @returns {string[]} Validation messages (empty when valid).
   */
  customValidateParameters(params) {
    const errors = [];
    const validActions = this.getSupportedActions();
    if (!validActions.includes(params.action)) {
      errors.push(`Invalid action: "${params.action}". Valid: ${validActions.join(', ')}`);
      return errors;
    }
    if (params.action === 'analyze') {
      if (!params.imagePath) errors.push('"imagePath" is required for analyze');
      if (!params.question) errors.push('"question" is required for analyze');
    }
    if (params.action === 'ask') {
      if (!params.sessionId) errors.push('"sessionId" is required for ask');
      if (!params.question) errors.push('"question" is required for ask');
    }
    if (params.action === 'close-session') {
      if (!params.sessionId) errors.push('"sessionId" is required for close-session');
    }
    return errors;
  }

  /**
   * Entry point: dispatches to the handler for `params.action`.
   *
   * Never throws; every failure is reported as `{ success: false, error }`.
   *
   * @param {object} params - `{ action, imagePath?, question?, sessionId? }`, or the
   *   plural envelope `{ actions: [{ type|action, ... }] }` (only the first entry is used).
   * @param {object} [context] - Execution context (sessionId, agentId, currentModel,
   *   directoryAccess, projectDir are read by the handlers).
   * @returns {Promise<{success: boolean, result?: object, error?: string}>}
   */
  async execute(params, context = {}) {
    // Reverse-forgiveness: accept plural envelope {actions:[{type/action}]}
    // even though this tool's canonical shape is singular.
    let request = params;
    if (Array.isArray(request?.actions) && request.actions.length > 0) {
      const first = request.actions[0] || {};
      request = { ...request, ...first, action: first.type || first.action || request.action };
    }

    this._ensureCleanup();

    try {
      // Validate the *normalized* request so a missing imagePath/sessionId is
      // reported clearly instead of as a TypeError from deeper in the handlers.
      // Unknown actions still fall through to the switch's default branch.
      if (this.getSupportedActions().includes(request.action)) {
        const problems = [
          ...this.validateParameterTypes(request),
          ...this.customValidateParameters(request)
        ];
        if (problems.length > 0) {
          return { success: false, error: problems.join('; ') };
        }
      }

      switch (request.action) {
        case 'analyze':
          return await this._analyze(request.imagePath, request.question, context);
        case 'ask':
          return await this._ask(request.sessionId, request.question, context);
        case 'list-sessions':
          return this._listSessions();
        case 'close-session':
          return this._closeSession(request.sessionId);
        default:
          return { success: false, error: `Unknown action: ${request.action}` };
      }
    } catch (error) {
      return { success: false, error: error.message };
    }
  }

  // --- Core Actions ---

  /**
   * Turns the caller-supplied path into an absolute one.
   *
   * Relative paths resolve against the agent's working directory, then the
   * project directory, then the process cwd.
   *
   * NOTE(review): absolute paths are returned as-is and relative paths may
   * contain "..", so nothing here confines reads to the working directory.
   * Confirm that access control is enforced elsewhere.
   *
   * @param {string} imagePath
   * @param {object} context
   * @returns {string} Absolute path.
   */
  _resolveImagePath(imagePath, context) {
    if (path.isAbsolute(imagePath)) return imagePath;
    const workingDir = context.directoryAccess?.workingDirectory || context.projectDir || process.cwd();
    return path.resolve(workingDir, imagePath);
  }

  /**
   * Validates and reads an image file.
   *
   * The size is checked with stat() before the file is read, so an oversized
   * file is rejected without loading it into memory.
   *
   * @param {string} resolvedPath - Absolute path to read.
   * @param {string} imagePath - Path as given by the caller (used in messages).
   * @returns {Promise<{imageBase64: string, mimeType: string}>}
   * @throws {Error} When the file is missing, unreadable, too large or of an unsupported type.
   */
  async _loadImage(resolvedPath, imagePath) {
    const asReadError = (err) => (err?.code === 'ENOENT'
      ? new Error(`Image not found: ${imagePath}`)
      : new Error(`Unable to read image: ${imagePath} (${err?.code || err?.message})`, { cause: err }));

    let stats;
    try {
      stats = await fs.stat(resolvedPath);
    } catch (err) {
      throw asReadError(err);
    }

    if (stats.size > MAX_IMAGE_SIZE_BYTES) {
      throw new Error(`Image too large (${(stats.size / 1024 / 1024).toFixed(1)}MB). Max: ${MAX_IMAGE_SIZE_BYTES / 1024 / 1024}MB`);
    }

    const ext = path.extname(resolvedPath).toLowerCase();
    const mimeMap = { '.jpg': 'image/jpeg', '.jpeg': 'image/jpeg', '.png': 'image/png', '.gif': 'image/gif', '.webp': 'image/webp', '.bmp': 'image/bmp' };
    const mimeType = Object.hasOwn(mimeMap, ext) ? mimeMap[ext] : undefined;
    if (!mimeType) {
      throw new Error(`Unsupported image format: ${ext}. Supported: ${Object.keys(mimeMap).join(', ')}`);
    }

    let imageBuffer;
    try {
      imageBuffer = await fs.readFile(resolvedPath);
    } catch (err) {
      throw asReadError(err);
    }
    return { imageBase64: imageBuffer.toString('base64'), mimeType };
  }

  /**
   * Handles "analyze": loads the image, asks the model and opens a session.
   *
   * The session is stored only after the model has answered, so a failed
   * request does not leave an unreachable session holding the image in memory.
   *
   * @param {string} imagePath
   * @param {string} question
   * @param {object} context
   * @returns {Promise<{success: true, result: {answer: string, sessionId: string, model: (string|null), imagePath: string}}>}
   */
  async _analyze(imagePath, question, context) {
    const resolvedPath = this._resolveImagePath(imagePath, context);
    const { imageBase64, mimeType } = await this._loadImage(resolvedPath, imagePath);

    const answer = await this._sendVisionRequest(imageBase64, mimeType, question, [], context);

    const now = Date.now();
    const sessionId = `vs-${now}-${Math.random().toString(36).slice(2, 8)}`;
    this.sessions.set(sessionId, {
      imageBase64,
      mimeType,
      imagePath: resolvedPath,
      history: [
        { role: 'user', content: question },
        { role: 'assistant', content: answer }
      ],
      createdAt: now,
      lastActivity: now
    });

    return {
      success: true,
      result: {
        answer,
        sessionId,
        model: this._getSelectedModel(),
        imagePath: resolvedPath
      }
    };
  }

  /**
   * Handles "ask": sends a follow-up question for an existing session.
   *
   * @param {string} sessionId
   * @param {string} question
   * @param {object} context
   * @returns {Promise<{success: true, result: {answer: string, sessionId: string, model: (string|null), questionsInSession: number}}>}
   * @throws {Error} When the session does not exist.
   */
  async _ask(sessionId, question, context) {
    const session = this.sessions.get(sessionId);
    if (!session) {
      throw new Error(`Vision session not found: ${sessionId}. Use "analyze" to start a new session.`);
    }

    session.lastActivity = Date.now();

    // Send with conversation history
    const answer = await this._sendVisionRequest(
      session.imageBase64,
      session.mimeType,
      question,
      session.history,
      context
    );

    session.history.push(
      { role: 'user', content: question },
      { role: 'assistant', content: answer }
    );

    return {
      success: true,
      result: {
        answer,
        sessionId,
        model: this._getSelectedModel(),
        questionsInSession: session.history.filter(h => h.role === 'user').length
      }
    };
  }

  /**
   * Handles "list-sessions".
   * @returns {{success: true, result: {sessions: object[], count: number}}}
   */
  _listSessions() {
    const sessions = [];
    for (const [id, session] of this.sessions) {
      sessions.push({
        sessionId: id,
        imagePath: session.imagePath,
        questionsAsked: session.history.filter(h => h.role === 'user').length,
        createdAt: new Date(session.createdAt).toISOString(),
        lastActivity: new Date(session.lastActivity).toISOString()
      });
    }
    return { success: true, result: { sessions, count: sessions.length } };
  }

  /**
   * Handles "close-session".
   * @param {string} sessionId
   * @returns {{success: boolean, result?: {closed: string}, error?: string}}
   */
  _closeSession(sessionId) {
    if (!this.sessions.has(sessionId)) {
      return { success: false, error: `Session not found: ${sessionId}` };
    }
    this.sessions.delete(sessionId);
    return { success: true, result: { closed: sessionId } };
  }

  // --- Vision API ---

  /**
   * Picks a vision model and asks it the question.
   *
   * Tries the multimodal /llm/chat request first, then falls back to
   * /llm/vision. The fallback receives only the image and the current
   * question, so conversation history is not sent on that path.
   *
   * @param {string} imageBase64
   * @param {string} mimeType
   * @param {string} question
   * @param {Array<{role: string, content: string}>} history - Earlier turns (empty for the first question).
   * @param {object} context
   * @returns {Promise<string>} The model's answer.
   * @throws {Error} When no service/model is available or both endpoints fail.
   */
  async _sendVisionRequest(imageBase64, mimeType, question, history, context) {
    if (!this.aiService) {
      throw new Error('AI service not available. Vision tool requires aiService dependency.');
    }

    const model = this._selectVisionModel(context);
    if (!model) {
      throw new Error('No vision-capable model available. Ensure at least one model with vision support is configured.');
    }

    this.logger?.info('[VisionTool] Selected vision model', { model, visionModelsAvailable: this._getVisionModels().map(m => m.name) });

    const systemPrompt = 'You are a precise image analysis assistant. Answer the question about the image directly and concisely. Provide only the answer — no preamble, no filler, no commentary. If the image contains text, transcribe it accurately. If asked about objects, list them clearly. Structure your response for programmatic consumption.';

    // Primary: multimodal content through the chat endpoint.
    try {
      return await this._callChatCompletionsWithImage(imageBase64, mimeType, question, history, model, systemPrompt, context);
    } catch (chatError) {
      this.logger?.warn('[VisionTool] Chat completions with image failed, trying /llm/vision endpoint', { error: chatError.message });
    }

    // Fallback: dedicated /llm/vision endpoint (supports fewer models)
    try {
      return await this._callVisionEndpoint(imageBase64, question, model, context);
    } catch (visionError) {
      throw new Error(`Vision analysis failed: ${visionError.message}`, { cause: visionError });
    }
  }

  /**
   * Looks up the platform API key for this request.
   * @param {object} context - `context.sessionId` is passed to the key manager.
   * @returns {string|null|undefined} The key, or null when no key manager is configured.
   */
  _visionApiKey(context) {
    if (!this.aiService?.apiKeyManager) return null;
    const keys = this.aiService.apiKeyManager.getKeysForRequest(context.sessionId, { platformProvided: true });
    return keys.loxiaApiKey;
  }

  /**
   * POSTs a JSON payload to the backend and returns the parsed JSON response.
   *
   * @param {string} endpoint - Path appended to the backend URL, e.g. "/llm/chat".
   * @param {object} payload - Request body.
   * @param {object} context
   * @param {string} label - Used in the fallback error "<label> returned <status>".
   * @returns {Promise<object>}
   * @throws {Error} On a non-2xx response (server-provided message when available).
   */
  async _postVisionJson(endpoint, payload, context, label) {
    const backendUrl = this.aiService?.backendUrl || 'https://loxia-api-g7hrb8bxdae8a2h7.z02.azurefd.net';
    const apiKey = this._visionApiKey(context);

    const response = await fetch(`${backendUrl}${endpoint}`, {
      method: 'POST',
      headers: {
        'Content-Type': 'application/json',
        ...(apiKey && { 'Authorization': `Bearer ${apiKey}` })
      },
      body: JSON.stringify(payload),
      signal: AbortSignal.timeout(120000)
    });

    if (!response.ok) {
      const errorData = await response.json().catch(() => ({}));
      const detail = errorData?.error;
      // `error` may be a plain string or an object carrying `message`.
      const message = (typeof detail === 'string' && detail) || detail?.message || `${label} returned ${response.status}`;
      throw new Error(message);
    }

    return response.json();
  }

  /**
   * Sends the image, history and question to /llm/chat as multimodal messages.
   *
   * The image is attached to the first user turn; the image block uses the
   * Anthropic base64 shape when the model name contains "claude" or
   * "anthropic", and the `image_url` data-URL shape otherwise.
   *
   * @returns {Promise<string>} Answer text ('' when the response carries none).
   */
  async _callChatCompletionsWithImage(imageBase64, mimeType, question, history, model, systemPrompt, context) {
    const modelName = model.toLowerCase();
    const isAnthropic = modelName.includes('claude') || modelName.includes('anthropic');
    const imageBlock = isAnthropic
      ? { type: 'image', source: { type: 'base64', media_type: mimeType, data: imageBase64 } }
      : { type: 'image_url', image_url: { url: `data:${mimeType};base64,${imageBase64}` } };

    // The first user turn always carries the image: the original question on
    // follow-ups, the current question otherwise.
    const firstQuestion = history.length > 0 ? history[0].content : question;
    const messages = [
      { role: 'user', content: [imageBlock, { type: 'text', text: firstQuestion }] },
      // Skip history[0]; it is already included with the image above.
      ...history.slice(1).map(({ role, content }) => ({ role, content }))
    ];
    if (history.length > 0) {
      messages.push({ role: 'user', content: question });
    }

    // Build payload matching the /llm/chat endpoint format
    const payload = {
      model,
      message: firstQuestion || question,
      systemPrompt,
      messages, // Multimodal messages array
      options: {
        max_tokens: 2048,
        temperature: 0.1
      },
      metadata: {
        requestId: `vision-${Date.now()}`,
        agentId: context.agentId
      }
    };

    const data = await this._postVisionJson('/llm/chat', payload, context, 'Chat completions');
    return data.content || data.choices?.[0]?.message?.content || '';
  }

  /**
   * Sends the image and a single prompt to the dedicated /llm/vision endpoint.
   * @returns {Promise<string>} Answer text ('' when the response carries none).
   */
  async _callVisionEndpoint(imageBase64, prompt, model, context) {
    const data = await this._postVisionJson(
      '/llm/vision',
      { image: imageBase64, prompt, model, metadata: {} },
      context,
      'Vision API'
    );
    return data.content || '';
  }

  /**
   * Chooses a vision model and remembers it for _getSelectedModel().
   *
   * Preference order: a model whose `recommended_for` includes "vision", a
   * model with tier "budget", the agent's current model if it supports vision,
   * then the first vision model in the catalog.
   *
   * @param {object} [context] - `context.currentModel` is the agent's model name.
   * @returns {string|null} Model name, or null when the catalog has no vision model.
   */
  _selectVisionModel(context = {}) {
    const visionModels = this._getVisionModels();
    if (visionModels.length === 0) {
      this.logger?.warn('[VisionTool] No vision-capable model found in model list');
      return null;
    }

    const agentModel = context.currentModel;
    const chosen =
      visionModels.find(m => m.recommended_for?.includes('vision')) ||
      visionModels.find(m => m.tier === 'budget') ||
      (agentModel && visionModels.find(m => m.name === agentModel)) ||
      visionModels[0];

    this._selectedModel = chosen.name;
    return this._selectedModel;
  }

  /**
   * @returns {object[]} Catalog entries with `supportsVision === true`; empty when
   *   no models service is set or it does not return an array.
   */
  _getVisionModels() {
    if (!this.modelsService) return [];
    const allModels = this.modelsService.getModels?.();
    return Array.isArray(allModels) ? allModels.filter(m => m?.supportsVision === true) : [];
  }

  /** @returns {string|null} Model chosen by the last _selectVisionModel() call. */
  _getSelectedModel() {
    return this._selectedModel || null;
  }

  // --- Cleanup ---

  /**
   * Starts (once) the periodic sweep that deletes sessions idle for longer than
   * SESSION_TIMEOUT_MS. The timer is unref'd so it does not keep the process alive.
   */
  _ensureCleanup() {
    if (this.cleanupTimer) return;
    this.cleanupTimer = setInterval(() => {
      const now = Date.now();
      for (const [id, session] of this.sessions) {
        if (now - session.lastActivity > SESSION_TIMEOUT_MS) {
          this.sessions.delete(id);
          this.logger?.debug('[VisionTool] Session expired', { sessionId: id });
        }
      }
    }, CLEANUP_INTERVAL_MS);
    // Don't prevent process exit
    if (this.cleanupTimer.unref) this.cleanupTimer.unref();
  }

  /**
   * JSON-schema description of the accepted parameters.
   * @returns {object}
   */
  getParameterSchema() {
    return {
      type: 'object',
      required: ['action'],
      properties: {
        action: { type: 'string', enum: this.getSupportedActions() },
        imagePath: { type: 'string', description: 'Path to image file (for analyze)' },
        question: { type: 'string', description: 'Question about the image' },
        sessionId: { type: 'string', description: 'Session ID (for ask/close-session)' }
      }
    };
  }
}
|
|
507
|
-
|
|
508
|
-
export default VisionTool;
|
|
1
|
+
/**
|
|
2
|
+
* Vision Tool — Image analysis for agents
|
|
3
|
+
*
|
|
4
|
+
* Purpose:
|
|
5
|
+
* - Analyze images from disk with natural language questions
|
|
6
|
+
* - Session-based: first call uploads image, subsequent calls reuse it
|
|
7
|
+
* - Uses the best available vision model as ranked by the model catalog (no hardcoded model names)
|
|
8
|
+
* - Returns structured answers only (no filler text)
|
|
9
|
+
*
|
|
10
|
+
* Actions:
|
|
11
|
+
* - analyze: Send an image + question, get a structured answer + session ID
|
|
12
|
+
* - ask: Ask a follow-up question about an image in an existing session
|
|
13
|
+
* - list-sessions: List active vision sessions
|
|
14
|
+
* - close-session: Close a vision session to free memory
|
|
15
|
+
*/
|
|
16
|
+
|
|
17
|
+
import { BaseTool } from './baseTool.js';
|
|
18
|
+
import { promises as fs } from 'fs';
|
|
19
|
+
import path from 'path';
|
|
20
|
+
|
|
21
|
+
// Vision model selection uses catalog tags + recommended_for fields.
|
|
22
|
+
// No hardcoded model names — the catalog determines which models are best for vision.
|
|
23
|
+
|
|
24
|
+
const MAX_IMAGE_SIZE_BYTES = 20 * 1024 * 1024; // 20MB: largest image that _analyze accepts before rejecting with "Image too large"
|
|
25
|
+
const SESSION_TIMEOUT_MS = 30 * 60 * 1000; // 30 minutes: idle time a session may reach before it is considered expired
|
|
26
|
+
const CLEANUP_INTERVAL_MS = 5 * 60 * 1000; // 5 minutes: intended period of the expired-session sweep
|
|
27
|
+
|
|
28
|
+
class VisionTool extends BaseTool {
|
|
29
|
+
constructor(config = {}, logger = null) {
|
|
30
|
+
super(config, logger);
|
|
31
|
+
|
|
32
|
+
this.aiService = null;
|
|
33
|
+
this.modelsService = null;
|
|
34
|
+
this.requiresProject = false;
|
|
35
|
+
this.isAsync = false;
|
|
36
|
+
this.timeout = 120000; // 2 minutes (vision can be slow)
|
|
37
|
+
|
|
38
|
+
// Session storage: sessionId → { imageBase64, mimeType, history, createdAt, lastActivity }
|
|
39
|
+
this.sessions = new Map();
|
|
40
|
+
this.cleanupTimer = null;
|
|
41
|
+
}
|
|
42
|
+
|
|
43
|
+
// --- Dependency Injection ---
|
|
44
|
+
|
|
45
|
+
setAIService(aiService) { this.aiService = aiService; }
|
|
46
|
+
setModelsService(modelsService) { this.modelsService = modelsService; }
|
|
47
|
+
setAgentPool(agentPool) { this.agentPool = agentPool; }
|
|
48
|
+
|
|
49
|
+
getDescription() {
|
|
50
|
+
return `Vision Tool: Analyze images with AI vision models.
|
|
51
|
+
|
|
52
|
+
Send an image file + a question and receive a structured answer. Supports follow-up questions on the same image without re-uploading.
|
|
53
|
+
|
|
54
|
+
ACTIONS:
|
|
55
|
+
|
|
56
|
+
1. ANALYZE — Send image + question (creates a session):
|
|
57
|
+
\`\`\`json
|
|
58
|
+
{ "toolId": "vision", "action": "analyze", "imagePath": "/path/to/image.png", "question": "What objects are in this image?" }
|
|
59
|
+
\`\`\`
|
|
60
|
+
Returns: { answer, sessionId, model }
|
|
61
|
+
|
|
62
|
+
2. ASK — Follow-up question on an existing session:
|
|
63
|
+
\`\`\`json
|
|
64
|
+
{ "toolId": "vision", "action": "ask", "sessionId": "vs-...", "question": "What color is the largest object?" }
|
|
65
|
+
\`\`\`
|
|
66
|
+
Returns: { answer, sessionId, model }
|
|
67
|
+
|
|
68
|
+
3. LIST-SESSIONS — Show active vision sessions:
|
|
69
|
+
\`\`\`json
|
|
70
|
+
{ "toolId": "vision", "action": "list-sessions" }
|
|
71
|
+
\`\`\`
|
|
72
|
+
|
|
73
|
+
4. CLOSE-SESSION — Free a session:
|
|
74
|
+
\`\`\`json
|
|
75
|
+
{ "toolId": "vision", "action": "close-session", "sessionId": "vs-..." }
|
|
76
|
+
\`\`\`
|
|
77
|
+
|
|
78
|
+
SUPPORTED FORMATS: JPEG, PNG, GIF, WebP, BMP (max 20MB)
|
|
79
|
+
MODEL: Automatically selects the best available vision model (prefers Anthropic Sonnet/Opus).
|
|
80
|
+
ANSWERS: Structured, direct answers only — no filler text.`;
|
|
81
|
+
}
|
|
82
|
+
|
|
83
|
+
parseParameters(content) {
|
|
84
|
+
return content;
|
|
85
|
+
}
|
|
86
|
+
|
|
87
|
+
getRequiredParameters() {
|
|
88
|
+
return ['action'];
|
|
89
|
+
}
|
|
90
|
+
|
|
91
|
+
getSupportedActions() {
|
|
92
|
+
return ['analyze', 'ask', 'list-sessions', 'close-session'];
|
|
93
|
+
}
|
|
94
|
+
|
|
95
|
+
validateParameterTypes(params) {
|
|
96
|
+
const errors = [];
|
|
97
|
+
if (params.action && typeof params.action !== 'string') errors.push('action must be a string');
|
|
98
|
+
if (params.imagePath !== undefined && typeof params.imagePath !== 'string') errors.push('imagePath must be a string');
|
|
99
|
+
if (params.question !== undefined && typeof params.question !== 'string') errors.push('question must be a string');
|
|
100
|
+
if (params.sessionId !== undefined && typeof params.sessionId !== 'string') errors.push('sessionId must be a string');
|
|
101
|
+
return errors;
|
|
102
|
+
}
|
|
103
|
+
|
|
104
|
+
customValidateParameters(params) {
|
|
105
|
+
const errors = [];
|
|
106
|
+
const validActions = this.getSupportedActions();
|
|
107
|
+
if (!validActions.includes(params.action)) {
|
|
108
|
+
errors.push(`Invalid action: "${params.action}". Valid: ${validActions.join(', ')}`);
|
|
109
|
+
return errors;
|
|
110
|
+
}
|
|
111
|
+
if (params.action === 'analyze') {
|
|
112
|
+
if (!params.imagePath) errors.push('"imagePath" is required for analyze');
|
|
113
|
+
if (!params.question) errors.push('"question" is required for analyze');
|
|
114
|
+
}
|
|
115
|
+
if (params.action === 'ask') {
|
|
116
|
+
if (!params.sessionId) errors.push('"sessionId" is required for ask');
|
|
117
|
+
if (!params.question) errors.push('"question" is required for ask');
|
|
118
|
+
}
|
|
119
|
+
if (params.action === 'close-session') {
|
|
120
|
+
if (!params.sessionId) errors.push('"sessionId" is required for close-session');
|
|
121
|
+
}
|
|
122
|
+
return errors;
|
|
123
|
+
}
|
|
124
|
+
|
|
125
|
+
async execute(params, context = {}) {
|
|
126
|
+
// Reverse-forgiveness: accept plural envelope {actions:[{type/action}]}
|
|
127
|
+
// even though this tool's canonical shape is singular.
|
|
128
|
+
if (Array.isArray(params?.actions) && params.actions.length > 0) {
|
|
129
|
+
const a = params.actions[0] || {};
|
|
130
|
+
params = { ...params, ...a, action: a.type || a.action || params.action };
|
|
131
|
+
}
|
|
132
|
+
|
|
133
|
+
this._ensureCleanup();
|
|
134
|
+
|
|
135
|
+
try {
|
|
136
|
+
switch (params.action) {
|
|
137
|
+
case 'analyze':
|
|
138
|
+
return await this._analyze(params.imagePath, params.question, context);
|
|
139
|
+
case 'ask':
|
|
140
|
+
return await this._ask(params.sessionId, params.question, context);
|
|
141
|
+
case 'list-sessions':
|
|
142
|
+
return this._listSessions();
|
|
143
|
+
case 'close-session':
|
|
144
|
+
return this._closeSession(params.sessionId);
|
|
145
|
+
default:
|
|
146
|
+
return { success: false, error: `Unknown action: ${params.action}` };
|
|
147
|
+
}
|
|
148
|
+
} catch (error) {
|
|
149
|
+
return { success: false, error: error.message };
|
|
150
|
+
}
|
|
151
|
+
}
|
|
152
|
+
|
|
153
|
+
// --- Core Actions ---
|
|
154
|
+
|
|
155
|
+
_resolveImagePath(imagePath, context) {
|
|
156
|
+
// Resolve relative to agent's working directory (synced with terminal/filesystem tools)
|
|
157
|
+
if (path.isAbsolute(imagePath)) return imagePath;
|
|
158
|
+
const workingDir = context.directoryAccess?.workingDirectory || context.projectDir || process.cwd();
|
|
159
|
+
return path.resolve(workingDir, imagePath);
|
|
160
|
+
}
|
|
161
|
+
|
|
162
|
+
async _analyze(imagePath, question, context) {
|
|
163
|
+
// Read and validate image — resolve relative to agent's working directory
|
|
164
|
+
const resolvedPath = this._resolveImagePath(imagePath, context);
|
|
165
|
+
let imageBuffer;
|
|
166
|
+
try {
|
|
167
|
+
imageBuffer = await fs.readFile(resolvedPath);
|
|
168
|
+
} catch {
|
|
169
|
+
throw new Error(`Image not found: ${imagePath}`);
|
|
170
|
+
}
|
|
171
|
+
|
|
172
|
+
if (imageBuffer.length > MAX_IMAGE_SIZE_BYTES) {
|
|
173
|
+
throw new Error(`Image too large (${(imageBuffer.length / 1024 / 1024).toFixed(1)}MB). Max: ${MAX_IMAGE_SIZE_BYTES / 1024 / 1024}MB`);
|
|
174
|
+
}
|
|
175
|
+
|
|
176
|
+
const ext = path.extname(resolvedPath).toLowerCase();
|
|
177
|
+
const mimeMap = { '.jpg': 'image/jpeg', '.jpeg': 'image/jpeg', '.png': 'image/png', '.gif': 'image/gif', '.webp': 'image/webp', '.bmp': 'image/bmp' };
|
|
178
|
+
const mimeType = mimeMap[ext];
|
|
179
|
+
if (!mimeType) {
|
|
180
|
+
throw new Error(`Unsupported image format: ${ext}. Supported: ${Object.keys(mimeMap).join(', ')}`);
|
|
181
|
+
}
|
|
182
|
+
|
|
183
|
+
const imageBase64 = imageBuffer.toString('base64');
|
|
184
|
+
|
|
185
|
+
// Create session
|
|
186
|
+
const sessionId = `vs-${Date.now()}-${Math.random().toString(36).substr(2, 6)}`;
|
|
187
|
+
this.sessions.set(sessionId, {
|
|
188
|
+
imageBase64,
|
|
189
|
+
mimeType,
|
|
190
|
+
imagePath: resolvedPath,
|
|
191
|
+
history: [],
|
|
192
|
+
createdAt: Date.now(),
|
|
193
|
+
lastActivity: Date.now()
|
|
194
|
+
});
|
|
195
|
+
|
|
196
|
+
// Send to vision model
|
|
197
|
+
const answer = await this._sendVisionRequest(imageBase64, mimeType, question, [], context);
|
|
198
|
+
|
|
199
|
+
// Store in history
|
|
200
|
+
this.sessions.get(sessionId).history.push(
|
|
201
|
+
{ role: 'user', content: question },
|
|
202
|
+
{ role: 'assistant', content: answer }
|
|
203
|
+
);
|
|
204
|
+
|
|
205
|
+
return {
|
|
206
|
+
success: true,
|
|
207
|
+
result: {
|
|
208
|
+
answer,
|
|
209
|
+
sessionId,
|
|
210
|
+
model: this._getSelectedModel(),
|
|
211
|
+
imagePath: resolvedPath
|
|
212
|
+
}
|
|
213
|
+
};
|
|
214
|
+
}
|
|
215
|
+
|
|
216
|
+
async _ask(sessionId, question, context) {
|
|
217
|
+
const session = this.sessions.get(sessionId);
|
|
218
|
+
if (!session) {
|
|
219
|
+
throw new Error(`Vision session not found: ${sessionId}. Use "analyze" to start a new session.`);
|
|
220
|
+
}
|
|
221
|
+
|
|
222
|
+
session.lastActivity = Date.now();
|
|
223
|
+
|
|
224
|
+
// Send with conversation history
|
|
225
|
+
const answer = await this._sendVisionRequest(
|
|
226
|
+
session.imageBase64,
|
|
227
|
+
session.mimeType,
|
|
228
|
+
question,
|
|
229
|
+
session.history,
|
|
230
|
+
context
|
|
231
|
+
);
|
|
232
|
+
|
|
233
|
+
// Append to history
|
|
234
|
+
session.history.push(
|
|
235
|
+
{ role: 'user', content: question },
|
|
236
|
+
{ role: 'assistant', content: answer }
|
|
237
|
+
);
|
|
238
|
+
|
|
239
|
+
return {
|
|
240
|
+
success: true,
|
|
241
|
+
result: {
|
|
242
|
+
answer,
|
|
243
|
+
sessionId,
|
|
244
|
+
model: this._getSelectedModel(),
|
|
245
|
+
questionsInSession: session.history.filter(h => h.role === 'user').length
|
|
246
|
+
}
|
|
247
|
+
};
|
|
248
|
+
}
|
|
249
|
+
|
|
250
|
+
_listSessions() {
|
|
251
|
+
const sessions = [];
|
|
252
|
+
for (const [id, session] of this.sessions) {
|
|
253
|
+
sessions.push({
|
|
254
|
+
sessionId: id,
|
|
255
|
+
imagePath: session.imagePath,
|
|
256
|
+
questionsAsked: session.history.filter(h => h.role === 'user').length,
|
|
257
|
+
createdAt: new Date(session.createdAt).toISOString(),
|
|
258
|
+
lastActivity: new Date(session.lastActivity).toISOString()
|
|
259
|
+
});
|
|
260
|
+
}
|
|
261
|
+
return { success: true, result: { sessions, count: sessions.length } };
|
|
262
|
+
}
|
|
263
|
+
|
|
264
|
+
_closeSession(sessionId) {
|
|
265
|
+
if (!this.sessions.has(sessionId)) {
|
|
266
|
+
return { success: false, error: `Session not found: ${sessionId}` };
|
|
267
|
+
}
|
|
268
|
+
this.sessions.delete(sessionId);
|
|
269
|
+
return { success: true, result: { closed: sessionId } };
|
|
270
|
+
}
|
|
271
|
+
|
|
272
|
+
// --- Vision API ---
|
|
273
|
+
|
|
274
|
+
async _sendVisionRequest(imageBase64, mimeType, question, history, context) {
|
|
275
|
+
if (!this.aiService) {
|
|
276
|
+
throw new Error('AI service not available. Vision tool requires aiService dependency.');
|
|
277
|
+
}
|
|
278
|
+
|
|
279
|
+
const model = this._selectVisionModel(context);
|
|
280
|
+
if (!model) {
|
|
281
|
+
throw new Error('No vision-capable model available. Ensure at least one model with vision support is configured.');
|
|
282
|
+
}
|
|
283
|
+
|
|
284
|
+
this.logger?.info('[VisionTool] Selected vision model', { model, visionModelsAvailable: this._getVisionModels().map(m => m.name) });
|
|
285
|
+
|
|
286
|
+
const systemPrompt = 'You are a precise image analysis assistant. Answer the question about the image directly and concisely. Provide only the answer — no preamble, no filler, no commentary. If the image contains text, transcribe it accurately. If asked about objects, list them clearly. Structure your response for programmatic consumption.';
|
|
287
|
+
|
|
288
|
+
// Build messages with image
|
|
289
|
+
const messages = [];
|
|
290
|
+
|
|
291
|
+
// System prompt
|
|
292
|
+
messages.push({ role: 'system', content: systemPrompt });
|
|
293
|
+
|
|
294
|
+
// First message includes the image
|
|
295
|
+
const imageContent = [
|
|
296
|
+
{ type: 'image_url', image_url: { url: `data:${mimeType};base64,${imageBase64}` } },
|
|
297
|
+
{ type: 'text', text: history.length === 0 ? question : history[0].content }
|
|
298
|
+
];
|
|
299
|
+
messages.push({ role: 'user', content: imageContent });
|
|
300
|
+
|
|
301
|
+
// Add conversation history (skip first user message, already included with image)
|
|
302
|
+
for (let i = 1; i < history.length; i++) {
|
|
303
|
+
const h = history[i];
|
|
304
|
+
messages.push({ role: h.role, content: h.content });
|
|
305
|
+
}
|
|
306
|
+
|
|
307
|
+
// Add current question (if there's history, this is a follow-up)
|
|
308
|
+
if (history.length > 0) {
|
|
309
|
+
messages.push({ role: 'user', content: question });
|
|
310
|
+
}
|
|
311
|
+
|
|
312
|
+
// Primary: send through chat completions with multimodal content
|
|
313
|
+
// This works with all vision models via the /chat/completions endpoint
|
|
314
|
+
try {
|
|
315
|
+
const response = await this._callChatCompletionsWithImage(imageBase64, mimeType, question, history, model, systemPrompt, context);
|
|
316
|
+
return response;
|
|
317
|
+
} catch (chatError) {
|
|
318
|
+
this.logger?.warn('[VisionTool] Chat completions with image failed, trying /llm/vision endpoint', { error: chatError.message });
|
|
319
|
+
}
|
|
320
|
+
|
|
321
|
+
// Fallback: dedicated /llm/vision endpoint (supports fewer models)
|
|
322
|
+
try {
|
|
323
|
+
const response = await this._callVisionEndpoint(imageBase64, question, model, context);
|
|
324
|
+
return response;
|
|
325
|
+
} catch (visionError) {
|
|
326
|
+
throw new Error(`Vision analysis failed: ${visionError.message}`, { cause: visionError });
|
|
327
|
+
}
|
|
328
|
+
}
|
|
329
|
+
|
|
330
|
+
async _callChatCompletionsWithImage(imageBase64, mimeType, question, history, model, systemPrompt, context) {
|
|
331
|
+
const backendUrl = this.aiService?.backendUrl || 'https://loxia-api-g7hrb8bxdae8a2h7.z02.azurefd.net';
|
|
332
|
+
const sessionId = context.sessionId;
|
|
333
|
+
|
|
334
|
+
let apiKey = null;
|
|
335
|
+
if (this.aiService?.apiKeyManager) {
|
|
336
|
+
const keys = this.aiService.apiKeyManager.getKeysForRequest(sessionId, { platformProvided: true });
|
|
337
|
+
apiKey = keys.loxiaApiKey;
|
|
338
|
+
}
|
|
339
|
+
|
|
340
|
+
// Build messages array with image in the first user message
|
|
341
|
+
const messages = [];
|
|
342
|
+
|
|
343
|
+
// First user message includes the image
|
|
344
|
+
// Format image for the selected model's provider
|
|
345
|
+
const isAnthropic = model.toLowerCase().includes('claude') || model.toLowerCase().includes('anthropic');
|
|
346
|
+
const imageBlock = isAnthropic
|
|
347
|
+
? { type: 'image', source: { type: 'base64', media_type: mimeType, data: imageBase64 } }
|
|
348
|
+
: { type: 'image_url', image_url: { url: `data:${mimeType};base64,${imageBase64}` } };
|
|
349
|
+
|
|
350
|
+
const firstQuestion = history.length > 0 ? history[0].content : question;
|
|
351
|
+
messages.push({
|
|
352
|
+
role: 'user',
|
|
353
|
+
content: [
|
|
354
|
+
imageBlock,
|
|
355
|
+
{ type: 'text', text: firstQuestion }
|
|
356
|
+
]
|
|
357
|
+
});
|
|
358
|
+
|
|
359
|
+
// Add conversation history (skip first user message, already included)
|
|
360
|
+
for (let i = 1; i < history.length; i++) {
|
|
361
|
+
messages.push({ role: history[i].role, content: history[i].content });
|
|
362
|
+
}
|
|
363
|
+
|
|
364
|
+
// Add current question if this is a follow-up
|
|
365
|
+
if (history.length > 0) {
|
|
366
|
+
messages.push({ role: 'user', content: question });
|
|
367
|
+
}
|
|
368
|
+
|
|
369
|
+
// Build payload matching the /llm/chat endpoint format
|
|
370
|
+
const firstUserContent = messages[0]?.content;
|
|
371
|
+
const messageText = Array.isArray(firstUserContent)
|
|
372
|
+
? firstUserContent.find(c => c.type === 'text')?.text || question
|
|
373
|
+
: question;
|
|
374
|
+
|
|
375
|
+
const payload = {
|
|
376
|
+
model,
|
|
377
|
+
message: messageText,
|
|
378
|
+
systemPrompt,
|
|
379
|
+
messages, // Multimodal messages array
|
|
380
|
+
options: {
|
|
381
|
+
max_tokens: 2048,
|
|
382
|
+
temperature: 0.1
|
|
383
|
+
},
|
|
384
|
+
metadata: {
|
|
385
|
+
requestId: `vision-${Date.now()}`,
|
|
386
|
+
agentId: context.agentId
|
|
387
|
+
}
|
|
388
|
+
};
|
|
389
|
+
|
|
390
|
+
const response = await fetch(`${backendUrl}/llm/chat`, {
|
|
391
|
+
method: 'POST',
|
|
392
|
+
headers: {
|
|
393
|
+
'Content-Type': 'application/json',
|
|
394
|
+
...(apiKey && { 'Authorization': `Bearer ${apiKey}` })
|
|
395
|
+
},
|
|
396
|
+
body: JSON.stringify(payload),
|
|
397
|
+
signal: AbortSignal.timeout(120000)
|
|
398
|
+
});
|
|
399
|
+
|
|
400
|
+
if (!response.ok) {
|
|
401
|
+
const errorData = await response.json().catch(() => ({}));
|
|
402
|
+
throw new Error(errorData.error?.message || errorData.error || `Chat completions returned ${response.status}`);
|
|
403
|
+
}
|
|
404
|
+
|
|
405
|
+
const data = await response.json();
|
|
406
|
+
return data.content || data.choices?.[0]?.message?.content || '';
|
|
407
|
+
}
|
|
408
|
+
|
|
409
|
+
async _callVisionEndpoint(imageBase64, prompt, model, context) {
|
|
410
|
+
// Call the backend /llm/vision endpoint directly
|
|
411
|
+
const backendUrl = this.aiService?.backendUrl || 'https://loxia-api-g7hrb8bxdae8a2h7.z02.azurefd.net';
|
|
412
|
+
const sessionId = context.sessionId;
|
|
413
|
+
|
|
414
|
+
// Get API key
|
|
415
|
+
let apiKey = null;
|
|
416
|
+
if (this.aiService?.apiKeyManager) {
|
|
417
|
+
const keys = this.aiService.apiKeyManager.getKeysForRequest(sessionId, { platformProvided: true });
|
|
418
|
+
apiKey = keys.loxiaApiKey;
|
|
419
|
+
}
|
|
420
|
+
|
|
421
|
+
const response = await fetch(`${backendUrl}/llm/vision`, {
|
|
422
|
+
method: 'POST',
|
|
423
|
+
headers: {
|
|
424
|
+
'Content-Type': 'application/json',
|
|
425
|
+
...(apiKey && { 'Authorization': `Bearer ${apiKey}` })
|
|
426
|
+
},
|
|
427
|
+
body: JSON.stringify({ image: imageBase64, prompt, model, metadata: {} }),
|
|
428
|
+
signal: AbortSignal.timeout(120000)
|
|
429
|
+
});
|
|
430
|
+
|
|
431
|
+
if (!response.ok) {
|
|
432
|
+
const errorData = await response.json().catch(() => ({}));
|
|
433
|
+
throw new Error(errorData.error || `Vision API returned ${response.status}`);
|
|
434
|
+
}
|
|
435
|
+
|
|
436
|
+
const data = await response.json();
|
|
437
|
+
return data.content || '';
|
|
438
|
+
}
|
|
439
|
+
|
|
440
|
+
_selectVisionModel(context = {}) {
|
|
441
|
+
const visionModels = this._getVisionModels();
|
|
442
|
+
if (visionModels.length === 0) {
|
|
443
|
+
this.logger?.warn('[VisionTool] No vision-capable model found in model list');
|
|
444
|
+
return null;
|
|
445
|
+
}
|
|
446
|
+
|
|
447
|
+
// 1. Model explicitly recommended for vision (from catalog)
|
|
448
|
+
const recommended = visionModels.find(m => m.recommended_for?.includes('vision'));
|
|
449
|
+
if (recommended) { this._selectedModel = recommended.name; return this._selectedModel; }
|
|
450
|
+
|
|
451
|
+
// 2. Vision model with budget tier (best cost/quality)
|
|
452
|
+
const budgetVision = visionModels.find(m => m.tier === 'budget');
|
|
453
|
+
if (budgetVision) { this._selectedModel = budgetVision.name; return this._selectedModel; }
|
|
454
|
+
|
|
455
|
+
// 3. Agent's current model if it has vision capability
|
|
456
|
+
const agentModel = context.currentModel;
|
|
457
|
+
if (agentModel && visionModels.some(m => m.name === agentModel)) {
|
|
458
|
+
this._selectedModel = agentModel;
|
|
459
|
+
return this._selectedModel;
|
|
460
|
+
}
|
|
461
|
+
|
|
462
|
+
// 4. First available vision model
|
|
463
|
+
this._selectedModel = visionModels[0].name;
|
|
464
|
+
return this._selectedModel;
|
|
465
|
+
}
|
|
466
|
+
|
|
467
|
+
_getVisionModels() {
|
|
468
|
+
if (!this.modelsService) return [];
|
|
469
|
+
const allModels = this.modelsService.getModels?.() || [];
|
|
470
|
+
return allModels.filter(m => m.supportsVision === true);
|
|
471
|
+
}
|
|
472
|
+
|
|
473
|
+
_getSelectedModel() {
|
|
474
|
+
return this._selectedModel || null;
|
|
475
|
+
}
|
|
476
|
+
|
|
477
|
+
// --- Cleanup ---
|
|
478
|
+
|
|
479
|
+
_ensureCleanup() {
|
|
480
|
+
if (this.cleanupTimer) return;
|
|
481
|
+
this.cleanupTimer = setInterval(() => {
|
|
482
|
+
const now = Date.now();
|
|
483
|
+
for (const [id, session] of this.sessions) {
|
|
484
|
+
if (now - session.lastActivity > SESSION_TIMEOUT_MS) {
|
|
485
|
+
this.sessions.delete(id);
|
|
486
|
+
this.logger?.debug('[VisionTool] Session expired', { sessionId: id });
|
|
487
|
+
}
|
|
488
|
+
}
|
|
489
|
+
}, CLEANUP_INTERVAL_MS);
|
|
490
|
+
// Don't prevent process exit
|
|
491
|
+
if (this.cleanupTimer.unref) this.cleanupTimer.unref();
|
|
492
|
+
}
|
|
493
|
+
|
|
494
|
+
getParameterSchema() {
|
|
495
|
+
return {
|
|
496
|
+
type: 'object',
|
|
497
|
+
required: ['action'],
|
|
498
|
+
properties: {
|
|
499
|
+
action: { type: 'string', enum: ['analyze', 'ask', 'list-sessions', 'close-session'] },
|
|
500
|
+
imagePath: { type: 'string', description: 'Path to image file (for analyze)' },
|
|
501
|
+
question: { type: 'string', description: 'Question about the image' },
|
|
502
|
+
sessionId: { type: 'string', description: 'Session ID (for ask/close-session)' }
|
|
503
|
+
}
|
|
504
|
+
};
|
|
505
|
+
}
|
|
506
|
+
}
|
|
507
|
+
|
|
508
|
+
export default VisionTool;
|