@agile-vibe-coding/avc 0.1.1 → 0.3.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (239)
  1. package/cli/agent-loader.js +21 -0
  2. package/cli/agents/agent-selector.md +152 -0
  3. package/cli/agents/architecture-recommender.md +418 -0
  4. package/cli/agents/code-implementer.md +117 -0
  5. package/cli/agents/code-validator.md +80 -0
  6. package/cli/agents/context-reviewer-epic.md +101 -0
  7. package/cli/agents/context-reviewer-story.md +92 -0
  8. package/cli/agents/context-writer-epic.md +145 -0
  9. package/cli/agents/context-writer-story.md +111 -0
  10. package/cli/agents/database-deep-dive.md +470 -0
  11. package/cli/agents/database-recommender.md +634 -0
  12. package/cli/agents/doc-distributor.md +176 -0
  13. package/cli/agents/doc-writer-epic.md +42 -0
  14. package/cli/agents/doc-writer-story.md +43 -0
  15. package/cli/agents/documentation-updater.md +203 -0
  16. package/cli/agents/duplicate-detector.md +110 -0
  17. package/cli/agents/epic-story-decomposer.md +559 -0
  18. package/cli/agents/feature-context-generator.md +91 -0
  19. package/cli/agents/gap-checker-epic.md +52 -0
  20. package/cli/agents/impact-checker-story.md +51 -0
  21. package/cli/agents/migration-guide-generator.md +305 -0
  22. package/cli/agents/mission-scope-generator.md +143 -0
  23. package/cli/agents/mission-scope-validator.md +146 -0
  24. package/cli/agents/project-context-extractor.md +122 -0
  25. package/cli/agents/project-documentation-creator.json +226 -0
  26. package/cli/agents/project-documentation-creator.md +595 -0
  27. package/cli/agents/question-prefiller.md +269 -0
  28. package/cli/agents/refiner-epic.md +39 -0
  29. package/cli/agents/refiner-story.md +42 -0
  30. package/cli/agents/scaffolding-generator.md +99 -0
  31. package/cli/agents/seed-validator.md +71 -0
  32. package/cli/agents/story-doc-enricher.md +133 -0
  33. package/cli/agents/story-scope-reviewer.md +147 -0
  34. package/cli/agents/story-splitter.md +83 -0
  35. package/cli/agents/suggestion-business-analyst.md +88 -0
  36. package/cli/agents/suggestion-deployment-architect.md +263 -0
  37. package/cli/agents/suggestion-product-manager.md +129 -0
  38. package/cli/agents/suggestion-security-specialist.md +156 -0
  39. package/cli/agents/suggestion-technical-architect.md +269 -0
  40. package/cli/agents/suggestion-ux-researcher.md +93 -0
  41. package/cli/agents/task-subtask-decomposer.md +188 -0
  42. package/cli/agents/validator-documentation.json +183 -0
  43. package/cli/agents/validator-documentation.md +455 -0
  44. package/cli/agents/validator-selector.md +211 -0
  45. package/cli/ansi-colors.js +21 -0
  46. package/cli/api-reference-tool.js +368 -0
  47. package/cli/build-docs.js +29 -8
  48. package/cli/ceremony-history.js +369 -0
  49. package/cli/checks/catalog.json +76 -0
  50. package/cli/checks/code/quality.json +26 -0
  51. package/cli/checks/code/testing.json +14 -0
  52. package/cli/checks/code/traceability.json +26 -0
  53. package/cli/checks/cross-refs/epic.json +171 -0
  54. package/cli/checks/cross-refs/story.json +149 -0
  55. package/cli/checks/epic/api.json +114 -0
  56. package/cli/checks/epic/backend.json +126 -0
  57. package/cli/checks/epic/cloud.json +126 -0
  58. package/cli/checks/epic/data.json +102 -0
  59. package/cli/checks/epic/database.json +114 -0
  60. package/cli/checks/epic/developer.json +182 -0
  61. package/cli/checks/epic/devops.json +174 -0
  62. package/cli/checks/epic/frontend.json +162 -0
  63. package/cli/checks/epic/mobile.json +102 -0
  64. package/cli/checks/epic/qa.json +90 -0
  65. package/cli/checks/epic/security.json +184 -0
  66. package/cli/checks/epic/solution-architect.json +192 -0
  67. package/cli/checks/epic/test-architect.json +90 -0
  68. package/cli/checks/epic/ui.json +102 -0
  69. package/cli/checks/epic/ux.json +90 -0
  70. package/cli/checks/fixes/epic-fix-template.md +10 -0
  71. package/cli/checks/fixes/story-fix-template.md +10 -0
  72. package/cli/checks/story/api.json +186 -0
  73. package/cli/checks/story/backend.json +102 -0
  74. package/cli/checks/story/cloud.json +102 -0
  75. package/cli/checks/story/data.json +210 -0
  76. package/cli/checks/story/database.json +102 -0
  77. package/cli/checks/story/developer.json +168 -0
  78. package/cli/checks/story/devops.json +102 -0
  79. package/cli/checks/story/frontend.json +174 -0
  80. package/cli/checks/story/mobile.json +102 -0
  81. package/cli/checks/story/qa.json +210 -0
  82. package/cli/checks/story/security.json +198 -0
  83. package/cli/checks/story/solution-architect.json +230 -0
  84. package/cli/checks/story/test-architect.json +210 -0
  85. package/cli/checks/story/ui.json +102 -0
  86. package/cli/checks/story/ux.json +102 -0
  87. package/cli/coding-order.js +401 -0
  88. package/cli/command-logger.js +49 -12
  89. package/cli/components/static-output.js +63 -0
  90. package/cli/console-output-manager.js +94 -0
  91. package/cli/dependency-checker.js +72 -0
  92. package/cli/docs-sync.js +306 -0
  93. package/cli/epic-story-validator.js +659 -0
  94. package/cli/evaluation-prompts.js +1008 -0
  95. package/cli/execution-context.js +195 -0
  96. package/cli/generate-summary-table.js +340 -0
  97. package/cli/init-model-config.js +704 -0
  98. package/cli/init.js +1737 -278
  99. package/cli/kanban-server-manager.js +227 -0
  100. package/cli/llm-claude.js +150 -1
  101. package/cli/llm-gemini.js +109 -0
  102. package/cli/llm-local.js +493 -0
  103. package/cli/llm-mock.js +233 -0
  104. package/cli/llm-openai.js +454 -0
  105. package/cli/llm-provider.js +379 -3
  106. package/cli/llm-token-limits.js +211 -0
  107. package/cli/llm-verifier.js +662 -0
  108. package/cli/llm-xiaomi.js +143 -0
  109. package/cli/message-constants.js +49 -0
  110. package/cli/message-manager.js +334 -0
  111. package/cli/message-types.js +96 -0
  112. package/cli/messaging-api.js +291 -0
  113. package/cli/micro-check-fixer.js +335 -0
  114. package/cli/micro-check-runner.js +449 -0
  115. package/cli/micro-check-scorer.js +148 -0
  116. package/cli/micro-check-validator.js +538 -0
  117. package/cli/model-pricing.js +192 -0
  118. package/cli/model-query-engine.js +468 -0
  119. package/cli/model-recommendation-analyzer.js +495 -0
  120. package/cli/model-selector.js +270 -0
  121. package/cli/output-buffer.js +107 -0
  122. package/cli/process-manager.js +73 -2
  123. package/cli/prompt-logger.js +57 -0
  124. package/cli/repl-ink.js +4625 -1094
  125. package/cli/repl-old.js +3 -4
  126. package/cli/seed-processor.js +962 -0
  127. package/cli/sprint-planning-processor.js +4162 -0
  128. package/cli/template-processor.js +2149 -105
  129. package/cli/templates/project.md +25 -8
  130. package/cli/templates/vitepress-config.mts.template +5 -4
  131. package/cli/token-tracker.js +547 -0
  132. package/cli/tools/generate-story-validators.js +317 -0
  133. package/cli/tools/generate-validators.js +669 -0
  134. package/cli/update-checker.js +19 -17
  135. package/cli/update-notifier.js +4 -4
  136. package/cli/validation-router.js +667 -0
  137. package/cli/verification-tracker.js +563 -0
  138. package/cli/worktree-runner.js +654 -0
  139. package/kanban/README.md +386 -0
  140. package/kanban/client/README.md +205 -0
  141. package/kanban/client/components.json +20 -0
  142. package/kanban/client/dist/assets/index-D_KC5EQT.css +1 -0
  143. package/kanban/client/dist/assets/index-DjY5zqW7.js +351 -0
  144. package/kanban/client/dist/index.html +16 -0
  145. package/kanban/client/dist/vite.svg +1 -0
  146. package/kanban/client/index.html +15 -0
  147. package/kanban/client/package-lock.json +9442 -0
  148. package/kanban/client/package.json +44 -0
  149. package/kanban/client/postcss.config.js +6 -0
  150. package/kanban/client/public/vite.svg +1 -0
  151. package/kanban/client/src/App.jsx +651 -0
  152. package/kanban/client/src/components/ProjectFileEditorPopup.jsx +117 -0
  153. package/kanban/client/src/components/ceremony/AskArchPopup.jsx +420 -0
  154. package/kanban/client/src/components/ceremony/AskModelPopup.jsx +629 -0
  155. package/kanban/client/src/components/ceremony/CeremonyWorkflowModal.jsx +1133 -0
  156. package/kanban/client/src/components/ceremony/EpicStorySelectionModal.jsx +254 -0
  157. package/kanban/client/src/components/ceremony/ProviderSwitcherButton.jsx +290 -0
  158. package/kanban/client/src/components/ceremony/SponsorCallModal.jsx +686 -0
  159. package/kanban/client/src/components/ceremony/SprintPlanningModal.jsx +838 -0
  160. package/kanban/client/src/components/ceremony/steps/ArchitectureStep.jsx +150 -0
  161. package/kanban/client/src/components/ceremony/steps/CompleteStep.jsx +136 -0
  162. package/kanban/client/src/components/ceremony/steps/DatabaseStep.jsx +202 -0
  163. package/kanban/client/src/components/ceremony/steps/DeploymentStep.jsx +123 -0
  164. package/kanban/client/src/components/ceremony/steps/MissionStep.jsx +106 -0
  165. package/kanban/client/src/components/ceremony/steps/ReviewAnswersStep.jsx +329 -0
  166. package/kanban/client/src/components/ceremony/steps/RunningStep.jsx +249 -0
  167. package/kanban/client/src/components/kanban/CardDetailModal.jsx +646 -0
  168. package/kanban/client/src/components/kanban/EpicSection.jsx +146 -0
  169. package/kanban/client/src/components/kanban/FilterToolbar.jsx +222 -0
  170. package/kanban/client/src/components/kanban/GroupingSelector.jsx +63 -0
  171. package/kanban/client/src/components/kanban/KanbanBoard.jsx +211 -0
  172. package/kanban/client/src/components/kanban/KanbanCard.jsx +147 -0
  173. package/kanban/client/src/components/kanban/KanbanColumn.jsx +90 -0
  174. package/kanban/client/src/components/kanban/RefineWorkItemPopup.jsx +784 -0
  175. package/kanban/client/src/components/kanban/RunButton.jsx +162 -0
  176. package/kanban/client/src/components/kanban/SeedButton.jsx +176 -0
  177. package/kanban/client/src/components/layout/LoadingScreen.jsx +82 -0
  178. package/kanban/client/src/components/process/ProcessMonitorBar.jsx +80 -0
  179. package/kanban/client/src/components/settings/AgentEditorPopup.jsx +171 -0
  180. package/kanban/client/src/components/settings/AgentsTab.jsx +381 -0
  181. package/kanban/client/src/components/settings/ApiKeysTab.jsx +142 -0
  182. package/kanban/client/src/components/settings/CeremonyModelsTab.jsx +105 -0
  183. package/kanban/client/src/components/settings/CheckEditorPopup.jsx +507 -0
  184. package/kanban/client/src/components/settings/CostThresholdsTab.jsx +95 -0
  185. package/kanban/client/src/components/settings/ModelPricingTab.jsx +269 -0
  186. package/kanban/client/src/components/settings/OpenAIAuthSection.jsx +412 -0
  187. package/kanban/client/src/components/settings/ServersTab.jsx +121 -0
  188. package/kanban/client/src/components/settings/SettingsModal.jsx +84 -0
  189. package/kanban/client/src/components/stats/CostModal.jsx +384 -0
  190. package/kanban/client/src/components/ui/badge.jsx +27 -0
  191. package/kanban/client/src/components/ui/dialog.jsx +121 -0
  192. package/kanban/client/src/components/ui/tabs.jsx +85 -0
  193. package/kanban/client/src/hooks/__tests__/useGrouping.test.js +232 -0
  194. package/kanban/client/src/hooks/useGrouping.js +177 -0
  195. package/kanban/client/src/hooks/useWebSocket.js +120 -0
  196. package/kanban/client/src/lib/__tests__/api.test.js +196 -0
  197. package/kanban/client/src/lib/__tests__/status-grouping.test.js +94 -0
  198. package/kanban/client/src/lib/api.js +515 -0
  199. package/kanban/client/src/lib/status-grouping.js +154 -0
  200. package/kanban/client/src/lib/utils.js +11 -0
  201. package/kanban/client/src/main.jsx +10 -0
  202. package/kanban/client/src/store/__tests__/kanbanStore.test.js +164 -0
  203. package/kanban/client/src/store/ceremonyStore.js +172 -0
  204. package/kanban/client/src/store/filterStore.js +201 -0
  205. package/kanban/client/src/store/kanbanStore.js +123 -0
  206. package/kanban/client/src/store/processStore.js +65 -0
  207. package/kanban/client/src/store/sprintPlanningStore.js +33 -0
  208. package/kanban/client/src/styles/globals.css +59 -0
  209. package/kanban/client/tailwind.config.js +77 -0
  210. package/kanban/client/vite.config.js +28 -0
  211. package/kanban/client/vitest.config.js +28 -0
  212. package/kanban/dev-start.sh +47 -0
  213. package/kanban/package.json +12 -0
  214. package/kanban/server/index.js +537 -0
  215. package/kanban/server/routes/ceremony.js +454 -0
  216. package/kanban/server/routes/costs.js +163 -0
  217. package/kanban/server/routes/openai-oauth.js +366 -0
  218. package/kanban/server/routes/processes.js +50 -0
  219. package/kanban/server/routes/settings.js +736 -0
  220. package/kanban/server/routes/websocket.js +281 -0
  221. package/kanban/server/routes/work-items.js +487 -0
  222. package/kanban/server/services/CeremonyService.js +1441 -0
  223. package/kanban/server/services/FileSystemScanner.js +95 -0
  224. package/kanban/server/services/FileWatcher.js +144 -0
  225. package/kanban/server/services/HierarchyBuilder.js +196 -0
  226. package/kanban/server/services/ProcessRegistry.js +122 -0
  227. package/kanban/server/services/TaskRunnerService.js +261 -0
  228. package/kanban/server/services/WorkItemReader.js +123 -0
  229. package/kanban/server/services/WorkItemRefineService.js +510 -0
  230. package/kanban/server/start.js +49 -0
  231. package/kanban/server/utils/kanban-logger.js +132 -0
  232. package/kanban/server/utils/markdown.js +91 -0
  233. package/kanban/server/utils/status-grouping.js +107 -0
  234. package/kanban/server/workers/run-task-worker.js +121 -0
  235. package/kanban/server/workers/seed-worker.js +94 -0
  236. package/kanban/server/workers/sponsor-call-worker.js +92 -0
  237. package/kanban/server/workers/sprint-planning-worker.js +212 -0
  238. package/package.json +19 -7
  239. package/cli/agents/documentation.md +0 -302
@@ -0,0 +1,493 @@
1
+ import OpenAI from 'openai';
2
+ import { jsonrepair } from 'jsonrepair';
3
+ import { LLMProvider } from './llm-provider.js';
4
+
5
+ /**
6
+ * Known local inference servers and their default endpoints.
7
+ * All expose an OpenAI-compatible Chat Completions API.
8
+ */
9
+ const KNOWN_SERVERS = [
10
+ { app: 'lmstudio', url: 'http://localhost:1234/v1', label: 'LM Studio' },
11
+ { app: 'ollama', url: 'http://localhost:11434/v1', label: 'Ollama' },
12
+ { app: 'llamacpp', url: 'http://localhost:8080/v1', label: 'llama.cpp' },
13
+ { app: 'vllm', url: 'http://localhost:8000/v1', label: 'vLLM' },
14
+ { app: 'localai', url: 'http://localhost:8081/v1', label: 'LocalAI' },
15
+ ];
16
+
17
+ export { KNOWN_SERVERS };
18
+
19
+ /**
20
+ * Probe a single server: GET /models with a short timeout.
21
+ * @param {string} baseURL - e.g. 'http://localhost:1234/v1'
22
+ * @param {number} timeoutMs
23
+ * @returns {Promise<Array<{id:string, owned_by?:string, context_length?:number}>>}
24
+ */
25
+ async function probeServer(baseURL, timeoutMs = 1500) {
26
+ const controller = new AbortController();
27
+ const timer = setTimeout(() => controller.abort(), timeoutMs);
28
+ try {
29
+ const resp = await fetch(`${baseURL}/models`, { signal: controller.signal });
30
+ if (!resp.ok) return [];
31
+ const body = await resp.json();
32
+ return body.data || [];
33
+ } catch {
34
+ return [];
35
+ } finally {
36
+ clearTimeout(timer);
37
+ }
38
+ }
39
+
40
+ /**
41
+ * Discover all running local inference servers and their loaded models.
42
+ * Also checks LOCAL_LLM_URL env var for custom endpoints.
43
+ * @returns {Promise<Array<{app:string, label:string, url:string, models:Array}>>}
44
+ */
45
+ export async function discoverLocalServers() {
46
+ const servers = [...KNOWN_SERVERS];
47
+
48
+ // Add custom endpoint from env if set and not already in the list
49
+ const customUrl = process.env.LOCAL_LLM_URL;
50
+ if (customUrl) {
51
+ const normalized = customUrl.replace(/\/+$/, '');
52
+ const base = normalized.endsWith('/v1') ? normalized : `${normalized}/v1`;
53
+ if (!servers.some(s => s.url === base)) {
54
+ servers.unshift({ app: 'custom', url: base, label: 'Custom Local' });
55
+ }
56
+ }
57
+
58
+ const results = await Promise.all(
59
+ servers.map(async (server) => {
60
+ const rawModels = await probeServer(server.url);
61
+ if (rawModels.length === 0) return null;
62
+ const models = rawModels.map(m => ({
63
+ id: m.id,
64
+ ownedBy: m.owned_by || null,
65
+ contextLength: m.context_length || null,
66
+ }));
67
+ return { ...server, models };
68
+ })
69
+ );
70
+
71
+ return results.filter(Boolean);
72
+ }
73
+
74
+ /**
75
+ * Strip any XML-like tag blocks that local models use for internal reasoning.
76
+ * Models use a variety of tags: <think>, <reasoning>, <reflection>, <scratchpad>,
77
+ * <internal>, <thought>, <analysis>, <planning>, <chain_of_thought>, etc.
78
+ * Instead of maintaining an allowlist, we strip ALL matched <word>...</word> blocks
79
+ * that appear before the actual content.
80
+ */
81
+ function cleanLocalResponse(text) {
82
+ let cleaned = text;
83
+
84
+ // Pass 1: remove all <single_word>...</single_word> blocks (case-insensitive, multi-line).
85
+ // These are almost universally reasoning/thinking wrappers in local models.
86
+ // Matches tags like <think>, <reasoning>, <reflection>, <scratchpad>, <thought>,
87
+ // <analysis>, <planning>, <internal>, <chain_of_thought>, etc.
88
+ // Uses a backreference to ensure opening and closing tags match.
89
+ cleaned = cleaned.replace(/<([a-z][a-z0-9_]*)>[\s\S]*?<\/\1>\s*/gi, '');
90
+
91
+ return cleaned.trim();
92
+ }
93
+
94
+ /**
95
+ * For JSON responses: extract the JSON payload from whatever the model emitted.
96
+ * Handles code fences, residual text before/after JSON, and nested structures.
97
+ */
98
+ function extractJSON(text) {
99
+ let s = text.trim();
100
+
101
+ // Strip markdown code fences
102
+ if (s.startsWith('```')) {
103
+ s = s.replace(/^```(?:json)?\s*\n?/, '').replace(/\n?\s*```\s*$/, '').trim();
104
+ }
105
+
106
+ // If it already looks like JSON, return as-is
107
+ if (s.startsWith('{') || s.startsWith('[')) return s;
108
+
109
+ // Otherwise, find the first { or [ and extract to its matching closer.
110
+ // This handles models that emit preamble text before the JSON.
111
+ const objStart = s.indexOf('{');
112
+ const arrStart = s.indexOf('[');
113
+ let start = -1;
114
+ let openChar, closeChar;
115
+
116
+ if (objStart >= 0 && (arrStart < 0 || objStart < arrStart)) {
117
+ start = objStart; openChar = '{'; closeChar = '}';
118
+ } else if (arrStart >= 0) {
119
+ start = arrStart; openChar = '['; closeChar = ']';
120
+ }
121
+
122
+ if (start < 0) return s; // no JSON found, return as-is for error reporting
123
+
124
+ // Walk forward counting nesting depth, respecting strings
125
+ let depth = 0;
126
+ let inString = false;
127
+ let escape = false;
128
+ for (let i = start; i < s.length; i++) {
129
+ const ch = s[i];
130
+ if (escape) { escape = false; continue; }
131
+ if (ch === '\\' && inString) { escape = true; continue; }
132
+ if (ch === '"') { inString = !inString; continue; }
133
+ if (inString) continue;
134
+ if (ch === openChar) depth++;
135
+ if (ch === closeChar) { depth--; if (depth === 0) return s.slice(start, i + 1); }
136
+ }
137
+
138
+ // Unbalanced — return from start to end, let JSON.parse report the real error
139
+ return s.slice(start);
140
+ }
141
+
142
+ /**
143
+ * LocalProvider — connects to any OpenAI-compatible local inference server.
144
+ * Uses the `openai` SDK pointed at a local base URL.
145
+ */
146
+ export class LocalProvider extends LLMProvider {
147
+ /**
148
+ * @param {string} model - Model ID loaded on the local server
149
+ * @param {string} [baseURL] - Override base URL (defaults to auto-detect or LOCAL_LLM_URL)
150
+ */
151
+ constructor(model = 'default', baseURL = null) {
152
+ super('local', model);
153
+ this._baseURL = baseURL || process.env.LOCAL_LLM_URL || null;
154
+ }
155
+
156
+ /**
157
+ * Auto-detect which server has the requested model, or use configured base URL.
158
+ */
159
+ async _resolveBaseURL() {
160
+ if (this._baseURL) {
161
+ const normalized = this._baseURL.replace(/\/+$/, '');
162
+ return normalized.endsWith('/v1') ? normalized : `${normalized}/v1`;
163
+ }
164
+
165
+ // Auto-detect: probe known servers for the model
166
+ const servers = await discoverLocalServers();
167
+ for (const server of servers) {
168
+ if (server.models.some(m => m.id === this.model)) {
169
+ this._baseURL = server.url;
170
+ return server.url;
171
+ }
172
+ }
173
+
174
+ // Fallback: if any server is running, use the first one
175
+ if (servers.length > 0) {
176
+ this._baseURL = servers[0].url;
177
+ return servers[0].url;
178
+ }
179
+
180
+ throw new Error(
181
+ `No local inference server found. Start LM Studio, Ollama, or another local server, ` +
182
+ `or set LOCAL_LLM_URL in your .env file.`
183
+ );
184
+ }
185
+
186
+ _createClient() {
187
+ // Deferred — actual client creation happens in _ensureClient() after async base URL resolution
188
+ return null;
189
+ }
190
+
191
+ async _ensureClient() {
192
+ if (this._client) return;
193
+ const baseURL = await this._resolveBaseURL();
194
+ this._client = new OpenAI({
195
+ baseURL,
196
+ apiKey: 'not-needed', // Local servers don't require API keys
197
+ timeout: 30 * 60_000, // 30 min — local models on consumer hardware can be very slow
198
+ maxRetries: 0,
199
+ });
200
+ }
201
+
202
+ /**
203
+ * Stream a chat completion and collect the full response.
204
+ * Streaming prevents server-side idle timeouts (e.g. LM Studio's 5-min default)
205
+ * because tokens flow continuously over the connection.
206
+ * @returns {{ content: string, usage: object|null }}
207
+ */
208
+ async _streamCompletion(params) {
209
+ const stream = await this._client.chat.completions.create({
210
+ ...params,
211
+ stream: true,
212
+ stream_options: { include_usage: true },
213
+ });
214
+
215
+ const chunks = [];
216
+ let usage = null;
217
+ for await (const chunk of stream) {
218
+ const delta = chunk.choices?.[0]?.delta?.content;
219
+ if (delta) chunks.push(delta);
220
+ // The last chunk with stream_options.include_usage carries the usage object
221
+ if (chunk.usage) usage = chunk.usage;
222
+ }
223
+ return { content: chunks.join(''), usage };
224
+ }
225
+
226
+ async _callProvider(prompt, maxTokens, systemInstructions) {
227
+ await this._ensureClient();
228
+
229
+ const messages = [];
230
+ if (systemInstructions) {
231
+ messages.push({ role: 'system', content: systemInstructions });
232
+ }
233
+ messages.push({ role: 'user', content: prompt });
234
+
235
+ const params = {
236
+ model: this.model,
237
+ messages,
238
+ // Don't send max_tokens to local servers — let the server use its own
239
+ // context window limit. Artificially capping output truncates large responses.
240
+ };
241
+
242
+ const { content, usage } = await this._streamCompletion(params);
243
+ this._trackTokens(usage);
244
+ return cleanLocalResponse(content);
245
+ }
246
+
247
+ async generateJSON(prompt, agentInstructions = null, cachedContext = null) {
248
+ await this._ensureClient();
249
+
250
+ const JSON_SYSTEM = 'You are a helpful assistant that always returns valid JSON. Your response must be a valid JSON object or array, nothing else. Do not include any thinking, reasoning, or explanation — only the JSON.';
251
+ const systemParts = [JSON_SYSTEM];
252
+ if (agentInstructions) systemParts.push(agentInstructions);
253
+ if (cachedContext) systemParts.push(`---\n\n${cachedContext}`);
254
+
255
+ const messages = [
256
+ { role: 'system', content: systemParts.join('\n\n') },
257
+ { role: 'user', content: prompt },
258
+ ];
259
+
260
+ const params = {
261
+ model: this.model,
262
+ messages,
263
+ // Don't send max_tokens to local servers — let the server use its own
264
+ // context window limit. Artificially capping output truncates large responses.
265
+ };
266
+
267
+ // Try JSON mode — not all local servers support it; fall back gracefully
268
+ let useJsonMode = true;
269
+
270
+ const _t0 = Date.now();
271
+ let content;
272
+ let usage;
273
+ try {
274
+ ({ content, usage } = await this._withRetry(
275
+ () => this._streamCompletion({
276
+ ...params,
277
+ ...(useJsonMode ? { response_format: { type: 'json_object' } } : {}),
278
+ }),
279
+ 'JSON generation (Local)'
280
+ ));
281
+ } catch (err) {
282
+ // If JSON mode is not supported, retry without it
283
+ if (useJsonMode && (err.message?.includes('response_format') || err.status === 400)) {
284
+ useJsonMode = false;
285
+ ({ content, usage } = await this._withRetry(
286
+ () => this._streamCompletion(params),
287
+ 'JSON generation (Local, no json_mode)'
288
+ ));
289
+ } else {
290
+ throw err;
291
+ }
292
+ }
293
+
294
+ this._trackTokens(usage, {
295
+ prompt,
296
+ agentInstructions: agentInstructions ?? null,
297
+ response: content,
298
+ elapsed: Date.now() - _t0,
299
+ });
300
+
301
+ // Strip reasoning tags, code fences, and extract JSON payload
302
+ let jsonStr = extractJSON(cleanLocalResponse(content));
303
+
304
+ try {
305
+ return JSON.parse(jsonStr);
306
+ } catch (firstError) {
307
+ if (jsonStr.startsWith('{') || jsonStr.startsWith('[')) {
308
+ try { return JSON.parse(jsonrepair(jsonStr)); } catch { /* fall through */ }
309
+ }
310
+ throw new Error(`Failed to parse JSON response from local model: ${firstError.message}\n\nResponse was:\n${content}`);
311
+ }
312
+ }
313
+
314
+ /**
315
+ * Generate JSON with tool-calling support.
316
+ * Runs a tool-call loop: if the model emits tool_calls, they are executed
317
+ * via the provided dispatcher and results fed back until the model returns
318
+ * a final JSON content response.
319
+ *
320
+ * @param {string} prompt - User prompt
321
+ * @param {string|null} agentInstructions - System instructions
322
+ * @param {Array} tools - OpenAI-format tool definitions
323
+ * @param {Function} toolDispatcher - async (name, args) => string
324
+ * @param {number} [maxRounds=5] - Max tool-call rounds to prevent infinite loops
325
+ * @returns {Promise<Object>} Parsed JSON response
326
+ */
327
+ async generateJSONWithTools(prompt, agentInstructions, tools, toolDispatcher, maxRounds = 5) {
328
+ await this._ensureClient();
329
+
330
+ const JSON_SYSTEM = 'You are a helpful assistant that always returns valid JSON. When you need accurate API details for external services, use the fetch_api_reference tool before writing your response. Your final response must be a valid JSON object or array, nothing else.';
331
+ const systemParts = [JSON_SYSTEM];
332
+ if (agentInstructions) systemParts.push(agentInstructions);
333
+
334
+ const messages = [
335
+ { role: 'system', content: systemParts.join('\n\n') },
336
+ { role: 'user', content: prompt },
337
+ ];
338
+
339
+ const _t0 = Date.now();
340
+ let totalUsage = { prompt_tokens: 0, completion_tokens: 0 };
341
+ let toolCallCount = 0;
342
+
343
+ let forceNoTools = false;
344
+ for (let round = 0; round < maxRounds + 2; round++) {
345
+ const params = {
346
+ model: this.model,
347
+ messages,
348
+ ...(forceNoTools ? {} : { tools }),
349
+ };
350
+
351
+ let response;
352
+ try {
353
+ if (forceNoTools) {
354
+ // Final forced round: use streaming to prevent LM Studio's server-side idle timeout
355
+ // (non-streaming requests can timeout after ~5 min under load).
356
+ // No tools in params, so we only expect content back — streaming is safe.
357
+ const { content, usage } = await this._streamCompletion(params);
358
+ response = {
359
+ usage,
360
+ choices: [{ finish_reason: 'stop', message: { content, tool_calls: null } }],
361
+ };
362
+ } else {
363
+ // Tool-call rounds: use non-streaming (streaming tool call support is inconsistent across local servers)
364
+ response = await this._withRetry(
365
+ () => this._client.chat.completions.create(params),
366
+ `JSON+tools generation (Local, round ${round + 1})`
367
+ );
368
+ }
369
+ } catch (err) {
370
+ // If tools not supported, fall back to regular generateJSON
371
+ if (err.message?.includes('tools') || err.status === 400) {
372
+ console.log('[DEBUG] Local server does not support tools — falling back to generateJSON');
373
+ return this.generateJSON(prompt, agentInstructions);
374
+ }
375
+ throw err;
376
+ }
377
+
378
+ // Accumulate token usage
379
+ if (response.usage) {
380
+ totalUsage.prompt_tokens += response.usage.prompt_tokens || 0;
381
+ totalUsage.completion_tokens += response.usage.completion_tokens || 0;
382
+ }
383
+
384
+ const choice = response.choices?.[0];
385
+ if (!choice) {
386
+ throw new Error('No response choice from local model');
387
+ }
388
+
389
+ // If the model wants to call tools, execute them and loop
390
+ if (choice.finish_reason === 'tool_calls' || choice.message?.tool_calls?.length > 0) {
391
+ if (round >= maxRounds) {
392
+ console.log(`[DEBUG] Tool call loop exceeded ${maxRounds} rounds — forcing final response without tools`);
393
+ // Re-request without tools to force a content response
394
+ messages.push(choice.message);
395
+ messages.push({ role: 'user', content: 'Please provide your final JSON response now, without calling any more tools.' });
396
+ forceNoTools = true;
397
+ continue;
398
+ }
399
+
400
+ // Append assistant message with tool calls
401
+ messages.push(choice.message);
402
+
403
+ // Execute each tool call
404
+ for (const toolCall of choice.message.tool_calls) {
405
+ toolCallCount++;
406
+ const fnName = toolCall.function?.name;
407
+ let fnArgs;
408
+ try {
409
+ fnArgs = JSON.parse(toolCall.function?.arguments || '{}');
410
+ } catch {
411
+ fnArgs = {};
412
+ }
413
+
414
+ console.log(`[DEBUG] Tool call #${toolCallCount}: ${fnName}(${JSON.stringify(fnArgs)})`);
415
+
416
+ let result;
417
+ try {
418
+ result = await toolDispatcher(fnName, fnArgs);
419
+ } catch (err) {
420
+ result = `Tool error: ${err.message}`;
421
+ }
422
+
423
+ // Append tool result
424
+ messages.push({
425
+ role: 'tool',
426
+ tool_call_id: toolCall.id,
427
+ content: typeof result === 'string' ? result : JSON.stringify(result),
428
+ });
429
+ }
430
+
431
+ continue; // Loop back for the model to process tool results
432
+ }
433
+
434
+ // Model returned content — extract and parse JSON
435
+ const content = choice.message?.content || '';
436
+ this._trackTokens(totalUsage, {
437
+ prompt,
438
+ agentInstructions: agentInstructions ?? null,
439
+ response: content,
440
+ elapsed: Date.now() - _t0,
441
+ });
442
+
443
+ if (toolCallCount > 0) {
444
+ console.log(`[DEBUG] Tool-augmented generation complete: ${toolCallCount} tool call(s) in ${round + 1} round(s)`);
445
+ }
446
+
447
+ const jsonStr = extractJSON(cleanLocalResponse(content));
448
+ try {
449
+ return JSON.parse(jsonStr);
450
+ } catch (firstError) {
451
+ if (jsonStr.startsWith('{') || jsonStr.startsWith('[')) {
452
+ try { return JSON.parse(jsonrepair(jsonStr)); } catch { /* fall through */ }
453
+ }
454
+ throw new Error(`Failed to parse JSON response from local model (with tools): ${firstError.message}\n\nResponse was:\n${content}`);
455
+ }
456
+ }
457
+
458
+ throw new Error('Tool call loop exhausted without final response');
459
+ }
460
+
461
+ async generateText(prompt, agentInstructions = null, cachedContext = null) {
462
+ await this._ensureClient();
463
+
464
+ const systemParts = [];
465
+ if (agentInstructions) systemParts.push(agentInstructions);
466
+ if (cachedContext) systemParts.push(cachedContext);
467
+
468
+ const messages = [];
469
+ if (systemParts.length > 0) {
470
+ messages.push({ role: 'system', content: systemParts.join('\n\n') });
471
+ }
472
+ messages.push({ role: 'user', content: prompt });
473
+
474
+ const _t0 = Date.now();
475
+ const { content, usage } = await this._withRetry(
476
+ () => this._streamCompletion({
477
+ model: this.model,
478
+ messages,
479
+ // Don't send max_tokens to local servers — let the server manage limits.
480
+ }),
481
+ 'Text generation (Local)'
482
+ );
483
+
484
+ const textContent = cleanLocalResponse(content);
485
+ this._trackTokens(usage, {
486
+ prompt,
487
+ agentInstructions: agentInstructions ?? null,
488
+ response: textContent,
489
+ elapsed: Date.now() - _t0,
490
+ });
491
+ return textContent;
492
+ }
493
+ }