npm - agent-tool-forge - Versions diffs - 0.3.0 - Mend

agent-tool-forge 0.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (107) hide show

package/LICENSE +21 -0
package/README.md +209 -0
package/lib/agent-registry.js +170 -0
package/lib/api-client.js +792 -0
package/lib/api-loader.js +260 -0
package/lib/auth.d.ts +25 -0
package/lib/auth.js +158 -0
package/lib/checks/check-adapter.js +172 -0
package/lib/checks/compose.js +42 -0
package/lib/checks/content-match.js +14 -0
package/lib/checks/cost-budget.js +11 -0
package/lib/checks/index.js +18 -0
package/lib/checks/json-valid.js +15 -0
package/lib/checks/latency.js +11 -0
package/lib/checks/length-bounds.js +17 -0
package/lib/checks/negative-match.js +14 -0
package/lib/checks/no-hallucinated-numbers.js +63 -0
package/lib/checks/non-empty.js +34 -0
package/lib/checks/regex-match.js +12 -0
package/lib/checks/run-checks.js +84 -0
package/lib/checks/schema-match.js +26 -0
package/lib/checks/tool-call-count.js +16 -0
package/lib/checks/tool-selection.js +34 -0
package/lib/checks/types.js +45 -0
package/lib/comparison/compare.js +86 -0
package/lib/comparison/format.js +104 -0
package/lib/comparison/index.js +6 -0
package/lib/comparison/statistics.js +59 -0
package/lib/comparison/types.js +41 -0
package/lib/config-schema.js +200 -0
package/lib/config.d.ts +66 -0
package/lib/conversation-store.d.ts +77 -0
package/lib/conversation-store.js +443 -0
package/lib/db.d.ts +6 -0
package/lib/db.js +1112 -0
package/lib/dep-check.js +99 -0
package/lib/drift-background.js +61 -0
package/lib/drift-monitor.js +187 -0
package/lib/eval-runner.js +566 -0
package/lib/fixtures/fixture-store.js +161 -0
package/lib/fixtures/index.js +11 -0
package/lib/forge-engine.js +982 -0
package/lib/forge-eval-generator.js +417 -0
package/lib/forge-file-writer.js +386 -0
package/lib/forge-service-client.js +190 -0
package/lib/forge-service.d.ts +4 -0
package/lib/forge-service.js +655 -0
package/lib/forge-verifier-generator.js +271 -0
package/lib/handlers/admin.js +151 -0
package/lib/handlers/agents.js +229 -0
package/lib/handlers/chat-resume.js +334 -0
package/lib/handlers/chat-sync.js +320 -0
package/lib/handlers/chat.js +320 -0
package/lib/handlers/conversations.js +92 -0
package/lib/handlers/preferences.js +88 -0
package/lib/handlers/tools-list.js +58 -0
package/lib/hitl-engine.d.ts +60 -0
package/lib/hitl-engine.js +261 -0
package/lib/http-utils.js +92 -0
package/lib/index.d.ts +20 -0
package/lib/index.js +141 -0
package/lib/init.js +636 -0
package/lib/manual-entry.js +59 -0
package/lib/mcp-server.js +252 -0
package/lib/output-groups.js +54 -0
package/lib/postgres-store.d.ts +31 -0
package/lib/postgres-store.js +465 -0
package/lib/preference-store.d.ts +47 -0
package/lib/preference-store.js +79 -0
package/lib/prompt-store.d.ts +42 -0
package/lib/prompt-store.js +60 -0
package/lib/rate-limiter.d.ts +30 -0
package/lib/rate-limiter.js +104 -0
package/lib/react-engine.d.ts +110 -0
package/lib/react-engine.js +337 -0
package/lib/runner/cli.js +156 -0
package/lib/runner/cost-estimator.js +71 -0
package/lib/runner/gate.js +46 -0
package/lib/runner/index.js +165 -0
package/lib/sidecar.d.ts +83 -0
package/lib/sidecar.js +161 -0
package/lib/sse.d.ts +15 -0
package/lib/sse.js +30 -0
package/lib/tools-scanner.js +91 -0
package/lib/tui.js +253 -0
package/lib/verifier-report.js +78 -0
package/lib/verifier-runner.js +338 -0
package/lib/verifier-scanner.js +70 -0
package/lib/verifier-worker-pool.js +196 -0
package/lib/views/chat.js +340 -0
package/lib/views/endpoints.js +203 -0
package/lib/views/eval-run.js +206 -0
package/lib/views/forge-agent.js +538 -0
package/lib/views/forge.js +410 -0
package/lib/views/main-menu.js +275 -0
package/lib/views/mediation.js +381 -0
package/lib/views/model-compare.js +430 -0
package/lib/views/model-comparison.js +333 -0
package/lib/views/onboarding.js +470 -0
package/lib/views/performance.js +237 -0
package/lib/views/run-evals.js +205 -0
package/lib/views/settings.js +829 -0
package/lib/views/tools-evals.js +514 -0
package/lib/views/verifier-coverage.js +617 -0
package/lib/workers/verifier-worker.js +52 -0
package/package.json +123 -0
package/widget/forge-chat.js +789 -0

package/lib/views/model-compare.js ADDED Viewed

@@ -0,0 +1,430 @@
+/**
+ * Model Compare View — side-by-side model spec comparison.
+ *
+ * Runs the current forge state against two models in parallel (config.models.generation
+ * and config.models.secondary) and shows the resulting specs side by side so the user
+ * can choose which result to carry forward into the forge dialogue.
+ *
+ * Key bindings:
+ *   a / 1  — use Model A result
+ *   2      — use Model B result
+ *   m      — merge (Model A base, overlay non-null fields from Model B)
+ *   Tab    — switch scroll focus between the two result panels
+ *   Escape — cancel, navigate back to forge
+ */
+import blessed from 'blessed';
+import { existsSync, readFileSync } from 'fs';
+import { resolve, dirname } from 'path';
+import { fileURLToPath } from 'url';
+import { forgeStep, createInitialState } from '../forge-engine.js';
+import { resolveModelConfig } from '../api-client.js';
+// Directory containing this module, derived from import.meta.url.
+const __dirname = dirname(fileURLToPath(import.meta.url));
+// Absolute path of the .env file, resolved two directory levels above this module.
+const ENV_FILE   = resolve(__dirname, '../../.env');
+// ── Helpers ────────────────────────────────────────────────────────────────
+/**
+ * Read key=value pairs from .env into a plain object.
+ * Skips blank lines and comments. Strips surrounding quotes from values.
+ *
+ * @returns {Record<string, string>}
+ */
+function loadEnv() {
+  if (!existsSync(ENV_FILE)) return {};
+  const lines = readFileSync(ENV_FILE, 'utf-8').split('\n');
+  const out = {};
+  for (const line of lines) {
+    const trimmed = line.trim();
+    if (!trimmed || trimmed.startsWith('#')) continue;
+    const eqIdx = trimmed.indexOf('=');
+    if (eqIdx === -1) continue;
+    const key = trimmed.slice(0, eqIdx).trim();
+    const val = trimmed.slice(eqIdx + 1).trim().replace(/^["']|["']$/g, '');
+    out[key] = val;
+  }
+  return out;
+}
+/**
+ * Deep-merge two spec objects: use specA as the base and overlay any non-null,
+ * non-undefined top-level field from specB.
+ *
+ * @param {object} specA
+ * @param {object} specB
+ * @returns {object}
+ */
+function mergeSpecs(specA, specB) {
+  const merged = { ...specA };
+  for (const [key, val] of Object.entries(specB)) {
+    if (val !== null && val !== undefined) {
+      merged[key] = val;
+    }
+  }
+  return merged;
+}
+/**
+ * Format a forgeStep result for display in a panel.
+ * Shows the assistant text (if any) followed by the spec as pretty-printed JSON.
+ *
+ * @param {{ assistantText: string, nextState: { spec: object } }} result
+ * @returns {string}
+ */
+function formatResult(result) {
+  const parts = [];
+  if (result.assistantText && result.assistantText.trim()) {
+    parts.push(result.assistantText.trim());
+    parts.push('');
+    parts.push('─'.repeat(40));
+    parts.push('');
+  }
+  parts.push('Spec:');
+  try {
+    parts.push(JSON.stringify(result.nextState.spec, null, 2));
+  } catch (_) {
+    parts.push('(could not serialise spec)');
+  }
+  return parts.join('\n');
+}
+// ── createView ─────────────────────────────────────────────────────────────
+export function createView({
+  screen,
+  content,
+  config,
+  navigate,
+  setFooter,
+  screenKey,
+  openPopup,
+  closePopup,
+  startService
+}) {
+  // ── Root container (fills the content area) ─────────────────────────────
+  const root = blessed.box({
+    top: 0, left: 0, width: '100%', height: '100%',
+    tags: true
+  });
+  // Escape/b navigates back immediately.
+  // ── Header row ──────────────────────────────────────────────────────────
+  const header = blessed.box({
+    parent: root,
+    top: 0, left: 0, width: '100%', height: 1,
+    tags: true,
+    content: '{bold}{cyan-fg} Model Comparison{/cyan-fg}{/bold}',
+    style: { bg: 'black' }
+  });
+  // ── Status bar (below header, above panels) ──────────────────────────────
+  const statusBar = blessed.box({
+    parent: root,
+    top: 1, left: 0, width: '100%', height: 1,
+    tags: true,
+    content: '{yellow-fg} Initialising…{/yellow-fg}',
+    style: { bg: 'black' }
+  });
+  // ── Panel labels row ─────────────────────────────────────────────────────
+  const labelRow = blessed.box({
+    parent: root,
+    top: 2, left: 0, width: '100%', height: 2,
+    tags: true,
+    style: { bg: 'black' }
+  });
+  const labelA = blessed.box({
+    parent: labelRow,
+    top: 0, left: 0, width: '50%', height: 2,
+    tags: true,
+    content: '{bold} Model A:{/bold} {cyan-fg}loading…{/cyan-fg}\n {#555555-fg}───────────────────────────────────{/#555555-fg}',
+    style: { bg: 'black' }
+  });
+  const labelB = blessed.box({
+    parent: labelRow,
+    top: 0, left: '50%', width: '50%', height: 2,
+    tags: true,
+    content: '{bold} Model B:{/bold} {cyan-fg}loading…{/cyan-fg}\n {#555555-fg}───────────────────────────────────{/#555555-fg}',
+    style: { bg: 'black' }
+  });
+  // ── Panel boxes (scrollable) ─────────────────────────────────────────────
+  const panelTop  = 4;   // header(1) + status(1) + labelRow(2)
+  const panelHeight = `100%-${panelTop + 1}`;  // leave 1 row for footer
+  const panelA = blessed.scrollablebox({
+    parent: root,
+    top: panelTop, left: 0, width: '50%', height: panelHeight,
+    border: { type: 'line', fg: '#333333' },
+    scrollable: true,
+    alwaysScroll: true,
+    keys: true,
+    vi: true,
+    tags: false,
+    content: '',
+    scrollbar: { ch: '│', style: { fg: '#555555' } },
+    style: { bg: 'black', fg: 'white' }
+  });
+  const panelB = blessed.scrollablebox({
+    parent: root,
+    top: panelTop, left: '50%', width: '50%', height: panelHeight,
+    border: { type: 'line', fg: '#333333' },
+    scrollable: true,
+    alwaysScroll: true,
+    keys: true,
+    vi: true,
+    tags: false,
+    content: '',
+    scrollbar: { ch: '│', style: { fg: '#555555' } },
+    style: { bg: 'black', fg: 'white' }
+  });
+  // ── State ────────────────────────────────────────────────────────────────
+  let modelAResult  = null;
+  let modelBResult  = null;
+  let modelAConfig  = null;
+  let modelBConfig  = null;
+  let forgeState    = null;
+  let ready         = false;   // true once both results have arrived
+  // ── Helpers ──────────────────────────────────────────────────────────────
+  function setStatus(text) {
+    statusBar.setContent(text);
+    screen.render();
+  }
+  function updateLabelA(modelName) {
+    labelA.setContent(
+      `{bold} Model A:{/bold} {cyan-fg}${modelName}{/cyan-fg}\n {#555555-fg}───────────────────────────────────{/#555555-fg}`
+    );
+  }
+  function updateLabelB(modelName) {
+    labelB.setContent(
+      `{bold} Model B:{/bold} {cyan-fg}${modelName}{/cyan-fg}\n {#555555-fg}───────────────────────────────────{/#555555-fg}`
+    );
+  }
+  function showFooterReady() {
+    setFooter(
+      ' {bold}a{/bold}/{bold}1{/bold} use A  ' +
+      '{bold}2{/bold} use B  ' +
+      '{bold}m{/bold} merge  ' +
+      '{bold}Escape{/bold} back'
+    );
+  }
+  function showFooterWaiting() {
+    setFooter(' {yellow-fg}Running comparison…{/yellow-fg}  {bold}Escape{/bold} back');
+  }
+  // ── DB recording ─────────────────────────────────────────────────────────
+  async function recordComparison(chosenModel) {
+    try {
+      const dbPath = resolve(process.cwd(), config?.dbPath || 'forge.db');
+      const { getDb, insertModelComparison } = await import('../db.js');
+      const db = getDb(dbPath);
+      insertModelComparison(db, {
+        tool_name:    forgeState?.spec?.name || 'unknown',
+        model_a:      modelAConfig?.model || 'unknown',
+        model_b:      modelBConfig?.model || 'unknown',
+        spec_a_json:  modelAResult ? JSON.stringify(modelAResult.nextState.spec) : null,
+        spec_b_json:  modelBResult ? JSON.stringify(modelBResult.nextState.spec) : null,
+        chosen_model: chosenModel,
+        phase:        forgeState?.phase || null
+      });
+    } catch (_) {
+      // Non-fatal — DB write failures should not block the workflow.
+    }
+  }
+  // ── Choice actions ────────────────────────────────────────────────────────
+  async function chooseA() {
+    if (!ready || !modelAResult) return;
+    config._chosenSpec = modelAResult.nextState.spec;
+    await recordComparison(modelAConfig?.model || 'model_a');
+    navigate('forge');
+  }
+  async function chooseB() {
+    if (!ready || !modelBResult) return;
+    config._chosenSpec = modelBResult.nextState.spec;
+    await recordComparison(modelBConfig?.model || 'model_b');
+    navigate('forge');
+  }
+  async function chooseMerge() {
+    if (!ready || !modelAResult || !modelBResult) return;
+    config._chosenSpec = mergeSpecs(
+      modelAResult.nextState.spec,
+      modelBResult.nextState.spec
+    );
+    await recordComparison('merge');
+    navigate('forge');
+  }
+  // ── Key bindings ─────────────────────────────────────────────────────────
+  screenKey(['a', '1'], () => { chooseA(); });
+  screenKey(['2'],      () => { chooseB(); });
+  screenKey(['m'],      () => { chooseMerge(); });
+  screenKey(['escape'], () => { navigate('forge'); });
+  // Also handle scroll between panels with Tab
+  screenKey(['tab'], () => {
+    if (screen.focused === panelA) {
+      panelB.focus();
+    } else {
+      panelA.focus();
+    }
+    screen.render();
+  });
+  // ── Main async init (deferred to avoid blocking render) ──────────────────
+  setImmediate(async () => {
+    // 1. Load environment
+    const env = loadEnv();
+    // 2. Resolve model configs
+    modelAConfig = resolveModelConfig(config, env, 'generation');
+    modelBConfig = resolveModelConfig(config, env, 'secondary');
+    // 3. Guard: no secondary model
+    if (!modelBConfig.model) {
+      updateLabelA(modelAConfig.model || 'unknown');
+      updateLabelB('not configured');
+      panelA.setContent('');
+      panelB.setContent(
+        'No secondary model configured.\n\n' +
+        'Set models.secondary in Settings (option 1 → secondary role).'
+      );
+      setStatus('{red-fg} No secondary model configured.{/red-fg}');
+      setFooter(' {bold}Escape{/bold} back');
+      screen.render();
+      return;
+    }
+    // 4. Update labels with resolved model names
+    updateLabelA(modelAConfig.model || 'unknown');
+    updateLabelB(modelBConfig.model || 'unknown');
+    screen.render();
+    // 5. Determine forge state
+    forgeState = config._forgeState || createInitialState();
+    if (!config._forgeState) {
+      // No live state — inject a synthetic user input so the explore phase
+      // has something to work with during a standalone comparison test.
+      forgeState = {
+        ...forgeState,
+        messages: [{ role: 'user', content: config._forgeInput || 'test comparison' }]
+      };
+    }
+    const userInput = config._forgeInput || null;
+    // 6. Show running status and run both models in parallel
+    setStatus('{yellow-fg} Running comparison against both models…{/yellow-fg}');
+    showFooterWaiting();
+    let errorA = null;
+    let errorB = null;
+    [modelAResult, modelBResult] = await Promise.all([
+      forgeStep({
+        state: forgeState,
+        userInput,
+        modelConfig: modelAConfig,
+        existingTools: [],
+        projectConfig: config,
+        projectRoot: process.cwd()
+      }).catch((err) => {
+        errorA = err;
+        return null;
+      }),
+      forgeStep({
+        state: forgeState,
+        userInput,
+        modelConfig: modelBConfig,
+        existingTools: [],
+        projectConfig: config,
+        projectRoot: process.cwd()
+      }).catch((err) => {
+        errorB = err;
+        return null;
+      })
+    ]);
+    // 7. Populate panels with results (or error messages)
+    if (errorA || !modelAResult) {
+      panelA.setContent(
+        `Error calling ${modelAConfig.model}:\n\n${errorA?.message || 'unknown error'}`
+      );
+    } else {
+      panelA.setContent(formatResult(modelAResult));
+    }
+    if (errorB || !modelBResult) {
+      panelB.setContent(
+        `Error calling ${modelBConfig.model}:\n\n${errorB?.message || 'unknown error'}`
+      );
+    } else {
+      panelB.setContent(formatResult(modelBResult));
+    }
+    // 8. Mark ready and update status/footer
+    const readyA = !!modelAResult;
+    const readyB = !!modelBResult;
+    ready = readyA || readyB;
+    if (readyA && readyB) {
+      setStatus('{green-fg} Done.{/green-fg}  Pick a result or merge.');
+      setFooter(
+        ' {bold}a{/bold}/{bold}1{/bold} use A  ' +
+        '{bold}b{/bold}/{bold}2{/bold} use B  ' +
+        '{bold}m{/bold} merge  ' +
+        '{bold}Escape{/bold} back'
+      );
+    } else if (readyA) {
+      const failures = [errorA && 'A', errorB && 'B'].filter(Boolean).join(', ');
+      setStatus(`{yellow-fg} Model(s) failed: ${failures}.  Showing partial results.{/yellow-fg}`);
+      setFooter(
+        ' {bold}a{/bold}/{bold}1{/bold} use A  ' +
+        '{#555555-fg}b/2 use B (unavailable){/#555555-fg}  ' +
+        '{#555555-fg}m merge (unavailable){/#555555-fg}  ' +
+        '{bold}Escape{/bold} back'
+      );
+    } else if (readyB) {
+      const failures = [errorA && 'A', errorB && 'B'].filter(Boolean).join(', ');
+      setStatus(`{yellow-fg} Model(s) failed: ${failures}.  Showing partial results.{/yellow-fg}`);
+      setFooter(
+        '{#555555-fg} a/1 use A (unavailable){/#555555-fg}  ' +
+        '{bold}b{/bold}/{bold}2{/bold} use B  ' +
+        '{#555555-fg}m merge (unavailable){/#555555-fg}  ' +
+        '{bold}Escape{/bold} back'
+      );
+    } else {
+      const failures = [errorA && 'A', errorB && 'B'].filter(Boolean).join(', ');
+      setStatus(`{red-fg} Error in model(s): ${failures}.  Check API keys in Settings.{/red-fg}`);
+      setFooter(' {bold}Escape{/bold} back');
+    }
+    panelA.focus();
+    screen.render();
+  });
+  // Return the root node so tui.js can track it as the active view box.
+  return root;
+}