npm - @amodalai/amodal - Versions diffs - 0.3.26 → 0.3.28 - Mend

@amodalai/amodal 0.3.26 → 0.3.28

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (28)

package/CHANGELOG.md +32 -0
package/dist/src/commands/dev.d.ts.map +1 -1
package/dist/src/commands/dev.js +28 -11
package/dist/src/commands/dev.js.map +1 -1
package/dist/src/commands/eval.d.ts.map +1 -1
package/dist/src/commands/eval.js +4 -2
package/dist/src/commands/eval.js.map +1 -1
package/dist/tsconfig.tsbuildinfo +1 -1
package/package.json +8 -7
package/src/commands/dev.ts +31 -11
package/src/commands/eval.ts +4 -2
package/src/e2e-commands.test.ts +9 -291
package/src/e2e-subprocess.test.ts +153 -0
package/dist/src/fixtures/incident-response.d.ts +0 -92
package/dist/src/fixtures/incident-response.d.ts.map +0 -1
package/dist/src/fixtures/incident-response.js +0 -209
package/dist/src/fixtures/incident-response.js.map +0 -1
package/dist/src/shared/find-free-port.d.ts +0 -21
package/dist/src/shared/find-free-port.d.ts.map +0 -1
package/dist/src/shared/find-free-port.js +0 -62
package/dist/src/shared/find-free-port.js.map +0 -1
package/src/e2e-automations.test.ts +0 -305
package/src/e2e-incident-response.test.ts +0 -345
package/src/e2e-plugin-connections.test.ts +0 -407
package/src/e2e-plugins.test.ts +0 -491
package/src/e2e.test.ts +0 -493
package/src/fixtures/incident-response.ts +0 -233
package/src/shared/find-free-port.ts +0 -67

package/src/e2e-automations.test.ts DELETED

@@ -1,305 +0,0 @@
-/**
- * @license
- * Copyright 2025 Amodal Labs, Inc.
- * SPDX-License-Identifier: MIT
- */
-/**
- * End-to-end test: Automation lifecycle
- *
- * Tests the full automation control flow via the HTTP API:
- *   1. Create repo with cron + webhook automations on disk
- *   2. Boot `createLocalServer` (which integrates ProactiveRunner)
- *   3. List automations — verify both appear, cron is stopped, webhook is running
- *   4. Start a cron automation — verify it becomes running
- *   5. Stop a cron automation — verify it becomes stopped
- *   6. Reject starting a webhook automation (always active)
- *   7. Manually trigger an automation (run)
- *   8. Webhook endpoint accepts events
- */
-import {describe, it, expect, beforeAll, afterAll} from 'vitest';
-import {mkdtempSync, mkdirSync, writeFileSync, rmSync} from 'node:fs';
-import {join} from 'node:path';
-import {tmpdir} from 'node:os';
-import type {AddressInfo} from 'node:net';
-// ---------------------------------------------------------------------------
-// Fixture data
-//
-// Everything below is written into a temporary repo directory by `beforeAll`:
-// CONFIG is serialized to `amodal.json`, and the two markdown strings become
-// files under `automations/`.
-// ---------------------------------------------------------------------------
-// Agent manifest for the throwaway repo.
-const CONFIG = {
-  name: 'automation-test-agent',
-  version: '1.0.0',
-  description: 'Agent with automations for e2e testing',
-  models: {
-    main: {provider: 'anthropic', model: 'claude-sonnet-4-20250514'},
-  },
-};
-// Written to `automations/daily-scan.md`. Carries a `Schedule:` line; the list
-// test expects it to be reported with that schedule, `webhookTriggered: false`,
-// and `running: false` until it is explicitly started.
-const CRON_AUTOMATION = `# Automation: Daily Scan
-Schedule: */5 * * * *
-## Check
-Scan all zones for anomalies and report findings.
-## Output
-Summary of anomalies found.
-## Delivery
-stdout
-`;
-// Written to `automations/alert-handler.md`. Has no `Schedule:` line; the list
-// test expects `webhookTriggered: true` and `running: true`.
-// NOTE(review): presumably the runtime classifies it as webhook-triggered from
-// the "Run on webhook" wording in the Check section — confirm against the parser.
-const WEBHOOK_AUTOMATION = `# Automation: Alert Handler
-## Check
-Run on webhook when an alert fires. Triage the alert and determine severity.
-## Output
-Triage assessment with severity level.
-## Delivery
-stdout
-`;
-// ---------------------------------------------------------------------------
-// Test suite
-// ---------------------------------------------------------------------------
-/**
- * E2E suite for the automation control endpoints of a locally booted server.
- *
- * `beforeAll` writes a throwaway repo (config, one scheduled automation, one
- * webhook automation) and starts `createLocalServer` on an ephemeral port.
- * All tests share that one server and are order-dependent: the
- * start -> duplicate start -> stop -> duplicate stop cases each rely on the
- * state left behind by the previous test.
- */
-describe('E2E: Automation Lifecycle', () => {
-  let repoDir: string;
-  let server: {app: unknown; start: () => Promise<unknown>; stop: () => Promise<void>} | null = null;
-  let baseUrl: string;
-  beforeAll(async () => {
-    // 1. Create repo directory with automations
-    repoDir = mkdtempSync(join(tmpdir(), 'amodal-e2e-automations-'));
-    // Config
-    writeFileSync(join(repoDir, 'amodal.json'), JSON.stringify(CONFIG, null, 2));
-    // Automations
-    const autoDir = join(repoDir, 'automations');
-    mkdirSync(autoDir, {recursive: true});
-    writeFileSync(join(autoDir, 'daily-scan.md'), CRON_AUTOMATION);
-    writeFileSync(join(autoDir, 'alert-handler.md'), WEBHOOK_AUTOMATION);
-    // 2. Boot repo server
-    const {createLocalServer} = await import('@amodalai/runtime');
-    const srv = await createLocalServer({
-      repoPath: repoDir,
-      port: 0, // random port
-      host: '127.0.0.1',
-      hotReload: false,
-      corsOrigin: '*',
-    });
-    const httpServer = await srv.start();
-    const addr = httpServer.address() as AddressInfo;
-    baseUrl = `http://127.0.0.1:${addr.port}`;
-    server = srv;
-  }, 30000);
-  afterAll(async () => {
-    try {
-      if (server) {
-        await server.stop();
-        server = null;
-      }
-    } finally {
-      // `repoDir` is still unassigned when `mkdtempSync` itself failed in
-      // `beforeAll`; skip removal then so teardown does not throw a second,
-      // misleading error. The `finally` keeps the temp dir from leaking when
-      // `server.stop()` rejects.
-      if (repoDir) {
-        rmSync(repoDir, {recursive: true, force: true});
-      }
-    }
-  });
-  // =========================================================================
-  // Health check — server is up
-  // =========================================================================
-  it('should respond to health check', async () => {
-    const resp = await fetch(`${baseUrl}/health`);
-    expect(resp.status).toBe(200);
-    const data = (await resp.json()) as Record<string, unknown>;
-    expect(data['status']).toBe('ok');
-    expect(data['mode']).toBe('repo');
-  });
-  // =========================================================================
-  // List — both automations appear with correct initial state
-  // =========================================================================
-  it('should list automations with correct types and initial state', async () => {
-    const resp = await fetch(`${baseUrl}/automations`);
-    expect(resp.status).toBe(200);
-    const data = (await resp.json()) as {
-      automations: Array<{
-        name: string;
-        title: string;
-        schedule?: string;
-        webhookTriggered: boolean;
-        running: boolean;
-      }>;
-    };
-    expect(data.automations).toHaveLength(2);
-    const cronAuto = data.automations.find((a) => a.name === 'daily-scan');
-    expect(cronAuto).toBeDefined();
-    expect(cronAuto?.title).toBe('Daily Scan');
-    expect(cronAuto?.schedule).toBe('*/5 * * * *');
-    expect(cronAuto?.webhookTriggered).toBe(false);
-    expect(cronAuto?.running).toBe(false); // not started yet
-    const webhookAuto = data.automations.find((a) => a.name === 'alert-handler');
-    expect(webhookAuto).toBeDefined();
-    expect(webhookAuto?.title).toBe('Alert Handler');
-    expect(webhookAuto?.webhookTriggered).toBe(true);
-    expect(webhookAuto?.running).toBe(true); // webhooks always active
-  });
-  // =========================================================================
-  // Start — cron automation becomes running
-  // =========================================================================
-  it('should start a cron automation', async () => {
-    const resp = await fetch(`${baseUrl}/automations/daily-scan/start`, {method: 'POST'});
-    expect(resp.status).toBe(200);
-    const data = (await resp.json()) as Record<string, unknown>;
-    expect(data['status']).toBe('started');
-    // Verify it's now running
-    const listResp = await fetch(`${baseUrl}/automations`);
-    const listData = (await listResp.json()) as {
-      automations: Array<{name: string; running: boolean}>;
-    };
-    const cronAuto = listData.automations.find((a) => a.name === 'daily-scan');
-    expect(cronAuto?.running).toBe(true);
-  });
-  // =========================================================================
-  // Start again — should fail (already running)
-  // =========================================================================
-  it('should reject starting an already running automation', async () => {
-    const resp = await fetch(`${baseUrl}/automations/daily-scan/start`, {method: 'POST'});
-    expect(resp.status).toBe(400);
-    const data = (await resp.json()) as Record<string, unknown>;
-    expect(data['error']).toContain('already running');
-  });
-  // =========================================================================
-  // Stop — cron automation becomes stopped
-  // =========================================================================
-  it('should stop a running cron automation', async () => {
-    const resp = await fetch(`${baseUrl}/automations/daily-scan/stop`, {method: 'POST'});
-    expect(resp.status).toBe(200);
-    const data = (await resp.json()) as Record<string, unknown>;
-    expect(data['status']).toBe('stopped');
-    // Verify it's now stopped
-    const listResp = await fetch(`${baseUrl}/automations`);
-    const listData = (await listResp.json()) as {
-      automations: Array<{name: string; running: boolean}>;
-    };
-    const cronAuto = listData.automations.find((a) => a.name === 'daily-scan');
-    expect(cronAuto?.running).toBe(false);
-  });
-  // =========================================================================
-  // Stop again — should fail (not running)
-  // =========================================================================
-  it('should reject stopping a non-running automation', async () => {
-    const resp = await fetch(`${baseUrl}/automations/daily-scan/stop`, {method: 'POST'});
-    expect(resp.status).toBe(400);
-    const data = (await resp.json()) as Record<string, unknown>;
-    expect(data['error']).toContain('not running');
-  });
-  // =========================================================================
-  // Start webhook automation — should fail (always active)
-  // =========================================================================
-  it('should reject starting a webhook-triggered automation', async () => {
-    const resp = await fetch(`${baseUrl}/automations/alert-handler/start`, {method: 'POST'});
-    expect(resp.status).toBe(400);
-    const data = (await resp.json()) as Record<string, unknown>;
-    expect(data['error']).toContain('webhook-triggered');
-  });
-  // =========================================================================
-  // Start unknown — should fail
-  // =========================================================================
-  it('should reject starting unknown automation', async () => {
-    const resp = await fetch(`${baseUrl}/automations/nonexistent/start`, {method: 'POST'});
-    expect(resp.status).toBe(400);
-    const data = (await resp.json()) as Record<string, unknown>;
-    expect(data['error']).toContain('not found');
-  });
-  // =========================================================================
-  // Run — manual trigger of an unknown automation should 404
-  // (a successful manual run of a real automation is not exercised here)
-  // =========================================================================
-  it('should reject triggering unknown automation', async () => {
-    const resp = await fetch(`${baseUrl}/automations/nonexistent/run`, {
-      method: 'POST',
-      headers: {'Content-Type': 'application/json'},
-      body: JSON.stringify({}),
-    });
-    expect(resp.status).toBe(404);
-  });
-  // =========================================================================
-  // Webhook endpoint — accepts events
-  // =========================================================================
-  it('should accept webhook events for webhook-triggered automations', async () => {
-    const resp = await fetch(`${baseUrl}/webhooks/alert-handler`, {
-      method: 'POST',
-      headers: {'Content-Type': 'application/json'},
-      body: JSON.stringify({alert: 'high-cpu', host: 'web-01'}),
-    });
-    // May succeed or fail (depends on LLM availability), but route exists
-    expect([200, 500]).toContain(resp.status);
-    const data = (await resp.json()) as Record<string, unknown>;
-    // If 200, it matched and ran
-    if (resp.status === 200) {
-      expect(data['status']).toBe('accepted');
-    }
-    // If 500, it matched but execution failed (no LLM configured) — still validates routing
-    if (resp.status === 500) {
-      expect(data['matched']).toBe(true);
-    }
-  });
-  // =========================================================================
-  // Webhook for non-webhook automation — should 404
-  // =========================================================================
-  it('should reject webhook for cron-only automation', async () => {
-    const resp = await fetch(`${baseUrl}/webhooks/daily-scan`, {
-      method: 'POST',
-      headers: {'Content-Type': 'application/json'},
-      body: JSON.stringify({}),
-    });
-    expect(resp.status).toBe(404);
-  });
-  // =========================================================================
-  // Webhook for unknown automation — should 404
-  // =========================================================================
-  it('should reject webhook for unknown automation', async () => {
-    const resp = await fetch(`${baseUrl}/webhooks/nonexistent`, {
-      method: 'POST',
-      headers: {'Content-Type': 'application/json'},
-      body: JSON.stringify({}),
-    });
-    expect(resp.status).toBe(404);
-  });
-});

package/src/e2e-incident-response.test.ts DELETED

@@ -1,345 +0,0 @@
-/**
- * @license
- * Copyright 2025 Amodal Labs, Inc.
- * SPDX-License-Identifier: MIT
- */
-/**
- * End-to-end test: Incident Response Agent
- *
- * Tests the full content pipeline with all four content types:
- *   Connection (statuspage API) + Skill (incident triage) +
- *   Knowledge (oncall runbook) + Automation (health check)
- *
- * Flow:
- *   1. Create repo with all content types written to disk
- *   2. Build snapshot → verify all content present
- *   3. Start mock StatusPage API
- *   4. Boot runtime from snapshot → send chat → verify agent uses
- *      the connection, skill, and knowledge in its response
- */
-import {describe, it, expect, beforeAll, afterAll} from 'vitest';
-import {mkdtempSync, mkdirSync, writeFileSync, rmSync, existsSync} from 'node:fs';
-import {join} from 'node:path';
-import {tmpdir} from 'node:os';
-import http from 'node:http';
-import type {
-  MOCK_COMPONENTS} from './fixtures/incident-response.js';
-import {
-  CONFIG,
-  STATUSPAGE_SPEC,
-  STATUSPAGE_ACCESS,
-  STATUSPAGE_SURFACE,
-  TRIAGE_SKILL,
-  ONCALL_RUNBOOK,
-  HEALTH_CHECK_AUTOMATION,
-  createMockStatusPageApi,
-} from './fixtures/incident-response.js';
-import {runBuild} from './commands/build.js';
-import type {DeploySnapshot} from '@amodalai/core';
-import {loadRepo, loadSnapshotFromFile, snapshotToBundle} from '@amodalai/core';
-// ---------------------------------------------------------------------------
-// Helper: send chat and parse SSE events
-// ---------------------------------------------------------------------------
-/**
- * POST a chat message to the `/chat` endpoint on 127.0.0.1 and collect the
- * response as parsed SSE events.
- *
- * The whole response body is buffered until the stream ends and then split on
- * newlines; the remainder of every line starting with `data: ` is JSON-parsed
- * into one event. Lines whose payload is not valid JSON are skipped. The HTTP
- * status code is not inspected.
- *
- * @param port - Port the server is listening on.
- * @param message - Sent as `message` in the JSON body.
- * @param appId - Sent as `app_id` in the JSON body.
- * @param sessionId - Sent as `session_id`; omitted from the body when falsy.
- * @param timeoutMs - Passed as the request's `timeout` option. When the
- *   `timeout` event fires the request is destroyed and the promise rejects.
- * @returns The parsed events in arrival order plus the raw response text.
- */
-async function sendChat(
-  port: number,
-  message: string,
-  appId: string,
-  sessionId?: string,
-  timeoutMs = 30000,
-): Promise<{events: Array<Record<string, unknown>>; rawBody: string}> {
-  return new Promise((resolve, reject) => {
-    const payload: Record<string, string> = {message, app_id: appId};
-    if (sessionId) payload['session_id'] = sessionId;
-    const body = JSON.stringify(payload);
-    const req = http.request(
-      {
-        hostname: '127.0.0.1',
-        port,
-        path: '/chat',
-        method: 'POST',
-        headers: {
-          'Content-Type': 'application/json',
-          'Content-Length': Buffer.byteLength(body),
-        },
-        timeout: timeoutMs,
-      },
-      (res) => {
-        let rawBody = '';
-        res.setEncoding('utf8');
-        res.on('data', (chunk: string) => { rawBody += chunk; });
-        // Route a failure that happens after the headers arrived (connection
-        // reset, request destroyed mid-stream) to the promise as well, so the
-        // response stream never emits 'error' without a listener.
-        res.on('error', reject);
-        res.on('end', () => {
-          const events: Array<Record<string, unknown>> = [];
-          for (const line of rawBody.split('\n')) {
-            if (line.startsWith('data: ')) {
-              // Slice off the 6-character `data: ` prefix before parsing.
-              try { events.push(JSON.parse(line.slice(6)) as Record<string, unknown>); } catch { /* skip */ }
-            }
-          }
-          resolve({events, rawBody});
-        });
-      },
-    );
-    req.on('error', reject);
-    req.on('timeout', () => req.destroy(new Error('timeout')));
-    req.write(body);
-    req.end();
-  });
-}
-// ---------------------------------------------------------------------------
-// Test suite
-// ---------------------------------------------------------------------------
-/**
- * E2E suite that pushes one fixture agent (connection, skill, knowledge,
- * automation) through the full pipeline: files on disk -> `runBuild`
- * snapshot -> `createSnapshotServer` -> chat over HTTP.
- *
- * `beforeAll` prepares a temp repo, a mock StatusPage API, the built snapshot
- * and a runtime server on an ephemeral port; the nested `describe` groups
- * then inspect each stage.
- */
-describe('E2E: Incident Response Agent', () => {
-  let repoDir: string;
-  let snapshotPath: string;
-  let builtSnapshot: DeploySnapshot;
-  let mockApi: ReturnType<typeof createMockStatusPageApi>;
-  let runtimeServer: {app: unknown; start: () => Promise<unknown>; stop: () => Promise<void>} | null = null;
-  let runtimePort: number;
-  beforeAll(async () => {
-    // 1. Create repo directory structure with all content types
-    repoDir = mkdtempSync(join(tmpdir(), 'amodal-e2e-incident-'));
-    // Config
-    writeFileSync(join(repoDir, 'amodal.json'), JSON.stringify(CONFIG, null, 2));
-    // Connection: statuspage
-    const connDir = join(repoDir, 'connections', 'statuspage');
-    mkdirSync(connDir, {recursive: true});
-    writeFileSync(join(connDir, 'spec.json'), JSON.stringify(STATUSPAGE_SPEC, null, 2));
-    writeFileSync(join(connDir, 'access.json'), JSON.stringify(STATUSPAGE_ACCESS, null, 2));
-    writeFileSync(join(connDir, 'surface.md'), STATUSPAGE_SURFACE);
-    // Skill: incident-triage
-    const skillDir = join(repoDir, 'skills', 'incident-triage');
-    mkdirSync(skillDir, {recursive: true});
-    writeFileSync(join(skillDir, 'SKILL.md'), TRIAGE_SKILL);
-    // Knowledge: oncall-runbook
-    const knowledgeDir = join(repoDir, 'knowledge');
-    mkdirSync(knowledgeDir, {recursive: true});
-    writeFileSync(join(knowledgeDir, 'oncall-runbook.md'), ONCALL_RUNBOOK);
-    // Automation: health-check
-    const autoDir = join(repoDir, 'automations');
-    mkdirSync(autoDir, {recursive: true});
-    writeFileSync(join(autoDir, 'health-check.md'), HEALTH_CHECK_AUTOMATION);
-    // 2. Build snapshot
-    // NOTE(review): the snapshot loaded here is overwritten after the rebuild
-    // below, before any test reads it, so this first build/load only acts as a
-    // check that the unmodified fixture builds. Starting the mock API first
-    // would allow a single build — confirm nothing relies on the first pass.
-    snapshotPath = join(repoDir, 'resolved-config.json');
-    const code = await runBuild({cwd: repoDir, output: snapshotPath});
-    if (code !== 0) throw new Error('Build failed');
-    builtSnapshot = await loadSnapshotFromFile(snapshotPath);
-    // 3. Start mock StatusPage API
-    mockApi = createMockStatusPageApi();
-    await mockApi.start();
-    // 4. Update the spec in the snapshot to point to the mock API
-    //    (In production, the base URL comes from the spec; here we override it)
-    //    We need to rebuild with the mock URL baked in
-    const specWithMockUrl = {
-      ...STATUSPAGE_SPEC,
-      specUrl: `http://127.0.0.1:${mockApi.port}/openapi.json`,
-    };
-    writeFileSync(join(connDir, 'spec.json'), JSON.stringify(specWithMockUrl, null, 2));
-    // Rebuild snapshot with the mock URL
-    const code2 = await runBuild({cwd: repoDir, output: snapshotPath});
-    if (code2 !== 0) throw new Error('Rebuild with mock URL failed');
-    builtSnapshot = await loadSnapshotFromFile(snapshotPath);
-    // 5. Boot runtime from snapshot
-    const {createSnapshotServer} = await import('@amodalai/runtime');
-    runtimeServer = await createSnapshotServer({
-      snapshotPath,
-      port: 0,
-      host: '127.0.0.1',
-    });
-    const httpServer = await runtimeServer.start();
-    const addr = (httpServer as http.Server).address();
-    // `address()` yields null or a string when the server is not bound to a
-    // TCP port. Fail here instead of falling back to port 0, which would make
-    // every later request fail with an unrelated connection error.
-    if (addr === null || typeof addr === 'string') {
-      throw new Error('Runtime server did not report a TCP port');
-    }
-    runtimePort = addr.port;
-  });
-  afterAll(async () => {
-    // Nested `finally` blocks: a failure while stopping one resource must not
-    // skip stopping the mock API or removing the temp directory.
-    try {
-      if (runtimeServer) await runtimeServer.stop();
-    } finally {
-      try {
-        if (mockApi) await mockApi.stop();
-      } finally {
-        if (repoDir && existsSync(repoDir)) rmSync(repoDir, {recursive: true, force: true});
-      }
-    }
-  });
-  // =========================================================================
-  // Phase 1: Repo loading — all content types load from disk
-  // =========================================================================
-  describe('repo loading', () => {
-    it('should load the connection from disk', async () => {
-      const repo = await loadRepo({localPath: repoDir});
-      expect(repo.connections.size).toBe(1);
-      const conn = repo.connections.get('statuspage');
-      expect(conn).toBeDefined();
-      expect(conn!.spec.format).toBe('openapi');
-      expect(conn!.surface.length).toBeGreaterThanOrEqual(3);
-      expect(conn!.surface.find((s) => s.path === '/components')).toBeDefined();
-    });
-    it('should load the skill from disk', async () => {
-      const repo = await loadRepo({localPath: repoDir});
-      expect(repo.skills.length).toBe(1);
-      expect(repo.skills[0].name).toBe('incident-triage');
-      expect(repo.skills[0].body).toContain('Check component status');
-      expect(repo.skills[0].trigger).toContain('service health');
-    });
-    it('should load the knowledge from disk', async () => {
-      const repo = await loadRepo({localPath: repoDir});
-      expect(repo.knowledge.length).toBe(1);
-      expect(repo.knowledge[0].name).toBe('oncall-runbook');
-      expect(repo.knowledge[0].body).toContain('Severity Matrix');
-      expect(repo.knowledge[0].body).toContain('alice@example.com');
-    });
-    it('should load the automation from disk', async () => {
-      const repo = await loadRepo({localPath: repoDir});
-      expect(repo.automations.length).toBe(1);
-      expect(repo.automations[0].name).toBe('health-check');
-      expect(repo.automations[0].title).toBe('Daily Health Check');
-      expect(repo.automations[0].schedule).toBe('0 8 * * *');
-    });
-  });
-  // =========================================================================
-  // Phase 2: Snapshot — all content types serialized
-  // =========================================================================
-  describe('snapshot content', () => {
-    it('should include the connection in the snapshot', () => {
-      expect(Object.keys(builtSnapshot.connections)).toContain('statuspage');
-      const conn = builtSnapshot.connections['statuspage'];
-      expect(conn.spec.format).toBe('openapi');
-      // Surface is serialized as checkbox markdown in snapshot
-      expect(conn.surface).toContain('/components');
-      expect(conn.access.endpoints['GET /components']).toBeDefined();
-    });
-    it('should include the skill in the snapshot', () => {
-      expect(builtSnapshot.skills.length).toBe(1);
-      expect(builtSnapshot.skills[0].name).toBe('incident-triage');
-      expect(builtSnapshot.skills[0].body).toContain('Check component status');
-    });
-    it('should include the knowledge in the snapshot', () => {
-      expect(builtSnapshot.knowledge.length).toBe(1);
-      expect(builtSnapshot.knowledge[0].name).toBe('oncall-runbook');
-      expect(builtSnapshot.knowledge[0].body).toContain('SEV1');
-    });
-    it('should include the automation in the snapshot', () => {
-      expect(builtSnapshot.automations.length).toBe(1);
-      expect(builtSnapshot.automations[0].name).toBe('health-check');
-      expect(builtSnapshot.automations[0].schedule).toBe('0 8 * * *');
-    });
-    it('should round-trip all content through snapshot', () => {
-      const restored = snapshotToBundle(builtSnapshot, 'test');
-      // Connection
-      expect(restored.connections.size).toBe(1);
-      const conn = restored.connections.get('statuspage');
-      expect(conn).toBeDefined();
-      expect(conn!.spec.format).toBe('openapi');
-      // Surface endpoints parsed from markdown
-      expect(conn!.surface.length).toBeGreaterThanOrEqual(3);
-      const getComponents = conn!.surface.find((s) => s.method === 'GET' && s.path === '/components');
-      expect(getComponents).toBeDefined();
-      expect(getComponents!.included).toBe(true);
-      const postIncidents = conn!.surface.find((s) => s.method === 'POST');
-      expect(postIncidents).toBeDefined();
-      expect(postIncidents!.included).toBe(false);
-      // Skill
-      expect(restored.skills[0].name).toBe('incident-triage');
-      expect(restored.skills[0].trigger).toContain('service health');
-      // Knowledge
-      expect(restored.knowledge[0].body).toContain('alice@example.com');
-      // Automation
-      expect(restored.automations[0].schedule).toBe('0 8 * * *');
-    });
-  });
-  // =========================================================================
-  // Phase 3: Runtime — server boots from snapshot and handles chat
-  // =========================================================================
-  describe('runtime from snapshot', () => {
-    it('should serve health check with full content counts', async () => {
-      const resp = await fetch(`http://127.0.0.1:${runtimePort}/health`);
-      const data = (await resp.json()) as Record<string, unknown>;
-      expect(data['status']).toBe('ok');
-      expect(data['mode']).toBe('snapshot');
-      expect(data['agent_name']).toBe('incident-response-agent');
-      expect(data['connections']).toBe(1);
-      expect(data['skills']).toBe(1);
-    });
-    it('should handle chat and stream SSE events', async () => {
-      const {events} = await sendChat(runtimePort, 'Is the API healthy?', 'app-incident-e2e');
-      expect(events.length).toBeGreaterThanOrEqual(2);
-      expect(events.find((e) => e['type'] === 'init')).toBeDefined();
-      expect(events.find((e) => e['type'] === 'done')).toBeDefined();
-    });
-    it('should use the connection when the agent makes a tool call', async () => {
-      // The agent should try to call GET /components via the request tool
-      // when asked about API health, because the triage skill says to do that.
-      // Whether it actually calls the mock depends on the LLM, but we can
-      // check if tool_call_start events reference the statuspage connection.
-      const {events} = await sendChat(
-        runtimePort,
-        'Check the current status of all services using the statuspage connection.',
-        'app-incident-tool-e2e',
-      );
-      const toolCalls = events.filter((e) => e['type'] === 'tool_call_start');
-      const textEvents = events.filter((e) => e['type'] === 'text_delta');
-      const fullText = textEvents.map((e) => String(e['content'] ?? '')).join('');
-      // The agent should have either made a tool call or mentioned the
-      // components in its text response
-      const mentionsConnection = toolCalls.some((tc) => {
-        const params = tc['parameters'] as Record<string, unknown> | undefined;
-        return params?.['connection'] === 'statuspage';
-      });
-      const mentionsComponents = fullText.toLowerCase().includes('api-gateway') ||
-        fullText.toLowerCase().includes('component') ||
-        fullText.toLowerCase().includes('statuspage');
-      // At least one of these should be true
-      expect(mentionsConnection || mentionsComponents).toBe(true);
-    });
-  });
-  // =========================================================================
-  // Phase 4: Mock API verification
-  // =========================================================================
-  describe('mock API interaction', () => {
-    it('should have the mock API running', async () => {
-      const resp = await fetch(`http://127.0.0.1:${mockApi.port}/components`);
-      expect(resp.status).toBe(200);
-      const data = (await resp.json()) as typeof MOCK_COMPONENTS;
-      expect(data.length).toBe(5);
-      expect(data.find((c) => c.name === 'database-primary')?.status).toBe('degraded_performance');
-    });
-  });
-});