npm - sofia-cli - Versions diffs - 0.1.2 → 0.1.4 - Mend

sofia-cli 0.1.2 → 0.1.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (136)

package/README.md +42 -20
package/dist/infra/deploy.sh +193 -0
package/dist/infra/gather-env.sh +211 -0
package/dist/infra/infra/deploy.sh +193 -0
package/dist/infra/infra/gather-env.sh +211 -0
package/dist/infra/infra/main.bicep +90 -0
package/dist/infra/infra/main.bicepparam +18 -0
package/dist/infra/infra/resources.bicep +134 -0
package/dist/infra/infra/teardown.sh +114 -0
package/dist/infra/main.bicep +90 -0
package/dist/infra/main.bicepparam +18 -0
package/dist/infra/resources.bicep +134 -0
package/dist/infra/teardown.sh +114 -0
package/dist/src/cli/developCommand.js +0 -2
package/dist/src/cli/index.js +8 -1
package/dist/src/cli/workshopCommand.js +1 -1
package/dist/src/develop/index.js +1 -1
package/dist/src/develop/pocUtils.js +228 -0
package/dist/src/develop/ralphLoop.js +8 -27
package/dist/src/shared/data/cards.json +655 -670
package/docs/architecture.md +2 -1
package/package.json +5 -3
package/src/cli/developCommand.ts +1 -3
package/src/cli/index.ts +11 -1
package/src/cli/workshopCommand.ts +21 -17
package/src/develop/dynamicScaffolder.ts +36 -30
package/src/develop/index.ts +13 -2
package/src/develop/pocUtils.ts +296 -0
package/src/develop/ralphLoop.ts +8 -28
package/src/develop/templateRegistry.ts +19 -18
package/src/shared/data/cards.json +655 -670
package/tests/e2e/developE2e.spec.ts +3 -61
package/tests/e2e/developFailureE2e.spec.ts +34 -38
package/tests/integration/pocGithubMcp.spec.ts +29 -39
package/tests/integration/pocLocalFallback.spec.ts +29 -39
package/tests/integration/ralphLoopFlow.spec.ts +46 -66
package/tests/integration/ralphLoopPartial.spec.ts +30 -37
package/tests/unit/develop/githubMcpAdapter.spec.ts +0 -134
package/tests/unit/develop/outputValidator.spec.ts +45 -21
package/tests/unit/develop/ralphLoop.spec.ts +58 -94
package/tsconfig.json +2 -1
package/vitest.workspace.ts +5 -0
package/dist/src/develop/pocScaffolder.js +0 -542
package/dist/tests/e2e/developE2e.spec.js +0 -126
package/dist/tests/e2e/developFailureE2e.spec.js +0 -247
package/dist/tests/e2e/developPty.spec.js +0 -75
package/dist/tests/e2e/discoveryWebSearchRelevance.spec.js +0 -84
package/dist/tests/e2e/harness.spec.js +0 -83
package/dist/tests/e2e/mcpLive.spec.js +0 -120
package/dist/tests/e2e/newSession.e2e.spec.js +0 -177
package/dist/tests/e2e/ralphLoopEnrichmentComparison.spec.js +0 -62
package/dist/tests/e2e/workiqEnrichment.spec.js +0 -56
package/dist/tests/e2e/zavaSimulation.spec.js +0 -452
package/dist/tests/fixtures/test-fixture-project/src/add.js +0 -3
package/dist/tests/fixtures/test-fixture-project/tests/failing.test.js +0 -6
package/dist/tests/fixtures/test-fixture-project/tests/hanging.test.js +0 -8
package/dist/tests/fixtures/test-fixture-project/tests/passing.test.js +0 -10
package/dist/tests/fixtures/test-fixture-project/vitest.config.js +0 -6
package/dist/tests/integration/autoStartConversation.spec.js +0 -138
package/dist/tests/integration/defaultCommand.spec.js +0 -147
package/dist/tests/integration/directCommandNonTty.spec.js +0 -224
package/dist/tests/integration/directCommandTty.spec.js +0 -151
package/dist/tests/integration/discoveryEnrichmentFlow.spec.js +0 -175
package/dist/tests/integration/exportArtifacts.spec.js +0 -202
package/dist/tests/integration/exportFallbackFlow.spec.js +0 -99
package/dist/tests/integration/mcpDegradationFlow.spec.js +0 -190
package/dist/tests/integration/mcpTransportFlow.spec.js +0 -139
package/dist/tests/integration/newSessionFlow.spec.js +0 -343
package/dist/tests/integration/pocGithubMcp.spec.js +0 -186
package/dist/tests/integration/pocLocalFallback.spec.js +0 -171
package/dist/tests/integration/pocScaffold.spec.js +0 -163
package/dist/tests/integration/ralphLoopFlow.spec.js +0 -359
package/dist/tests/integration/ralphLoopPartial.spec.js +0 -368
package/dist/tests/integration/resumeAndBacktrack.spec.js +0 -247
package/dist/tests/integration/spinnerLifecycle.spec.js +0 -220
package/dist/tests/integration/summarizationFlow.spec.js +0 -115
package/dist/tests/integration/testRunnerReal.spec.js +0 -52
package/dist/tests/integration/webSearchAgent.spec.js +0 -128
package/dist/tests/live/copilotSdkLive.spec.js +0 -107
package/dist/tests/live/zavaFullWorkshop.spec.js +0 -392
package/dist/tests/setup/loadEnv.js +0 -3
package/dist/tests/unit/cli/developCommand.spec.js +0 -567
package/dist/tests/unit/cli/directCommands.spec.js +0 -279
package/dist/tests/unit/cli/envLoader.spec.js +0 -58
package/dist/tests/unit/cli/ioContext.spec.js +0 -119
package/dist/tests/unit/cli/preflight.spec.js +0 -108
package/dist/tests/unit/cli/statusCommand.spec.js +0 -111
package/dist/tests/unit/cli/workshopClientFallback.spec.js +0 -80
package/dist/tests/unit/cli/workshopCommand.spec.js +0 -328
package/dist/tests/unit/config/vitestEnvSetup.spec.js +0 -13
package/dist/tests/unit/develop/checkpointState.spec.js +0 -315
package/dist/tests/unit/develop/codeGenerator.spec.js +0 -355
package/dist/tests/unit/develop/githubMcpAdapter.spec.js +0 -231
package/dist/tests/unit/develop/mcpContextEnricher.spec.js +0 -433
package/dist/tests/unit/develop/outputValidator.spec.js +0 -119
package/dist/tests/unit/develop/pocScaffolder.spec.js +0 -353
package/dist/tests/unit/develop/ralphLoop.spec.js +0 -1248
package/dist/tests/unit/develop/templateRegistry.spec.js +0 -85
package/dist/tests/unit/develop/testRunner.spec.js +0 -249
package/dist/tests/unit/infraBicep.spec.js +0 -92
package/dist/tests/unit/infraDeploy.spec.js +0 -82
package/dist/tests/unit/infraTeardown.spec.js +0 -63
package/dist/tests/unit/logging/logger.spec.js +0 -43
package/dist/tests/unit/loop/conversationLoop.spec.js +0 -592
package/dist/tests/unit/loop/phaseSummarizer.spec.js +0 -141
package/dist/tests/unit/loop/streamingMarkdown.spec.js +0 -147
package/dist/tests/unit/mcp/mcpManager.spec.js +0 -279
package/dist/tests/unit/mcp/mcpTransport.spec.js +0 -529
package/dist/tests/unit/mcp/retryPolicy.spec.js +0 -218
package/dist/tests/unit/mcp/timeoutValidation.spec.js +0 -46
package/dist/tests/unit/mcp/webSearch.spec.js +0 -567
package/dist/tests/unit/phases/contextSummarizer.spec.js +0 -140
package/dist/tests/unit/phases/discoveryEnricher.repeatCalls.spec.js +0 -93
package/dist/tests/unit/phases/discoveryEnricher.spec.js +0 -411
package/dist/tests/unit/phases/phaseExtractors.spec.js +0 -352
package/dist/tests/unit/phases/phaseHandlers.spec.js +0 -425
package/dist/tests/unit/prompts/promptLoader.spec.js +0 -118
package/dist/tests/unit/schemas/pocSchemas.spec.js +0 -412
package/dist/tests/unit/schemas/session.spec.js +0 -257
package/dist/tests/unit/sessions/exportPaths.spec.js +0 -31
package/dist/tests/unit/sessions/exportWriter.spec.js +0 -655
package/dist/tests/unit/sessions/sessionManager.spec.js +0 -151
package/dist/tests/unit/sessions/sessionStore.spec.js +0 -116
package/dist/tests/unit/shared/activitySpinner.spec.js +0 -175
package/dist/tests/unit/shared/cardsLoader.spec.js +0 -76
package/dist/tests/unit/shared/copilotClient.spec.js +0 -155
package/dist/tests/unit/shared/errorClassifier.spec.js +0 -131
package/dist/tests/unit/shared/events.spec.js +0 -55
package/dist/tests/unit/shared/markdownRenderer.spec.js +0 -35
package/dist/tests/unit/shared/markdownRendererChunks.spec.js +0 -70
package/dist/tests/unit/shared/tableRenderer.spec.js +0 -34
package/dist/vitest.config.js +0 -14
package/dist/vitest.live.config.js +0 -18
package/src/develop/pocScaffolder.ts +0 -646
package/tests/integration/pocScaffold.spec.ts +0 -220
package/tests/unit/develop/pocScaffolder.spec.ts +0 -451

package/dist/tests/e2e/developFailureE2e.spec.js DELETED

@@ -1,247 +0,0 @@
-/**
- * T050: E2E failure/recovery test.
- *
- * Verifies graceful termination; verifies `finalStatus` is "failed" or "partial"
- * in session state; verifies `terminationReason: "max-iterations"`;
- * verifies user-facing output includes recovery guidance (Constitution VI compliance).
- */
-import { describe, it, expect, vi, beforeEach, afterEach } from 'vitest';
-import { mkdtemp, rm } from 'node:fs/promises';
-import { join } from 'node:path';
-import { tmpdir } from 'node:os';
-import { createRequire } from 'node:module';
-import { RalphLoop } from '../../src/develop/ralphLoop.js';
-vi.mock('node:child_process', async (importOriginal) => {
-    const actual = await importOriginal();
-    return {
-        ...actual,
-        spawn: vi.fn((cmd, args) => {
-            if (cmd === 'npm' && args.includes('install')) {
-                return {
-                    stdout: { on: vi.fn() },
-                    stderr: { on: vi.fn() },
-                    on: vi.fn((event, cb) => {
-                        if (event === 'close')
-                            cb(0);
-                    }),
-                    kill: vi.fn(),
-                    killed: false,
-                };
-            }
-            return actual.spawn(cmd, args);
-        }),
-    };
-});
-const require = createRequire(import.meta.url);
-const fixtureSession = require('../fixtures/completedSession.json');
-describe('E2E: failure/recovery (T050)', () => {
-    let tmpDir;
-    let originalExitCode;
-    beforeEach(async () => {
-        tmpDir = await mkdtemp(join(tmpdir(), 'sofia-e2e-failure-'));
-        originalExitCode = process.exitCode;
-        process.exitCode = undefined;
-    });
-    afterEach(async () => {
-        await rm(tmpDir, { recursive: true, force: true });
-        process.exitCode = originalExitCode;
-        vi.restoreAllMocks();
-    });
-    function makeIo() {
-        const writtenLines = [];
-        const activityLines = [];
-        return {
-            writtenLines,
-            activityLines,
-            write: vi.fn((text) => { writtenLines.push(text); }),
-            writeActivity: vi.fn((text) => { activityLines.push(text); }),
-            writeToolSummary: vi.fn(),
-            readInput: vi.fn().mockResolvedValue(null),
-            showDecisionGate: vi.fn(),
-            isJsonMode: false,
-            isTTY: false,
-        };
-    }
-    function makeFakeScaffolder(outputDir) {
-        return {
-            scaffold: vi.fn().mockImplementation(async () => {
-                const { writeFile, mkdir } = await import('node:fs/promises');
-                await mkdir(join(outputDir, 'src'), { recursive: true });
-                await writeFile(join(outputDir, 'package.json'), JSON.stringify({
-                    name: 'test-poc',
-                    scripts: { test: 'vitest run' },
-                    dependencies: {},
-                    devDependencies: {},
-                }), 'utf-8');
-                await writeFile(join(outputDir, 'src', 'index.ts'), 'export function main() {}', 'utf-8');
-                return {
-                    createdFiles: ['package.json', 'src/index.ts'],
-                    skippedFiles: [],
-                    context: {
-                        projectName: 'test-poc',
-                        ideaTitle: 'Test',
-                        ideaDescription: 'Test',
-                        techStack: { language: 'TypeScript', runtime: 'Node.js 20', testRunner: 'npm test' },
-                        planSummary: 'Test',
-                        sessionId: fixtureSession.sessionId,
-                        outputDir,
-                    },
-                };
-            }),
-            getTemplateFiles: () => [],
-        };
-    }
-    function makeAlwaysFailingClient() {
-        return {
-            createSession: vi.fn().mockResolvedValue({
-                send: vi.fn().mockReturnValue({
-                    async *[Symbol.asyncIterator]() {
-                        yield { type: 'TextDelta', text: '', timestamp: '' };
-                    },
-                }),
-                getHistory: () => [],
-            }),
-        };
-    }
-    function makeAlwaysFailingTestRunner() {
-        return {
-            run: vi.fn().mockResolvedValue({
-                passed: 0,
-                failed: 1,
-                skipped: 0,
-                total: 1,
-                durationMs: 400,
-                failures: [{ testName: 'test', message: 'always fails' }],
-                rawOutput: '',
-            }),
-        };
-    }
-    it('terminates with max-iterations when all tests keep failing', async () => {
-        const io = makeIo();
-        const scaffolder = makeFakeScaffolder(tmpDir);
-        const client = makeAlwaysFailingClient();
-        const testRunner = makeAlwaysFailingTestRunner();
-        const ralph = new RalphLoop({
-            client,
-            io,
-            session: fixtureSession,
-            outputDir: tmpDir,
-            maxIterations: 2,
-            testRunner,
-            scaffolder,
-        });
-        const result = await ralph.run();
-        expect(result.terminationReason).toBe('max-iterations');
-        expect(['failed', 'partial']).toContain(result.finalStatus);
-    });
-    it('verifies terminationReason=max-iterations in session state', async () => {
-        const io = makeIo();
-        const scaffolder = makeFakeScaffolder(tmpDir);
-        const client = makeAlwaysFailingClient();
-        const testRunner = makeAlwaysFailingTestRunner();
-        const ralph = new RalphLoop({
-            client,
-            io,
-            session: fixtureSession,
-            outputDir: tmpDir,
-            maxIterations: 2,
-            testRunner,
-            scaffolder,
-        });
-        const result = await ralph.run();
-        expect(result.session.poc?.terminationReason).toBe('max-iterations');
-        expect(result.session.poc?.finalStatus).toBeDefined();
-    });
-    it('session has iteration history after failed loop', async () => {
-        const io = makeIo();
-        const scaffolder = makeFakeScaffolder(tmpDir);
-        const client = makeAlwaysFailingClient();
-        const testRunner = makeAlwaysFailingTestRunner();
-        const ralph = new RalphLoop({
-            client,
-            io,
-            session: fixtureSession,
-            outputDir: tmpDir,
-            maxIterations: 2,
-            testRunner,
-            scaffolder,
-        });
-        const result = await ralph.run();
-        // Should have at least scaffold iteration
-        expect(result.session.poc?.iterations.length).toBeGreaterThan(0);
-        expect(result.session.poc?.iterations[0].outcome).toBe('scaffold');
-    });
-    it('shows recovery guidance in non-JSON output for failed status (Constitution VI)', async () => {
-        const { developCommand } = await import('../../src/cli/developCommand.js');
-        const devIo = makeIo();
-        const client = makeAlwaysFailingClient();
-        const store = {
-            load: vi.fn().mockResolvedValue(fixtureSession),
-            save: vi.fn().mockResolvedValue(undefined),
-            list: vi.fn().mockResolvedValue([fixtureSession.sessionId]),
-        };
-        // Mock RalphLoop.prototype.run to return failed immediately
-        const originalRun = RalphLoop.prototype.run;
-        const sessionWithFailedPoc = {
-            ...fixtureSession,
-            poc: {
-                repoSource: 'local',
-                repoPath: tmpDir,
-                iterations: [],
-                finalStatus: 'failed',
-                terminationReason: 'max-iterations',
-            },
-        };
-        RalphLoop.prototype.run = vi.fn().mockResolvedValue({
-            session: sessionWithFailedPoc,
-            finalStatus: 'failed',
-            terminationReason: 'max-iterations',
-            iterationsCompleted: 2,
-            outputDir: tmpDir,
-        });
-        try {
-            await developCommand({ session: fixtureSession.sessionId, maxIterations: 1, output: tmpDir }, { store, io: devIo, client });
-        }
-        finally {
-            RalphLoop.prototype.run = originalRun;
-        }
-        const allOutput = devIo.writtenLines.join('\n');
-        // developCommand should show recovery guidance for non-success status
-        expect(allOutput).toMatch(/resume|retry|force|more.*iter/i);
-    });
-    it('sets process.exitCode=1 when loop terminates with failed status', async () => {
-        const { developCommand } = await import('../../src/cli/developCommand.js');
-        const devIo = makeIo();
-        const client = makeAlwaysFailingClient();
-        const store = {
-            load: vi.fn().mockResolvedValue(fixtureSession),
-            save: vi.fn().mockResolvedValue(undefined),
-            list: vi.fn().mockResolvedValue([fixtureSession.sessionId]),
-        };
-        const sessionWithFailedPoc = {
-            ...fixtureSession,
-            poc: {
-                repoSource: 'local',
-                repoPath: tmpDir,
-                iterations: [],
-                finalStatus: 'failed',
-                terminationReason: 'max-iterations',
-            },
-        };
-        const originalRun = RalphLoop.prototype.run;
-        RalphLoop.prototype.run = vi.fn().mockResolvedValue({
-            session: sessionWithFailedPoc,
-            finalStatus: 'failed',
-            terminationReason: 'max-iterations',
-            iterationsCompleted: 2,
-            outputDir: tmpDir,
-        });
-        try {
-            await developCommand({ session: fixtureSession.sessionId }, { store, io: devIo, client });
-        }
-        finally {
-            RalphLoop.prototype.run = originalRun;
-        }
-        expect(process.exitCode).toBe(1);
-    });
-});

package/dist/tests/e2e/developPty.spec.js DELETED

@@ -1,75 +0,0 @@
-/**
- * T049-T051: PTY-based interactive E2E tests for `sofia dev`.
- *
- * Validates Ctrl+C handling, progress output, and clean exit behavior.
- * Gracefully skips if node-pty allocation fails (e.g., CI without TTY).
- */
-import { describe, it, expect } from 'vitest';
-// ── PTY availability guard (T051) ────────────────────────────────────────────
-let pty;
-let ptyAvailable = false;
-try {
-    pty = await import('node-pty');
-    // Attempt a minimal allocation to verify PTY works
-    const testProc = pty.spawn('echo', ['test'], { cols: 80, rows: 24 });
-    testProc.kill();
-    ptyAvailable = true;
-}
-catch {
-    ptyAvailable = false;
-}
-describe('PTY-based E2E: sofia dev', () => {
-    // T051: Skip gracefully if node-pty allocation fails
-    const itPty = ptyAvailable ? it : it.skip;
-    itPty('help output appears in PTY buffer (T050)', async () => {
-        if (!pty)
-            return;
-        const proc = pty.spawn('npx', ['tsx', 'src/cli/index.ts', 'dev', '--help'], {
-            cols: 120,
-            rows: 40,
-            cwd: process.cwd(),
-            env: { ...process.env },
-        });
-        let output = '';
-        proc.onData((data) => {
-            output += data;
-        });
-        const exitCode = await new Promise((resolve) => {
-            proc.onExit(({ exitCode: code }) => {
-                resolve(code);
-            });
-            setTimeout(() => {
-                proc.kill();
-                resolve(-1);
-            }, 15_000);
-        });
-        // --help should produce usage output containing 'dev'
-        expect(output).toContain('dev');
-        expect(exitCode).toBe(0);
-    }, 20_000);
-    itPty('Ctrl+C sends signal to running process (T049)', async () => {
-        if (!pty)
-            return;
-        // Use a simple process that sleeps, then send Ctrl+C
-        const proc = pty.spawn('sleep', ['30'], {
-            cols: 80,
-            rows: 24,
-            cwd: process.cwd(),
-            env: { ...process.env },
-        });
-        // Wait briefly then send Ctrl+C
-        await new Promise((resolve) => setTimeout(resolve, 500));
-        proc.write('\x03'); // Ctrl+C
-        const exitCode = await new Promise((resolve) => {
-            proc.onExit(({ exitCode: code }) => {
-                resolve(code);
-            });
-            setTimeout(() => {
-                proc.kill();
-                resolve(-999);
-            }, 5_000);
-        });
-        // Process should have been interrupted (not timed out)
-        expect(exitCode).not.toBe(-999);
-    }, 10_000);
-});

package/dist/tests/e2e/discoveryWebSearchRelevance.spec.js DELETED

@@ -1,84 +0,0 @@
-/**
- * T041: Discovery web search enrichment relevance validation (SC-003-005).
- *
- * Validates that discovery web search enrichment retrieves keyword-relevant
- * context for at least 3 out of 5 test company descriptions.
- * Gated behind SOFIA_LIVE_MCP_TESTS=true because it requires real web search.
- *
- * Acceptance criteria:
- * - Run enrichFromWebSearch() for 5 different company descriptions
- * - At least 3/5 must return results with keyword-relevant content
- * - "Keyword-relevant" = at least one result snippet contains a word from the company/industry
- */
-import { describe, it, expect } from 'vitest';
-const LIVE = process.env.SOFIA_LIVE_MCP_TESTS === 'true';
-const TEST_COMPANIES = [
-    {
-        summary: '"Nestlé" is a global food and beverage company headquartered in Switzerland.',
-        keywords: ['food', 'beverage', 'switzerland', 'global', 'company'],
-    },
-    {
-        summary: '"Zara" is a global retail company headquartered in Spain.',
-        keywords: ['retail', 'fashion', 'spain', 'global', 'company'],
-    },
-    {
-        summary: '"Microsoft Corporation" is a global technology company headquartered in Redmond, Washington.',
-        keywords: ['technology', 'software', 'hardware', 'cloud', 'global'],
-    },
-    {
-        summary: '"Maersk" is a global shipping and logistics company headquartered in Copenhagen, Denmark.',
-        keywords: ['shipping', 'logistics', 'denmark', 'global', 'company'],
-    },
-    {
-        summary: '"Hasbro" is a global toy and entertainment company headquartered in Pawtucket, Rhode Island.',
-        keywords: ['toy', 'entertainment', 'rhode island', 'global', 'company'],
-    },
-];
-describe.skipIf(!LIVE)('Discovery web search relevance validation (T041 / SC-003-005)', () => {
-    it('at least 3/5 company descriptions return keyword-relevant results', async () => {
-        const { DiscoveryEnricher } = await import('../../src/phases/discoveryEnricher.js');
-        const { createWebSearchTool } = await import('../../src/mcp/webSearch.js');
-        const webSearchFn = createWebSearchTool({
-            projectEndpoint: process.env.FOUNDRY_PROJECT_ENDPOINT,
-            modelDeploymentName: process.env.FOUNDRY_MODEL_DEPLOYMENT_NAME,
-        });
-        const webSearchClient = {
-            search: async (query) => webSearchFn(query),
-        };
-        const enricher = new DiscoveryEnricher();
-        let relevantCount = 0;
-        const results = [];
-        for (const company of TEST_COMPANIES) {
-            const enrichment = await enricher.enrichFromWebSearch(company.summary, webSearchClient);
-            // Collect all result strings from enrichment
-            const allText = [
-                ...(enrichment.companyNews ?? []),
-                ...(enrichment.competitorInfo ?? []),
-                ...(enrichment.industryTrends ?? []),
-            ]
-                .join(' ')
-                .toLowerCase();
-            const snippetCount = (enrichment.companyNews?.length ?? 0) +
-                (enrichment.competitorInfo?.length ?? 0) +
-                (enrichment.industryTrends?.length ?? 0);
-            // Check if any keyword appears in the results
-            const hasRelevantKeyword = company.keywords.some((kw) => allText.includes(kw.toLowerCase()));
-            if (hasRelevantKeyword && snippetCount > 0) {
-                relevantCount++;
-            }
-            results.push({
-                company: company.summary.split('"')[1] || company.summary.slice(0, 30),
-                relevant: hasRelevantKeyword && snippetCount > 0,
-                snippetCount,
-            });
-        }
-        // Log outcomes for manual review
-        console.log('=== T041 Web Search Relevance Validation ===');
-        for (const r of results) {
-            console.log(`  ${r.relevant ? '✓' : '✗'} ${r.company}: ${r.snippetCount} snippets`);
-        }
-        console.log(`Result: ${relevantCount}/5 companies have relevant results`);
-        // Acceptance: at least 3 out of 5
-        expect(relevantCount).toBeGreaterThanOrEqual(3);
-    }, 120_000); // 2 minute timeout for multiple web searches
-});

package/dist/tests/e2e/harness.spec.js DELETED

@@ -1,83 +0,0 @@
-/**
- * E2E test harness skeleton.
- *
- * Uses node-pty to drive the sofIA CLI interactively, simulating
- * user input and verifying streaming output. This is a skeleton —
- * actual E2E test scenarios will be added in US1 (T021).
- *
- * Requirements:
- * - node-pty must be installed (`npm install node-pty`)
- * - Tests run under the `test:e2e` npm script
- */
-import { describe, it, expect } from 'vitest';
-import { spawn } from 'node:child_process';
-import { join, dirname } from 'node:path';
-import { fileURLToPath } from 'node:url';
-const __dirname = dirname(fileURLToPath(import.meta.url));
-const PROJECT_ROOT = join(__dirname, '..', '..');
-const CLI_ENTRY = join(PROJECT_ROOT, 'src', 'cli', 'index.ts');
-/**
- * Run the sofIA CLI with given arguments and return output.
- * Uses tsx to run TypeScript directly.
- */
-function runCli(args, timeoutMs = 10000) {
-    return new Promise((resolve, reject) => {
-        const child = spawn('npx', ['tsx', CLI_ENTRY, ...args], {
-            cwd: PROJECT_ROOT,
-            env: { ...process.env, NODE_ENV: 'test' },
-            stdio: ['pipe', 'pipe', 'pipe'],
-        });
-        const stdout = [];
-        const stderr = [];
-        child.stdout.on('data', (chunk) => stdout.push(chunk));
-        child.stderr.on('data', (chunk) => stderr.push(chunk));
-        const timer = setTimeout(() => {
-            child.kill('SIGTERM');
-            reject(new Error(`CLI timed out after ${timeoutMs}ms`));
-        }, timeoutMs);
-        child.on('close', (code) => {
-            clearTimeout(timer);
-            resolve({
-                stdout: Buffer.concat(stdout).toString('utf-8'),
-                stderr: Buffer.concat(stderr).toString('utf-8'),
-                exitCode: code,
-            });
-        });
-        child.on('error', (err) => {
-            clearTimeout(timer);
-            reject(err);
-        });
-    });
-}
-// ── Tests ────────────────────────────────────────────────────────────────────
-describe('E2E Harness', () => {
-    it('displays help when invoked with --help', async () => {
-        const result = await runCli(['--help']);
-        expect(result.exitCode).toBe(0);
-        expect(result.stdout).toContain('sofIA');
-        expect(result.stdout).toContain('workshop');
-        expect(result.stdout).toContain('status');
-        expect(result.stdout).toContain('export');
-    }, 15_000);
-    it('displays version when invoked with --version', async () => {
-        const result = await runCli(['--version']);
-        expect(result.exitCode).toBe(0);
-        expect(result.stdout.trim()).toMatch(/^\d+\.\d+\.\d+$/);
-    }, 15_000);
-    it('shows workshop help', async () => {
-        const result = await runCli(['workshop', '--help']);
-        expect(result.exitCode).toBe(0);
-        expect(result.stdout).toContain('workshop');
-    }, 15_000);
-    it('lists sessions or reports none when status invoked without session', async () => {
-        const result = await runCli(['status', '--json']);
-        // Either lists sessions or reports no sessions found — both valid
-        const parsed = JSON.parse(result.stdout);
-        expect(parsed).toBeDefined();
-        expect('sessions' in parsed || 'error' in parsed).toBe(true);
-    }, 15_000);
-    it('returns error for export without session', async () => {
-        const result = await runCli(['export', '--json']);
-        expect(result.stdout).toContain('No session specified');
-    }, 15_000);
-});

package/dist/tests/e2e/mcpLive.spec.js DELETED

@@ -1,120 +0,0 @@
-/**
- * T039: Live MCP smoke tests.
- *
- * Gated behind SOFIA_LIVE_MCP_TESTS=true environment variable.
- * These tests exercise real MCP server integrations:
- * - GitHub MCP: create/delete a test repository (infrastructure validation only)
- * - Context7: resolve a library ID
- * - Azure MCP: return documentation for a simple query
- * - Web search: return results for a test query
- *
- * NOTE: GitHub MCP test validates the infrastructure works, but sofIA does NOT
- * automatically create GitHub repos during PoC generation. PoCs are created locally
- * with git init, and users manually push when ready (safer approach).
- *
- * Requires:
- * - GitHub MCP: GITHUB_TOKEN env var OR `gh auth login` (GitHub CLI)
- * - MCP servers accessible
- */
-import { describe, it, expect } from 'vitest';
-import { execSync } from 'node:child_process';
-const LIVE = process.env.SOFIA_LIVE_MCP_TESTS === 'true';
-/**
- * Check if GitHub authentication is available (env var or GitHub CLI).
- */
-function hasGitHubAuth() {
-    if (process.env.GITHUB_TOKEN)
-        return true;
-    try {
-        const token = execSync('gh auth token', {
-            encoding: 'utf8',
-            stdio: ['pipe', 'pipe', 'ignore'],
-            timeout: 2000,
-        }).trim();
-        return !!token;
-    }
-    catch {
-        return false;
-    }
-}
-describe.skipIf(!LIVE)('Live MCP Smoke Tests (T039)', () => {
-    it.skipIf(!hasGitHubAuth())('GitHub MCP: creates and deletes a test repository', { timeout: 35_000 }, async () => {
-        // This test requires GITHUB_TOKEN env var OR `gh auth login` (GitHub CLI)
-        const { McpManager, loadMcpConfig } = await import('../../src/mcp/mcpManager.js');
-        const config = await loadMcpConfig('.vscode/mcp.json');
-        const manager = new McpManager(config);
-        manager.markConnected('github');
-        const repoName = `sofia-mcp-test-${Date.now()}`;
-        try {
-            const createResult = await manager.callTool('github', 'create_repository', {
-                name: repoName,
-                description: 'Automated MCP integration test — safe to delete',
-                private: true,
-            }, { timeoutMs: 30_000 });
-            expect(createResult).toBeDefined();
-            expect(typeof createResult).toBe('object');
-            // Verify the repository was created - McpManager already parses the content
-            expect(createResult).toHaveProperty('url');
-            expect(createResult.url).toContain(repoName);
-            // Best-effort cleanup: delete the test repo using GitHub CLI
-            // Note: This requires delete_repo scope; if it fails, the repo will need manual cleanup
-            try {
-                const username = execSync('gh api user --jq .login', { encoding: 'utf8' }).trim();
-                execSync(`gh repo delete ${username}/${repoName} --yes`, {
-                    encoding: 'utf8',
-                    stdio: ['pipe', 'pipe', 'pipe'], // capture all output
-                });
-            }
-            catch (_cleanupError) {
-                // Cleanup failure is not a test failure - just log it
-                console.warn(`⚠️  Could not auto-delete test repo ${repoName}. Please delete manually or grant delete_repo scope.`);
-                console.warn(`   Command: gh repo delete <username>/${repoName} --yes`);
-            }
-        }
-        finally {
-            await manager.disconnectAll();
-        }
-    });
-    it('Context7: resolves "express" library ID', async () => {
-        const { McpManager, loadMcpConfig } = await import('../../src/mcp/mcpManager.js');
-        const config = await loadMcpConfig('.vscode/mcp.json');
-        const manager = new McpManager(config);
-        manager.markConnected('context7');
-        try {
-            const result = await manager.callTool('context7', 'resolve-library-id', {
-                query: 'resolve express library id',
-                libraryName: 'express',
-            }, { timeoutMs: 30_000 });
-            expect(result).toBeDefined();
-            const rawText = typeof result.text === 'string' ? result.text : JSON.stringify(result);
-            const content = rawText.toLowerCase();
-            // Response should contain meaningful resolve-library-id content
-            const expectedKeywords = ['express', 'context7-compatible library id', 'code snippets'];
-            const matchedKeywords = expectedKeywords.filter((keyword) => content.includes(keyword));
-            expect(matchedKeywords.length).toBeGreaterThanOrEqual(2);
-            // Ensure at least one high-confidence Express library ID appears
-            expect(content).toMatch(/\/expressjs\/express|\/websites\/expressjs_en/);
-        }
-        finally {
-            await manager.disconnectAll();
-        }
-    });
-    it('Web search: returns results for a test query', async () => {
-        const { createWebSearchTool, isWebSearchConfigured } = await import('../../src/mcp/webSearch.js');
-        // Skip if web search is not configured
-        if (!isWebSearchConfigured()) {
-            console.log('Web search not configured, skipping test');
-            return;
-        }
-        const webSearch = createWebSearchTool({
-            projectEndpoint: process.env.FOUNDRY_PROJECT_ENDPOINT,
-            modelDeploymentName: process.env.FOUNDRY_MODEL_DEPLOYMENT_NAME,
-        });
-        const result = await webSearch('TypeScript Node.js framework 2025');
-        expect(result.degraded).toBeOneOf([false, undefined]);
-        expect(result).toBeDefined();
-        expect(result.results).toBeDefined();
-        expect(Array.isArray(result.results)).toBe(true);
-        expect(result.results.length).toBeGreaterThan(0);
-    }, 30_000); // 30 second timeout for web search
-});