npm - sofia-cli - Versions diffs - 0.1.2 → 0.1.4 - Mend

sofia-cli 0.1.2 → 0.1.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (136)

package/README.md +42 -20
package/dist/infra/deploy.sh +193 -0
package/dist/infra/gather-env.sh +211 -0
package/dist/infra/infra/deploy.sh +193 -0
package/dist/infra/infra/gather-env.sh +211 -0
package/dist/infra/infra/main.bicep +90 -0
package/dist/infra/infra/main.bicepparam +18 -0
package/dist/infra/infra/resources.bicep +134 -0
package/dist/infra/infra/teardown.sh +114 -0
package/dist/infra/main.bicep +90 -0
package/dist/infra/main.bicepparam +18 -0
package/dist/infra/resources.bicep +134 -0
package/dist/infra/teardown.sh +114 -0
package/dist/src/cli/developCommand.js +0 -2
package/dist/src/cli/index.js +8 -1
package/dist/src/cli/workshopCommand.js +1 -1
package/dist/src/develop/index.js +1 -1
package/dist/src/develop/pocUtils.js +228 -0
package/dist/src/develop/ralphLoop.js +8 -27
package/dist/src/shared/data/cards.json +655 -670
package/docs/architecture.md +2 -1
package/package.json +5 -3
package/src/cli/developCommand.ts +1 -3
package/src/cli/index.ts +11 -1
package/src/cli/workshopCommand.ts +21 -17
package/src/develop/dynamicScaffolder.ts +36 -30
package/src/develop/index.ts +13 -2
package/src/develop/pocUtils.ts +296 -0
package/src/develop/ralphLoop.ts +8 -28
package/src/develop/templateRegistry.ts +19 -18
package/src/shared/data/cards.json +655 -670
package/tests/e2e/developE2e.spec.ts +3 -61
package/tests/e2e/developFailureE2e.spec.ts +34 -38
package/tests/integration/pocGithubMcp.spec.ts +29 -39
package/tests/integration/pocLocalFallback.spec.ts +29 -39
package/tests/integration/ralphLoopFlow.spec.ts +46 -66
package/tests/integration/ralphLoopPartial.spec.ts +30 -37
package/tests/unit/develop/githubMcpAdapter.spec.ts +0 -134
package/tests/unit/develop/outputValidator.spec.ts +45 -21
package/tests/unit/develop/ralphLoop.spec.ts +58 -94
package/tsconfig.json +2 -1
package/vitest.workspace.ts +5 -0
package/dist/src/develop/pocScaffolder.js +0 -542
package/dist/tests/e2e/developE2e.spec.js +0 -126
package/dist/tests/e2e/developFailureE2e.spec.js +0 -247
package/dist/tests/e2e/developPty.spec.js +0 -75
package/dist/tests/e2e/discoveryWebSearchRelevance.spec.js +0 -84
package/dist/tests/e2e/harness.spec.js +0 -83
package/dist/tests/e2e/mcpLive.spec.js +0 -120
package/dist/tests/e2e/newSession.e2e.spec.js +0 -177
package/dist/tests/e2e/ralphLoopEnrichmentComparison.spec.js +0 -62
package/dist/tests/e2e/workiqEnrichment.spec.js +0 -56
package/dist/tests/e2e/zavaSimulation.spec.js +0 -452
package/dist/tests/fixtures/test-fixture-project/src/add.js +0 -3
package/dist/tests/fixtures/test-fixture-project/tests/failing.test.js +0 -6
package/dist/tests/fixtures/test-fixture-project/tests/hanging.test.js +0 -8
package/dist/tests/fixtures/test-fixture-project/tests/passing.test.js +0 -10
package/dist/tests/fixtures/test-fixture-project/vitest.config.js +0 -6
package/dist/tests/integration/autoStartConversation.spec.js +0 -138
package/dist/tests/integration/defaultCommand.spec.js +0 -147
package/dist/tests/integration/directCommandNonTty.spec.js +0 -224
package/dist/tests/integration/directCommandTty.spec.js +0 -151
package/dist/tests/integration/discoveryEnrichmentFlow.spec.js +0 -175
package/dist/tests/integration/exportArtifacts.spec.js +0 -202
package/dist/tests/integration/exportFallbackFlow.spec.js +0 -99
package/dist/tests/integration/mcpDegradationFlow.spec.js +0 -190
package/dist/tests/integration/mcpTransportFlow.spec.js +0 -139
package/dist/tests/integration/newSessionFlow.spec.js +0 -343
package/dist/tests/integration/pocGithubMcp.spec.js +0 -186
package/dist/tests/integration/pocLocalFallback.spec.js +0 -171
package/dist/tests/integration/pocScaffold.spec.js +0 -163
package/dist/tests/integration/ralphLoopFlow.spec.js +0 -359
package/dist/tests/integration/ralphLoopPartial.spec.js +0 -368
package/dist/tests/integration/resumeAndBacktrack.spec.js +0 -247
package/dist/tests/integration/spinnerLifecycle.spec.js +0 -220
package/dist/tests/integration/summarizationFlow.spec.js +0 -115
package/dist/tests/integration/testRunnerReal.spec.js +0 -52
package/dist/tests/integration/webSearchAgent.spec.js +0 -128
package/dist/tests/live/copilotSdkLive.spec.js +0 -107
package/dist/tests/live/zavaFullWorkshop.spec.js +0 -392
package/dist/tests/setup/loadEnv.js +0 -3
package/dist/tests/unit/cli/developCommand.spec.js +0 -567
package/dist/tests/unit/cli/directCommands.spec.js +0 -279
package/dist/tests/unit/cli/envLoader.spec.js +0 -58
package/dist/tests/unit/cli/ioContext.spec.js +0 -119
package/dist/tests/unit/cli/preflight.spec.js +0 -108
package/dist/tests/unit/cli/statusCommand.spec.js +0 -111
package/dist/tests/unit/cli/workshopClientFallback.spec.js +0 -80
package/dist/tests/unit/cli/workshopCommand.spec.js +0 -328
package/dist/tests/unit/config/vitestEnvSetup.spec.js +0 -13
package/dist/tests/unit/develop/checkpointState.spec.js +0 -315
package/dist/tests/unit/develop/codeGenerator.spec.js +0 -355
package/dist/tests/unit/develop/githubMcpAdapter.spec.js +0 -231
package/dist/tests/unit/develop/mcpContextEnricher.spec.js +0 -433
package/dist/tests/unit/develop/outputValidator.spec.js +0 -119
package/dist/tests/unit/develop/pocScaffolder.spec.js +0 -353
package/dist/tests/unit/develop/ralphLoop.spec.js +0 -1248
package/dist/tests/unit/develop/templateRegistry.spec.js +0 -85
package/dist/tests/unit/develop/testRunner.spec.js +0 -249
package/dist/tests/unit/infraBicep.spec.js +0 -92
package/dist/tests/unit/infraDeploy.spec.js +0 -82
package/dist/tests/unit/infraTeardown.spec.js +0 -63
package/dist/tests/unit/logging/logger.spec.js +0 -43
package/dist/tests/unit/loop/conversationLoop.spec.js +0 -592
package/dist/tests/unit/loop/phaseSummarizer.spec.js +0 -141
package/dist/tests/unit/loop/streamingMarkdown.spec.js +0 -147
package/dist/tests/unit/mcp/mcpManager.spec.js +0 -279
package/dist/tests/unit/mcp/mcpTransport.spec.js +0 -529
package/dist/tests/unit/mcp/retryPolicy.spec.js +0 -218
package/dist/tests/unit/mcp/timeoutValidation.spec.js +0 -46
package/dist/tests/unit/mcp/webSearch.spec.js +0 -567
package/dist/tests/unit/phases/contextSummarizer.spec.js +0 -140
package/dist/tests/unit/phases/discoveryEnricher.repeatCalls.spec.js +0 -93
package/dist/tests/unit/phases/discoveryEnricher.spec.js +0 -411
package/dist/tests/unit/phases/phaseExtractors.spec.js +0 -352
package/dist/tests/unit/phases/phaseHandlers.spec.js +0 -425
package/dist/tests/unit/prompts/promptLoader.spec.js +0 -118
package/dist/tests/unit/schemas/pocSchemas.spec.js +0 -412
package/dist/tests/unit/schemas/session.spec.js +0 -257
package/dist/tests/unit/sessions/exportPaths.spec.js +0 -31
package/dist/tests/unit/sessions/exportWriter.spec.js +0 -655
package/dist/tests/unit/sessions/sessionManager.spec.js +0 -151
package/dist/tests/unit/sessions/sessionStore.spec.js +0 -116
package/dist/tests/unit/shared/activitySpinner.spec.js +0 -175
package/dist/tests/unit/shared/cardsLoader.spec.js +0 -76
package/dist/tests/unit/shared/copilotClient.spec.js +0 -155
package/dist/tests/unit/shared/errorClassifier.spec.js +0 -131
package/dist/tests/unit/shared/events.spec.js +0 -55
package/dist/tests/unit/shared/markdownRenderer.spec.js +0 -35
package/dist/tests/unit/shared/markdownRendererChunks.spec.js +0 -70
package/dist/tests/unit/shared/tableRenderer.spec.js +0 -34
package/dist/vitest.config.js +0 -14
package/dist/vitest.live.config.js +0 -18
package/src/develop/pocScaffolder.ts +0 -646
package/tests/integration/pocScaffold.spec.ts +0 -220
package/tests/unit/develop/pocScaffolder.spec.ts +0 -451

package/dist/tests/integration/ralphLoopFlow.spec.js DELETED

@@ -1,359 +0,0 @@
-/**
- * T023: Integration test for Ralph loop with fakes.
- *
- * Uses a fake CopilotClient and fake test runner:
- * scaffold → fail tests → LLM generates fix → tests pass → loop terminates with success.
- * Verifies at least one iteration where failing test guides a fix (SC-002-003).
- */
-import { describe, it, expect, vi, beforeEach, afterEach } from 'vitest';
-import { mkdtemp, rm, readFile } from 'node:fs/promises';
-import { join } from 'node:path';
-import { tmpdir } from 'node:os';
-import { createRequire } from 'node:module';
-import { RalphLoop } from '../../src/develop/ralphLoop.js';
-// Mock npm install
-vi.mock('node:child_process', async (importOriginal) => {
-    const actual = await importOriginal();
-    return {
-        ...actual,
-        spawn: vi.fn((cmd, args) => {
-            if (cmd === 'npm' && args.includes('install')) {
-                return {
-                    stdout: { on: vi.fn() },
-                    stderr: { on: vi.fn() },
-                    on: vi.fn((event, cb) => {
-                        if (event === 'close')
-                            cb(0);
-                    }),
-                    kill: vi.fn(),
-                    killed: false,
-                };
-            }
-            return actual.spawn(cmd, args);
-        }),
-    };
-});
-// Mock validatePocOutput to always pass in integration tests
-vi.mock('../../src/develop/pocScaffolder.js', async (importOriginal) => {
-    const actual = await importOriginal();
-    return {
-        ...actual,
-        validatePocOutput: vi.fn().mockResolvedValue({ valid: true, missingFiles: [], errors: [] }),
-    };
-});
-const require = createRequire(import.meta.url);
-const fixtureSession = require('../fixtures/completedSession.json');
-// ── Helpers ───────────────────────────────────────────────────────────────────
-function makeIo() {
-    return {
-        write: vi.fn(),
-        writeActivity: vi.fn(),
-        writeToolSummary: vi.fn(),
-        readInput: vi.fn().mockResolvedValue(null),
-        showDecisionGate: vi.fn(),
-        isJsonMode: false,
-        isTTY: false,
-    };
-}
-function makeFakeScaffolder(outputDir) {
-    return {
-        scaffold: vi.fn().mockImplementation(async () => {
-            const { writeFile, mkdir } = await import('node:fs/promises');
-            await mkdir(join(outputDir, 'src'), { recursive: true });
-            await mkdir(join(outputDir, 'tests'), { recursive: true });
-            await writeFile(join(outputDir, 'package.json'), JSON.stringify({
-                name: 'route-optimizer-poc',
-                scripts: { test: 'vitest run' },
-                dependencies: {},
-                devDependencies: { vitest: '^3.0.0' },
-            }), 'utf-8');
-            await writeFile(join(outputDir, 'src', 'index.ts'), '// TODO: implement\nexport function optimize() { return []; }', 'utf-8');
-            await writeFile(join(outputDir, 'tests', 'index.test.ts'), 'import { describe, it, expect } from "vitest";\nimport { optimize } from "../src/index.js";\ndescribe("optimizer", () => { it("should return stops", () => { expect(optimize().length).toBeGreaterThan(0); }); });', 'utf-8');
-            return {
-                createdFiles: ['package.json', 'src/index.ts', 'tests/index.test.ts'],
-                skippedFiles: [],
-                context: {
-                    projectName: 'route-optimizer-poc',
-                    ideaTitle: 'AI-Powered Route Optimizer',
-                    ideaDescription: 'Optimize routes',
-                    techStack: { language: 'TypeScript', runtime: 'Node.js 20', testRunner: 'npm test' },
-                    planSummary: 'Route optimization',
-                    sessionId: fixtureSession.sessionId,
-                    outputDir,
-                },
-            };
-        }),
-        getTemplateFiles: () => ['package.json', 'src/index.ts', 'tests/index.test.ts'],
-    };
-}
-// ── SC-002-003: Iterative refinement test ────────────────────────────────────
-describe('RalphLoop integration — iterative refinement (SC-002-003)', () => {
-    let tmpDir;
-    beforeEach(async () => {
-        tmpDir = await mkdtemp(join(tmpdir(), 'sofia-ralph-flow-'));
-    });
-    afterEach(async () => {
-        await rm(tmpDir, { recursive: true, force: true });
-        vi.clearAllMocks();
-    });
-    it('scaffold → fail tests → LLM fix → tests pass → success', async () => {
-        const io = makeIo();
-        const scaffolder = makeFakeScaffolder(tmpDir);
-        // Test runner: fails first, passes second
-        let testCallCount = 0;
-        const testRunner = {
-            run: vi.fn().mockImplementation(async () => {
-                testCallCount++;
-                if (testCallCount === 1) {
-                    // First run: fails
-                    return {
-                        passed: 0,
-                        failed: 1,
-                        skipped: 0,
-                        total: 1,
-                        durationMs: 400,
-                        failures: [
-                            {
-                                testName: 'optimizer > should return stops',
-                                message: 'Expected length to be greater than 0',
-                                file: 'tests/index.test.ts',
-                                line: 3,
-                            },
-                        ],
-                        rawOutput: 'FAIL tests/index.test.ts',
-                    };
-                }
-                // Subsequent runs: pass
-                return {
-                    passed: 1,
-                    failed: 0,
-                    skipped: 0,
-                    total: 1,
-                    durationMs: 300,
-                    failures: [],
-                    rawOutput: 'PASS tests/index.test.ts',
-                };
-            }),
-        };
-        // LLM response: generates a fix for the failing test
-        const client = {
-            createSession: vi.fn().mockResolvedValue({
-                send: vi.fn().mockReturnValue({
-                    async *[Symbol.asyncIterator]() {
-                        yield {
-                            type: 'TextDelta',
-                            text: [
-                                '```typescript file=src/index.ts',
-                                '// Fixed implementation',
-                                'export function optimize(): string[] {',
-                                '  return ["stop-1", "stop-2", "stop-3"];',
-                                '}',
-                                '```',
-                            ].join('\n') + '\n',
-                            timestamp: '',
-                        };
-                    },
-                }),
-                getHistory: () => [],
-            }),
-        };
-        const sessionUpdates = [];
-        const ralph = new RalphLoop({
-            client,
-            io,
-            session: fixtureSession,
-            outputDir: tmpDir,
-            maxIterations: 5,
-            testRunner,
-            scaffolder,
-            onSessionUpdate: async (session) => {
-                sessionUpdates.push({ ...session });
-            },
-        });
-        const result = await ralph.run();
-        // Loop should succeed
-        expect(result.finalStatus).toBe('success');
-        expect(result.terminationReason).toBe('tests-passing');
-        // Verify at least 2 iterations happened (scaffold + test + fix + pass)
-        expect(result.iterationsCompleted).toBeGreaterThanOrEqual(2);
-        // Verify session was persisted
-        expect(sessionUpdates.length).toBeGreaterThan(0);
-        // Verify the fix was applied
-        const fixedContent = await readFile(join(tmpDir, 'src', 'index.ts'), 'utf-8');
-        expect(fixedContent).toContain('stop-1'); // LLM fix was applied
-        // Verify iteration history
-        const poc = result.session.poc;
-        expect(poc.iterations[0].outcome).toBe('scaffold');
-        const lastIter = poc.iterations[poc.iterations.length - 1];
-        expect(lastIter.outcome).toBe('tests-passing');
-    });
-    it('verifies failing tests are passed to LLM in iteration prompt (SC-002-003)', async () => {
-        const io = makeIo();
-        const scaffolder = makeFakeScaffolder(tmpDir);
-        let testCallCount = 0;
-        const testRunner = {
-            run: vi.fn().mockImplementation(async () => {
-                testCallCount++;
-                if (testCallCount === 1) {
-                    return {
-                        passed: 0,
-                        failed: 1,
-                        skipped: 0,
-                        total: 1,
-                        durationMs: 400,
-                        failures: [{ testName: 'unique-failure-name', message: 'specific-error-message' }],
-                        rawOutput: '',
-                    };
-                }
-                return {
-                    passed: 1,
-                    failed: 0,
-                    skipped: 0,
-                    total: 1,
-                    durationMs: 300,
-                    failures: [],
-                    rawOutput: '',
-                };
-            }),
-        };
-        // Capture the prompt sent to LLM
-        let capturedPrompt = '';
-        const client = {
-            createSession: vi.fn().mockResolvedValue({
-                send: vi.fn().mockImplementation((msg) => {
-                    capturedPrompt = msg.content;
-                    return {
-                        async *[Symbol.asyncIterator]() {
-                            yield {
-                                type: 'TextDelta',
-                                text: '```typescript file=src/index.ts\nexport function optimize() { return [1]; }\n```\n',
-                                timestamp: '',
-                            };
-                        },
-                    };
-                }),
-                getHistory: () => [],
-            }),
-        };
-        const ralph = new RalphLoop({
-            client,
-            io,
-            session: fixtureSession,
-            outputDir: tmpDir,
-            maxIterations: 3,
-            testRunner,
-            scaffolder,
-        });
-        await ralph.run();
-        // Verify the LLM received the failure context
-        expect(capturedPrompt).toContain('unique-failure-name');
-        expect(capturedPrompt).toContain('specific-error-message');
-    });
-});
-// ── T074: TODO tracking writes and updates .sofia-metadata.json ────────────
-describe('TODO tracking integration (T074)', () => {
-    let tmpDir;
-    beforeEach(async () => {
-        tmpDir = await mkdtemp(join(tmpdir(), 'sofia-todo-'));
-    });
-    afterEach(async () => {
-        await rm(tmpDir, { recursive: true, force: true });
-    });
-    it('writes TODO counts to .sofia-metadata.json during scaffold and updates after iteration', async () => {
-        const { writeFile, mkdir } = await import('node:fs/promises');
-        // Create a scaffolder that writes files with TODO markers
-        const todoScaffolder = {
-            scaffold: vi.fn().mockImplementation(async () => {
-                await mkdir(join(tmpDir, 'src'), { recursive: true });
-                await mkdir(join(tmpDir, 'tests'), { recursive: true });
-                await writeFile(join(tmpDir, 'package.json'), JSON.stringify({
-                    name: 'todo-test-poc',
-                    scripts: { test: 'vitest run' },
-                    dependencies: {},
-                    devDependencies: {},
-                }), 'utf-8');
-                await writeFile(join(tmpDir, 'src', 'index.ts'), '// TODO: Implement the main logic\nexport function main() { return []; }\n// TODO: Add validation\n', 'utf-8');
-                await writeFile(join(tmpDir, '.sofia-metadata.json'), JSON.stringify({
-                    sessionId: fixtureSession.sessionId,
-                    scaffoldedAt: new Date().toISOString(),
-                }), 'utf-8');
-                return {
-                    createdFiles: ['package.json', 'src/index.ts', '.sofia-metadata.json'],
-                    skippedFiles: [],
-                    context: {
-                        projectName: 'todo-test-poc',
-                        ideaTitle: 'Test',
-                        ideaDescription: 'Test',
-                        techStack: { language: 'TypeScript', runtime: 'Node.js 20', testRunner: 'npm test' },
-                        planSummary: 'Test',
-                        sessionId: fixtureSession.sessionId,
-                        outputDir: tmpDir,
-                    },
-                };
-            }),
-            getTemplateFiles: () => ['package.json', 'src/index.ts'],
-        };
-        // Test runner that fails on first call (triggering TODO rescan), then passes
-        let runCount = 0;
-        const failThenPassRunner = {
-            run: vi.fn().mockImplementation(async () => {
-                runCount++;
-                if (runCount <= 1) {
-                    return {
-                        passed: 0,
-                        failed: 1,
-                        skipped: 0,
-                        total: 1,
-                        durationMs: 100,
-                        failures: [{ testName: 'test', message: 'fail' }],
-                        rawOutput: 'FAIL',
-                    };
-                }
-                return {
-                    passed: 1,
-                    failed: 0,
-                    skipped: 0,
-                    total: 1,
-                    durationMs: 100,
-                    failures: [],
-                    rawOutput: 'pass',
-                };
-            }),
-        };
-        const io = makeIo();
-        const session = { ...fixtureSession };
-        const client = {
-            createSession: vi.fn().mockResolvedValue({
-                send: vi.fn().mockReturnValue({
-                    async *[Symbol.asyncIterator]() {
-                        yield {
-                            type: 'TextDelta',
-                            text: '```typescript file=src/index.ts\nexport function main() { return [1, 2]; }\n```',
-                            timestamp: '',
-                        };
-                    },
-                }),
-                getHistory: () => [],
-            }),
-        };
-        const ralph = new RalphLoop({
-            client,
-            io,
-            session,
-            outputDir: tmpDir,
-            maxIterations: 3,
-            testRunner: failThenPassRunner,
-            scaffolder: todoScaffolder,
-        });
-        await ralph.run();
-        // Verify .sofia-metadata.json has todos section (written by rescan after failing iteration)
-        const metaRaw = await readFile(join(tmpDir, '.sofia-metadata.json'), 'utf-8');
-        const metadata = JSON.parse(metaRaw);
-        expect(metadata.todos).toBeDefined();
-        expect(typeof metadata.todos.totalInitial).toBe('number');
-        expect(typeof metadata.todos.remaining).toBe('number');
-        expect(Array.isArray(metadata.todos.markers)).toBe(true);
-        // After LLM fix removes TODOs from src/index.ts, remaining count should be ≤ initial scaffold count (2)
-        expect(metadata.todos.remaining).toBeLessThanOrEqual(2);
-    });
-});