npm - @hanzo/dev - Versions diffs - 1.2.0 → 2.0.0 - Mend

@hanzo/dev 1.2.0 → 2.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (21) hide show

package/.eslintrc.js +25 -0
package/dist/cli/dev.js +8202 -553
package/jest.config.js +30 -0
package/package.json +13 -1
package/src/cli/dev.ts +456 -106
package/src/lib/agent-loop.ts +552 -0
package/src/lib/code-act-agent.ts +378 -0
package/src/lib/config.ts +163 -0
package/src/lib/editor.ts +368 -0
package/src/lib/function-calling.ts +318 -0
package/src/lib/mcp-client.ts +259 -0
package/src/lib/peer-agent-network.ts +584 -0
package/src/lib/unified-workspace.ts +435 -0
package/tests/browser-integration.test.ts +242 -0
package/tests/code-act-agent.test.ts +305 -0
package/tests/editor.test.ts +223 -0
package/tests/mcp-client.test.ts +238 -0
package/tests/peer-agent-network.test.ts +340 -0
package/tests/setup.ts +25 -0
package/tests/swe-bench.test.ts +357 -0
package/tsconfig.json +13 -15

package/tests/code-act-agent.test.ts ADDED Viewed

@@ -0,0 +1,305 @@
+import { describe, test, expect, beforeEach, jest } from '@jest/globals';
+import { CodeActAgent, AgentState } from '../src/lib/code-act-agent';
+import { FunctionCallingSystem } from '../src/lib/function-calling';
+describe('CodeActAgent', () => { // Suite covering CodeActAgent state, planning, step execution, retries and observations
+  let agent: CodeActAgent;
+  let mockFunctionCalling: jest.Mocked<FunctionCallingSystem>;
+  beforeEach(() => { // Runs before every test: builds a fresh stub and a fresh agent
+    // Stub of the function-calling system; each method is a jest.fn() so calls can be scripted and inspected
+    mockFunctionCalling = {
+      registerTool: jest.fn(),
+      callFunctions: jest.fn(),
+      getAvailableTools: jest.fn().mockReturnValue([ // Always reports these three tools
+        { name: 'view_file', description: 'View file contents' },
+        { name: 'str_replace', description: 'Replace string in file' },
+        { name: 'run_command', description: 'Run shell command' }
+      ]),
+      getAllToolSchemas: jest.fn().mockReturnValue([])
+    } as any; // 'as any' turns off type checking for this hand-written stub
+    agent = new CodeActAgent('test-agent', mockFunctionCalling); // Agent under test, wired to the stub
+  });
+  describe('state management', () => { // getState / setState behaviour
+    test('should initialize with correct default state', () => {
+      const state = agent.getState(); // Read straight after construction, before any setState/plan call
+      expect(state.currentTask).toBe('');
+      expect(state.plan).toEqual([]);
+      expect(state.completedSteps).toEqual([]);
+      expect(state.currentStep).toBe(0);
+      expect(state.errors).toEqual([]);
+      expect(state.observations).toEqual([]);
+    });
+    test('should update state correctly', () => {
+      const newState: Partial<AgentState> = { // Only a subset of the state fields is supplied
+        currentTask: 'Fix bug in login',
+        plan: ['Locate login file', 'Fix validation', 'Test changes'],
+        currentStep: 1
+      };
+      agent.setState(newState);
+      const state = agent.getState();
+      expect(state.currentTask).toBe('Fix bug in login');
+      expect(state.plan).toHaveLength(3);
+      expect(state.currentStep).toBe(1);
+    });
+  });
+  describe('planning', () => { // agent.plan(task)
+    test('should generate plan for task', async () => {
+      const task = 'Add user authentication to the API';
+      // Mock LLM response for planning. NOTE(review): mockPlan is never referenced below, so it is not wired into agent.plan()
+      const mockPlan = [
+        'Analyze current API structure',
+        'Install authentication dependencies',
+        'Create auth middleware',
+        'Add login/logout endpoints',
+        'Update existing endpoints with auth checks',
+        'Write tests for authentication'
+      ];
+      // The agent should generate a plan based on the task
+      await agent.plan(task);
+      const state = agent.getState();
+      expect(state.currentTask).toBe(task);
+      expect(state.plan.length).toBeGreaterThan(0); // Only checks the plan is non-empty, not its contents
+    });
+    test('should handle planning errors gracefully', async () => {
+      const task = 'Invalid task that causes error';
+      // Even with errors, planning should not throw
+      await expect(agent.plan(task)).resolves.not.toThrow(); // .resolves makes this fail if plan() rejects
+      const state = agent.getState();
+      expect(state.currentTask).toBe(task); // The task is expected to be recorded regardless
+    });
+  });
+  describe('task execution', () => { // agent.executeStep() on a pre-set plan
+    test('should execute single step', async () => {
+      // Set up agent with a plan
+      agent.setState({
+        currentTask: 'Fix typo in README',
+        plan: ['View README.md', 'Fix typo', 'Verify changes'],
+        currentStep: 0
+      });
+      // Mock function calling for view_file
+      mockFunctionCalling.callFunctions.mockResolvedValueOnce([{
+        success: true,
+        content: '# README\n\nThis is a typpo in the readme.'
+      }]);
+      const result = await agent.executeStep();
+      expect(result.completed).toBe(false); // presumably because two plan steps remain — confirm against the agent
+      expect(result.action).toBe('View README.md'); // The action is expected to be the plan entry at currentStep
+      expect(mockFunctionCalling.callFunctions).toHaveBeenCalled();
+    });
+    test('should handle step execution errors', async () => {
+      agent.setState({
+        currentTask: 'Run failing command',
+        plan: ['Execute broken command'],
+        currentStep: 0
+      });
+      // Mock function calling to throw error
+      mockFunctionCalling.callFunctions.mockRejectedValueOnce(
+        new Error('Command not found')
+      );
+      const result = await agent.executeStep(); // Expected to resolve with an error field rather than reject
+      expect(result.completed).toBe(false);
+      expect(result.error).toBe('Command not found');
+      const state = agent.getState();
+      expect(state.errors).toHaveLength(1); // The failure is expected to be recorded in agent state as well
+      expect(state.errors[0]).toContain('Command not found');
+    });
+    test('should mark task as completed when all steps done', async () => {
+      agent.setState({ // Start on the last entry of a two-step plan
+        currentTask: 'Simple task',
+        plan: ['Step 1', 'Step 2'],
+        currentStep: 1,
+        completedSteps: ['Step 1']
+      });
+      // Mock successful execution
+      mockFunctionCalling.callFunctions.mockResolvedValueOnce([{
+        success: true
+      }]);
+      const result = await agent.executeStep();
+      expect(result.completed).toBe(true);
+      expect(result.action).toBe('Step 2');
+      const state = agent.getState();
+      expect(state.completedSteps).toHaveLength(2);
+    });
+  });
+  describe('parallel execution', () => { // Grouping of plan steps and running them
+    test('should identify parallelizable steps', () => {
+      const plan = [
+        'Download file A',
+        'Download file B',
+        'Process file A',
+        'Process file B',
+        'Merge results'
+      ];
+      const parallel = agent.identifyParallelSteps(plan); // Per the assertions below: a list of groups of plan indices
+      // Downloads can be parallel
+      expect(parallel[0]).toEqual([0, 1]);
+      // Processing depends on downloads
+      expect(parallel[1]).toEqual([2]);
+      expect(parallel[2]).toEqual([3]);
+      // Merge depends on processing
+      expect(parallel[3]).toEqual([4]);
+    });
+    test('should execute parallel steps concurrently', async () => {
+      agent.setState({
+        currentTask: 'Parallel downloads',
+        plan: ['Download file1.txt', 'Download file2.txt', 'Merge files'],
+        currentStep: 0
+      });
+      // Mock both downloads to succeed
+      mockFunctionCalling.callFunctions
+        .mockResolvedValueOnce([{ success: true, file: 'file1.txt' }])
+        .mockResolvedValueOnce([{ success: true, file: 'file2.txt' }]);
+      // Execute should handle parallel steps
+      const result1 = await agent.executeStep(); // NOTE(review): only this one executeStep() call is awaited in the test
+      expect(result1.action).toContain('Download');
+      // The agent should recognize these can be parallel
+      const state = agent.getState();
+      expect(state.currentStep).toBeLessThanOrEqual(2); // Loose bound: any value up to 2 passes
+    });
+  });
+  describe('self-correction', () => { // Retry behaviour after failed steps
+    test('should retry failed steps with corrections', async () => {
+      agent.setState({
+        currentTask: 'Fix syntax error',
+        plan: ['Edit file with error'],
+        currentStep: 0
+      });
+      // First attempt fails
+      mockFunctionCalling.callFunctions.mockResolvedValueOnce([{ // Resolves with a failure payload instead of rejecting
+        success: false,
+        error: 'Syntax error in edit'
+      }]);
+      // Agent should detect error and retry
+      const result1 = await agent.executeStep();
+      expect(result1.error).toBeDefined();
+      // Second attempt with correction succeeds
+      mockFunctionCalling.callFunctions.mockResolvedValueOnce([{
+        success: true
+      }]);
+      const result2 = await agent.executeStep();
+      expect(result2.error).toBeUndefined();
+      expect(result2.retryCount).toBeGreaterThan(0); // The successful result is expected to report at least one retry
+    });
+    test('should give up after max retries', async () => {
+      agent.setState({
+        currentTask: 'Impossible task',
+        plan: ['Do impossible thing'],
+        currentStep: 0
+      });
+      // All attempts fail
+      mockFunctionCalling.callFunctions.mockRejectedValue( // Not the ...Once variant: every call rejects
+        new Error('Cannot do impossible thing')
+      );
+      let lastResult; // Ends up holding the result of the final attempt
+      for (let i = 0; i < 5; i++) { // NOTE(review): five attempts presumably exceed the agent's retry limit — confirm
+        lastResult = await agent.executeStep();
+      }
+      expect(lastResult!.error).toBeDefined();
+      expect(lastResult!.aborted).toBe(true);
+    });
+  });
+  describe('observation handling', () => { // state.observations bookkeeping
+    test('should collect and store observations', async () => {
+      agent.setState({
+        currentTask: 'Analyze codebase',
+        plan: ['List files', 'Read main file'],
+        currentStep: 0
+      });
+      // Mock file listing
+      mockFunctionCalling.callFunctions.mockResolvedValueOnce([{
+        success: true,
+        output: 'file1.js\nfile2.js\nindex.js'
+      }]);
+      await agent.executeStep();
+      const state = agent.getState();
+      expect(state.observations).toHaveLength(1);
+      expect(state.observations[0]).toContain('file1.js'); // The stored observation is expected to include the tool output
+    });
+    test('should use observations for context', async () => {
+      // Pre-populate observations
+      agent.setState({
+        currentTask: 'Fix bug',
+        plan: ['Find bug location', 'Fix bug'],
+        currentStep: 1,
+        observations: ['Bug is in auth.js on line 42']
+      });
+      // The agent should use the observation context
+      mockFunctionCalling.callFunctions.mockResolvedValueOnce([{
+        success: true,
+        result: 'Fixed bug in auth.js'
+      }]);
+      const result = await agent.executeStep();
+      expect(result.completed).toBe(true); // NOTE(review): only completion is asserted, not that the observation was used
+    });
+  });
+  describe('complete task execution', () => { // plan() followed by execute()
+    test('should execute entire task from plan to completion', async () => {
+      const task = 'Add logging to application';
+      // Mock successful execution of all steps
+      mockFunctionCalling.callFunctions
+        .mockResolvedValueOnce([{ success: true }]) // Install logger
+        .mockResolvedValueOnce([{ success: true }]) // Create logger config
+        .mockResolvedValueOnce([{ success: true }]) // Add logging statements
+        .mockResolvedValueOnce([{ success: true }]); // Test logging
+      await agent.plan(task);
+      const result = await agent.execute(task);
+      expect(result.success).toBe(true);
+      expect(result.completedSteps.length).toBeGreaterThan(0);
+      expect(result.errors).toHaveLength(0);
+    });
+  });
+});

package/tests/editor.test.ts ADDED Viewed

@@ -0,0 +1,223 @@
+import { describe, test, expect, beforeEach, afterEach } from '@jest/globals';
+import * as fs from 'fs';
+import * as path from 'path';
+import * as os from 'os';
+import { Editor, EditCommand } from '../src/lib/editor';
+describe('Editor', () => { // Suite for Editor commands, exercised against real files in a temp directory
+  let editor: Editor;
+  let testDir: string;
+  let testFile: string;
+  beforeEach(() => {
+    // Create a unique temporary directory per test; testFile is only a path here and is not created yet
+    testDir = fs.mkdtempSync(path.join(os.tmpdir(), 'hanzo-dev-test-'));
+    testFile = path.join(testDir, 'test.txt');
+    editor = new Editor(testDir);
+  });
+  afterEach(() => {
+    // Clean up test directory and everything inside it
+    fs.rmSync(testDir, { recursive: true, force: true });
+  });
+  describe('create command', () => { // command: 'create'
+    test('should create a new file with content', async () => {
+      const command: EditCommand = {
+        command: 'create',
+        path: testFile,
+        content: 'Hello, World!'
+      };
+      const result = await editor.execute(command);
+      expect(result.success).toBe(true);
+      expect(fs.existsSync(testFile)).toBe(true);
+      expect(fs.readFileSync(testFile, 'utf-8')).toBe('Hello, World!'); // File content must match exactly
+    });
+    test('should fail when file already exists', async () => {
+      fs.writeFileSync(testFile, 'existing content'); // Pre-create the target file
+      const command: EditCommand = {
+        command: 'create',
+        path: testFile,
+        content: 'new content'
+      };
+      const result = await editor.execute(command); // Failure is expected via the result object, not a rejection
+      expect(result.success).toBe(false);
+      expect(result.error).toContain('already exists');
+    });
+  });
+  describe('view command', () => { // command: 'view'
+    test('should view entire file when no line range specified', async () => {
+      const content = 'Line 1\nLine 2\nLine 3';
+      fs.writeFileSync(testFile, content);
+      const command: EditCommand = {
+        command: 'view',
+        path: testFile
+      };
+      const result = await editor.execute(command);
+      expect(result.success).toBe(true);
+      expect(result.content).toContain('Line 1');
+      expect(result.content).toContain('Line 2');
+      expect(result.content).toContain('Line 3');
+    });
+    test('should view specific line range', async () => {
+      const lines = Array.from({ length: 10 }, (_, i) => `Line ${i + 1}`); // 'Line 1' through 'Line 10'
+      fs.writeFileSync(testFile, lines.join('\n'));
+      const command: EditCommand = {
+        command: 'view',
+        path: testFile,
+        startLine: 3,
+        endLine: 5
+      };
+      const result = await editor.execute(command);
+      expect(result.success).toBe(true);
+      expect(result.content).toContain('Line 3'); // Lines 3 to 5 are all expected, so both bounds are treated as inclusive
+      expect(result.content).toContain('Line 4');
+      expect(result.content).toContain('Line 5');
+      expect(result.content).not.toContain('Line 1'); // 'Line 1' is also a substring of 'Line 10', so this rejects both
+      expect(result.content).not.toContain('Line 10');
+    });
+  });
+  describe('str_replace command', () => { // command: 'str_replace'
+    test('should replace string in file', async () => {
+      const content = 'Hello, World!\nThis is a test.\nHello again!';
+      fs.writeFileSync(testFile, content);
+      const command: EditCommand = {
+        command: 'str_replace',
+        path: testFile,
+        oldStr: 'Hello, World!',
+        newStr: 'Hi, Universe!'
+      };
+      const result = await editor.execute(command);
+      expect(result.success).toBe(true);
+      const newContent = fs.readFileSync(testFile, 'utf-8'); // Re-read from disk to check what was actually written
+      expect(newContent).toContain('Hi, Universe!');
+      expect(newContent).not.toContain('Hello, World!');
+      expect(newContent).toContain('Hello again!'); // Text outside the match must be left intact
+    });
+    test('should fail when old string not found', async () => {
+      fs.writeFileSync(testFile, 'Some content');
+      const command: EditCommand = {
+        command: 'str_replace',
+        path: testFile,
+        oldStr: 'Not found',
+        newStr: 'Replacement'
+      };
+      const result = await editor.execute(command);
+      expect(result.success).toBe(false);
+      expect(result.error).toContain('not found');
+    });
+    test('should fail when old string appears multiple times', async () => {
+      const content = 'duplicate\nsome text\nduplicate'; // oldStr occurs twice in this content
+      fs.writeFileSync(testFile, content);
+      const command: EditCommand = {
+        command: 'str_replace',
+        path: testFile,
+        oldStr: 'duplicate',
+        newStr: 'unique'
+      };
+      const result = await editor.execute(command);
+      expect(result.success).toBe(false);
+      expect(result.error).toContain('multiple');
+    });
+  });
+  describe('insert command', () => { // command: 'insert'
+    test('should insert text at specific line', async () => {
+      const content = 'Line 1\nLine 2\nLine 3';
+      fs.writeFileSync(testFile, content);
+      const command: EditCommand = {
+        command: 'insert',
+        path: testFile,
+        lineNumber: 2,
+        content: 'Inserted line'
+      };
+      const result = await editor.execute(command);
+      expect(result.success).toBe(true);
+      const newContent = fs.readFileSync(testFile, 'utf-8');
+      const lines = newContent.split('\n');
+      expect(lines[1]).toBe('Inserted line'); // Per these assertions the new text becomes the second line
+      expect(lines[2]).toBe('Line 2'); // and the former second line shifts down by one
+    });
+  });
+  describe('undo_edit command', () => { // command: 'undo_edit'
+    test('should undo last edit', async () => {
+      const originalContent = 'Original content';
+      fs.writeFileSync(testFile, originalContent);
+      // Make an edit
+      await editor.execute({
+        command: 'str_replace',
+        path: testFile,
+        oldStr: 'Original',
+        newStr: 'Modified'
+      });
+      // Verify edit was made
+      expect(fs.readFileSync(testFile, 'utf-8')).toContain('Modified');
+      // Undo the edit
+      const result = await editor.execute({
+        command: 'undo_edit',
+        path: testFile
+      });
+      expect(result.success).toBe(true);
+      expect(fs.readFileSync(testFile, 'utf-8')).toBe(originalContent); // File must be back to its exact pre-edit content
+    });
+  });
+  describe('chunk localization', () => { // editor.getRelevantChunks(path, query)
+    test('should find relevant chunks for search query', async () => {
+      const codeContent = `
+function calculateTotal(items) {
+  let total = 0;
+  for (const item of items) {
+    total += item.price * item.quantity;
+  }
+  return total;
+}
+function applyDiscount(total, discountPercent) {
+  return total * (1 - discountPercent / 100);
+}
+function formatCurrency(amount) {
+  return new Intl.NumberFormat('en-US', {
+    style: 'currency',
+    currency: 'USD'
+  }).format(amount);
+}
+`;
+      fs.writeFileSync(testFile, codeContent);
+      const chunks = await editor.getRelevantChunks(testFile, 'calculate price total');
+      expect(chunks.length).toBeGreaterThan(0);
+      expect(chunks[0].content).toContain('calculateTotal'); // The first chunk is expected to be the one holding calculateTotal
+      expect(chunks[0].content).toContain('price');
+    });
+  });
+});