npm - vellum - Versions diffs - 0.2.13 → 0.2.14 - Mend

vellum 0.2.13 → 0.2.14

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (207)

package/README.md +32 -0
package/bun.lock +2 -2
package/docs/skills.md +4 -4
package/package.json +2 -2
package/src/__tests__/__snapshots__/ipc-snapshot.test.ts.snap +213 -3
package/src/__tests__/app-git-history.test.ts +176 -0
package/src/__tests__/app-git-service.test.ts +169 -0
package/src/__tests__/assistant-events-sse-hardening.test.ts +315 -0
package/src/__tests__/browser-skill-baseline-tool-payload.test.ts +8 -8
package/src/__tests__/browser-skill-endstate.test.ts +6 -6
package/src/__tests__/call-bridge.test.ts +105 -13
package/src/__tests__/call-domain.test.ts +163 -0
package/src/__tests__/call-orchestrator.test.ts +113 -0
package/src/__tests__/call-routes-http.test.ts +246 -6
package/src/__tests__/channel-approval-routes.test.ts +438 -0
package/src/__tests__/channel-approval.test.ts +266 -0
package/src/__tests__/channel-approvals.test.ts +393 -0
package/src/__tests__/channel-delivery-store.test.ts +447 -0
package/src/__tests__/checker.test.ts +607 -1048
package/src/__tests__/cli.test.ts +1 -56
package/src/__tests__/config-schema.test.ts +137 -18
package/src/__tests__/conflict-intent-tokenization.test.ts +141 -0
package/src/__tests__/conflict-policy.test.ts +121 -0
package/src/__tests__/conflict-store.test.ts +2 -0
package/src/__tests__/contacts-tools.test.ts +3 -3
package/src/__tests__/contradiction-checker.test.ts +99 -1
package/src/__tests__/credential-security-invariants.test.ts +22 -6
package/src/__tests__/credential-vault-unit.test.ts +780 -0
package/src/__tests__/elevenlabs-client.test.ts +62 -0
package/src/__tests__/ephemeral-permissions.test.ts +73 -23
package/src/__tests__/filesystem-tools.test.ts +579 -0
package/src/__tests__/gateway-only-enforcement.test.ts +114 -4
package/src/__tests__/handlers-add-trust-rule-metadata.test.ts +202 -0
package/src/__tests__/handlers-cu-observation-blob.test.ts +2 -1
package/src/__tests__/handlers-ipc-blob-probe.test.ts +2 -1
package/src/__tests__/handlers-slack-config.test.ts +2 -1
package/src/__tests__/handlers-telegram-config.test.ts +855 -0
package/src/__tests__/handlers-twitter-config.test.ts +141 -1
package/src/__tests__/hooks-runner.test.ts +6 -2
package/src/__tests__/host-file-edit-tool.test.ts +124 -0
package/src/__tests__/host-file-read-tool.test.ts +62 -0
package/src/__tests__/host-file-write-tool.test.ts +59 -0
package/src/__tests__/host-shell-tool.test.ts +251 -0
package/src/__tests__/ingress-reconcile.test.ts +581 -0
package/src/__tests__/ipc-snapshot.test.ts +100 -41
package/src/__tests__/ipc-validate.test.ts +50 -0
package/src/__tests__/key-migration.test.ts +23 -0
package/src/__tests__/memory-regressions.test.ts +99 -0
package/src/__tests__/memory-retrieval.benchmark.test.ts +1 -1
package/src/__tests__/oauth-callback-registry.test.ts +11 -4
package/src/__tests__/playbook-execution.test.ts +502 -0
package/src/__tests__/playbook-tools.test.ts +4 -6
package/src/__tests__/public-ingress-urls.test.ts +34 -0
package/src/__tests__/qdrant-manager.test.ts +267 -0
package/src/__tests__/recurrence-engine-rruleset.test.ts +97 -0
package/src/__tests__/recurrence-engine.test.ts +9 -0
package/src/__tests__/recurrence-types.test.ts +8 -0
package/src/__tests__/registry.test.ts +1 -1
package/src/__tests__/runtime-runs.test.ts +1 -25
package/src/__tests__/schedule-store.test.ts +16 -14
package/src/__tests__/schedule-tools.test.ts +83 -0
package/src/__tests__/scheduler-recurrence.test.ts +111 -10
package/src/__tests__/secret-allowlist.test.ts +18 -17
package/src/__tests__/secret-ingress-handler.test.ts +11 -0
package/src/__tests__/secret-scanner.test.ts +43 -0
package/src/__tests__/session-conflict-gate.test.ts +442 -6
package/src/__tests__/session-init.benchmark.test.ts +3 -0
package/src/__tests__/session-process-bridge.test.ts +242 -0
package/src/__tests__/session-skill-tools.test.ts +1 -1
package/src/__tests__/shell-identity.test.ts +256 -0
package/src/__tests__/skill-projection.benchmark.test.ts +11 -1
package/src/__tests__/subagent-tools.test.ts +637 -54
package/src/__tests__/task-management-tools.test.ts +936 -0
package/src/__tests__/task-runner.test.ts +2 -2
package/src/__tests__/terminal-tools.test.ts +840 -0
package/src/__tests__/tool-executor-shell-integration.test.ts +301 -0
package/src/__tests__/tool-executor.test.ts +85 -151
package/src/__tests__/tool-permission-simulate-handler.test.ts +336 -0
package/src/__tests__/trust-store.test.ts +27 -453
package/src/__tests__/twilio-provider.test.ts +153 -3
package/src/__tests__/twilio-routes-elevenlabs.test.ts +375 -0
package/src/__tests__/twilio-routes-twiml.test.ts +4 -4
package/src/__tests__/twilio-routes.test.ts +17 -262
package/src/__tests__/twitter-auth-handler.test.ts +2 -1
package/src/__tests__/twitter-cli-error-shaping.test.ts +208 -0
package/src/__tests__/twitter-cli-routing.test.ts +252 -0
package/src/__tests__/twitter-oauth-client.test.ts +209 -0
package/src/__tests__/workspace-policy.test.ts +213 -0
package/src/calls/call-bridge.ts +92 -19
package/src/calls/call-domain.ts +157 -5
package/src/calls/call-orchestrator.ts +93 -7
package/src/calls/call-store.ts +6 -0
package/src/calls/elevenlabs-client.ts +8 -0
package/src/calls/elevenlabs-config.ts +7 -5
package/src/calls/twilio-provider.ts +91 -0
package/src/calls/twilio-routes.ts +32 -37
package/src/calls/types.ts +3 -1
package/src/calls/voice-quality.ts +29 -7
package/src/cli/twitter.ts +200 -21
package/src/cli.ts +1 -20
package/src/config/bundled-skills/contacts/tools/contact-merge.ts +52 -4
package/src/config/bundled-skills/contacts/tools/contact-search.ts +55 -4
package/src/config/bundled-skills/contacts/tools/contact-upsert.ts +61 -4
package/src/config/bundled-skills/messaging/SKILL.md +17 -2
package/src/config/bundled-skills/messaging/tools/messaging-reply.ts +4 -1
package/src/config/bundled-skills/messaging/tools/messaging-send.ts +5 -1
package/src/config/bundled-skills/messaging/tools/shared.ts +5 -0
package/src/config/bundled-skills/phone-calls/SKILL.md +142 -34
package/src/config/bundled-skills/playbooks/tools/playbook-create.ts +95 -6
package/src/config/bundled-skills/playbooks/tools/playbook-delete.ts +51 -6
package/src/config/bundled-skills/playbooks/tools/playbook-list.ts +73 -6
package/src/config/bundled-skills/playbooks/tools/playbook-update.ts +110 -6
package/src/config/bundled-skills/public-ingress/SKILL.md +22 -5
package/src/config/bundled-skills/twitter/SKILL.md +103 -17
package/src/config/defaults.ts +10 -4
package/src/config/schema.ts +80 -21
package/src/config/types.ts +1 -0
package/src/config/vellum-skills/telegram-setup/SKILL.md +56 -61
package/src/daemon/assistant-attachments.ts +4 -2
package/src/daemon/handlers/apps.ts +69 -0
package/src/daemon/handlers/config.ts +543 -24
package/src/daemon/handlers/index.ts +1 -0
package/src/daemon/handlers/sessions.ts +22 -6
package/src/daemon/handlers/shared.ts +2 -1
package/src/daemon/handlers/skills.ts +5 -20
package/src/daemon/ipc-contract-inventory.json +28 -0
package/src/daemon/ipc-contract.ts +168 -10
package/src/daemon/ipc-validate.ts +17 -0
package/src/daemon/lifecycle.ts +2 -0
package/src/daemon/server.ts +78 -72
package/src/daemon/session-attachments.ts +1 -1
package/src/daemon/session-conflict-gate.ts +62 -6
package/src/daemon/session-notifiers.ts +1 -1
package/src/daemon/session-process.ts +62 -3
package/src/daemon/session-tool-setup.ts +1 -2
package/src/daemon/tls-certs.ts +189 -0
package/src/daemon/video-thumbnail.ts +5 -3
package/src/hooks/manager.ts +5 -9
package/src/memory/app-git-service.ts +295 -0
package/src/memory/app-store.ts +21 -0
package/src/memory/conflict-intent.ts +47 -4
package/src/memory/conflict-policy.ts +73 -0
package/src/memory/conflict-store.ts +9 -1
package/src/memory/contradiction-checker.ts +28 -0
package/src/memory/conversation-key-store.ts +15 -0
package/src/memory/db.ts +81 -0
package/src/memory/embedding-local.ts +3 -13
package/src/memory/external-conversation-store.ts +234 -0
package/src/memory/job-handlers/conflict.ts +22 -2
package/src/memory/jobs-worker.ts +67 -28
package/src/memory/runs-store.ts +54 -7
package/src/memory/schema.ts +20 -0
package/src/messaging/provider.ts +9 -0
package/src/messaging/providers/telegram-bot/adapter.ts +162 -0
package/src/messaging/providers/telegram-bot/client.ts +104 -0
package/src/messaging/providers/telegram-bot/types.ts +15 -0
package/src/messaging/registry.ts +1 -0
package/src/permissions/checker.ts +48 -44
package/src/permissions/prompter.ts +0 -4
package/src/permissions/shell-identity.ts +227 -0
package/src/permissions/trust-store.ts +76 -53
package/src/permissions/types.ts +0 -19
package/src/permissions/workspace-policy.ts +114 -0
package/src/providers/retry.ts +12 -37
package/src/runtime/assistant-event-hub.ts +41 -4
package/src/runtime/channel-approval-parser.ts +60 -0
package/src/runtime/channel-approval-types.ts +71 -0
package/src/runtime/channel-approvals.ts +145 -0
package/src/runtime/gateway-client.ts +16 -0
package/src/runtime/http-server.ts +29 -9
package/src/runtime/routes/call-routes.ts +52 -2
package/src/runtime/routes/channel-routes.ts +296 -16
package/src/runtime/routes/events-routes.ts +97 -28
package/src/runtime/routes/run-routes.ts +2 -7
package/src/runtime/run-orchestrator.ts +0 -3
package/src/schedule/recurrence-engine.ts +26 -2
package/src/schedule/recurrence-types.ts +1 -1
package/src/schedule/schedule-store.ts +12 -3
package/src/security/secret-scanner.ts +7 -0
package/src/tasks/ephemeral-permissions.ts +0 -2
package/src/tasks/task-scheduler.ts +2 -1
package/src/tools/calls/call-start.ts +8 -0
package/src/tools/execution-target.ts +21 -0
package/src/tools/execution-timeout.ts +49 -0
package/src/tools/executor.ts +6 -135
package/src/tools/network/web-search.ts +9 -32
package/src/tools/policy-context.ts +29 -0
package/src/tools/schedule/update.ts +8 -1
package/src/tools/terminal/parser.ts +16 -18
package/src/tools/types.ts +4 -11
package/src/twitter/oauth-client.ts +102 -0
package/src/twitter/router.ts +101 -0
package/src/util/debounce.ts +88 -0
package/src/util/network-info.ts +47 -0
package/src/util/platform.ts +29 -4
package/src/util/promise-guard.ts +37 -0
package/src/util/retry.ts +98 -0
package/src/util/truncate.ts +1 -1
package/src/workspace/git-service.ts +129 -112
package/src/tools/contacts/contact-merge.ts +0 -55
package/src/tools/contacts/contact-search.ts +0 -58
package/src/tools/contacts/contact-upsert.ts +0 -64
package/src/tools/playbooks/index.ts +0 -4
package/src/tools/playbooks/playbook-create.ts +0 -96
package/src/tools/playbooks/playbook-delete.ts +0 -52
package/src/tools/playbooks/playbook-list.ts +0 -74
package/src/tools/playbooks/playbook-update.ts +0 -111

package/src/__tests__/handlers-twitter-config.test.ts CHANGED

@@ -115,6 +115,7 @@ import type {
   TwitterIntegrationConfigRequest,
   ServerMessage,
 } from '../daemon/ipc-contract.js';
+import { DebouncerMap } from '../util/debounce.js';
 function createTestContext(): { ctx: HandlerContext; sent: ServerMessage[] } {
   const sent: ServerMessage[] = [];
@@ -126,7 +127,7 @@ function createTestContext(): { ctx: HandlerContext; sent: ServerMessage[] } {
     cuObservationParseSequence: new Map(),
     socketSandboxOverride: new Map(),
     sharedRequestTimestamps: [],
-    debounceTimers: new Map(),
+    debounceTimers: new DebouncerMap({ defaultDelayMs: 200 }),
     suppressConfigReload: false,
     setSuppressConfigReload: () => {},
     updateConfigFingerprint: () => {},
@@ -715,4 +716,143 @@ describe('Twitter integration config handler', () => {
     expect(responseStr).not.toContain('secret-client-secret-xyz789');
     expect(responseStr).not.toContain('secret-access-token-def456');
   });
+  // --- Strategy tests ---
+  test('get_strategy returns auto by default with strategyConfigured=false', () => {
+    const msg: TwitterIntegrationConfigRequest = {
+      type: 'twitter_integration_config',
+      action: 'get_strategy',
+    };
+    const { ctx, sent } = createTestContext();
+    handleMessage(msg, {} as net.Socket, ctx);
+    expect(sent).toHaveLength(1);
+    const res = sent[0] as { type: string; success: boolean; strategy: string; strategyConfigured: boolean };
+    expect(res.type).toBe('twitter_integration_config_response');
+    expect(res.success).toBe(true);
+    expect(res.strategy).toBe('auto');
+    expect(res.strategyConfigured).toBe(false);
+  });
+  test('set_strategy persists and can be read back with strategyConfigured=true', () => {
+    // Set strategy to oauth
+    const setMsg: TwitterIntegrationConfigRequest = {
+      type: 'twitter_integration_config',
+      action: 'set_strategy',
+      strategy: 'oauth',
+    };
+    const { ctx: ctx1, sent: sent1 } = createTestContext();
+    handleMessage(setMsg, {} as net.Socket, ctx1);
+    expect(sent1).toHaveLength(1);
+    const setRes = sent1[0] as { type: string; success: boolean; strategy: string; strategyConfigured: boolean };
+    expect(setRes.success).toBe(true);
+    expect(setRes.strategy).toBe('oauth');
+    expect(setRes.strategyConfigured).toBe(true);
+    // Read it back with get_strategy
+    const getMsg: TwitterIntegrationConfigRequest = {
+      type: 'twitter_integration_config',
+      action: 'get_strategy',
+    };
+    const { ctx: ctx2, sent: sent2 } = createTestContext();
+    handleMessage(getMsg, {} as net.Socket, ctx2);
+    expect(sent2).toHaveLength(1);
+    const getRes = sent2[0] as { type: string; success: boolean; strategy: string; strategyConfigured: boolean };
+    expect(getRes.success).toBe(true);
+    expect(getRes.strategy).toBe('oauth');
+    expect(getRes.strategyConfigured).toBe(true);
+    // Verify persistence via saveRawConfig
+    expect(saveRawConfigCalls.length).toBeGreaterThan(0);
+    const lastSaved = saveRawConfigCalls[saveRawConfigCalls.length - 1]!;
+    expect(lastSaved.twitterOperationStrategy).toBe('oauth');
+  });
+  test('set_strategy with invalid value returns error', () => {
+    const msg: TwitterIntegrationConfigRequest = {
+      type: 'twitter_integration_config',
+      action: 'set_strategy',
+      strategy: 'invalid_value',
+    };
+    const { ctx, sent } = createTestContext();
+    handleMessage(msg, {} as net.Socket, ctx);
+    expect(sent).toHaveLength(1);
+    const res = sent[0] as { type: string; success: boolean; error?: string };
+    expect(res.type).toBe('twitter_integration_config_response');
+    expect(res.success).toBe(false);
+    expect(res.error).toContain('Invalid strategy value');
+    expect(res.error).toContain('invalid_value');
+  });
+  test('set_strategy without value returns error', () => {
+    const msg = {
+      type: 'twitter_integration_config',
+      action: 'set_strategy',
+    } as unknown as TwitterIntegrationConfigRequest;
+    const { ctx, sent } = createTestContext();
+    handleMessage(msg, {} as net.Socket, ctx);
+    expect(sent).toHaveLength(1);
+    const res = sent[0] as { type: string; success: boolean; error?: string };
+    expect(res.success).toBe(false);
+    expect(res.error).toContain('Invalid strategy value');
+  });
+  test('get action includes strategy field with strategyConfigured=true when set', () => {
+    // Set a specific strategy first
+    rawConfigStore = { twitterOperationStrategy: 'browser' };
+    const msg: TwitterIntegrationConfigRequest = {
+      type: 'twitter_integration_config',
+      action: 'get',
+    };
+    const { ctx, sent } = createTestContext();
+    handleMessage(msg, {} as net.Socket, ctx);
+    expect(sent).toHaveLength(1);
+    const res = sent[0] as { type: string; success: boolean; strategy: string; strategyConfigured: boolean; mode: string };
+    expect(res.type).toBe('twitter_integration_config_response');
+    expect(res.success).toBe(true);
+    expect(res.strategy).toBe('browser');
+    expect(res.strategyConfigured).toBe(true);
+  });
+  test('get action returns auto strategy by default with strategyConfigured=false', () => {
+    const msg: TwitterIntegrationConfigRequest = {
+      type: 'twitter_integration_config',
+      action: 'get',
+    };
+    const { ctx, sent } = createTestContext();
+    handleMessage(msg, {} as net.Socket, ctx);
+    expect(sent).toHaveLength(1);
+    const res = sent[0] as { type: string; success: boolean; strategy: string; strategyConfigured: boolean };
+    expect(res.strategy).toBe('auto');
+    expect(res.strategyConfigured).toBe(false);
+  });
+  test('set_strategy cycles through all valid values', () => {
+    for (const value of ['oauth', 'browser', 'auto'] as const) {
+      const msg: TwitterIntegrationConfigRequest = {
+        type: 'twitter_integration_config',
+        action: 'set_strategy',
+        strategy: value,
+      };
+      const { ctx, sent } = createTestContext();
+      handleMessage(msg, {} as net.Socket, ctx);
+      expect(sent).toHaveLength(1);
+      const res = sent[0] as { type: string; success: boolean; strategy: string };
+      expect(res.success).toBe(true);
+      expect(res.strategy).toBe(value);
+    }
+  });
 });

package/src/__tests__/hooks-runner.test.ts CHANGED

@@ -134,14 +134,18 @@ describe('Hook Runner', () => {
     expect(wsDir).toStartWith(rootDir);
   });
-  test('[experimental] times out after specified duration', async () => {
+  // Skip: child.kill() + 'close' event is unreliable on macOS when the hook
+  // script is a bash process tree — SIGTERM/SIGKILL may not trigger 'close',
+  // causing the test to hang. The timeout logic works in production but is
+  // not deterministically testable in unit tests.
+  test.skip('[experimental] times out after specified duration', async () => {
     const hook = createTestHook(hooksDir, 'slow-hook', '#!/bin/bash\nsleep 10');
     const eventData: HookEventData = { event: 'pre-tool-execute' };
     const result = await runHookScript(hook, eventData, { timeoutMs: 200 });
     expect(result.exitCode).toBeNull();
     expect(result.stderr).toContain('Hook timed out');
-  });
+  }, 10_000);
   test('handles non-existent script gracefully', async () => {
     const hook: DiscoveredHook = {

package/src/__tests__/host-file-edit-tool.test.ts CHANGED

@@ -101,4 +101,128 @@ describe('host_file_edit tool', () => {
     expect(result.isError).toBe(true);
     expect(result.content).toContain('appears multiple times');
   });
+  test('rejects missing path parameter', async () => {
+    const result = await hostFileEditTool.execute({
+      old_string: 'a',
+      new_string: 'b',
+    }, makeContext());
+    expect(result.isError).toBe(true);
+    expect(result.content).toContain('path is required');
+  });
+  test('rejects non-string old_string', async () => {
+    const dir = mkdtempSync(join(tmpdir(), 'host-file-edit-test-'));
+    testDirs.push(dir);
+    const filePath = join(dir, 'sample.txt');
+    writeFileSync(filePath, 'content\n');
+    const result = await hostFileEditTool.execute({
+      path: filePath,
+      old_string: 42,
+      new_string: 'b',
+    }, makeContext());
+    expect(result.isError).toBe(true);
+    expect(result.content).toContain('old_string is required');
+  });
+  test('rejects non-string new_string', async () => {
+    const dir = mkdtempSync(join(tmpdir(), 'host-file-edit-test-'));
+    testDirs.push(dir);
+    const filePath = join(dir, 'sample.txt');
+    writeFileSync(filePath, 'content\n');
+    const result = await hostFileEditTool.execute({
+      path: filePath,
+      old_string: 'content',
+      new_string: 42,
+    }, makeContext());
+    expect(result.isError).toBe(true);
+    expect(result.content).toContain('new_string is required');
+  });
+  test('rejects empty old_string', async () => {
+    const dir = mkdtempSync(join(tmpdir(), 'host-file-edit-test-'));
+    testDirs.push(dir);
+    const filePath = join(dir, 'sample.txt');
+    writeFileSync(filePath, 'content\n');
+    const result = await hostFileEditTool.execute({
+      path: filePath,
+      old_string: '',
+      new_string: 'b',
+    }, makeContext());
+    expect(result.isError).toBe(true);
+    expect(result.content).toContain('old_string must not be empty');
+  });
+  test('rejects identical old_string and new_string', async () => {
+    const dir = mkdtempSync(join(tmpdir(), 'host-file-edit-test-'));
+    testDirs.push(dir);
+    const filePath = join(dir, 'sample.txt');
+    writeFileSync(filePath, 'content\n');
+    const result = await hostFileEditTool.execute({
+      path: filePath,
+      old_string: 'content',
+      new_string: 'content',
+    }, makeContext());
+    expect(result.isError).toBe(true);
+    expect(result.content).toContain('old_string and new_string must be different');
+  });
+  test('returns error for nonexistent file', async () => {
+    const dir = mkdtempSync(join(tmpdir(), 'host-file-edit-test-'));
+    testDirs.push(dir);
+    const filePath = join(dir, 'missing.txt');
+    const result = await hostFileEditTool.execute({
+      path: filePath,
+      old_string: 'a',
+      new_string: 'b',
+    }, makeContext());
+    expect(result.isError).toBe(true);
+    expect(result.content).toContain('File not found');
+  });
+  test('returns diff info after successful edit', async () => {
+    const dir = mkdtempSync(join(tmpdir(), 'host-file-edit-test-'));
+    testDirs.push(dir);
+    const filePath = join(dir, 'sample.txt');
+    writeFileSync(filePath, 'before\n');
+    const result = await hostFileEditTool.execute({
+      path: filePath,
+      old_string: 'before',
+      new_string: 'after',
+    }, makeContext());
+    expect(result.isError).toBe(false);
+    expect(result.diff).toBeDefined();
+    expect(result.diff!.filePath).toBe(filePath);
+    expect(result.diff!.oldContent).toBe('before\n');
+    expect(result.diff!.newContent).toBe('after\n');
+    expect(result.diff!.isNewFile).toBe(false);
+  });
+  test('whitespace-normalized match includes note in message', async () => {
+    const dir = mkdtempSync(join(tmpdir(), 'host-file-edit-test-'));
+    testDirs.push(dir);
+    const filePath = join(dir, 'sample.txt');
+    // File has tab indentation
+    writeFileSync(filePath, 'function foo() {\n\treturn 1;\n}\n');
+    const result = await hostFileEditTool.execute({
+      path: filePath,
+      // old_string uses spaces instead of tabs — should whitespace-normalize
+      old_string: 'function foo() {\n  return 1;\n}',
+      new_string: 'function bar() {\n  return 2;\n}',
+    }, makeContext());
+    expect(result.isError).toBe(false);
+    // Should contain either whitespace normalization or fuzzy match note
+    expect(
+      result.content.includes('whitespace') || result.content.includes('fuzzy') || result.content.includes('Successfully edited')
+    ).toBe(true);
+  });
 });

package/src/__tests__/host-file-read-tool.test.ts CHANGED

@@ -58,4 +58,66 @@ describe('host_file_read tool', () => {
     expect(result.isError).toBe(true);
     expect(result.content).toContain('is not a regular file');
   });
+  test('rejects missing path parameter', async () => {
+    const result = await hostFileReadTool.execute({}, makeContext());
+    expect(result.isError).toBe(true);
+    expect(result.content).toContain('path is required');
+  });
+  test('rejects non-string path', async () => {
+    const result = await hostFileReadTool.execute({ path: 42 }, makeContext());
+    expect(result.isError).toBe(true);
+    expect(result.content).toContain('path is required and must be a string');
+  });
+  test('reads entire file when no offset or limit specified', async () => {
+    const dir = mkdtempSync(join(tmpdir(), 'host-file-read-test-'));
+    testDirs.push(dir);
+    const filePath = join(dir, 'full.txt');
+    writeFileSync(filePath, 'line1\nline2\nline3\n');
+    const result = await hostFileReadTool.execute({ path: filePath }, makeContext());
+    expect(result.isError).toBe(false);
+    expect(result.content).toContain('1  line1');
+    expect(result.content).toContain('2  line2');
+    expect(result.content).toContain('3  line3');
+  });
+  test('handles empty file', async () => {
+    const dir = mkdtempSync(join(tmpdir(), 'host-file-read-test-'));
+    testDirs.push(dir);
+    const filePath = join(dir, 'empty.txt');
+    writeFileSync(filePath, '');
+    const result = await hostFileReadTool.execute({ path: filePath }, makeContext());
+    expect(result.isError).toBe(false);
+  });
+  test('offset starts from the correct line (1-indexed)', async () => {
+    const dir = mkdtempSync(join(tmpdir(), 'host-file-read-test-'));
+    testDirs.push(dir);
+    const filePath = join(dir, 'lines.txt');
+    writeFileSync(filePath, 'a\nb\nc\nd\ne\n');
+    const result = await hostFileReadTool.execute({ path: filePath, offset: 3, limit: 1 }, makeContext());
+    expect(result.isError).toBe(false);
+    expect(result.content).toContain('3  c');
+    expect(result.content).not.toContain('2  b');
+    expect(result.content).not.toContain('4  d');
+  });
+  test('reads a file with symlinks resolved', async () => {
+    const dir = mkdtempSync(join(tmpdir(), 'host-file-read-test-'));
+    testDirs.push(dir);
+    const realFile = join(dir, 'real.txt');
+    const linkFile = join(dir, 'link.txt');
+    writeFileSync(realFile, 'symlink-content\n');
+    const { symlinkSync } = await import('node:fs');
+    symlinkSync(realFile, linkFile);
+    const result = await hostFileReadTool.execute({ path: linkFile }, makeContext());
+    expect(result.isError).toBe(false);
+    expect(result.content).toContain('symlink-content');
+  });
 });

package/src/__tests__/host-file-write-tool.test.ts CHANGED

@@ -74,4 +74,63 @@ describe('host_file_write tool', () => {
       isNewFile: false,
     });
   });
+  test('rejects missing path parameter', async () => {
+    const result = await hostFileWriteTool.execute({ content: 'data' }, makeContext());
+    expect(result.isError).toBe(true);
+    expect(result.content).toContain('path is required');
+  });
+  test('rejects non-string path', async () => {
+    const result = await hostFileWriteTool.execute({ path: 123, content: 'data' }, makeContext());
+    expect(result.isError).toBe(true);
+    expect(result.content).toContain('path is required and must be a string');
+  });
+  test('success message contains the file path', async () => {
+    const dir = mkdtempSync(join(tmpdir(), 'host-file-write-test-'));
+    testDirs.push(dir);
+    const filePath = join(dir, 'msg-check.txt');
+    const result = await hostFileWriteTool.execute({ path: filePath, content: 'check' }, makeContext());
+    expect(result.isError).toBe(false);
+    expect(result.content).toContain(`Successfully wrote to ${filePath}`);
+  });
+  test('new file message includes line count', async () => {
+    const dir = mkdtempSync(join(tmpdir(), 'host-file-write-test-'));
+    testDirs.push(dir);
+    const filePath = join(dir, 'lines.txt');
+    const result = await hostFileWriteTool.execute({
+      path: filePath,
+      content: 'line1\nline2\nline3',
+    }, makeContext());
+    expect(result.isError).toBe(false);
+    expect(result.content).toContain('new file');
+    expect(result.content).toContain('3 lines');
+  });
+  test('writes empty string content', async () => {
+    const dir = mkdtempSync(join(tmpdir(), 'host-file-write-test-'));
+    testDirs.push(dir);
+    const filePath = join(dir, 'empty.txt');
+    const result = await hostFileWriteTool.execute({ path: filePath, content: '' }, makeContext());
+    expect(result.isError).toBe(false);
+    expect(existsSync(filePath)).toBe(true);
+    expect(readFileSync(filePath, 'utf-8')).toBe('');
+  });
+  test('creates nested parent directories', async () => {
+    const dir = mkdtempSync(join(tmpdir(), 'host-file-write-test-'));
+    testDirs.push(dir);
+    const filePath = join(dir, 'a', 'b', 'c', 'deep.txt');
+    const result = await hostFileWriteTool.execute({ path: filePath, content: 'deep' }, makeContext());
+    expect(result.isError).toBe(false);
+    expect(existsSync(filePath)).toBe(true);
+    expect(readFileSync(filePath, 'utf-8')).toBe('deep');
+  });
 });

package/src/__tests__/host-shell-tool.test.ts CHANGED

@@ -309,3 +309,254 @@ describe('host_bash — regression: no proxied-mode additions', () => {
     expect((definition.input_schema as Record<string, unknown>).required).toEqual(['command', 'reason']);
   });
 });
+// ---------------------------------------------------------------------------
+// Input validation: malformed command / working_dir arguments must produce isError results
+// ---------------------------------------------------------------------------
+describe('host_bash — input validation', () => {
+  test('rejects null bytes in command', async () => {
+    const result = await hostShellTool.execute({
+      command: 'echo \0evil', // \0 embeds a NUL character inside the command string
+    }, makeContext());
+    expect(result.isError).toBe(true);
+    expect(result.content).toContain('null bytes');
+  });
+  test('rejects null bytes in working_dir', async () => {
+    const result = await hostShellTool.execute({
+      command: 'echo test', // the command itself is valid; only working_dir is malformed
+      working_dir: '/tmp/\0evil',
+    }, makeContext());
+    expect(result.isError).toBe(true);
+    expect(result.content).toContain('null bytes');
+  });
+  test('rejects empty command', async () => {
+    const result = await hostShellTool.execute({
+      command: '', // empty string is expected to be reported as a missing command
+    }, makeContext());
+    expect(result.isError).toBe(true);
+    expect(result.content).toContain('command is required');
+  });
+  test('rejects non-string command', async () => {
+    const result = await hostShellTool.execute({
+      command: 42, // deliberately the wrong type
+    }, makeContext());
+    expect(result.isError).toBe(true);
+    expect(result.content).toContain('command is required and must be a string');
+  });
+  test('rejects non-string working_dir', async () => {
+    const result = await hostShellTool.execute({
+      command: 'echo test',
+      working_dir: 123, // deliberately the wrong type
+    }, makeContext());
+    expect(result.isError).toBe(true);
+    expect(result.content).toContain('working_dir must be a string');
+  });
+});
+// ---------------------------------------------------------------------------
+// Environment setup: default working directory, PATH entries, and env-var filtering
+// ---------------------------------------------------------------------------
+describe('host_bash — environment setup', () => {
+  test('defaults working_dir to user home when not provided', async () => {
+    const { homedir } = await import('node:os');
+    const result = await hostShellTool.execute({
+      command: 'pwd', // prints the directory the command actually ran in
+    }, makeContext());
+    expect(result.isError).toBe(false);
+    expect(result.content.trim()).toBe(realpathSync(homedir())); // compare against the symlink-resolved home path
+  });
+  test('PATH includes ~/.local/bin and ~/.bun/bin', async () => {
+    const { homedir } = await import('node:os');
+    const home = homedir();
+    const result = await hostShellTool.execute({
+      command: 'echo "$PATH"',
+    }, makeContext());
+    expect(result.isError).toBe(false);
+    expect(result.content).toContain(`${home}/.local/bin`);
+    expect(result.content).toContain(`${home}/.bun/bin`);
+  });
+  test('does not leak non-allowlisted env vars', async () => {
+    // Set a custom env var that is NOT in the SAFE_ENV_VARS allowlist
+    const varName = 'VELLUM_TEST_UNLISTED_VAR';
+    const originalVal = process.env[varName]; // remembered so the finally block can restore it
+    process.env[varName] = 'should-not-appear';
+    try {
+      const result = await hostShellTool.execute({
+        command: 'env', // dumps the environment visible to the spawned command
+      }, makeContext());
+      expect(result.isError).toBe(false);
+      expect(result.content).not.toContain(varName); // neither the name...
+      expect(result.content).not.toContain('should-not-appear'); // ...nor the value may show up
+    } finally { // restore process.env even when an assertion above throws
+      if (originalVal === undefined) {
+        delete process.env[varName];
+      } else {
+        process.env[varName] = originalVal;
+      }
+    }
+  });
+  test('includes safe env vars like HOME and TERM', async () => { // NOTE(review): only HOME is asserted below; TERM is never checked
+    const result = await hostShellTool.execute({
+      command: 'echo "HOME=$HOME"',
+    }, makeContext());
+    expect(result.isError).toBe(false);
+    expect(result.content).toContain('HOME=');
+    expect(result.content.trim()).not.toBe('HOME='); // a bare "HOME=" would mean the variable was empty or unset
+  });
+});
+// ---------------------------------------------------------------------------
+// Timeout handling: custom timeout_seconds and behavior for out-of-range values
+// ---------------------------------------------------------------------------
+describe('host_bash — timeout handling', () => {
+  test('respects custom timeout_seconds', async () => {
+    const result = await hostShellTool.execute({
+      command: 'sleep 5', // runs longer than the 1-second timeout requested below
+      timeout_seconds: 1,
+    }, makeContext());
+    expect(result.isError).toBe(true);
+    expect(result.content).toContain('command_timeout');
+  });
+  test('clamps timeout to at least 1 second', async () => {
+    // A timeout_seconds of 0 should be clamped to 1
+    const result = await hostShellTool.execute({
+      command: 'echo fast',
+      timeout_seconds: 0,
+    }, makeContext());
+    // Should still complete — 1 second is enough for echo
+    expect(result.isError).toBe(false);
+    expect(result.content.trim()).toBe('fast');
+  });
+  test('clamps timeout to max configured value', async () => {
+    // Request a timeout larger than the configured max (600). NOTE(review): the effective clamped value is not asserted; this only shows an oversized value does not break execution.
+    const result = await hostShellTool.execute({
+      command: 'echo capped',
+      timeout_seconds: 9999,
+    }, makeContext());
+    expect(result.isError).toBe(false);
+    expect(result.content.trim()).toBe('capped');
+  });
+});
+// ---------------------------------------------------------------------------
+// Streaming output and abort signal: onOutput receives chunks; an aborted signal yields an error result
+// ---------------------------------------------------------------------------
+describe('host_bash — streaming and cancellation', () => {
+  test('calls onOutput callback with stdout chunks', async () => {
+    const chunks: string[] = []; // collects every chunk handed to onOutput
+    const ctx = {
+      ...makeContext(),
+      onOutput: (chunk: string) => chunks.push(chunk),
+    };
+    const result = await hostShellTool.execute({
+      command: 'echo streamed-output',
+    }, ctx);
+    expect(result.isError).toBe(false);
+    expect(chunks.join('')).toContain('streamed-output'); // joined because the chunk boundaries are not specified
+  });
+  test('calls onOutput callback with stderr chunks', async () => {
+    const chunks: string[] = []; // collects every chunk handed to onOutput
+    const ctx = {
+      ...makeContext(),
+      onOutput: (chunk: string) => chunks.push(chunk),
+    };
+    await hostShellTool.execute({
+      command: 'echo stderr-data >&2', // redirect echo's output to stderr
+    }, ctx);
+    expect(chunks.join('')).toContain('stderr-data'); // only the streamed chunks are checked; the result is not inspected
+  });
+  test('kills process when abort signal fires', async () => {
+    const ac = new AbortController();
+    // Start a long-running command then abort it quickly
+    const promise = hostShellTool.execute({
+      command: 'sleep 30',
+    }, { ...makeContext(), signal: ac.signal });
+    // Give the process a moment to start
+    await new Promise(r => setTimeout(r, 100));
+    ac.abort();
+    const result = await promise; // resolves once the aborted command has finished
+    // The process was killed, so it should report an error (non-zero exit)
+    expect(result.isError).toBe(true);
+  });
+  test('immediately kills process if signal already aborted', async () => {
+    const ac = new AbortController();
+    ac.abort(); // the signal is already aborted before execute() is called
+    const result = await hostShellTool.execute({
+      command: 'sleep 30',
+    }, { ...makeContext(), signal: ac.signal });
+    expect(result.isError).toBe(true);
+  });
+});
+// ---------------------------------------------------------------------------
+// Error handling for spawn failures, plus combined stdout/stderr capture and the empty-output marker
+// ---------------------------------------------------------------------------
+describe('host_bash — spawn error handling', () => {
+  test('reports error when working_dir does not exist', async () => {
+    const result = await hostShellTool.execute({
+      command: 'echo test',
+      working_dir: '/nonexistent/path/that/does/not/exist', // a directory assumed not to exist on the test host
+    }, makeContext());
+    expect(result.isError).toBe(true);
+    expect(result.content).toContain('Error spawning command');
+  });
+  test('captures both stdout and stderr in output', async () => {
+    const result = await hostShellTool.execute({
+      command: 'echo out && echo err >&2', // writes "out" to stdout and "err" to stderr
+    }, makeContext());
+    expect(result.content).toContain('out');
+    expect(result.content).toContain('err'); // isError is intentionally not asserted in this test
+  });
+  test('returns completed marker for successful empty output', async () => {
+    const result = await hostShellTool.execute({
+      command: 'true', // exits successfully without printing anything
+    }, makeContext());
+    expect(result.isError).toBe(false);
+    expect(result.content).toContain('<command_completed />');
+  });
+});