@vellumai/assistant 0.3.2 → 0.3.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (109) hide show
  1. package/README.md +82 -21
  2. package/package.json +1 -1
  3. package/src/__tests__/__snapshots__/ipc-snapshot.test.ts.snap +16 -0
  4. package/src/__tests__/app-git-history.test.ts +22 -27
  5. package/src/__tests__/app-git-service.test.ts +44 -78
  6. package/src/__tests__/call-orchestrator.test.ts +321 -0
  7. package/src/__tests__/channel-approval-routes.test.ts +1267 -93
  8. package/src/__tests__/channel-approval.test.ts +2 -0
  9. package/src/__tests__/channel-approvals.test.ts +51 -2
  10. package/src/__tests__/channel-delivery-store.test.ts +130 -1
  11. package/src/__tests__/channel-guardian.test.ts +371 -1
  12. package/src/__tests__/config-schema.test.ts +1 -1
  13. package/src/__tests__/credential-security-invariants.test.ts +1 -0
  14. package/src/__tests__/daemon-lifecycle.test.ts +635 -0
  15. package/src/__tests__/daemon-server-session-init.test.ts +5 -0
  16. package/src/__tests__/gateway-only-enforcement.test.ts +106 -21
  17. package/src/__tests__/handlers-telegram-config.test.ts +82 -0
  18. package/src/__tests__/handlers-twilio-config.test.ts +738 -5
  19. package/src/__tests__/ingress-url-consistency.test.ts +64 -0
  20. package/src/__tests__/ipc-snapshot.test.ts +10 -0
  21. package/src/__tests__/run-orchestrator.test.ts +1 -1
  22. package/src/__tests__/secret-scanner.test.ts +223 -0
  23. package/src/__tests__/session-process-bridge.test.ts +2 -0
  24. package/src/__tests__/shell-parser-property.test.ts +357 -2
  25. package/src/__tests__/system-prompt.test.ts +25 -1
  26. package/src/__tests__/tool-executor-lifecycle-events.test.ts +34 -1
  27. package/src/__tests__/tool-permission-simulate-handler.test.ts +2 -2
  28. package/src/__tests__/user-reference.test.ts +68 -0
  29. package/src/calls/call-orchestrator.ts +63 -11
  30. package/src/calls/twilio-config.ts +10 -1
  31. package/src/calls/twilio-rest.ts +70 -0
  32. package/src/cli/map.ts +6 -0
  33. package/src/commands/__tests__/cc-command-registry.test.ts +67 -0
  34. package/src/commands/cc-command-registry.ts +14 -1
  35. package/src/config/bundled-skills/claude-code/TOOLS.json +10 -3
  36. package/src/config/bundled-skills/email-setup/SKILL.md +56 -0
  37. package/src/config/bundled-skills/messaging/SKILL.md +4 -0
  38. package/src/config/bundled-skills/subagent/SKILL.md +4 -0
  39. package/src/config/bundled-skills/subagent/TOOLS.json +4 -0
  40. package/src/config/defaults.ts +1 -1
  41. package/src/config/schema.ts +6 -3
  42. package/src/config/skills.ts +5 -32
  43. package/src/config/system-prompt.ts +16 -0
  44. package/src/config/user-reference.ts +29 -0
  45. package/src/config/vellum-skills/catalog.json +52 -0
  46. package/src/config/vellum-skills/telegram-setup/SKILL.md +6 -1
  47. package/src/config/vellum-skills/twilio-setup/SKILL.md +49 -4
  48. package/src/daemon/auth-manager.ts +103 -0
  49. package/src/daemon/computer-use-session.ts +8 -1
  50. package/src/daemon/config-watcher.ts +253 -0
  51. package/src/daemon/handlers/config.ts +193 -17
  52. package/src/daemon/handlers/sessions.ts +5 -3
  53. package/src/daemon/handlers/skills.ts +60 -17
  54. package/src/daemon/ipc-contract-inventory.json +4 -0
  55. package/src/daemon/ipc-contract.ts +16 -0
  56. package/src/daemon/ipc-handler.ts +87 -0
  57. package/src/daemon/lifecycle.ts +16 -4
  58. package/src/daemon/ride-shotgun-handler.ts +11 -1
  59. package/src/daemon/server.ts +105 -502
  60. package/src/daemon/session-agent-loop.ts +9 -14
  61. package/src/daemon/session-process.ts +20 -3
  62. package/src/daemon/session-runtime-assembly.ts +60 -44
  63. package/src/daemon/session-slash.ts +50 -2
  64. package/src/daemon/session-surfaces.ts +17 -1
  65. package/src/daemon/session.ts +8 -1
  66. package/src/inbound/public-ingress-urls.ts +20 -3
  67. package/src/index.ts +1 -23
  68. package/src/memory/app-git-service.ts +24 -0
  69. package/src/memory/app-store.ts +0 -21
  70. package/src/memory/channel-delivery-store.ts +74 -3
  71. package/src/memory/channel-guardian-store.ts +54 -26
  72. package/src/memory/conversation-key-store.ts +20 -0
  73. package/src/memory/conversation-store.ts +14 -2
  74. package/src/memory/db-connection.ts +28 -0
  75. package/src/memory/db-init.ts +1019 -0
  76. package/src/memory/db.ts +2 -1995
  77. package/src/memory/embedding-backend.ts +79 -11
  78. package/src/memory/indexer.ts +2 -0
  79. package/src/memory/job-utils.ts +64 -4
  80. package/src/memory/jobs-worker.ts +7 -1
  81. package/src/memory/recall-cache.ts +107 -0
  82. package/src/memory/retriever.ts +30 -1
  83. package/src/memory/schema-migration.ts +984 -0
  84. package/src/memory/schema.ts +6 -0
  85. package/src/memory/search/types.ts +2 -0
  86. package/src/permissions/prompter.ts +14 -3
  87. package/src/permissions/trust-store.ts +7 -0
  88. package/src/runtime/channel-approvals.ts +17 -3
  89. package/src/runtime/gateway-client.ts +2 -1
  90. package/src/runtime/http-server.ts +28 -9
  91. package/src/runtime/routes/channel-routes.ts +279 -100
  92. package/src/runtime/routes/run-routes.ts +7 -1
  93. package/src/runtime/run-orchestrator.ts +8 -1
  94. package/src/security/secret-scanner.ts +218 -0
  95. package/src/skills/clawhub.ts +6 -2
  96. package/src/skills/frontmatter.ts +63 -0
  97. package/src/skills/slash-commands.ts +23 -0
  98. package/src/skills/vellum-catalog-remote.ts +107 -0
  99. package/src/subagent/manager.ts +4 -1
  100. package/src/subagent/types.ts +2 -0
  101. package/src/tools/browser/auto-navigate.ts +132 -24
  102. package/src/tools/browser/browser-manager.ts +67 -61
  103. package/src/tools/claude-code/claude-code.ts +55 -3
  104. package/src/tools/executor.ts +10 -2
  105. package/src/tools/skills/vellum-catalog.ts +75 -127
  106. package/src/tools/subagent/spawn.ts +2 -0
  107. package/src/tools/terminal/parser.ts +21 -5
  108. package/src/util/platform.ts +8 -1
  109. package/src/util/retry.ts +4 -4
@@ -27,6 +27,14 @@ mock.module('../util/logger.js', () => ({
27
27
  }),
28
28
  }));
29
29
 
30
+ // ── User reference mock ──────────────────────────────────────────────
31
+
32
+ let mockUserReference = 'my human';
33
+
34
+ mock.module('../config/user-reference.js', () => ({
35
+ resolveUserReference: () => mockUserReference,
36
+ }));
37
+
30
38
  // ── Config mock ─────────────────────────────────────────────────────
31
39
 
32
40
  let mockCallModel: string | undefined = undefined;
@@ -197,6 +205,7 @@ describe('call-orchestrator', () => {
197
205
  beforeEach(() => {
198
206
  resetTables();
199
207
  mockCallModel = undefined;
208
+ mockUserReference = 'my human';
200
209
  // Reset the stream mock to default behaviour
201
210
  mockStreamFn.mockImplementation(() => createMockStream(['Hello', ' there']));
202
211
  });
@@ -414,6 +423,166 @@ describe('call-orchestrator', () => {
414
423
  orchestrator.destroy();
415
424
  });
416
425
 
426
+ test('LLM APIUserAbortError: treats as expected abort without technical-issue fallback', async () => {
427
+ mockStreamFn.mockImplementation(() => {
428
+ const emitter = new EventEmitter();
429
+ return {
430
+ on: (event: string, handler: (...args: unknown[]) => void) => {
431
+ emitter.on(event, handler);
432
+ return { on: () => ({ on: () => ({}) }) };
433
+ },
434
+ finalMessage: () => {
435
+ const err = new Error('user abort');
436
+ err.name = 'APIUserAbortError';
437
+ return Promise.reject(err);
438
+ },
439
+ };
440
+ });
441
+
442
+ const { relay, orchestrator } = setupOrchestrator();
443
+ await orchestrator.handleCallerUtterance('Hello');
444
+
445
+ const errorTokens = relay.sentTokens.filter((t) => t.token.includes('technical issue'));
446
+ expect(errorTokens.length).toBe(0);
447
+ expect(orchestrator.getState()).toBe('idle');
448
+
449
+ orchestrator.destroy();
450
+ });
451
+
452
+ test('stale superseded turn errors do not emit technical-issue fallback', async () => {
453
+ let callCount = 0;
454
+ mockStreamFn.mockImplementation(() => {
455
+ callCount++;
456
+ if (callCount === 1) {
457
+ const emitter = new EventEmitter();
458
+ return {
459
+ on: (event: string, handler: (...args: unknown[]) => void) => {
460
+ emitter.on(event, handler);
461
+ return { on: () => ({ on: () => ({}) }) };
462
+ },
463
+ finalMessage: () =>
464
+ new Promise((_, reject) => {
465
+ setTimeout(() => reject(new Error('stale stream failure')), 20);
466
+ }),
467
+ };
468
+ }
469
+ return createMockStream(['Second turn response.']);
470
+ });
471
+
472
+ const { relay, orchestrator } = setupOrchestrator();
473
+
474
+ const firstTurnPromise = orchestrator.handleCallerUtterance('First utterance');
475
+ // Allow the first turn to enter runLlm before the second utterance interrupts it.
476
+ await new Promise((r) => setTimeout(r, 5));
477
+ const secondTurnPromise = orchestrator.handleCallerUtterance('Second utterance');
478
+
479
+ await Promise.all([firstTurnPromise, secondTurnPromise]);
480
+
481
+ const allTokens = relay.sentTokens.map((t) => t.token).join('');
482
+ expect(allTokens).toContain('Second turn response.');
483
+ expect(allTokens).not.toContain('technical issue');
484
+
485
+ orchestrator.destroy();
486
+ });
487
+
488
+ test('rapid caller barge-in coalesces contiguous user turns for role alternation', async () => {
489
+ let callCount = 0;
490
+ mockStreamFn.mockImplementation((...args: unknown[]) => {
491
+ callCount++;
492
+ if (callCount === 1) {
493
+ const emitter = new EventEmitter();
494
+ const options = args[1] as { signal?: AbortSignal } | undefined;
495
+ return {
496
+ on: (event: string, handler: (...evtArgs: unknown[]) => void) => {
497
+ emitter.on(event, handler);
498
+ return { on: () => ({ on: () => ({}) }) };
499
+ },
500
+ finalMessage: () =>
501
+ new Promise((_, reject) => {
502
+ options?.signal?.addEventListener('abort', () => {
503
+ const err = new Error('aborted');
504
+ err.name = 'AbortError';
505
+ reject(err);
506
+ }, { once: true });
507
+ }),
508
+ };
509
+ }
510
+
511
+ const firstArg = args[0] as { messages: Array<{ role: string; content: string }> };
512
+ const roles = firstArg.messages.map((m) => m.role);
513
+ for (let i = 1; i < roles.length; i++) {
514
+ expect(!(roles[i - 1] === 'user' && roles[i] === 'user')).toBe(true);
515
+ }
516
+ const userMessages = firstArg.messages.filter((m) => m.role === 'user');
517
+ const lastUser = userMessages[userMessages.length - 1];
518
+ expect(lastUser?.content).toContain('First caller utterance');
519
+ expect(lastUser?.content).toContain('Second caller utterance');
520
+ return createMockStream(['Merged turn handled.']);
521
+ });
522
+
523
+ const { relay, orchestrator } = setupOrchestrator();
524
+ const firstTurnPromise = orchestrator.handleCallerUtterance('First caller utterance');
525
+ await new Promise((r) => setTimeout(r, 5));
526
+ const secondTurnPromise = orchestrator.handleCallerUtterance('Second caller utterance');
527
+
528
+ await Promise.all([firstTurnPromise, secondTurnPromise]);
529
+
530
+ const allTokens = relay.sentTokens.map((t) => t.token).join('');
531
+ expect(allTokens).toContain('Merged turn handled.');
532
+
533
+ orchestrator.destroy();
534
+ });
535
+
536
+ test('interrupt then next caller prompt still preserves role alternation', async () => {
537
+ let callCount = 0;
538
+ mockStreamFn.mockImplementation((...args: unknown[]) => {
539
+ callCount++;
540
+ if (callCount === 1) {
541
+ const emitter = new EventEmitter();
542
+ const options = args[1] as { signal?: AbortSignal } | undefined;
543
+ return {
544
+ on: (event: string, handler: (...evtArgs: unknown[]) => void) => {
545
+ emitter.on(event, handler);
546
+ return { on: () => ({ on: () => ({}) }) };
547
+ },
548
+ finalMessage: () =>
549
+ new Promise((_, reject) => {
550
+ options?.signal?.addEventListener('abort', () => {
551
+ const err = new Error('aborted');
552
+ err.name = 'AbortError';
553
+ reject(err);
554
+ }, { once: true });
555
+ }),
556
+ };
557
+ }
558
+
559
+ const firstArg = args[0] as { messages: Array<{ role: string; content: string }> };
560
+ const roles = firstArg.messages.map((m) => m.role);
561
+ for (let i = 1; i < roles.length; i++) {
562
+ expect(!(roles[i - 1] === 'user' && roles[i] === 'user')).toBe(true);
563
+ }
564
+ const userMessages = firstArg.messages.filter((m) => m.role === 'user');
565
+ const lastUser = userMessages[userMessages.length - 1];
566
+ expect(lastUser?.content).toContain('First caller utterance');
567
+ expect(lastUser?.content).toContain('Second caller utterance');
568
+ return createMockStream(['Post-interrupt response.']);
569
+ });
570
+
571
+ const { relay, orchestrator } = setupOrchestrator();
572
+ const firstTurnPromise = orchestrator.handleCallerUtterance('First caller utterance');
573
+ await new Promise((r) => setTimeout(r, 5));
574
+ orchestrator.handleInterrupt();
575
+ const secondTurnPromise = orchestrator.handleCallerUtterance('Second caller utterance');
576
+
577
+ await Promise.all([firstTurnPromise, secondTurnPromise]);
578
+
579
+ const allTokens = relay.sentTokens.map((t) => t.token).join('');
580
+ expect(allTokens).toContain('Post-interrupt response.');
581
+ expect(allTokens).not.toContain('technical issue');
582
+
583
+ orchestrator.destroy();
584
+ });
585
+
417
586
  test('handleUserAnswer: returns false when not in waiting_on_user state', async () => {
418
587
  const { orchestrator } = setupOrchestrator();
419
588
 
@@ -435,6 +604,87 @@ describe('call-orchestrator', () => {
435
604
  orchestrator.destroy();
436
605
  });
437
606
 
607
+ test('handleInterrupt: increments llmRunVersion to suppress stale turn side effects', async () => {
608
+ // Use a stream whose finalMessage resolves immediately but whose
609
+ // continuation (the code after `await stream.finalMessage()`) will
610
+ // run asynchronously. This simulates the race where the promise
611
+ // microtask is queued right as handleInterrupt fires.
612
+ mockStreamFn.mockImplementation(() => {
613
+ const emitter = new EventEmitter();
614
+ return {
615
+ on: (event: string, handler: (...args: unknown[]) => void) => {
616
+ emitter.on(event, handler);
617
+ return { on: () => ({ on: () => ({}) }) };
618
+ },
619
+ finalMessage: () => {
620
+ // Emit some tokens synchronously
621
+ emitter.emit('text', 'Stale response that should be suppressed.');
622
+ return Promise.resolve({
623
+ content: [{ type: 'text', text: 'Stale response that should be suppressed.' }],
624
+ });
625
+ },
626
+ };
627
+ });
628
+
629
+ const { relay, orchestrator } = setupOrchestrator();
630
+
631
+ // Start an LLM turn (don't await — we want to interrupt mid-flight)
632
+ const turnPromise = orchestrator.handleCallerUtterance('Hello');
633
+
634
+ // Interrupt immediately. Because finalMessage resolves as a microtask,
635
+ // its continuation hasn't run yet. handleInterrupt increments
636
+ // llmRunVersion so the continuation's isCurrentRun check will fail.
637
+ orchestrator.handleInterrupt();
638
+
639
+ // Let the stale turn's microtask continuation execute
640
+ await turnPromise;
641
+
642
+ // The orchestrator should remain idle — the stale turn must not
643
+ // have pushed state to waiting_on_user or any other post-turn state.
644
+ expect(orchestrator.getState()).toBe('idle');
645
+
646
+ // No technical-issue fallback should have been sent
647
+ const errorTokens = relay.sentTokens.filter((t) => t.token.includes('technical issue'));
648
+ expect(errorTokens.length).toBe(0);
649
+
650
+ // endSession should NOT have been called by the stale turn
651
+ expect(relay.endCalled).toBe(false);
652
+
653
+ orchestrator.destroy();
654
+ });
655
+
656
+ test('handleInterrupt: sends turn terminator when interrupting active speech', async () => {
657
+ mockStreamFn.mockImplementation((...args: unknown[]) => {
658
+ const emitter = new EventEmitter();
659
+ const options = args[1] as { signal?: AbortSignal } | undefined;
660
+ return {
661
+ on: (event: string, handler: (...evtArgs: unknown[]) => void) => {
662
+ emitter.on(event, handler);
663
+ return { on: () => ({ on: () => ({}) }) };
664
+ },
665
+ finalMessage: () =>
666
+ new Promise((_, reject) => {
667
+ options?.signal?.addEventListener('abort', () => {
668
+ const err = new Error('aborted');
669
+ err.name = 'AbortError';
670
+ reject(err);
671
+ }, { once: true });
672
+ }),
673
+ };
674
+ });
675
+
676
+ const { relay, orchestrator } = setupOrchestrator();
677
+ const turnPromise = orchestrator.handleCallerUtterance('Start speaking');
678
+ await new Promise((r) => setTimeout(r, 5));
679
+ orchestrator.handleInterrupt();
680
+ await turnPromise;
681
+
682
+ const endTurnMarkers = relay.sentTokens.filter((t) => t.token === '' && t.last === true);
683
+ expect(endTurnMarkers.length).toBeGreaterThan(0);
684
+
685
+ orchestrator.destroy();
686
+ });
687
+
438
688
  // ── destroy ───────────────────────────────────────────────────────
439
689
 
440
690
  test('destroy: unregisters orchestrator', () => {
@@ -622,4 +872,75 @@ describe('call-orchestrator', () => {
622
872
 
623
873
  orchestrator.destroy();
624
874
  });
875
+
876
+ // ── System prompt: identity phrasing ────────────────────────────────
877
+
878
+ test('system prompt contains resolved user reference (default)', async () => {
879
+ mockStreamFn.mockImplementation((...args: unknown[]) => {
880
+ const firstArg = args[0] as { system: string };
881
+ expect(firstArg.system).toContain('on behalf of my human');
882
+ return createMockStream(['Hello.']);
883
+ });
884
+
885
+ const { orchestrator } = setupOrchestrator();
886
+ await orchestrator.handleCallerUtterance('Hi');
887
+ orchestrator.destroy();
888
+ });
889
+
890
+ test('system prompt contains resolved user reference when set to a name', async () => {
891
+ mockUserReference = 'John';
892
+ mockStreamFn.mockImplementation((...args: unknown[]) => {
893
+ const firstArg = args[0] as { system: string };
894
+ expect(firstArg.system).toContain('on behalf of John');
895
+ return createMockStream(['Hello John\'s contact.']);
896
+ });
897
+
898
+ const { orchestrator } = setupOrchestrator();
899
+ await orchestrator.handleCallerUtterance('Hi');
900
+ orchestrator.destroy();
901
+ });
902
+
903
+ test('system prompt does not hardcode "your user" in the opening line', async () => {
904
+ mockUserReference = 'Alice';
905
+ mockStreamFn.mockImplementation((...args: unknown[]) => {
906
+ const firstArg = args[0] as { system: string };
907
+ expect(firstArg.system).not.toContain('on behalf of your user');
908
+ expect(firstArg.system).toContain('on behalf of Alice');
909
+ return createMockStream(['Hi there.']);
910
+ });
911
+
912
+ const { orchestrator } = setupOrchestrator();
913
+ await orchestrator.handleCallerUtterance('Hello');
914
+ orchestrator.destroy();
915
+ });
916
+
917
+ test('system prompt includes assistant identity bias rule', async () => {
918
+ mockStreamFn.mockImplementation((...args: unknown[]) => {
919
+ const firstArg = args[0] as { system: string };
920
+ expect(firstArg.system).toContain('refer to yourself as an assistant');
921
+ expect(firstArg.system).toContain('Avoid the phrase "AI assistant" unless directly asked');
922
+ return createMockStream(['Sure thing.']);
923
+ });
924
+
925
+ const { orchestrator } = setupOrchestrator();
926
+ await orchestrator.handleCallerUtterance('Hi');
927
+ orchestrator.destroy();
928
+ });
929
+
930
+ test('assistant identity rule appears before disclosure rule in prompt', async () => {
931
+ mockStreamFn.mockImplementation((...args: unknown[]) => {
932
+ const firstArg = args[0] as { system: string };
933
+ const prompt = firstArg.system;
934
+ const identityIdx = prompt.indexOf('refer to yourself as an assistant');
935
+ const disclosureIdx = prompt.indexOf('Be concise');
936
+ expect(identityIdx).toBeGreaterThan(-1);
937
+ expect(disclosureIdx).toBeGreaterThan(-1);
938
+ expect(identityIdx).toBeLessThan(disclosureIdx);
939
+ return createMockStream(['OK.']);
940
+ });
941
+
942
+ const { orchestrator } = setupOrchestrator();
943
+ await orchestrator.handleCallerUtterance('Test');
944
+ orchestrator.destroy();
945
+ });
625
946
  });