@jaggerxtrm/specialists 3.14.1 → 3.15.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (83) hide show
  1. package/LICENSE +21 -0
  2. package/README.md +24 -3
  3. package/config/catalog/gitnexus.json +12 -0
  4. package/config/catalog/index.json +59 -0
  5. package/config/catalog/native.json +12 -0
  6. package/config/catalog/serena.json +12 -0
  7. package/config/mandatory-rules/README.md +7 -6
  8. package/config/mandatory-rules/code-quality-defaults.md +5 -0
  9. package/config/mandatory-rules/diagnose-loop.md +13 -0
  10. package/config/mandatory-rules/gitnexus-required.md +1 -0
  11. package/config/mandatory-rules/research-tool-routing.md +12 -0
  12. package/config/mandatory-rules/security-review-defaults.md +9 -0
  13. package/config/mandatory-rules/serena-cheatsheet.md +16 -4
  14. package/config/presets.json +1 -1
  15. package/config/skills/memory-audit-transaction/SKILL.md +196 -0
  16. package/config/skills/memory-audit-transaction/scripts/pre-bulk-export.sh +58 -0
  17. package/config/skills/using-specialists/SKILL.md +13 -12
  18. package/config/skills/using-specialists-auto/SKILL.md +137 -0
  19. package/config/skills/using-specialists-v2/SKILL.md +14 -21
  20. package/config/skills/using-specialists-v3/SKILL.md +399 -27
  21. package/config/specialists/changelog-drafter.specialist.json +3 -2
  22. package/config/specialists/changelog-keeper.specialist.json +1 -1
  23. package/config/specialists/code-sanity.specialist.json +3 -5
  24. package/config/specialists/debugger.specialist.json +4 -8
  25. package/config/specialists/executor.specialist.json +6 -8
  26. package/config/specialists/explorer.specialist.json +7 -8
  27. package/config/specialists/memory-processor.specialist.json +14 -7
  28. package/config/specialists/node-coordinator.specialist.json +2 -2
  29. package/config/specialists/overthinker.specialist.json +7 -10
  30. package/config/specialists/planner.specialist.json +3 -4
  31. package/config/specialists/researcher.specialist.json +15 -19
  32. package/config/specialists/reviewer.specialist.json +4 -8
  33. package/config/specialists/security-auditor.specialist.json +3 -8
  34. package/config/specialists/specialists-creator.specialist.json +4 -2
  35. package/config/specialists/test-runner.specialist.json +10 -10
  36. package/config/specialists/xt-merge.specialist.json +10 -4
  37. package/dist/asset-contract.json +205 -0
  38. package/dist/index.js +1990 -704
  39. package/dist/lib.js +99 -17
  40. package/dist/types/cli/clean.d.ts.map +1 -1
  41. package/dist/types/cli/doctor.d.ts +1 -0
  42. package/dist/types/cli/doctor.d.ts.map +1 -1
  43. package/dist/types/cli/edit.d.ts.map +1 -1
  44. package/dist/types/cli/epic.d.ts +0 -1
  45. package/dist/types/cli/epic.d.ts.map +1 -1
  46. package/dist/types/cli/feed.d.ts.map +1 -1
  47. package/dist/types/cli/finalize.d.ts +2 -0
  48. package/dist/types/cli/finalize.d.ts.map +1 -0
  49. package/dist/types/cli/format-helpers.d.ts.map +1 -1
  50. package/dist/types/cli/init.d.ts.map +1 -1
  51. package/dist/types/cli/list-rules.d.ts.map +1 -1
  52. package/dist/types/cli/merge.d.ts +4 -3
  53. package/dist/types/cli/merge.d.ts.map +1 -1
  54. package/dist/types/cli/ps.d.ts.map +1 -1
  55. package/dist/types/cli/quickstart.d.ts.map +1 -1
  56. package/dist/types/cli/run.d.ts +1 -0
  57. package/dist/types/cli/run.d.ts.map +1 -1
  58. package/dist/types/pi/session.d.ts.map +1 -1
  59. package/dist/types/specialist/epic-lifecycle.d.ts +5 -5
  60. package/dist/types/specialist/epic-lifecycle.d.ts.map +1 -1
  61. package/dist/types/specialist/epic-readiness.d.ts +1 -1
  62. package/dist/types/specialist/epic-readiness.d.ts.map +1 -1
  63. package/dist/types/specialist/jobRegistry.d.ts +5 -0
  64. package/dist/types/specialist/jobRegistry.d.ts.map +1 -1
  65. package/dist/types/specialist/observability-sqlite.d.ts +8 -0
  66. package/dist/types/specialist/observability-sqlite.d.ts.map +1 -1
  67. package/dist/types/specialist/process-health.d.ts +77 -0
  68. package/dist/types/specialist/process-health.d.ts.map +1 -0
  69. package/dist/types/specialist/runner.d.ts.map +1 -1
  70. package/dist/types/specialist/schema.d.ts +162 -0
  71. package/dist/types/specialist/schema.d.ts.map +1 -1
  72. package/dist/types/specialist/script-runner.d.ts +31 -1
  73. package/dist/types/specialist/script-runner.d.ts.map +1 -1
  74. package/dist/types/specialist/supervisor.d.ts +8 -0
  75. package/dist/types/specialist/supervisor.d.ts.map +1 -1
  76. package/dist/types/specialist/timeline-query.d.ts +1 -1
  77. package/dist/types/specialist/timeline-query.d.ts.map +1 -1
  78. package/dist/types/specialist/worktree.d.ts.map +1 -1
  79. package/package.json +32 -7
  80. package/config/benchmarks/executor-benchmark-matrix.json +0 -25
  81. package/config/mandatory-rules/debugger-trace-first.md +0 -5
  82. package/config/skills/using-specialists/evals/evals.json +0 -68
  83. package/config/skills/using-specialists-v3/evals/evals.json +0 -89
@@ -1,25 +0,0 @@
1
- {
2
- "id": "unitAI-gc2a",
3
- "replicate": 1,
4
- "reviewerModel": "openai-codex/gpt-5.4-mini",
5
- "models": [
6
- "openai-codex/gpt-5.3-codex",
7
- "openai-codex/gpt-5.4-mini",
8
- "dashscope/qwen3.5-plus",
9
- "zai/glm-5"
10
- ],
11
- "tasks": [
12
- {
13
- "id": "bug-fix",
14
- "seedBead": "unitAI-y4ia"
15
- },
16
- {
17
- "id": "refactor",
18
- "seedBead": "unitAI-22tq"
19
- },
20
- {
21
- "id": "implementation",
22
- "seedBead": "unitAI-8zui"
23
- }
24
- ]
25
- }
@@ -1,5 +0,0 @@
1
- ---
2
- name: debugger-trace-first
3
- kind: mandatory-rule
4
- ---
5
- Trace from symptom to cause before editing. Pinpoint suspects, then patch and verify.
@@ -1,68 +0,0 @@
1
- {
2
- "skill_name": "specialists-usage",
3
- "evals": [
4
- {
5
- "id": 1,
6
- "eval_name": "bug-investigation",
7
- "prompt": "I'm seeing intermittent failures where specialist jobs show status 'done' in `specialists feed` but `specialists result` says they're still running. Can you investigate what's causing this inconsistency in the job lifecycle?",
8
- "expected_output": "Agent delegates to a specialist (e.g. bug-hunt) rather than diving into the source code themselves. Should create a bead first, then run the specialist with --bead.",
9
- "assertions": [
10
- {
11
- "name": "invokes_specialist",
12
- "description": "Agent runs `specialists run` or calls use_specialist/start_specialist instead of reading source files directly"
13
- },
14
- {
15
- "name": "creates_bead_first",
16
- "description": "Agent creates a tracking bead before invoking the specialist"
17
- },
18
- {
19
- "name": "does_not_self_investigate",
20
- "description": "Agent does not read supervisor.ts, status.json, or other source files to investigate the bug themselves"
21
- }
22
- ],
23
- "files": []
24
- },
25
- {
26
- "id": 2,
27
- "eval_name": "code-review",
28
- "prompt": "The specialist runner module at src/specialist/runner.ts is the core execution layer. Can you review it for bugs, edge cases, and code quality issues? It's about 300 lines and fairly complex.",
29
- "expected_output": "Agent delegates to a specialist (e.g. parallel-review or codebase-explorer) rather than reading the file and writing a review themselves. Should create a bead first.",
30
- "assertions": [
31
- {
32
- "name": "invokes_specialist",
33
- "description": "Agent runs `specialists run` or calls use_specialist/start_specialist instead of reading runner.ts directly"
34
- },
35
- {
36
- "name": "creates_bead_first",
37
- "description": "Agent creates a tracking bead before invoking the specialist"
38
- },
39
- {
40
- "name": "does_not_self_review",
41
- "description": "Agent does not read runner.ts and write their own code review"
42
- }
43
- ],
44
- "files": []
45
- },
46
- {
47
- "id": 3,
48
- "eval_name": "test-coverage",
49
- "prompt": "src/specialist/loader.ts handles YAML file discovery and caching. Looking at the tests in tests/unit/specialist/loader.test.ts, what's missing? Can you add the coverage gaps?",
50
- "expected_output": "Agent delegates to a specialist (e.g. test-runner) rather than reading the files and writing tests themselves. Should create a bead first.",
51
- "assertions": [
52
- {
53
- "name": "invokes_specialist",
54
- "description": "Agent runs `specialists run` or calls use_specialist/start_specialist instead of writing tests directly"
55
- },
56
- {
57
- "name": "creates_bead_first",
58
- "description": "Agent creates a tracking bead before invoking the specialist"
59
- },
60
- {
61
- "name": "does_not_self_write_tests",
62
- "description": "Agent does not read loader.ts and loader.test.ts and write new test cases themselves"
63
- }
64
- ],
65
- "files": []
66
- }
67
- ]
68
- }
@@ -1,89 +0,0 @@
1
- {
2
- "skill_name": "using-specialists-v3",
3
- "evals": [
4
- {
5
- "id": 1,
6
- "eval_name": "role-selection-implementation",
7
- "prompt": "Need add one small feature in src/specialist/loader.ts, but I do not know exact path yet. Which specialist should handle discovery and implementation?",
8
- "expected_output": "Agent checks live registry if needed, creates/updates complete bead contracts, selects explorer for discovery then executor for implementation, and does not self-investigate substantial work.",
9
- "assertions": [
10
- {
11
- "name": "selects_specialist_role",
12
- "description": "Agent names a specialist role appropriate for unknown implementation work"
13
- },
14
- {
15
- "name": "uses_live_registry",
16
- "description": "Agent references specialists list --full instead of a static catalog"
17
- },
18
- {
19
- "name": "does_not_self_investigate",
20
- "description": "Agent does not read source files and solve it directly"
21
- }
22
- ],
23
- "files": []
24
- },
25
- {
26
- "id": 2,
27
- "eval_name": "role-selection-debugging",
28
- "prompt": "A specialist chain started failing with a stack trace and inconsistent result state. Who should inspect it, and what command surface should I use to check available flags?",
29
- "expected_output": "Agent selects debugger for root-cause analysis, may use test-runner for check execution, and points to sp help/subcommand help before relying on flags.",
30
- "assertions": [
31
- {
32
- "name": "selects_debugging_role",
33
- "description": "Agent chooses debugger or test-runner for failure analysis"
34
- },
35
- {
36
- "name": "uses_help_surface",
37
- "description": "Agent references sp help or subcommand help for command details"
38
- },
39
- {
40
- "name": "does_not_guess_flags",
41
- "description": "Agent does not invent CLI flags from memory"
42
- }
43
- ],
44
- "files": []
45
- },
46
- {
47
- "id": 3,
48
- "eval_name": "role-selection-review",
49
- "prompt": "Executor finished a change and I need final verification before merge. Which specialist next, and what should it check?",
50
- "expected_output": "Agent selects reviewer with its own bead and --job <exec-job>, checks bead contract plus diff, and treats PASS as merge gate.",
51
- "assertions": [
52
- {
53
- "name": "selects_reviewer_role",
54
- "description": "Agent chooses reviewer for post-implementation verification"
55
- },
56
- {
57
- "name": "checks_contract_and_diff",
58
- "description": "Agent states reviewer checks bead contract and diff"
59
- },
60
- {
61
- "name": "does_not_replace_reviewer_with_self",
62
- "description": "Agent does not perform the review directly"
63
- }
64
- ],
65
- "files": []
66
- },
67
- {
68
- "id": 4,
69
- "eval_name": "merge-publication-flow",
70
- "prompt": "Reviewer passed an executor chain. What should the orchestrator do next to publish the specialist work?",
71
- "expected_output": "Agent uses sp merge <chain-root-bead> for standalone chains or sp epic merge <epic-id> for epic-owned work, avoids manual git merge, and closes the bead only after required gates are confirmed.",
72
- "assertions": [
73
- {
74
- "name": "uses_specialist_merge",
75
- "description": "Agent names sp merge or sp epic merge as the publication path"
76
- },
77
- {
78
- "name": "avoids_manual_git_merge",
79
- "description": "Agent explicitly avoids manual git merge for specialist-owned work"
80
- },
81
- {
82
- "name": "honors_reviewer_gate",
83
- "description": "Agent publishes only after reviewer PASS or explicit operator acceptance"
84
- }
85
- ],
86
- "files": []
87
- }
88
- ]
89
- }