opencode-swarm-plugin 0.44.0 → 0.44.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/bin/swarm.serve.test.ts +6 -4
- package/bin/swarm.ts +16 -10
- package/dist/compaction-prompt-scoring.js +139 -0
- package/dist/eval-capture.js +12811 -0
- package/dist/hive.d.ts.map +1 -1
- package/dist/index.js +7644 -62599
- package/dist/plugin.js +23766 -78721
- package/dist/swarm-orchestrate.d.ts.map +1 -1
- package/dist/swarm-prompts.d.ts.map +1 -1
- package/dist/swarm-review.d.ts.map +1 -1
- package/package.json +17 -5
- package/.changeset/swarm-insights-data-layer.md +0 -63
- package/.hive/analysis/eval-failure-analysis-2025-12-25.md +0 -331
- package/.hive/analysis/session-data-quality-audit.md +0 -320
- package/.hive/eval-results.json +0 -483
- package/.hive/issues.jsonl +0 -138
- package/.hive/memories.jsonl +0 -729
- package/.opencode/eval-history.jsonl +0 -327
- package/.turbo/turbo-build.log +0 -9
- package/CHANGELOG.md +0 -2286
- package/SCORER-ANALYSIS.md +0 -598
- package/docs/analysis/subagent-coordination-patterns.md +0 -902
- package/docs/analysis-socratic-planner-pattern.md +0 -504
- package/docs/planning/ADR-001-monorepo-structure.md +0 -171
- package/docs/planning/ADR-002-package-extraction.md +0 -393
- package/docs/planning/ADR-003-performance-improvements.md +0 -451
- package/docs/planning/ADR-004-message-queue-features.md +0 -187
- package/docs/planning/ADR-005-devtools-observability.md +0 -202
- package/docs/planning/ADR-007-swarm-enhancements-worktree-review.md +0 -168
- package/docs/planning/ADR-008-worker-handoff-protocol.md +0 -293
- package/docs/planning/ADR-009-oh-my-opencode-patterns.md +0 -353
- package/docs/planning/ADR-010-cass-inhousing.md +0 -1215
- package/docs/planning/ROADMAP.md +0 -368
- package/docs/semantic-memory-cli-syntax.md +0 -123
- package/docs/swarm-mail-architecture.md +0 -1147
- package/docs/testing/context-recovery-test.md +0 -470
- package/evals/ARCHITECTURE.md +0 -1189
- package/evals/README.md +0 -768
- package/evals/compaction-prompt.eval.ts +0 -149
- package/evals/compaction-resumption.eval.ts +0 -289
- package/evals/coordinator-behavior.eval.ts +0 -307
- package/evals/coordinator-session.eval.ts +0 -154
- package/evals/evalite.config.ts.bak +0 -15
- package/evals/example.eval.ts +0 -31
- package/evals/fixtures/cass-baseline.ts +0 -217
- package/evals/fixtures/compaction-cases.ts +0 -350
- package/evals/fixtures/compaction-prompt-cases.ts +0 -311
- package/evals/fixtures/coordinator-sessions.ts +0 -328
- package/evals/fixtures/decomposition-cases.ts +0 -105
- package/evals/lib/compaction-loader.test.ts +0 -248
- package/evals/lib/compaction-loader.ts +0 -320
- package/evals/lib/data-loader.evalite-test.ts +0 -289
- package/evals/lib/data-loader.test.ts +0 -345
- package/evals/lib/data-loader.ts +0 -281
- package/evals/lib/llm.ts +0 -115
- package/evals/scorers/compaction-prompt-scorers.ts +0 -145
- package/evals/scorers/compaction-scorers.ts +0 -305
- package/evals/scorers/coordinator-discipline.evalite-test.ts +0 -539
- package/evals/scorers/coordinator-discipline.ts +0 -325
- package/evals/scorers/index.test.ts +0 -146
- package/evals/scorers/index.ts +0 -328
- package/evals/scorers/outcome-scorers.evalite-test.ts +0 -27
- package/evals/scorers/outcome-scorers.ts +0 -349
- package/evals/swarm-decomposition.eval.ts +0 -121
- package/examples/commands/swarm.md +0 -745
- package/examples/plugin-wrapper-template.ts +0 -2515
- package/examples/skills/hive-workflow/SKILL.md +0 -212
- package/examples/skills/skill-creator/SKILL.md +0 -223
- package/examples/skills/swarm-coordination/SKILL.md +0 -292
- package/global-skills/cli-builder/SKILL.md +0 -344
- package/global-skills/cli-builder/references/advanced-patterns.md +0 -244
- package/global-skills/learning-systems/SKILL.md +0 -644
- package/global-skills/skill-creator/LICENSE.txt +0 -202
- package/global-skills/skill-creator/SKILL.md +0 -352
- package/global-skills/skill-creator/references/output-patterns.md +0 -82
- package/global-skills/skill-creator/references/workflows.md +0 -28
- package/global-skills/swarm-coordination/SKILL.md +0 -995
- package/global-skills/swarm-coordination/references/coordinator-patterns.md +0 -235
- package/global-skills/swarm-coordination/references/strategies.md +0 -138
- package/global-skills/system-design/SKILL.md +0 -213
- package/global-skills/testing-patterns/SKILL.md +0 -430
- package/global-skills/testing-patterns/references/dependency-breaking-catalog.md +0 -586
- package/opencode-swarm-plugin-0.30.7.tgz +0 -0
- package/opencode-swarm-plugin-0.31.0.tgz +0 -0
- package/scripts/cleanup-test-memories.ts +0 -346
- package/scripts/init-skill.ts +0 -222
- package/scripts/migrate-unknown-sessions.ts +0 -349
- package/scripts/validate-skill.ts +0 -204
- package/src/agent-mail.ts +0 -1724
- package/src/anti-patterns.test.ts +0 -1167
- package/src/anti-patterns.ts +0 -448
- package/src/compaction-capture.integration.test.ts +0 -257
- package/src/compaction-hook.test.ts +0 -838
- package/src/compaction-hook.ts +0 -1204
- package/src/compaction-observability.integration.test.ts +0 -139
- package/src/compaction-observability.test.ts +0 -187
- package/src/compaction-observability.ts +0 -324
- package/src/compaction-prompt-scorers.test.ts +0 -475
- package/src/compaction-prompt-scoring.ts +0 -300
- package/src/contributor-tools.test.ts +0 -133
- package/src/contributor-tools.ts +0 -201
- package/src/dashboard.test.ts +0 -611
- package/src/dashboard.ts +0 -462
- package/src/error-enrichment.test.ts +0 -403
- package/src/error-enrichment.ts +0 -219
- package/src/eval-capture.test.ts +0 -1015
- package/src/eval-capture.ts +0 -929
- package/src/eval-gates.test.ts +0 -306
- package/src/eval-gates.ts +0 -218
- package/src/eval-history.test.ts +0 -508
- package/src/eval-history.ts +0 -214
- package/src/eval-learning.test.ts +0 -378
- package/src/eval-learning.ts +0 -360
- package/src/eval-runner.test.ts +0 -223
- package/src/eval-runner.ts +0 -402
- package/src/export-tools.test.ts +0 -476
- package/src/export-tools.ts +0 -257
- package/src/hive.integration.test.ts +0 -2241
- package/src/hive.ts +0 -1628
- package/src/index.ts +0 -940
- package/src/learning.integration.test.ts +0 -1815
- package/src/learning.ts +0 -1079
- package/src/logger.test.ts +0 -189
- package/src/logger.ts +0 -135
- package/src/mandate-promotion.test.ts +0 -473
- package/src/mandate-promotion.ts +0 -239
- package/src/mandate-storage.integration.test.ts +0 -601
- package/src/mandate-storage.test.ts +0 -578
- package/src/mandate-storage.ts +0 -794
- package/src/mandates.ts +0 -540
- package/src/memory-tools.test.ts +0 -195
- package/src/memory-tools.ts +0 -344
- package/src/memory.integration.test.ts +0 -334
- package/src/memory.test.ts +0 -158
- package/src/memory.ts +0 -527
- package/src/model-selection.test.ts +0 -188
- package/src/model-selection.ts +0 -68
- package/src/observability-tools.test.ts +0 -359
- package/src/observability-tools.ts +0 -871
- package/src/output-guardrails.test.ts +0 -438
- package/src/output-guardrails.ts +0 -381
- package/src/pattern-maturity.test.ts +0 -1160
- package/src/pattern-maturity.ts +0 -525
- package/src/planning-guardrails.test.ts +0 -491
- package/src/planning-guardrails.ts +0 -438
- package/src/plugin.ts +0 -23
- package/src/post-compaction-tracker.test.ts +0 -251
- package/src/post-compaction-tracker.ts +0 -237
- package/src/query-tools.test.ts +0 -636
- package/src/query-tools.ts +0 -324
- package/src/rate-limiter.integration.test.ts +0 -466
- package/src/rate-limiter.ts +0 -774
- package/src/replay-tools.test.ts +0 -496
- package/src/replay-tools.ts +0 -240
- package/src/repo-crawl.integration.test.ts +0 -441
- package/src/repo-crawl.ts +0 -610
- package/src/schemas/cell-events.test.ts +0 -347
- package/src/schemas/cell-events.ts +0 -807
- package/src/schemas/cell.ts +0 -257
- package/src/schemas/evaluation.ts +0 -166
- package/src/schemas/index.test.ts +0 -199
- package/src/schemas/index.ts +0 -286
- package/src/schemas/mandate.ts +0 -232
- package/src/schemas/swarm-context.ts +0 -115
- package/src/schemas/task.ts +0 -161
- package/src/schemas/worker-handoff.test.ts +0 -302
- package/src/schemas/worker-handoff.ts +0 -131
- package/src/sessions/agent-discovery.test.ts +0 -137
- package/src/sessions/agent-discovery.ts +0 -112
- package/src/sessions/index.ts +0 -15
- package/src/skills.integration.test.ts +0 -1192
- package/src/skills.test.ts +0 -643
- package/src/skills.ts +0 -1549
- package/src/storage.integration.test.ts +0 -341
- package/src/storage.ts +0 -884
- package/src/structured.integration.test.ts +0 -817
- package/src/structured.test.ts +0 -1046
- package/src/structured.ts +0 -762
- package/src/swarm-decompose.test.ts +0 -188
- package/src/swarm-decompose.ts +0 -1302
- package/src/swarm-deferred.integration.test.ts +0 -157
- package/src/swarm-deferred.test.ts +0 -38
- package/src/swarm-insights.test.ts +0 -214
- package/src/swarm-insights.ts +0 -459
- package/src/swarm-mail.integration.test.ts +0 -970
- package/src/swarm-mail.ts +0 -739
- package/src/swarm-orchestrate.integration.test.ts +0 -282
- package/src/swarm-orchestrate.test.ts +0 -548
- package/src/swarm-orchestrate.ts +0 -3084
- package/src/swarm-prompts.test.ts +0 -1270
- package/src/swarm-prompts.ts +0 -2077
- package/src/swarm-research.integration.test.ts +0 -701
- package/src/swarm-research.test.ts +0 -698
- package/src/swarm-research.ts +0 -472
- package/src/swarm-review.integration.test.ts +0 -285
- package/src/swarm-review.test.ts +0 -879
- package/src/swarm-review.ts +0 -709
- package/src/swarm-strategies.ts +0 -407
- package/src/swarm-worktree.test.ts +0 -501
- package/src/swarm-worktree.ts +0 -575
- package/src/swarm.integration.test.ts +0 -2377
- package/src/swarm.ts +0 -38
- package/src/tool-adapter.integration.test.ts +0 -1221
- package/src/tool-availability.ts +0 -461
- package/tsconfig.json +0 -28
|
@@ -1,300 +0,0 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* Compaction Prompt Quality Scoring - Pure Functions
|
|
3
|
-
*
|
|
4
|
-
* Evaluates the quality of continuation prompts generated after context compaction.
|
|
5
|
-
* **Problem**: Post-compaction coordinators often "wake up" confused, forget their role,
|
|
6
|
-
* and start editing files instead of checking worker status.
|
|
7
|
-
*
|
|
8
|
-
* **Solution**: Score prompts on 5 dimensions that predict coordinator success:
|
|
9
|
-
*
|
|
10
|
-
* 1. **Epic ID Specificity (0.20)**: Real IDs (`mjkw...`) not placeholders (`<epic-id>`, `bd-xxx`)
|
|
11
|
-
* - Placeholders = coordinator can't check actual swarm status
|
|
12
|
-
*
|
|
13
|
-
* 2. **Actionability (0.20)**: Tool calls with real values (e.g., `swarm_status(epic_id='mjkw81rkq4c')`)
|
|
14
|
-
* - Generic instructions like "check status" don't work
|
|
15
|
-
*
|
|
16
|
-
* 3. **Coordinator Identity (0.25)**: ASCII header + strong mandates (NEVER/ALWAYS)
|
|
17
|
-
* - Visual + semantic cues reinforce role post-compaction
|
|
18
|
-
*
|
|
19
|
-
* 4. **Forbidden Tools Listed (0.15)**: Explicitly lists Edit, Write, swarmmail_reserve, git commit, bash
|
|
20
|
-
* - Naming forbidden tools reduces violations
|
|
21
|
-
*
|
|
22
|
-
* 5. **Post-Compaction Discipline (0.20)**: First suggested tool is swarm_status or inbox (not Edit)
|
|
23
|
-
* - First tool sets the pattern - "check status" vs "dive into code"
|
|
24
|
-
*
|
|
25
|
-
* **Pure functions**: These can be tested without evalite. The evalite wrappers are in
|
|
26
|
-
* `evals/scorers/compaction-prompt-scorers.ts`.
|
|
27
|
-
*
|
|
28
|
-
* **Data source**: Captured from `captureCompactionEvent()` with `compaction_type: "prompt_generated"`.
|
|
29
|
-
* The payload includes the FULL prompt content (not truncated) for scoring.
|
|
30
|
-
*
|
|
31
|
-
* **Integration**: `compaction-prompt.eval.ts` uses these scorers to track prompt quality over time.
|
|
32
|
-
* Progressive gates enforce quality: bootstrap → stabilization → production.
|
|
33
|
-
*
|
|
34
|
-
* @module compaction-prompt-scoring
|
|
35
|
-
*/
|
|
36
|
-
|
|
37
|
-
/**
 * Compaction prompt structure (from LLM generation).
 *
 * This is the single input type accepted by every scorer in this file.
 */
export interface CompactionPrompt {
  /** Prompt text; the scorers run their regex checks against this string. */
  content: string;
}
|
|
43
|
-
|
|
44
|
-
/**
 * Scorer result type.
 *
 * Returned by every `score*` function in this file.
 */
export interface ScorerResult {
  /** Numeric score; the scorers in this file return values from 0.0 to 1.0. */
  score: number;
  /** Human-readable explanation of why that score was given. */
  message: string;
}
|
|
51
|
-
|
|
52
|
-
// ====== Shared Regex Patterns ======

/**
 * Matches real epic/cell IDs (mjkw prefix + 7+ base36 chars).
 *
 * Declared without the `g`/`y` flags, so `.test()` carries no `lastIndex`
 * state from one call to the next.
 */
export const REAL_EPIC_ID = /mjkw[a-z0-9]{7,}/;

/**
 * Matches common placeholder patterns.
 *
 * The angle-bracket forms are case-insensitive; `bd-xxx` is matched
 * case-sensitively.
 */
export const PLACEHOLDERS = [
  /<epic-id>/i,
  /bd-xxx/,
  /<path>/i,
  /<project>/i,
];

/** Matches ASCII box-drawing characters (for headers): a run of 3 or more of ┌ ┐ └ ┘ ─ │. */
export const ASCII_BOX = /[┌┐└┘─│]{3,}/;

/** Matches strong mandate language: the upper-case words NEVER, ALWAYS, NON-NEGOTIABLE. */
export const STRONG_LANGUAGE = [/\bNEVER\b/, /\bALWAYS\b/, /\bNON-NEGOTIABLE\b/];
|
|
70
|
-
|
|
71
|
-
// ====== Pure Scoring Functions ======
|
|
72
|
-
|
|
73
|
-
/**
 * Score epic ID specificity.
 *
 * A prompt passes only when it carries a real epic ID and none of the known
 * placeholder tokens (`<epic-id>`, `bd-xxx`, `<path>`, `<project>`).
 * Placeholders are checked first, so a prompt containing both a placeholder
 * and a real ID still scores 0.0.
 *
 * @param prompt - Prompt whose `content` is inspected
 * @returns 1.0 if a real ID is present and no placeholder is, 0.0 otherwise
 */
export function scoreEpicIdSpecificity(prompt: CompactionPrompt): ScorerResult {
  const text = prompt.content;

  // The first placeholder (in PLACEHOLDERS order) is the one reported.
  const placeholder = PLACEHOLDERS.find((candidate) => candidate.test(text));
  if (placeholder !== undefined) {
    return { score: 0.0, message: `Found placeholder: ${placeholder.source}` };
  }

  return REAL_EPIC_ID.test(text)
    ? { score: 1.0, message: "Contains real epic ID" }
    : { score: 0.0, message: "No epic ID found" };
}
|
|
106
|
-
|
|
107
|
-
/**
 * Score actionability of tool calls.
 *
 * The prompt must contain a concrete, copy-pasteable tool call rather than a
 * generic instruction.
 * Good: swarm_status(epic_id='mjkw81rkq4c', project_key='/path')
 * Bad: "Check the status of workers"
 *
 * Accepted calls are `swarm_status(...)` with a quoted real `epic_id`, or a
 * bare `swarmmail_inbox()`. When neither is present the score is 0.0; the
 * message distinguishes a `swarm_status(` call that still carries
 * `<epic-id>`/`<path>` from no call at all.
 *
 * @param prompt - Prompt whose `content` is inspected
 * @returns 1.0 if actionable tool calls with real values, 0.0 otherwise
 */
export function scoreActionability(prompt: CompactionPrompt): ScorerResult {
  const text = prompt.content;

  const hasConcreteCall =
    /swarm_status\([^)]*epic_id\s*=\s*['"]mjkw[a-z0-9]{7,}['"]/.test(text) ||
    /swarmmail_inbox\(\)/.test(text);
  if (hasConcreteCall) {
    return {
      score: 1.0,
      message: "Contains actionable tool call with real values",
    };
  }

  // Both failure modes score 0.0; only the explanation differs.
  const templatedCalls = [
    /swarm_status\([^)]*<epic-id>/,
    /swarm_status\([^)]*<path>/,
  ];
  const message = templatedCalls.some((re) => re.test(text))
    ? "Tool call has placeholders"
    : "No actionable tool calls found";

  return { score: 0.0, message };
}
|
|
149
|
-
|
|
150
|
-
/**
 * Score coordinator identity reinforcement.
 *
 * Two cues are checked:
 * 1. A visual anchor: box-drawing characters together with the phrase
 *    "YOU ARE THE COORDINATOR" or "COORDINATOR MODE" (case-insensitive).
 * 2. Strong mandate wording (NEVER / ALWAYS / NON-NEGOTIABLE).
 *
 * Without the visual anchor the score is 0.0 regardless of wording.
 *
 * @param prompt - Prompt whose `content` is inspected
 * @returns 1.0 for ASCII header + strong mandates, 0.5 for header only, 0.0 otherwise
 */
export function scoreCoordinatorIdentity(
  prompt: CompactionPrompt,
): ScorerResult {
  const text = prompt.content;

  const hasBoxArt = ASCII_BOX.test(text);
  const namesCoordinator =
    /(YOU ARE THE COORDINATOR|COORDINATOR MODE)/i.test(text);
  if (!(hasBoxArt && namesCoordinator)) {
    return { score: 0.0, message: "No ASCII header found" };
  }

  for (const mandate of STRONG_LANGUAGE) {
    if (mandate.test(text)) {
      return { score: 1.0, message: "ASCII header + strong mandates present" };
    }
  }

  return { score: 0.5, message: "ASCII header present but weak language" };
}
|
|
194
|
-
|
|
195
|
-
/**
 * Score forbidden tools listing.
 *
 * Counts how many of the five forbidden tools the prompt names:
 * Edit, Write, swarmmail_reserve, git commit, bash.
 * `Edit`, `Write` and `bash` are matched as whole words, case-insensitively;
 * `swarmmail_reserve` and `git commit` are matched as literal substrings.
 *
 * @param prompt - Prompt whose `content` is inspected
 * @returns ratio of forbidden tools mentioned (0.0 to 1.0)
 */
export function scoreForbiddenToolsPresent(
  prompt: CompactionPrompt,
): ScorerResult {
  const required = [
    /\bEdit\b/i,
    /\bWrite\b/i,
    /swarmmail_reserve/,
    /git commit/,
    /\bbash\b/i,
  ];

  let listed = 0;
  for (const tool of required) {
    if (tool.test(prompt.content)) {
      listed += 1;
    }
  }

  if (listed === required.length) {
    return { score: 1.0, message: "All 5 forbidden tools listed" };
  }
  if (listed === 0) {
    return { score: 0.0, message: "No forbidden tools listed (0/5)" };
  }
  return {
    score: listed / required.length,
    message: `${listed}/5 forbidden tools listed`,
  };
}
|
|
247
|
-
|
|
248
|
-
/**
 * Score post-compaction discipline (first tool correctness).
 *
 * Validates that the FIRST suggested tool is correct.
 * Coordinators should check status FIRST, not edit files.
 *
 * Good first tools:
 * - swarm_status
 * - swarmmail_inbox
 *
 * Bad first tools:
 * - Edit
 * - Write
 * - Read (should check status first)
 *
 * Detection is two-tiered:
 * 1. The first call-shaped occurrence (`name(`) of a known tool wins. This
 *    keeps prose such as "NEVER edit files" or "Read the rules below" from
 *    being mistaken for the first suggested tool when an actual call follows.
 * 2. If the prompt contains no call-shaped occurrence at all, the first bare
 *    mention of a known tool name is used instead.
 *
 * Tool names are matched case-insensitively in both tiers.
 *
 * @param prompt - Prompt whose `content` is inspected
 * @returns 1.0 if first tool is swarm_status or inbox, 0.0 otherwise
 */
export function scorePostCompactionDiscipline(
  prompt: CompactionPrompt,
): ScorerResult {
  // Tier 1: function-like patterns only, i.e. a tool name directly followed by "(".
  const toolCallPattern =
    /\b(swarm_status|swarmmail_inbox|Edit|Write|Read)\(/i;
  // Tier 2: any whole-word mention, used when no call is present.
  const toolMentionPattern =
    /\b(swarm_status|swarmmail_inbox|Edit|Write|Read)\b/i;

  const match =
    prompt.content.match(toolCallPattern) ??
    prompt.content.match(toolMentionPattern);

  if (!match) {
    return {
      score: 0.0,
      message: "No tool calls found",
    };
  }

  // Group 1 always participates in both patterns; the fallback only keeps
  // the code sound under `noUncheckedIndexedAccess`.
  const toolName = match[1] ?? match[0];
  const firstTool = toolName.toLowerCase();

  if (firstTool === "swarm_status") {
    return {
      score: 1.0,
      message: "First tool is swarm_status (correct)",
    };
  }

  if (firstTool === "swarmmail_inbox") {
    return {
      score: 1.0,
      message: "First tool is inbox (correct)",
    };
  }

  return {
    score: 0.0,
    message: `First tool is ${toolName} (should be swarm_status or inbox)`,
  };
}
|
|
@@ -1,133 +0,0 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* Contributor Tools Integration Tests
|
|
3
|
-
*
|
|
4
|
-
* Tests for contributor_lookup tool that fetches GitHub profiles
|
|
5
|
-
* and generates changeset credits.
|
|
6
|
-
*/
|
|
7
|
-
|
|
8
|
-
import { afterAll, describe, expect, test } from "bun:test";
|
|
9
|
-
import { closeAllSwarmMail } from "swarm-mail";
|
|
10
|
-
import { contributorTools, resetContributorCache } from "./contributor-tools";
|
|
11
|
-
import { resetMemoryCache } from "./memory-tools";
|
|
12
|
-
|
|
13
|
-
/** Minimal stand-in for the tool execution context; these tests only ever supply `sessionID`. */
interface ToolContext {
  sessionID: string;
}
|
|
16
|
-
|
|
17
|
-
// Integration suite for the `contributor_lookup` tool.
// Every test below calls `execute` with a real GitHub login and asserts on the
// returned profile fields, so results depend on those accounts' live profile data.
// NOTE(review): presumably this requires network access and a working GitHub
// lookup on the machine running the tests — confirm before running in CI.
describe("contributor tools integration", () => {
  // Release shared state once the whole suite has finished.
  afterAll(async () => {
    resetContributorCache();
    resetMemoryCache();
    await closeAllSwarmMail();
  });

  // Smoke test: the tool is exported and exposes an `execute` function.
  test("contributor_lookup tool is registered", () => {
    expect(contributorTools).toHaveProperty("contributor_lookup");
    expect(typeof contributorTools.contributor_lookup.execute).toBe("function");
  });

  describe("contributor_lookup", () => {
    // Expects the looked-up profile to have both a display name and a Twitter handle.
    test("returns formatted credit with name + twitter", async () => {
      const tool = contributorTools.contributor_lookup;
      const result = await tool.execute(
        {
          login: "kentcdodds",
          issue: 42,
        },
        { sessionID: "test-session" } as ToolContext,
      );

      // The tool returns a JSON string, not an object.
      expect(typeof result).toBe("string");
      const parsed = JSON.parse(result);

      expect(parsed.login).toBe("kentcdodds");
      expect(parsed.name).toBeDefined();
      expect(parsed.twitter).toBeDefined();
      expect(parsed.credit_line).toContain("Thanks to");
      expect(parsed.credit_line).toContain("reporting #42");
      expect(parsed.credit_line).toContain("@kentcdodds");
      expect(parsed.credit_line).toContain("https://x.com/");
      expect(parsed.memory_stored).toBe(true);
    });

    test("handles missing twitter gracefully", async () => {
      const tool = contributorTools.contributor_lookup;

      // Use a user that likely has name but no twitter
      // (we'll test the format logic mainly)
      const result = await tool.execute(
        {
          login: "torvalds", // Linus Torvalds - has name, might not have twitter
          issue: 123,
        },
        { sessionID: "test-session" } as ToolContext,
      );

      const parsed = JSON.parse(result);

      expect(parsed.login).toBe("torvalds");
      expect(parsed.name).toBeDefined();
      expect(parsed.credit_line).toContain("Thanks to");
      expect(parsed.credit_line).toContain("reporting #123");
      // Should have GitHub mention if no Twitter.
      // The assertion is conditional: if the profile has a Twitter handle,
      // the name-only format is not exercised by this test at all.
      if (!parsed.twitter) {
        expect(parsed.credit_line).toContain("on GitHub");
      }
    });

    // Omitting `issue` must drop the "reporting #N" wording from the credit.
    test("works without issue number", async () => {
      const tool = contributorTools.contributor_lookup;
      const result = await tool.execute(
        {
          login: "kentcdodds",
        },
        { sessionID: "test-session" } as ToolContext,
      );

      const parsed = JSON.parse(result);

      expect(parsed.login).toBe("kentcdodds");
      expect(parsed.credit_line).toContain("Thanks to");
      // Should NOT contain "reporting #"
      expect(parsed.credit_line).not.toContain("reporting #");
    });

    test("stores contributor info in semantic-memory", async () => {
      const tool = contributorTools.contributor_lookup;
      const result = await tool.execute(
        {
          login: "gaearon", // Dan Abramov
          issue: 99,
        },
        { sessionID: "test-session" } as ToolContext,
      );

      const parsed = JSON.parse(result);

      // Just verify memory_stored flag - embedding search may be async
      expect(parsed.memory_stored).toBe(true);
    });

    // Shape check only: verifies the keys exist, not their values.
    test("returns all expected fields", async () => {
      const tool = contributorTools.contributor_lookup;
      const result = await tool.execute(
        {
          login: "kentcdodds",
        },
        { sessionID: "test-session" } as ToolContext,
      );

      const parsed = JSON.parse(result);

      // Required fields
      expect(parsed).toHaveProperty("login");
      expect(parsed).toHaveProperty("credit_line");
      expect(parsed).toHaveProperty("memory_stored");

      // Optional fields (may be null but should be present)
      expect(parsed).toHaveProperty("name");
      expect(parsed).toHaveProperty("twitter");
      expect(parsed).toHaveProperty("bio");
    });
  });
});
|
package/src/contributor-tools.ts
DELETED
|
@@ -1,201 +0,0 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* Contributor Tools - GitHub profile extraction for changeset credits
|
|
3
|
-
*
|
|
4
|
-
* Provides contributor_lookup tool for fetching GitHub profiles and
|
|
5
|
-
* generating formatted changeset credit lines. Automatically stores
|
|
6
|
-
* contributor info in semantic-memory for future reference.
|
|
7
|
-
*
|
|
8
|
-
* Based on patterns from gh-issue-triage skill.
|
|
9
|
-
*/
|
|
10
|
-
|
|
11
|
-
import { tool } from "@opencode-ai/plugin";
|
|
12
|
-
import { z } from "zod";
|
|
13
|
-
import { getMemoryAdapter } from "./memory-tools";
|
|
14
|
-
|
|
15
|
-
// ============================================================================
|
|
16
|
-
// Types
|
|
17
|
-
// ============================================================================
|
|
18
|
-
|
|
19
|
-
/**
 * Runtime schema for the subset of the GitHub user payload this module reads.
 *
 * Profile fields a user may leave unset (`name`, `twitter_username`, `blog`,
 * `bio`) are nullable; the two counters are optional.
 */
const GitHubUserSchema = z.object({
  login: z.string(),
  name: z.string().nullable(),
  twitter_username: z.string().nullable(),
  blog: z.string().nullable(),
  bio: z.string().nullable(),
  avatar_url: z.string(),
  html_url: z.string(),
  public_repos: z.number().optional(),
  followers: z.number().optional(),
});

/** Static type derived from `GitHubUserSchema`, so the two cannot drift apart. */
type GitHubUser = z.infer<typeof GitHubUserSchema>;
|
|
32
|
-
|
|
33
|
-
/** Payload that `contributor_lookup` serialises to JSON on success. */
interface ContributorResult {
  /** GitHub login as returned by the API. */
  login: string;
  /** Display name, or null when the profile has none. */
  name: string | null;
  /** Twitter/X handle (copied from `twitter_username`), or null. */
  twitter: string | null;
  /** Profile bio, or null. */
  bio: string | null;
  /** Ready-to-paste changeset credit sentence. */
  credit_line: string;
  /** Whether storing the contributor in semantic-memory succeeded. */
  memory_stored: boolean;
}
|
|
41
|
-
|
|
42
|
-
/** Execution context passed to the tool; `contributor_lookup` accepts it but does not read it. */
interface ToolContext {
  sessionID: string;
}
|
|
45
|
-
|
|
46
|
-
// ============================================================================
|
|
47
|
-
// Core Functions
|
|
48
|
-
// ============================================================================
|
|
49
|
-
|
|
50
|
-
/**
 * Fetch GitHub user profile via gh CLI.
 *
 * Runs `gh api users/<login>` through Bun's shell, reads the command output
 * as JSON and validates it against `GitHubUserSchema`.
 *
 * @param login - GitHub username to look up
 * @returns The validated profile
 * @throws When the payload does not satisfy `GitHubUserSchema`; presumably
 *   also when the `gh` command itself fails (Bun's `$` rejects on a non-zero
 *   exit by default — confirm).
 */
async function fetchGitHubUser(login: string): Promise<GitHubUser> {
  const payload: unknown = await Bun.$`gh api users/${login}`.json();
  const profile = GitHubUserSchema.parse(payload);
  return profile;
}
|
|
57
|
-
|
|
58
|
-
/**
 * Format changeset credit line based on available data.
 *
 * Who gets named, by what the profile offers:
 * - Name + Twitter: "Thanks to {Name} ([@twitter](https://x.com/twitter)) for …!"
 * - Twitter only:   "Thanks to [@twitter](https://x.com/twitter) for …!"
 * - Name only:      "Thanks to {Name} (@{login} on GitHub) for …!"
 * - Neither:        "Thanks to @{login} for …!"
 *
 * The trailing reason is "reporting #{issue}" when an issue number is given,
 * otherwise "the report". The check is a truthiness test, so `0` is treated
 * the same as a missing issue number.
 *
 * @param user - Validated GitHub profile
 * @param issueNumber - Issue to credit the contributor for, if any
 * @returns The complete credit sentence
 */
function formatCreditLine(user: GitHubUser, issueNumber?: number): string {
  const reason = issueNumber ? `reporting #${issueNumber}` : "the report";
  const { name, login, twitter_username: handle } = user;

  let who: string;
  if (handle) {
    // A Twitter link is always preferred; the display name is prepended when known.
    const link = `[@${handle}](https://x.com/${handle})`;
    who = name ? `${name} (${link})` : link;
  } else if (name) {
    who = `${name} (@${login} on GitHub)`;
  } else {
    who = `@${login}`;
  }

  return `Thanks to ${who} for ${reason}!`;
}
|
|
88
|
-
|
|
89
|
-
/**
 * Store contributor info in semantic-memory.
 *
 * Builds a one-line summary ("Contributor @login: Name (…Twitter). Filed
 * issue #N. Bio: '…'") plus a comma-separated tag string, and hands both to
 * the memory adapter. This is best-effort: any failure is logged to stderr
 * and reported through the return value instead of being thrown.
 *
 * @param user - Validated GitHub profile
 * @param issueNumber - Issue the contributor filed, if any
 * @returns true when the adapter stored the entry, false on any error
 */
async function storeContributorMemory(
  user: GitHubUser,
  issueNumber?: number,
): Promise<boolean> {
  try {
    const adapter = await getMemoryAdapter();

    // Empty values are left out of the tag list.
    const tagList: string[] = ["contributor"];
    if (user.login) {
      tagList.push(user.login);
    }
    if (issueNumber) {
      tagList.push(`issue-${issueNumber}`);
    }

    let information = `Contributor @${user.login}: ${user.name || user.login}`;
    if (user.twitter_username) {
      information += ` (@${user.twitter_username} on Twitter)`;
    }
    if (issueNumber) {
      information += `. Filed issue #${issueNumber}`;
    }
    if (user.bio) {
      information += `. Bio: '${user.bio}'`;
    }

    await adapter.store({ information, tags: tagList.join(",") });
    return true;
  } catch (error) {
    console.error("Failed to store contributor memory:", error);
    return false;
  }
}
|
|
126
|
-
|
|
127
|
-
// ============================================================================
|
|
128
|
-
// Cache Management
|
|
129
|
-
// ============================================================================
|
|
130
|
-
|
|
131
|
-
/**
 * Reset cache for testing.
 *
 * Intentionally a no-op: this module holds no cached state. The function
 * exists so test teardown can call it the same way as other tools' resets.
 */
export function resetContributorCache(): void {
  // Currently no cache, but keeping this for consistency with other tools
}
|
|
137
|
-
|
|
138
|
-
// ============================================================================
|
|
139
|
-
// Plugin Tools
|
|
140
|
-
// ============================================================================
|
|
141
|
-
|
|
142
|
-
/**
 * Look up GitHub contributor and generate changeset credit.
 *
 * Pipeline: fetch the profile, format the credit line, then store the
 * contributor in semantic-memory. The tool never throws: on success it
 * returns pretty-printed JSON with the profile fields, the credit line and
 * the `memory_stored` flag; on failure it returns `{ error, login }` as JSON.
 */
export const contributor_lookup = tool({
  description:
    "Fetch GitHub contributor profile and generate formatted changeset credit. Automatically stores contributor info in semantic-memory. Returns login, name, twitter, bio, and ready-to-paste credit_line.",
  args: {
    login: tool.schema.string().describe("GitHub username (required)"),
    issue: tool.schema
      .number()
      .optional()
      .describe("Issue number for context (optional)"),
  },
  async execute(
    args: { login: string; issue?: number },
    _ctx: ToolContext,
  ): Promise<string> {
    const { login, issue } = args;

    try {
      const user = await fetchGitHubUser(login);

      // Property order fixes both the evaluation order (format, then store)
      // and the key order of the emitted JSON.
      const result: ContributorResult = {
        login: user.login,
        name: user.name,
        twitter: user.twitter_username,
        bio: user.bio,
        credit_line: formatCreditLine(user, issue),
        memory_stored: await storeContributorMemory(user, issue),
      };

      return JSON.stringify(result, null, 2);
    } catch (error) {
      // Non-Error throwables get a generic message.
      const message =
        error instanceof Error
          ? error.message
          : "Unknown error fetching contributor";
      return JSON.stringify({ error: message, login });
    }
  },
});
|
|
194
|
-
|
|
195
|
-
// ============================================================================
|
|
196
|
-
// Exports
|
|
197
|
-
// ============================================================================
|
|
198
|
-
|
|
199
|
-
/** Tool registry exported by this module, keyed by tool name; `as const` keeps the keys literal and readonly. */
export const contributorTools = {
  contributor_lookup,
} as const;
|