goalbuddy 0.3.5 → 0.3.7
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +46 -12
- package/RELEASE-0.3.5.md +4 -4
- package/RELEASE-0.3.7.md +127 -0
- package/goalbuddy/SKILL.md +53 -23
- package/goalbuddy/agents/README.md +1 -1
- package/goalbuddy/agents/goal_judge.toml +8 -4
- package/goalbuddy/agents/goal_worker.toml +8 -5
- package/goalbuddy/scripts/check-goal-state.mjs +129 -0
- package/goalbuddy/scripts/render-task-prompt.mjs +83 -5
- package/{plugins/goalbuddy/skills/goalbuddy/extend → goalbuddy/surfaces}/local-goal-board/README.md +7 -9
- package/{plugins/goalbuddy/skills/goalbuddy/extend → goalbuddy/surfaces}/local-goal-board/examples/sample-goal/state.yaml +5 -5
- package/{plugins/goalbuddy/skills/goalbuddy/extend → goalbuddy/surfaces}/local-goal-board/examples/subgoal-parent/state.yaml +3 -3
- package/goalbuddy/{extend → surfaces}/local-goal-board/examples/subgoal-parent/subgoals/T004-board-view/state.yaml +3 -3
- package/goalbuddy/{extend → surfaces}/local-goal-board/scripts/lib/goal-board.mjs +250 -9
- package/goalbuddy/{extend → surfaces}/local-goal-board/scripts/local-goal-board.mjs +4 -4
- package/goalbuddy/{extend → surfaces}/local-goal-board/test/local-goal-board.test.mjs +67 -9
- package/goalbuddy/templates/agents.md +3 -2
- package/goalbuddy/templates/goal.md +27 -4
- package/goalbuddy/templates/state.yaml +13 -7
- package/internal/assets/goalbuddy-v0.3.7-release.png +0 -0
- package/internal/cli/goal-maker.mjs +112 -714
- package/package.json +4 -4
- package/plugins/goalbuddy/.claude-plugin/plugin.json +3 -4
- package/plugins/goalbuddy/.codex-plugin/plugin.json +5 -6
- package/plugins/goalbuddy/README.md +4 -3
- package/plugins/goalbuddy/agents/goal-judge.md +8 -4
- package/plugins/goalbuddy/agents/goal-worker.md +6 -4
- package/plugins/goalbuddy/skills/goalbuddy/SKILL.md +53 -23
- package/plugins/goalbuddy/skills/goalbuddy/agents/README.md +1 -1
- package/plugins/goalbuddy/skills/goalbuddy/agents/goal_judge.toml +8 -4
- package/plugins/goalbuddy/skills/goalbuddy/agents/goal_worker.toml +8 -5
- package/plugins/goalbuddy/skills/goalbuddy/scripts/check-goal-state.mjs +129 -0
- package/plugins/goalbuddy/skills/goalbuddy/scripts/render-task-prompt.mjs +83 -5
- package/{goalbuddy/extend → plugins/goalbuddy/skills/goalbuddy/surfaces}/local-goal-board/README.md +7 -9
- package/{goalbuddy/extend → plugins/goalbuddy/skills/goalbuddy/surfaces}/local-goal-board/examples/sample-goal/state.yaml +5 -5
- package/{goalbuddy/extend → plugins/goalbuddy/skills/goalbuddy/surfaces}/local-goal-board/examples/subgoal-parent/state.yaml +3 -3
- package/plugins/goalbuddy/skills/goalbuddy/{extend → surfaces}/local-goal-board/examples/subgoal-parent/subgoals/T004-board-view/state.yaml +3 -3
- package/plugins/goalbuddy/skills/goalbuddy/{extend → surfaces}/local-goal-board/scripts/lib/goal-board.mjs +250 -9
- package/plugins/goalbuddy/skills/goalbuddy/{extend → surfaces}/local-goal-board/scripts/local-goal-board.mjs +4 -4
- package/plugins/goalbuddy/skills/goalbuddy/{extend → surfaces}/local-goal-board/test/local-goal-board.test.mjs +67 -9
- package/plugins/goalbuddy/skills/goalbuddy/templates/agents.md +3 -2
- package/plugins/goalbuddy/skills/goalbuddy/templates/goal.md +27 -4
- package/plugins/goalbuddy/skills/goalbuddy/templates/state.yaml +13 -7
- package/examples/extend-catalog-workflow/goal.md +0 -53
- package/examples/extend-catalog-workflow/notes/T001-extension-model-map.md +0 -47
- package/examples/extend-catalog-workflow/notes/T002-architecture-decision.md +0 -48
- package/examples/extend-catalog-workflow/notes/T003-implementation-summary.md +0 -43
- package/examples/extend-catalog-workflow/notes/T004-root-extend-folder.md +0 -24
- package/examples/extend-catalog-workflow/notes/T005-layout-cleanup.md +0 -46
- package/examples/extend-catalog-workflow/notes/T006-catalog-location.md +0 -50
- package/examples/extend-catalog-workflow/notes/T999-completion-audit.md +0 -36
- package/examples/extend-catalog-workflow/state.yaml +0 -327
- package/examples/github-pr-workflow-extension/pr-handoff.md +0 -46
- package/goalbuddy/extend/github-projects/README.md +0 -105
- package/goalbuddy/extend/github-projects/examples/goal-board-sync/state.yaml +0 -63
- package/goalbuddy/extend/github-projects/extension.yaml +0 -43
- package/goalbuddy/extend/github-projects/scripts/lib/github-projects.mjs +0 -728
- package/goalbuddy/extend/github-projects/scripts/lib/goal-state.mjs +0 -362
- package/goalbuddy/extend/github-projects/scripts/sync-github-project.mjs +0 -193
- package/goalbuddy/extend/github-projects/test/github-projects.test.mjs +0 -267
- package/goalbuddy/extend/local-goal-board/extension.yaml +0 -39
- package/internal/assets/extend-release.png +0 -0
- package/internal/assets/extend-release.svg +0 -83
- package/plugins/goalbuddy/skills/goalbuddy/extend/github-projects/README.md +0 -105
- package/plugins/goalbuddy/skills/goalbuddy/extend/github-projects/examples/goal-board-sync/state.yaml +0 -63
- package/plugins/goalbuddy/skills/goalbuddy/extend/github-projects/extension.yaml +0 -43
- package/plugins/goalbuddy/skills/goalbuddy/extend/github-projects/scripts/lib/github-projects.mjs +0 -728
- package/plugins/goalbuddy/skills/goalbuddy/extend/github-projects/scripts/lib/goal-state.mjs +0 -362
- package/plugins/goalbuddy/skills/goalbuddy/extend/github-projects/scripts/sync-github-project.mjs +0 -193
- package/plugins/goalbuddy/skills/goalbuddy/extend/github-projects/test/github-projects.test.mjs +0 -267
- package/plugins/goalbuddy/skills/goalbuddy/extend/local-goal-board/extension.yaml +0 -39
- /package/goalbuddy/{extend → surfaces}/local-goal-board/assets/goalbuddy-mark.png +0 -0
- /package/goalbuddy/{extend → surfaces}/local-goal-board/examples/sample-goal/notes/T001-scout.md +0 -0
- /package/goalbuddy/{extend → surfaces}/local-goal-board/examples/subgoal-parent/goal.md +0 -0
- /package/goalbuddy/{extend → surfaces}/local-goal-board/examples/subgoal-parent/notes/.gitkeep +0 -0
- /package/goalbuddy/{extend → surfaces}/local-goal-board/examples/subgoal-parent/subgoals/T004-board-view/goal.md +0 -0
- /package/goalbuddy/{extend → surfaces}/local-goal-board/examples/subgoal-parent/subgoals/T004-board-view/notes/.gitkeep +0 -0
- /package/plugins/goalbuddy/skills/goalbuddy/{extend → surfaces}/local-goal-board/assets/goalbuddy-mark.png +0 -0
- /package/plugins/goalbuddy/skills/goalbuddy/{extend → surfaces}/local-goal-board/examples/sample-goal/notes/T001-scout.md +0 -0
- /package/plugins/goalbuddy/skills/goalbuddy/{extend → surfaces}/local-goal-board/examples/subgoal-parent/goal.md +0 -0
- /package/plugins/goalbuddy/skills/goalbuddy/{extend → surfaces}/local-goal-board/examples/subgoal-parent/notes/.gitkeep +0 -0
- /package/plugins/goalbuddy/skills/goalbuddy/{extend → surfaces}/local-goal-board/examples/subgoal-parent/subgoals/T004-board-view/goal.md +0 -0
- /package/plugins/goalbuddy/skills/goalbuddy/{extend → surfaces}/local-goal-board/examples/subgoal-parent/subgoals/T004-board-view/notes/.gitkeep +0 -0
package/package.json
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "goalbuddy",
|
|
3
|
-
"version": "0.3.5",
|
|
4
|
-
"description": "A /goal operating
|
|
3
|
+
"version": "0.3.7",
|
|
4
|
+
"description": "A /goal operating loop for Codex and Claude Code: goal oracles, local boards, receipts, and verification.",
|
|
5
5
|
"type": "module",
|
|
6
6
|
"bin": {
|
|
7
7
|
"goalbuddy": "internal/cli/goal-maker.mjs",
|
|
@@ -11,6 +11,7 @@
|
|
|
11
11
|
".agents/plugins/marketplace.json",
|
|
12
12
|
"README.md",
|
|
13
13
|
"RELEASE-0.3.5.md",
|
|
14
|
+
"RELEASE-0.3.7.md",
|
|
14
15
|
"CONTRIBUTING.md",
|
|
15
16
|
"examples",
|
|
16
17
|
"plugins/goalbuddy",
|
|
@@ -19,7 +20,7 @@
|
|
|
19
20
|
"goalbuddy/SKILL.md",
|
|
20
21
|
"goalbuddy/agents",
|
|
21
22
|
"goalbuddy/scripts",
|
|
22
|
-
"goalbuddy/extend",
|
|
23
|
+
"goalbuddy/surfaces",
|
|
23
24
|
"goalbuddy/templates"
|
|
24
25
|
],
|
|
25
26
|
"scripts": {
|
|
@@ -51,7 +52,6 @@
|
|
|
51
52
|
"cli",
|
|
52
53
|
"workflow",
|
|
53
54
|
"agent",
|
|
54
|
-
"extensions",
|
|
55
55
|
"verification"
|
|
56
56
|
],
|
|
57
57
|
"author": "tolibear",
|
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "goalbuddy",
|
|
3
|
-
"version": "0.3.
|
|
4
|
-
"description": "Turn broad Claude Code work into
|
|
3
|
+
"version": "0.3.7",
|
|
4
|
+
"description": "Turn broad Codex and Claude Code work into pressured /goal runs with oracles, local boards, receipts, and verification.",
|
|
5
5
|
"author": {
|
|
6
6
|
"name": "tolibear",
|
|
7
7
|
"email": "support@tolibear.com",
|
|
@@ -18,7 +18,6 @@
|
|
|
18
18
|
"goal",
|
|
19
19
|
"task-board",
|
|
20
20
|
"receipts",
|
|
21
|
-
"workflow",
|
|
22
|
-
"extensions"
|
|
21
|
+
"workflow"
|
|
23
22
|
]
|
|
24
23
|
}
|
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "goalbuddy",
|
|
3
|
-
"version": "0.3.
|
|
4
|
-
"description": "Turn broad Codex and Claude Code work into
|
|
3
|
+
"version": "0.3.7",
|
|
4
|
+
"description": "Turn broad Codex and Claude Code work into pressured /goal runs with oracles, local boards, receipts, and verification.",
|
|
5
5
|
"author": {
|
|
6
6
|
"name": "tolibear",
|
|
7
7
|
"email": "support@tolibear.com",
|
|
@@ -18,14 +18,13 @@
|
|
|
18
18
|
"goal",
|
|
19
19
|
"task-board",
|
|
20
20
|
"receipts",
|
|
21
|
-
"workflow",
|
|
22
|
-
"extensions"
|
|
21
|
+
"workflow"
|
|
23
22
|
],
|
|
24
23
|
"skills": "./skills/",
|
|
25
24
|
"interface": {
|
|
26
25
|
"displayName": "GoalBuddy",
|
|
27
|
-
"shortDescription": "
|
|
28
|
-
"longDescription": "GoalBuddy packages a structured goal workflow for broad, long-running, or ambiguous engineering work in Codex or Claude Code. It creates durable goal charters, task boards, optional depth-1 subgoals,
|
|
26
|
+
"shortDescription": "Goal oracles, local boards, receipts, and proof loops for /goal",
|
|
27
|
+
"longDescription": "GoalBuddy packages a structured goal workflow for broad, long-running, or ambiguous engineering work in Codex or Claude Code. It creates durable goal charters, goal oracles, task boards, optional depth-1 subgoals, local board surfaces, parallel-agent-ready handoffs, receipts, verification gates, and compatibility guidance for teams moving from goal-maker.",
|
|
29
28
|
"developerName": "tolibear",
|
|
30
29
|
"category": "Coding",
|
|
31
30
|
"capabilities": [
|
|
@@ -1,8 +1,8 @@
|
|
|
1
1
|
# GoalBuddy Plugin (Codex + Claude Code)
|
|
2
2
|
|
|
3
|
-
GoalBuddy packages the canonical `goal-prep` skill as a plugin so teams can install the reusable workflow in **Codex** and **Claude Code**, while keeping the npm CLI for local setup, doctor checks, and
|
|
3
|
+
GoalBuddy packages the canonical `goal-prep` skill as a plugin so teams can install the reusable workflow in **Codex** and **Claude Code**, while keeping the npm CLI for local setup, doctor checks, and the built-in local board surface.
|
|
4
4
|
|
|
5
|
-
Version 0.3.
|
|
5
|
+
Version 0.3.7 is the Goalmaxxed release: goal oracles, largest safe useful slices, built-in local boards, receipt pressure, final-proof gates, and a smaller core without the extension catalog.
|
|
6
6
|
|
|
7
7
|
## What It Contains
|
|
8
8
|
|
|
@@ -56,8 +56,9 @@ goalbuddy --target claude # installs for Claude Code only
|
|
|
56
56
|
For local CLI testing before npm publish:
|
|
57
57
|
|
|
58
58
|
```bash
|
|
59
|
-
node internal/cli/goal-maker.mjs
|
|
59
|
+
node internal/cli/goal-maker.mjs
|
|
60
60
|
node internal/cli/goal-maker.mjs doctor
|
|
61
|
+
node internal/cli/goal-maker.mjs board docs/goals/<slug> --once --json
|
|
61
62
|
```
|
|
62
63
|
|
|
63
64
|
## Release Notes
|
|
@@ -13,11 +13,16 @@ Hard contract:
|
|
|
13
13
|
- Read only. Do not edit, stage, install, or implement.
|
|
14
14
|
- Read state receipts before raw files. Then read only the inputs named in the Judge task.
|
|
15
15
|
- Be skeptical of progress. Lots of files, docs, or tests are not completion.
|
|
16
|
-
- A safe Worker
|
|
16
|
+
- A safe Worker package must include objective, allowed_files, verify commands, and stop_if, and should cover the largest reversible local work package at that boundary.
|
|
17
|
+
- Choose the largest safe useful slice: bounded, explicit, verified, reversible, and outcome-moving. Safety does not mean tiny.
|
|
18
|
+
- Judge a whole useful slice, not one helper at a time.
|
|
19
|
+
- Detect micro-slice loops. Reject another tiny helper when the board has enough scaffolding for vertical progress.
|
|
20
|
+
- Select PM reorientation when recent receipts are safe-looking but outcome-light.
|
|
21
|
+
- Prefer milestone reviews over helper reviews.
|
|
17
22
|
- A safe child board must be depth 1, inside `subgoals/`, non-recursive, and linked from exactly one parent task.
|
|
18
23
|
- Parallel Worker work is safe only with provably disjoint `allowed_files`. Separate boards alone are not proof.
|
|
19
24
|
- Reject completion unless the full original outcome is mapped to receipts and current verification.
|
|
20
|
-
- Do not choose the active task or mutate state.
|
|
25
|
+
- Do not generate routine next tasks, choose the active task, or mutate state. The PM owns continuation after your review.
|
|
21
26
|
|
|
22
27
|
Return exactly one parseable JSON receipt object:
|
|
23
28
|
|
|
@@ -27,11 +32,10 @@ Return exactly one parseable JSON receipt object:
|
|
|
27
32
|
"result": "done | blocked",
|
|
28
33
|
"task_id": "<T###>",
|
|
29
34
|
"board_path": "<path to state.yaml>",
|
|
30
|
-
"decision": "
|
|
35
|
+
"decision": "approved | rejected | approve_subgoal | reject_subgoal | not_complete | complete",
|
|
31
36
|
"full_outcome_complete": false,
|
|
32
37
|
"rationale": "<=120 words>",
|
|
33
38
|
"evidence": [],
|
|
34
|
-
"next_allowed_task": null,
|
|
35
39
|
"subgoal_contract": null,
|
|
36
40
|
"parallel_safety": null,
|
|
37
41
|
"blocked_tasks": [],
|
|
@@ -1,12 +1,12 @@
|
|
|
1
1
|
---
|
|
2
2
|
name: goal-worker
|
|
3
|
-
description: GoalBuddy Worker. Bounded writer for
|
|
3
|
+
description: GoalBuddy Worker. Bounded writer for one coherent reversible Worker work package. Edits only allowed_files, runs verify, returns receipt.
|
|
4
4
|
tools: Read, Edit, Write, Grep, Glob, Bash
|
|
5
5
|
---
|
|
6
6
|
|
|
7
7
|
You are Worker for GoalBuddy.
|
|
8
8
|
|
|
9
|
-
Default effort:
|
|
9
|
+
Default effort: medium for implementation tasks. Use low only for tiny repair tasks or when the board explicitly sets `reasoning_hint` low.
|
|
10
10
|
|
|
11
11
|
Hard contract:
|
|
12
12
|
|
|
@@ -18,7 +18,10 @@ Hard contract:
|
|
|
18
18
|
- Do not create child sub-goals unless the task explicitly allows it.
|
|
19
19
|
- Run the verify commands exactly as listed after edits. You may make at most two fix attempts.
|
|
20
20
|
- Stop immediately if required evidence is missing, a file outside `allowed_files` is needed, source/product/tests conflict, or verification still fails after two attempts.
|
|
21
|
-
-
|
|
21
|
+
- Do not request a Judge just because the package is done. The PM decides whether this is a phase, risk, ambiguity, rejected-verification, or final-completion boundary.
|
|
22
|
+
- Keep the diff coherent, bounded, and reversible. Do not shrink the assigned work below the largest safe useful slice.
|
|
23
|
+
- Complete the whole assigned slice. Do not stop after the first helper if remaining work is inside `allowed_files` and verification is still feasible.
|
|
24
|
+
- If the task asks for a vertical slice, complete the vertical slice.
|
|
22
25
|
|
|
23
26
|
Parallel safety:
|
|
24
27
|
|
|
@@ -39,7 +42,6 @@ Return exactly one parseable JSON receipt object:
|
|
|
39
42
|
"commands": [],
|
|
40
43
|
"summary": "<=120 words>",
|
|
41
44
|
"remaining_blockers": [],
|
|
42
|
-
"needs_judge": false,
|
|
43
45
|
"verification_attempts": 1,
|
|
44
46
|
"stopped_because": null
|
|
45
47
|
}
|
|
@@ -12,9 +12,17 @@ GoalBuddy is for autonomous, long-running Codex or Claude Code work where the PM
|
|
|
12
12
|
The loop is:
|
|
13
13
|
|
|
14
14
|
```text
|
|
15
|
-
raw user intent -> intake compiler ->
|
|
15
|
+
raw user intent -> intake compiler -> goal oracle -> local work surface -> one active task -> receipt -> proof loop -> repeat
|
|
16
16
|
```
|
|
17
17
|
|
|
18
|
+
GoalBuddy's core invariant is:
|
|
19
|
+
|
|
20
|
+
```text
|
|
21
|
+
Intent -> Oracle -> Surface -> Loop -> Proof
|
|
22
|
+
```
|
|
23
|
+
|
|
24
|
+
No oracle, no serious goal. A goal oracle is the observable signal that tells the PM whether the original owner outcome is actually true yet. It may be a test suite, browser walkthrough, demo transcript, generated artifact, benchmark, source-backed answer, release check, or final human decision. Weak proof creates weak goals, so record the oracle before shaping tasks and keep testing against it until final completion.
|
|
25
|
+
|
|
18
26
|
## Invocation Boundary
|
|
19
27
|
|
|
20
28
|
There are two different modes:
|
|
@@ -31,7 +39,7 @@ Allowed `$goal-prep` actions:
|
|
|
31
39
|
- run the bundled GoalBuddy update checker and mention a newer version if one is available;
|
|
32
40
|
- ask diagnostic intake questions and wait when required;
|
|
33
41
|
- create or repair only `docs/goals/<slug>/goal.md`, `docs/goals/<slug>/state.yaml`, `docs/goals/<slug>/notes/`, and the generated `.goalbuddy-board/` visual board artifact;
|
|
34
|
-
- create and open the
|
|
42
|
+
- create and open the built-in local GoalBuddy board surface for the goal unless the user opts out;
|
|
35
43
|
- optionally run the GoalBuddy board checker against that `state.yaml`;
|
|
36
44
|
- verify GoalBuddy agent availability, if this can be done without touching implementation work, and record `installed`, `bundled_not_installed`, `missing`, or `unknown` truthfully;
|
|
37
45
|
- print exactly `/goal Follow docs/goals/<slug>/goal.md.`;
|
|
@@ -69,25 +77,25 @@ Extract:
|
|
|
69
77
|
- authority: `requested | approved | inferred | needs_approval | blocked`;
|
|
70
78
|
- proof type: `test | demo | artifact | metric | review | source_backed_answer | decision`;
|
|
71
79
|
- completion proof: the observable signal for full outcome completion;
|
|
80
|
+
- goal oracle: the live check, walkthrough, artifact, metric, or decision that will keep pressure on the goal and prevent early completion;
|
|
72
81
|
- likely misfire: how `/goal` could succeed at the wrong thing;
|
|
73
82
|
- blind spots: important risks, choices, or success dimensions the user may not have named yet;
|
|
74
83
|
- existing plan facts: user-provided steps, files, constraints, or sequencing that must be preserved but still validated.
|
|
75
84
|
|
|
76
|
-
|
|
85
|
+
Use the local GoalBuddy board as the default work surface for broad GoalBuddy runs. Ask only when the user has not already implied they want the default local surface, the goal is unusually quick/private, or board setup would materially distract from the requested prep:
|
|
77
86
|
|
|
78
87
|
```text
|
|
79
|
-
Do you want
|
|
88
|
+
Do you want the local GoalBuddy board for this goal?
|
|
80
89
|
```
|
|
81
90
|
|
|
82
91
|
Recommended options:
|
|
83
92
|
|
|
84
93
|
1. Local live board (Recommended) - starts immediately, requires no credentials, and lets the user watch tasks populate inside Codex or Claude Code.
|
|
85
|
-
2.
|
|
86
|
-
3. No visual board - best for quick or private goals where the file board is enough.
|
|
94
|
+
2. No visual board - best for quick or private goals where the file board is enough.
|
|
87
95
|
|
|
88
|
-
If the user chooses the local live board, create the goal directory, `notes/`, and an initial minimal `state.yaml` as soon as the slug is known, then run `npx goalbuddy board docs/goals/<slug>` and open the printed local URL in the AI coding agent's in-app browser (the Codex in-app Browser, the Claude Code preview, or the user's regular browser). The default local hub is `http://goalbuddy.localhost:41737/`, and board URLs normally look like `http://goalbuddy.localhost:41737/<slug>/`. In short: start the local board before filling the task list so the board pops up right away and cards populate live as `state.yaml` changes. Include the printed board URL in the final prep response as
|
|
96
|
+
If the user chooses the local live board, create the goal directory, `notes/`, and an initial minimal `state.yaml` as soon as the slug is known, then run `npx goalbuddy board docs/goals/<slug>` and open the printed local URL in the AI coding agent's in-app browser (the Codex in-app Browser, the Claude Code preview, or the user's regular browser). The default local hub is `http://goalbuddy.localhost:41737/`, and board URLs normally look like `http://goalbuddy.localhost:41737/<slug>/`. In short: start the local board before filling the task list so the board pops up right away and cards populate live as `state.yaml` changes. Include the printed board URL in the final prep response as an actual clickable Markdown link, for example `[Open GoalBuddy board](http://goalbuddy.localhost:41737/<slug>/)`. Do not put the board URL only in a code block, quote, HTML comment, or prose that the UI cannot click.
|
|
89
97
|
|
|
90
|
-
If the user
|
|
98
|
+
If the user wants an external board, GitHub sync, Slack digest, Linear handoff, or any other custom integration, do not install a GoalBuddy catalog item. Treat it as normal implementation work: create a concrete task that designs and verifies that integration inside the target repo or asks the operator for the required credentials and scope.
|
|
91
99
|
|
|
92
100
|
Ask before board creation when the request is vague, strategic, improvement-oriented, or open-ended and the user has not explicitly said to use defaults. Ask one guided question at a time with 2-3 options and a recommended default, then wait. Continue the diagnostic intake until the user's answers are sufficient to choose the board shape. Do not create or repair `docs/goals/<slug>/` until the diagnostic intake is complete or the user explicitly accepts defaults.
|
|
93
101
|
|
|
@@ -134,7 +142,7 @@ Stop after each question. Do not create files, repair an existing board, run che
|
|
|
134
142
|
|
|
135
143
|
Minimum diagnostic ladder for vague, strategic, or improvement-oriented goals:
|
|
136
144
|
|
|
137
|
-
1.
|
|
145
|
+
1. Goal surface: use the local live board by default, or ask "Do you want the local GoalBuddy board for this goal?" when board handling is unresolved.
|
|
138
146
|
2. Intent target: what kind of improvement or outcome matters most?
|
|
139
147
|
3. Success proof: what evidence would convince the user this worked?
|
|
140
148
|
4. Scope and non-goals: what should remain untouched or explicitly out of scope?
|
|
@@ -173,7 +181,7 @@ Do:
|
|
|
173
181
|
- classify the goal as `specific`, `open_ended`, `existing_plan`, `recovery`, or `audit`;
|
|
174
182
|
- create or repair `docs/goals/<slug>/`;
|
|
175
183
|
- create `goal.md`, `state.yaml`, and `notes/`;
|
|
176
|
-
-
|
|
184
|
+
- start the local board immediately and open it in the AI coding agent's in-app browser (Codex in-app Browser, Claude Code preview, or the user's regular browser) before filling the task list, unless the user opts out;
|
|
177
185
|
- seed a role-tagged task board that matches the input shape;
|
|
178
186
|
- make the first active task safe;
|
|
179
187
|
- verify Scout, Worker, and Judge agent availability or record an explicit truthful state;
|
|
@@ -203,22 +211,38 @@ Planning, Scout findings, Judge decisions, and a queued Worker task are not term
|
|
|
203
211
|
For execution goals, the default run is continuous:
|
|
204
212
|
|
|
205
213
|
```text
|
|
206
|
-
Discover enough evidence, choose
|
|
214
|
+
Discover enough evidence, choose the largest reversible local work package, implement it, verify it, review only at risk or phase boundaries, then immediately choose and execute the next work package until the full original outcome is complete.
|
|
207
215
|
```
|
|
208
216
|
|
|
209
217
|
If the first `/goal` run reaches a Judge decision that names a safe Worker task with `allowed_files`, `verify`, and `stop_if`, the PM should activate that Worker and continue in the same run unless a stop condition applies.
|
|
210
218
|
|
|
211
|
-
After a verified Worker
|
|
219
|
+
After a verified Worker package, do not mark the thread goal complete merely because that package passed. For broad automation or product goals, continue by reopening or advancing the board to the next safe Worker package until the full owner outcome is complete.
|
|
212
220
|
|
|
213
221
|
Missing owner input, credentials, production access, destructive-operation permission, or policy decisions are blockers for specific tasks, not stopping conditions for the whole goal. When a slice hits one of those blockers, mark that exact task blocked with a receipt, create a safe follow-up or workaround task, and keep doing local, non-destructive work that advances the full outcome.
|
|
214
222
|
|
|
223
|
+
## Slice Sizing Policy
|
|
224
|
+
|
|
225
|
+
A good task is the largest safe useful slice.
|
|
226
|
+
|
|
227
|
+
Small is not the goal. Useful is the goal.
|
|
228
|
+
|
|
229
|
+
Safe does not mean small. Safe means bounded, explicit, verified, and reversible.
|
|
230
|
+
|
|
231
|
+
A good Worker task usually produces a working screen, a working API path, a working data pipeline step, a working backend vertical slice, a real bug fix, or a milestone review. A bad Worker task is one more tiny helper, projection function, contract file, read-only proof, or doc note unless that tiny task is truly blocking progress.
|
|
232
|
+
|
|
233
|
+
Judge picks the largest safe useful next slice. Worker completes the whole assigned slice. Judge reviews the whole slice.
|
|
234
|
+
|
|
235
|
+
After two tiny tasks in a row, PM or Judge should reorient the board. If a demo milestone is complete, the next task should move toward the next real milestone.
|
|
236
|
+
|
|
237
|
+
Tiny tasks are allowed when the failure is isolated, the risk is high, the scope is unknown, or the tiny task unlocks a larger slice. Tiny tasks are bad when they keep happening, do not change behavior, only add wrappers/contracts/proof files, or avoid the real milestone.
|
|
238
|
+
|
|
215
239
|
## When To Use
|
|
216
240
|
|
|
217
241
|
Use this skill for goals that are broad, multi-hour, ambiguous, high-risk, already planned, already stale, already red, or likely to need Scout/Judge/Worker delegation.
|
|
218
242
|
|
|
219
243
|
For a one-change task, do not create a GoalBuddy board.
|
|
220
244
|
|
|
221
|
-
Scout and Judge tasks may identify optional
|
|
245
|
+
Scout and Judge tasks may identify optional publishing, reporting, integration, plugin, or channel opportunities as improvement candidates. Treat those as normal board tasks with concrete implementation plans. `state.yaml` remains board truth.
|
|
222
246
|
|
|
223
247
|
## The Four Primitives
|
|
224
248
|
|
|
@@ -258,6 +282,7 @@ The charter answers:
|
|
|
258
282
|
What did the user originally ask for?
|
|
259
283
|
What are we trying to improve?
|
|
260
284
|
What input shape did the intake identify?
|
|
285
|
+
What is the goal oracle?
|
|
261
286
|
What constraints are non-negotiable?
|
|
262
287
|
Is this goal specific, open-ended, existing-plan, recovery, or audit?
|
|
263
288
|
What likely misfire must the PM avoid?
|
|
@@ -267,7 +292,7 @@ What counts as enough for the current tranche?
|
|
|
267
292
|
Avoid forever goals. A broad goal should define an execution tranche, for example:
|
|
268
293
|
|
|
269
294
|
```text
|
|
270
|
-
Discover the highest-leverage local improvements, complete successive safe verified
|
|
295
|
+
Discover the highest-leverage local improvements, complete successive safe verified work packages, review only at risk or phase boundaries, and keep advancing until the full outcome is complete.
|
|
271
296
|
```
|
|
272
297
|
|
|
273
298
|
## Board
|
|
@@ -390,8 +415,9 @@ Judge receipt:
|
|
|
390
415
|
```yaml
|
|
391
416
|
receipt:
|
|
392
417
|
result: done
|
|
393
|
-
decision: "
|
|
394
|
-
|
|
418
|
+
decision: "approved"
|
|
419
|
+
full_outcome_complete: false
|
|
420
|
+
rationale: "Router coverage is verified; continue with the next PM-selected work package."
|
|
395
421
|
blocked_tasks:
|
|
396
422
|
- T005
|
|
397
423
|
```
|
|
@@ -440,7 +466,7 @@ Blocked tasks do not necessarily block the goal. The PM should keep doing safe l
|
|
|
440
466
|
|
|
441
467
|
- create a Scout task to improve evidence;
|
|
442
468
|
- create a Judge task to resolve ambiguity;
|
|
443
|
-
- create a Worker task for
|
|
469
|
+
- create a Worker task for the largest reversible local work package that can proceed;
|
|
444
470
|
- write or update a note for handoff;
|
|
445
471
|
- update receipts and verification freshness.
|
|
446
472
|
|
|
@@ -471,9 +497,11 @@ After a task completes, immediately write its receipt and select the next active
|
|
|
471
497
|
|
|
472
498
|
- a final audit proves the full original owner outcome is complete.
|
|
473
499
|
|
|
474
|
-
Do not stop at "ready for implementation" when a safe Worker task exists. Activate the Worker, execute it, verify it, and
|
|
500
|
+
Do not stop at "ready for implementation" when a safe Worker task exists. Activate the Worker, execute it, verify it, and keep going.
|
|
501
|
+
|
|
502
|
+
Do not stop after one verified work package when the broader owner outcome still has safe local follow-up work. Advance the board to the next work package unless a risk boundary or final audit is due.
|
|
475
503
|
|
|
476
|
-
Do not
|
|
504
|
+
Do not create a Judge task after every Worker by default. Use Judge only for phase boundaries, high-risk changes, unclear scope, rejected verification, or final completion. Repeated same-shape work belongs in one Worker package.
|
|
477
505
|
|
|
478
506
|
Do not stop because the current slice needs owner input, credentials, production access, destructive operations, or policy decisions. Mark that slice blocked, spawn or activate the smallest safe local task that can proceed around the blocker, and continue.
|
|
479
507
|
|
|
@@ -507,8 +535,8 @@ Non-`installed` states are warnings, not false failures, because the main `/goal
|
|
|
507
535
|
| Agent | Thinking level | Write access | Use for |
|
|
508
536
|
|---|---:|---:|---|
|
|
509
537
|
| Scout | low | no | targeted source/spec/repo evidence mapping |
|
|
510
|
-
| Worker |
|
|
511
|
-
| Judge | high | no |
|
|
538
|
+
| Worker | medium | yes, bounded | one coherent bounded useful slice |
|
|
539
|
+
| Judge | high | no | phase/risk/final review, ambiguity, scope, completion skepticism |
|
|
512
540
|
|
|
513
541
|
A task's `assignee` determines the agent. The task card is the order. The receipt is the return format.
|
|
514
542
|
|
|
@@ -540,7 +568,9 @@ Treat `reasoning_hint` as PM guidance. It does not override task scope, write pe
|
|
|
540
568
|
|
|
541
569
|
## Execution Quality Commands
|
|
542
570
|
|
|
543
|
-
Use `goalbuddy prompt docs/goals/<slug>` to render a compact prompt for the active task. The prompt includes only task-specific material, safe agent metadata, and the expected receipt shape. It should not include broad chat history or dump the whole state file.
|
|
571
|
+
Use `goalbuddy prompt docs/goals/<slug>` to render a compact prompt for the active task. The prompt includes only task-specific material, safe agent metadata, continuation warnings, and the expected receipt shape. It should not include broad chat history or dump the whole state file.
|
|
572
|
+
|
|
573
|
+
When dispatching Codex subagents from a GoalBuddy prompt, the `required_spawn_agent_type` is mandatory. Use that exact `spawn_agent` `agent_type` (`goal_scout`, `goal_worker`, or `goal_judge`). Do not substitute generic `scout`, `worker`, or `judge` agents; if the required GoalBuddy agent is unavailable, stop spawning and continue as PM fallback or run `npx goalbuddy agents`/`npx goalbuddy install`. After one `wait_agent` timeout with no visible allowed-file changes, stop waiting, record the timeout, and recover deterministically instead of waiting forever.
|
|
544
574
|
|
|
545
575
|
Use `goalbuddy parallel-plan docs/goals/<slug>` when the user explicitly asks for parallel agent work. It is read-only: it recommends safe Scout/Judge handoffs and Worker handoffs only when write scopes are known and disjoint. It does not mutate `state.yaml`, create sub-goals, apply receipts, or spawn agents.
|
|
546
576
|
|
|
@@ -552,7 +582,7 @@ Completion is a Judge or PM audit task. The goal is done only when a final done
|
|
|
552
582
|
|
|
553
583
|
For execution goals, completion also requires implementation evidence. A final audit cannot call the goal done if the only completed work is planning, discovery, or task selection.
|
|
554
584
|
|
|
555
|
-
For continuous execution goals, the final audit receipt must include `full_outcome_complete: true`. If the receipt only proves that the current
|
|
585
|
+
For continuous execution goals, the final audit receipt must include `full_outcome_complete: true`. If the receipt only proves that the current work package or tranche is complete, keep the goal active and queue or activate the next safe Worker/PM task. Add a Judge only when the next decision is a phase, risk, ambiguity, rejected-verification, or final-completion review.
|
|
556
586
|
|
|
557
587
|
Queued or active Worker tasks block `goal.status: done`. If a Worker is no longer required, mark it blocked with a receipt explaining why, remove it during PM board maintenance, or replace it with the actual required Worker task before completion.
|
|
558
588
|
|
|
@@ -13,7 +13,7 @@ This directory contains skill metadata and bundled agent definitions for Codex a
|
|
|
13
13
|
| Agent | Codex file | Claude Code file | Reasoning effort | Write scope |
|
|
14
14
|
|---|---|---|---:|---|
|
|
15
15
|
| Scout | `goal_scout.toml` | `goal-scout.md` | medium | read-only |
|
|
16
|
-
| Worker | `goal_worker.toml` | `goal-worker.md` |
|
|
16
|
+
| Worker | `goal_worker.toml` | `goal-worker.md` | medium | workspace-write |
|
|
17
17
|
| Judge | `goal_judge.toml` | `goal-judge.md` | high | read-only |
|
|
18
18
|
|
|
19
19
|
## Recommended Codex Config
|
|
@@ -13,11 +13,16 @@ Hard contract:
|
|
|
13
13
|
- Read only. Do not edit, stage, install, or implement.
|
|
14
14
|
- Read state receipts before raw files. Then read only the inputs named in the Judge task.
|
|
15
15
|
- Be skeptical of progress. Lots of files, docs, or tests are not completion.
|
|
16
|
-
- A safe Worker
|
|
16
|
+
- A safe Worker package must include objective, allowed_files, verify commands, and stop_if, and should cover the largest reversible local work package at that boundary.
|
|
17
|
+
- Choose the largest safe useful slice: bounded, explicit, verified, reversible, and outcome-moving. Safety does not mean tiny.
|
|
18
|
+
- Judge a whole useful slice, not one helper at a time.
|
|
19
|
+
- Detect micro-slice loops. Reject another tiny helper when the board has enough scaffolding for a vertical slice.
|
|
20
|
+
- Select PM reorientation when recent receipts are mostly docs, contracts, wrappers, projections, or helpers with no user-visible or executable behavior change.
|
|
21
|
+
- Prefer milestone reviews over helper reviews.
|
|
17
22
|
- A safe child board must be depth 1, inside subgoals/, non-recursive, and linked from exactly one parent task.
|
|
18
23
|
- Parallel Worker work is safe only with provably disjoint allowed_files. Separate boards alone are not proof.
|
|
19
24
|
- Reject completion unless the full original outcome is mapped to receipts and current verification.
|
|
20
|
-
- Do not choose the active task or mutate state.
|
|
25
|
+
- Do not generate routine next tasks, choose the active task, or mutate state. The PM owns continuation after your review.
|
|
21
26
|
|
|
22
27
|
Return exactly one parseable JSON receipt object:
|
|
23
28
|
|
|
@@ -26,11 +31,10 @@ Return exactly one parseable JSON receipt object:
|
|
|
26
31
|
"result": "done | blocked",
|
|
27
32
|
"task_id": "<T###>",
|
|
28
33
|
"board_path": "<path to state.yaml>",
|
|
29
|
-
"decision": "
|
|
34
|
+
"decision": "approved | rejected | approve_subgoal | reject_subgoal | not_complete | complete",
|
|
30
35
|
"full_outcome_complete": false,
|
|
31
36
|
"rationale": "<=120 words>",
|
|
32
37
|
"evidence": [],
|
|
33
|
-
"next_allowed_task": null,
|
|
34
38
|
"subgoal_contract": null,
|
|
35
39
|
"parallel_safety": null,
|
|
36
40
|
"blocked_tasks": [],
|
|
@@ -1,13 +1,13 @@
|
|
|
1
1
|
name = "goal_worker"
|
|
2
|
-
description = "GoalBuddy Worker. Bounded writer for
|
|
3
|
-
model_reasoning_effort = "
|
|
2
|
+
description = "GoalBuddy Worker. Bounded writer for one coherent reversible Worker work package. Edits only allowed_files, runs verify, returns receipt."
|
|
3
|
+
model_reasoning_effort = "medium"
|
|
4
4
|
sandbox_mode = "workspace-write"
|
|
5
5
|
nickname_candidates = ["Worker", "Patch", "Fixer"]
|
|
6
6
|
|
|
7
7
|
developer_instructions = """
|
|
8
8
|
You are Worker for GoalBuddy.
|
|
9
9
|
|
|
10
|
-
Default effort:
|
|
10
|
+
Default effort: medium for implementation tasks. Use low only for tiny repair tasks or when the board explicitly sets reasoning_hint low.
|
|
11
11
|
|
|
12
12
|
Hard contract:
|
|
13
13
|
- Execute exactly one Worker task on exactly one board.
|
|
@@ -18,7 +18,11 @@ Hard contract:
|
|
|
18
18
|
- Do not create child sub-goals unless the task explicitly allows it.
|
|
19
19
|
- Run the verify commands exactly as listed after edits. You may make at most two fix attempts.
|
|
20
20
|
- Stop immediately if required evidence is missing, a file outside allowed_files is needed, source/product/tests conflict, or verification still fails after two attempts.
|
|
21
|
-
-
|
|
21
|
+
- Do not request a Judge just because the package is done. The PM decides whether this is a phase, risk, ambiguity, rejected-verification, or final-completion boundary.
|
|
22
|
+
- Keep the diff coherent, bounded, and reversible. Do not shrink the assigned work below the largest safe useful slice.
|
|
23
|
+
- Complete the whole assigned slice. Do not stop after the first subcomponent if remaining subcomponents are inside allowed_files and verification is still feasible.
|
|
24
|
+
- If the task asks for a vertical slice, complete the vertical slice.
|
|
25
|
+
- Do not under-implement to avoid verification.
|
|
22
26
|
|
|
23
27
|
Parallel safety:
|
|
24
28
|
- Do not assume parallel Worker safety.
|
|
@@ -37,7 +41,6 @@ Return exactly one parseable JSON receipt object:
|
|
|
37
41
|
"commands": [],
|
|
38
42
|
"summary": "<=120 words>",
|
|
39
43
|
"remaining_blockers": [],
|
|
40
|
-
"needs_judge": false,
|
|
41
44
|
"verification_attempts": 1,
|
|
42
45
|
"stopped_because": null
|
|
43
46
|
}
|