agent-method 1.5.12
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +343 -0
- package/bin/wwa.js +115 -0
- package/docs/internal/cli-commands.yaml +259 -0
- package/docs/internal/doc-tokens.yaml +1103 -0
- package/docs/internal/feature-registry.yaml +1643 -0
- package/lib/boundaries.js +247 -0
- package/lib/cli/add.js +170 -0
- package/lib/cli/casestudy.js +1000 -0
- package/lib/cli/check.js +323 -0
- package/lib/cli/close.js +838 -0
- package/lib/cli/completion.js +735 -0
- package/lib/cli/deps.js +234 -0
- package/lib/cli/digest.js +73 -0
- package/lib/cli/doc-review.js +486 -0
- package/lib/cli/docs.js +315 -0
- package/lib/cli/helpers.js +198 -0
- package/lib/cli/implement.js +169 -0
- package/lib/cli/init.js +280 -0
- package/lib/cli/pipeline.js +206 -0
- package/lib/cli/plan.js +140 -0
- package/lib/cli/record.js +98 -0
- package/lib/cli/refine.js +202 -0
- package/lib/cli/report-helpers.js +113 -0
- package/lib/cli/review.js +76 -0
- package/lib/cli/routable.js +109 -0
- package/lib/cli/route.js +101 -0
- package/lib/cli/scan.js +133 -0
- package/lib/cli/serve.js +23 -0
- package/lib/cli/status.js +65 -0
- package/lib/cli/update-docs.js +574 -0
- package/lib/cli/upgrade.js +222 -0
- package/lib/cli/watch.js +32 -0
- package/lib/dependencies.js +196 -0
- package/lib/init.js +692 -0
- package/lib/mcp-server.js +612 -0
- package/lib/pipeline.js +907 -0
- package/lib/registry.js +132 -0
- package/lib/watcher.js +165 -0
- package/package.json +54 -0
- package/templates/README.md +363 -0
- package/templates/entry-points/.cursorrules +90 -0
- package/templates/entry-points/AGENT.md +90 -0
- package/templates/entry-points/CLAUDE.md +88 -0
- package/templates/extensions/MANIFEST.md +110 -0
- package/templates/extensions/analytical-system.md +96 -0
- package/templates/extensions/code-project.md +77 -0
- package/templates/extensions/data-exploration.md +117 -0
- package/templates/full/.context/BASE.md +101 -0
- package/templates/full/.context/COMPOSITION.md +47 -0
- package/templates/full/.context/INDEX.yaml +56 -0
- package/templates/full/.context/METHODOLOGY.md +246 -0
- package/templates/full/.context/PROTOCOL.yaml +169 -0
- package/templates/full/.context/REGISTRY.md +75 -0
- package/templates/full/.cursorrules +90 -0
- package/templates/full/AGENT.md +90 -0
- package/templates/full/CLAUDE.md +90 -0
- package/templates/full/Management/DIGEST.md +23 -0
- package/templates/full/Management/STATUS.md +46 -0
- package/templates/full/PLAN.md +67 -0
- package/templates/full/PROJECT-PROFILE.md +61 -0
- package/templates/full/PROJECT.md +80 -0
- package/templates/full/REQUIREMENTS.md +30 -0
- package/templates/full/ROADMAP.md +39 -0
- package/templates/full/Reviews/INDEX.md +41 -0
- package/templates/full/Reviews/backlog.md +52 -0
- package/templates/full/Reviews/plan.md +43 -0
- package/templates/full/Reviews/project.md +41 -0
- package/templates/full/Reviews/requirements.md +42 -0
- package/templates/full/Reviews/roadmap.md +41 -0
- package/templates/full/Reviews/state.md +56 -0
- package/templates/full/SESSION-LOG.md +102 -0
- package/templates/full/STATE.md +42 -0
- package/templates/full/SUMMARY.md +27 -0
- package/templates/full/agentWorkflows/INDEX.md +42 -0
- package/templates/full/agentWorkflows/observations.md +65 -0
- package/templates/full/agentWorkflows/patterns.md +68 -0
- package/templates/full/agentWorkflows/sessions.md +92 -0
- package/templates/full/intro/README.md +39 -0
- package/templates/full/registry/feature-registry.yaml +25 -0
- package/templates/full/registry/features/catalog.yaml +743 -0
- package/templates/full/registry/features/protocol.yaml +121 -0
- package/templates/full/registry/features/routing.yaml +358 -0
- package/templates/full/registry/features/workflows.yaml +404 -0
- package/templates/full/todos/backlog.md +19 -0
- package/templates/starter/.context/BASE.md +66 -0
- package/templates/starter/.context/INDEX.yaml +51 -0
- package/templates/starter/.context/METHODOLOGY.md +228 -0
- package/templates/starter/.context/PROTOCOL.yaml +165 -0
- package/templates/starter/.cursorrules +90 -0
- package/templates/starter/AGENT.md +90 -0
- package/templates/starter/CLAUDE.md +90 -0
- package/templates/starter/Management/DIGEST.md +23 -0
- package/templates/starter/Management/STATUS.md +46 -0
- package/templates/starter/PLAN.md +67 -0
- package/templates/starter/PROJECT-PROFILE.md +44 -0
- package/templates/starter/PROJECT.md +80 -0
- package/templates/starter/ROADMAP.md +39 -0
- package/templates/starter/Reviews/INDEX.md +75 -0
- package/templates/starter/SESSION-LOG.md +102 -0
- package/templates/starter/STATE.md +42 -0
- package/templates/starter/SUMMARY.md +27 -0
- package/templates/starter/agentWorkflows/INDEX.md +61 -0
- package/templates/starter/intro/README.md +37 -0
- package/templates/starter/registry/feature-registry.yaml +25 -0
- package/templates/starter/registry/features/catalog.yaml +743 -0
- package/templates/starter/registry/features/protocol.yaml +121 -0
- package/templates/starter/registry/features/routing.yaml +358 -0
- package/templates/starter/registry/features/workflows.yaml +404 -0
|
@@ -0,0 +1,41 @@
|
|
|
1
|
+
# Roadmap Review
|
|
2
|
+
|
|
3
|
+
<!-- AGENT: Synthesize from ROADMAP.md. This is the high-level view of phase progress,
|
|
4
|
+
milestones, and project trajectory. Update after phase completions or milestone changes.
|
|
5
|
+
|
|
6
|
+
Source: ROADMAP.md
|
|
7
|
+
Parent: Reviews/INDEX.md (update "At a glance" row when this changes) -->
|
|
8
|
+
|
|
9
|
+
## Phase progress
|
|
10
|
+
|
|
11
|
+
| Phase | Name | Status | Completion | Gate |
|
|
12
|
+
|-------|------|--------|------------|------|
|
|
13
|
+
<!-- Populate from ROADMAP.md. Show all phases with current status. -->
|
|
14
|
+
|
|
15
|
+
## Milestone timeline
|
|
16
|
+
|
|
17
|
+
<!-- AGENT: Track when phases were completed or are expected to complete. -->
|
|
18
|
+
|
|
19
|
+
| Milestone | Target | Actual | Delta |
|
|
20
|
+
|-----------|--------|--------|-------|
|
|
21
|
+
<!-- {phase/milestone name} | {expected date} | {actual date} | {on time / early / late} -->
|
|
22
|
+
|
|
23
|
+
## Velocity analysis
|
|
24
|
+
|
|
25
|
+
<!-- AGENT: Observe patterns in phase completion speed. -->
|
|
26
|
+
|
|
27
|
+
- **Average phase duration**: {estimate based on completed phases}
|
|
28
|
+
- **Trend**: {accelerating / steady / slowing}
|
|
29
|
+
- **Bottleneck phases**: {any phases that took significantly longer}
|
|
30
|
+
|
|
31
|
+
## Upcoming work
|
|
32
|
+
|
|
33
|
+
<!-- AGENT: What's next on the roadmap? Any dependencies or risks? -->
|
|
34
|
+
|
|
35
|
+
### Next phase
|
|
36
|
+
|
|
37
|
+
{Brief description of what's coming and what it depends on.}
|
|
38
|
+
|
|
39
|
+
### Risks to timeline
|
|
40
|
+
|
|
41
|
+
<!-- Known risks that could delay upcoming phases. -->
|
|
@@ -0,0 +1,56 @@
|
|
|
1
|
+
# State Review
|
|
2
|
+
|
|
3
|
+
<!-- AGENT: Synthesize from STATE.md. Analyze decision patterns, blocker trends,
|
|
4
|
+
and open question resolution. This is the analytical view of project state —
|
|
5
|
+
STATE.md is the raw data, this file is the analysis.
|
|
6
|
+
Update after significant state changes (new blockers, major decisions).
|
|
7
|
+
|
|
8
|
+
Source: STATE.md
|
|
9
|
+
Parent: Reviews/INDEX.md (update "At a glance" row when this changes) -->
|
|
10
|
+
|
|
11
|
+
## Decision analysis
|
|
12
|
+
|
|
13
|
+
### Summary
|
|
14
|
+
|
|
15
|
+
- **Total decisions**: {count}
|
|
16
|
+
- **Decisions this phase**: {count}
|
|
17
|
+
- **Most common decision type**: {technical / architectural / process / scope}
|
|
18
|
+
|
|
19
|
+
### Recent decisions (last 10)
|
|
20
|
+
|
|
21
|
+
| Date | Decision | Category |
|
|
22
|
+
|------|----------|----------|
|
|
23
|
+
<!-- Last 10 from STATE.md decisions table -->
|
|
24
|
+
|
|
25
|
+
### Decision frequency
|
|
26
|
+
|
|
27
|
+
<!-- AGENT: How often are decisions being made? Any patterns in timing? -->
|
|
28
|
+
|
|
29
|
+
## Blocker analysis
|
|
30
|
+
|
|
31
|
+
### Active blockers
|
|
32
|
+
|
|
33
|
+
| Blocker | Since | Duration | Severity | Resolution path |
|
|
34
|
+
|---------|-------|----------|----------|----------------|
|
|
35
|
+
<!-- Active blockers from STATE.md with aging analysis -->
|
|
36
|
+
|
|
37
|
+
### Resolved blockers
|
|
38
|
+
|
|
39
|
+
- **Total resolved**: {count}
|
|
40
|
+
- **Average resolution time**: {estimate}
|
|
41
|
+
- **Most common blocker type**: {external dependency / technical / decision needed}
|
|
42
|
+
|
|
43
|
+
## Open question analysis
|
|
44
|
+
|
|
45
|
+
### Active questions
|
|
46
|
+
|
|
47
|
+
| Question | Since | Duration | Priority |
|
|
48
|
+
|----------|-------|----------|----------|
|
|
49
|
+
<!-- Active open questions with aging -->
|
|
50
|
+
|
|
51
|
+
### Resolution rate
|
|
52
|
+
|
|
53
|
+
- **Total questions raised**: {count}
|
|
54
|
+
- **Resolved**: {count} ({%})
|
|
55
|
+
- **Still open**: {count}
|
|
56
|
+
- **Average resolution time**: {estimate}
|
|
@@ -0,0 +1,102 @@
|
|
|
1
|
+
# Session Log
|
|
2
|
+
|
|
3
|
+
Append-only session observation log for case study data collection. Each session adds a metrics entry at close. High-effort tasks log immediately at task completion. This file is read only during extraction — never during normal work, when it is only appended to.
|
|
4
|
+
|
|
5
|
+
<!-- AGENT INSTRUCTION: At the end of every session — or immediately after any high-effort task —
|
|
6
|
+
append a new entry below using the format in "Entry format".
|
|
7
|
+
Do NOT read this file during normal work — only append to it.
|
|
8
|
+
Do NOT modify or delete previous entries (the only exception is moving older entries, unchanged, to an archive as described below).
|
|
9
|
+
When this file exceeds 300 lines, archive older entries to session-log/batch-{N}.md -->
|
|
10
|
+
|
|
11
|
+
## Project context
|
|
12
|
+
|
|
13
|
+
| Field | Value |
|
|
14
|
+
|-------|-------|
|
|
15
|
+
| Project name | {project name} |
|
|
16
|
+
| Project type | {code / data / analytical / mixed / general} |
|
|
17
|
+
| Integration profile | {lite / standard / full} |
|
|
18
|
+
| Extension(s) | {code-project / data-exploration / analytical-system / none} |
|
|
19
|
+
| Observation started | {date} |
|
|
20
|
+
|
|
21
|
+
## Effort classification
|
|
22
|
+
|
|
23
|
+
| Effort | Description | When to log |
|
|
24
|
+
|--------|-------------|-------------|
|
|
25
|
+
| **low** | Quick answer, single file or no changes, <5 min | At session close |
|
|
26
|
+
| **medium** | Multi-step work, several file changes, 5-30 min | At session close |
|
|
27
|
+
| **high** | Complex multi-file changes, architecture decisions, extensive debugging, 30+ min | Immediately at task completion |
|
|
28
|
+
|
|
29
|
+
## Assessment scales
|
|
30
|
+
|
|
31
|
+
**Ambiguity** (agent-assessed — how clear was the user's request?):
|
|
32
|
+
- **low**: Clear, specific request with sufficient context
|
|
33
|
+
- **medium**: Request understood but required interpretation or assumptions
|
|
34
|
+
- **high**: Vague or ambiguous, required significant clarification
|
|
35
|
+
|
|
36
|
+
**Context level** (agent-assessed — how much project context was loaded?):
|
|
37
|
+
- **very low**: No project files loaded, answered from general knowledge
|
|
38
|
+
- **low**: Entry point only
|
|
39
|
+
- **medium**: Entry point + STATE.md + 1-2 project files
|
|
40
|
+
- **high**: Entry point + STATE.md + specialist context + multiple project files
|
|
41
|
+
- **very high**: Extensive project context, multiple specialists, cross-file analysis
|
|
42
|
+
|
|
43
|
+
**User response** (agent-observed — how did the user respond to the result?):
|
|
44
|
+
- **accepted**: User proceeded to next step without changes
|
|
45
|
+
- **edited**: User manually modified the agent's output
|
|
46
|
+
- **revised**: User asked agent to redo or revise the result
|
|
47
|
+
- **rejected**: User said no or declined the result entirely
|
|
48
|
+
- **redirected**: User changed approach or gave new instructions
|
|
49
|
+
|
|
50
|
+
**Refinement magnitude** (for medium/high effort only — how much changed from first attempt to final?):
|
|
51
|
+
- **none**: Accepted as-is, 0% changed
|
|
52
|
+
- **minor**: Small fixes — typos, naming, formatting (<10% changed)
|
|
53
|
+
- **moderate**: Logic or structural changes, added/removed sections (10–50% changed)
|
|
54
|
+
- **major**: Significant rework of approach or content (50–80% changed)
|
|
55
|
+
- **rework**: Mostly rewritten, original approach abandoned (>80% changed)
|
|
56
|
+
|
|
57
|
+
**Delta categories** (what kinds of changes were needed — select all that apply):
|
|
58
|
+
- **accuracy**: Factual errors or incorrect implementation
|
|
59
|
+
- **completeness**: Missing parts, incomplete coverage
|
|
60
|
+
- **approach**: Wrong method or strategy
|
|
61
|
+
- **scope**: Over-scoped or under-scoped
|
|
62
|
+
- **style**: Formatting, naming, conventions
|
|
63
|
+
|
|
64
|
+
## Observation checklist
|
|
65
|
+
|
|
66
|
+
At session close (or high-effort task completion), reflect on these before writing the entry:
|
|
67
|
+
1. Which workflow did this session follow?
|
|
68
|
+
2. Which query types were encountered?
|
|
69
|
+
3. Which features visibly activated? (context loading, cascade, decision recording, scoping)
|
|
70
|
+
4. Were any cascades expected but missed?
|
|
71
|
+
5. Were any decisions deferred instead of recorded immediately?
|
|
72
|
+
6. Was there friction with any methodology rule?
|
|
73
|
+
7. Any degradation signals? (HAI-05: cascade misses, instruction loss, shallow context)
|
|
74
|
+
8. How much effort did this task require? (low / medium / high)
|
|
75
|
+
9. How ambiguous was the user's request? (low / medium / high)
|
|
76
|
+
10. How much project context was loaded? (very low / low / medium / high / very high)
|
|
77
|
+
11. LLM token usage (input + output), tool call count, and wall time?
|
|
78
|
+
12. How did the user respond to the result? (accepted / edited / revised / rejected / redirected)
|
|
79
|
+
13. For medium/high effort: how many revision cycles before acceptance?
|
|
80
|
+
14. For medium/high effort: what magnitude of change between first attempt and final result? (none / minor / moderate / major / rework)
|
|
81
|
+
15. What categories of refinement were needed? (accuracy / completeness / approach / scope / style)
|
|
82
|
+
|
|
83
|
+
## Entry format
|
|
84
|
+
|
|
85
|
+
<!-- Append new entries below. Format: -->
|
|
86
|
+
<!--
|
|
87
|
+
### S{N} — {YYYY-MM-DD} — {brief title}
|
|
88
|
+
Model: {model} | Profile: {profile} | Workflow: {WF-XX}
|
|
89
|
+
Effort: {low / medium / high} | Ambiguity: {low / medium / high} | Context: {very low / low / medium / high / very high}
|
|
90
|
+
LLM tokens: ~{N}k ({N} input + {N} output) | Tool calls: {N} | Wall time: ~{N} min
|
|
91
|
+
Queries: {query types encountered}
|
|
92
|
+
Features: {feature IDs activated}
|
|
93
|
+
Cascades: {triggered}/{expected} | Decisions: {count}
|
|
94
|
+
Response: {accepted / edited / revised / rejected / redirected}
|
|
95
|
+
Revisions: {0 | count of revision cycles} | Magnitude: {none / minor / moderate / major / rework}
|
|
96
|
+
Delta: {n/a | categories: accuracy, completeness, approach, scope, style} | Survival: ~{N}%
|
|
97
|
+
Delta notes: {n/a | brief description of what changed between first attempt and final}
|
|
98
|
+
Friction: {none | brief description}
|
|
99
|
+
Finding: {none | observation with methodology implication}
|
|
100
|
+
-->
|
|
101
|
+
|
|
102
|
+
## Session entries
|
|
@@ -0,0 +1,42 @@
|
|
|
1
|
+
# State
|
|
2
|
+
|
|
3
|
+
## Current position
|
|
4
|
+
|
|
5
|
+
- **Phase**: {Phase name or number}
|
|
6
|
+
- **Status**: {What's happening now}
|
|
7
|
+
- **Next**: {What comes after the current work}
|
|
8
|
+
- **Active context**: `.context/BASE.md`
|
|
9
|
+
|
|
10
|
+
<!-- INSTRUCTION: Update this section every session. The next session reads this
|
|
11
|
+
to know where to pick up. Be specific about what's in progress and what's next. -->
|
|
12
|
+
|
|
13
|
+
## Decisions
|
|
14
|
+
|
|
15
|
+
| Date | Decision | Rationale |
|
|
16
|
+
|------|----------|-----------|
|
|
17
|
+
<!-- INSTRUCTION: Add decisions HERE, in the SAME response as the work that
|
|
18
|
+
produced them. Never defer to end of session. If the session is interrupted,
|
|
19
|
+
the decision survives. Format: date, what was decided, why. -->
|
|
20
|
+
|
|
21
|
+
## Blockers
|
|
22
|
+
|
|
23
|
+
<!-- INSTRUCTION: List anything preventing progress. Remove when resolved. -->
|
|
24
|
+
|
|
25
|
+
None currently.
|
|
26
|
+
|
|
27
|
+
## Open questions
|
|
28
|
+
|
|
29
|
+
<!-- INSTRUCTION: When the agent encounters uncertainty, it writes a numbered
|
|
30
|
+
question here. When resolved, don't delete — add the resolution inline.
|
|
31
|
+
This preserves reasoning history. -->
|
|
32
|
+
|
|
33
|
+
1. {Open question — describe what's uncertain and why it matters}
|
|
34
|
+
|
|
35
|
+
## Variant log
|
|
36
|
+
|
|
37
|
+
<!-- INSTRUCTION: Optional. Track experiment variants if your project involves
|
|
38
|
+
A/B testing, prompt variants, or configuration comparison. Delete if unused. -->
|
|
39
|
+
|
|
40
|
+
| Run | Scenario | Variant | Avg Score | Notes |
|
|
41
|
+
|-----|----------|---------|-----------|-------|
|
|
42
|
+
| -- | -- | -- | -- | No runs executed yet |
|
|
@@ -0,0 +1,27 @@
|
|
|
1
|
+
# Summary
|
|
2
|
+
|
|
3
|
+
<!-- AGENT: This file is the session audit trail — a chronological record of work done.
|
|
4
|
+
The management digest has moved to Management/DIGEST.md.
|
|
5
|
+
Append an entry after each session or significant task using the format below.
|
|
6
|
+
Never edit previous entries. -->
|
|
7
|
+
|
|
8
|
+
## Session audit trail
|
|
9
|
+
|
|
10
|
+
<!-- INSTRUCTION: Use this format for each entry:
|
|
11
|
+
|
|
12
|
+
### {Date} — {Brief title}
|
|
13
|
+
|
|
14
|
+
**Plan**: {What was planned for this session}
|
|
15
|
+
**Outcome**: {What was actually accomplished}
|
|
16
|
+
|
|
17
|
+
**Files created**:
|
|
18
|
+
- {path/to/new-file.md}
|
|
19
|
+
|
|
20
|
+
**Files updated**:
|
|
21
|
+
- {path/to/updated-file.md} — {what changed}
|
|
22
|
+
|
|
23
|
+
**Key decisions**:
|
|
24
|
+
- {Decision and rationale — should match what's in STATE.md}
|
|
25
|
+
|
|
26
|
+
**Next**: {What should happen in the following session — this is the bridge}
|
|
27
|
+
-->
|
|
@@ -0,0 +1,42 @@
|
|
|
1
|
+
# Agent Workflows
|
|
2
|
+
|
|
3
|
+
<!-- AGENT: This file is the overview of agent workflow performance.
|
|
4
|
+
It links to detailed analysis files for deep dives.
|
|
5
|
+
Update the summary table after high-effort sessions.
|
|
6
|
+
|
|
7
|
+
Source: SESSION-LOG.md entries, agent self-observation during sessions.
|
|
8
|
+
Detail lives in the linked analysis files — keep this file lean. -->
|
|
9
|
+
|
|
10
|
+
## Workflow summary
|
|
11
|
+
|
|
12
|
+
| Workflow | Times used | Last used | Typical effort | Analysis |
|
|
13
|
+
|----------|-----------|-----------|---------------|----------|
|
|
14
|
+
<!-- Populate from SESSION-LOG.md workflow field -->
|
|
15
|
+
| {WF-XX} | {N} | {date} | {low/medium/high} | [sessions.md](sessions.md) |
|
|
16
|
+
|
|
17
|
+
## Quick stats
|
|
18
|
+
|
|
19
|
+
<!-- AGENT: Populate from SESSION-LOG.md. Update after each high-effort session. -->
|
|
20
|
+
|
|
21
|
+
- **Total sessions**: {count}
|
|
22
|
+
- **Acceptance rate**: {%} (accepted on first attempt)
|
|
23
|
+
- **Average effort**: {low/medium/high}
|
|
24
|
+
- **Most common workflow**: {WF-XX}
|
|
25
|
+
- **Cascade compliance**: {triggered/expected} ({%})
|
|
26
|
+
|
|
27
|
+
## Analysis files
|
|
28
|
+
|
|
29
|
+
| File | What it covers | Last updated |
|
|
30
|
+
|------|---------------|-------------|
|
|
31
|
+
| [sessions.md](sessions.md) | Session-by-session analysis, effort distribution, query patterns | {date} |
|
|
32
|
+
| [patterns.md](patterns.md) | Extracted behavioral patterns, what works vs. friction | {date} |
|
|
33
|
+
| [observations.md](observations.md) | Case study observations, methodology findings | {date} |
|
|
34
|
+
|
|
35
|
+
## Recent findings
|
|
36
|
+
|
|
37
|
+
<!-- AGENT: Keep the 5 most recent significant findings here.
|
|
38
|
+
Full findings history in observations.md. -->
|
|
39
|
+
|
|
40
|
+
| Date | Finding | Severity | Action taken |
|
|
41
|
+
|------|---------|----------|-------------|
|
|
42
|
+
<!-- Last 5 significant findings -->
|
|
@@ -0,0 +1,65 @@
|
|
|
1
|
+
# Case Study Observations
|
|
2
|
+
|
|
3
|
+
<!-- AGENT: Record methodology observations — findings from running the methodology
|
|
4
|
+
on this project that have implications for methodology improvement. These feed
|
|
5
|
+
into refinement reports (see case-studies/refinement-report-template.md).
|
|
6
|
+
Update whenever a significant finding emerges during a session.
|
|
7
|
+
|
|
8
|
+
Source: SESSION-LOG.md (finding field), agent self-observation
|
|
9
|
+
Parent: agentWorkflows/INDEX.md (update recent findings when this changes) -->
|
|
10
|
+
|
|
11
|
+
## Observation log
|
|
12
|
+
|
|
13
|
+
<!-- AGENT: Append new observations. Never edit or delete previous entries. -->
|
|
14
|
+
|
|
15
|
+
| # | Date | Observation | Category | Severity | Action |
|
|
16
|
+
|---|------|-------------|----------|----------|--------|
|
|
17
|
+
<!-- {N} | {date} | {what was observed} | {see categories below} | {critical/major/minor/enhancement} | {what was done or proposed} -->
|
|
18
|
+
|
|
19
|
+
## Categories
|
|
20
|
+
|
|
21
|
+
Observations are classified into these categories (matching the refinement report template):
|
|
22
|
+
|
|
23
|
+
| Category | Code | Description |
|
|
24
|
+
|----------|------|-------------|
|
|
25
|
+
| Context quality | CQ | How well .context/ files serve the project |
|
|
26
|
+
| Decision preservation | DP | Whether decisions are captured accurately and timely |
|
|
27
|
+
| Scope discipline | SD | Whether scoping rules are followed correctly |
|
|
28
|
+
| Cascade coverage | CC | Whether cascade rules trigger correctly and completely |
|
|
29
|
+
| Audit completeness | AC | Whether session records are complete and useful |
|
|
30
|
+
| Bootstrap speed | BS | How quickly new projects get productive |
|
|
31
|
+
| Lifecycle fit | LF | Whether lifecycle stage affects methodology effectiveness |
|
|
32
|
+
| Model adequacy | MA | Whether the model tier matches task complexity |
|
|
33
|
+
|
|
34
|
+
## Severity guide
|
|
35
|
+
|
|
36
|
+
| Severity | Definition | Response |
|
|
37
|
+
|----------|-----------|----------|
|
|
38
|
+
| **Critical** | Methodology fails to function correctly | Immediate fix needed |
|
|
39
|
+
| **Major** | Methodology works but produces poor results | Fix before next case study |
|
|
40
|
+
| **Minor** | Methodology works but could be smoother | Fix when convenient |
|
|
41
|
+
| **Enhancement** | Opportunity to improve, not a problem | Add to backlog |
|
|
42
|
+
|
|
43
|
+
## Summary by category
|
|
44
|
+
|
|
45
|
+
<!-- AGENT: Aggregate observations by category. Update as observations accumulate. -->
|
|
46
|
+
|
|
47
|
+
| Category | Critical | Major | Minor | Enhancement | Total |
|
|
48
|
+
|----------|----------|-------|-------|-------------|-------|
|
|
49
|
+
| Context quality | {N} | {N} | {N} | {N} | {N} |
|
|
50
|
+
| Decision preservation | {N} | {N} | {N} | {N} | {N} |
|
|
51
|
+
| Scope discipline | {N} | {N} | {N} | {N} | {N} |
|
|
52
|
+
| Cascade coverage | {N} | {N} | {N} | {N} | {N} |
|
|
53
|
+
| Audit completeness | {N} | {N} | {N} | {N} | {N} |
|
|
54
|
+
| Bootstrap speed | {N} | {N} | {N} | {N} | {N} |
|
|
55
|
+
| Lifecycle fit | {N} | {N} | {N} | {N} | {N} |
|
|
56
|
+
| Model adequacy | {N} | {N} | {N} | {N} | {N} |
|
|
57
|
+
|
|
58
|
+
## Refinement candidates
|
|
59
|
+
|
|
60
|
+
<!-- AGENT: Observations promoted to refinement report candidates. These are findings
|
|
61
|
+
significant enough to warrant methodology changes. -->
|
|
62
|
+
|
|
63
|
+
| Observation # | Category | Proposed change | Status |
|
|
64
|
+
|--------------|----------|----------------|--------|
|
|
65
|
+
<!-- {N} | {code} | {what should change in the methodology} | {proposed / accepted / implemented / rejected} -->
|
|
@@ -0,0 +1,68 @@
|
|
|
1
|
+
# Behavioral Patterns
|
|
2
|
+
|
|
3
|
+
<!-- AGENT: Extract recurring patterns from SESSION-LOG.md and session experience.
|
|
4
|
+
Focus on what works, what doesn't, and what could be improved.
|
|
5
|
+
Update when new patterns emerge or existing patterns are confirmed/disproven.
|
|
6
|
+
|
|
7
|
+
Source: SESSION-LOG.md (friction and finding fields), agent self-observation
|
|
8
|
+
Parent: agentWorkflows/INDEX.md (update recent findings when this changes) -->
|
|
9
|
+
|
|
10
|
+
## Effective patterns
|
|
11
|
+
|
|
12
|
+
<!-- AGENT: Patterns that consistently lead to good outcomes (accepted results,
|
|
13
|
+
efficient execution, accurate context loading). -->
|
|
14
|
+
|
|
15
|
+
### Context loading
|
|
16
|
+
|
|
17
|
+
<!-- What context loading strategies work best for this project? -->
|
|
18
|
+
|
|
19
|
+
### Cascade compliance
|
|
20
|
+
|
|
21
|
+
<!-- How well are cascade rules followed? Any patterns in misses? -->
|
|
22
|
+
|
|
23
|
+
- **Cascade compliance rate**: {triggered/expected} ({%})
|
|
24
|
+
- **Common cascade misses**: {which cascade rules get missed most?}
|
|
25
|
+
|
|
26
|
+
### Decision recording
|
|
27
|
+
|
|
28
|
+
<!-- Is decision recording happening in the same response? Any delays? -->
|
|
29
|
+
|
|
30
|
+
### Query routing
|
|
31
|
+
|
|
32
|
+
<!-- Are queries routing to the correct workflow? Any misclassifications? -->
|
|
33
|
+
|
|
34
|
+
## Friction points
|
|
35
|
+
|
|
36
|
+
<!-- AGENT: Patterns that consistently cause problems — methodology rules that
|
|
37
|
+
are hard to follow, scoping that doesn't fit, cascades that are unclear. -->
|
|
38
|
+
|
|
39
|
+
### Recurring friction
|
|
40
|
+
|
|
41
|
+
| Pattern | Frequency | Impact | Potential fix |
|
|
42
|
+
|---------|-----------|--------|--------------|
|
|
43
|
+
<!-- {description} | {how often} | {low/medium/high} | {what might help} -->
|
|
44
|
+
|
|
45
|
+
### Methodology gaps
|
|
46
|
+
|
|
47
|
+
<!-- Are there query types or situations not covered by current scoping rules? -->
|
|
48
|
+
|
|
49
|
+
### Scale issues
|
|
50
|
+
|
|
51
|
+
<!-- Are any files consistently approaching the 300-line threshold? -->
|
|
52
|
+
|
|
53
|
+
## Anti-patterns
|
|
54
|
+
|
|
55
|
+
<!-- AGENT: Things that should be avoided — approaches that lead to rejections,
|
|
56
|
+
context loading that wastes tokens, cascades that produce low-value updates. -->
|
|
57
|
+
|
|
58
|
+
| Anti-pattern | Observed | Consequence | Prevention |
|
|
59
|
+
|-------------|----------|-------------|------------|
|
|
60
|
+
<!-- {description} | {when it happened} | {what went wrong} | {how to avoid} -->
|
|
61
|
+
|
|
62
|
+
## Improvement suggestions
|
|
63
|
+
|
|
64
|
+
<!-- AGENT: Based on patterns observed, what methodology changes would help? -->
|
|
65
|
+
|
|
66
|
+
| Suggestion | Evidence | Priority | Status |
|
|
67
|
+
|-----------|----------|----------|--------|
|
|
68
|
+
<!-- {what to change} | {based on what pattern} | {low/medium/high} | {proposed / implemented / rejected} -->
|
|
@@ -0,0 +1,92 @@
|
|
|
1
|
+
# Session Analysis
|
|
2
|
+
|
|
3
|
+
<!-- AGENT: Synthesize from SESSION-LOG.md. Aggregate session metrics into
|
|
4
|
+
actionable patterns. This transforms raw session data into analysis.
|
|
5
|
+
Update after every 5 sessions or after any high-effort session.
|
|
6
|
+
|
|
7
|
+
Source: SESSION-LOG.md
|
|
8
|
+
Parent: agentWorkflows/INDEX.md (update quick stats when this changes) -->
|
|
9
|
+
|
|
10
|
+
## Effort distribution
|
|
11
|
+
|
|
12
|
+
| Effort level | Count | Percentage | Avg time |
|
|
13
|
+
|-------------|-------|------------|----------|
|
|
14
|
+
| Low | {N} | {%} | ~{N} min |
|
|
15
|
+
| Medium | {N} | {%} | ~{N} min |
|
|
16
|
+
| High | {N} | {%} | ~{N} min |
|
|
17
|
+
|
|
18
|
+
## Query type frequency
|
|
19
|
+
|
|
20
|
+
<!-- AGENT: Which query types appear most often in SESSION-LOG.md? -->
|
|
21
|
+
|
|
22
|
+
| Query type | Count | Typical effort | Typical outcome |
|
|
23
|
+
|-----------|-------|---------------|----------------|
|
|
24
|
+
<!-- Populate from SESSION-LOG.md queries field -->
|
|
25
|
+
|
|
26
|
+
## Workflow usage
|
|
27
|
+
|
|
28
|
+
| Workflow | Count | Success rate | Avg effort |
|
|
29
|
+
|----------|-------|-------------|------------|
|
|
30
|
+
<!-- Populate from SESSION-LOG.md workflow field -->
|
|
31
|
+
|
|
32
|
+
## Acceptance analysis
|
|
33
|
+
|
|
34
|
+
### Overall
|
|
35
|
+
|
|
36
|
+
| Response | Count | Percentage |
|
|
37
|
+
|----------|-------|------------|
|
|
38
|
+
| Accepted | {N} | {%} |
|
|
39
|
+
| Edited | {N} | {%} |
|
|
40
|
+
| Revised | {N} | {%} |
|
|
41
|
+
| Rejected | {N} | {%} |
|
|
42
|
+
| Redirected | {N} | {%} |
|
|
43
|
+
|
|
44
|
+
### By effort level
|
|
45
|
+
|
|
46
|
+
<!-- AGENT: Break down acceptance rates by effort level. Do high-effort tasks
|
|
47
|
+
get revised more often? -->
|
|
48
|
+
|
|
49
|
+
| Effort | Accepted | Edited | Revised | Rejected | Redirected |
|
|
50
|
+
|--------|----------|--------|---------|----------|------------|
|
|
51
|
+
| Low | {%} | {%} | {%} | {%} | {%} |
|
|
52
|
+
| Medium | {%} | {%} | {%} | {%} | {%} |
|
|
53
|
+
| High | {%} | {%} | {%} | {%} | {%} |
|
|
54
|
+
|
|
55
|
+
## Refinement patterns
|
|
56
|
+
|
|
57
|
+
<!-- AGENT: For medium/high effort tasks, what refinement patterns emerge? -->
|
|
58
|
+
|
|
59
|
+
### Magnitude distribution
|
|
60
|
+
|
|
61
|
+
| Magnitude | Count | Percentage |
|
|
62
|
+
|-----------|-------|------------|
|
|
63
|
+
| None | {N} | {%} |
|
|
64
|
+
| Minor | {N} | {%} |
|
|
65
|
+
| Moderate | {N} | {%} |
|
|
66
|
+
| Major | {N} | {%} |
|
|
67
|
+
| Rework | {N} | {%} |
|
|
68
|
+
|
|
69
|
+
### Delta categories
|
|
70
|
+
|
|
71
|
+
<!-- Which types of changes are most common? -->
|
|
72
|
+
|
|
73
|
+
| Category | Count | Notes |
|
|
74
|
+
|----------|-------|-------|
|
|
75
|
+
| Accuracy | {N} | {pattern notes} |
|
|
76
|
+
| Completeness | {N} | {pattern notes} |
|
|
77
|
+
| Approach | {N} | {pattern notes} |
|
|
78
|
+
| Scope | {N} | {pattern notes} |
|
|
79
|
+
| Style | {N} | {pattern notes} |
|
|
80
|
+
|
|
81
|
+
## Context level patterns
|
|
82
|
+
|
|
83
|
+
<!-- AGENT: How much context is typically loaded? Does more context correlate with
|
|
84
|
+
better acceptance rates? -->
|
|
85
|
+
|
|
86
|
+
| Context level | Count | Acceptance rate |
|
|
87
|
+
|--------------|-------|----------------|
|
|
88
|
+
| Very low | {N} | {%} |
|
|
89
|
+
| Low | {N} | {%} |
|
|
90
|
+
| Medium | {N} | {%} |
|
|
91
|
+
| High | {N} | {%} |
|
|
92
|
+
| Very high | {N} | {%} |
|
|
@@ -0,0 +1,39 @@
|
|
|
1
|
+
# Methodology Overview
|
|
2
|
+
|
|
3
|
+
This project uses the **wwa** (Working With Agents) methodology for AI-agent-assisted development. The methodology gives your AI agent persistent memory, structured workflows, and scoped context loading across sessions.
|
|
4
|
+
|
|
5
|
+
## How it works
|
|
6
|
+
|
|
7
|
+
Your agent reads an entry point file (CLAUDE.md, .cursorrules, or AGENT.md) at the start of every session. That file tells the agent:
|
|
8
|
+
|
|
9
|
+
- **What to read** — scoping rules match your question to the right files
|
|
10
|
+
- **What to update** — cascade rules keep dependent files in sync
|
|
11
|
+
- **How to work** — workflows guide the agent through structured steps
|
|
12
|
+
|
|
13
|
+
Key files the agent manages:
|
|
14
|
+
|
|
15
|
+
| File | Purpose |
|
|
16
|
+
|------|---------|
|
|
17
|
+
| STATE.md | Decisions, blockers, current position (cross-session memory) |
|
|
18
|
+
| PLAN.md | Current task with verification criteria |
|
|
19
|
+
| ROADMAP.md | Phase breakdown with gate criteria |
|
|
20
|
+
| REQUIREMENTS.md | Scoped features with phase traceability |
|
|
21
|
+
| .context/BASE.md | Core project context — architecture, codebase map |
|
|
22
|
+
| .context/REGISTRY.md | Navigation map for split file trees |
|
|
23
|
+
| .context/DOCS-MAP.md | Maps your project components to their documentation |
|
|
24
|
+
|
|
25
|
+
## Your project's docs/
|
|
26
|
+
|
|
27
|
+
The `docs/` folder is reserved for **your project's documentation** — API references, architecture guides, setup instructions, etc. It is not created at setup time. Instead, the agent proposes new docs/ files as your project grows, based on scaffolding rules in `.context/DOCS-MAP.md`.
|
|
28
|
+
|
|
29
|
+
## Full documentation
|
|
30
|
+
|
|
31
|
+
For the complete methodology guide, templates reference, and architecture docs:
|
|
32
|
+
|
|
33
|
+
**https://github.com/anthropics/agent-method**
|
|
34
|
+
|
|
35
|
+
Key pages:
|
|
36
|
+
- [Quick Start](https://github.com/anthropics/agent-method/blob/main/docs/guides/quick-start.md)
|
|
37
|
+
- [For Developers](https://github.com/anthropics/agent-method/blob/main/docs/guides/for-developers.md)
|
|
38
|
+
- [File Roles](https://github.com/anthropics/agent-method/blob/main/docs/architecture/file-roles.md)
|
|
39
|
+
- [CLI Tools](https://github.com/anthropics/agent-method/blob/main/docs/guides/for-developers/cli-tools.md)
|
|
@@ -0,0 +1,25 @@
|
|
|
1
|
+
# Feature Registry — Index
|
|
2
|
+
# Split into registry/features/. Tools reassemble on load.
|
|
3
|
+
# CLI: wwa route, wwa check, wwa scan, wwa init
|
|
4
|
+
#
|
|
5
|
+
# Four layers:
|
|
6
|
+
# 1. Feature catalog — WHAT each capability is
|
|
7
|
+
# 2. Guided workflows — HOW features compose into task patterns
|
|
8
|
+
# 3. Agent protocol — WHY the agent does what it does
|
|
9
|
+
# 4. Routing rules — HOW queries map to features automatically
|
|
10
|
+
|
|
11
|
+
version: v1.6
|
|
12
|
+
|
|
13
|
+
layers:
|
|
14
|
+
- id: catalog
|
|
15
|
+
file: features/catalog.yaml
|
|
16
|
+
description: "Domains + features — WHAT each capability is"
|
|
17
|
+
- id: workflows
|
|
18
|
+
file: features/workflows.yaml
|
|
19
|
+
description: "Guided workflows — HOW features compose into task patterns"
|
|
20
|
+
- id: protocol
|
|
21
|
+
file: features/protocol.yaml
|
|
22
|
+
description: "Agent behavioral protocol — WHY the agent does what it does"
|
|
23
|
+
- id: routing
|
|
24
|
+
file: features/routing.yaml
|
|
25
|
+
description: "Routing rules — HOW queries map to features automatically"
|