npm - agentweaver - Versions diffs - 0.1.17 → 0.1.18 - Mend

agentweaver 0.1.17 → 0.1.18

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (47) hide show

package/README.md +104 -23
package/dist/artifacts.js +41 -0
package/dist/index.js +252 -27
package/dist/interactive/controller.js +249 -13
package/dist/interactive/ink/index.js +2 -2
package/dist/interactive/state.js +1 -0
package/dist/interactive/web/index.js +179 -0
package/dist/interactive/web/protocol.js +154 -0
package/dist/interactive/web/server.js +575 -0
package/dist/interactive/web/static/app.js +709 -0
package/dist/interactive/web/static/index.html +77 -0
package/dist/interactive/web/static/styles.css +2 -0
package/dist/interactive/web/static/styles.input.css +469 -0
package/dist/pipeline/flow-catalog.js +4 -0
package/dist/pipeline/flow-specs/auto-common-guided.json +313 -0
package/dist/pipeline/flow-specs/auto-common.json +3 -1
package/dist/pipeline/flow-specs/design-review/design-review-loop.json +2 -0
package/dist/pipeline/flow-specs/design-review.json +2 -0
package/dist/pipeline/flow-specs/implement.json +3 -1
package/dist/pipeline/flow-specs/plan.json +4 -0
package/dist/pipeline/flow-specs/playbook-init.json +199 -0
package/dist/pipeline/flow-specs/review/review-fix.json +3 -1
package/dist/pipeline/flow-specs/review/review-loop.json +4 -0
package/dist/pipeline/flow-specs/review/review.json +2 -0
package/dist/pipeline/node-registry.js +45 -0
package/dist/pipeline/nodes/flow-run-node.js +13 -1
package/dist/pipeline/nodes/playbook-ensure-node.js +115 -0
package/dist/pipeline/nodes/playbook-inventory-node.js +51 -0
package/dist/pipeline/nodes/playbook-questions-form-node.js +166 -0
package/dist/pipeline/nodes/playbook-write-node.js +243 -0
package/dist/pipeline/nodes/project-guidance-node.js +69 -0
package/dist/pipeline/prompt-registry.js +4 -1
package/dist/pipeline/prompt-runtime.js +6 -2
package/dist/pipeline/spec-types.js +19 -0
package/dist/pipeline/value-resolver.js +39 -1
package/dist/playbook/practice-candidates.js +12 -0
package/dist/playbook/repo-inventory.js +208 -0
package/dist/prompts.js +31 -0
package/dist/runtime/playbook.js +485 -0
package/dist/runtime/project-guidance.js +339 -0
package/dist/structured-artifact-schema-registry.js +8 -0
package/dist/structured-artifact-schemas.json +235 -0
package/dist/structured-artifacts.js +7 -1
package/docs/declarative-workflows.md +565 -0
package/docs/features.md +77 -0
package/docs/playbook.md +327 -0
package/package.json +8 -3

package/README.md CHANGED Viewed

@@ -1,34 +1,44 @@
 # AgentWeaver
-`AgentWeaver` is a TypeScript/Node.js CLI for harness engineering around coding agents.
+`AgentWeaver` is a TypeScript/Node.js CLI for engineering durable workflows around coding agents.
-It is built around declarative workflow specs. A flow describes phases and steps in JSON, runtime nodes implement behavior in TypeScript, and artifacts on disk make runs resumable, inspectable, and operationally manageable from the TUI.
+It is built for teams that want agent work to behave less like one-off prompting and more like an inspectable engineering system: explicit workflows, durable artifacts, repeatable review gates, resumable execution, and repository-local guidance that evolves with the codebase.
 Typical usage looks like:
 `plan -> implement -> run-go-linter-loop -> run-go-tests-loop -> review -> review-fix`
-The important part is not that exact chain. The point is that AgentWeaver lets you design, operate, and evolve durable agent harnesses instead of accumulating one-off prompts and shell glue.
+Planning-heavy work can use:
-For planning-heavy work, a typical path can now include `plan -> design-review -> implement`, where `design-review` critiques planning artifacts before coding starts.
+`plan -> design-review -> implement -> review-loop`
-## What It Does
+The important part is not the exact chain. The point is that AgentWeaver lets you model, operate, and evolve the harness around the agent.
-- Fetches Jira issue context by issue key or browse URL
-- Fetches GitLab merge request diff and review data into reusable artifacts
-- Runs Codex-, OpenCode-, and process-backed stages through a common pipeline runtime
-- Persists artifacts and compact flow execution state under the current project scope
-- Supports both operator-driven work in a TUI and end-to-end automation flows
-- Resumes interrupted declarative flows when required artifacts and launch profile still match
+## Key Features
-## Harness Engineering Focus
+See [docs/features.md](docs/features.md) for the expanded feature overview.
+- **Declarative agent workflows**: flows are JSON specs with phases, steps, prompt bindings, params, expectations, and post-step actions. Workflow design stays declarative while runtime behavior lives in typed nodes and executors.
+- **Repository-local project playbook**: stable project conventions live under `.agentweaver/playbook/` as versioned rules, examples, and templates. Guided flows select relevant guidance before planning, implementation, review, and repair so repeated agent runs inherit the same project knowledge.
+- **Artifact-first execution**: each stage produces structured JSON and human-readable markdown artifacts on disk. Artifacts are the contract between stages, which makes runs inspectable, reviewable, and restartable.
+- **Planning and design-review gates**: planning flows produce design, implementation plan, and QA plan artifacts. `design-review` critiques those artifacts before coding starts, and `auto-common` can iterate through `plan-revise` before implementation.
+- **Review and repair loops**: review flows produce structured findings with severities. Repair flows can select blockers and critical findings, apply targeted fixes, and run follow-up checks.
+- **Resumable automation**: long-running flows persist compact execution state, support resume/continue/restart semantics, and can restart from selected phases when the artifacts and launch profile are compatible.
+- **Multiple execution backends**: Codex, OpenCode, shell/process checks, Jira, GitLab, Git commit, and Telegram notification integrations run through a common executor model.
+- **Interactive TUI and direct CLI**: the same workflow model works in an operator-driven terminal UI, direct CLI commands, and non-interactive automation.
+- **Custom flows**: built-in flows can be extended with global or project-local flow specs without changing AgentWeaver source code.
+- **Plugin SDK**: local plugins can add public-SDK-compatible nodes and executors, with manifest validation, version checks, and documented entrypoint rules.
+- **Operational diagnostics**: `doctor` checks system readiness, executor configuration, flow specs, node versions, and runtime environment shape before workflows fail mid-run.
+## Why Harness Engineering
 AgentWeaver is not positioned as a thin wrapper around one agent call. It is meant for harness engineering:
-- workflows are modeled explicitly as phases, steps, prompts, params, expectations, and artifacts
-- execution logic is isolated into reusable nodes and executors instead of being embedded in ad-hoc scripts
-- artifacts on disk are the contract between stages, which makes runs reviewable and restartable
-- the same workflow model can be used in direct CLI mode, interactive TUI mode, and resumable automation flows
+- The workflow is explicit instead of hidden in a long prompt.
+- The intermediate decisions are persisted instead of disappearing in chat history.
+- The agent receives project guidance from the repository instead of relying on memory or copy-pasted instructions.
+- Review, repair, checks, and restart behavior are first-class parts of the workflow.
+- The same model works in local CLI use, interactive operation, and automation.
 In practice, this means you can treat an agent workflow like an engineered system: versioned, inspectable, repeatable, and debuggable.
@@ -40,14 +50,15 @@ In practice, this means you can treat an agent workflow like an engineered syste
 - `scope`: isolated workspace key for artifacts and flow state; usually based on Jira task, otherwise derived from git context
 - `artifact`: file produced or consumed by flows, used as the stable contract between stages
 - `flow state`: compact persisted execution metadata used for resume/restart in long-running flows such as `auto-golang`
+- `project playbook`: local `.agentweaver/playbook/` directory with `manifest.yaml`, practices, examples, and templates; the format is described in [docs/playbook.md](docs/playbook.md)
-## Семантика Запуска
+## Launch Semantics
-- `resume` возобновляет только реально прерванный запуск и использует сохранённое состояние исполнения без пересборки уже выполненных шагов
-- `continue` предназначен для завершённых итерационных циклов и запускает следующую итерацию от последних валидных артефактов без удаления исторических артефактов
-- `restart` считается новым запуском: текущая активная попытка архивируется в `.agentweaver/scopes/<scope>/.artifacts/restart-archives/attempt-XXXX`, после чего создаётся новая активная попытка
-- Для неоднозначных запусков оператор должен явно выбрать действие: в интерактивном режиме через подтверждение, в неинтерактивном режиме через `--resume`, `--continue` или `--restart`
-- Контракт распространяется на `auto-common`, `auto-simple`, `auto-golang`, `instant-task`, `review-loop`, `run-go-linter-loop` и `run-go-tests-loop`
+- `resume` only resumes a genuinely interrupted run and uses the saved execution state without rebuilding already completed steps
+- `continue` is intended for completed iterative cycles and starts the next iteration from the latest valid artifacts without deleting historical artifacts
+- `restart` is treated as a new run: the current active attempt is archived under `.agentweaver/scopes/<scope>/.artifacts/restart-archives/attempt-XXXX`, then a new active attempt is created
+- For ambiguous launches, the operator must choose the action explicitly: by confirmation in interactive mode, or with `--resume`, `--continue`, or `--restart` in non-interactive mode
+- This contract applies to `auto-common`, `auto-simple`, `auto-golang`, `instant-task`, `review-loop`, `run-go-linter-loop`, and `run-go-tests-loop`
 ## Declarative Workflow Model
@@ -62,6 +73,8 @@ The center of the system is the declarative flow spec:
 This keeps workflow design in JSON while keeping implementation details in typed runtime code.
+The full flow-spec reference now lives in [docs/declarative-workflows.md](docs/declarative-workflows.md).
 ## Repository Layout
 - `src/index.ts` — CLI entrypoint, interactive mode bootstrap, and top-level orchestration
@@ -109,6 +122,30 @@ There are also built-in nested/helper flows that are loaded declaratively but ar
 - `opencode` CLI if you use OpenCode-backed stages
 - access to Jira and/or GitLab when the selected flow needs them
+## Web UI
+The `agentweaver web [--no-open] [--host <host>|--listen-all] [<jira-browse-url|jira-issue-key>]` command starts interactive mode through the Web UI. By default, the server binds to `127.0.0.1`, asks the operating system for a random port, and prints the final address as `AgentWeaver Web UI: http://127.0.0.1:<port>/`.
+To open the Web UI from another machine on a trusted network, configure Web UI credentials first:
+```bash
+export AGENTWEAVER_WEB_USERNAME=operator
+export AGENTWEAVER_WEB_PASSWORD='choose-a-strong-password'
+agentweaver web --listen-all --no-open
+```
+External binding requires both `AGENTWEAVER_WEB_USERNAME` and `AGENTWEAVER_WEB_PASSWORD`. This applies to `agentweaver web --listen-all`, `agentweaver web --host 0.0.0.0`, `agentweaver web --host ::`, explicit non-loopback IP addresses such as `192.168.1.10` or `2001:db8::1`, and any hostname other than `localhost`. In this mode, the server listens on the requested interface; connect to the IP address or hostname of the machine running AgentWeaver and the assigned port.
+Loopback bindings, including `127.0.0.1`, `::1`, and `localhost`, do not require authentication by default. If Web UI credentials are configured, the same Basic auth check also protects localhost Web UI requests.
+Web UI authentication uses HTTP Basic auth. Over plain HTTP, use it only on trusted networks because credentials are not encrypted in transit. For untrusted networks, put AgentWeaver behind TLS termination or an equivalent reverse proxy.
+By default, AgentWeaver tries to open the browser after the server starts successfully and the URL is printed. For CI, tests, and manual smoke checks, use `agentweaver web --no-open` or the `AGENTWEAVER_WEB_NO_OPEN=1` environment variable; the `--no-open` flag is supported only after the `web` command.
+The Web UI serves the operator console from the same local process, including `/`, `/static/app.js`, and `/static/styles.css`. Live browser interaction uses WebSocket on `/__agentweaver/ws`. Bounded checks can use `GET /__agentweaver/health`, and shutdown is available through `POST /__agentweaver/exit` or `SIGINT`/`SIGTERM`.
+Web UI state is process-local: it exists only while the AgentWeaver process is running and is not shared with other AgentWeaver processes. The Web UI is intended to match the interactive operator workflow for flow selection, launch confirmation, routing and user-input forms, progress and logs, and interrupt handling.
 ## Installation
 Local development:
@@ -295,7 +332,7 @@ Notes:
 - `--verbose` streams child process stdout/stderr in direct CLI mode
 - `--prompt <text>` appends extra instructions to the prompt
 - `--scope <name>` is supported by scope-flexible flows such as `implement`, `review`, `review-fix`, `review-loop`, `run-go-tests-loop`, `run-go-linter-loop`, `gitlab-review`, and `gitlab-diff-review`
-- `--md-lang <en|ru>` currently applies to `plan`
+- `--md-lang <en|ru>` applies only to generated workflow markdown artifacts, not repository source files or committed documentation
 - `--force` only affects interactive mode: it skips loading cached summary-pane content on startup so Jira-backed flows that regenerate summary artifacts can repopulate it during the run
 - Jira-backed flows ask for Jira input interactively when it is omitted
 - `task-describe` can also work from manual task description input without Jira
@@ -336,6 +373,7 @@ Artifacts and flow state are stored under the current project scope. In practice
 - Jira-backed runs usually use the Jira issue key as scope
 - non-Jira runs can fall back to a git-derived scope
 - `--scope <name>` lets you override the default for supported commands
+- interactive and web sessions automatically switch the branch-derived scope after the git branch changes, unless the session was started with an explicit Jira argument or `--scope`
 The runtime uses artifacts as the contract between stages, including markdown outputs and structured JSON files validated against schemas.
@@ -427,7 +465,50 @@ Recommended smoke checks:
 node dist/index.js --help
 node dist/index.js auto-golang --help-phases
 node dist/index.js auto-common --help-phases
+node dist/index.js auto-common-guided --help-phases
 node dist/index.js plan --dry DEMO-1234
 node dist/index.js implement --dry DEMO-1234
 node dist/index.js review --dry DEMO-1234
 ```
+## Guided Project Guidance
+The project playbook is AgentWeaver's way to turn project-specific conventions into durable agent context. Instead of repeating the same instructions in every prompt, a repository can keep stable rules, examples, and templates under `.agentweaver/playbook/`. Guided flows validate that material, select the parts relevant to the current task and phase, and pass compact guidance into the model before planning, implementation, review, and repair.
+Typical playbook content includes:
+- engineering rules such as required test locations, documentation language, or runtime validation boundaries
+- examples that should be opened only when relevant, instead of pasted into every prompt
+- templates for recurring artifact shapes or implementation notes
+- repository context that should remain visible across tasks without overriding task-specific inputs
+The guided flow is `auto-common-guided`. It first runs the same Jira fetch and task normalization steps as `auto-common`, then validates `.agentweaver/playbook/manifest.yaml` and generates compact project guidance before the `plan`, `design-review`, `implement`, `review`, and `repair/review-fix` phases. JSON artifacts remain in English and machine-readable; workflow markdown artifacts are generated in the workflow-selected language. The markdown language setting does not apply to repository source files, committed documentation, or playbook rules.
+The guidance is intentionally phase-aware. A rule can apply only to `plan`, `implement`, `review`, or another supported phase; it can also target languages, frameworks, glob patterns, and keywords. AgentWeaver writes both a structured `project-guidance/v1` JSON artifact and a derivative markdown file, then passes their paths into the phase prompt as supplemental project-local context.
+Initialize or refresh the playbook with:
+```bash
+agentweaver playbook-init
+agentweaver playbook-init --accept-playbook-draft
+```
+Use the guided flow with:
+```bash
+agentweaver auto-common-guided --help-phases
+agentweaver auto-common-guided --accept-playbook-draft DEMO-1234
+```
+The workflow does not read old `playbook.json` or `playbook.md` files as fallbacks. In non-interactive runs, a missing manifest stops the workflow before planning and reports the required action: run `agentweaver playbook-init --accept-playbook-draft` first, or rerun `agentweaver auto-common-guided --accept-playbook-draft <jira>`. The `--accept-playbook-draft` flag explicitly accepts the generated playbook without interactive review and allows AgentWeaver to write the manifest-based layout. An invalid manifest stops the guided phase before the LLM prompt.
+To inspect whether playbook guidance participated in a run, check the generated artifacts:
+```bash
+find .agentweaver/scopes -name 'project-guidance-*'
+rg -n "Project Guidance|practice\\." .agentweaver/scopes
+```
+Keep `.agentweaver/playbook/` in Git even when other AgentWeaver runtime state is ignored. The playbook format and maintenance workflow are documented in [docs/playbook.md](docs/playbook.md).
+Current limitations: skills integration is not available yet; the playbook generator must rely on repository evidence and clarification answers; guided prompts receive compact context and open full examples only when they are directly relevant to the current phase.

package/dist/artifacts.js CHANGED Viewed

@@ -163,6 +163,20 @@ export function taskContextFile(taskKey, iteration) {
 export function taskContextJsonFile(taskKey, iteration) { // Resolves the versioned JSON artifact for the "task-context" stem.
     return versionedJsonArtifactFile(taskKey, "task-context", iteration); // Helper is defined outside this view; presumably returns a file path — TODO confirm.
 }
+export function projectGuidanceArtifactStem(phase) { // Builds the artifact stem string for a project-guidance phase.
+    switch (phase) {
+        case "repair/review-fix": // Special-cased: the returned stem uses "-" where the phase name has "/".
+            return "project-guidance-repair-review-fix";
+        default: // NOTE(review): every other phase is interpolated verbatim, so a "/" in it would reach the stem unchanged.
+            return `project-guidance-${phase}`;
+    }
+}
+export function projectGuidanceFile(taskKey, phase, iteration) { // Markdown project-guidance artifact for the given task, phase, and iteration.
+    return versionedMarkdownArtifactFile(taskKey, projectGuidanceArtifactStem(phase), iteration); // Stem is derived from the phase via projectGuidanceArtifactStem.
+}
+export function projectGuidanceJsonFile(taskKey, phase, iteration) { // JSON project-guidance artifact; uses the same stem as projectGuidanceFile.
+    return versionedJsonArtifactFile(taskKey, projectGuidanceArtifactStem(phase), iteration); // Only the helper differs from the markdown variant.
+}
 export function taskDescribeInputJsonFile(taskKey) { // Task-describe input JSON; the file name embeds taskKey and carries no iteration.
     return taskArtifactsFile(taskKey, `task-describe-input-${taskKey}.json`);
 }
@@ -175,6 +189,33 @@ export function gitStatusJsonFile(taskKey) {
 export function gitDiffFile(taskKey) { // Git diff text file; resolved through taskWorkspaceFile rather than taskArtifactsFile.
     return taskWorkspaceFile(taskKey, `git-diff-${taskKey}.txt`);
 }
+export function repoInventoryFile(taskKey) { // Markdown repo inventory; resolved through taskWorkspaceFile.
+    return taskWorkspaceFile(taskKey, `repo-inventory-${taskKey}.md`);
+}
+export function repoInventoryJsonFile(taskKey) { // JSON repo inventory; resolved through taskArtifactsFile, unlike the markdown variant.
+    return taskArtifactsFile(taskKey, `repo-inventory-${taskKey}.json`);
+}
+export function practiceCandidatesFile(taskKey) { // Markdown practice-candidates file; resolved through taskWorkspaceFile.
+    return taskWorkspaceFile(taskKey, `practice-candidates-${taskKey}.md`);
+}
+export function practiceCandidatesJsonFile(taskKey) { // JSON practice-candidates file; resolved through taskArtifactsFile.
+    return taskArtifactsFile(taskKey, `practice-candidates-${taskKey}.json`);
+}
+export function playbookQuestionsJsonFile(taskKey) { // Playbook questions JSON; the file name embeds taskKey.
+    return taskArtifactsFile(taskKey, `playbook-questions-${taskKey}.json`);
+}
+export function playbookAnswersJsonFile(taskKey) { // Playbook answers JSON; the file name embeds taskKey.
+    return taskArtifactsFile(taskKey, `playbook-answers-${taskKey}.json`);
+}
+export function playbookDraftFile(taskKey) { // Markdown playbook draft; resolved through taskWorkspaceFile.
+    return taskWorkspaceFile(taskKey, `playbook-draft-${taskKey}.md`);
+}
+export function playbookDraftJsonFile(taskKey) { // JSON playbook draft; resolved through taskArtifactsFile.
+    return taskArtifactsFile(taskKey, `playbook-draft-${taskKey}.json`);
+}
+export function playbookWriteResultJsonFile(taskKey) { // Playbook write-result JSON; the file name embeds taskKey.
+    return taskArtifactsFile(taskKey, `playbook-write-result-${taskKey}.json`);
+}
 export function gitCommitMessageJsonFile(taskKey) { // Git commit message JSON; the file name embeds taskKey.
     return taskArtifactsFile(taskKey, `git-commit-message-${taskKey}.json`);
 }