agestra 4.14.5 → 4.15.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (52) hide show
  1. package/.claude-plugin/marketplace.json +1 -1
  2. package/.claude-plugin/plugin.json +1 -13
  3. package/.gemini/commands/agestra/research.toml +5 -6
  4. package/.gemini/commands/agestra/review.toml +2 -2
  5. package/AGENTS.md +22 -11
  6. package/GEMINI.md +13 -9
  7. package/README.ja.md +10 -13
  8. package/README.ko.md +10 -13
  9. package/README.md +10 -13
  10. package/README.zh.md +10 -13
  11. package/agents/agestra-debate.md +33 -28
  12. package/agents/agestra-research.md +24 -11
  13. package/agents/agestra-team-lead.md +137 -134
  14. package/commands/research.md +115 -154
  15. package/commands/review.md +27 -22
  16. package/commands/setup.md +33 -17
  17. package/dist/bundle.js +207 -435
  18. package/hooks/user-prompt-submit.js +9 -20
  19. package/package.json +5 -2
  20. package/scripts/host-assets/categories.mjs +6 -16
  21. package/scripts/host-assets/codex-assets.mjs +183 -6
  22. package/scripts/host-assets/gemini-assets.mjs +110 -7
  23. package/scripts/host-assets/manifest.mjs +10 -0
  24. package/skills/cancel.md +7 -18
  25. package/skills/design.md +16 -13
  26. package/skills/idea.md +19 -16
  27. package/skills/leader.md +84 -76
  28. package/skills/plan.md +119 -0
  29. package/skills/provider-guide.md +122 -103
  30. package/skills/qa.md +85 -48
  31. package/skills/references/lenses/README.md +9 -7
  32. package/skills/references/lenses/e2e.md +16 -15
  33. package/skills/references/lenses/research-domains/planning.md +31 -0
  34. package/skills/references/lenses/research.md +2 -2
  35. package/skills/research.md +96 -172
  36. package/skills/review.md +29 -24
  37. package/skills/security.md +13 -9
  38. package/skills/setup.md +31 -17
  39. package/.gemini/commands/agestra/design.toml +0 -16
  40. package/.gemini/commands/agestra/idea.toml +0 -16
  41. package/.gemini/commands/agestra/implement.toml +0 -16
  42. package/.gemini/commands/agestra/qa.toml +0 -16
  43. package/.gemini/commands/agestra/security.toml +0 -16
  44. package/agents/agestra-implementer.md +0 -126
  45. package/commands/design.md +0 -153
  46. package/commands/idea.md +0 -146
  47. package/commands/implement.md +0 -151
  48. package/commands/qa.md +0 -143
  49. package/commands/security.md +0 -119
  50. package/skills/e2e.md +0 -72
  51. package/skills/references/lenses/research-domains/implement.md +0 -33
  52. package/skills/worker-manage.md +0 -79
@@ -12,7 +12,7 @@
12
12
  "name": "agestra",
13
13
  "source": "./",
14
14
  "description": "Multi-host MCP orchestration across Claude, Ollama, Gemini, and Codex for review, QA, and cross-validation",
15
- "version": "4.14.5",
15
+ "version": "4.15.1",
16
16
  "author": {
17
17
  "name": "mua-vtuber"
18
18
  },
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "agestra",
3
- "version": "4.14.5",
3
+ "version": "4.15.1",
4
4
  "description": "Claude Code plugin — multi-host MCP orchestration across Claude, Ollama, Gemini, and Codex for review, QA, and cross-validation",
5
5
  "mcpServers": {
6
6
  "agestra": {
@@ -9,17 +9,5 @@
9
9
  "${CLAUDE_PLUGIN_ROOT}/dist/bundle.js"
10
10
  ]
11
11
  }
12
- },
13
- "hooks": {
14
- "UserPromptSubmit": [
15
- {
16
- "hooks": [
17
- {
18
- "type": "command",
19
- "command": "node ${CLAUDE_PLUGIN_ROOT}/hooks/user-prompt-submit.js"
20
- }
21
- ]
22
- }
23
- ]
24
12
  }
25
13
  }
@@ -1,16 +1,15 @@
1
1
  # Generated by Agestra. Managed file.
2
- description = "Run research using a selected investigation topology"
2
+ description = "Run host-owned Agestra research with an idea, QA, or security viewpoint"
3
3
  prompt = """
4
4
  You are executing the `/agestra research` Gemini command.
5
5
 
6
- - Start with `setup_status`, then `environment_check` and `provider_list`.
7
- - For investigation-including workflows that continue into domain consensus, route through `agent_research_consensus_start`.
8
- - Host research consensus contract:
6
+ - Start with `setup_status`; provider availability is not a gate for research.
7
+ - Ask for the research viewpoint when missing: Idea exploration, QA evidence set, or Security evidence set.
8
+ - Use host-owned `agestra-research` assignments. Do not ask for a research topology or provider investigation mode.
9
+ - Host research contract uses workflow profiles, `aggregation`, `questionSet`, and `evidencePolicy`:
9
10
  호스트가 조사한다.
10
11
  호스트가 정리한다.
11
- 시스템이 토론한다.
12
12
  호스트가 문서화한다.
13
- - External AI research and debate run in separate fresh sessions, even when the same provider participates in both phases.
14
13
 
15
14
  @{commands/research.md}
16
15
  """
@@ -4,8 +4,8 @@ prompt = """
4
4
  You are executing the `/agestra review` Gemini command.
5
5
 
6
6
  - Start with `setup_status`, then `environment_check` and `provider_list`.
7
- - For investigation-including workflows, route through `agent_research_consensus_start`.
8
- - Host research consensus contract:
7
+ - For investigation-including workflows, route through `agent_research_start`, then start debate separately with `agent_consensus_start`.
8
+ - Host research/debate contract uses workflow profiles, `aggregation`, `questionSet`, and `evidencePolicy`:
9
9
  호스트가 조사한다.
10
10
  호스트가 정리한다.
11
11
  시스템이 토론한다.
package/AGENTS.md CHANGED
@@ -16,38 +16,49 @@ Use `host_assets_status` to inspect generated Codex host assets, and only call `
16
16
  ## How to Work Here
17
17
 
18
18
  - Default to direct Codex work using the workspace `AGENTS.md` contract, oh-my-codex workflows, and Superpowers-style skills when they apply.
19
- - Use Agestra primarily for explicit multi-AI or provider orchestration requests, such as when the user names Agestra, Codex/Gemini/Ollama providers, "multi-AI", "multiple AI", "provider", `agent_debate_*`, `cli_worker_*`, or asks to gather/compare several AI opinions.
19
+ - Use Agestra primarily for explicit multi-AI or provider-backed review, QA, security, design, idea, and evidence/consensus work, such as when the user names Agestra, Codex/Gemini/Ollama providers, "multi-AI", "multiple AI", "provider", or asks to gather/compare several AI opinions.
20
20
  - Plain review/QA/check requests without `/agestra` or explicit multi-AI/provider wording stay with the current host; they are not Agestra natural-language auto-triggers.
21
21
  - Agestra natural-language routing requires explicit multi-AI/provider wording such as "multiple AIs", "all AIs", "other AI", "multi-AI", "Codex and Gemini", "provider comparison", or "프로바이더 비교". Explicit `/agestra ...` commands remain supported.
22
22
  - Native helper agents are created by the active host layer. In Codex, use the generated custom agents installed from these assets; external MCP/CLI/chat providers participate through Agestra tools and never create or manage Codex native agents.
23
23
  - Keep Agestra setup/status/provider checks as installation and health checks, not as workflow-routing triggers.
24
24
  - Run `setup_status`, `environment_check`, and `provider_list` when the task concerns Agestra installation, MCP registration, host assets, provider availability, or before entering an Agestra workflow. If `setup_status` reports `Setup required: yes`, complete interactive setup first and then resume the original task.
25
25
  - Do not treat ordinary review, QA, security, design, idea, implementation, cleanup, build-fix, or planning requests as Agestra workflows just because setup/status/provider checks exist.
26
+ - Agestra does not implement product code or author persistent E2E test files. Code and test authoring should happen in the current host first, then Agestra can review, QA, security-check, design-check, or discuss the result.
26
27
  - When an Agestra workflow is active, treat `commands/*.md` as the source of truth for that workflow.
27
28
  - Prefer Agestra MCP tools over ad-hoc multi-provider prompting only when the task is actually in Agestra/multi-provider mode.
28
29
  - If any legacy workflow text mentions old single-host Agestra execution, treat it as obsolete. Direct current-host work should happen outside Agestra workflows.
29
30
 
30
31
  ## Workflow Mapping
31
32
 
33
+ - Public slash commands are limited to setup, research, and review.
34
+ - Setup and research requests follow `commands/setup.md` and `commands/research.md`.
32
35
  - When Agestra is active, review requests follow `commands/review.md`
33
- - When Agestra is active, QA / verification requests follow `commands/qa.md`
34
- - When Agestra is active, security audit requests follow `commands/security.md`
36
+ - Internal QA, security, design, idea, and planning viewpoints remain available through workflow profiles and skill/lens resources; they are not shipped as public slash commands.
35
37
  - Review, QA, and security workflows write durable reports under `docs/reports/review/`, `docs/reports/qa/`, and `docs/reports/security/` unless the user asks for chat-only output.
36
- - Persistent E2E test creation/maintenance is internal: QA produces `E2E_TEST_WORK_REQUEST`, the leader asks the user, and approved work goes to `agestra-implementer` with `mode: e2e-test-authoring`.
37
- - When Agestra is active, design and architecture requests follow `commands/design.md`
38
- - When Agestra is active, idea discovery requests follow `commands/idea.md`
39
- - When Agestra is active, implementation requests follow `commands/implement.md`
40
38
 
41
39
  ## Core MCP Tools
42
40
 
43
41
  - `setup_status`, `environment_check`, and `provider_list`: inspect installation, host, and provider state for Agestra health checks and active Agestra workflows
44
- - `agent_consensus_start` (with `agent_debate_approve`/`_continue`/`_reject`) and `agent_debate_review`: run approval-gated consensus flows from prepared `initial_aggregation`
45
- - `cli_worker_spawn`, `agent_changes_review`, `agent_changes_accept`, `agent_changes_reject`: use for explicit autonomous Codex/Gemini worker tasks
42
+ - `agent_research_start`: research-only preprocessing with workflow profile, prompt pack, questionSet, evidencePolicy, research lenses, and investigator assignments; writes `research_submissions.json`, `research_transcript.json`, and `aggregation.json`; does not start debate
43
+ - `agent_consensus_start` (with `agent_debate_approve`/`_continue`/`_reject`): debate-only approval-gated consensus flows from prepared `aggregation`, supplied `questionSet`, and `evidencePolicy`; `workflow` is a report/artifact label only, not a debate routing branch
46
44
  - `host_assets_status`, `host_assets_install`, `host_assets_uninstall`: inspect and explicitly manage generated Codex host-native assets such as custom agents and skills
47
- - `qa_run`: run workspace build/test verification before reporting implementation completion
45
+ - `qa_run`: run workspace build/test verification for QA evidence
48
46
 
49
47
  ## Project Assets
50
48
 
51
- - `agents/`: canonical role prompts (`agestra-team-lead`, `agestra-research`, `agestra-debate`, `agestra-implementer`)
49
+ - `agents/`: canonical role prompts (`agestra-team-lead`, `agestra-research`, `agestra-debate`)
52
50
  - `skills/`: reusable workflow references
53
51
  - `GEMINI.md` and `.gemini/commands/`: Gemini-specific host assets; keep behavior aligned with them when updating shared workflows
52
+
53
+ ## graphify
54
+
55
+ This project has a knowledge graph at graphify-out/ with god nodes, community structure, and cross-file relationships.
56
+
57
+ When the user types `/graphify`, invoke the `skill` tool with `skill: "graphify"` before doing anything else.
58
+
59
+ Rules:
60
+ - For codebase questions, first run `graphify query "<question>"` when graphify-out/graph.json exists. Use `graphify path "<A>" "<B>"` for relationships and `graphify explain "<concept>"` for focused concepts. These return a scoped subgraph, usually much smaller than GRAPH_REPORT.md or raw grep output.
61
+ - Dirty graphify-out/ files are expected after hooks or incremental updates; dirty graph files are not a reason to skip graphify. Only skip graphify if the task is about stale or incorrect graph output, or the user explicitly says not to use it.
62
+ - If graphify-out/wiki/index.md exists, use it for broad navigation instead of raw source browsing.
63
+ - Read graphify-out/GRAPH_REPORT.md only for broad architecture review or when query/path/explain do not surface enough context.
64
+ - After modifying code, run `graphify update .` to keep the graph current (AST-only, no API cost).
package/GEMINI.md CHANGED
@@ -20,9 +20,11 @@ After setup, Gemini project commands are available:
20
20
  - `/agestra:security`
21
21
  - `/agestra:design`
22
22
  - `/agestra:idea`
23
- - `/agestra:implement`
24
23
 
25
24
  Each command delegates to the shared workflow specs in `commands/*.md`.
25
+ Agestra does not implement product code or author persistent E2E test files. Use
26
+ Gemini CLI or the current host for code/test changes first, then run Agestra
27
+ QA/review/security on the result.
26
28
 
27
29
  ## Usage Rules
28
30
 
@@ -31,9 +33,10 @@ Each command delegates to the shared workflow specs in `commands/*.md`.
31
33
  - Start orchestration requests with `setup_status`, then `environment_check` and `provider_list`.
32
34
  - Prefer Agestra MCP tools instead of rebuilding workflows in free-form prompts.
33
35
  - Treat `commands/*.md` and `agents/*.md` as the canonical workflow and role assets.
34
- - Keep native agent creation host-owned. Providers reached through MCP, CLI workers, or chat are participants only.
35
- - For investigation-including workflows, route through `agent_research_consensus_start`.
36
- - Use this host research consensus contract verbatim:
36
+ - Keep native agent creation host-owned. Providers reached through MCP or chat are participants only.
37
+ - For investigation-including workflows, route through `agent_research_start`,
38
+ then start debate separately with `agent_consensus_start`.
39
+ - Use this host research/debate phase contract verbatim:
37
40
  호스트가 조사한다.
38
41
  호스트가 정리한다.
39
42
  시스템이 토론한다.
@@ -43,11 +46,12 @@ Each command delegates to the shared workflow specs in `commands/*.md`.
43
46
 
44
47
  ## Core MCP Tools
45
48
 
46
- - `agent_research_consensus_start`: host-led research, consolidation, system debate, engine aggregation docs, and host-authored final decision docs for investigation-including workflows
47
- - `agent_consensus_start`, `agent_debate_approve`/`_continue`/`_reject`, `agent_debate_review`: direct consensus sessions from prepared `initial_aggregation` and approval-gated debate artifacts
48
- - `cli_worker_spawn`, `agent_changes_review`, `agent_changes_accept`, `agent_changes_reject`: autonomous worker lifecycle
49
+ - `agent_research_start`: research-only host-led preprocessing with workflow
50
+ profile, prompt pack, `questionSet`, `evidencePolicy`, research lenses, and
51
+ investigator assignments; writes `research_submissions.json`,
52
+ `research_transcript.json`, and `aggregation.json`; does not start debate
53
+ - `agent_consensus_start` (with `agent_debate_approve`/`_continue`/`_reject`): debate-only sessions from prepared `aggregation`, supplied `questionSet`, `evidencePolicy`, and approval-gated debate artifacts
49
54
  - `workspace_*`: document-backed review and aggregation flows
50
- - `qa_run`: workspace build/test verification before implementation completion
55
+ - `qa_run`: workspace build/test verification for QA evidence
51
56
 
52
57
  Review, QA, and security workflows write durable reports under `docs/reports/review/`, `docs/reports/qa/`, and `docs/reports/security/` unless the user asks for chat-only output.
53
- Persistent E2E test creation/maintenance is internal: QA produces `E2E_TEST_WORK_REQUEST`, the leader asks the user, and approved work goes to `agestra-implementer` with `mode: e2e-test-authoring`. There is no standalone Gemini `/agestra:e2e` command yet.
package/README.ja.md CHANGED
@@ -7,7 +7,7 @@ Claude Code、Codex CLI、Gemini CLI、ローカルモデルで使えるマル
7
7
 
8
8
  [English](README.md) | [한국어](README.ko.md) | [日本語](README.ja.md) | [中文](README.zh.md)
9
9
 
10
- Agestra は、1 つの作業に複数の AI を使って比較し、整理するためのツールです。コードレビュー、QA、セキュリティ確認、設計相談、アイデア探索、provider-backed 実装向けに作られています。
10
+ Agestra は、1 つの問題を複数の AI 視点で検討し、整理するためのツールです。コードレビュー、QA、セキュリティ確認、設計相談、アイデア探索、根拠にもとづく合意形成向けに作られています。
11
11
 
12
12
  ## クイックスタート
13
13
 
@@ -21,32 +21,29 @@ Agestra は、1 つの作業に複数の AI を使って比較し、整理する
21
21
 
22
22
  インストール後、プロジェクトを開いて Agestra ワークフローを呼び出します。
23
23
 
24
- - Claude Code: `/agestra review`, `/agestra qa`, `/agestra security`, `/agestra design`, `/agestra idea`, `/agestra implement`
25
- - Gemini CLI: `/agestra:review`, `/agestra:qa`, `/agestra:security`, `/agestra:design`, `/agestra:idea`, `/agestra:implement`
24
+ - Claude Code: `/agestra research ...` または `/agestra review ...`
25
+ - Gemini CLI: `/agestra:research ...` または `/agestra:review ...`
26
26
  - Codex CLI: `Use Agestra with Gemini and Codex to review this branch.` のように、Agestra や複数 AI を明示して依頼
27
27
 
28
28
  初回は使う provider を聞かれることがあります。provider が 1 つだけでもセットアップやホスト所有の作業はできますが、複数 AI 比較は 2 つ以上あるとより有効です。
29
29
 
30
30
  ## 何に使うか
31
31
 
32
- - `review`: コード品質、回帰リスク、UX、整理ポイントを複数 AI の視点で比較
33
- - `qa`: 設計書や計画を基準に実装を検証し、PASS/FAIL の根拠を集める
34
- - `security`: セキュリティ観点に絞って確認する
35
- - `design`: 実装前に構造やトレードオフを整理する
36
- - `idea`: 改善案、代替案、類似ツールを探る
37
- - `implement`: 複数 provider で実装を進め、最後の検証までつなぐ
32
+ - `research`: アイデア、QA、セキュリティの質問に必要な根拠を現在のホストだけで調査し整理します。この流れでは外部 provider は調査しません。
33
+ - `review`: 既存のコード、ドキュメント、diff、または準備済みのリサーチ結果をもとに討論し、意見を比較します。レビューは新しい調査を始めません。
34
+ - レビュー観点には、コード品質、回帰リスク、UX、整理、設計適合性、性能、信頼性、テスト、安全性のにおい、リリース準備状況を含められます。
38
35
 
39
36
  ## 実行すると何が起こるか
40
37
 
41
38
  1. Agestra が設定と利用可能な provider を確認します。
42
39
  2. 依頼を対象とスコープが明確なワークフローに整理します。
43
- 3. 調査が必要なら、ホストが先に証拠を集めて整理します。
44
- 4. 選ばれた provider は残っている論点だけをレビューまたは討論します。
40
+ 3. `research` では、現在のホストが根拠を調査し、整理し、文書化します。provider fan-out はありません。
41
+ 4. `review` では、選ばれた provider がスコープ内のコード、ドキュメント、diff、または準備済みのリサーチ結果について討論します。別途調査はしません。
45
42
  5. 結論、意見の違い、根拠を 1 つの結果として返します。
46
43
 
47
- 普通のレビューや QA の依頼が自動で Agestra になるわけではありません。`/agestra ...` を使うか、複数 AI や provider-backed 作業を明示したときに Agestra が動きます。
44
+ 普通のレビューや QA の依頼が自動で Agestra になるわけではありません。`/agestra ...` を使うか、複数 AI や provider-backed のリサーチ/レビュー作業を明示したときに Agestra が動きます。
48
45
 
49
- 実装と QA では、最後の確認は引き続きホストが担当します。ビルド、テスト、実行証拠、ブラウザフロー、最終的なファイル反映はホスト側で確認します。
46
+ コード変更は、まず現在のホストで直接行うのが基本です。Agestra はその後で結果をレビューし、計画との一致を確認し、複数 provider の意見と根拠を記録するところで最も力を発揮します。
50
47
 
51
48
  ## このリポジトリで使う
52
49
 
package/README.ko.md CHANGED
@@ -7,7 +7,7 @@ Claude Code, Codex CLI, Gemini CLI, 로컬 모델을 함께 쓰기 위한 멀티
7
7
 
8
8
  [English](README.md) | [한국어](README.ko.md) | [日本語](README.ja.md) | [中文](README.zh.md)
9
9
 
10
- Agestra는 하나의 작업에 여러 AI를 붙여서 비교하고 정리해 주는 도구입니다. 코드 리뷰, QA, 보안 점검, 설계 논의, 아이디어 탐색, provider-backed 구현에 맞춰 설계되어 있습니다.
10
+ Agestra는 하나의 문제를 여러 AI 시각으로 검토하고 정리해 주는 도구입니다. 코드 리뷰, QA, 보안 점검, 설계 논의, 아이디어 탐색, 근거 기반 합의에 맞춰 설계되어 있습니다.
11
11
 
12
12
  ## 빠른 시작
13
13
 
@@ -21,32 +21,29 @@ Agestra는 하나의 작업에 여러 AI를 붙여서 비교하고 정리해 주
21
21
 
22
22
  설치 후 프로젝트를 열고 Agestra 워크플로우를 요청하면 됩니다.
23
23
 
24
- - Claude Code: `/agestra review`, `/agestra qa`, `/agestra security`, `/agestra design`, `/agestra idea`, `/agestra implement`
25
- - Gemini CLI: `/agestra:review`, `/agestra:qa`, `/agestra:security`, `/agestra:design`, `/agestra:idea`, `/agestra:implement`
24
+ - Claude Code: `/agestra research ...` 또는 `/agestra review ...`
25
+ - Gemini CLI: `/agestra:research ...` 또는 `/agestra:review ...`
26
26
  - Codex CLI: `Agestra로 Gemini와 Codex를 같이 써서 이 브랜치 리뷰해줘`처럼 Agestra나 여러 AI를 명시해서 요청
27
27
 
28
28
  첫 실행에서는 사용할 provider를 물어볼 수 있습니다. provider가 하나만 있어도 설정과 호스트 소유 작업은 가능하지만, 멀티 AI 비교는 둘 이상일 때 가장 잘 살아납니다.
29
29
 
30
30
  ## 무엇에 쓰나
31
31
 
32
- - `review`: 코드 품질, 회귀 위험, UX, 정리 포인트를 여러 AI 의견으로 비교
33
- - `qa`: 설계 문서나 계획 기준으로 구현을 검증하고 PASS/FAIL 근거 수집
34
- - `security`: 보안 관점만 따로 집중해서 검토
35
- - `design`: 구현 전에 구조와 트레이드오프 논의
36
- - `idea`: 개선 아이디어, 대안, 유사 도구 탐색
37
- - `implement`: 여러 provider를 써서 구현을 진행하고 마지막 검증까지 이어감
32
+ - `research`: 아이디어, QA, 보안 질문에 필요한 근거를 현재 호스트가 단독으로 조사하고 정리합니다. 외부 provider는 이 흐름에서 조사하지 않습니다.
33
+ - `review`: 이미 있는 코드, 문서, diff, 또는 준비된 리서치 결과를 두고 토론하고 의견을 비교합니다. 리뷰는 새 조사를 시작하지 않습니다.
34
+ - 리뷰 관점은 코드 품질, 회귀 위험, UX, 정리, 설계 적합성, 성능, 안정성, 테스트, 기본 안전 냄새, 배포 준비도를 다룰 수 있습니다.
38
35
 
39
36
  ## 실행하면 어떻게 되나
40
37
 
41
38
  1. Agestra가 설정과 사용 가능한 provider를 확인합니다.
42
39
  2. 요청을 대상과 범위가 분명한 워크플로우로 정리합니다.
43
- 3. 조사가 필요하면 호스트가 먼저 근거를 모으고 정리합니다.
44
- 4. 선택된 provider들이 남은 쟁점만 검토하거나 토론합니다.
40
+ 3. `research`에서는 현재 호스트가 근거를 조사하고 정리하고 문서화합니다. provider fan-out은 없습니다.
41
+ 4. `review`에서는 선택된 provider들이 범위 안의 코드, 문서, diff, 또는 준비된 리서치 결과를 놓고 토론합니다. 별도 조사는 하지 않습니다.
45
42
  5. 결론, 이견, 근거를 하나의 결과로 돌려줍니다.
46
43
 
47
- 평범한 리뷰나 QA 요청이 자동으로 Agestra가 되는 것은 아닙니다. `/agestra ...`를 쓰거나, 여러 AI나 provider-backed 작업을 명시했을 때 Agestra 워크플로우가 시작됩니다.
44
+ 평범한 리뷰나 QA 요청이 자동으로 Agestra가 되는 것은 아닙니다. `/agestra ...`를 쓰거나, 여러 AI나 provider-backed 리서치/리뷰 작업을 명시했을 때 Agestra 워크플로우가 시작됩니다.
48
45
 
49
- 구현과 QA에서는 마지막 확인을 계속 호스트가 맡습니다. 빌드, 테스트, 실행 근거, 브라우저 흐름, 최종 파일 반영은 호스트가 확인합니다.
46
+ 코드 변경은 먼저 현재 호스트에서 직접 진행하는 편이 좋습니다. Agestra는 그다음에 결과를 리뷰하고, 계획과 맞는지 검증하고, 여러 provider 의견과 근거를 기록할 때 가장 강합니다.
50
47
 
51
48
  ## 이 저장소에서 쓰기
52
49
 
package/README.md CHANGED
@@ -7,7 +7,7 @@ Multi-host MCP orchestration for Claude Code, Codex CLI, Gemini CLI, and local m
7
7
 
8
8
  [English](README.md) | [한국어](README.ko.md) | [日本語](README.ja.md) | [中文](README.zh.md)
9
9
 
10
- Agestra helps you use more than one AI for the same task. It is built for review, QA, design discussion, idea exploration, and provider-backed implementation.
10
+ Agestra helps you use more than one AI to examine the same problem. It is built for review, QA, security checks, design discussion, idea exploration, and evidence-backed consensus.
11
11
 
12
12
  ## Quick Start
13
13
 
@@ -21,32 +21,29 @@ Install Agestra in the host you already use.
21
21
 
22
22
  Then open your project and ask for an Agestra workflow.
23
23
 
24
- - Claude Code: `/agestra review`, `/agestra qa`, `/agestra security`, `/agestra design`, `/agestra idea`, `/agestra implement`
25
- - Gemini CLI: `/agestra:review`, `/agestra:qa`, `/agestra:security`, `/agestra:design`, `/agestra:idea`, `/agestra:implement`
24
+ - Claude Code: `/agestra research ...` or `/agestra review ...`
25
+ - Gemini CLI: `/agestra:research ...` or `/agestra:review ...`
26
26
  - Codex CLI: ask explicitly for Agestra or multiple providers, for example `Use Agestra with Gemini and Codex to review this branch.`
27
27
 
28
28
  The first workflow may ask which providers you want to use. Agestra works best with two or more providers, but setup and host-owned flows still work with one.
29
29
 
30
30
  ## What To Use It For
31
31
 
32
- - `review`: compare multiple AI opinions about code quality, regressions, UX, and cleanup
33
- - `qa`: verify implementation against a design or plan and collect PASS/FAIL evidence
34
- - `security`: run a dedicated security-focused review
35
- - `design`: discuss architecture and tradeoffs before coding
36
- - `idea`: explore improvements, alternatives, and similar tools
37
- - `implement`: coordinate provider-backed implementation, then verify the result
32
+ - `research`: host-only evidence gathering for idea, QA, or security questions. External providers do not investigate in this flow.
33
+ - `review`: debate and compare opinions about existing code, docs, diffs, or prepared research. Review does not start a fresh investigation.
34
+ - Review lenses can cover code quality, regressions, UX, cleanup, design fit, performance, reliability, tests, safety smells, and production readiness.
38
35
 
39
36
  ## How It Runs
40
37
 
41
38
  1. Agestra checks setup and available providers.
42
39
  2. It turns your request into a clear workflow with a target and scope.
43
- 3. When research is needed, the host gathers and organizes the evidence first.
44
- 4. Selected providers review or debate only the unresolved points.
40
+ 3. In `research`, the current host gathers, organizes, and documents evidence. There is no provider fan-out.
41
+ 4. In `review`, selected providers discuss the code, documents, diffs, or prepared research already in scope. They do not perform separate research.
45
42
  5. Agestra returns one result with conclusions, disagreements, and evidence.
46
43
 
47
- Plain review or QA requests do not automatically become Agestra workflows. Agestra starts when you use `/agestra ...` or explicitly ask for multi-AI or provider-backed help.
44
+ Plain review or QA requests do not automatically become Agestra workflows. Agestra starts when you use `/agestra ...` or explicitly ask for multi-AI or provider-backed research/review work.
48
45
 
49
- For implementation and QA, the host still owns the final checks such as build, test, runtime evidence, browser flows, and accepted file changes.
46
+ For code changes, use your current host directly first. Agestra is strongest after that: reviewing the result, checking it against a plan, comparing provider opinions, and recording the evidence.
50
47
 
51
48
  ## Using This Repository
52
49
 
package/README.zh.md CHANGED
@@ -7,7 +7,7 @@
7
7
 
8
8
  [English](README.md) | [한국어](README.ko.md) | [日本語](README.ja.md) | [中文](README.zh.md)
9
9
 
10
- Agestra 用来把多个 AI 放到同一个任务里比较和整理。它适合代码审查、QA、安全检查、设计讨论、想法探索,以及 provider-backed 实现。
10
+ Agestra 用来让多个 AI 从不同角度审视同一个问题,并把结果整理成证据清晰的结论。它适合代码审查、QA、安全检查、设计讨论、想法探索和基于证据的共识。
11
11
 
12
12
  ## 快速开始
13
13
 
@@ -21,32 +21,29 @@ Agestra 用来把多个 AI 放到同一个任务里比较和整理。它适合
21
21
 
22
22
  安装后,打开项目并发起 Agestra 工作流。
23
23
 
24
- - Claude Code: `/agestra review`, `/agestra qa`, `/agestra security`, `/agestra design`, `/agestra idea`, `/agestra implement`
25
- - Gemini CLI: `/agestra:review`, `/agestra:qa`, `/agestra:security`, `/agestra:design`, `/agestra:idea`, `/agestra:implement`
24
+ - Claude Code: `/agestra research ...` 或 `/agestra review ...`
25
+ - Gemini CLI: `/agestra:research ...` 或 `/agestra:review ...`
26
26
  - Codex CLI: 像 `Use Agestra with Gemini and Codex to review this branch.` 这样明确提到 Agestra 或多个 AI
27
27
 
28
28
  第一次运行时,它可能会询问你要启用哪些 provider。只有一个 provider 也能完成设置和宿主自有流程,但 Multi-AI 比较在两个以上 provider 时效果最好。
29
29
 
30
30
  ## 用它做什么
31
31
 
32
- - `review`: 比较多个 AI 对代码质量、回归风险、UX 和整理点的看法
33
- - `qa`: 按设计文档或计划验证实现,并收集 PASS/FAIL 证据
34
- - `security`: 专门做安全视角的检查
35
- - `design`: 在写代码前讨论结构和取舍
36
- - `idea`: 探索改进方向、备选方案和相似工具
37
- - `implement`: 用多个 provider 推进实现,并把最后验证也串起来
32
+ - `research`: 由当前宿主单独收集并整理 idea、QA 或安全问题所需的证据。外部 provider 不参与这个调查流程。
33
+ - `review`: 围绕已有代码、文档、diff 或已准备好的 research 结果进行讨论并比较意见。review 不会启动新的调查。
34
+ - review 视角可以覆盖代码质量、回归风险、UX、整理点、设计契合度、性能、可靠性、测试、安全异味和上线准备度。
38
35
 
39
36
  ## 运行时会发生什么
40
37
 
41
38
  1. Agestra 检查设置和可用 provider。
42
39
  2. 它把请求整理成目标和范围明确的工作流。
43
- 3. 如果需要调查,宿主先收集并整理证据。
44
- 4. 被选中的 provider 只讨论或审查剩下的未解决问题。
40
+ 3. 在 `research` 中,当前宿主负责调查、整理并文档化证据。没有 provider fan-out。
41
+ 4. 在 `review` 中,被选中的 provider 讨论范围内的代码、文档、diff 或已准备好的 research 结果。它们不会另行调查。
45
42
  5. Agestra 返回一份包含结论、分歧和证据的结果。
46
43
 
47
- 普通的 review 或 QA 请求不会自动变成 Agestra 工作流。只有当你使用 `/agestra ...`,或者明确要求多 AI / provider-backed 帮助时,Agestra 才会启动。
44
+ 普通的 review 或 QA 请求不会自动变成 Agestra 工作流。只有当你使用 `/agestra ...`,或者明确要求多 AI / provider-backed 的 research/review 工作时,Agestra 才会启动。
48
45
 
49
- 在实现和 QA 里,最后的确认仍然由宿主负责。构建、测试、运行证据、浏览器流程,以及最终落盘的改动都由宿主确认。
46
+ 代码修改应优先由当前宿主直接完成。Agestra 最适合在修改之后审查结果、按计划验证、比较多个 provider 的意见,并记录证据。
50
47
 
51
48
  ## 在这个仓库里使用
52
49
 
@@ -2,9 +2,10 @@
2
2
  name: agestra-debate
3
3
  description: |
4
4
  Host-native debate participant for Agestra consensus rounds. Reads the assigned
5
- domain/lens context, answers a pending host turn, and returns the required
6
- consensus JSON. It is not the moderator, not the team lead, not a reviewer/QA/
7
- security specialist identity, and does not choose participants or run rounds.
5
+ workflow profile/lens context, answers a pending host turn according to the supplied
6
+ question set, and returns the required [ITEM] markup. It is not the
7
+ moderator, not the team lead, not a reviewer/QA/security specialist identity,
8
+ and does not choose participants or run rounds.
8
9
 
9
10
  Use this agent only when the team lead or consensus engine has an explicit
10
11
  host-native participant turn for `agestra-debate`.
@@ -17,10 +18,10 @@ tools: Read, Glob, Grep, Bash
17
18
  <Role>
18
19
  You are the host-native debate participant for Agestra. You receive one pending
19
20
  consensus turn, inspect only the supplied packet/files/lens references, and
20
- return the required JSON answer for that turn.
21
+ return the required [ITEM] answer for that turn.
21
22
 
22
23
  You are not the consensus engine, moderator, team lead, reviewer, QA judge,
23
- security auditor, or implementation worker.
24
+ security auditor, or code-change executor.
24
25
 
25
26
  Use only inside an active Agestra workflow. Plain review/QA/check requests
26
27
  without `/agestra` or explicit multi-AI/provider wording stay with the current
@@ -36,7 +37,8 @@ Required information:
36
37
  - round number to echo in `round`
37
38
  - assigned item ids
38
39
  - allowed files or evidence references
39
- - assigned domain/lens context, if any
40
+ - assigned workflow profile and lens context, if any
41
+ - supplied `questionSet` with required question IDs, verdict fields, and allowed verdicts
40
42
  - output contract
41
43
 
42
44
  If the request is only a generic review, QA, or debate request and does not
@@ -50,37 +52,40 @@ When a lens reference is provided, read only the needed file under
50
52
  `skills/references/lenses/`.
51
53
 
52
54
  Do not load every lens by default. The lens narrows the question; it does not
53
- override the pending turn packet or JSON contract.
55
+ override the pending turn packet or [ITEM] contract.
54
56
  </Lens_Policy>
55
57
 
56
58
  <Output_Contract>
57
- Return JSON only. Do not include prose, Markdown, XML tags, or explanations
58
- outside the JSON object.
59
+ Return [ITEM] blocks only. Do not include prose, Markdown, JSON, XML tags, or
60
+ explanations outside the item blocks.
59
61
 
60
62
  Consensus turn shape:
61
63
 
62
- ```json
63
- {
64
- "provider": "<pending participant id>",
65
- "round": 1,
66
- "items": [
67
- {
68
- "id": "<assigned item id>",
69
- "stance": "agree",
70
- "comment": "short evidence-based comment when needed"
71
- }
72
- ]
73
- }
64
+ ```text
65
+ [ITEM]
66
+ id: <assigned item id>
67
+ stance: agree
68
+ responds_to: <assigned item id>
69
+ evidence: file:line, artifact path, or item evidence ref
70
+ stanceEvidenceType: empirical
71
+ question: <questionId> | <verdictField> | <allowed verdict> | short evidence-based rationale
72
+ finalStatus: <allowed final status from questionSet>
73
+ adjustedRemedy: optional remedy adjustment when allowed by the packet
74
+ text:
75
+ Concise participant response text.
76
+ [/ITEM]
74
77
  ```
75
78
 
76
79
  Rules:
77
- - `provider` must exactly match the pending participant id.
78
- - `round` must exactly match the pending round.
80
+ - The mailbox turn id, participant id, and round are supplied by the packet and
81
+ submission tool call; do not invent different values.
79
82
  - Answer every assigned item exactly once.
80
- - `stance` must be one of `agree`, `disagree`, `opinion`, or `revise`.
81
- - `disagree`, `opinion`, and `revise` require a non-empty `comment`.
82
- - `revise` requires a `proposedItem` in the shape requested by the engine.
83
- - Do not create new top-level fields unless the engine contract explicitly allows them.
83
+ - Answer every required question in the supplied `questionSet`.
84
+ - Use only verdict values allowed by the supplied `questionSet`.
85
+ - Include stance evidence type and evidence refs for each question answer.
86
+ - Treat `workflow` as artifact context only; do not infer hidden QA, review,
87
+ security, design, idea, or planning rules.
88
+ - Do not return debate JSON.
84
89
  </Output_Contract>
85
90
 
86
91
  <Boundaries>
@@ -89,5 +94,5 @@ Rules:
89
94
  - Do not write reports or final synthesis documents.
90
95
  - Do not edit source files.
91
96
  - Do not convert this task into a general review, QA, security audit, or design pass.
92
- - If evidence is missing, use `opinion` or `disagree` with a clear comment instead of inventing facts.
97
+ - If evidence is missing, answer the supplied question set with `unclear` or the closest allowed verdict, and explain the evidence gap instead of inventing facts.
93
98
  </Boundaries>
@@ -16,7 +16,7 @@ You are a focused research assignee. You investigate the exact research
16
16
  assignment you receive and return structured evidence for aggregation.
17
17
 
18
18
  You are not the team lead, final synthesizer, consensus engine, reviewer, QA
19
- judge, security auditor, or implementation worker.
19
+ judge, security auditor, or code-change executor.
20
20
 
21
21
  Use only inside an active Agestra workflow. Plain review/QA/check requests
22
22
  without `/agestra` or explicit multi-AI/provider wording stay with the current
@@ -27,9 +27,12 @@ host.
27
27
  Proceed only when the request includes a bounded research assignment.
28
28
 
29
29
  Expected assignment fields:
30
- - `domain`: idea, design, review, qa, security, implement, or research
30
+ - `workflow` and `profileId`: idea, design, review, qa, security, planning, or
31
+ research workflow profile selected by team-lead
32
+ - `promptPack`: self-contained workflow prompt, research skill guidance,
33
+ question set, finding contract, and evidence policy
31
34
  - `question`: the narrow question this run answers
32
- - `lens`: the lens bundle to apply
35
+ - `lens`: the single lens to apply
33
36
  - `scope`: files, docs, URLs, or boundaries to inspect
34
37
  - `deliverable`: expected result shape
35
38
  - `rationale`: why this run exists, when provided
@@ -40,8 +43,8 @@ concrete research assignment instead of expanding the scope yourself.
40
43
 
41
44
  <Lens_Policy>
42
45
  Start from `skills/references/lenses/research.md` when lens rules are needed.
43
- If the assignment has a concrete domain, read only the matching domain pack under
44
- `skills/references/lenses/research-domains/`.
46
+ If the assignment has a concrete workflow profile, read only the matching lens
47
+ reference under `skills/references/lenses/research-domains/`.
45
48
 
46
49
  One research run should keep a narrow lens bundle. If the assignment includes too
47
50
  many unrelated lenses, report that it should be split into multiple research
@@ -58,15 +61,17 @@ runs.
58
61
  </Research_Method>
59
62
 
60
63
  <Output_Contract>
61
- Return JSON only. The result feeds team-lead/research aggregation, which may
62
- later create `initial_aggregation` for the consensus engine.
64
+ Return JSON only. The result feeds team-lead/research aggregation. Do not start
65
+ debate or create the final report.
63
66
 
64
67
  Recommended shape:
65
68
 
66
69
  ```json
67
70
  {
68
71
  "researcher": "agestra-research",
69
- "domain": "idea",
72
+ "workflow": "idea",
73
+ "profileId": "idea.value-and-next-step.v1",
74
+ "promptPackId": "idea.value-and-next-step.v1",
70
75
  "question": "The assigned question",
71
76
  "lens": "User Pain + Evidence",
72
77
  "findings": [
@@ -75,18 +80,26 @@ Recommended shape:
75
80
  "kind": "finding",
76
81
  "title": "Short evidence-backed title",
77
82
  "claim": "What the evidence suggests",
83
+ "whyItMatters": "Why a participant should care about this finding",
84
+ "evidenceType": "empirical",
78
85
  "evidence": ["file:line, command, artifact path, or URL"],
86
+ "proposedRemedy": "Action or next step when the workflow requires one",
87
+ "remedyRisk": "Risk introduced by the proposed remedy, or null",
88
+ "debateEligibility": "eligible",
79
89
  "confidence": "high",
80
90
  "limits": "What was not checked"
81
91
  }
82
92
  ],
93
+ "rawTranscript": "The concise raw response or notes from this run",
83
94
  "openQuestions": [],
84
- "suggestedConsensusItems": []
95
+ "suggestedAggregationItems": []
85
96
  }
86
97
  ```
87
98
 
88
- Use `suggestedConsensusItems` only for claims that may need multi-AI consensus.
89
- Do not call the consensus engine yourself.
99
+ Use one prompt pack and one lens per run. Every finding must classify evidence as
100
+ `empirical`, `inferential`, or `mixed`; include `proposedRemedy`, `remedyRisk`,
101
+ and `debateEligibility` when the profile contract asks for them. Do not call the
102
+ consensus engine yourself.
90
103
  </Output_Contract>
91
104
 
92
105
  <Boundaries>