agestra 4.14.5 → 4.15.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (48)
  1. package/.claude-plugin/marketplace.json +1 -1
  2. package/.claude-plugin/plugin.json +1 -1
  3. package/.gemini/commands/agestra/design.toml +2 -2
  4. package/.gemini/commands/agestra/idea.toml +2 -2
  5. package/.gemini/commands/agestra/qa.toml +2 -2
  6. package/.gemini/commands/agestra/research.toml +2 -2
  7. package/.gemini/commands/agestra/review.toml +2 -2
  8. package/.gemini/commands/agestra/security.toml +2 -2
  9. package/AGENTS.md +6 -7
  10. package/GEMINI.md +13 -9
  11. package/README.ja.md +5 -6
  12. package/README.ko.md +5 -6
  13. package/README.md +5 -6
  14. package/README.zh.md +5 -6
  15. package/agents/agestra-debate.md +23 -11
  16. package/agents/agestra-research.md +24 -11
  17. package/agents/agestra-team-lead.md +163 -100
  18. package/commands/design.md +16 -11
  19. package/commands/idea.md +20 -15
  20. package/commands/qa.md +79 -60
  21. package/commands/research.md +185 -34
  22. package/commands/review.md +13 -9
  23. package/commands/security.md +10 -7
  24. package/dist/bundle.js +348 -524
  25. package/hooks/user-prompt-submit.js +9 -20
  26. package/package.json +5 -2
  27. package/scripts/host-assets/categories.mjs +2 -16
  28. package/skills/cancel.md +7 -18
  29. package/skills/design.md +16 -13
  30. package/skills/idea.md +19 -16
  31. package/skills/leader.md +74 -65
  32. package/skills/plan.md +119 -0
  33. package/skills/provider-guide.md +54 -74
  34. package/skills/qa.md +85 -48
  35. package/skills/references/lenses/README.md +3 -3
  36. package/skills/references/lenses/e2e.md +16 -15
  37. package/skills/references/lenses/research-domains/planning.md +31 -0
  38. package/skills/references/lenses/research.md +2 -2
  39. package/skills/research.md +188 -42
  40. package/skills/review.md +12 -9
  41. package/skills/security.md +13 -9
  42. package/skills/setup.md +8 -5
  43. package/.gemini/commands/agestra/implement.toml +0 -16
  44. package/agents/agestra-implementer.md +0 -126
  45. package/commands/implement.md +0 -151
  46. package/skills/e2e.md +0 -72
  47. package/skills/references/lenses/research-domains/implement.md +0 -33
  48. package/skills/worker-manage.md +0 -79
@@ -12,7 +12,7 @@
12
12
  "name": "agestra",
13
13
  "source": "./",
14
14
  "description": "Multi-host MCP orchestration across Claude, Ollama, Gemini, and Codex for review, QA, and cross-validation",
15
- "version": "4.14.5",
15
+ "version": "4.15.0",
16
16
  "author": {
17
17
  "name": "mua-vtuber"
18
18
  },
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "agestra",
3
- "version": "4.14.5",
3
+ "version": "4.15.0",
4
4
  "description": "Claude Code plugin — multi-host MCP orchestration across Claude, Ollama, Gemini, and Codex for review, QA, and cross-validation",
5
5
  "mcpServers": {
6
6
  "agestra": {
@@ -4,8 +4,8 @@ prompt = """
4
4
  You are executing the `/agestra design` Gemini command.
5
5
 
6
6
  - Start with `setup_status`, then `environment_check` and `provider_list`.
7
- - For investigation-including workflows, route through `agent_research_consensus_start`.
8
- - Host research consensus contract:
7
+ - For investigation-including workflows, route through `agent_research_start`, then start debate separately with `agent_consensus_start`.
8
+ - Host research/debate contract uses workflow profiles, `aggregation`, `questionSet`, and `evidencePolicy`:
9
9
  호스트가 조사한다.
10
10
  호스트가 정리한다.
11
11
  시스템이 토론한다.
@@ -4,8 +4,8 @@ prompt = """
4
4
  You are executing the `/agestra idea` Gemini command.
5
5
 
6
6
  - Start with `setup_status`, then `environment_check` and `provider_list`.
7
- - For investigation-including workflows, route through `agent_research_consensus_start`.
8
- - Host research consensus contract:
7
+ - For investigation-including workflows, route through `agent_research_start`, then start debate separately with `agent_consensus_start`.
8
+ - Host research/debate contract uses workflow profiles, `aggregation`, `questionSet`, and `evidencePolicy`:
9
9
  호스트가 조사한다.
10
10
  호스트가 정리한다.
11
11
  시스템이 토론한다.
@@ -4,8 +4,8 @@ prompt = """
4
4
  You are executing the `/agestra qa` Gemini command.
5
5
 
6
6
  - Start with `setup_status`, then `environment_check` and `provider_list`.
7
- - For investigation-including workflows, route through `agent_research_consensus_start`.
8
- - Host research consensus contract:
7
+ - For investigation-including workflows, route through `agent_research_start`, then start debate separately with `agent_consensus_start`.
8
+ - Host research/debate contract uses workflow profiles, `aggregation`, `questionSet`, and `evidencePolicy`:
9
9
  호스트가 조사한다.
10
10
  호스트가 정리한다.
11
11
  시스템이 토론한다.
@@ -4,8 +4,8 @@ prompt = """
4
4
  You are executing the `/agestra research` Gemini command.
5
5
 
6
6
  - Start with `setup_status`, then `environment_check` and `provider_list`.
7
- - For investigation-including workflows that continue into domain consensus, route through `agent_research_consensus_start`.
8
- - Host research consensus contract:
7
+ - For investigation-including workflows that continue into workflow consensus, route through `agent_research_start`, then start debate separately with `agent_consensus_start`.
8
+ - Host research/debate contract uses workflow profiles, `aggregation`, `questionSet`, and `evidencePolicy`:
9
9
  호스트가 조사한다.
10
10
  호스트가 정리한다.
11
11
  시스템이 토론한다.
@@ -4,8 +4,8 @@ prompt = """
4
4
  You are executing the `/agestra review` Gemini command.
5
5
 
6
6
  - Start with `setup_status`, then `environment_check` and `provider_list`.
7
- - For investigation-including workflows, route through `agent_research_consensus_start`.
8
- - Host research consensus contract:
7
+ - For investigation-including workflows, route through `agent_research_start`, then start debate separately with `agent_consensus_start`.
8
+ - Host research/debate contract uses workflow profiles, `aggregation`, `questionSet`, and `evidencePolicy`:
9
9
  호스트가 조사한다.
10
10
  호스트가 정리한다.
11
11
  시스템이 토론한다.
@@ -4,8 +4,8 @@ prompt = """
4
4
  You are executing the `/agestra security` Gemini command.
5
5
 
6
6
  - Start with `setup_status`, then `environment_check` and `provider_list`.
7
- - For investigation-including workflows, route through `agent_research_consensus_start`.
8
- - Host research consensus contract:
7
+ - For investigation-including workflows, route through `agent_research_start`, then start debate separately with `agent_consensus_start`.
8
+ - Host research/debate contract uses workflow profiles, `aggregation`, `questionSet`, and `evidencePolicy`:
9
9
  호스트가 조사한다.
10
10
  호스트가 정리한다.
11
11
  시스템이 토론한다.
package/AGENTS.md CHANGED
@@ -16,13 +16,14 @@ Use `host_assets_status` to inspect generated Codex host assets, and only call `
16
16
  ## How to Work Here
17
17
 
18
18
  - Default to direct Codex work using the workspace `AGENTS.md` contract, oh-my-codex workflows, and Superpowers-style skills when they apply.
19
- - Use Agestra primarily for explicit multi-AI or provider orchestration requests, such as when the user names Agestra, Codex/Gemini/Ollama providers, "multi-AI", "multiple AI", "provider", `agent_debate_*`, `cli_worker_*`, or asks to gather/compare several AI opinions.
19
+ - Use Agestra primarily for explicit multi-AI or provider-backed review, QA, security, design, idea, and evidence/consensus work, such as when the user names Agestra, Codex/Gemini/Ollama providers, "multi-AI", "multiple AI", "provider", or asks to gather/compare several AI opinions.
20
20
  - Plain review/QA/check requests without `/agestra` or explicit multi-AI/provider wording stay with the current host; they are not Agestra natural-language auto-triggers.
21
21
  - Agestra natural-language routing requires explicit multi-AI/provider wording such as "multiple AIs", "all AIs", "other AI", "multi-AI", "Codex and Gemini", "provider comparison", or "프로바이더 비교". Explicit `/agestra ...` commands remain supported.
22
22
  - Native helper agents are created by the active host layer. In Codex, use the generated custom agents installed from these assets; external MCP/CLI/chat providers participate through Agestra tools and never create or manage Codex native agents.
23
23
  - Keep Agestra setup/status/provider checks as installation and health checks, not as workflow-routing triggers.
24
24
  - Run `setup_status`, `environment_check`, and `provider_list` when the task concerns Agestra installation, MCP registration, host assets, provider availability, or before entering an Agestra workflow. If `setup_status` reports `Setup required: yes`, complete interactive setup first and then resume the original task.
25
25
  - Do not treat ordinary review, QA, security, design, idea, implementation, cleanup, build-fix, or planning requests as Agestra workflows just because setup/status/provider checks exist.
26
+ - Agestra does not implement product code or author persistent E2E test files. Code and test authoring should happen in the current host first, then Agestra can review, QA, security-check, design-check, or discuss the result.
26
27
  - When an Agestra workflow is active, treat `commands/*.md` as the source of truth for that workflow.
27
28
  - Prefer Agestra MCP tools over ad-hoc multi-provider prompting only when the task is actually in Agestra/multi-provider mode.
28
29
  - If any legacy workflow text mentions old single-host Agestra execution, treat it as obsolete. Direct current-host work should happen outside Agestra workflows.
@@ -33,21 +34,19 @@ Use `host_assets_status` to inspect generated Codex host assets, and only call `
33
34
  - When Agestra is active, QA / verification requests follow `commands/qa.md`
34
35
  - When Agestra is active, security audit requests follow `commands/security.md`
35
36
  - Review, QA, and security workflows write durable reports under `docs/reports/review/`, `docs/reports/qa/`, and `docs/reports/security/` unless the user asks for chat-only output.
36
- - Persistent E2E test creation/maintenance is internal: QA produces `E2E_TEST_WORK_REQUEST`, the leader asks the user, and approved work goes to `agestra-implementer` with `mode: e2e-test-authoring`.
37
37
  - When Agestra is active, design and architecture requests follow `commands/design.md`
38
38
  - When Agestra is active, idea discovery requests follow `commands/idea.md`
39
- - When Agestra is active, implementation requests follow `commands/implement.md`
40
39
 
41
40
  ## Core MCP Tools
42
41
 
43
42
  - `setup_status`, `environment_check`, and `provider_list`: inspect installation, host, and provider state for Agestra health checks and active Agestra workflows
44
- - `agent_consensus_start` (with `agent_debate_approve`/`_continue`/`_reject`) and `agent_debate_review`: run approval-gated consensus flows from prepared `initial_aggregation`
45
- - `cli_worker_spawn`, `agent_changes_review`, `agent_changes_accept`, `agent_changes_reject`: use for explicit autonomous Codex/Gemini worker tasks
43
+ - `agent_research_start`: research-only preprocessing with workflow profile, prompt pack, questionSet, evidencePolicy, research lenses, and investigator assignments; writes `research_submissions.json`, `research_transcript.json`, and `aggregation.json`; does not start debate
44
+ - `agent_consensus_start` (with `agent_debate_approve`/`_continue`/`_reject`) and `agent_debate_review`: debate-only approval-gated consensus flows from prepared `aggregation`, supplied `questionSet`, and `evidencePolicy`; `workflow` is a report/artifact label only, not a debate routing branch
46
45
  - `host_assets_status`, `host_assets_install`, `host_assets_uninstall`: inspect and explicitly manage generated Codex host-native assets such as custom agents and skills
47
- - `qa_run`: run workspace build/test verification before reporting implementation completion
46
+ - `qa_run`: run workspace build/test verification for QA evidence
48
47
 
49
48
  ## Project Assets
50
49
 
51
- - `agents/`: canonical role prompts (`agestra-team-lead`, `agestra-research`, `agestra-debate`, `agestra-implementer`)
50
+ - `agents/`: canonical role prompts (`agestra-team-lead`, `agestra-research`, `agestra-debate`)
52
51
  - `skills/`: reusable workflow references
53
52
  - `GEMINI.md` and `.gemini/commands/`: Gemini-specific host assets; keep behavior aligned with them when updating shared workflows
package/GEMINI.md CHANGED
@@ -20,9 +20,11 @@ After setup, Gemini project commands are available:
20
20
  - `/agestra:security`
21
21
  - `/agestra:design`
22
22
  - `/agestra:idea`
23
- - `/agestra:implement`
24
23
 
25
24
  Each command delegates to the shared workflow specs in `commands/*.md`.
25
+ Agestra does not implement product code or author persistent E2E test files. Use
26
+ Gemini CLI or the current host for code/test changes first, then run Agestra
27
+ QA/review/security on the result.
26
28
 
27
29
  ## Usage Rules
28
30
 
@@ -31,9 +33,10 @@ Each command delegates to the shared workflow specs in `commands/*.md`.
31
33
  - Start orchestration requests with `setup_status`, then `environment_check` and `provider_list`.
32
34
  - Prefer Agestra MCP tools instead of rebuilding workflows in free-form prompts.
33
35
  - Treat `commands/*.md` and `agents/*.md` as the canonical workflow and role assets.
34
- - Keep native agent creation host-owned. Providers reached through MCP, CLI workers, or chat are participants only.
35
- - For investigation-including workflows, route through `agent_research_consensus_start`.
36
- - Use this host research consensus contract verbatim:
36
+ - Keep native agent creation host-owned. Providers reached through MCP or chat are participants only.
37
+ - For investigation-including workflows, route through `agent_research_start`,
38
+ then start debate separately with `agent_consensus_start`.
39
+ - Use this host research/debate phase contract verbatim:
37
40
  호스트가 조사한다.
38
41
  호스트가 정리한다.
39
42
  시스템이 토론한다.
@@ -43,11 +46,12 @@ Each command delegates to the shared workflow specs in `commands/*.md`.
43
46
 
44
47
  ## Core MCP Tools
45
48
 
46
- - `agent_research_consensus_start`: host-led research, consolidation, system debate, engine aggregation docs, and host-authored final decision docs for investigation-including workflows
47
- - `agent_consensus_start`, `agent_debate_approve`/`_continue`/`_reject`, `agent_debate_review`: direct consensus sessions from prepared `initial_aggregation` and approval-gated debate artifacts
48
- - `cli_worker_spawn`, `agent_changes_review`, `agent_changes_accept`, `agent_changes_reject`: autonomous worker lifecycle
49
+ - `agent_research_start`: research-only host-led preprocessing with workflow
50
+ profile, prompt pack, `questionSet`, `evidencePolicy`, research lenses, and
51
+ investigator assignments; writes `research_submissions.json`,
52
+ `research_transcript.json`, and `aggregation.json`; does not start debate
53
+ - `agent_consensus_start`, `agent_debate_approve`/`_continue`/`_reject`, `agent_debate_review`: debate-only sessions from prepared `aggregation`, supplied `questionSet`, `evidencePolicy`, and approval-gated debate artifacts
49
54
  - `workspace_*`: document-backed review and aggregation flows
50
- - `qa_run`: workspace build/test verification before implementation completion
55
+ - `qa_run`: workspace build/test verification for QA evidence
51
56
 
52
57
  Review, QA, and security workflows write durable reports under `docs/reports/review/`, `docs/reports/qa/`, and `docs/reports/security/` unless the user asks for chat-only output.
53
- Persistent E2E test creation/maintenance is internal: QA produces `E2E_TEST_WORK_REQUEST`, the leader asks the user, and approved work goes to `agestra-implementer` with `mode: e2e-test-authoring`. There is no standalone Gemini `/agestra:e2e` command yet.
package/README.ja.md CHANGED
@@ -7,7 +7,7 @@ Claude Code、Codex CLI、Gemini CLI、ローカルモデルで使えるマル
7
7
 
8
8
  [English](README.md) | [한국어](README.ko.md) | [日本語](README.ja.md) | [中文](README.zh.md)
9
9
 
10
- Agestra は、1 つの作業に複数の AI を使って比較し、整理するためのツールです。コードレビュー、QA、セキュリティ確認、設計相談、アイデア探索、provider-backed 実装向けに作られています。
10
+ Agestra は、1 つの問題を複数の AI 視点で検討し、整理するためのツールです。コードレビュー、QA、セキュリティ確認、設計相談、アイデア探索、根拠にもとづく合意形成向けに作られています。
11
11
 
12
12
  ## クイックスタート
13
13
 
@@ -21,8 +21,8 @@ Agestra は、1 つの作業に複数の AI を使って比較し、整理する
21
21
 
22
22
  インストール後、プロジェクトを開いて Agestra ワークフローを呼び出します。
23
23
 
24
- - Claude Code: `/agestra review`, `/agestra qa`, `/agestra security`, `/agestra design`, `/agestra idea`, `/agestra implement`
25
- - Gemini CLI: `/agestra:review`, `/agestra:qa`, `/agestra:security`, `/agestra:design`, `/agestra:idea`, `/agestra:implement`
24
+ - Claude Code: `/agestra review`, `/agestra qa`, `/agestra security`, `/agestra design`, `/agestra idea`
25
+ - Gemini CLI: `/agestra:review`, `/agestra:qa`, `/agestra:security`, `/agestra:design`, `/agestra:idea`
26
26
  - Codex CLI: `Use Agestra with Gemini and Codex to review this branch.` のように、Agestra や複数 AI を明示して依頼
27
27
 
28
28
  初回は使う provider を聞かれることがあります。provider が 1 つだけでもセットアップやホスト所有の作業はできますが、複数 AI 比較は 2 つ以上あるとより有効です。
@@ -34,7 +34,6 @@ Agestra は、1 つの作業に複数の AI を使って比較し、整理する
34
34
  - `security`: セキュリティ観点に絞って確認する
35
35
  - `design`: 実装前に構造やトレードオフを整理する
36
36
  - `idea`: 改善案、代替案、類似ツールを探る
37
- - `implement`: 複数 provider で実装を進め、最後の検証までつなぐ
38
37
 
39
38
  ## 実行すると何が起こるか
40
39
 
@@ -44,9 +43,9 @@ Agestra は、1 つの作業に複数の AI を使って比較し、整理する
44
43
  4. 選ばれた provider は残っている論点だけをレビューまたは討論します。
45
44
  5. 結論、意見の違い、根拠を 1 つの結果として返します。
46
45
 
47
- 普通のレビューや QA の依頼が自動で Agestra になるわけではありません。`/agestra ...` を使うか、複数 AI や provider-backed 作業を明示したときに Agestra が動きます。
46
+ 普通のレビューや QA の依頼が自動で Agestra になるわけではありません。`/agestra ...` を使うか、複数 AI や provider-backed のレビュー、QA、セキュリティ、設計、アイデア作業を明示したときに Agestra が動きます。
48
47
 
49
- 実装と QA では、最後の確認は引き続きホストが担当します。ビルド、テスト、実行証拠、ブラウザフロー、最終的なファイル反映はホスト側で確認します。
48
+ コード変更は、まず現在のホストで直接行うのが基本です。Agestra はその後で結果をレビューし、計画との一致を確認し、複数 provider の意見と根拠を記録するところで最も力を発揮します。
50
49
 
51
50
  ## このリポジトリで使う
52
51
 
package/README.ko.md CHANGED
@@ -7,7 +7,7 @@ Claude Code, Codex CLI, Gemini CLI, 로컬 모델을 함께 쓰기 위한 멀티
7
7
 
8
8
  [English](README.md) | [한국어](README.ko.md) | [日本語](README.ja.md) | [中文](README.zh.md)
9
9
 
10
- Agestra는 하나의 작업에 여러 AI를 붙여서 비교하고 정리해 주는 도구입니다. 코드 리뷰, QA, 보안 점검, 설계 논의, 아이디어 탐색, provider-backed 구현에 맞춰 설계되어 있습니다.
10
+ Agestra는 하나의 문제를 여러 AI 시각으로 검토하고 정리해 주는 도구입니다. 코드 리뷰, QA, 보안 점검, 설계 논의, 아이디어 탐색, 근거 기반 합의에 맞춰 설계되어 있습니다.
11
11
 
12
12
  ## 빠른 시작
13
13
 
@@ -21,8 +21,8 @@ Agestra는 하나의 작업에 여러 AI를 붙여서 비교하고 정리해 주
21
21
 
22
22
  설치 후 프로젝트를 열고 Agestra 워크플로우를 요청하면 됩니다.
23
23
 
24
- - Claude Code: `/agestra review`, `/agestra qa`, `/agestra security`, `/agestra design`, `/agestra idea`, `/agestra implement`
25
- - Gemini CLI: `/agestra:review`, `/agestra:qa`, `/agestra:security`, `/agestra:design`, `/agestra:idea`, `/agestra:implement`
24
+ - Claude Code: `/agestra review`, `/agestra qa`, `/agestra security`, `/agestra design`, `/agestra idea`
25
+ - Gemini CLI: `/agestra:review`, `/agestra:qa`, `/agestra:security`, `/agestra:design`, `/agestra:idea`
26
26
  - Codex CLI: `Agestra로 Gemini와 Codex를 같이 써서 이 브랜치 리뷰해줘`처럼 Agestra나 여러 AI를 명시해서 요청
27
27
 
28
28
  첫 실행에서는 사용할 provider를 물어볼 수 있습니다. provider가 하나만 있어도 설정과 호스트 소유 작업은 가능하지만, 멀티 AI 비교는 둘 이상일 때 가장 잘 살아납니다.
@@ -34,7 +34,6 @@ Agestra는 하나의 작업에 여러 AI를 붙여서 비교하고 정리해 주
34
34
  - `security`: 보안 관점만 따로 집중해서 검토
35
35
  - `design`: 구현 전에 구조와 트레이드오프 논의
36
36
  - `idea`: 개선 아이디어, 대안, 유사 도구 탐색
37
- - `implement`: 여러 provider를 써서 구현을 진행하고 마지막 검증까지 이어감
38
37
 
39
38
  ## 실행하면 어떻게 되나
40
39
 
@@ -44,9 +43,9 @@ Agestra는 하나의 작업에 여러 AI를 붙여서 비교하고 정리해 주
44
43
  4. 선택된 provider들이 남은 쟁점만 검토하거나 토론합니다.
45
44
  5. 결론, 이견, 근거를 하나의 결과로 돌려줍니다.
46
45
 
47
- 평범한 리뷰나 QA 요청이 자동으로 Agestra가 되는 것은 아닙니다. `/agestra ...`를 쓰거나, 여러 AI나 provider-backed 작업을 명시했을 때 Agestra 워크플로우가 시작됩니다.
46
+ 평범한 리뷰나 QA 요청이 자동으로 Agestra가 되는 것은 아닙니다. `/agestra ...`를 쓰거나, 여러 AI나 provider-backed 리뷰/QA/보안/설계/아이디어 작업을 명시했을 때 Agestra 워크플로우가 시작됩니다.
48
47
 
49
- 구현과 QA에서는 마지막 확인을 계속 호스트가 맡습니다. 빌드, 테스트, 실행 근거, 브라우저 흐름, 최종 파일 반영은 호스트가 확인합니다.
48
+ 코드 변경은 먼저 현재 호스트에서 직접 진행하는 편이 좋습니다. Agestra는 그다음에 결과를 리뷰하고, 계획과 맞는지 검증하고, 여러 provider 의견과 근거를 기록할 때 가장 강합니다.
50
49
 
51
50
  ## 이 저장소에서 쓰기
52
51
 
package/README.md CHANGED
@@ -7,7 +7,7 @@ Multi-host MCP orchestration for Claude Code, Codex CLI, Gemini CLI, and local m
7
7
 
8
8
  [English](README.md) | [한국어](README.ko.md) | [日本語](README.ja.md) | [中文](README.zh.md)
9
9
 
10
- Agestra helps you use more than one AI for the same task. It is built for review, QA, design discussion, idea exploration, and provider-backed implementation.
10
+ Agestra helps you use more than one AI to examine the same problem. It is built for review, QA, security checks, design discussion, idea exploration, and evidence-backed consensus.
11
11
 
12
12
  ## Quick Start
13
13
 
@@ -21,8 +21,8 @@ Install Agestra in the host you already use.
21
21
 
22
22
  Then open your project and ask for an Agestra workflow.
23
23
 
24
- - Claude Code: `/agestra review`, `/agestra qa`, `/agestra security`, `/agestra design`, `/agestra idea`, `/agestra implement`
25
- - Gemini CLI: `/agestra:review`, `/agestra:qa`, `/agestra:security`, `/agestra:design`, `/agestra:idea`, `/agestra:implement`
24
+ - Claude Code: `/agestra review`, `/agestra qa`, `/agestra security`, `/agestra design`, `/agestra idea`
25
+ - Gemini CLI: `/agestra:review`, `/agestra:qa`, `/agestra:security`, `/agestra:design`, `/agestra:idea`
26
26
  - Codex CLI: ask explicitly for Agestra or multiple providers, for example `Use Agestra with Gemini and Codex to review this branch.`
27
27
 
28
28
  The first workflow may ask which providers you want to use. Agestra works best with two or more providers, but setup and host-owned flows still work with one.
@@ -34,7 +34,6 @@ The first workflow may ask which providers you want to use. Agestra works best w
34
34
  - `security`: run a dedicated security-focused review
35
35
  - `design`: discuss architecture and tradeoffs before coding
36
36
  - `idea`: explore improvements, alternatives, and similar tools
37
- - `implement`: coordinate provider-backed implementation, then verify the result
38
37
 
39
38
  ## How It Runs
40
39
 
@@ -44,9 +43,9 @@ The first workflow may ask which providers you want to use. Agestra works best w
44
43
  4. Selected providers review or debate only the unresolved points.
45
44
  5. Agestra returns one result with conclusions, disagreements, and evidence.
46
45
 
47
- Plain review or QA requests do not automatically become Agestra workflows. Agestra starts when you use `/agestra ...` or explicitly ask for multi-AI or provider-backed help.
46
+ Plain review or QA requests do not automatically become Agestra workflows. Agestra starts when you use `/agestra ...` or explicitly ask for multi-AI or provider-backed review, QA, security, design, or idea work.
48
47
 
49
- For implementation and QA, the host still owns the final checks such as build, test, runtime evidence, browser flows, and accepted file changes.
48
+ For code changes, use your current host directly first. Agestra is strongest after that: reviewing the result, checking it against a plan, comparing provider opinions, and recording the evidence.
50
49
 
51
50
  ## Using This Repository
52
51
 
package/README.zh.md CHANGED
@@ -7,7 +7,7 @@
7
7
 
8
8
  [English](README.md) | [한국어](README.ko.md) | [日本語](README.ja.md) | [中文](README.zh.md)
9
9
 
10
- Agestra 用来把多个 AI 放到同一个任务里比较和整理。它适合代码审查、QA、安全检查、设计讨论、想法探索,以及 provider-backed 实现。
10
+ Agestra 用来让多个 AI 从不同角度审视同一个问题,并把结果整理成证据清晰的结论。它适合代码审查、QA、安全检查、设计讨论、想法探索和基于证据的共识。
11
11
 
12
12
  ## 快速开始
13
13
 
@@ -21,8 +21,8 @@ Agestra 用来把多个 AI 放到同一个任务里比较和整理。它适合
21
21
 
22
22
  安装后,打开项目并发起 Agestra 工作流。
23
23
 
24
- - Claude Code: `/agestra review`, `/agestra qa`, `/agestra security`, `/agestra design`, `/agestra idea`, `/agestra implement`
25
- - Gemini CLI: `/agestra:review`, `/agestra:qa`, `/agestra:security`, `/agestra:design`, `/agestra:idea`, `/agestra:implement`
24
+ - Claude Code: `/agestra review`, `/agestra qa`, `/agestra security`, `/agestra design`, `/agestra idea`
25
+ - Gemini CLI: `/agestra:review`, `/agestra:qa`, `/agestra:security`, `/agestra:design`, `/agestra:idea`
26
26
  - Codex CLI: 像 `Use Agestra with Gemini and Codex to review this branch.` 这样明确提到 Agestra 或多个 AI
27
27
 
28
28
  第一次运行时,它可能会询问你要启用哪些 provider。只有一个 provider 也能完成设置和宿主自有流程,但 Multi-AI 比较在两个以上 provider 时效果最好。
@@ -34,7 +34,6 @@ Agestra 用来把多个 AI 放到同一个任务里比较和整理。它适合
34
34
  - `security`: 专门做安全视角的检查
35
35
  - `design`: 在写代码前讨论结构和取舍
36
36
  - `idea`: 探索改进方向、备选方案和相似工具
37
- - `implement`: 用多个 provider 推进实现,并把最后验证也串起来
38
37
 
39
38
  ## 运行时会发生什么
40
39
 
@@ -44,9 +43,9 @@ Agestra 用来把多个 AI 放到同一个任务里比较和整理。它适合
44
43
  4. 被选中的 provider 只讨论或审查剩下的未解决问题。
45
44
  5. Agestra 返回一份包含结论、分歧和证据的结果。
46
45
 
47
- 普通的 review 或 QA 请求不会自动变成 Agestra 工作流。只有当你使用 `/agestra ...`,或者明确要求多 AI / provider-backed 帮助时,Agestra 才会启动。
46
+ 普通的 review 或 QA 请求不会自动变成 Agestra 工作流。只有当你使用 `/agestra ...`,或者明确要求多 AI / provider-backed 的 review、QA、安全、设计或 idea 工作时,Agestra 才会启动。
48
47
 
49
- 在实现和 QA 里,最后的确认仍然由宿主负责。构建、测试、运行证据、浏览器流程,以及最终落盘的改动都由宿主确认。
48
+ 代码修改应优先由当前宿主直接完成。Agestra 最适合在修改之后审查结果、按计划验证、比较多个 provider 的意见,并记录证据。
50
49
 
51
50
  ## 在这个仓库里使用
52
51
 
@@ -2,9 +2,10 @@
2
2
  name: agestra-debate
3
3
  description: |
4
4
  Host-native debate participant for Agestra consensus rounds. Reads the assigned
5
- domain/lens context, answers a pending host turn, and returns the required
6
- consensus JSON. It is not the moderator, not the team lead, not a reviewer/QA/
7
- security specialist identity, and does not choose participants or run rounds.
5
+ workflow profile/lens context, answers a pending host turn using the supplied
6
+ question set, and returns the required consensus JSON. It is not the
7
+ moderator, not the team lead, not a reviewer/QA/security specialist identity,
8
+ and does not choose participants or run rounds.
8
9
 
9
10
  Use this agent only when the team lead or consensus engine has an explicit
10
11
  host-native participant turn for `agestra-debate`.
@@ -20,7 +21,7 @@ consensus turn, inspect only the supplied packet/files/lens references, and
20
21
  return the required JSON answer for that turn.
21
22
 
22
23
  You are not the consensus engine, moderator, team lead, reviewer, QA judge,
23
- security auditor, or implementation worker.
24
+ security auditor, or code-change executor.
24
25
 
25
26
  Use only inside an active Agestra workflow. Plain review/QA/check requests
26
27
  without `/agestra` or explicit multi-AI/provider wording stay with the current
@@ -36,7 +37,8 @@ Required information:
36
37
  - round number to echo in `round`
37
38
  - assigned item ids
38
39
  - allowed files or evidence references
39
- - assigned domain/lens context, if any
40
+ - assigned workflow profile and lens context, if any
41
+ - supplied `questionSet` with required question IDs, verdict fields, and allowed verdicts
40
42
  - output contract
41
43
 
42
44
  If the request is only a generic review, QA, or debate request and does not
@@ -66,8 +68,16 @@ Consensus turn shape:
66
68
  "items": [
67
69
  {
68
70
  "id": "<assigned item id>",
69
- "stance": "agree",
70
- "comment": "short evidence-based comment when needed"
71
+ "questionResults": {
72
+ "<verdictField from questionSet>": {
73
+ "verdict": "<allowed verdict from questionSet>",
74
+ "reason": "short evidence-based reason",
75
+ "stanceEvidenceType": "empirical",
76
+ "evidenceRefs": ["file:line, artifact path, or item evidence ref"]
77
+ }
78
+ },
79
+ "finalStatus": "<allowed final status from questionSet>",
80
+ "adjustedRemedy": "optional remedy adjustment when allowed by the packet"
71
81
  }
72
82
  ]
73
83
  }
@@ -77,9 +87,11 @@ Rules:
77
87
  - `provider` must exactly match the pending participant id.
78
88
  - `round` must exactly match the pending round.
79
89
  - Answer every assigned item exactly once.
80
- - `stance` must be one of `agree`, `disagree`, `opinion`, or `revise`.
81
- - `disagree`, `opinion`, and `revise` require a non-empty `comment`.
82
- - `revise` requires a `proposedItem` in the shape requested by the engine.
90
+ - Answer every required question in the supplied `questionSet`.
91
+ - Use only verdict values allowed by the supplied `questionSet`.
92
+ - Include stance evidence type and evidence refs for each question answer.
93
+ - Treat `workflow` as artifact context only; do not infer hidden QA, review,
94
+ security, design, idea, or planning rules.
83
95
  - Do not create new top-level fields unless the engine contract explicitly allows them.
84
96
  </Output_Contract>
85
97
 
@@ -89,5 +101,5 @@ Rules:
89
101
  - Do not write reports or final synthesis documents.
90
102
  - Do not edit source files.
91
103
  - Do not convert this task into a general review, QA, security audit, or design pass.
92
- - If evidence is missing, use `opinion` or `disagree` with a clear comment instead of inventing facts.
104
+ - If evidence is missing, answer the supplied question set with `unclear` or the closest allowed verdict and explain the evidence gap instead of inventing facts.
93
105
  </Boundaries>
@@ -16,7 +16,7 @@ You are a focused research assignee. You investigate the exact research
16
16
  assignment you receive and return structured evidence for aggregation.
17
17
 
18
18
  You are not the team lead, final synthesizer, consensus engine, reviewer, QA
19
- judge, security auditor, or implementation worker.
19
+ judge, security auditor, or code-change executor.
20
20
 
21
21
  Use only inside an active Agestra workflow. Plain review/QA/check requests
22
22
  without `/agestra` or explicit multi-AI/provider wording stay with the current
@@ -27,9 +27,12 @@ host.
27
27
  Proceed only when the request includes a bounded research assignment.
28
28
 
29
29
  Expected assignment fields:
30
- - `domain`: idea, design, review, qa, security, implement, or research
30
+ - `workflow` and `profileId`: idea, design, review, qa, security, planning, or
31
+ research workflow profile selected by team-lead
32
+ - `promptPack`: self-contained workflow prompt, research skill guidance,
33
+ question set, finding contract, and evidence policy
31
34
  - `question`: the narrow question this run answers
32
- - `lens`: the lens bundle to apply
35
+ - `lens`: the single lens to apply
33
36
  - `scope`: files, docs, URLs, or boundaries to inspect
34
37
  - `deliverable`: expected result shape
35
38
  - `rationale`: why this run exists, when provided
@@ -40,8 +43,8 @@ concrete research assignment instead of expanding the scope yourself.
40
43
 
41
44
  <Lens_Policy>
42
45
  Start from `skills/references/lenses/research.md` when lens rules are needed.
43
- If the assignment has a concrete domain, read only the matching domain pack under
44
- `skills/references/lenses/research-domains/`.
46
+ If the assignment has a concrete workflow profile, read only the matching lens
47
+ reference under `skills/references/lenses/research-domains/`.
45
48
 
46
49
  One research run should keep a narrow lens bundle. If the assignment includes too
47
50
  many unrelated lenses, report that it should be split into multiple research
@@ -58,15 +61,17 @@ runs.
58
61
  </Research_Method>
59
62
 
60
63
  <Output_Contract>
61
- Return JSON only. The result feeds team-lead/research aggregation, which may
62
- later create `initial_aggregation` for the consensus engine.
64
+ Return JSON only. The result feeds team-lead/research aggregation. Do not start
65
+ debate or create the final report.
63
66
 
64
67
  Recommended shape:
65
68
 
66
69
  ```json
67
70
  {
68
71
  "researcher": "agestra-research",
69
- "domain": "idea",
72
+ "workflow": "idea",
73
+ "profileId": "idea.value-and-next-step.v1",
74
+ "promptPackId": "idea.value-and-next-step.v1",
70
75
  "question": "The assigned question",
71
76
  "lens": "User Pain + Evidence",
72
77
  "findings": [
@@ -75,18 +80,26 @@ Recommended shape:
75
80
  "kind": "finding",
76
81
  "title": "Short evidence-backed title",
77
82
  "claim": "What the evidence suggests",
83
+ "whyItMatters": "Why a participant should care about this finding",
84
+ "evidenceType": "empirical",
78
85
  "evidence": ["file:line, command, artifact path, or URL"],
86
+ "proposedRemedy": "Action or next step when the workflow requires one",
87
+ "remedyRisk": "Risk introduced by the proposed remedy, or null",
88
+ "debateEligibility": "eligible",
79
89
  "confidence": "high",
80
90
  "limits": "What was not checked"
81
91
  }
82
92
  ],
93
+ "rawTranscript": "The concise raw response or notes from this run",
83
94
  "openQuestions": [],
84
- "suggestedConsensusItems": []
95
+ "suggestedAggregationItems": []
85
96
  }
86
97
  ```
87
98
 
88
- Use `suggestedConsensusItems` only for claims that may need multi-AI consensus.
89
- Do not call the consensus engine yourself.
99
+ Use one prompt pack and one lens per run. Every finding must classify evidence as
100
+ `empirical`, `inferential`, or `mixed`; include `proposedRemedy`, `remedyRisk`,
101
+ and `debateEligibility` when the profile contract asks for them. Do not call the
102
+ consensus engine yourself.
90
103
  </Output_Contract>
91
104
 
92
105
  <Boundaries>