@ngxtm/devkit 3.19.0 → 3.20.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/merged-commands/application-performance-performance-optimization.md +13 -13
- package/merged-commands/ask/fast.md +14 -57
- package/merged-commands/ask/hard.md +22 -79
- package/merged-commands/auto.md +6 -33
- package/merged-commands/backend-development-feature-development.md +12 -12
- package/merged-commands/bootstrap/auto/fast.md +15 -15
- package/merged-commands/bootstrap/auto/parallel.md +12 -12
- package/merged-commands/bootstrap/auto.md +14 -14
- package/merged-commands/bootstrap.md +15 -15
- package/merged-commands/brainstorm/fast.md +19 -72
- package/merged-commands/brainstorm/hard.md +23 -84
- package/merged-commands/c4-architecture-c4-architecture.md +5 -5
- package/merged-commands/code/auto.md +16 -16
- package/merged-commands/code/fast.md +19 -72
- package/merged-commands/code/hard.md +38 -122
- package/merged-commands/code/no-test.md +12 -12
- package/merged-commands/code/parallel.md +9 -9
- package/merged-commands/code.md +14 -14
- package/merged-commands/comprehensive-review-full-review.md +8 -8
- package/merged-commands/context-degradation.md +2 -2
- package/merged-commands/context-engineering.md +4 -4
- package/merged-commands/context-optimization.md +3 -3
- package/merged-commands/cook/auto/fast.md +3 -3
- package/merged-commands/cook/auto/parallel.md +9 -9
- package/merged-commands/cook/auto.md +1 -1
- package/merged-commands/cook/fast.md +38 -47
- package/merged-commands/cook/hard.md +46 -41
- package/merged-commands/cook.md +13 -13
- package/merged-commands/daily-news-report.md +15 -15
- package/merged-commands/data-engineering-data-driven-feature.md +16 -16
- package/merged-commands/debug/fast.md +13 -29
- package/merged-commands/debug/hard.md +47 -49
- package/merged-commands/debug.md +1 -1
- package/merged-commands/debugging-toolkit-smart-debug.md +1 -1
- package/merged-commands/deploy/check.md +22 -71
- package/merged-commands/deploy/preview.md +18 -62
- package/merged-commands/deploy/production.md +22 -71
- package/merged-commands/deploy/rollback.md +22 -71
- package/merged-commands/deploy.md +0 -11
- package/merged-commands/design/3d.md +3 -3
- package/merged-commands/design/describe.md +1 -1
- package/merged-commands/design/fast.md +2 -2
- package/merged-commands/design/good.md +3 -3
- package/merged-commands/design/hard.md +15 -85
- package/merged-commands/design/screenshot.md +1 -1
- package/merged-commands/design/video.md +1 -1
- package/merged-commands/design.md +0 -11
- package/merged-commands/doc-coauthoring.md +5 -5
- package/merged-commands/docker-expert.md +1 -1
- package/merged-commands/docs/audit.md +26 -77
- package/merged-commands/docs/business.md +26 -77
- package/merged-commands/docs/core.md +24 -68
- package/merged-commands/docs/init.md +8 -8
- package/merged-commands/docs/update.md +13 -13
- package/merged-commands/docs.md +0 -12
- package/merged-commands/error-debugging-multi-agent-review.md +1 -1
- package/merged-commands/error-diagnostics-smart-debug.md +1 -1
- package/merged-commands/finishing-a-development-branch.md +1 -1
- package/merged-commands/fix/ci.md +2 -2
- package/merged-commands/fix/fast.md +2 -2
- package/merged-commands/fix/hard.md +6 -6
- package/merged-commands/fix/logs.md +5 -5
- package/merged-commands/fix/parallel.md +9 -9
- package/merged-commands/fix/test.md +6 -6
- package/merged-commands/fix/ui.md +8 -8
- package/merged-commands/fixing.md +3 -3
- package/merged-commands/framework-migration-legacy-modernize.md +13 -13
- package/merged-commands/full-stack-orchestration-full-stack-feature.md +12 -12
- package/merged-commands/git/cm.md +1 -1
- package/merged-commands/git/cp.md +1 -1
- package/merged-commands/git/merge.md +1 -1
- package/merged-commands/git/pr.md +1 -1
- package/merged-commands/git-pr-workflows-git-workflow.md +10 -10
- package/merged-commands/google-adk-python.md +1 -1
- package/merged-commands/hr-pro.md +1 -1
- package/merged-commands/incident-response-incident-response.md +13 -13
- package/merged-commands/integrate/polar.md +3 -3
- package/merged-commands/integrate/sepay.md +3 -3
- package/merged-commands/journal.md +1 -1
- package/merged-commands/linear-claude-skill.md +2 -2
- package/merged-commands/loki-mode.md +14 -14
- package/merged-commands/machine-learning-ops-ml-pipeline.md +7 -7
- package/merged-commands/mcp-management.md +8 -8
- package/merged-commands/multi-agent-patterns.md +14 -14
- package/merged-commands/multi-platform-apps-multi-platform.md +10 -10
- package/merged-commands/nestjs-expert.md +1 -1
- package/merged-commands/performance-testing-review-multi-agent-review.md +1 -1
- package/merged-commands/plan/archive.md +1 -1
- package/merged-commands/plan/ci.md +1 -1
- package/merged-commands/plan/fast.md +2 -2
- package/merged-commands/plan/hard.md +4 -4
- package/merged-commands/plan/parallel.md +5 -5
- package/merged-commands/plan/two.md +6 -6
- package/merged-commands/requesting-code-review.md +6 -6
- package/merged-commands/review/codebase/parallel.md +5 -5
- package/merged-commands/review/codebase.md +5 -5
- package/merged-commands/review/fast.md +13 -29
- package/merged-commands/review/hard.md +48 -49
- package/merged-commands/review.md +0 -11
- package/merged-commands/security-scanning-security-hardening.md +13 -13
- package/merged-commands/skill/add.md +6 -6
- package/merged-commands/skill/create.md +6 -6
- package/merged-commands/skill/fix-logs.md +6 -6
- package/merged-commands/skill/optimize/auto.md +1 -1
- package/merged-commands/skill/optimize.md +1 -1
- package/merged-commands/skill/plan.md +1 -1
- package/merged-commands/skill/update.md +6 -6
- package/merged-commands/subagent-driven-development.md +53 -53
- package/merged-commands/tdd-workflows-tdd-cycle.md +12 -12
- package/merged-commands/tdd-workflows-tdd-red.md +1 -1
- package/merged-commands/tdd-workflows-tdd-refactor.md +1 -1
- package/merged-commands/test/fast.md +22 -33
- package/merged-commands/test/hard.md +59 -56
- package/merged-commands/test/ui.md +1 -1
- package/merged-commands/test.md +1 -1
- package/merged-commands/typescript-expert.md +1 -1
- package/merged-commands/use-mcp.md +5 -5
- package/merged-commands/writing-plans.md +3 -3
- package/merged-commands/writing-skills.md +8 -8
- package/package.json +1 -1
- package/rules-index.json +1 -1
- package/skills/application-performance-performance-optimization/SKILL.md +13 -13
- package/skills/azure-ai-agents-python/references/tools.md +1 -1
- package/skills/backend-development-feature-development/SKILL.md +12 -12
- package/skills/best-practices/references/anti-patterns.md +2 -2
- package/skills/best-practices/references/best-practices-guide.md +14 -14
- package/skills/c4-architecture-c4-architecture/SKILL.md +5 -5
- package/skills/comprehensive-review-full-review/SKILL.md +8 -8
- package/skills/context-degradation/SKILL.md +2 -2
- package/skills/context-engineering/SKILL.md +4 -4
- package/skills/context-engineering/references/context-degradation.md +1 -1
- package/skills/context-engineering/references/context-optimization.md +1 -1
- package/skills/context-engineering/references/multi-agent-patterns.md +1 -1
- package/skills/context-engineering/references/runtime-awareness.md +1 -1
- package/skills/context-optimization/SKILL.md +3 -3
- package/skills/daily-news-report/SKILL.md +15 -15
- package/skills/data-engineering-data-driven-feature/SKILL.md +16 -16
- package/skills/debugging-toolkit-smart-debug/SKILL.md +1 -1
- package/skills/doc-coauthoring/SKILL.md +5 -5
- package/skills/docker-expert/SKILL.md +1 -1
- package/skills/error-debugging-multi-agent-review/SKILL.md +1 -1
- package/skills/error-diagnostics-smart-debug/SKILL.md +1 -1
- package/skills/finishing-a-development-branch/SKILL.md +1 -1
- package/skills/fixing/SKILL.md +3 -3
- package/skills/fixing/references/parallel-exploration.md +4 -4
- package/skills/fixing/references/skill-activation-matrix.md +3 -3
- package/skills/fixing/references/workflow-deep.md +11 -11
- package/skills/fixing/references/workflow-quick.md +4 -4
- package/skills/fixing/references/workflow-standard.md +12 -12
- package/skills/framework-migration-legacy-modernize/SKILL.md +13 -13
- package/skills/full-stack-orchestration-full-stack-feature/SKILL.md +12 -12
- package/skills/git-pr-workflows-git-workflow/SKILL.md +10 -10
- package/skills/google-adk-python/SKILL.md +1 -1
- package/skills/hr-pro/SKILL.md +1 -1
- package/skills/incident-response-incident-response/SKILL.md +13 -13
- package/skills/incident-response-smart-fix/resources/implementation-playbook.md +17 -17
- package/skills/linear-claude-skill/SKILL.md +2 -2
- package/skills/loki-mode/ACKNOWLEDGEMENTS.md +4 -4
- package/skills/loki-mode/CHANGELOG.md +9 -9
- package/skills/loki-mode/CONTEXT-EXPORT.md +1 -1
- package/skills/loki-mode/README.md +2 -2
- package/skills/loki-mode/SKILL.md +14 -14
- package/skills/loki-mode/autonomy/run.sh +1 -1
- package/skills/loki-mode/integrations/vibe-kanban.md +1 -1
- package/skills/loki-mode/references/core-workflow.md +4 -4
- package/skills/loki-mode/references/production-patterns.md +6 -6
- package/skills/loki-mode/references/quality-control.md +2 -2
- package/skills/loki-mode/references/sdlc-phases.md +3 -3
- package/skills/machine-learning-ops-ml-pipeline/SKILL.md +7 -7
- package/skills/mcp-builder/reference/evaluation.md +3 -3
- package/skills/mcp-management/README.md +6 -6
- package/skills/mcp-management/SKILL.md +8 -8
- package/skills/mcp-management/references/gemini-cli-integration.md +1 -1
- package/skills/multi-agent-patterns/SKILL.md +14 -14
- package/skills/multi-platform-apps-multi-platform/SKILL.md +10 -10
- package/skills/nestjs-expert/SKILL.md +1 -1
- package/skills/performance-testing-review-multi-agent-review/SKILL.md +1 -1
- package/skills/planning-with-files/reference.md +2 -2
- package/skills/requesting-code-review/SKILL.md +6 -6
- package/skills/security-scanning-security-hardening/SKILL.md +13 -13
- package/skills/subagent-driven-development/SKILL.md +53 -53
- package/skills/subagent-driven-development/code-quality-reviewer-prompt.md +1 -1
- package/skills/subagent-driven-development/implementer-prompt.md +3 -3
- package/skills/subagent-driven-development/spec-reviewer-prompt.md +1 -1
- package/skills/tdd-workflows-tdd-cycle/SKILL.md +12 -12
- package/skills/tdd-workflows-tdd-green/resources/implementation-playbook.md +1 -1
- package/skills/tdd-workflows-tdd-red/SKILL.md +1 -1
- package/skills/tdd-workflows-tdd-refactor/SKILL.md +1 -1
- package/skills/typescript-expert/SKILL.md +1 -1
- package/skills/writing-plans/SKILL.md +3 -3
- package/skills/writing-skills/SKILL.md +8 -8
- package/skills/writing-skills/examples/CLAUDE_MD_TESTING.md +1 -1
- package/skills/writing-skills/references/cso/README.md +3 -3
- package/skills/writing-skills/testing-skills-with-subagents.md +1 -1
|
@@ -158,7 +158,7 @@ Battle-tested patterns from practitioners:
|
|
|
158
158
|
- **Confidence-Based Routing**: Auto-approve high confidence, escalate low
|
|
159
159
|
- **Deterministic Outer Loops**: Rule-based validation, not LLM-judged
|
|
160
160
|
- **Context Curation**: Manual selection beats automatic RAG
|
|
161
|
-
- **
|
|
161
|
+
- **Task Agents for Context Isolation**: Prevent token waste
|
|
162
162
|
- **Event-Driven Orchestration**: Async, decoupled coordination
|
|
163
163
|
- **Policy-First Enforcement**: Runtime governance
|
|
164
164
|
|
|
@@ -172,7 +172,7 @@ Battle-tested patterns from practitioners:
|
|
|
172
172
|
- Confidence-Based Routing thresholds
|
|
173
173
|
- Deterministic Outer Loops workflow
|
|
174
174
|
- Context Engineering principles
|
|
175
|
-
-
|
|
175
|
+
- Task Agents for Context Isolation
|
|
176
176
|
|
|
177
177
|
### Key Practitioner Insights
|
|
178
178
|
|
|
@@ -347,7 +347,7 @@ Comprehensive guide covering:
|
|
|
347
347
|
- **Haiku**: Unit tests, monitoring, and simple tasks
|
|
348
348
|
|
|
349
349
|
### Changed
|
|
350
|
-
- SKILL.md: Added Single-Responsibility Principle to
|
|
350
|
+
- SKILL.md: Added Single-Responsibility Principle to Task agent guidance
|
|
351
351
|
- SKILL.md: Clarified model selection (Opus=planning, Sonnet=dev, Haiku=tests)
|
|
352
352
|
- SKILL.md: Dynamic Agent Selection table now shows Planning/Development/Testing columns
|
|
353
353
|
- tool-orchestration.md: Added correlation_id, tool_reliability_rate to schema
|
|
@@ -939,7 +939,7 @@ The previous "37 agents" messaging was misleading because:
|
|
|
939
939
|
- **Sonnet 4.5** is now clearly marked as **DEFAULT** for all standard implementation work
|
|
940
940
|
- **Haiku 4.5** changed to **OPTIMIZATION ONLY** for simple/parallelizable tasks
|
|
941
941
|
- **Opus 4.5** changed to **COMPLEX ONLY** for architecture & security
|
|
942
|
-
- Previous documentation incorrectly suggested Haiku as default for most
|
|
942
|
+
- Previous documentation incorrectly suggested Haiku as default for most Task agents
|
|
943
943
|
- Aligns with best practices: Sonnet for quality, Haiku for speed optimization only
|
|
944
944
|
|
|
945
945
|
- **run.sh Implementation Gap** - RARV cycle now implemented in runner script (run.sh:870-871, 908-916):
|
|
@@ -1150,7 +1150,7 @@ For existing `.loki/` projects:
|
|
|
1150
1150
|
|
|
1151
1151
|
### Fixed
|
|
1152
1152
|
- Removed duplicate CONTINUITY.md template from bootstrap script (was lines 2436-2470)
|
|
1153
|
-
- Removed duplicate Task Completion Report from
|
|
1153
|
+
- Removed duplicate Task Completion Report from Task agent dispatch section (was lines 1731-1764)
|
|
1154
1154
|
- Consolidated severity matrices (removed duplicates, kept one authoritative version)
|
|
1155
1155
|
|
|
1156
1156
|
## [2.14.0] - 2026-01-02
|
|
@@ -1353,8 +1353,8 @@ Loki Mode now combines the best practices from GitHub's ecosystem:
|
|
|
1353
1353
|
- Secret scanning to prevent credential leaks
|
|
1354
1354
|
- 5 quality gate categories with blocking rules
|
|
1355
1355
|
|
|
1356
|
-
**Principle 2: Structured Prompting for
|
|
1357
|
-
- All
|
|
1356
|
+
**Principle 2: Structured Prompting for Task Agents**
|
|
1357
|
+
- All Task agent dispatches must include: GOAL, CONSTRAINTS, CONTEXT, OUTPUT FORMAT
|
|
1358
1358
|
- Goals explain "what success looks like" (not just actions)
|
|
1359
1359
|
- Constraints define boundaries (dependencies, compatibility, performance)
|
|
1360
1360
|
- Context includes CONTINUITY.md, ledgers, learnings, architecture decisions
|
|
@@ -1390,10 +1390,10 @@ Loki Mode now combines the best practices from GitHub's ecosystem:
|
|
|
1390
1390
|
|
|
1391
1391
|
### Changed
|
|
1392
1392
|
- CODE_REVIEW phase now requires static analysis before AI reviewers
|
|
1393
|
-
-
|
|
1393
|
+
- Task agent dispatch template updated with GOAL/CONSTRAINTS/CONTEXT/OUTPUT
|
|
1394
1394
|
- Task completion requires decision documentation (not just code output)
|
|
1395
1395
|
- Quality gates now include static analysis tools (CodeQL, linters, security scanners)
|
|
1396
|
-
- Context-Aware
|
|
1396
|
+
- Context-Aware Task Agent Dispatch section rewritten for structured prompting
|
|
1397
1397
|
|
|
1398
1398
|
### Philosophy
|
|
1399
1399
|
"Speed and control aren't trade-offs. They reinforce each other." - GitHub
|
|
@@ -13,7 +13,7 @@
|
|
|
13
13
|
### Key Features
|
|
14
14
|
- 37 specialized agent types across 6 swarms (Engineering, Operations, Business, Data, Product, Growth)
|
|
15
15
|
- Dynamic agent scaling based on project complexity
|
|
16
|
-
- Task tool for
|
|
16
|
+
- Task tool for Task agent dispatch with fresh context
|
|
17
17
|
- Distributed task queue (pending, in-progress, completed, failed, dead-letter)
|
|
18
18
|
- Circuit breakers for per-agent failure handling
|
|
19
19
|
- Timeout/stuck agent detection with heartbeat monitoring
|
|
@@ -522,12 +522,12 @@ Loki Mode incorporates research and patterns from leading AI labs and practition
|
|
|
522
522
|
### Practitioner Insights
|
|
523
523
|
|
|
524
524
|
- **Boris Cherny** (Claude Code creator) - Self-verification loop, extended thinking
|
|
525
|
-
- **Simon Willison** -
|
|
525
|
+
- **Simon Willison** - Task agents for context isolation, skills system
|
|
526
526
|
- **Hacker News Community** - [Production patterns](https://news.ycombinator.com/item?id=44623207) from real deployments
|
|
527
527
|
|
|
528
528
|
### Inspirations
|
|
529
529
|
|
|
530
|
-
- [LerianStudio/ring](https://github.com/LerianStudio/ring) -
|
|
530
|
+
- [LerianStudio/ring](https://github.com/LerianStudio/ring) - Task-agent-driven-development pattern
|
|
531
531
|
- [Awesome Agentic Patterns](https://github.com/nibzard/awesome-agentic-patterns) - 105+ production patterns
|
|
532
532
|
|
|
533
533
|
**[Full Acknowledgements](ACKNOWLEDGEMENTS.md)** - Complete list of 50+ research papers, articles, and resources
|
|
@@ -137,7 +137,7 @@ If bugs are found in these files, document them in `.loki/CONTINUITY.md` under "
|
|
|
137
137
|
| - Identify highest priority unblocked task |
|
|
138
138
|
+-------------------------------------------------------------------+
|
|
139
139
|
| ACT: Execute the task |
|
|
140
|
-
| - Dispatch
|
|
140
|
+
| - Dispatch Task agent via Task tool OR execute directly |
|
|
141
141
|
| - Write code, run tests, fix issues |
|
|
142
142
|
| - Commit changes atomically (git checkpoint) |
|
|
143
143
|
+-------------------------------------------------------------------+
|
|
@@ -175,7 +175,7 @@ If bugs are found in these files, document them in `.loki/CONTINUITY.md` under "
|
|
|
175
175
|
### Task Tool Model Parameter
|
|
176
176
|
```python
|
|
177
177
|
# Opus for planning/architecture ONLY
|
|
178
|
-
Task(subagent_type="
|
|
178
|
+
Task(subagent_type="general-purpose", model="opus", description="Design system architecture", prompt="...")
|
|
179
179
|
|
|
180
180
|
# Sonnet for development and functional testing
|
|
181
181
|
Task(subagent_type="general-purpose", description="Implement API endpoint", prompt="...")
|
|
@@ -286,7 +286,7 @@ Task(description="Refactor database layer for performance", prompt="...") #
|
|
|
286
286
|
- **Direct Routing:** Minimal context - just the task and relevant file(s)
|
|
287
287
|
- **Supervisor Mode:** Full context - CONTINUITY.md, architectural decisions, dependencies
|
|
288
288
|
|
|
289
|
-
> "Keep in mind, complex task histories might confuse simpler
|
|
289
|
+
> "Keep in mind, complex task histories might confuse simpler Task agents." - AWS Best Practices
|
|
290
290
|
|
|
291
291
|
### E2E Testing with Playwright MCP (Anthropic Harness Pattern)
|
|
292
292
|
|
|
@@ -325,7 +325,7 @@ mcp_servers = {
|
|
|
325
325
|
| Metric | What to Track | Store In |
|
|
326
326
|
|--------|---------------|----------|
|
|
327
327
|
| Wall time | Seconds from start to completion | `.loki/metrics/efficiency/` |
|
|
328
|
-
| Agent count | Number of
|
|
328
|
+
| Agent count | Number of Task agents spawned | `.loki/metrics/efficiency/` |
|
|
329
329
|
| Retry count | Attempts before success | `.loki/metrics/efficiency/` |
|
|
330
330
|
| Model usage | Haiku/Sonnet/Opus call distribution | `.loki/metrics/efficiency/` |
|
|
331
331
|
|
|
@@ -351,12 +351,12 @@ See `references/tool-orchestration.md` for full implementation details.
|
|
|
351
351
|
|
|
352
352
|
---
|
|
353
353
|
|
|
354
|
-
## Structured Prompting for
|
|
354
|
+
## Structured Prompting for Task Agents
|
|
355
355
|
|
|
356
356
|
**Single-Responsibility Principle:** Each agent should have ONE clear goal and narrow scope.
|
|
357
357
|
([UiPath Best Practices](https://www.uipath.com/blog/ai/agent-builder-best-practices))
|
|
358
358
|
|
|
359
|
-
**Every
|
|
359
|
+
**Every Task agent dispatch MUST include:**
|
|
360
360
|
|
|
361
361
|
```markdown
|
|
362
362
|
## GOAL (What success looks like)
|
|
@@ -446,7 +446,7 @@ See `references/agent-types.md` for complete definitions and capabilities.
|
|
|
446
446
|
- **NEVER** skip code review between tasks
|
|
447
447
|
- **NEVER** proceed with unfixed Critical/High/Medium issues
|
|
448
448
|
- **NEVER** dispatch reviewers sequentially (always parallel - 3x faster)
|
|
449
|
-
- **NEVER** dispatch multiple implementation
|
|
449
|
+
- **NEVER** dispatch multiple implementation Task agents in parallel (conflicts)
|
|
450
450
|
- **NEVER** implement without reading task requirements first
|
|
451
451
|
|
|
452
452
|
### Review Anti-Patterns
|
|
@@ -466,7 +466,7 @@ See `references/agent-types.md` for complete definitions and capabilities.
|
|
|
466
466
|
- **ALWAYS** wait for all reviewers before aggregating
|
|
467
467
|
- **ALWAYS** fix Critical/High/Medium immediately
|
|
468
468
|
- **ALWAYS** re-run ALL 3 reviewers after fixes
|
|
469
|
-
- **ALWAYS** checkpoint state before spawning
|
|
469
|
+
- **ALWAYS** checkpoint state before spawning Task agents
|
|
470
470
|
|
|
471
471
|
---
|
|
472
472
|
|
|
@@ -618,14 +618,14 @@ context_budget:
|
|
|
618
618
|
reserve: "90% for model reasoning"
|
|
619
619
|
```
|
|
620
620
|
|
|
621
|
-
###
|
|
621
|
+
### Task Agents for Context Isolation
|
|
622
622
|
|
|
623
|
-
**Use
|
|
623
|
+
**Use Task agents to prevent token waste on noisy subtasks:**
|
|
624
624
|
|
|
625
625
|
```
|
|
626
|
-
Main agent (focused) -->
|
|
627
|
-
-->
|
|
628
|
-
-->
|
|
626
|
+
Main agent (focused) --> Task agent (file search)
|
|
627
|
+
--> Task agent (test running)
|
|
628
|
+
--> Task agent (linting)
|
|
629
629
|
```
|
|
630
630
|
|
|
631
631
|
See `references/production-patterns.md` for full practitioner patterns.
|
|
@@ -690,7 +690,7 @@ Loki Mode with PRD at path/to/prd # Start with PRD
|
|
|
690
690
|
|-------|-------|
|
|
691
691
|
| Trigger | "Loki Mode" or "Loki Mode with PRD at [path]" |
|
|
692
692
|
| Skip When | Need human approval, want to review plan first, single small task |
|
|
693
|
-
| Related Skills |
|
|
693
|
+
| Related Skills | subagent-driven-development, executing-plans |
|
|
694
694
|
|
|
695
695
|
---
|
|
696
696
|
|
|
@@ -1473,7 +1473,7 @@ build_prompt() {
|
|
|
1473
1473
|
local analysis_instruction="CODEBASE_ANALYSIS_MODE: No PRD. FIRST: Analyze codebase - scan structure, read package.json/requirements.txt, examine README. THEN: Generate PRD at .loki/generated-prd.md. FINALLY: Execute SDLC phases."
|
|
1474
1474
|
|
|
1475
1475
|
# Context Memory Instructions
|
|
1476
|
-
local memory_instruction="CONTEXT MEMORY: Save state to .loki/memory/ledgers/LEDGER-orchestrator.md before complex operations. Create handoffs at .loki/memory/handoffs/ when passing work to
|
|
1476
|
+
local memory_instruction="CONTEXT MEMORY: Save state to .loki/memory/ledgers/LEDGER-orchestrator.md before complex operations. Create handoffs at .loki/memory/handoffs/ when passing work to Task agents. Extract learnings to .loki/memory/learnings/ after completing tasks. Check .loki/rules/ for established patterns. If context feels heavy, create .loki/signals/CONTEXT_CLEAR_REQUESTED and the wrapper will reset context with your ledger preserved."
|
|
1477
1477
|
|
|
1478
1478
|
# Load existing context if resuming
|
|
1479
1479
|
local context_injection=""
|
|
@@ -10,7 +10,7 @@ Loki Mode can optionally integrate with [Vibe Kanban](https://github.com/BloopAI
|
|
|
10
10
|
| Progress monitoring | Log files | Real-time dashboard |
|
|
11
11
|
| Manual intervention | Edit queue files | Drag-and-drop tasks |
|
|
12
12
|
| Code review | Automated 3-reviewer | + Visual diff review |
|
|
13
|
-
| Parallel agents | Background
|
|
13
|
+
| Parallel agents | Background Task agents | Isolated git worktrees |
|
|
14
14
|
|
|
15
15
|
## Setup
|
|
16
16
|
|
|
@@ -34,7 +34,7 @@ Every iteration follows this cycle:
|
|
|
34
34
|
| - Determine exact steps to complete it |
|
|
35
35
|
+-------------------------------------------------------------------+
|
|
36
36
|
| ACT: Execute the task |
|
|
37
|
-
| - Dispatch
|
|
37
|
+
| - Dispatch Task agent via Task tool OR execute directly |
|
|
38
38
|
| - Write code, run tests, fix issues |
|
|
39
39
|
| - Commit changes atomically (git checkpoint) |
|
|
40
40
|
| - Update queue files (.loki/queue/*.json) |
|
|
@@ -266,10 +266,10 @@ move_tasks_to_pending after_task=$last_good_task_id
|
|
|
266
266
|
|
|
267
267
|
---
|
|
268
268
|
|
|
269
|
-
## If
|
|
269
|
+
## If Task Agent Fails
|
|
270
270
|
|
|
271
271
|
1. Do NOT try to fix manually (context pollution)
|
|
272
|
-
2. Dispatch fix
|
|
273
|
-
3. If fix
|
|
272
|
+
2. Dispatch fix Task agent with specific error context
|
|
273
|
+
3. If fix Task agent fails 3x, move to dead letter queue
|
|
274
274
|
4. Open circuit breaker for that agent type
|
|
275
275
|
5. Alert orchestrator for human review
|
|
@@ -283,20 +283,20 @@ skills_architecture:
|
|
|
283
283
|
- Skills can be updated independently
|
|
284
284
|
```
|
|
285
285
|
|
|
286
|
-
###
|
|
286
|
+
### Task Agents for Context Isolation
|
|
287
287
|
|
|
288
288
|
**Key Insight:** Prevent massive token waste by isolating context-noisy subtasks.
|
|
289
289
|
|
|
290
290
|
```python
|
|
291
291
|
async def context_isolated_search(query, codebase_path):
|
|
292
292
|
"""
|
|
293
|
-
Use
|
|
293
|
+
Use Task agent for grep/search to prevent context pollution.
|
|
294
294
|
Based on Simon Willison's patterns.
|
|
295
295
|
"""
|
|
296
296
|
# Main agent stays focused
|
|
297
|
-
#
|
|
297
|
+
# Task agent handles noisy file searching
|
|
298
298
|
|
|
299
|
-
search_agent =
|
|
299
|
+
search_agent = spawn_task_agent(
|
|
300
300
|
role="codebase-searcher",
|
|
301
301
|
context_limit="10k tokens",
|
|
302
302
|
permissions=["read-only"]
|
|
@@ -538,11 +538,11 @@ cost_patterns:
|
|
|
538
538
|
max_tier: "$200/month often needs 2-3 subscriptions"
|
|
539
539
|
|
|
540
540
|
token_economics:
|
|
541
|
-
|
|
541
|
+
task_agents_multiply_cost: "Each duplicates context"
|
|
542
542
|
example: "5-task parallel job = 50,000+ tokens per subtask"
|
|
543
543
|
|
|
544
544
|
optimization:
|
|
545
|
-
context_isolation: "Use
|
|
545
|
+
context_isolation: "Use Task agents for noisy tasks"
|
|
546
546
|
information_abstraction: "Summarize, don't dump"
|
|
547
547
|
fresh_conversations: "Reset after major tasks"
|
|
548
548
|
skill_on_demand: "Load only when needed"
|
|
@@ -273,9 +273,9 @@ Task(subagent_type="general-purpose", model="opus",
|
|
|
273
273
|
|
|
274
274
|
---
|
|
275
275
|
|
|
276
|
-
## Structured Prompting for
|
|
276
|
+
## Structured Prompting for Task Agents
|
|
277
277
|
|
|
278
|
-
**Every
|
|
278
|
+
**Every Task agent dispatch MUST include:**
|
|
279
279
|
|
|
280
280
|
```markdown
|
|
281
281
|
## GOAL (What success looks like)
|
|
@@ -197,15 +197,15 @@ jobs:
|
|
|
197
197
|
### Workflow Per Task:
|
|
198
198
|
|
|
199
199
|
```
|
|
200
|
-
1. Dispatch implementation
|
|
201
|
-
2.
|
|
200
|
+
1. Dispatch implementation Task agent (Task tool, model: sonnet)
|
|
201
|
+
2. Task agent implements with TDD, commits, reports back
|
|
202
202
|
3. Dispatch 3 reviewers IN PARALLEL (single message, 3 Task calls):
|
|
203
203
|
- code-reviewer (opus)
|
|
204
204
|
- business-logic-reviewer (opus)
|
|
205
205
|
- security-reviewer (opus)
|
|
206
206
|
4. Aggregate findings by severity
|
|
207
207
|
5. IF Critical/High/Medium found:
|
|
208
|
-
- Dispatch fix
|
|
208
|
+
- Dispatch fix Task agent
|
|
209
209
|
- Re-run ALL 3 reviewers
|
|
210
210
|
- Loop until all PASS
|
|
211
211
|
6. Add TODO comments for Low issues
|
|
@@ -46,7 +46,7 @@ The multi-agent approach ensures each aspect is handled by domain experts:
|
|
|
46
46
|
## Phase 1: Data & Requirements Analysis
|
|
47
47
|
|
|
48
48
|
<Task>
|
|
49
|
-
subagent_type:
|
|
49
|
+
subagent_type: general-purpose
|
|
50
50
|
prompt: |
|
|
51
51
|
Analyze and design data pipeline for ML system with requirements: $ARGUMENTS
|
|
52
52
|
|
|
@@ -73,7 +73,7 @@ prompt: |
|
|
|
73
73
|
</Task>
|
|
74
74
|
|
|
75
75
|
<Task>
|
|
76
|
-
subagent_type:
|
|
76
|
+
subagent_type: general-purpose
|
|
77
77
|
prompt: |
|
|
78
78
|
Design feature engineering and model requirements for: $ARGUMENTS
|
|
79
79
|
Using data architecture from: {phase1.data-engineer.output}
|
|
@@ -103,7 +103,7 @@ prompt: |
|
|
|
103
103
|
## Phase 2: Model Development & Training
|
|
104
104
|
|
|
105
105
|
<Task>
|
|
106
|
-
subagent_type:
|
|
106
|
+
subagent_type: general-purpose
|
|
107
107
|
prompt: |
|
|
108
108
|
Implement training pipeline based on requirements: {phase1.data-scientist.output}
|
|
109
109
|
Using data pipeline: {phase1.data-engineer.output}
|
|
@@ -131,7 +131,7 @@ prompt: |
|
|
|
131
131
|
</Task>
|
|
132
132
|
|
|
133
133
|
<Task>
|
|
134
|
-
subagent_type:
|
|
134
|
+
subagent_type: general-purpose
|
|
135
135
|
prompt: |
|
|
136
136
|
Optimize and productionize ML code from: {phase2.ml-engineer.output}
|
|
137
137
|
|
|
@@ -160,7 +160,7 @@ prompt: |
|
|
|
160
160
|
## Phase 3: Production Deployment & Serving
|
|
161
161
|
|
|
162
162
|
<Task>
|
|
163
|
-
subagent_type:
|
|
163
|
+
subagent_type: general-purpose
|
|
164
164
|
prompt: |
|
|
165
165
|
Design production deployment for models from: {phase2.ml-engineer.output}
|
|
166
166
|
With optimized code from: {phase2.python-pro.output}
|
|
@@ -194,7 +194,7 @@ prompt: |
|
|
|
194
194
|
</Task>
|
|
195
195
|
|
|
196
196
|
<Task>
|
|
197
|
-
subagent_type:
|
|
197
|
+
subagent_type: general-purpose
|
|
198
198
|
prompt: |
|
|
199
199
|
Design Kubernetes infrastructure for ML workloads from: {phase3.mlops-engineer.output}
|
|
200
200
|
|
|
@@ -223,7 +223,7 @@ prompt: |
|
|
|
223
223
|
## Phase 4: Monitoring & Continuous Improvement
|
|
224
224
|
|
|
225
225
|
<Task>
|
|
226
|
-
subagent_type:
|
|
226
|
+
subagent_type: general-purpose
|
|
227
227
|
prompt: |
|
|
228
228
|
Implement comprehensive monitoring for ML system deployed in: {phase3.mlops-engineer.output}
|
|
229
229
|
Using Kubernetes infrastructure: {phase3.kubernetes-architect.output}
|
|
@@ -179,7 +179,7 @@ Read the documentation of the target API to understand:
|
|
|
179
179
|
- Available endpoints and functionality
|
|
180
180
|
- If ambiguity exists, fetch additional information from the web
|
|
181
181
|
- Parallelize this step AS MUCH AS POSSIBLE
|
|
182
|
-
- Ensure each
|
|
182
|
+
- Ensure each Task agent is ONLY examining documentation from the file system or on the web
|
|
183
183
|
|
|
184
184
|
### Step 2: Tool Inspection
|
|
185
185
|
|
|
@@ -204,8 +204,8 @@ After understanding the API and tools, USE the MCP server tools:
|
|
|
204
204
|
- Goal: identify specific content (e.g., users, channels, messages, projects, tasks) for creating realistic questions
|
|
205
205
|
- Should NOT call any tools that modify state
|
|
206
206
|
- Will NOT read the code of the MCP server implementation itself
|
|
207
|
-
- Parallelize this step with individual
|
|
208
|
-
- Ensure each
|
|
207
|
+
- Parallelize this step with individual Task agents pursuing independent explorations
|
|
208
|
+
- Ensure each Task agent is only performing READ-ONLY, NON-DESTRUCTIVE, and IDEMPOTENT operations
|
|
209
209
|
- BE CAREFUL: SOME TOOLS may return LOTS OF DATA which would cause you to run out of CONTEXT
|
|
210
210
|
- Make INCREMENTAL, SMALL, AND TARGETED tool calls for exploration
|
|
211
211
|
- In all tool call requests, use the `limit` parameter to limit results (<10)
|
|
@@ -4,7 +4,7 @@ Intelligent management and execution of Model Context Protocol (MCP) servers.
|
|
|
4
4
|
|
|
5
5
|
## Overview
|
|
6
6
|
|
|
7
|
-
This skill enables Claude to discover, analyze, and execute MCP server capabilities without polluting the main context window. Perfect for context-efficient MCP integration using
|
|
7
|
+
This skill enables Claude to discover, analyze, and execute MCP server capabilities without polluting the main context window. Perfect for context-efficient MCP integration using a Task-agent-based architecture.
|
|
8
8
|
|
|
9
9
|
## Features
|
|
10
10
|
|
|
@@ -12,7 +12,7 @@ This skill enables Claude to discover, analyze, and execute MCP server capabilit
|
|
|
12
12
|
- **Intelligent Tool Discovery**: Analyze which tools are relevant for specific tasks
|
|
13
13
|
- **Progressive Disclosure**: Load only necessary tool definitions
|
|
14
14
|
- **Execution Engine**: Call MCP tools with proper parameter handling
|
|
15
|
-
- **Context Efficiency**: Delegate MCP operations to `mcp-manager`
|
|
15
|
+
- **Context Efficiency**: Delegate MCP operations to `mcp-manager` Task agent
|
|
16
16
|
|
|
17
17
|
## Quick Start
|
|
18
18
|
|
|
@@ -71,13 +71,13 @@ The LLM reads `assets/tools.json` and intelligently selects tools. No separate a
|
|
|
71
71
|
npx ts-node scripts/cli.ts call-tool memory add '{"key":"name","value":"Alice"}'
|
|
72
72
|
```
|
|
73
73
|
|
|
74
|
-
### Pattern 4: Use with
|
|
74
|
+
### Pattern 4: Use with Task agent
|
|
75
75
|
|
|
76
76
|
In main Claude conversation:
|
|
77
77
|
|
|
78
78
|
```
|
|
79
79
|
User: "I need to search the web and save results"
|
|
80
|
-
Main Agent: [Spawns mcp-manager
|
|
80
|
+
Main Agent: [Spawns mcp-manager Task agent]
|
|
81
81
|
mcp-manager: Discovers brave-search + memory tools, reports back
|
|
82
82
|
Main Agent: Uses recommended tools for implementation
|
|
83
83
|
```
|
|
@@ -87,7 +87,7 @@ Main Agent: Uses recommended tools for implementation
|
|
|
87
87
|
```
|
|
88
88
|
Main Agent (Claude)
|
|
89
89
|
↓ (delegates MCP tasks)
|
|
90
|
-
mcp-manager
|
|
90
|
+
mcp-manager Task agent
|
|
91
91
|
↓ (uses skill)
|
|
92
92
|
mcp-management Skill
|
|
93
93
|
↓ (connects via)
|
|
@@ -96,7 +96,7 @@ MCP Servers (memory, filesystem, etc.)
|
|
|
96
96
|
|
|
97
97
|
**Benefits**:
|
|
98
98
|
- Main agent context stays clean
|
|
99
|
-
- MCP discovery happens in isolated
|
|
99
|
+
- MCP discovery happens in isolated Task agent context
|
|
100
100
|
- Only relevant tool definitions loaded when needed
|
|
101
101
|
- Reduced token usage
|
|
102
102
|
|
|
@@ -15,7 +15,7 @@ MCP is an open protocol enabling AI agents to connect to external tools and data
|
|
|
15
15
|
- Progressive disclosure of MCP capabilities (load only what's needed)
|
|
16
16
|
- Intelligent tool/prompt/resource selection based on task requirements
|
|
17
17
|
- Multi-server management from single config file
|
|
18
|
-
- Context-efficient:
|
|
18
|
+
- Context-efficient: Task agents handle MCP discovery and execution
|
|
19
19
|
- Persistent tool catalog: automatically saves discovered tools to JSON for fast reference
|
|
20
20
|
|
|
21
21
|
## When to Use This Skill
|
|
@@ -25,7 +25,7 @@ Use this skill when:
|
|
|
25
25
|
2. **Task-Based Tool Selection**: Analyzing which MCP tools are relevant for a specific task
|
|
26
26
|
3. **Executing MCP Tools**: Calling MCP tools programmatically with proper parameter handling
|
|
27
27
|
4. **MCP Integration**: Building or debugging MCP client implementations
|
|
28
|
-
5. **Context Management**: Avoiding context pollution by delegating MCP operations to
|
|
28
|
+
5. **Context Management**: Avoiding context pollution by delegating MCP operations to Task agents
|
|
29
29
|
|
|
30
30
|
## Core Capabilities
|
|
31
31
|
|
|
@@ -80,7 +80,7 @@ echo "Take a screenshot of https://example.com" | gemini -y -m gemini-2.5-flash
|
|
|
80
80
|
npx tsx scripts/cli.ts call-tool memory create_entities '{"entities":[...]}'
|
|
81
81
|
```
|
|
82
82
|
|
|
83
|
-
**Fallback: mcp-manager
|
|
83
|
+
**Fallback: mcp-manager Task agent**
|
|
84
84
|
|
|
85
85
|
See [references/gemini-cli-integration.md](references/gemini-cli-integration.md) for complete examples.
|
|
86
86
|
|
|
@@ -106,14 +106,14 @@ echo "Take a screenshot of https://example.com. Return JSON only per GEMINI.md i
|
|
|
106
106
|
- Automatic tool discovery
|
|
107
107
|
- Structured JSON responses (parseable by Claude)
|
|
108
108
|
- GEMINI.md auto-loaded for consistent formatting
|
|
109
|
-
- Faster than
|
|
109
|
+
- Faster than Task agent orchestration
|
|
110
110
|
- No natural language ambiguity
|
|
111
111
|
|
|
112
112
|
See [references/gemini-cli-integration.md](references/gemini-cli-integration.md) for complete guide.
|
|
113
113
|
|
|
114
|
-
### Pattern 2:
|
|
114
|
+
### Pattern 2: Task Agent-Based Execution (Fallback)
|
|
115
115
|
|
|
116
|
-
Use `mcp-manager` agent when Gemini CLI unavailable.
|
|
116
|
+
Use the `mcp-manager` agent when Gemini CLI is unavailable. The Task agent discovers tools, selects relevant ones, executes tasks, and reports back.
|
|
117
117
|
|
|
118
118
|
**Benefit**: Main context stays clean, only relevant tool definitions loaded when needed.
|
|
119
119
|
|
|
@@ -166,7 +166,7 @@ npx tsx cli.ts list-tools # Saves to assets/tools.json
|
|
|
166
166
|
npx tsx cli.ts call-tool memory create_entities '{"entities":[...]}'
|
|
167
167
|
```
|
|
168
168
|
|
|
169
|
-
**Method 3: mcp-manager
|
|
169
|
+
**Method 3: mcp-manager Task agent**
|
|
170
170
|
|
|
171
171
|
See [references/gemini-cli-integration.md](references/gemini-cli-integration.md) for complete guide.
|
|
172
172
|
|
|
@@ -193,7 +193,7 @@ See [references/mcp-protocol.md](references/mcp-protocol.md) for:
|
|
|
193
193
|
- Use when: Need specific tool/server control
|
|
194
194
|
- Execute: `npx tsx scripts/cli.ts call-tool <server> <tool> <args>`
|
|
195
195
|
|
|
196
|
-
3. **mcp-manager
|
|
196
|
+
3. **mcp-manager Task agent** (Fallback): Context-efficient delegation
|
|
197
197
|
- Use when: Gemini unavailable or failed
|
|
198
198
|
- Keeps main context clean
|
|
199
199
|
|
|
@@ -206,7 +206,7 @@ Shows detailed MCP communication logs.
|
|
|
206
206
|
| Direct Scripts | ⭐⭐ | ⭐⭐⭐ | ⭐⭐⭐ | Specific tools |
|
|
207
207
|
| mcp-manager | ⭐ | ⭐⭐ | ⭐⭐⭐ | Fallback |
|
|
208
208
|
|
|
209
|
-
**Recommendation**: Use Gemini CLI as primary method, fallback to scripts/
|
|
209
|
+
**Recommendation**: Use Gemini CLI as the primary method; fall back to scripts or the Task agent when it is unavailable.
|
|
210
210
|
|
|
211
211
|
## Resources
|
|
212
212
|
|
|
@@ -12,7 +12,7 @@ Master orchestrator, peer-to-peer, and hierarchical multi-agent architectures
|
|
|
12
12
|
Use this skill when working with master orchestrator, peer-to-peer, and hierarchical multi-agent architectures.
|
|
13
13
|
# Multi-Agent Architecture Patterns
|
|
14
14
|
|
|
15
|
-
Multi-agent architectures distribute work across multiple language model instances, each with its own context window. When designed well, this distribution enables capabilities beyond single-agent limits. When designed poorly, it introduces coordination overhead that negates benefits. The critical insight is that
|
|
15
|
+
Multi-agent architectures distribute work across multiple language model instances, each with its own context window. When designed well, this distribution enables capabilities beyond single-agent limits. When designed poorly, it introduces coordination overhead that negates benefits. The critical insight is that Task agents exist primarily to isolate context, not to anthropomorphize role division.
|
|
16
16
|
|
|
17
17
|
## When to Activate
|
|
18
18
|
|
|
@@ -26,7 +26,7 @@ Activate this skill when:
|
|
|
26
26
|
|
|
27
27
|
## Core Concepts
|
|
28
28
|
|
|
29
|
-
Multi-agent systems address single-agent context limitations through distribution. Three dominant patterns exist: supervisor/orchestrator for centralized control, peer-to-peer/swarm for flexible handoffs, and hierarchical for layered abstraction. The critical design principle is context isolation—
|
|
29
|
+
Multi-agent systems address single-agent context limitations through distribution. Three dominant patterns exist: supervisor/orchestrator for centralized control, peer-to-peer/swarm for flexible handoffs, and hierarchical for layered abstraction. The critical design principle is context isolation—Task agents exist primarily to partition context rather than to simulate organizational roles.
|
|
30
30
|
|
|
31
31
|
Effective multi-agent systems require explicit coordination protocols, consensus mechanisms that avoid sycophancy, and careful attention to failure modes including bottlenecks, divergence, and error propagation.
|
|
32
32
|
|
|
@@ -75,20 +75,20 @@ When to use: Complex tasks with clear decomposition, tasks requiring coordinatio
|
|
|
75
75
|
|
|
76
76
|
Advantages: Strict control over workflow, easier to implement human-in-the-loop interventions, ensures adherence to predefined plans.
|
|
77
77
|
|
|
78
|
-
Disadvantages: Supervisor context becomes bottleneck, supervisor failures cascade to all workers, "telephone game" problem where supervisors paraphrase
|
|
78
|
+
Disadvantages: Supervisor context becomes a bottleneck, supervisor failures cascade to all workers, "telephone game" problem where supervisors paraphrase Task agent responses incorrectly.
|
|
79
79
|
|
|
80
80
|
**The Telephone Game Problem and Solution**
|
|
81
|
-
LangGraph benchmarks found supervisor architectures initially performed 50% worse than optimized versions due to the "telephone game" problem where supervisors paraphrase
|
|
81
|
+
LangGraph benchmarks found supervisor architectures initially performed 50% worse than optimized versions due to the "telephone game" problem where supervisors paraphrase Task agent responses incorrectly, losing fidelity.
|
|
82
82
|
|
|
83
|
-
The fix: implement a `forward_message` tool allowing
|
|
83
|
+
The fix: implement a `forward_message` tool allowing Task agents to pass responses directly to users:
|
|
84
84
|
|
|
85
85
|
```python
|
|
86
86
|
def forward_message(message: str, to_user: bool = True):
|
|
87
87
|
"""
|
|
88
|
-
Forward
|
|
89
|
-
|
|
88
|
+
Forward Task agent response directly to user without supervisor synthesis.
|
|
89
|
+
|
|
90
90
|
Use when:
|
|
91
|
-
-
|
|
91
|
+
- Task agent response is final and complete
|
|
92
92
|
- Supervisor synthesis would lose important details
|
|
93
93
|
- Response format must be preserved exactly
|
|
94
94
|
"""
|
|
@@ -97,9 +97,9 @@ def forward_message(message: str, to_user: bool = True):
|
|
|
97
97
|
return {"type": "supervisor_input", "content": message}
|
|
98
98
|
```
|
|
99
99
|
|
|
100
|
-
With this pattern, swarm architectures slightly outperform supervisors because
|
|
100
|
+
With this pattern, swarm architectures slightly outperform supervisors because Task agents respond directly to users, eliminating translation errors.
|
|
101
101
|
|
|
102
|
-
Implementation note: Implement direct pass-through mechanisms allowing
|
|
102
|
+
Implementation note: Implement direct pass-through mechanisms allowing Task agents to pass responses directly to users rather than through supervisor synthesis when appropriate.
|
|
103
103
|
|
|
104
104
|
**Pattern 2: Peer-to-Peer/Swarm**
|
|
105
105
|
The peer-to-peer pattern removes central control, allowing agents to communicate directly based on predefined protocols. Any agent can transfer control to any other through explicit handoff mechanisms.
|
|
@@ -137,17 +137,17 @@ Disadvantages: Coordination overhead between layers, potential for misalignment
|
|
|
137
137
|
|
|
138
138
|
### Context Isolation as Design Principle
|
|
139
139
|
|
|
140
|
-
The primary purpose of multi-agent architectures is context isolation. Each
|
|
140
|
+
The primary purpose of multi-agent architectures is context isolation. Each Task agent operates in a clean context window focused on its subtask without carrying accumulated context from other subtasks.
|
|
141
141
|
|
|
142
142
|
**Isolation Mechanisms**
|
|
143
|
-
Full context delegation: For complex tasks where the
|
|
143
|
+
Full context delegation: For complex tasks where the Task agent needs complete understanding, the planner shares its entire context. The Task agent has its own tools and instructions but receives full context for its decisions.
|
|
144
144
|
|
|
145
|
-
Instruction passing: For simple, well-defined subtasks, the planner creates instructions via function call. The
|
|
145
|
+
Instruction passing: For simple, well-defined subtasks, the planner creates instructions via function call. The Task agent receives only the instructions needed for its specific task.
|
|
146
146
|
|
|
147
147
|
File system memory: For complex tasks requiring shared state, agents read and write to persistent storage. The file system serves as the coordination mechanism, avoiding context bloat from shared state passing.
|
|
148
148
|
|
|
149
149
|
**Isolation Trade-offs**
|
|
150
|
-
Full context delegation provides maximum capability but defeats the purpose of
|
|
150
|
+
Full context delegation provides maximum capability but defeats the purpose of Task agents. Instruction passing maintains isolation but limits Task agent flexibility. File system memory enables shared state without context passing but introduces latency and consistency challenges.
|
|
151
151
|
|
|
152
152
|
The right choice depends on task complexity, coordination needs, and acceptable latency.
|
|
153
153
|
|