@ngxtm/devkit 3.18.0 → 3.20.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/merged-commands/application-performance-performance-optimization.md +13 -13
- package/merged-commands/ask/fast.md +14 -57
- package/merged-commands/ask/hard.md +22 -79
- package/merged-commands/auto.md +6 -33
- package/merged-commands/backend-development-feature-development.md +12 -12
- package/merged-commands/bootstrap/auto/fast.md +15 -15
- package/merged-commands/bootstrap/auto/parallel.md +12 -12
- package/merged-commands/bootstrap/auto.md +14 -14
- package/merged-commands/bootstrap.md +15 -15
- package/merged-commands/brainstorm/fast.md +19 -72
- package/merged-commands/brainstorm/hard.md +23 -84
- package/merged-commands/c4-architecture-c4-architecture.md +5 -5
- package/merged-commands/code/auto.md +16 -16
- package/merged-commands/code/fast.md +19 -72
- package/merged-commands/code/hard.md +38 -122
- package/merged-commands/code/no-test.md +12 -12
- package/merged-commands/code/parallel.md +9 -9
- package/merged-commands/code.md +14 -14
- package/merged-commands/comprehensive-review-full-review.md +8 -8
- package/merged-commands/context-degradation.md +2 -2
- package/merged-commands/context-engineering.md +4 -4
- package/merged-commands/context-optimization.md +3 -3
- package/merged-commands/cook/auto/fast.md +3 -3
- package/merged-commands/cook/auto/parallel.md +9 -9
- package/merged-commands/cook/auto.md +1 -1
- package/merged-commands/cook/fast.md +38 -47
- package/merged-commands/cook/hard.md +46 -41
- package/merged-commands/cook.md +13 -13
- package/merged-commands/daily-news-report.md +15 -15
- package/merged-commands/data-engineering-data-driven-feature.md +16 -16
- package/merged-commands/debug/fast.md +13 -29
- package/merged-commands/debug/hard.md +47 -49
- package/merged-commands/debug.md +1 -1
- package/merged-commands/debugging-toolkit-smart-debug.md +1 -1
- package/merged-commands/deploy/check.md +22 -71
- package/merged-commands/deploy/preview.md +18 -62
- package/merged-commands/deploy/production.md +22 -71
- package/merged-commands/deploy/rollback.md +22 -71
- package/merged-commands/deploy.md +0 -11
- package/merged-commands/design/3d.md +3 -3
- package/merged-commands/design/describe.md +1 -1
- package/merged-commands/design/fast.md +2 -2
- package/merged-commands/design/good.md +3 -3
- package/merged-commands/design/hard.md +15 -85
- package/merged-commands/design/screenshot.md +1 -1
- package/merged-commands/design/video.md +1 -1
- package/merged-commands/design.md +0 -11
- package/merged-commands/doc-coauthoring.md +5 -5
- package/merged-commands/docker-expert.md +1 -1
- package/merged-commands/docs/audit.md +26 -77
- package/merged-commands/docs/business.md +26 -77
- package/merged-commands/docs/core.md +24 -68
- package/merged-commands/docs/init.md +8 -8
- package/merged-commands/docs/update.md +13 -13
- package/merged-commands/docs.md +0 -12
- package/merged-commands/error-debugging-multi-agent-review.md +1 -1
- package/merged-commands/error-diagnostics-smart-debug.md +1 -1
- package/merged-commands/finishing-a-development-branch.md +1 -1
- package/merged-commands/fix/ci.md +2 -2
- package/merged-commands/fix/fast.md +2 -2
- package/merged-commands/fix/hard.md +6 -6
- package/merged-commands/fix/logs.md +5 -5
- package/merged-commands/fix/parallel.md +9 -9
- package/merged-commands/fix/test.md +6 -6
- package/merged-commands/fix/ui.md +8 -8
- package/merged-commands/fixing.md +3 -3
- package/merged-commands/framework-migration-legacy-modernize.md +13 -13
- package/merged-commands/full-stack-orchestration-full-stack-feature.md +12 -12
- package/merged-commands/git/cm.md +1 -1
- package/merged-commands/git/cp.md +1 -1
- package/merged-commands/git/merge.md +1 -1
- package/merged-commands/git/pr.md +1 -1
- package/merged-commands/git-pr-workflows-git-workflow.md +10 -10
- package/merged-commands/google-adk-python.md +1 -1
- package/merged-commands/hr-pro.md +1 -1
- package/merged-commands/incident-response-incident-response.md +13 -13
- package/merged-commands/integrate/polar.md +3 -3
- package/merged-commands/integrate/sepay.md +3 -3
- package/merged-commands/journal.md +1 -1
- package/merged-commands/learn.md +51 -4
- package/merged-commands/linear-claude-skill.md +2 -2
- package/merged-commands/loki-mode.md +14 -14
- package/merged-commands/machine-learning-ops-ml-pipeline.md +7 -7
- package/merged-commands/mcp-management.md +8 -8
- package/merged-commands/multi-agent-patterns.md +14 -14
- package/merged-commands/multi-platform-apps-multi-platform.md +10 -10
- package/merged-commands/nestjs-expert.md +1 -1
- package/merged-commands/performance-testing-review-multi-agent-review.md +1 -1
- package/merged-commands/plan/archive.md +1 -1
- package/merged-commands/plan/ci.md +1 -1
- package/merged-commands/plan/fast.md +2 -2
- package/merged-commands/plan/hard.md +4 -4
- package/merged-commands/plan/parallel.md +5 -5
- package/merged-commands/plan/two.md +6 -6
- package/merged-commands/requesting-code-review.md +6 -6
- package/merged-commands/review/codebase/parallel.md +5 -5
- package/merged-commands/review/codebase.md +5 -5
- package/merged-commands/review/fast.md +13 -29
- package/merged-commands/review/hard.md +48 -49
- package/merged-commands/review.md +0 -11
- package/merged-commands/security-scanning-security-hardening.md +13 -13
- package/merged-commands/skill/add.md +6 -6
- package/merged-commands/skill/create.md +6 -6
- package/merged-commands/skill/fix-logs.md +6 -6
- package/merged-commands/skill/optimize/auto.md +1 -1
- package/merged-commands/skill/optimize.md +1 -1
- package/merged-commands/skill/plan.md +1 -1
- package/merged-commands/skill/update.md +6 -6
- package/merged-commands/subagent-driven-development.md +53 -53
- package/merged-commands/tdd-workflows-tdd-cycle.md +12 -12
- package/merged-commands/tdd-workflows-tdd-red.md +1 -1
- package/merged-commands/tdd-workflows-tdd-refactor.md +1 -1
- package/merged-commands/test/fast.md +22 -33
- package/merged-commands/test/hard.md +59 -56
- package/merged-commands/test/ui.md +1 -1
- package/merged-commands/test.md +1 -1
- package/merged-commands/typescript-expert.md +1 -1
- package/merged-commands/use-mcp.md +5 -5
- package/merged-commands/writing-plans.md +3 -3
- package/merged-commands/writing-skills.md +8 -8
- package/package.json +1 -1
- package/rules-index.json +1 -1
- package/skills/application-performance-performance-optimization/SKILL.md +13 -13
- package/skills/azure-ai-agents-python/references/tools.md +1 -1
- package/skills/backend-development-feature-development/SKILL.md +12 -12
- package/skills/best-practices/references/anti-patterns.md +2 -2
- package/skills/best-practices/references/best-practices-guide.md +14 -14
- package/skills/c4-architecture-c4-architecture/SKILL.md +5 -5
- package/skills/comprehensive-review-full-review/SKILL.md +8 -8
- package/skills/context-degradation/SKILL.md +2 -2
- package/skills/context-engineering/SKILL.md +4 -4
- package/skills/context-engineering/references/context-degradation.md +1 -1
- package/skills/context-engineering/references/context-optimization.md +1 -1
- package/skills/context-engineering/references/multi-agent-patterns.md +1 -1
- package/skills/context-engineering/references/runtime-awareness.md +1 -1
- package/skills/context-optimization/SKILL.md +3 -3
- package/skills/daily-news-report/SKILL.md +15 -15
- package/skills/data-engineering-data-driven-feature/SKILL.md +16 -16
- package/skills/debugging-toolkit-smart-debug/SKILL.md +1 -1
- package/skills/doc-coauthoring/SKILL.md +5 -5
- package/skills/docker-expert/SKILL.md +1 -1
- package/skills/error-debugging-multi-agent-review/SKILL.md +1 -1
- package/skills/error-diagnostics-smart-debug/SKILL.md +1 -1
- package/skills/finishing-a-development-branch/SKILL.md +1 -1
- package/skills/fixing/SKILL.md +3 -3
- package/skills/fixing/references/parallel-exploration.md +4 -4
- package/skills/fixing/references/skill-activation-matrix.md +3 -3
- package/skills/fixing/references/workflow-deep.md +11 -11
- package/skills/fixing/references/workflow-quick.md +4 -4
- package/skills/fixing/references/workflow-standard.md +12 -12
- package/skills/framework-migration-legacy-modernize/SKILL.md +13 -13
- package/skills/full-stack-orchestration-full-stack-feature/SKILL.md +12 -12
- package/skills/git-pr-workflows-git-workflow/SKILL.md +10 -10
- package/skills/google-adk-python/SKILL.md +1 -1
- package/skills/hr-pro/SKILL.md +1 -1
- package/skills/incident-response-incident-response/SKILL.md +13 -13
- package/skills/incident-response-smart-fix/resources/implementation-playbook.md +17 -17
- package/skills/learn/SKILL.md +51 -4
- package/skills/linear-claude-skill/SKILL.md +2 -2
- package/skills/loki-mode/ACKNOWLEDGEMENTS.md +4 -4
- package/skills/loki-mode/CHANGELOG.md +9 -9
- package/skills/loki-mode/CONTEXT-EXPORT.md +1 -1
- package/skills/loki-mode/README.md +2 -2
- package/skills/loki-mode/SKILL.md +14 -14
- package/skills/loki-mode/autonomy/run.sh +1 -1
- package/skills/loki-mode/integrations/vibe-kanban.md +1 -1
- package/skills/loki-mode/references/core-workflow.md +4 -4
- package/skills/loki-mode/references/production-patterns.md +6 -6
- package/skills/loki-mode/references/quality-control.md +2 -2
- package/skills/loki-mode/references/sdlc-phases.md +3 -3
- package/skills/machine-learning-ops-ml-pipeline/SKILL.md +7 -7
- package/skills/mcp-builder/reference/evaluation.md +3 -3
- package/skills/mcp-management/README.md +6 -6
- package/skills/mcp-management/SKILL.md +8 -8
- package/skills/mcp-management/references/gemini-cli-integration.md +1 -1
- package/skills/multi-agent-patterns/SKILL.md +14 -14
- package/skills/multi-platform-apps-multi-platform/SKILL.md +10 -10
- package/skills/nestjs-expert/SKILL.md +1 -1
- package/skills/performance-testing-review-multi-agent-review/SKILL.md +1 -1
- package/skills/planning-with-files/reference.md +2 -2
- package/skills/requesting-code-review/SKILL.md +6 -6
- package/skills/security-scanning-security-hardening/SKILL.md +13 -13
- package/skills/subagent-driven-development/SKILL.md +53 -53
- package/skills/subagent-driven-development/code-quality-reviewer-prompt.md +1 -1
- package/skills/subagent-driven-development/implementer-prompt.md +3 -3
- package/skills/subagent-driven-development/spec-reviewer-prompt.md +1 -1
- package/skills/tdd-workflows-tdd-cycle/SKILL.md +12 -12
- package/skills/tdd-workflows-tdd-green/resources/implementation-playbook.md +1 -1
- package/skills/tdd-workflows-tdd-red/SKILL.md +1 -1
- package/skills/tdd-workflows-tdd-refactor/SKILL.md +1 -1
- package/skills/typescript-expert/SKILL.md +1 -1
- package/skills/writing-plans/SKILL.md +3 -3
- package/skills/writing-skills/SKILL.md +8 -8
- package/skills/writing-skills/examples/CLAUDE_MD_TESTING.md +1 -1
- package/skills/writing-skills/references/cso/README.md +3 -3
- package/skills/writing-skills/testing-skills-with-subagents.md +1 -1
|
@@ -45,19 +45,19 @@ Orchestrate multi-agent incident response with modern SRE practices for rapid re
|
|
|
45
45
|
## Phase 1: Detection & Triage
|
|
46
46
|
|
|
47
47
|
### 1. Incident Detection and Classification
|
|
48
|
-
- Use Task tool with subagent_type="
|
|
48
|
+
- Use Task tool with subagent_type="general-purpose"
|
|
49
49
|
- Prompt: "URGENT: Detect and classify incident: $ARGUMENTS. Analyze alerts from PagerDuty/Opsgenie/monitoring. Determine: 1) Incident severity (P0-P3), 2) Affected services and dependencies, 3) User impact and business risk, 4) Initial incident command structure needed. Check error budgets and SLO violations."
|
|
50
50
|
- Output: Severity classification, impact assessment, incident command assignments, SLO status
|
|
51
51
|
- Context: Initial alerts, monitoring dashboards, recent changes
|
|
52
52
|
|
|
53
53
|
### 2. Observability Analysis
|
|
54
|
-
- Use Task tool with subagent_type="
|
|
54
|
+
- Use Task tool with subagent_type="general-purpose"
|
|
55
55
|
- Prompt: "Perform rapid observability sweep for incident: $ARGUMENTS. Query: 1) Distributed tracing (OpenTelemetry/Jaeger), 2) Metrics correlation (Prometheus/Grafana/DataDog), 3) Log aggregation (ELK/Splunk), 4) APM data, 5) Real User Monitoring. Identify anomalies, error patterns, and service degradation points."
|
|
56
56
|
- Output: Observability findings, anomaly detection, service health matrix, trace analysis
|
|
57
57
|
- Context: Severity level from step 1, affected services
|
|
58
58
|
|
|
59
59
|
### 3. Initial Mitigation
|
|
60
|
-
- Use Task tool with subagent_type="
|
|
60
|
+
- Use Task tool with subagent_type="general-purpose"
|
|
61
61
|
- Prompt: "Implement immediate mitigation for P$SEVERITY incident: $ARGUMENTS. Actions: 1) Traffic throttling/rerouting if needed, 2) Feature flag disabling for affected features, 3) Circuit breaker activation, 4) Rollback assessment for recent deployments, 5) Scale resources if capacity-related. Prioritize user experience restoration."
|
|
62
62
|
- Output: Mitigation actions taken, temporary fixes applied, rollback decisions
|
|
63
63
|
- Context: Observability findings, severity classification
|
|
@@ -65,19 +65,19 @@ Orchestrate multi-agent incident response with modern SRE practices for rapid re
|
|
|
65
65
|
## Phase 2: Investigation & Root Cause Analysis
|
|
66
66
|
|
|
67
67
|
### 4. Deep System Debugging
|
|
68
|
-
- Use Task tool with subagent_type="
|
|
68
|
+
- Use Task tool with subagent_type="general-purpose"
|
|
69
69
|
- Prompt: "Conduct deep debugging for incident: $ARGUMENTS using observability data. Investigate: 1) Stack traces and error logs, 2) Database query performance and locks, 3) Network latency and timeouts, 4) Memory leaks and CPU spikes, 5) Dependency failures and cascading errors. Apply Five Whys analysis."
|
|
70
70
|
- Output: Root cause identification, contributing factors, dependency impact map
|
|
71
71
|
- Context: Observability analysis, mitigation status
|
|
72
72
|
|
|
73
73
|
### 5. Security Assessment
|
|
74
|
-
- Use Task tool with subagent_type="
|
|
74
|
+
- Use Task tool with subagent_type="general-purpose"
|
|
75
75
|
- Prompt: "Assess security implications of incident: $ARGUMENTS. Check: 1) DDoS attack indicators, 2) Authentication/authorization failures, 3) Data exposure risks, 4) Certificate issues, 5) Suspicious access patterns. Review WAF logs, security groups, and audit trails."
|
|
76
76
|
- Output: Security assessment, breach analysis, vulnerability identification
|
|
77
77
|
- Context: Root cause findings, system logs
|
|
78
78
|
|
|
79
79
|
### 6. Performance Engineering Analysis
|
|
80
|
-
- Use Task tool with subagent_type="
|
|
80
|
+
- Use Task tool with subagent_type="general-purpose"
|
|
81
81
|
- Prompt: "Analyze performance aspects of incident: $ARGUMENTS. Examine: 1) Resource utilization patterns, 2) Query optimization opportunities, 3) Caching effectiveness, 4) Load balancer health, 5) CDN performance, 6) Autoscaling triggers. Identify bottlenecks and capacity issues."
|
|
82
82
|
- Output: Performance bottlenecks, resource recommendations, optimization opportunities
|
|
83
83
|
- Context: Debug findings, current mitigation state
|
|
@@ -85,13 +85,13 @@ Orchestrate multi-agent incident response with modern SRE practices for rapid re
|
|
|
85
85
|
## Phase 3: Resolution & Recovery
|
|
86
86
|
|
|
87
87
|
### 7. Fix Implementation
|
|
88
|
-
- Use Task tool with subagent_type="
|
|
88
|
+
- Use Task tool with subagent_type="general-purpose"
|
|
89
89
|
- Prompt: "Design and implement production fix for incident: $ARGUMENTS based on root cause. Requirements: 1) Minimal viable fix for rapid deployment, 2) Risk assessment and rollback capability, 3) Staged rollout plan with monitoring, 4) Validation criteria and health checks. Consider both immediate fix and long-term solution."
|
|
90
90
|
- Output: Fix implementation, deployment strategy, validation plan, rollback procedures
|
|
91
91
|
- Context: Root cause analysis, performance findings, security assessment
|
|
92
92
|
|
|
93
93
|
### 8. Deployment and Validation
|
|
94
|
-
- Use Task tool with subagent_type="
|
|
94
|
+
- Use Task tool with subagent_type="general-purpose"
|
|
95
95
|
- Prompt: "Execute emergency deployment for incident fix: $ARGUMENTS. Process: 1) Blue-green or canary deployment, 2) Progressive rollout with monitoring, 3) Health check validation at each stage, 4) Rollback triggers configured, 5) Real-time monitoring during deployment. Coordinate with incident command."
|
|
96
96
|
- Output: Deployment status, validation results, monitoring dashboard, rollback readiness
|
|
97
97
|
- Context: Fix implementation, current system state
|
|
@@ -99,13 +99,13 @@ Orchestrate multi-agent incident response with modern SRE practices for rapid re
|
|
|
99
99
|
## Phase 4: Communication & Coordination
|
|
100
100
|
|
|
101
101
|
### 9. Stakeholder Communication
|
|
102
|
-
- Use Task tool with subagent_type="
|
|
102
|
+
- Use Task tool with subagent_type="general-purpose"
|
|
103
103
|
- Prompt: "Manage incident communication for: $ARGUMENTS. Create: 1) Status page updates (public-facing), 2) Internal engineering updates (technical details), 3) Executive summary (business impact/ETA), 4) Customer support briefing (talking points), 5) Timeline documentation with key decisions. Update every 15-30 minutes based on severity."
|
|
104
104
|
- Output: Communication artifacts, status updates, stakeholder briefings, timeline log
|
|
105
105
|
- Context: All previous phases, current resolution status
|
|
106
106
|
|
|
107
107
|
### 10. Customer Impact Assessment
|
|
108
|
-
- Use Task tool with subagent_type="
|
|
108
|
+
- Use Task tool with subagent_type="general-purpose"
|
|
109
109
|
- Prompt: "Assess and document customer impact for incident: $ARGUMENTS. Analyze: 1) Affected user segments and geography, 2) Failed transactions or data loss, 3) SLA violations and contractual implications, 4) Customer support ticket volume, 5) Revenue impact estimation. Prepare proactive customer outreach list."
|
|
110
110
|
- Output: Customer impact report, SLA analysis, outreach recommendations
|
|
111
111
|
- Context: Resolution progress, communication status
|
|
@@ -113,19 +113,19 @@ Orchestrate multi-agent incident response with modern SRE practices for rapid re
|
|
|
113
113
|
## Phase 5: Postmortem & Prevention
|
|
114
114
|
|
|
115
115
|
### 11. Blameless Postmortem
|
|
116
|
-
- Use Task tool with subagent_type="
|
|
116
|
+
- Use Task tool with subagent_type="general-purpose"
|
|
117
117
|
- Prompt: "Conduct blameless postmortem for incident: $ARGUMENTS. Document: 1) Complete incident timeline with decisions, 2) Root cause and contributing factors (systems focus), 3) What went well in response, 4) What could improve, 5) Action items with owners and deadlines, 6) Lessons learned for team education. Follow SRE postmortem best practices."
|
|
118
118
|
- Output: Postmortem document, action items list, process improvements, training needs
|
|
119
119
|
- Context: Complete incident history, all agent outputs
|
|
120
120
|
|
|
121
121
|
### 12. Monitoring and Alert Enhancement
|
|
122
|
-
- Use Task tool with subagent_type="
|
|
122
|
+
- Use Task tool with subagent_type="general-purpose"
|
|
123
123
|
- Prompt: "Enhance monitoring to prevent recurrence of: $ARGUMENTS. Implement: 1) New alerts for early detection, 2) SLI/SLO adjustments if needed, 3) Dashboard improvements for visibility, 4) Runbook automation opportunities, 5) Chaos engineering scenarios for testing. Ensure alerts are actionable and reduce noise."
|
|
124
124
|
- Output: New monitoring configuration, alert rules, dashboard updates, runbook automation
|
|
125
125
|
- Context: Postmortem findings, root cause analysis
|
|
126
126
|
|
|
127
127
|
### 13. System Hardening
|
|
128
|
-
- Use Task tool with subagent_type="
|
|
128
|
+
- Use Task tool with subagent_type="general-purpose"
|
|
129
129
|
- Prompt: "Design system improvements to prevent incident: $ARGUMENTS. Propose: 1) Architecture changes for resilience (circuit breakers, bulkheads), 2) Graceful degradation strategies, 3) Capacity planning adjustments, 4) Technical debt prioritization, 5) Dependency reduction opportunities. Create implementation roadmap."
|
|
130
130
|
- Output: Architecture improvements, resilience patterns, technical debt items, roadmap
|
|
131
131
|
- Context: Postmortem action items, performance analysis
|
|
@@ -5,7 +5,7 @@ argument-hint: [tasks]
|
|
|
5
5
|
|
|
6
6
|
Think harder.
|
|
7
7
|
Activate `payment-integration` skill.
|
|
8
|
-
Plan & start implementing payment integration with [Polar.sh](https://polar.sh/docs/llms-full.txt) follow the Orchestration Protocol, Core Responsibilities,
|
|
8
|
+
Plan & start implementing payment integration with [Polar.sh](https://polar.sh/docs/llms-full.txt), following the Orchestration Protocol, Core Responsibilities, and Development Rules:
|
|
9
9
|
<tasks>$ARGUMENTS</tasks>
|
|
10
10
|
|
|
11
11
|
---
|
|
@@ -23,6 +23,6 @@ Plan & start implementing payment integration with [Polar.sh](https://polar.sh/d
|
|
|
23
23
|
|
|
24
24
|
## Workflow:
|
|
25
25
|
|
|
26
|
-
- **Scout**: Use
|
|
27
|
-
- **Plan**: Trigger slash command `/plan:fast <detailed-instruction-prompt>` to create an implementation plan based on the reports from
|
|
26
|
+
- **Scout**: Use Task agent for scouting to find related resources, documents, and code snippets in the current codebase: Task(subagent_type="general-purpose", prompt="You are a scout. Find related resources...", description="Scout codebase")
|
|
27
|
+
- **Plan**: Trigger slash command `/plan:fast <detailed-instruction-prompt>` to create an implementation plan based on the reports from Task agent.
|
|
28
28
|
- **Implementation**: Trigger slash command `/code <plan>` to implement the plan.
|
|
@@ -5,7 +5,7 @@ argument-hint: [tasks]
|
|
|
5
5
|
|
|
6
6
|
Think harder.
|
|
7
7
|
Activate `payment-integration` skill.
|
|
8
|
-
Plan & start implementing payment integration with [https://developer.sepay.vn/vi](https://developer.sepay.vn/vi) follow the Orchestration Protocol, Core Responsibilities,
|
|
8
|
+
Plan & start implementing payment integration with [https://developer.sepay.vn/vi](https://developer.sepay.vn/vi), following the Orchestration Protocol, Core Responsibilities, and Development Rules:
|
|
9
9
|
<tasks>$ARGUMENTS</tasks>
|
|
10
10
|
|
|
11
11
|
---
|
|
@@ -23,6 +23,6 @@ Plan & start implementing payment integration with [https://developer.sepay.vn/v
|
|
|
23
23
|
|
|
24
24
|
## Workflow:
|
|
25
25
|
|
|
26
|
-
- **Scout**: Use
|
|
27
|
-
- **Plan**: Trigger slash command `/plan:fast <detailed-instruction-prompt>` to create an implementation plan based on the reports from
|
|
26
|
+
- **Scout**: Use Task agent for scouting to find related resources, documents, and code snippets in the current codebase: Task(subagent_type="general-purpose", prompt="You are a scout. Find related resources...", description="Scout codebase")
|
|
27
|
+
- **Plan**: Trigger slash command `/plan:fast <detailed-instruction-prompt>` to create an implementation plan based on the reports from Task agent.
|
|
28
28
|
- **Implementation**: Trigger slash command `/code <plan>` to implement the plan.
|
|
@@ -2,6 +2,6 @@
|
|
|
2
2
|
description: ⚡ Write some journal entries.
|
|
3
3
|
---
|
|
4
4
|
|
|
5
|
-
Use
|
|
5
|
+
Use a Task agent for journal writing to explore the memories and recent code changes, and write some journal entries: Task(subagent_type="general-purpose", prompt="You are a journal-writer. Explore memories and recent code changes, write journal entries...", description="Write journal entries")
|
|
6
6
|
Journal entries should be concise and focused on the most important events, key changes, impacts, and decisions.
|
|
7
7
|
Keep journal entries in the `./docs/journals/` directory.
|
package/merged-commands/learn.md
CHANGED
|
@@ -1,16 +1,21 @@
|
|
|
1
1
|
---
|
|
2
2
|
name: learn
|
|
3
3
|
description: Guided project building — you code, AI mentors. Build your own product step-by-step with best practices and deep understanding.
|
|
4
|
-
argument-hint: [topic]
|
|
4
|
+
argument-hint: [topic] [--plan <path>]
|
|
5
5
|
---
|
|
6
6
|
|
|
7
|
-
# Learn Mode v3.1
|
|
7
|
+
# Learn Mode v3.2
|
|
8
8
|
|
|
9
9
|
> Build your product. Design the architecture. Write every line. Understand every decision.
|
|
10
10
|
|
|
11
11
|
## Activation
|
|
12
12
|
|
|
13
13
|
`/learn "topic"` — e.g., `/learn "JWT auth in Express"`, `/learn "build real-time chat"`
|
|
14
|
+
`/learn --plan <path>` — Learn by following an existing plan (topic auto-extracted from plan title)
|
|
15
|
+
`/learn "topic" --plan <path>` — Learn with custom topic + existing plan
|
|
16
|
+
|
|
17
|
+
e.g., `/learn --plan plans/skill-sync-rewrite/plan.md`
|
|
18
|
+
e.g., `/learn "upstream sync" --plan plans/skill-sync-rewrite/plan.md`
|
|
14
19
|
|
|
15
20
|
---
|
|
16
21
|
|
|
@@ -18,7 +23,17 @@ argument-hint: [topic]
|
|
|
18
23
|
|
|
19
24
|
1. **Resume check**: Look in `learn/` for existing file matching topic. If found, read its YAML frontmatter and offer to resume from last checkpoint via `AskUserQuestion`.
|
|
20
25
|
|
|
21
|
-
2. **
|
|
26
|
+
2. **Plan import check**: If arguments contain `--plan <path>`:
|
|
27
|
+
a. Read the plan file at `<path>`. Validate it exists and has content.
|
|
28
|
+
b. **Topic resolution**: If no topic is provided in the arguments, extract it from the `title` field of the plan's YAML frontmatter.
|
|
29
|
+
c. Detect plan structure:
|
|
30
|
+
- **Single-file plan**: no `phase-XX` files referenced → tasks = plan's task list
|
|
31
|
+
- **Multi-phase plan**: has `## Phases` table with phase-XX links → each phase = potential learn module
|
|
32
|
+
d. If multi-phase: ask user via `AskUserQuestion` which phase(s) to learn.
|
|
33
|
+
e. Read selected phase file(s) for detailed tasks.
|
|
34
|
+
f. Store parsed steps for REVIEW phase.
|
|
35
|
+
|
|
36
|
+
3. **Language detection** (skip if `--plan` already implies language from plan context): Scan project for config files to identify primary language.
|
|
22
37
|
|
|
23
38
|
| Language | Config Files | Verify: Syntax | Verify: Run/Test |
|
|
24
39
|
|----------|-------------|----------------|------------------|
|
|
@@ -70,6 +85,8 @@ step: 0
|
|
|
70
85
|
total_steps: 0
|
|
71
86
|
difficulty: {deep|standard|quick}
|
|
72
87
|
teaching: {guided|scaffolded|demonstrated}
|
|
88
|
+
plan_source: "{path or none}"
|
|
89
|
+
plan_type: {single|multi-phase|none}
|
|
73
90
|
started: {ISO timestamp}
|
|
74
91
|
updated: {ISO timestamp}
|
|
75
92
|
---
|
|
@@ -93,9 +110,32 @@ Update frontmatter: `phase: LEARN`
|
|
|
93
110
|
|
|
94
111
|
---
|
|
95
112
|
|
|
113
|
+
## Phase 3-ALT: REVIEW (only when --plan provided, replaces Phase 3 + 4)
|
|
114
|
+
|
|
115
|
+
> Understand the plan before building. Light touch — not redesign.
|
|
116
|
+
|
|
117
|
+
1. **Summarize**: Present plan overview to user:
|
|
118
|
+
> "This plan proposes: {overview}. It has {N} steps targeting {files}."
|
|
119
|
+
> Key decisions: {list key decisions from plan}
|
|
120
|
+
|
|
121
|
+
2. **Socratic check** (skip in Quick difficulty): Ask 1-2 questions via `AskUserQuestion`:
|
|
122
|
+
> "Before we start — why do you think {first step} comes before {later step}?"
|
|
123
|
+
> OR "What problem does {key decision} solve?"
|
|
124
|
+
Build on user's answer. Correct misconceptions if any.
|
|
125
|
+
|
|
126
|
+
3. **Adapt**: Ask via `AskUserQuestion`:
|
|
127
|
+
> "Want to reorder, skip, or add any steps? Or proceed as-is?"
|
|
128
|
+
Adjust step list based on user feedback.
|
|
129
|
+
|
|
130
|
+
4. **Write to tutorial file**: Record plan source, overview, and adapted steps.
|
|
131
|
+
|
|
132
|
+
Update frontmatter: `phase: REVIEW`, `total_steps: {N}`
|
|
133
|
+
|
|
134
|
+
---
|
|
135
|
+
|
|
96
136
|
## Phase 3: DESIGN (Socratic architecture thinking)
|
|
97
137
|
|
|
98
|
-
>
|
|
138
|
+
> **Skip this phase entirely if `--plan` was provided.** Go to Phase 3-ALT: REVIEW instead.
|
|
99
139
|
|
|
100
140
|
1. **Frame the problem**: AI presents the high-level problem to solve:
|
|
101
141
|
> "We need to build {topic}. Before I suggest anything — how would YOU approach this? What components or pieces do you think we need?"
|
|
@@ -134,6 +174,8 @@ Update frontmatter: `phase: DESIGN`
|
|
|
134
174
|
|
|
135
175
|
## Phase 4: PLAN (concrete implementation steps)
|
|
136
176
|
|
|
177
|
+
> **Skip this phase entirely if `--plan` was provided.** Steps come from REVIEW phase instead.
|
|
178
|
+
|
|
137
179
|
1. **Break down the chosen design** into 3-7 concrete, verifiable steps. Each step should:
|
|
138
180
|
- Have a clear goal (what's done when this step is complete)
|
|
139
181
|
- Build on previous steps (incremental, testable progress)
|
|
@@ -155,6 +197,10 @@ Update frontmatter: `phase: PLAN`, `total_steps: {N}`
|
|
|
155
197
|
|
|
156
198
|
## Phase 5: BUILD (core phase)
|
|
157
199
|
|
|
200
|
+
> If `--plan` was provided, steps come from REVIEW phase (imported plan).
|
|
201
|
+
> If no `--plan`, steps come from Phase 4 (PLAN) as usual.
|
|
202
|
+
> Everything else in BUILD works identically for both paths.
|
|
203
|
+
|
|
158
204
|
1. **For each step from the PLAN phase (or from the REVIEW phase when `--plan` was provided), follow the teaching mode**:
|
|
159
205
|
|
|
160
206
|
### Guided Mode (user codes everything)
|
|
@@ -267,6 +313,7 @@ Display: `Tutorial saved: learn/{filename}.md`
|
|
|
267
313
|
|
|
268
314
|
## Version History
|
|
269
315
|
|
|
316
|
+
- **3.2.0** - Added --plan flag: import existing plan files, REVIEW phase replaces DESIGN+PLAN for plan-driven learning. Flow with plan: INIT → LEARN → REVIEW → BUILD → WRAP-UP
|
|
270
317
|
- **3.1.0** - Added DESIGN phase (Socratic architecture) and PLAN phase (concrete steps). Full flow: INIT → LEARN → DESIGN → PLAN → BUILD → WRAP-UP
|
|
271
318
|
- **3.0.0** - Teaching modes (guided/scaffolded/demonstrated), best-practice review, explain-back checkpoints, user-codes-first philosophy
|
|
272
319
|
- **2.0.0** - Rewrite: adaptive difficulty via codingLevel, 4 phases, WebSearch, Socratic method, resume support, tiered verify, 17 languages, codebase-aware
|
|
@@ -387,13 +387,13 @@ For detailed helper script usage, see **troubleshooting.md**.
|
|
|
387
387
|
|
|
388
388
|
### Parallel Agent Execution
|
|
389
389
|
|
|
390
|
-
For bulk operations or background execution, use the `Linear-specialist`
|
|
390
|
+
For bulk operations or background execution, use the `Linear-specialist` Task agent:
|
|
391
391
|
|
|
392
392
|
```javascript
|
|
393
393
|
Task({
|
|
394
394
|
description: "Update Linear issues",
|
|
395
395
|
prompt: "Mark ENG-101, ENG-102, ENG-103 as Done",
|
|
396
|
-
subagent_type: "
|
|
396
|
+
subagent_type: "general-purpose"
|
|
397
397
|
})
|
|
398
398
|
```
|
|
399
399
|
|
|
@@ -137,7 +137,7 @@ If bugs are found in these files, document them in `.loki/CONTINUITY.md` under "
|
|
|
137
137
|
| - Identify highest priority unblocked task |
|
|
138
138
|
+-------------------------------------------------------------------+
|
|
139
139
|
| ACT: Execute the task |
|
|
140
|
-
| - Dispatch
|
|
140
|
+
| - Dispatch Task agent via Task tool OR execute directly |
|
|
141
141
|
| - Write code, run tests, fix issues |
|
|
142
142
|
| - Commit changes atomically (git checkpoint) |
|
|
143
143
|
+-------------------------------------------------------------------+
|
|
@@ -175,7 +175,7 @@ If bugs are found in these files, document them in `.loki/CONTINUITY.md` under "
|
|
|
175
175
|
### Task Tool Model Parameter
|
|
176
176
|
```python
|
|
177
177
|
# Opus for planning/architecture ONLY
|
|
178
|
-
Task(subagent_type="
|
|
178
|
+
Task(subagent_type="general-purpose", model="opus", description="Design system architecture", prompt="...")
|
|
179
179
|
|
|
180
180
|
# Sonnet for development and functional testing
|
|
181
181
|
Task(subagent_type="general-purpose", description="Implement API endpoint", prompt="...")
|
|
@@ -286,7 +286,7 @@ Task(description="Refactor database layer for performance", prompt="...") #
|
|
|
286
286
|
- **Direct Routing:** Minimal context - just the task and relevant file(s)
|
|
287
287
|
- **Supervisor Mode:** Full context - CONTINUITY.md, architectural decisions, dependencies
|
|
288
288
|
|
|
289
|
-
> "Keep in mind, complex task histories might confuse simpler
|
|
289
|
+
> "Keep in mind, complex task histories might confuse simpler Task agents." - AWS Best Practices
|
|
290
290
|
|
|
291
291
|
### E2E Testing with Playwright MCP (Anthropic Harness Pattern)
|
|
292
292
|
|
|
@@ -325,7 +325,7 @@ mcp_servers = {
|
|
|
325
325
|
| Metric | What to Track | Store In |
|
|
326
326
|
|--------|---------------|----------|
|
|
327
327
|
| Wall time | Seconds from start to completion | `.loki/metrics/efficiency/` |
|
|
328
|
-
| Agent count | Number of
|
|
328
|
+
| Agent count | Number of Task agents spawned | `.loki/metrics/efficiency/` |
|
|
329
329
|
| Retry count | Attempts before success | `.loki/metrics/efficiency/` |
|
|
330
330
|
| Model usage | Haiku/Sonnet/Opus call distribution | `.loki/metrics/efficiency/` |
|
|
331
331
|
|
|
@@ -351,12 +351,12 @@ See `references/tool-orchestration.md` for full implementation details.
|
|
|
351
351
|
|
|
352
352
|
---
|
|
353
353
|
|
|
354
|
-
## Structured Prompting for
|
|
354
|
+
## Structured Prompting for Task Agents
|
|
355
355
|
|
|
356
356
|
**Single-Responsibility Principle:** Each agent should have ONE clear goal and narrow scope.
|
|
357
357
|
([UiPath Best Practices](https://www.uipath.com/blog/ai/agent-builder-best-practices))
|
|
358
358
|
|
|
359
|
-
**Every
|
|
359
|
+
**Every Task agent dispatch MUST include:**
|
|
360
360
|
|
|
361
361
|
```markdown
|
|
362
362
|
## GOAL (What success looks like)
|
|
@@ -446,7 +446,7 @@ See `references/agent-types.md` for complete definitions and capabilities.
|
|
|
446
446
|
- **NEVER** skip code review between tasks
|
|
447
447
|
- **NEVER** proceed with unfixed Critical/High/Medium issues
|
|
448
448
|
- **NEVER** dispatch reviewers sequentially (always parallel - 3x faster)
|
|
449
|
-
- **NEVER** dispatch multiple implementation
|
|
449
|
+
- **NEVER** dispatch multiple implementation Task agents in parallel (conflicts)
|
|
450
450
|
- **NEVER** implement without reading task requirements first
|
|
451
451
|
|
|
452
452
|
### Review Anti-Patterns
|
|
@@ -466,7 +466,7 @@ See `references/agent-types.md` for complete definitions and capabilities.
|
|
|
466
466
|
- **ALWAYS** wait for all reviewers before aggregating
|
|
467
467
|
- **ALWAYS** fix Critical/High/Medium immediately
|
|
468
468
|
- **ALWAYS** re-run ALL 3 reviewers after fixes
|
|
469
|
-
- **ALWAYS** checkpoint state before spawning
|
|
469
|
+
- **ALWAYS** checkpoint state before spawning Task agents
|
|
470
470
|
|
|
471
471
|
---
|
|
472
472
|
|
|
@@ -618,14 +618,14 @@ context_budget:
|
|
|
618
618
|
reserve: "90% for model reasoning"
|
|
619
619
|
```
|
|
620
620
|
|
|
621
|
-
###
|
|
621
|
+
### Task Agents for Context Isolation
|
|
622
622
|
|
|
623
|
-
**Use
|
|
623
|
+
**Use Task agents to prevent token waste on noisy subtasks:**
|
|
624
624
|
|
|
625
625
|
```
|
|
626
|
-
Main agent (focused) -->
|
|
627
|
-
-->
|
|
628
|
-
-->
|
|
626
|
+
Main agent (focused) --> Task agent (file search)
|
|
627
|
+
--> Task agent (test running)
|
|
628
|
+
--> Task agent (linting)
|
|
629
629
|
```
|
|
630
630
|
|
|
631
631
|
See `references/production-patterns.md` for full practitioner patterns.
|
|
@@ -690,7 +690,7 @@ Loki Mode with PRD at path/to/prd # Start with PRD
|
|
|
690
690
|
|-------|-------|
|
|
691
691
|
| Trigger | "Loki Mode" or "Loki Mode with PRD at [path]" |
|
|
692
692
|
| Skip When | Need human approval, want to review plan first, single small task |
|
|
693
|
-
| Related Skills |
|
|
693
|
+
| Related Skills | task-agent-driven-development, executing-plans |
|
|
694
694
|
|
|
695
695
|
---
|
|
696
696
|
|
|
@@ -46,7 +46,7 @@ The multi-agent approach ensures each aspect is handled by domain experts:
|
|
|
46
46
|
## Phase 1: Data & Requirements Analysis
|
|
47
47
|
|
|
48
48
|
<Task>
|
|
49
|
-
subagent_type:
|
|
49
|
+
subagent_type: general-purpose
|
|
50
50
|
prompt: |
|
|
51
51
|
Analyze and design data pipeline for ML system with requirements: $ARGUMENTS
|
|
52
52
|
|
|
@@ -73,7 +73,7 @@ prompt: |
|
|
|
73
73
|
</Task>
|
|
74
74
|
|
|
75
75
|
<Task>
|
|
76
|
-
subagent_type:
|
|
76
|
+
subagent_type: general-purpose
|
|
77
77
|
prompt: |
|
|
78
78
|
Design feature engineering and model requirements for: $ARGUMENTS
|
|
79
79
|
Using data architecture from: {phase1.data-engineer.output}
|
|
@@ -103,7 +103,7 @@ prompt: |
|
|
|
103
103
|
## Phase 2: Model Development & Training
|
|
104
104
|
|
|
105
105
|
<Task>
|
|
106
|
-
subagent_type:
|
|
106
|
+
subagent_type: general-purpose
|
|
107
107
|
prompt: |
|
|
108
108
|
Implement training pipeline based on requirements: {phase1.data-scientist.output}
|
|
109
109
|
Using data pipeline: {phase1.data-engineer.output}
|
|
@@ -131,7 +131,7 @@ prompt: |
|
|
|
131
131
|
</Task>
|
|
132
132
|
|
|
133
133
|
<Task>
|
|
134
|
-
subagent_type:
|
|
134
|
+
subagent_type: general-purpose
|
|
135
135
|
prompt: |
|
|
136
136
|
Optimize and productionize ML code from: {phase2.ml-engineer.output}
|
|
137
137
|
|
|
@@ -160,7 +160,7 @@ prompt: |
|
|
|
160
160
|
## Phase 3: Production Deployment & Serving
|
|
161
161
|
|
|
162
162
|
<Task>
|
|
163
|
-
subagent_type:
|
|
163
|
+
subagent_type: general-purpose
|
|
164
164
|
prompt: |
|
|
165
165
|
Design production deployment for models from: {phase2.ml-engineer.output}
|
|
166
166
|
With optimized code from: {phase2.python-pro.output}
|
|
@@ -194,7 +194,7 @@ prompt: |
|
|
|
194
194
|
</Task>
|
|
195
195
|
|
|
196
196
|
<Task>
|
|
197
|
-
subagent_type:
|
|
197
|
+
subagent_type: general-purpose
|
|
198
198
|
prompt: |
|
|
199
199
|
Design Kubernetes infrastructure for ML workloads from: {phase3.mlops-engineer.output}
|
|
200
200
|
|
|
@@ -223,7 +223,7 @@ prompt: |
|
|
|
223
223
|
## Phase 4: Monitoring & Continuous Improvement
|
|
224
224
|
|
|
225
225
|
<Task>
|
|
226
|
-
subagent_type:
|
|
226
|
+
subagent_type: general-purpose
|
|
227
227
|
prompt: |
|
|
228
228
|
Implement comprehensive monitoring for ML system deployed in: {phase3.mlops-engineer.output}
|
|
229
229
|
Using Kubernetes infrastructure: {phase3.kubernetes-architect.output}
|
|
@@ -15,7 +15,7 @@ MCP is an open protocol enabling AI agents to connect to external tools and data
|
|
|
15
15
|
- Progressive disclosure of MCP capabilities (load only what's needed)
|
|
16
16
|
- Intelligent tool/prompt/resource selection based on task requirements
|
|
17
17
|
- Multi-server management from single config file
|
|
18
|
-
- Context-efficient:
|
|
18
|
+
- Context-efficient: Task agents handle MCP discovery and execution
|
|
19
19
|
- Persistent tool catalog: automatically saves discovered tools to JSON for fast reference
|
|
20
20
|
|
|
21
21
|
## When to Use This Skill
|
|
@@ -25,7 +25,7 @@ Use this skill when:
|
|
|
25
25
|
2. **Task-Based Tool Selection**: Analyzing which MCP tools are relevant for a specific task
|
|
26
26
|
3. **Executing MCP Tools**: Calling MCP tools programmatically with proper parameter handling
|
|
27
27
|
4. **MCP Integration**: Building or debugging MCP client implementations
|
|
28
|
-
5. **Context Management**: Avoiding context pollution by delegating MCP operations to
|
|
28
|
+
5. **Context Management**: Avoiding context pollution by delegating MCP operations to Task agents
|
|
29
29
|
|
|
30
30
|
## Core Capabilities
|
|
31
31
|
|
|
@@ -80,7 +80,7 @@ echo "Take a screenshot of https://example.com" | gemini -y -m gemini-2.5-flash
|
|
|
80
80
|
npx tsx scripts/cli.ts call-tool memory create_entities '{"entities":[...]}'
|
|
81
81
|
```
|
|
82
82
|
|
|
83
|
-
**Fallback: mcp-manager
|
|
83
|
+
**Fallback: mcp-manager Task agent**
|
|
84
84
|
|
|
85
85
|
See [references/gemini-cli-integration.md](references/gemini-cli-integration.md) for complete examples.
|
|
86
86
|
|
|
@@ -106,14 +106,14 @@ echo "Take a screenshot of https://example.com. Return JSON only per GEMINI.md i
|
|
|
106
106
|
- Automatic tool discovery
|
|
107
107
|
- Structured JSON responses (parseable by Claude)
|
|
108
108
|
- GEMINI.md auto-loaded for consistent formatting
|
|
109
|
-
- Faster than
|
|
109
|
+
- Faster than Task agent orchestration
|
|
110
110
|
- No natural language ambiguity
|
|
111
111
|
|
|
112
112
|
See [references/gemini-cli-integration.md](references/gemini-cli-integration.md) for complete guide.
|
|
113
113
|
|
|
114
|
-
### Pattern 2:
|
|
114
|
+
### Pattern 2: Task Agent-Based Execution (Fallback)
|
|
115
115
|
|
|
116
|
-
Use `mcp-manager` agent when Gemini CLI unavailable.
|
|
116
|
+
Use the `mcp-manager` agent when Gemini CLI is unavailable. The Task agent discovers tools, selects the relevant ones, executes tasks, and reports back.
|
|
117
117
|
|
|
118
118
|
**Benefit**: Main context stays clean, only relevant tool definitions loaded when needed.
|
|
119
119
|
|
|
@@ -166,7 +166,7 @@ npx tsx cli.ts list-tools # Saves to assets/tools.json
|
|
|
166
166
|
npx tsx cli.ts call-tool memory create_entities '{"entities":[...]}'
|
|
167
167
|
```
|
|
168
168
|
|
|
169
|
-
**Method 3: mcp-manager
|
|
169
|
+
**Method 3: mcp-manager Task agent**
|
|
170
170
|
|
|
171
171
|
See [references/gemini-cli-integration.md](references/gemini-cli-integration.md) for complete guide.
|
|
172
172
|
|
|
@@ -193,7 +193,7 @@ See [references/mcp-protocol.md](references/mcp-protocol.md) for:
|
|
|
193
193
|
- Use when: Need specific tool/server control
|
|
194
194
|
- Execute: `npx tsx scripts/cli.ts call-tool <server> <tool> <args>`
|
|
195
195
|
|
|
196
|
-
3. **mcp-manager
|
|
196
|
+
3. **mcp-manager Task agent** (Fallback): Context-efficient delegation
|
|
197
197
|
- Use when: Gemini unavailable or failed
|
|
198
198
|
- Keeps main context clean
|
|
199
199
|
|
|
@@ -12,7 +12,7 @@ Master orchestrator, peer-to-peer, and hierarchical multi-agent architectures
|
|
|
12
12
|
Use this skill when working with master orchestrator, peer-to-peer, and hierarchical multi-agent architectures.
|
|
13
13
|
# Multi-Agent Architecture Patterns
|
|
14
14
|
|
|
15
|
-
Multi-agent architectures distribute work across multiple language model instances, each with its own context window. When designed well, this distribution enables capabilities beyond single-agent limits. When designed poorly, it introduces coordination overhead that negates benefits. The critical insight is that
|
|
15
|
+
Multi-agent architectures distribute work across multiple language model instances, each with its own context window. When designed well, this distribution enables capabilities beyond single-agent limits. When designed poorly, it introduces coordination overhead that negates benefits. The critical insight is that Task agents exist primarily to isolate context, not to anthropomorphize role division.
|
|
16
16
|
|
|
17
17
|
## When to Activate
|
|
18
18
|
|
|
@@ -26,7 +26,7 @@ Activate this skill when:
|
|
|
26
26
|
|
|
27
27
|
## Core Concepts
|
|
28
28
|
|
|
29
|
-
Multi-agent systems address single-agent context limitations through distribution. Three dominant patterns exist: supervisor/orchestrator for centralized control, peer-to-peer/swarm for flexible handoffs, and hierarchical for layered abstraction. The critical design principle is context isolation—
|
|
29
|
+
Multi-agent systems address single-agent context limitations through distribution. Three dominant patterns exist: supervisor/orchestrator for centralized control, peer-to-peer/swarm for flexible handoffs, and hierarchical for layered abstraction. The critical design principle is context isolation—Task agents exist primarily to partition context rather than to simulate organizational roles.
|
|
30
30
|
|
|
31
31
|
Effective multi-agent systems require explicit coordination protocols, consensus mechanisms that avoid sycophancy, and careful attention to failure modes including bottlenecks, divergence, and error propagation.
|
|
32
32
|
|
|
@@ -75,20 +75,20 @@ When to use: Complex tasks with clear decomposition, tasks requiring coordinatio
|
|
|
75
75
|
|
|
76
76
|
Advantages: Strict control over workflow, easier to implement human-in-the-loop interventions, ensures adherence to predefined plans.
|
|
77
77
|
|
|
78
|
-
Disadvantages: Supervisor context becomes bottleneck, supervisor failures cascade to all workers, "telephone game" problem where supervisors paraphrase
|
|
78
|
+
Disadvantages: Supervisor context becomes a bottleneck, supervisor failures cascade to all workers, "telephone game" problem where supervisors paraphrase Task agent responses incorrectly.
|
|
79
79
|
|
|
80
80
|
**The Telephone Game Problem and Solution**
|
|
81
|
-
LangGraph benchmarks found supervisor architectures initially performed 50% worse than optimized versions due to the "telephone game" problem where supervisors paraphrase
|
|
81
|
+
LangGraph benchmarks found supervisor architectures initially performed 50% worse than optimized versions due to the "telephone game" problem where supervisors paraphrase Task agent responses incorrectly, losing fidelity.
|
|
82
82
|
|
|
83
|
-
The fix: implement a `forward_message` tool allowing
|
|
83
|
+
The fix: implement a `forward_message` tool allowing Task agents to pass responses directly to users:
|
|
84
84
|
|
|
85
85
|
```python
|
|
86
86
|
def forward_message(message: str, to_user: bool = True):
|
|
87
87
|
"""
|
|
88
|
-
Forward
|
|
89
|
-
|
|
88
|
+
Forward Task agent response directly to user without supervisor synthesis.
|
|
89
|
+
|
|
90
90
|
Use when:
|
|
91
|
-
-
|
|
91
|
+
- Task agent response is final and complete
|
|
92
92
|
- Supervisor synthesis would lose important details
|
|
93
93
|
- Response format must be preserved exactly
|
|
94
94
|
"""
|
|
@@ -97,9 +97,9 @@ def forward_message(message: str, to_user: bool = True):
|
|
|
97
97
|
return {"type": "supervisor_input", "content": message}
|
|
98
98
|
```
|
|
99
99
|
|
|
100
|
-
With this pattern, swarm architectures slightly outperform supervisors because
|
|
100
|
+
With this pattern, swarm architectures slightly outperform supervisors because Task agents respond directly to users, eliminating translation errors.
|
|
101
101
|
|
|
102
|
-
Implementation note: Implement direct pass-through mechanisms allowing
|
|
102
|
+
Implementation note: Implement direct pass-through mechanisms allowing Task agents to pass responses directly to users rather than through supervisor synthesis when appropriate.
|
|
103
103
|
|
|
104
104
|
**Pattern 2: Peer-to-Peer/Swarm**
|
|
105
105
|
The peer-to-peer pattern removes central control, allowing agents to communicate directly based on predefined protocols. Any agent can transfer control to any other through explicit handoff mechanisms.
|
|
@@ -137,17 +137,17 @@ Disadvantages: Coordination overhead between layers, potential for misalignment
|
|
|
137
137
|
|
|
138
138
|
### Context Isolation as Design Principle
|
|
139
139
|
|
|
140
|
-
The primary purpose of multi-agent architectures is context isolation. Each
|
|
140
|
+
The primary purpose of multi-agent architectures is context isolation. Each Task agent operates in a clean context window focused on its subtask without carrying accumulated context from other subtasks.
|
|
141
141
|
|
|
142
142
|
**Isolation Mechanisms**
|
|
143
|
-
Full context delegation: For complex tasks where the
|
|
143
|
+
Full context delegation: For complex tasks where the Task agent needs complete understanding, the planner shares its entire context. The Task agent has its own tools and instructions but receives full context for its decisions.
|
|
144
144
|
|
|
145
|
-
Instruction passing: For simple, well-defined subtasks, the planner creates instructions via function call. The
|
|
145
|
+
Instruction passing: For simple, well-defined subtasks, the planner creates instructions via function call. The Task agent receives only the instructions needed for its specific task.
|
|
146
146
|
|
|
147
147
|
File system memory: For complex tasks requiring shared state, agents read and write to persistent storage. The file system serves as the coordination mechanism, avoiding context bloat from shared state passing.
|
|
148
148
|
|
|
149
149
|
**Isolation Trade-offs**
|
|
150
|
-
Full context delegation provides maximum capability but defeats the purpose of
|
|
150
|
+
Full context delegation provides maximum capability but defeats the purpose of Task agents. Instruction passing maintains isolation but limits Task agent flexibility. File system memory enables shared state without context passing but introduces latency and consistency challenges.
|
|
151
151
|
|
|
152
152
|
The right choice depends on task complexity, coordination needs, and acceptable latency.
|
|
153
153
|
|