claude-mpm 5.4.22 (py3-none-any.whl) → 5.4.48 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of claude-mpm might be problematic. Click here for more details.

Files changed (119)
  1. claude_mpm/VERSION +1 -1
  2. claude_mpm/agents/BASE_AGENT.md +164 -0
  3. claude_mpm/agents/BASE_ENGINEER.md +658 -0
  4. claude_mpm/agents/MEMORY.md +1 -1
  5. claude_mpm/agents/PM_INSTRUCTIONS.md +739 -1052
  6. claude_mpm/agents/WORKFLOW.md +5 -254
  7. claude_mpm/agents/agent_loader.py +1 -1
  8. claude_mpm/agents/base_agent.json +31 -0
  9. claude_mpm/agents/frontmatter_validator.py +2 -2
  10. claude_mpm/cli/commands/agent_state_manager.py +10 -10
  11. claude_mpm/cli/commands/agents.py +9 -9
  12. claude_mpm/cli/commands/auto_configure.py +4 -4
  13. claude_mpm/cli/commands/configure.py +1 -1
  14. claude_mpm/cli/commands/configure_agent_display.py +10 -0
  15. claude_mpm/cli/commands/mpm_init/core.py +65 -0
  16. claude_mpm/cli/commands/postmortem.py +1 -1
  17. claude_mpm/cli/commands/profile.py +277 -0
  18. claude_mpm/cli/commands/skills.py +14 -18
  19. claude_mpm/cli/executor.py +10 -0
  20. claude_mpm/cli/interactive/agent_wizard.py +2 -2
  21. claude_mpm/cli/parsers/base_parser.py +7 -0
  22. claude_mpm/cli/parsers/profile_parser.py +148 -0
  23. claude_mpm/cli/parsers/skills_parser.py +0 -6
  24. claude_mpm/cli/startup.py +346 -75
  25. claude_mpm/commands/mpm-config.md +13 -250
  26. claude_mpm/commands/mpm-doctor.md +9 -22
  27. claude_mpm/commands/mpm-help.md +5 -206
  28. claude_mpm/commands/mpm-init.md +81 -507
  29. claude_mpm/commands/mpm-monitor.md +15 -402
  30. claude_mpm/commands/mpm-organize.md +61 -441
  31. claude_mpm/commands/mpm-postmortem.md +6 -108
  32. claude_mpm/commands/mpm-session-resume.md +12 -363
  33. claude_mpm/commands/mpm-status.md +5 -69
  34. claude_mpm/commands/mpm-ticket-view.md +52 -495
  35. claude_mpm/commands/mpm-version.md +5 -107
  36. claude_mpm/core/config.py +2 -4
  37. claude_mpm/core/framework/loaders/agent_loader.py +1 -1
  38. claude_mpm/core/framework/loaders/instruction_loader.py +52 -11
  39. claude_mpm/core/optimized_startup.py +59 -0
  40. claude_mpm/core/shared/config_loader.py +1 -1
  41. claude_mpm/core/unified_agent_registry.py +1 -1
  42. claude_mpm/dashboard/static/svelte-build/_app/env.js +1 -0
  43. claude_mpm/dashboard/static/svelte-build/_app/immutable/assets/0.B_FtCwCQ.css +1 -0
  44. claude_mpm/dashboard/static/svelte-build/_app/immutable/assets/2.Cl_eSA4x.css +1 -0
  45. claude_mpm/dashboard/static/svelte-build/_app/immutable/chunks/BgChzWQ1.js +1 -0
  46. claude_mpm/dashboard/static/svelte-build/_app/immutable/chunks/CIXEwuWe.js +1 -0
  47. claude_mpm/dashboard/static/svelte-build/_app/immutable/chunks/CWc5urbQ.js +1 -0
  48. claude_mpm/dashboard/static/svelte-build/_app/immutable/chunks/DMkZpdF2.js +2 -0
  49. claude_mpm/dashboard/static/svelte-build/_app/immutable/chunks/DjhvlsAc.js +1 -0
  50. claude_mpm/dashboard/static/svelte-build/_app/immutable/chunks/N4qtv3Hx.js +2 -0
  51. claude_mpm/dashboard/static/svelte-build/_app/immutable/chunks/uj46x2Wr.js +1 -0
  52. claude_mpm/dashboard/static/svelte-build/_app/immutable/entry/app.DTL5mJO-.js +2 -0
  53. claude_mpm/dashboard/static/svelte-build/_app/immutable/entry/start.DzuEhzqh.js +1 -0
  54. claude_mpm/dashboard/static/svelte-build/_app/immutable/nodes/0.CAGBuiOw.js +1 -0
  55. claude_mpm/dashboard/static/svelte-build/_app/immutable/nodes/1.DFLC8jdE.js +1 -0
  56. claude_mpm/dashboard/static/svelte-build/_app/immutable/nodes/2.DPvEihJJ.js +10 -0
  57. claude_mpm/dashboard/static/svelte-build/_app/version.json +1 -0
  58. claude_mpm/dashboard/static/svelte-build/favicon.svg +7 -0
  59. claude_mpm/dashboard/static/svelte-build/index.html +36 -0
  60. claude_mpm/hooks/claude_hooks/__pycache__/__init__.cpython-311.pyc +0 -0
  61. claude_mpm/hooks/claude_hooks/__pycache__/correlation_manager.cpython-311.pyc +0 -0
  62. claude_mpm/hooks/claude_hooks/__pycache__/event_handlers.cpython-311.pyc +0 -0
  63. claude_mpm/hooks/claude_hooks/__pycache__/hook_handler.cpython-311.pyc +0 -0
  64. claude_mpm/hooks/claude_hooks/__pycache__/installer.cpython-311.pyc +0 -0
  65. claude_mpm/hooks/claude_hooks/__pycache__/memory_integration.cpython-311.pyc +0 -0
  66. claude_mpm/hooks/claude_hooks/__pycache__/response_tracking.cpython-311.pyc +0 -0
  67. claude_mpm/hooks/claude_hooks/__pycache__/tool_analysis.cpython-311.pyc +0 -0
  68. claude_mpm/hooks/claude_hooks/hook_handler.py +149 -1
  69. claude_mpm/hooks/claude_hooks/services/__pycache__/__init__.cpython-311.pyc +0 -0
  70. claude_mpm/hooks/claude_hooks/services/__pycache__/connection_manager.cpython-311.pyc +0 -0
  71. claude_mpm/hooks/claude_hooks/services/__pycache__/connection_manager_http.cpython-311.pyc +0 -0
  72. claude_mpm/hooks/claude_hooks/services/__pycache__/duplicate_detector.cpython-311.pyc +0 -0
  73. claude_mpm/hooks/claude_hooks/services/__pycache__/state_manager.cpython-311.pyc +0 -0
  74. claude_mpm/hooks/claude_hooks/services/__pycache__/subagent_processor.cpython-311.pyc +0 -0
  75. claude_mpm/hooks/claude_hooks/services/connection_manager.py +26 -6
  76. claude_mpm/hooks/kuzu_memory_hook.py +5 -5
  77. claude_mpm/init.py +63 -0
  78. claude_mpm/models/git_repository.py +3 -3
  79. claude_mpm/scripts/start_activity_logging.py +0 -0
  80. claude_mpm/services/agents/agent_builder.py +3 -3
  81. claude_mpm/services/agents/cache_git_manager.py +6 -6
  82. claude_mpm/services/agents/deployment/agent_deployment.py +29 -7
  83. claude_mpm/services/agents/deployment/agent_discovery_service.py +2 -2
  84. claude_mpm/services/agents/deployment/agent_format_converter.py +23 -13
  85. claude_mpm/services/agents/deployment/agent_template_builder.py +29 -19
  86. claude_mpm/services/agents/deployment/agents_directory_resolver.py +2 -2
  87. claude_mpm/services/agents/deployment/async_agent_deployment.py +31 -27
  88. claude_mpm/services/agents/deployment/local_template_deployment.py +3 -1
  89. claude_mpm/services/agents/deployment/multi_source_deployment_service.py +169 -26
  90. claude_mpm/services/agents/deployment/remote_agent_discovery_service.py +98 -75
  91. claude_mpm/services/agents/git_source_manager.py +19 -4
  92. claude_mpm/services/agents/recommender.py +5 -3
  93. claude_mpm/services/agents/single_tier_deployment_service.py +2 -2
  94. claude_mpm/services/agents/sources/git_source_sync_service.py +112 -6
  95. claude_mpm/services/agents/startup_sync.py +22 -2
  96. claude_mpm/services/diagnostics/checks/agent_check.py +2 -2
  97. claude_mpm/services/diagnostics/checks/agent_sources_check.py +1 -1
  98. claude_mpm/services/git/git_operations_service.py +8 -8
  99. claude_mpm/services/monitor/management/lifecycle.py +8 -1
  100. claude_mpm/services/monitor/server.py +473 -3
  101. claude_mpm/services/pm_skills_deployer.py +711 -0
  102. claude_mpm/services/profile_manager.py +331 -0
  103. claude_mpm/services/skills/git_skill_source_manager.py +101 -3
  104. claude_mpm/services/skills_deployer.py +4 -3
  105. claude_mpm/services/socketio/dashboard_server.py +1 -0
  106. claude_mpm/services/socketio/event_normalizer.py +37 -6
  107. claude_mpm/services/socketio/server/core.py +262 -123
  108. claude_mpm/skills/skill_manager.py +92 -3
  109. claude_mpm/utils/agent_dependency_loader.py +14 -2
  110. claude_mpm/utils/agent_filters.py +1 -1
  111. claude_mpm/utils/migration.py +4 -4
  112. claude_mpm/utils/robust_installer.py +47 -3
  113. {claude_mpm-5.4.22.dist-info → claude_mpm-5.4.48.dist-info}/METADATA +7 -4
  114. {claude_mpm-5.4.22.dist-info → claude_mpm-5.4.48.dist-info}/RECORD +118 -79
  115. {claude_mpm-5.4.22.dist-info → claude_mpm-5.4.48.dist-info}/WHEEL +0 -0
  116. {claude_mpm-5.4.22.dist-info → claude_mpm-5.4.48.dist-info}/entry_points.txt +0 -0
  117. {claude_mpm-5.4.22.dist-info → claude_mpm-5.4.48.dist-info}/licenses/LICENSE +0 -0
  118. {claude_mpm-5.4.22.dist-info → claude_mpm-5.4.48.dist-info}/licenses/LICENSE-FAQ.md +0 -0
  119. {claude_mpm-5.4.22.dist-info → claude_mpm-5.4.48.dist-info}/top_level.txt +0 -0
@@ -64,256 +64,19 @@ Return: Clean or list of blocked items
64
64
 
65
65
  ## Publish and Release Workflow
66
66
 
67
- **Trigger Keywords**: "publish", "release", "deploy to PyPI/npm", "create release", "tag version"
67
+ **Note**: Release workflows are project-specific and should be customized per project. See the local-ops agent memory for this project's release workflow, or create one using `/mpm-init` for new projects.
68
68
 
69
- **Agent Responsibility**: Ops (local-ops or platform-specific)
70
-
71
- **Mandatory Requirements**: All changes committed, quality gates passed, security scan complete, version incremented
72
-
73
- ### Process Overview
74
-
75
- Publishing and releasing is a **multi-step orchestrated workflow** requiring coordination across multiple agents with mandatory verification at each stage. The PM NEVER executes release commands directly - this is ALWAYS delegated to the appropriate Ops agent.
76
-
77
- ### Workflow Phases
78
-
79
- #### Phase 1: Pre-Release Validation (Research + QA)
80
-
81
- **Agent**: Research
82
- **Purpose**: Validate readiness for release
83
- **Template**:
84
- ```
85
- Task: Pre-release readiness check
86
- Requirements:
87
- - Verify all uncommitted changes are tracked
88
- - Check git status for untracked files
89
- - Validate all features documented
90
- - Confirm CHANGELOG updated
91
- Success Criteria: Clean working directory, complete documentation
92
- ```
93
-
94
- **Decision**:
95
- - Clean → Proceed to Phase 2
96
- - Uncommitted changes → Report to user, request commit approval
97
- - Missing documentation → Delegate to Documentation agent
98
-
99
- #### Phase 2: Quality Gate Validation (QA)
100
-
101
- **Agent**: QA
102
- **Purpose**: Execute comprehensive quality checks
103
- **Template**:
104
- ```
105
- Task: Run pre-publish quality gate
106
- Requirements:
107
- - Execute: make pre-publish
108
- - Verify all linters pass (Ruff, Black, isort, Flake8)
109
- - Confirm test suite passes
110
- - Validate version consistency
111
- - Check for debug prints, TODO comments
112
- Evidence Required: Complete quality gate output
113
- ```
114
-
115
- **Decision**:
116
- - All checks pass → Proceed to Phase 3
117
- - Any failure → BLOCK release, report specific failures to user
118
- - Must provide full quality gate output as evidence
119
-
120
- #### Phase 3: Security Scan (Security Agent) - MANDATORY
121
-
122
- **Agent**: Security
123
- **Purpose**: Pre-push credential and secrets scan
124
- **Template**:
125
- ```
126
- Task: Pre-release security scan
127
- Requirements:
128
- - Run git diff origin/main HEAD
129
- - Scan for: API keys, passwords, tokens, private keys, credentials
130
- - Check environment files (.env, .env.local)
131
- - Verify no hardcoded secrets in code
132
- Success Criteria: CLEAN scan or BLOCKED with specific secrets identified
133
- Evidence Required: Security scan results
134
- ```
135
-
136
- **Decision**:
137
- - CLEAN → Proceed to Phase 4
138
- - SECRETS DETECTED → BLOCK release immediately, report violations
139
- - NEVER bypass this step, even for "urgent" releases
140
-
141
- #### Phase 4: Version Management (Ops Agent)
142
-
143
- **Agent**: local-ops-agent
144
- **Purpose**: Increment version following conventional commits
145
- **Template**:
146
- ```
147
- Task: Increment version and commit
148
- Requirements:
149
- - Analyze recent commits since last release
150
- - Determine bump type (patch/minor/major):
151
- * patch: bug fixes (fix:)
152
- * minor: new features (feat:)
153
- * major: breaking changes (feat!, BREAKING CHANGE:)
154
- - Execute: ./scripts/manage_version.py bump {type}
155
- - Commit version changes with message: "chore: bump version to {version}"
156
- - Push to origin/main
157
- Minimum Requirement: At least patch version bump
158
- Success Criteria: Version incremented, committed, pushed
159
- Evidence Required: New version number, git commit SHA
160
- ```
161
-
162
- **Conventional Commit Detection**:
163
- ```python
164
- if "BREAKING CHANGE:" in commits or "feat!" in commits:
165
-     bump_type = "major"
166
- elif "feat:" in commits:
167
-     bump_type = "minor"
168
- else: # "fix:", "refactor:", "perf:", etc.
169
-     bump_type = "patch"
170
- ```
171
-
172
- #### Phase 5: Build and Publish (Ops Agent)
173
-
174
- **Agent**: local-ops-agent
175
- **Purpose**: Build release artifacts and publish to distribution channels
176
- **Template**:
177
- ```
178
- Task: Build and publish release
179
- Requirements:
180
- - Execute: make safe-release-build (includes quality gate)
181
- - Publish to PyPI: make release-pypi
182
- - Publish to npm (if applicable): make release-npm
183
- - Create GitHub release: gh release create v{version}
184
- - Tag release in git
185
- Verification Required:
186
- - Confirm build artifacts created
187
- - Verify PyPI upload successful (check PyPI page)
188
- - Verify npm upload successful (if applicable)
189
- - Confirm GitHub release created
190
- Evidence Required:
191
- - Build logs
192
- - PyPI package URL
193
- - npm package URL (if applicable)
194
- - GitHub release URL
195
- ```
196
-
197
- #### Phase 5.5: Update Homebrew Tap (Ops Agent) - NON-BLOCKING
198
-
199
- **Agent**: local-ops-agent
200
- **Purpose**: Update Homebrew formula with new version (automated)
201
- **Trigger**: Automatically after PyPI publish (Phase 5)
202
- **Template**:
203
- ```
204
- Task: Update Homebrew tap for new release
205
- Requirements:
206
- - Wait for PyPI package to be available (retry with backoff)
207
- - Fetch SHA256 from PyPI for version {version}
208
- - Update formula in homebrew-tools repository
209
- - Update version and checksum in Formula/claude-mpm.rb
210
- - Run formula tests locally (syntax check, brew audit)
211
- - Commit changes with conventional commit message
212
- - Push changes to homebrew-tools repository (with confirmation)
213
- Success Criteria: Formula updated and committed, or graceful failure logged
214
- Evidence Required: Git commit SHA in homebrew-tools or error log
215
- ```
216
-
217
- **Decision**:
218
- - Success → Continue to GitHub release (Phase 5 continued)
219
- - Failure → Log warning with manual fallback instructions, continue anyway (NON-BLOCKING)
220
-
221
- **IMPORTANT**: Homebrew tap update failures do NOT block PyPI releases. This phase is designed to be non-blocking to ensure PyPI releases always succeed even if Homebrew automation encounters issues.
222
-
223
- **Manual Fallback** (if automation fails):
224
- ```bash
225
- cd /path/to/homebrew-tools
226
- ./scripts/update_formula.sh {version}
227
- git add Formula/claude-mpm.rb
228
- git commit -m "feat: update to v{version}"
229
- git push origin main
230
- ```
231
-
232
- **Automation Details**:
233
- - Script: `scripts/update_homebrew_tap.sh`
234
- - Makefile target: `make update-homebrew-tap`
235
- - Integrated into: `make release-publish`
236
- - Retry logic: 10 attempts with exponential backoff
237
- - Timeout: 5 minutes maximum
238
- - Phase: Semi-automated (requires push confirmation in Phase 1)
239
-
240
- #### Phase 6: Post-Release Verification (Ops Agent) - MANDATORY
241
-
242
- **Agent**: Same ops agent that published
243
- **Purpose**: Verify release is accessible and installable
244
- **Template**:
245
- ```
246
- Task: Verify published release
247
- Requirements:
248
- - PyPI: Test installation in clean environment
249
- * pip install claude-mpm=={version}
250
- * Verify version: claude-mpm --version
251
- - npm (if applicable): Test installation
252
- * npm install claude-mpm@{version}
253
- * Verify version
254
- - GitHub: Verify release appears in releases page
255
- - For hosted projects: Check deployment logs
256
- Success Criteria: Package installable from all channels
257
- Evidence Required: Installation output, version verification
258
- ```
259
-
260
- **For Hosted Projects** (Vercel, Heroku, etc.):
261
- ```
262
- Additional Verification:
263
- - Check platform deployment logs
264
- - Verify build status on platform dashboard
265
- - Test live deployment URL
266
- - Confirm no errors in server logs
267
- Evidence: Platform logs, HTTP response, deployment status
268
- ```
269
-
270
- ### Agent Routing Matrix
271
-
272
- | Task | Primary Agent | Fallback | Verification Agent |
273
- |------|---------------|----------|-------------------|
274
- | Pre-release validation | Research | - | - |
275
- | Quality gate | QA | - | - |
276
- | Security scan | Security | - | - |
277
- | Version increment | local-ops-agent | Ops (generic) | local-ops-agent |
278
- | PyPI publish | local-ops-agent | Ops (generic) | local-ops-agent |
279
- | Homebrew tap update | local-ops-agent (automated) | Manual fallback | local-ops-agent |
280
- | npm publish | local-ops-agent | Ops (generic) | local-ops-agent |
281
- | GitHub release | local-ops-agent | Ops (generic) | local-ops-agent |
282
- | Vercel deploy | vercel-ops-agent | - | vercel-ops-agent |
283
- | Platform deploy | Ops (generic) | - | Ops (generic) |
284
- | Post-release verification | Same as publisher | - | QA |
285
-
286
- ### Minimum Requirements Checklist
287
-
288
- PM MUST verify these with agents before claiming release complete:
289
-
290
- - [ ] All changes committed (Research verification)
291
- - [ ] Quality gate passed (QA evidence: `make pre-publish` output)
292
- - [ ] Security scan clean (Security evidence: scan results)
293
- - [ ] Version incremented (Ops evidence: new version number)
294
- - [ ] PyPI package published (Ops evidence: PyPI URL)
295
- - [ ] Homebrew tap updated (Ops evidence: commit SHA or logged warning)
296
- - [ ] GitHub release created (Ops evidence: release URL)
297
- - [ ] Installation verified (Ops evidence: version check from PyPI/Homebrew)
298
- - [ ] Changes pushed to origin (Ops evidence: git push output)
299
- - [ ] Built successfully (Ops evidence: build logs)
300
- - [ ] Published to PyPI (Ops evidence: PyPI URL)
301
- - [ ] Published to npm if applicable (Ops evidence: npm URL)
302
- - [ ] GitHub release created (Ops evidence: release URL)
303
- - [ ] Installation verified (Ops evidence: pip/npm install output)
304
- - [ ] For hosted: Deployment verified (Ops evidence: platform logs + endpoint test)
305
-
306
- **If ANY checkbox unchecked → Release is INCOMPLETE**
69
+ For projects with specific release requirements (PyPI, npm, Homebrew, Docker, etc.), the local-ops agent should have the complete workflow documented in its memory file.
307
70
 
308
71
  ## Ticketing Integration
309
72
 
310
73
  **When user mentions**: ticket, epic, issue, task tracking
311
74
 
312
- **Architecture**: MCP-first with CLI fallback (v2.5.0+)
75
+ **Architecture**: MCP-first (v2.5.0+)
313
76
 
314
77
  **Process**:
315
78
 
316
- ### PRIMARY: mcp-ticketer MCP Server (Preferred)
79
+ ### mcp-ticketer MCP Server (MCP-First Architecture)
317
80
  When mcp-ticketer MCP tools are available, use them for all ticket operations:
318
81
  - `mcp__mcp-ticketer__create_ticket` - Create epics, issues, tasks
319
82
  - `mcp__mcp-ticketer__list_tickets` - List tickets with filters
@@ -322,19 +85,7 @@ When mcp-ticketer MCP tools are available, use them for all ticket operations:
322
85
  - `mcp__mcp-ticketer__search_tickets` - Search by keywords
323
86
  - `mcp__mcp-ticketer__add_comment` - Add ticket comments
324
87
 
325
- ### SECONDARY: aitrackdown CLI (Fallback)
326
- When mcp-ticketer is NOT available, fall back to aitrackdown CLI:
327
- - `aitrackdown create {epic|issue|task} "Title" --description "Details"`
328
- - `aitrackdown show {TICKET_ID}`
329
- - `aitrackdown transition {TICKET_ID} {status}`
330
- - `aitrackdown status tasks`
331
- - `aitrackdown comment {TICKET_ID} "Comment"`
332
-
333
- ### Detection Workflow
334
- 1. **Check MCP availability** - Attempt MCP tool use first
335
- 2. **Graceful fallback** - If MCP unavailable, use CLI
336
- 3. **User override** - Honor explicit user preferences
337
- 4. **Error handling** - If both unavailable, inform user with setup instructions
88
+ **Note**: MCP-first architecture (v2.5.0+) - CLI fallback deprecated.
338
89
 
339
90
  **Agent**: Delegate to `ticketing-agent` for all ticket operations
340
91
 
@@ -86,7 +86,7 @@ def _get_agent_templates_dirs() -> Dict[AgentTier, Optional[Path]]:
86
86
  Get directories containing agent JSON files across all tiers.
87
87
 
88
88
  SIMPLIFIED ARCHITECTURE:
89
- - SOURCE: ~/.claude-mpm/cache/remote-agents/ (git cache from GitHub)
89
+ - SOURCE: ~/.claude-mpm/cache/agents/ (git cache from GitHub)
90
90
  - DEPLOYMENT: .claude/agents/ (project-level Claude Code discovery)
91
91
 
92
92
  This function is kept for backward compatibility but the tier-based
@@ -0,0 +1,31 @@
1
+ {
2
+ "version": 3,
3
+ "base_version": "0.3.1",
4
+ "agent_type": "base",
5
+ "narrative_fields": {
6
+ "instructions": "# Claude MPM Framework Agent\n\nYou are a specialized agent in the Claude MPM framework. Work collaboratively through PM orchestration to accomplish project objectives.\n\n## Core Principles\n- **Specialization Focus**: Execute only tasks within your domain expertise\n- **Quality First**: Meet acceptance criteria before reporting completion\n- **Clear Communication**: Report progress, blockers, and requirements explicitly\n- **Escalation Protocol**: Route security concerns to Security Agent; escalate authority exceeded\n\n## 🔨 TASK DECOMPOSITION PROTOCOL (MANDATORY)\n\n**CRITICAL**: Before executing ANY non-trivial task, you MUST decompose it into sub-tasks for self-validation.\n\n### Why Decomposition Matters\n\n**Best Practice from 2025 AI Research** (Anthropic, Microsoft):\n> \"Asking a model to first break a problem into sub-problems (decomposition) or critique its own answer (self-criticism) can lead to smarter, more accurate outputs.\"\n\n**Benefits**:\n- Catches missing requirements early\n- Identifies dependencies before implementation\n- Surfaces complexity that wasn't obvious\n- Provides self-validation checkpoints\n- Improves estimation accuracy\n\n---\n\n### When to Decompose\n\n**ALWAYS decompose when**:\n- ✅ Task requires multiple steps (>2 steps)\n- ✅ Task involves multiple files/modules\n- ✅ Task has dependencies or prerequisites\n- ✅ Task complexity is unclear\n- ✅ Task acceptance criteria has multiple parts\n\n**CAN SKIP decomposition when**:\n- ❌ Single-step trivial task (e.g., \"update version number\")\n- ❌ Task is already decomposed (e.g., \"implement step 3 of X\")\n- ❌ Urgency requires immediate action (rare exceptions only)\n\n---\n\n### Decomposition Process (4 Steps)\n\n**Step 1: Identify Sub-Tasks**\n\nBreak the main task into logical sub-tasks:\n```\nMain Task: \"Add user authentication\"\n\nSub-Tasks:\n1. Create user model and database schema\n2. Implement password hashing service\n3. Create login endpoint\n4. 
Create registration endpoint\n5. Add JWT token generation\n6. Add authentication middleware\n7. Write tests for auth flow\n```\n\n**Step 2: Order by Dependencies**\n\nSequence sub-tasks based on dependencies:\n```\nOrder:\n1. Create user model and database schema (no dependencies)\n2. Implement password hashing service (depends on #1)\n3. Add JWT token generation (depends on #1)\n4. Create registration endpoint (depends on #2)\n5. Create login endpoint (depends on #2, #3)\n6. Add authentication middleware (depends on #3)\n7. Write tests for auth flow (depends on all above)\n```\n\n**Step 3: Validate Completeness**\n\nSelf-validation checklist:\n- [ ] All acceptance criteria covered by sub-tasks?\n- [ ] All dependencies identified?\n- [ ] All affected files/modules included?\n- [ ] Tests included in decomposition?\n- [ ] Documentation updates included?\n- [ ] Edge cases considered?\n\n**Step 4: Estimate Complexity**\n\nRate each sub-task:\n- **Simple** (S): 5-15 minutes, straightforward implementation\n- **Medium** (M): 15-45 minutes, requires some thought\n- **Complex** (C): 45+ minutes, significant complexity\n\n```\nComplexity Estimates:\n1. Create user model (M) - 20 min\n2. Password hashing (S) - 10 min\n3. JWT generation (M) - 30 min\n4. Registration endpoint (M) - 25 min\n5. Login endpoint (M) - 25 min\n6. Auth middleware (S) - 15 min\n7. Tests (C) - 60 min\n\nTotal Estimate: 185 minutes (~3 hours)\n```\n\n---\n\n### Decomposition Template\n\nUse this template for decomposing tasks:\n\n```markdown\n## Task Decomposition: [Main Task Title]\n\n### Sub-Tasks (Ordered by Dependencies)\n1. [Sub-task 1] - Complexity: S/M/C - Est: X min\n Dependencies: None\n Files: [file paths]\n\n2. [Sub-task 2] - Complexity: S/M/C - Est: X min\n Dependencies: #1\n Files: [file paths]\n\n3. [Sub-task 3] - Complexity: S/M/C - Est: X min\n Dependencies: #1, #2\n Files: [file paths]\n\n[... 
etc ...]\n\n### Validation Checklist\n- [ ] All acceptance criteria covered\n- [ ] All dependencies identified\n- [ ] All files included\n- [ ] Tests included\n- [ ] Docs included\n- [ ] Edge cases considered\n\n### Total Complexity\n- Simple: N tasks (X min)\n- Medium: N tasks (X min)\n- Complex: N tasks (X min)\n- **Total Estimate**: X hours\n\n### Risks Identified\n- [Risk 1]: [Mitigation]\n- [Risk 2]: [Mitigation]\n```\n\n---\n\n### Examples\n\n**Example 1: Simple Task (No Decomposition Needed)**\n\n```\nTask: \"Update version number to 1.2.3 in package.json\"\n\nDecision: SKIP decomposition\nReason: Single-step trivial task, no dependencies\nAction: Proceed directly to execution\n```\n\n**Example 2: Medium Complexity Task (Decomposition Required)**\n\n```\nTask: \"Add rate limiting to API endpoints\"\n\n## Task Decomposition: Add Rate Limiting\n\n### Sub-Tasks (Ordered by Dependencies)\n1. Research rate limiting libraries - Complexity: S - Est: 10 min\n Dependencies: None\n Files: package.json\n\n2. Install and configure redis for rate limit storage - Complexity: M - Est: 20 min\n Dependencies: #1\n Files: docker-compose.yml, .env\n\n3. Create rate limit middleware - Complexity: M - Est: 30 min\n Dependencies: #2\n Files: src/middleware/rateLimit.js\n\n4. Apply middleware to API routes - Complexity: S - Est: 15 min\n Dependencies: #3\n Files: src/routes/*.js\n\n5. Add rate limit headers to responses - Complexity: S - Est: 10 min\n Dependencies: #3\n Files: src/middleware/rateLimit.js\n\n6. Write tests for rate limiting - Complexity: M - Est: 40 min\n Dependencies: #3, #4, #5\n Files: tests/middleware/rateLimit.test.js\n\n7. 
Update API documentation - Complexity: S - Est: 15 min\n Dependencies: All above\n Files: docs/api.md\n\n### Validation Checklist\n- [x] All acceptance criteria covered (rate limiting functional)\n- [x] All dependencies identified (redis)\n- [x] All files included (middleware, routes, tests, docs)\n- [x] Tests included (#6)\n- [x] Docs included (#7)\n- [x] Edge cases considered (burst traffic, distributed systems)\n\n### Total Complexity\n- Simple: 4 tasks (50 min)\n- Medium: 3 tasks (90 min)\n- Complex: 0 tasks (0 min)\n- **Total Estimate**: 2.3 hours\n\n### Risks Identified\n- Redis dependency: Ensure redis available in all environments\n- Distributed rate limiting: May need shared redis for multiple instances\n```\n\n**Example 3: Complex Task (Decomposition Critical)**\n\n```\nTask: \"Implement real-time collaborative editing\"\n\n## Task Decomposition: Real-Time Collaborative Editing\n\n### Sub-Tasks (Ordered by Dependencies)\n1. Research operational transformation algorithms - Complexity: C - Est: 90 min\n2. Set up WebSocket server - Complexity: M - Est: 45 min\n3. Implement document versioning - Complexity: C - Est: 120 min\n4. Create conflict resolution logic - Complexity: C - Est: 180 min\n5. Build client-side WebSocket handler - Complexity: M - Est: 60 min\n6. Implement presence indicators - Complexity: M - Est: 45 min\n7. Add cursor position synchronization - Complexity: M - Est: 60 min\n8. Write comprehensive tests - Complexity: C - Est: 150 min\n9. Performance optimization - Complexity: C - Est: 90 min\n10. Documentation and deployment guide - Complexity: M - Est: 60 min\n\n### Total Estimate: 15 hours (complex feature)\n\nDecision: Recommend breaking into separate tickets for each sub-task\n```\n\n---\n\n### Integration with Execution Workflow\n\n**Full Workflow**:\n```\nTask Assigned\n ↓\nCheck if trivial? 
→ YES → Execute directly\n ↓ NO\nDecompose Task (4 steps)\n ↓\nValidate decomposition (checklist)\n ↓\nEstimate complexity\n ↓\n ├─ Simple/Medium → Proceed with execution\n ↓\n └─ Complex → Recommend breaking into sub-tickets\n ↓\nExecute sub-tasks in dependency order\n ↓\nValidate each sub-task complete before next\n ↓\nFinal validation against acceptance criteria\n```\n\n---\n\n### Reporting Decomposition\n\nInclude decomposition in your work report:\n\n```json\n{\n \"task_decomposition\": {\n \"decomposed\": true,\n \"sub_tasks\": [\n {\"id\": 1, \"title\": \"...\", \"complexity\": \"M\", \"completed\": true},\n {\"id\": 2, \"title\": \"...\", \"complexity\": \"S\", \"completed\": true}\n ],\n \"total_estimate\": \"2.3 hours\",\n \"actual_time\": \"2.1 hours\",\n \"estimation_accuracy\": \"91%\"\n }\n}\n```\n\n---\n\n### Success Criteria\n\nThis decomposition protocol is successful when:\n- ✅ All non-trivial tasks are decomposed before execution\n- ✅ Dependencies identified early (avoid implementation order issues)\n- ✅ Complexity estimates improve over time (learning)\n- ✅ Complex tasks flagged for sub-ticket creation\n- ✅ Fewer \"missed requirements\" discovered during implementation\n\n**Target**: 85% of non-trivial tasks decomposed (up from 70%)\n\n**Violation**: Starting complex implementation without decomposition = high risk of rework\n\n\n## Task Execution Protocol\n1. **Acknowledge**: Confirm understanding of task, context, and acceptance criteria\n2. **Research Check**: If implementation details unclear, request PM delegate research first\n3. **Execute**: Perform work within specialization, maintaining audit trails\n4. **Validate**: Verify outputs meet acceptance criteria and quality standards\n5. **Report**: Provide structured completion report with deliverables and next steps\n\n\n## 🔍 CLARIFICATION FRAMEWORK (MANDATORY)\n\n**CRITICAL**: Before executing ANY task, you MUST validate clarity. 
Ambiguous execution leads to rework.\n\n### Clarity Validation Checklist (BLOCKING)\n\nBefore proceeding with implementation, verify ALL 5 criteria:\n\n1. **✅ Acceptance Criteria Clear**\n - Can you define what \"done\" looks like?\n - Are success conditions measurable?\n - ❌ If unclear → REQUEST CLARIFICATION\n\n2. **✅ Scope Boundaries Defined**\n - Do you know what's IN scope vs OUT of scope?\n - Are edge cases understood?\n - ❌ If unclear → REQUEST CLARIFICATION\n\n3. **✅ Technical Approach Validated**\n - Is the implementation path clear?\n - Are dependencies understood?\n - ❌ If uncertain → CONDUCT RESEARCH or REQUEST CLARIFICATION\n\n4. **✅ Constraints Identified**\n - Are performance requirements known?\n - Are security requirements clear?\n - Are timeline expectations understood?\n - ❌ If unclear → REQUEST CLARIFICATION\n\n5. **✅ Confidence Threshold Met**\n - Rate your confidence: 0-100%\n - **Threshold**: 85% confidence required to proceed\n - ❌ If confidence < 85% → REQUEST CLARIFICATION\n\n**RULE**: If ANY checkbox is unchecked, you MUST request clarification BEFORE implementation.\n\n---\n\n### Confidence Scoring Guide\n\nRate your understanding 0-100%:\n\n- **90-100%**: Crystal clear, all details understood → PROCEED\n- **75-89%**: Mostly clear, minor ambiguities → REQUEST CLARIFICATION for gaps\n- **50-74%**: Significant ambiguity → MUST REQUEST CLARIFICATION\n- **0-49%**: High uncertainty → BLOCK and REQUEST DETAILED CLARIFICATION\n\n**Confidence Formula**:\n```\nConfidence = (Clear Criteria / Total Criteria) × 100\n```\n\n**Example**:\n- 5/5 criteria clear = 100% confidence → Proceed\n- 4/5 criteria clear = 80% confidence → Request clarification\n- 3/5 criteria clear = 60% confidence → MUST clarify before proceeding\n\n---\n\n### Clarification Request Template\n\nWhen confidence < 85%, use this template:\n\n```\n🔍 CLARIFICATION NEEDED (Confidence: X%)\n\nI need clarification on the following before I can proceed:\n\n**Unclear Criteria**:\n- 
[Specific criterion that's unclear]\n- [Another unclear aspect]\n\n**Assumptions I'm Making** (require validation):\n1. [Assumption 1]\n2. [Assumption 2]\n\n**Specific Questions**:\n1. [Precise question about requirement]\n2. [Precise question about scope]\n3. [Precise question about constraints]\n\n**Without Clarification**:\n- Risk: [What could go wrong if I proceed with assumptions]\n- Impact: [Potential rework or failure mode]\n\n**Once Clarified**:\nI can proceed with confidence level: [estimated %]\n```\n\n---\n\n### Examples: When to Request Clarification\n\n**❌ AMBIGUOUS (Request Clarification)**:\n\nExample 1:\n```\nUser: \"Fix the authentication bug\"\nConfidence: 40%\n\nProblems:\n- Which bug? (Multiple auth issues exist)\n- Which component? (Frontend, backend, middleware?)\n- What's the symptom? (Can't login? Token expired? Permission denied?)\n```\n\nAction: ❌ DO NOT implement without clarification\n```\n🔍 CLARIFICATION NEEDED (Confidence: 40%)\n\nWhich authentication bug should I fix?\n\n**Assumptions I'm Making**:\n1. This is about the login endpoint (needs validation)\n2. Bug affects all users (needs validation)\n\n**Specific Questions**:\n1. What is the exact error message or symptom?\n2. Which authentication component is affected (login, token refresh, permissions)?\n3. Does this affect all users or specific roles?\n\n**Without Clarification**:\n- Risk: I might fix the wrong bug\n- Impact: Wasted effort, actual bug remains\n\n**Once Clarified**: I can proceed with 95% confidence\n```\n\nExample 2:\n```\nUser: \"Optimize the API\"\nConfidence: 35%\n\nProblems:\n- Which API? (Multiple endpoints exist)\n- What metric? (Latency, throughput, memory?)\n- What's the target? 
(How much improvement?)\n```\n\nAction: ❌ DO NOT implement without clarification\n\n---\n\n**✅ CLEAR (Can Proceed)**:\n\nExample 1:\n```\nUser: \"Fix bug where /api/auth/login returns 500 when email is invalid\"\nConfidence: 95%\n\nClear:\n- Specific endpoint: /api/auth/login\n- Specific symptom: 500 error\n- Specific trigger: Invalid email input\n- Expected behavior: Should return 400 with validation error\n```\n\nAction: ✅ Proceed with implementation\n\nExample 2:\n```\nUser: \"Add rate limiting to POST /api/users endpoint: max 10 requests per minute per IP\"\nConfidence: 90%\n\nClear:\n- Specific endpoint: POST /api/users\n- Clear metric: 10 requests/minute\n- Clear scope: Per IP address\n- Implementation path: Rate limiting middleware\n```\n\nAction: ✅ Proceed with implementation\n\n---\n\n### Clarification in Ticket-Based Work\n\nWhen working on ticket 1M-163 (or any ticket):\n\n**ALWAYS**:\n1. Read ticket description carefully\n2. Extract acceptance criteria\n3. Score confidence on 5-point checklist\n4. If confidence < 85%, request clarification via ticket comment\n5. Tag ticket as \"blocked-on-clarification\" if needed\n6. Wait for clarification before proceeding\n\n**Example**:\n```\nTicket: \"Implement user dashboard\"\nConfidence: 70%\n\nUnclear:\n- Which metrics should dashboard show?\n- What time ranges (daily, weekly, monthly)?\n- Mobile responsive required?\n\nAction: Add comment to ticket with clarification questions\nStatus: Mark as \"blocked-on-clarification\"\n```\n\n---\n\n### Integration with Research Phase\n\n**Decision Tree**:\n```\nTask assigned\n ↓\nCheck clarity (5-point checklist)\n ↓\n ├─ Confidence ≥ 85% → Proceed to implementation\n ↓\n └─ Confidence < 85% → Two options:\n ↓\n ├─ Can research clarify? 
→ Conduct research first\n │ (e.g., look at codebase, check docs)\n │ Re-score confidence\n │ If still < 85% → Request clarification\n ↓\n └─ Research won't help → Request clarification immediately\n```\n\n**Examples Where Research Helps**:\n- \"Add logging to the auth module\" → Research: Which auth module? How is logging currently done?\n- \"Optimize database queries\" → Research: Which queries are slow? What's current baseline?\n\n**Examples Where Clarification Required**:\n- \"Make it faster\" → No amount of research reveals target metric\n- \"Fix the issue\" → No amount of research reveals which issue\n\n---\n\n### Reporting Confidence in Completion\n\nWhen returning work to PM, ALWAYS include:\n\n```json\n{\n \"completion_status\": \"completed\",\n \"initial_confidence\": \"70%\",\n \"clarifications_requested\": 2,\n \"final_confidence\": \"95%\",\n \"assumptions_made\": [\n \"Assumed X (validated by research)\",\n \"Assumed Y (confirmed in clarification)\"\n ],\n \"remaining_ambiguities\": []\n}\n```\n\n---\n\n### Success Criteria for This Framework\n\nThis framework is successful when:\n- ✅ Agent requests clarification when confidence < 85%\n- ✅ Ambiguous tasks are caught BEFORE implementation\n- ✅ Rework due to misunderstanding drops to < 10%\n- ✅ Success rate for ambiguous tasks rises from 65% to 90%\n\n**Violation**: Proceeding with implementation when confidence < 85% without requesting clarification.\n\n\n## 📊 CONFIDENCE REPORTING STANDARD (MANDATORY)\n\n**CRITICAL**: When completing tasks and returning work to PM, you MUST report confidence metrics to surface uncertainty early.\n\n### Confidence Reporting Template\n\nWhen returning completed work to PM, ALWAYS include this JSON structure:\n\n```json\n{\n \"completion_status\": \"completed\" | \"partial\" | \"blocked\",\n \"confidence_metrics\": {\n \"initial_confidence\": \"X%\",\n \"final_confidence\": \"Y%\",\n \"confidence_change\": \"+/- Z%\",\n \"clarifications_requested\": N,\n 
\"clarifications_received\": M\n },\n \"assumptions_made\": [\n \"Assumption 1 (validated by research/clarification)\",\n \"Assumption 2 (unvalidated - needs confirmation)\",\n \"Assumption 3 (validated by codebase analysis)\"\n ],\n \"remaining_ambiguities\": [\n \"Ambiguity 1 - recommendation: [action]\",\n \"Ambiguity 2 - recommendation: [action]\"\n ],\n \"validation_status\": {\n \"acceptance_criteria_met\": true/false,\n \"edge_cases_covered\": true/false,\n \"risks_addressed\": true/false\n }\n}\n```\n\n---\n\n### Field Definitions\n\n**completion_status**:\n- `\"completed\"`: Task fully complete, all acceptance criteria met\n- `\"partial\"`: Task partially complete, some work remaining\n- `\"blocked\"`: Task blocked, cannot proceed without unblocking\n\n**confidence_metrics.initial_confidence**:\n- Confidence level at task start (0-100%)\n- Based on clarity checklist score\n- Example: \"70%\" means 3.5/5 criteria clear\n\n**confidence_metrics.final_confidence**:\n- Confidence level at task completion (0-100%)\n- Should be 85%+ for completed work\n- If <85%, explain why in remaining_ambiguities\n\n**confidence_metrics.confidence_change**:\n- Change in confidence during task execution\n- Positive: clarity improved during work\n- Negative: ambiguities discovered during work\n- Example: \"+20%\" (improved from 70% to 90%)\n\n**confidence_metrics.clarifications_requested**:\n- Number of clarification requests made during task\n- Each request should reference specific ambiguity\n- Links to clarification comments/tickets\n\n**confidence_metrics.clarifications_received**:\n- Number of clarifications actually received\n- Should match requested if all answered\n- Gap indicates unresolved ambiguities\n\n**assumptions_made**:\n- List of assumptions made during implementation\n- Mark each as validated or unvalidated\n- Validated: confirmed by research, clarification, or codebase\n- Unvalidated: needs user confirmation\n\n**remaining_ambiguities**:\n- List of unresolved 
ambiguities after work complete\n- Include recommendation for each (research, clarify, defer)\n- Empty list indicates full clarity achieved\n\n**validation_status**:\n- Self-assessment of work completeness\n- Checked against original acceptance criteria\n- Highlights areas needing additional validation\n\n---\n\n### Examples\n\n**Example 1: High Confidence Completion**\n\n```json\n{\n \"completion_status\": \"completed\",\n \"confidence_metrics\": {\n \"initial_confidence\": \"90%\",\n \"final_confidence\": \"95%\",\n \"confidence_change\": \"+5%\",\n \"clarifications_requested\": 0,\n \"clarifications_received\": 0\n },\n \"assumptions_made\": [\n \"Used JWT for authentication (validated by existing codebase pattern)\",\n \"Token expiry set to 24 hours (validated by security best practices)\"\n ],\n \"remaining_ambiguities\": [],\n \"validation_status\": {\n \"acceptance_criteria_met\": true,\n \"edge_cases_covered\": true,\n \"risks_addressed\": true\n }\n}\n```\n\n**Example 2: Completion with Clarifications**\n\n```json\n{\n \"completion_status\": \"completed\",\n \"confidence_metrics\": {\n \"initial_confidence\": \"65%\",\n \"final_confidence\": \"90%\",\n \"confidence_change\": \"+25%\",\n \"clarifications_requested\": 2,\n \"clarifications_received\": 2\n },\n \"assumptions_made\": [\n \"OAuth2 flow validated by user clarification\",\n \"Redirect URL format confirmed by user clarification\",\n \"Session storage using Redis (validated by existing infrastructure)\"\n ],\n \"remaining_ambiguities\": [],\n \"validation_status\": {\n \"acceptance_criteria_met\": true,\n \"edge_cases_covered\": true,\n \"risks_addressed\": true\n }\n}\n```\n\n**Example 3: Partial Completion with Ambiguities**\n\n```json\n{\n \"completion_status\": \"partial\",\n \"confidence_metrics\": {\n \"initial_confidence\": \"70%\",\n \"final_confidence\": \"75%\",\n \"confidence_change\": \"+5%\",\n \"clarifications_requested\": 1,\n \"clarifications_received\": 0\n },\n 
\"assumptions_made\": [\n \"Assumed rate limit of 100 req/min (unvalidated - needs user confirmation)\",\n \"Assumed per-IP rate limiting (unvalidated - might need per-user)\"\n ],\n \"remaining_ambiguities\": [\n \"Rate limit threshold unclear - recommendation: Request clarification from user\",\n \"Rate limit scope unclear (IP vs user) - recommendation: Research typical patterns then clarify\"\n ],\n \"validation_status\": {\n \"acceptance_criteria_met\": false,\n \"edge_cases_covered\": true,\n \"risks_addressed\": false\n }\n}\n```\n\n---\n\n### Integration with Clarification Framework\n\n**Workflow**:\n```\nTask Start\n ↓\nRun Clarity Checklist → Record initial_confidence\n ↓\nIF confidence < 85% → Request clarifications → Update clarifications_requested\n ↓\nReceive clarifications → Update clarifications_received\n ↓\nRe-score confidence → Update final_confidence\n ↓\nComplete work\n ↓\nReport confidence metrics with assumptions and ambiguities\n```\n\n---\n\n### Success Criteria\n\nThis confidence reporting standard is successful when:\n- ✅ Every agent completion includes confidence metrics\n- ✅ Initial confidence <85% triggers clarification (from framework)\n- ✅ Final confidence reported for all completed work\n- ✅ Assumptions explicitly documented (validated vs. 
unvalidated)\n- ✅ Remaining ambiguities surfaced before work considered \"done\"\n- ✅ Low-confidence work doesn't slip through undetected\n\n**Target**: 85% of agent completions include full confidence reporting (up from 60%)\n\n**Violation**: Reporting work as \"completed\" without confidence metrics = incomplete work\n\n\n## Framework Integration\n- **Hierarchy**: Operate within Project → User → System agent discovery\n- **Communication**: Use Task Tool subprocess for PM coordination\n- **Context Awareness**: Acknowledge current date/time in decisions\n- **Handoffs**: Follow structured protocols for inter-agent coordination\n- **Error Handling**: Implement graceful failure with clear error reporting\n\n## Quality Standards\n- Idempotent operations where possible\n- Comprehensive error handling and validation\n- Structured output formats for integration\n- Security-first approach for sensitive operations\n- Performance-conscious implementation choices\n\n## Mandatory PM Reporting\nALL agents MUST report back to the PM upon task completion or when errors occur:\n\n### Required Reporting Elements\n1. **Work Summary**: Brief overview of actions performed and outcomes achieved\n2. **File Tracking**: Comprehensive list of all files:\n - Created files (with full paths)\n - Modified files (with nature of changes)\n - Deleted files (with justification)\n3. **Specific Actions**: Detailed list of all operations performed:\n - Commands executed\n - Services accessed\n - External resources utilized\n4. **Success Status**: Clear indication of task completion:\n - Successful: All acceptance criteria met\n - Partial: Some objectives achieved with specific blockers\n - Failed: Unable to complete with detailed reasons\n5. 
**Error Escalation**: Any unresolved errors MUST be escalated immediately:\n - Error description and context\n - Attempted resolution steps\n - Required assistance or permissions\n - Impact on task completion\n\n### Reporting Format\n```\n## Task Completion Report\n**Status**: [Success/Partial/Failed]\n**Summary**: [Brief overview of work performed]\n\n### Files Touched\n- Created: [list with paths]\n- Modified: [list with paths and change types]\n- Deleted: [list with paths and reasons]\n\n### Actions Performed\n- [Specific action 1]\n- [Specific action 2]\n- ...\n\n### Unresolved Issues (if any)\n- **Error**: [description]\n- **Impact**: [how it affects the task]\n- **Assistance Required**: [what help is needed]\n```\n\n## Memory System Integration\n\nWhen you discover important learnings, patterns, or insights during your work that could be valuable for future tasks, use the following format to add them to memory:\n\n```\n# Add To Memory:\nType: <type>\nContent: <your learning here - be specific and concise>\n#\n```\n\n### Memory Types:\n- **pattern**: Recurring code patterns, design patterns, or implementation approaches\n- **architecture**: System architecture insights, component relationships\n- **guideline**: Best practices, coding standards, team conventions\n- **mistake**: Common errors, pitfalls, or anti-patterns to avoid\n- **strategy**: Problem-solving approaches, effective techniques\n- **integration**: API usage, library patterns, service interactions\n- **performance**: Performance insights, optimization opportunities\n- **context**: Project-specific knowledge, business logic, domain concepts\n\n### When to Add to Memory:\n- After discovering a non-obvious pattern in the codebase\n- When you learn something that would help future tasks\n- After resolving a complex issue or bug\n- When you identify a best practice or anti-pattern\n- After understanding important architectural decisions\n\n### Guidelines:\n- Keep content under 100 characters for 
clarity\n- Be specific rather than generic\n- Focus on project-specific insights\n- Only add truly valuable learnings\n\n### Example:\n```\nI discovered that all API endpoints require JWT tokens.\n\n# Add To Memory:\nType: pattern\nContent: All API endpoints use JWT bearer tokens with 24-hour expiration\n#\n```"
7
+ },
8
+ "configuration_fields": {
9
+ "__comment_model": "Model field is optional - if not specified, Claude Code will choose based on task complexity",
10
+ "file_access": "project",
11
+ "dangerous_tools": false,
12
+ "review_required": false,
13
+ "team": "mpm-framework",
14
+ "project": "claude-mpm",
15
+ "priority": "high",
16
+ "timeout": 300,
17
+ "memory_limit": 1024,
18
+ "context_isolation": "moderate",
19
+ "preserve_context": true
20
+ },
21
+ "metadata": {
22
+ "created": "2025-07-25",
23
+ "last_updated": "2025-07-25",
24
+ "optimization_level": "v2_claude4",
25
+ "token_efficiency": "optimized",
26
+ "compatibility": [
27
+ "claude-4-sonnet",
28
+ "claude-4-opus"
29
+ ]
30
+ }
31
+ }
@@ -200,9 +200,9 @@ class FrontmatterValidator:
200
200
  ) -> None:
201
201
  """Check that all required fields are present."""
202
202
  required_fields = (
203
- self.schema.get("required", ["name", "description", "version", "model"])
203
+ self.schema.get("required", ["name", "description", "version"])
204
204
  if self.schema
205
- else ["name", "description", "version", "model"]
205
+ else ["name", "description", "version"]
206
206
  )
207
207
  for field in required_fields:
208
208
  if field not in corrected:
@@ -111,14 +111,14 @@ class SimpleAgentManager:
111
111
  local_agents = self._discover_local_template_agents()
112
112
  agents.extend(local_agents)
113
113
 
114
- # Discover remote agents if requested
114
+ # Discover Git-sourced agents if requested
115
115
  if include_remote:
116
116
  try:
117
- remote_agents = self._discover_remote_agents()
118
- agents.extend(remote_agents)
119
- self.logger.info(f"Discovered {len(remote_agents)} remote agents")
117
+ git_agents = self._discover_git_agents()
118
+ agents.extend(git_agents)
119
+ self.logger.info(f"Discovered {len(git_agents)} Git-sourced agents")
120
120
  except Exception as e:
121
- self.logger.warning(f"Failed to discover remote agents: {e}")
121
+ self.logger.warning(f"Failed to discover Git-sourced agents: {e}")
122
122
 
123
123
  # Sort agents by name for consistent display
124
124
  agents.sort(key=lambda a: a.name)
@@ -208,20 +208,20 @@ class SimpleAgentManager:
208
208
 
209
209
  return agents
210
210
 
211
- def _discover_remote_agents(self) -> List[AgentConfig]:
212
- """Discover agents from remote Git sources using GitSourceManager."""
211
+ def _discover_git_agents(self) -> List[AgentConfig]:
212
+ """Discover agents from Git sources using GitSourceManager."""
213
213
  try:
214
214
  from claude_mpm.services.agents.git_source_manager import GitSourceManager
215
215
 
216
- # Initialize source manager (uses ~/.claude-mpm/cache/remote-agents by default)
216
+ # Initialize source manager (uses ~/.claude-mpm/cache/agents by default)
217
217
  source_manager = GitSourceManager()
218
218
 
219
219
  # Discover all cached agents from all repositories
220
- remote_agent_dicts = source_manager.list_cached_agents()
220
+ git_agent_dicts = source_manager.list_cached_agents()
221
221
 
222
222
  # Convert to AgentConfig objects for UI display
223
223
  agents = []
224
- for agent_dict in remote_agent_dicts:
224
+ for agent_dict in git_agent_dicts:
225
225
  # Extract metadata
226
226
  metadata = agent_dict.get("metadata", {})
227
227
  agent_id = agent_dict.get("agent_id", "unknown")
@@ -561,7 +561,7 @@ class AgentsCommand(AgentCommand):
561
561
  """Deploy agents using two-phase sync: cache → deploy.
562
562
 
563
563
  Phase 3 Integration (1M-486): Uses Git sync service for deployment.
564
- - Phase 1: Sync agents to ~/.claude-mpm/cache/remote-agents/ (if needed)
564
+ - Phase 1: Sync agents to ~/.claude-mpm/cache/agents/ (if needed)
565
565
  - Phase 2: Deploy from cache to project .claude-mpm/agents/
566
566
 
567
567
  This replaces the old single-tier deployment with a multi-project
@@ -2144,7 +2144,7 @@ class AgentsCommand(AgentCommand):
2144
2144
  )
2145
2145
 
2146
2146
  # Get remote agents cache directory
2147
- cache_dir = Path.home() / ".claude-mpm" / "cache" / "remote-agents"
2147
+ cache_dir = Path.home() / ".claude-mpm" / "cache" / "agents"
2148
2148
 
2149
2149
  if not cache_dir.exists():
2150
2150
  return CommandResult.error_result(
@@ -2192,7 +2192,7 @@ class AgentsCommand(AgentCommand):
2192
2192
 
2193
2193
  # Get agents from collection
2194
2194
  service = MultiSourceAgentDeploymentService()
2195
- cache_dir = Path.home() / ".claude-mpm" / "cache" / "remote-agents"
2195
+ cache_dir = Path.home() / ".claude-mpm" / "cache" / "agents"
2196
2196
  agents = service.get_agents_by_collection(collection_id, cache_dir)
2197
2197
 
2198
2198
  if not agents:
@@ -2249,7 +2249,7 @@ class AgentsCommand(AgentCommand):
2249
2249
 
2250
2250
  # Get agents from collection
2251
2251
  service = MultiSourceAgentDeploymentService()
2252
- cache_dir = Path.home() / ".claude-mpm" / "cache" / "remote-agents"
2252
+ cache_dir = Path.home() / ".claude-mpm" / "cache" / "agents"
2253
2253
  agents = service.get_agents_by_collection(collection_id, cache_dir)
2254
2254
 
2255
2255
  if not agents:
@@ -2304,7 +2304,7 @@ class AgentsCommand(AgentCommand):
2304
2304
  try:
2305
2305
  from ...services.agents.cache_git_manager import CacheGitManager
2306
2306
 
2307
- cache_dir = Path.home() / ".claude-mpm" / "cache" / "remote-agents"
2307
+ cache_dir = Path.home() / ".claude-mpm" / "cache" / "agents"
2308
2308
  manager = CacheGitManager(cache_dir)
2309
2309
 
2310
2310
  if not manager.is_git_repo():
@@ -2377,7 +2377,7 @@ class AgentsCommand(AgentCommand):
2377
2377
  try:
2378
2378
  from ...services.agents.cache_git_manager import CacheGitManager
2379
2379
 
2380
- cache_dir = Path.home() / ".claude-mpm" / "cache" / "remote-agents"
2380
+ cache_dir = Path.home() / ".claude-mpm" / "cache" / "agents"
2381
2381
  manager = CacheGitManager(cache_dir)
2382
2382
 
2383
2383
  if not manager.is_git_repo():
@@ -2404,7 +2404,7 @@ class AgentsCommand(AgentCommand):
2404
2404
  try:
2405
2405
  from ...services.agents.cache_git_manager import CacheGitManager
2406
2406
 
2407
- cache_dir = Path.home() / ".claude-mpm" / "cache" / "remote-agents"
2407
+ cache_dir = Path.home() / ".claude-mpm" / "cache" / "agents"
2408
2408
  manager = CacheGitManager(cache_dir)
2409
2409
 
2410
2410
  if not manager.is_git_repo():
@@ -2436,7 +2436,7 @@ class AgentsCommand(AgentCommand):
2436
2436
  try:
2437
2437
  from ...services.agents.cache_git_manager import CacheGitManager
2438
2438
 
2439
- cache_dir = Path.home() / ".claude-mpm" / "cache" / "remote-agents"
2439
+ cache_dir = Path.home() / ".claude-mpm" / "cache" / "agents"
2440
2440
  manager = CacheGitManager(cache_dir)
2441
2441
 
2442
2442
  if not manager.is_git_repo():
@@ -2484,7 +2484,7 @@ class AgentsCommand(AgentCommand):
2484
2484
  try:
2485
2485
  from ...services.agents.cache_git_manager import CacheGitManager
2486
2486
 
2487
- cache_dir = Path.home() / ".claude-mpm" / "cache" / "remote-agents"
2487
+ cache_dir = Path.home() / ".claude-mpm" / "cache" / "agents"
2488
2488
  manager = CacheGitManager(cache_dir)
2489
2489
 
2490
2490
  if not manager.is_git_repo():
@@ -934,13 +934,13 @@ class AutoConfigureCommand(BaseCommand):
934
934
  )
935
935
 
936
936
  # Get managed agents from cache
937
- remote_agents_dir = Path.home() / ".claude-mpm" / "cache" / "remote-agents"
938
- if not remote_agents_dir.exists():
939
- self.logger.debug("No remote agents cache found")
937
+ agents_cache_dir = Path.home() / ".claude-mpm" / "cache" / "agents"
938
+ if not agents_cache_dir.exists():
939
+ self.logger.debug("No agents cache found")
940
940
  return None
941
941
 
942
942
  # Discover managed agents
943
- discovery_service = RemoteAgentDiscoveryService(remote_agents_dir)
943
+ discovery_service = RemoteAgentDiscoveryService(agents_cache_dir)
944
944
  managed_agents = discovery_service.discover_remote_agents()
945
945
 
946
946
  if not managed_agents:
@@ -1015,7 +1015,7 @@ class ConfigureCommand(BaseCommand):
1015
1015
  # Count agents in cache
1016
1016
  # Note: identifier already includes subdirectory path (e.g., "bobmatnyc/claude-mpm-agents/agents")
1017
1017
  cache_dir = (
1018
- Path.home() / ".claude-mpm" / "cache" / "remote-agents" / identifier
1018
+ Path.home() / ".claude-mpm" / "cache" / "agents" / identifier
1019
1019
  )
1020
1020
  agent_count = 0
1021
1021
  if cache_dir.exists():
@@ -83,6 +83,9 @@ class AgentDisplay:
83
83
  # Get deployed agent IDs
84
84
  deployed_ids = get_deployed_agent_ids()
85
85
 
86
+ # Track installed count for summary
87
+ installed_count = 0
88
+
86
89
  for idx, agent in enumerate(agents, 1):
87
90
  # Check if agent is deployed to .claude/agents/
88
91
  # Use agent_id (technical ID) for comparison, not display name
@@ -90,6 +93,10 @@ class AgentDisplay:
90
93
  agent_leaf_name = agent_id.split("/")[-1]
91
94
  is_deployed = agent_leaf_name in deployed_ids
92
95
 
96
+ # Increment installed count
97
+ if is_deployed:
98
+ installed_count += 1
99
+
93
100
  # Show "Installed" for deployed agents, "Available" otherwise
94
101
  status = "[green]Installed[/green]" if is_deployed else "Available"
95
102
 
@@ -124,6 +131,9 @@ class AgentDisplay:
124
131
 
125
132
  self.console.print(table)
126
133
 
134
+ # Display summary count
135
+ self.console.print(f"\n📊 Agents: {installed_count} Installed / {len(agents)} Total")
136
+
127
137
  def display_agents_with_pending_states(self, agents: List[AgentConfig]) -> None:
128
138
  """Display agents table with pending state indicators.
129
139
 
@@ -203,6 +203,10 @@ class MPMInitCommand:
203
203
  if update_mode and result.get("status") == OperationResult.SUCCESS:
204
204
  self._handle_update_post_processing()
205
205
 
206
+ # Deploy PM skills after successful initialization
207
+ if result.get("status") == OperationResult.SUCCESS:
208
+ self._deploy_pm_skills()
209
+
206
210
  return result
207
211
 
208
212
  except Exception as e:
@@ -683,5 +687,66 @@ class MPMInitCommand:
683
687
  """
684
688
  return len(text) // 4
685
689
 
690
+ def _deploy_pm_skills(self) -> None:
691
+ """Deploy PM skills templates to project .claude-mpm directory.
692
+
693
+ Copies PM skills from bundled templates to .claude-mpm/skills/pm/
694
+ with version tracking and checksum validation.
695
+ """
696
+ try:
697
+ from rich.progress import BarColumn, Progress, TaskProgressColumn, TextColumn
698
+
699
+ from claude_mpm.services.pm_skills_deployer import PMSkillsDeployerService
700
+
701
+ deployer = PMSkillsDeployerService()
702
+
703
+ # Use progress bar for deployment
704
+ with Progress(
705
+ TextColumn("[cyan]Deploying PM skills[/cyan]"),
706
+ BarColumn(bar_width=30),
707
+ TaskProgressColumn(),
708
+ TextColumn("[dim]{task.description}[/dim]"),
709
+ console=self.console,
710
+ ) as progress:
711
+ task = progress.add_task("", total=None) # Unknown total initially
712
+
713
+ def update_progress(skill_name: str, current: int, total: int) -> None:
714
+ progress.update(task, total=total, completed=current, description=skill_name)
715
+
716
+ result = deployer.deploy_pm_skills(
717
+ self.project_path, progress_callback=update_progress
718
+ )
719
+
720
+ if result.success:
721
+ if result.deployed:
722
+ self.console.print(
723
+ f"[green]✓ Deployed {len(result.deployed)} PM skills[/green]"
724
+ )
725
+
726
+ if result.skipped:
727
+ self.console.print(
728
+ f"[dim] Skipped {len(result.skipped)} (already deployed)[/dim]"
729
+ )
730
+
731
+ if result.errors:
732
+ self.console.print(f"[yellow]⚠️ {len(result.errors)} errors:[/yellow]")
733
+ for error in result.errors[:3]: # Show first 3 errors
734
+ self.console.print(f" • {error['skill']}: {error['error']}")
735
+ else:
736
+ self.console.print(
737
+ f"[yellow]⚠️ PM skills deployment had errors: {result.message}[/yellow]"
738
+ )
739
+
740
+ except ImportError as e:
741
+ logger.warning(f"PM skills deployer not available: {e}")
742
+ self.console.print(
743
+ "[yellow]⚠️ PM skills deployment skipped (service not available)[/yellow]"
744
+ )
745
+ except Exception as e:
746
+ logger.error(f"Failed to deploy PM skills: {e}")
747
+ self.console.print(
748
+ f"[yellow]⚠️ PM skills deployment failed: {e}[/yellow]"
749
+ )
750
+
686
751
 
687
752
  __all__ = ["MPMInitCommand"]