claude-flow-novice 2.6.0 → 2.8.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.claude/adaptive-context/cfn-v3-reflection.json +21 -0
- package/.claude/agents/AGENT_LIFECYCLE.md +495 -0
- package/.claude/agents/CLAUDE.md +1002 -995
- package/.claude/agents/accessibility-advocate.md +457 -0
- package/.claude/agents/agent-principles/README.md +226 -226
- package/.claude/agents/agent-principles/agent-type-guidelines.md +10 -0
- package/.claude/agents/agent-principles/format-selection.md +10 -0
- package/.claude/agents/agent-principles/phase4-template-optimization.md +502 -494
- package/.claude/agents/agent-principles/prompt-engineering.md +8 -0
- package/.claude/agents/agent-principles/quality-metrics.md +8 -0
- package/.claude/agents/analysis/code-analyzer.md +7 -17
- package/.claude/agents/analysis/code-review/analyze-code-quality.md +2 -104
- package/.claude/agents/analysis/perf-analyzer.md +2 -196
- package/.claude/agents/context/context-curator.md +78 -84
- package/.claude/agents/context/context-reflector.md +27 -81
- package/.claude/agents/coordinators/README.md +42 -0
- package/.claude/agents/coordinators/cfn-v3-coordinator.md +440 -0
- package/.claude/agents/{product-owner-team → coordinators}/cto-agent.md +154 -187
- package/.claude/agents/coordinators/multi-sprint-coordinator.md +50 -0
- package/.claude/agents/{product-owner-team → coordinators}/product-owner-agent.md +6 -39
- package/.claude/agents/{cfn-loop → coordinators}/product-owner.md +72 -17
- package/.claude/agents/core-agents/reviewer.md +114 -135
- package/.claude/agents/custom/agent-builder.md +637 -637
- package/.claude/agents/developers/README.md +69 -0
- package/.claude/agents/developers/backend-dev.md +77 -0
- package/.claude/agents/{core-agents → developers}/coder.md +131 -26
- package/.claude/agents/developers/react-frontend-engineer.md +121 -0
- package/.claude/agents/{frontend → developers}/state-architect.md +1 -0
- package/.claude/agents/{frontend → developers}/ui-designer.md +1 -0
- package/.claude/agents/development/backend/dev-backend-api.md +0 -29
- package/.claude/agents/development/npm-package-specialist.md +355 -347
- package/.claude/agents/documentation/api-docs/docs-api-openapi.md +8 -0
- package/.claude/agents/documentation/api-docs.md +8 -0
- package/.claude/agents/github/github-commit-agent.md +125 -117
- package/.claude/agents/goal/goal-planner.md +8 -0
- package/.claude/agents/infrastructure/README.md +100 -0
- package/.claude/agents/{specialized → infrastructure}/devops-engineer.md +131 -150
- package/.claude/agents/planners/README.md +94 -0
- package/.claude/agents/{core-agents → planners}/analyst.md +1 -22
- package/.claude/agents/{planning-team → planners}/api-designer-persona.md +8 -0
- package/.claude/agents/{core-agents → planners}/architect.md +7 -20
- package/.claude/agents/{core-agents → planners}/planner.md +0 -21
- package/.claude/agents/{planning-team → planners}/security-architect-persona.md +8 -28
- package/.claude/agents/{planning-team → planners}/system-architect-persona.md +6 -38
- package/.claude/agents/{architecture → planners}/system-architect.md +12 -17
- package/.claude/agents/product-owner-team/accessibility-advocate-persona.md +132 -161
- package/.claude/agents/product-owner-team/power-user-persona.md +149 -182
- package/.claude/agents/retrospective-analyst.md +84 -0
- package/.claude/agents/reviewers/README.md +58 -0
- package/.claude/agents/{analysis → reviewers}/code-quality-validator.md +8 -17
- package/.claude/agents/reviewers/reviewer.md +181 -0
- package/.claude/agents/sparc/architecture.md +6 -25
- package/.claude/agents/sparc/pseudocode.md +6 -0
- package/.claude/agents/sparc/refinement.md +6 -0
- package/.claude/agents/sparc/specification.md +1 -0
- package/.claude/agents/specialists/README.md +60 -0
- package/.claude/agents/{core-agents → specialists}/base-template-generator.md +8 -21
- package/.claude/agents/{specialized → specialists}/cli-agent-optimizer.md +1 -1
- package/.claude/agents/{specialized → specialists}/code-booster.md +1 -0
- package/.claude/agents/{consensus → specialists}/consensus-builder.md +1 -17
- package/.claude/agents/{specialized/mobile → specialists}/mobile-dev.md +0 -20
- package/.claude/agents/{core-agents → specialists}/performance-benchmarker.md +134 -148
- package/.claude/agents/{specialized → specialists}/rust-developer.md +1 -20
- package/.claude/agents/{specialized → specialists}/rust-enterprise-developer.md +1 -20
- package/.claude/agents/{specialized → specialists}/rust-mvp-developer.md +1 -20
- package/.claude/agents/{core-agents → specialists}/security-manager.md +68 -88
- package/.claude/agents/{security → specialists}/security-specialist-existing.md +6 -57
- package/.claude/agents/{security → specialists}/security-specialist.md +6 -30
- package/.claude/agents/{specialized/mobile → specialists}/spec-mobile-react-native.md +2 -21
- package/.claude/agents/testers/README.md +94 -0
- package/.claude/agents/{testing → testers}/e2e/playwright-agent.md +1 -20
- package/.claude/agents/{testing → testers}/interaction-tester.md +1 -20
- package/.claude/agents/{testing → testers}/playwright-tester.md +1 -1
- package/.claude/agents/testers/tester.md +139 -0
- package/.claude/agents/testers/unit/tdd-london-swarm.md +49 -0
- package/.claude/agents/testers/validation/production-validator.md +33 -0
- package/.claude/agents-ignore/cfn-loop-coordinator.md +157 -0
- package/.claude/agents-ignore/cfn-loop-coordinator.md.backup +156 -0
- package/.claude/agents-ignore/coordinator.md.backup +182 -0
- package/.claude/agents-ignore/cost-savings-cfn-loop-coordinator.md +760 -0
- package/.claude/agents-ignore/cost-savings-coordinator.md +173 -0
- package/.claude/artifacts/ace-reflections/REFLECT-001-summary.json +39 -0
- package/.claude/artifacts/ace-reflections/sprint-7_$(date -u +/"%Y%m%d_%H%M%S/").json" +47 -0
- package/.claude/commands/CFN_COORDINATOR_PARAMETERS.md +10 -10
- package/.claude/commands/cfn-loop-epic.md +3 -3
- package/.claude/commands/cfn-loop-single.md +3 -3
- package/.claude/commands/cfn-loop-sprints.md +1 -1
- package/.claude/commands/cfn-loop.md +3 -3
- package/.claude/commands/cfn-mode.md +20 -0
- package/.claude/commands/write-plan.md +104 -0
- package/.claude/data/cfn-loop.db +0 -0
- package/.claude/data/cfn_loop_logs.db +0 -0
- package/.claude/hooks/BACKUP_USAGE.md +243 -0
- package/.claude/hooks/post-edit-cfn-retrospective.sh +79 -0
- package/.claude/hooks/post-edit.sh +21 -0
- package/.claude/hooks/pre-edit-backup.sh +71 -0
- package/.claude/hooks/restore-from-backup.sh +37 -0
- package/.claude/prompts/cfn-loop-context.md +115 -0
- package/.claude/prompts/loop-specific/loop2.md +50 -0
- package/.claude/prompts/loop-specific/loop3.md +43 -0
- package/.claude/prompts/loop-specific/loop4.md +54 -0
- package/.claude/root-claude-distribute/CLAUDE.md +76 -2
- package/.claude/skills/ace-system/sprint-7-lessons.json +46 -0
- package/.claude/skills/ace-system/store-reflection.sh +33 -136
- package/.claude/skills/agent-discovery/SKILL.md +40 -0
- package/.claude/skills/agent-discovery/agents-registry-clean.json +0 -0
- package/.claude/skills/agent-discovery/agents-registry-fixed.json +19 -0
- package/.claude/skills/agent-discovery/agents-registry.json +718 -0
- package/.claude/skills/agent-discovery/discover-agents.py +175 -0
- package/.claude/skills/agent-discovery/discover-agents.sh +87 -0
- package/.claude/skills/agent-discovery/invoke-registry.sh +11 -0
- package/.claude/skills/agent-discovery/temp_script.py +0 -0
- package/.claude/skills/agent-output-processing/SKILL.md +359 -0
- package/.claude/skills/agent-selector/SKILL.md +90 -0
- package/.claude/skills/agent-selector/select-agents.sh +96 -0
- package/.claude/skills/agent-spawning/agent-selection-guide.md +1 -1
- package/.claude/skills/agent-swap/SKILL.md +36 -0
- package/.claude/skills/agent-swap/recommend-swap.sh +60 -0
- package/.claude/skills/api-validation/test-endpoints.sh +54 -0
- package/.claude/skills/automatic-memory-persistence/SKILL.md +73 -0
- package/.claude/skills/automatic-memory-persistence/persist-agent-output.sh +49 -0
- package/.claude/skills/automatic-memory-persistence/query-agent-history.sh +35 -0
- package/.claude/skills/automatic-memory-persistence/test-memory-persistence.sh +235 -0
- package/.claude/skills/cfn-loop-orchestration/README.md +41 -0
- package/.claude/skills/cfn-loop-orchestration/SKILL.md +299 -0
- package/.claude/skills/cfn-loop-orchestration/helpers/auto-tune-timeouts.sh +228 -0
- package/.claude/skills/cfn-loop-orchestration/helpers/consensus.sh +84 -0
- package/.claude/skills/cfn-loop-orchestration/helpers/deliverable-verifier.sh +71 -0
- package/.claude/skills/cfn-loop-orchestration/helpers/gate-check.sh +90 -0
- package/.claude/skills/cfn-loop-orchestration/helpers/iteration-manager.sh +87 -0
- package/.claude/skills/cfn-loop-orchestration/helpers/timeout-calculator.sh +51 -0
- package/.claude/skills/cfn-loop-orchestration/inject-loop-context.sh +41 -0
- package/.claude/skills/cfn-loop-orchestration/monitor-execution.sh +156 -0
- package/.claude/skills/cfn-loop-orchestration/orchestrate.sh +840 -0
- package/.claude/skills/cfn-loop-orchestration/security_utils.sh +99 -0
- package/.claude/skills/cfn-loop-orchestration/test-cfn-orchestration.sh +281 -0
- package/.claude/skills/cfn-loop-orchestration/test-edge-cases.sh +188 -0
- package/.claude/skills/cfn-loop-validation/SKILL.md +307 -217
- package/.claude/skills/complexity-estimator/SKILL.md +96 -0
- package/.claude/skills/complexity-estimator/estimate-complexity.sh +144 -0
- package/.claude/skills/context-pruner/SKILL.md +75 -0
- package/.claude/skills/context-pruner/prune-context.sh +73 -0
- package/.claude/skills/defense-in-depth/SKILL.md +133 -0
- package/.claude/skills/dependency-extractor/SKILL.md +35 -0
- package/.claude/skills/dependency-extractor/extract-dependencies.sh +66 -0
- package/.claude/skills/epic-decomposer/SKILL.md +44 -0
- package/.claude/skills/epic-decomposer/decompose-epic.sh +104 -0
- package/.claude/skills/improvement-recommender/SKILL.md +33 -0
- package/.claude/skills/improvement-recommender/recommend-improvements.sh +92 -0
- package/.claude/skills/intervention-detector/SKILL.md +39 -0
- package/.claude/skills/intervention-detector/detect-intervention.sh +111 -0
- package/.claude/skills/intervention-orchestrator/SKILL.md +43 -0
- package/.claude/skills/intervention-orchestrator/execute-intervention.sh +59 -0
- package/.claude/skills/loop2-output-processing/SKILL.md +163 -0
- package/.claude/skills/loop2-output-processing/execute-and-extract.sh +77 -0
- package/.claude/skills/loop2-output-processing/execute-and-extract.sh.backup +36 -0
- package/.claude/skills/loop2-output-processing/parse-feedback.sh +147 -0
- package/.claude/skills/loop2-output-processing/process-validator-output.sh +275 -0
- package/.claude/skills/loop2-output-processing/test-bug27-fix.sh +200 -0
- package/.claude/skills/loop2-output-processing/test-loop2-processing.sh +113 -0
- package/.claude/skills/loop3-output-processing/AGENT_COMPLETION_PROTOCOL.md +206 -0
- package/.claude/skills/loop3-output-processing/SKILL.md +421 -0
- package/.claude/skills/loop3-output-processing/calculate-confidence.sh +28 -0
- package/.claude/skills/loop3-output-processing/execute-and-extract.sh +85 -0
- package/.claude/skills/loop3-output-processing/parse-confidence.sh +31 -0
- package/.claude/skills/loop3-output-processing/test-agent-timeout.sh +327 -0
- package/.claude/skills/loop3-output-processing/test-loop3-processing.sh +155 -0
- package/.claude/skills/loop3-output-processing/verify-deliverables.sh +42 -0
- package/.claude/skills/pattern-extraction/SKILL.md +30 -0
- package/.claude/skills/pattern-extraction/extract-patterns.sh +80 -0
- package/.claude/skills/playbook/SKILL.md +113 -0
- package/.claude/skills/playbook/init-playbook.sh +54 -0
- package/.claude/skills/playbook/playbook.db +0 -0
- package/.claude/skills/playbook/query-playbook.sh +79 -0
- package/.claude/skills/playbook/update-playbook.sh +69 -0
- package/.claude/skills/playbook-auto-update/SKILL.md +29 -0
- package/.claude/skills/playbook-auto-update/auto-update-playbook.sh +86 -0
- package/.claude/skills/product-owner-decision/SKILL.md +332 -0
- package/.claude/skills/product-owner-decision/execute-decision.sh +176 -0
- package/.claude/skills/product-owner-decision/parse-decision.sh +66 -0
- package/.claude/skills/product-owner-decision/validate-deliverables.sh +82 -0
- package/.claude/skills/redis-coordination/LOGGING.md +260 -0
- package/.claude/skills/redis-coordination/README.md +30 -29
- package/.claude/skills/redis-coordination/SKILL.md +685 -83
- package/.claude/skills/redis-coordination/analyze-task-complexity.sh +277 -0
- package/.claude/skills/redis-coordination/cfn-loop-exec.sh +468 -0
- package/.claude/skills/redis-coordination/collect-confidence-scores.sh +179 -0
- package/.claude/skills/redis-coordination/collect-results.sh +75 -0
- package/.claude/skills/redis-coordination/data/cfn-loop.db +0 -0
- package/.claude/skills/redis-coordination/{test-orchestrator.sh → demos/test-orchestrator.sh} +25 -0
- package/.claude/skills/redis-coordination/execute-product-owner-decision.sh +258 -0
- package/.claude/skills/redis-coordination/get-agent-timeout.sh +176 -176
- package/.claude/skills/redis-coordination/invoke-waiting-mode.sh +93 -227
- package/.claude/skills/redis-coordination/invoke-waiting-mode.sh.backup-p7 +423 -0
- package/.claude/skills/redis-coordination/log-event.sh +109 -0
- package/.claude/skills/redis-coordination/monitor-cfn-violations.sh +391 -0
- package/.claude/skills/redis-coordination/orchestrate-cfn-loop-v3.sh +141 -0
- package/.claude/skills/redis-coordination/orchestrate-cfn-loop.sh +31 -993
- package/.claude/skills/redis-coordination/orchestrate-cfn-loop.sh.backup +38 -0
- package/.claude/skills/redis-coordination/orchestrate-cfn-loop.sh.backup-1761167675 +1672 -0
- package/.claude/skills/redis-coordination/orchestrate-cfn-loop.sh.backup-p5 +1604 -0
- package/.claude/skills/redis-coordination/orchestrate-cfn-loop.sh.backup-phase1 +1550 -0
- package/.claude/skills/redis-coordination/orchestrate-cfn-loop.sh.backup-phase2 +1621 -0
- package/.claude/skills/redis-coordination/orchestrate-cfn-loop.sh.backup-phase3 +1621 -0
- package/.claude/skills/redis-coordination/orchestrate-cfn-loop.sh.bak +0 -0
- package/.claude/skills/redis-coordination/orchestrate-cfn-loop.sh.broken +1627 -0
- package/.claude/skills/redis-coordination/orchestrate-cfn-loop.sh.corrupted +80 -0
- package/.claude/skills/redis-coordination/orchestrate-cfn-loop.sh.deprecated +1864 -0
- package/.claude/skills/redis-coordination/query-logs.sh +103 -0
- package/.claude/skills/redis-coordination/retrieve-context.sh +58 -0
- package/.claude/skills/redis-coordination/select-specialist-agent.sh +371 -0
- package/.claude/skills/redis-coordination/semantic-match-tfidf.py +252 -0
- package/.claude/skills/redis-coordination/send-heartbeat.sh +164 -72
- package/.claude/skills/redis-coordination/signal.sh +38 -0
- package/.claude/skills/redis-coordination/store-context.sh +86 -0
- package/.claude/skills/redis-coordination/test-context-injection.sh +354 -0
- package/.claude/skills/redis-coordination/test-timeout-enforcement.sh +513 -0
- package/.claude/skills/redis-coordination/tests/convert-line-endings.sh +15 -0
- package/.claude/skills/redis-coordination/tests/dlq-functionality-test.sh +101 -101
- package/.claude/skills/redis-coordination/tests/edge-cases-test.sh +98 -98
- package/.claude/skills/redis-coordination/tests/integration-test.sh +169 -169
- package/.claude/skills/redis-coordination/tests/retry-mechanism-test.sh +81 -81
- package/.claude/skills/redis-coordination/tests/run-test-suite.sh +91 -91
- package/.claude/skills/redis-coordination/tests/run-tests.sh +4 -0
- package/.claude/skills/redis-coordination/tests/test-primitives.sh +166 -0
- package/.claude/skills/redis-coordination/tests/test-utils.sh +53 -121
- package/.claude/skills/redis-coordination/tests/test_coordination_primitives.sh.deprecated +20 -0
- package/.claude/skills/redis-coordination/tests/test_utils.sh +49 -0
- package/.claude/skills/redis-coordination/v2_modularization/core_orchestration.sh +76 -0
- package/.claude/skills/redis-coordination/validate-parameters.sh +492 -0
- package/.claude/skills/retrospective-report/SKILL.md +31 -0
- package/.claude/skills/retrospective-report/generate-report.sh +101 -0
- package/.claude/skills/run-all-skill-tests.sh +124 -0
- package/.claude/skills/scope-simplifier/SKILL.md +37 -0
- package/.claude/skills/scope-simplifier/simplify-scope.sh +68 -0
- package/.claude/skills/simplified-agent-lifecycle/COST_ANALYSIS.md +49 -0
- package/.claude/skills/simplified-agent-lifecycle/DESIGN.md +98 -0
- package/.claude/skills/simplified-agent-lifecycle/MIGRATION_PLAN.md +74 -0
- package/.claude/skills/specialist-injection/SKILL.md +41 -0
- package/.claude/skills/specialist-injection/recommend-specialist.sh +57 -0
- package/.claude/skills/sprint-execution/SKILL.md +27 -0
- package/.claude/skills/sprint-execution/execute-sprint-task.sh +59 -0
- package/.claude/skills/sprint-execution/execute-sprint.sh +65 -0
- package/.claude/skills/sprint-planner/SKILL.md +37 -0
- package/.claude/skills/sprint-planner/plan-sprint.sh +85 -0
- package/.claude/skills/standardized-error-handling/SKILL.md +56 -0
- package/.claude/skills/standardized-error-handling/capture-agent-error.sh +87 -0
- package/.claude/skills/standardized-error-handling/test-error-handling.sh +166 -0
- package/.claude/skills/task-classifier/SKILL.md +94 -0
- package/.claude/skills/task-classifier/classify-task.sh +115 -0
- package/.claude/skills/validation-templates/SKILL.md +47 -0
- package/.claude/skills/validation-templates/content.json +38 -0
- package/.claude/skills/validation-templates/data.json +38 -0
- package/.claude/skills/validation-templates/design.json +38 -0
- package/.claude/skills/validation-templates/infrastructure.json +38 -0
- package/.claude/skills/validation-templates/research.json +38 -0
- package/.claude/skills/validation-templates/software.json +38 -0
- package/.claude/skills/webapp-testing/README.md +142 -0
- package/.claude/skills/webapp-testing/SCREENSHOT_NAMING_CONVENTION.md +547 -0
- package/.claude/skills/webapp-testing/SKILL.md +877 -0
- package/.claude/skills/webapp-testing/capture-screenshot.sh +238 -0
- package/.claude/skills/webapp-testing/cfn-loop-integration.sh +265 -0
- package/.claude/skills/webapp-testing/compare-screenshots.sh +199 -0
- package/.claude/skills/webapp-testing/init-storage.sh +150 -0
- package/.claude/skills/webapp-testing/set-baseline.sh +196 -0
- package/.claude/skills/webapp-testing/test-webapp-testing.sh +233 -0
- package/.claude/spawn-pattern-examples.md +3 -3
- package/CLAUDE.md +319 -45
- package/README.md +598 -251
- package/dist/agents/agent-loader.js +146 -165
- package/dist/agents/agent-loader.js.map +1 -1
- package/dist/cli/agent-command.js +2 -0
- package/dist/cli/agent-command.js.map +1 -1
- package/dist/cli/agent-definition-parser.js +7 -0
- package/dist/cli/agent-definition-parser.js.map +1 -1
- package/dist/cli/agent-executor.js +145 -11
- package/dist/cli/agent-executor.js.map +1 -1
- package/dist/cli/agent-prompt-builder.js +81 -1
- package/dist/cli/agent-prompt-builder.js.map +1 -1
- package/dist/cli/agent-spawn.js +10 -1
- package/dist/cli/agent-spawn.js.map +1 -1
- package/dist/cli/anthropic-client.js +192 -13
- package/dist/cli/anthropic-client.js.map +1 -1
- package/dist/cli/cfn-context.js +150 -0
- package/dist/cli/cfn-context.js.map +1 -1
- package/dist/cli/cfn-fork.js +159 -0
- package/dist/cli/cfn-fork.js.map +1 -0
- package/dist/cli/cli-agent-context.js +8 -3
- package/dist/cli/cli-agent-context.js.map +1 -1
- package/dist/cli/config-manager.js +109 -91
- package/dist/cli/config-manager.js.map +1 -1
- package/dist/cli/conversation-fork.js +201 -0
- package/dist/cli/conversation-fork.js.map +1 -0
- package/dist/cli/index.js +4 -0
- package/dist/cli/index.js.map +1 -1
- package/dist/cli/tool-definitions.js +263 -0
- package/dist/cli/tool-definitions.js.map +1 -0
- package/dist/cli/tool-executor.js +247 -0
- package/dist/cli/tool-executor.js.map +1 -0
- package/dist/hello.js +8 -0
- package/dist/hello.js.map +1 -0
- package/package.json +14 -6
- package/scripts/README.md +68 -0
- package/scripts/cfn-intervention-example.sh +21 -0
- package/scripts/migrate-test-infrastructure.sh +40 -0
- package/scripts/validate-test-migration.sh +49 -0
- package/scripts/verify-no-secrets.sh +55 -0
- package/.claude/agents/architecture/system-architect.md.backup +0 -603
- package/.claude/agents/code-booster.md +0 -131
- package/.claude/agents/consensus/performance-benchmarker.md +0 -101
- package/.claude/agents/consensus/security-manager.md +0 -107
- package/.claude/agents/context-curator.md +0 -167
- package/.claude/agents/context-reflector.md +0 -65
- package/.claude/agents/core-agents/cfn-loop-coordinator.md +0 -134
- package/.claude/agents/core-agents/code-quality-validator.md +0 -149
- package/.claude/agents/core-agents/context-curator.md +0 -452
- package/.claude/agents/core-agents/context-reflector.md +0 -273
- package/.claude/agents/core-agents/cost-savings-cfn-loop-coordinator.md +0 -235
- package/.claude/agents/core-agents/tester.md +0 -170
- package/.claude/agents/development/backend-dev.md +0 -165
- package/.claude/agents/devops/devops-engineer.md +0 -148
- package/.claude/agents/frontend/interaction-tester.md +0 -139
- package/.claude/agents/frontend/react-frontend-engineer.md +0 -9
- package/.claude/agents/personas/accessibility-advocate-persona.md +0 -107
- package/.claude/agents/testing/production-validator.md +0 -179
- package/.claude/agents/testing/tdd-london-swarm.md +0 -209
- package/.claude/agents/testing/unit/tdd-london-swarm.md +0 -43
- package/.claude/agents/testing/validation/production-validator.md +0 -43
- package/.claude/api-configs/config-current-zai-config.env +0 -62
- package/.claude/api-configs/config-test-zai-config.env +0 -62
- package/.claude/api-configs/env-backups/before-anthropic-20251020-025404.env +0 -62
- package/.claude/api-configs/env-backups/before-restore-20251020-025431.env +0 -62
- package/.claude/skills/redis-coordination/orchestrate-cfn-loop.sh.backup-1760949407 +0 -933
- package/dist/cli/cli-agent-context.test.js +0 -451
- package/dist/cli/cli-agent-context.test.js.map +0 -1
- package/dist/coordination/fleet-manager.test.js +0 -141
- package/dist/coordination/fleet-manager.test.js.map +0 -1
- package/dist/middleware/transparency-middleware.test.js +0 -184
- package/dist/middleware/transparency-middleware.test.js.map +0 -1
- /package/.claude/agents/{core-agents → developers}/researcher.md +0 -0
- /package/.claude/agents/{consensus → specialists}/crdt-synchronizer.md +0 -0
- /package/.claude/agents/{consensus → specialists}/quorum-manager.md +0 -0
- /package/.claude/agents/{consensus → specialists}/raft-manager.md +0 -0
- /package/.claude/{agents/core-agents → agents-ignore}/coordinator.md +0 -0
- /package/.claude/{agents/core-agents/cost-savings-coordinator.md → agents-ignore/cost-savings-coordinator.md.backup} +0 -0
- /package/.claude/skills/redis-coordination/{phase4-wake-queue-test-report.md → demos/phase4-wake-queue-test-report.md} +0 -0
- /package/.claude/skills/redis-coordination/{test-bzpopmin-fix.sh → demos/test-bzpopmin-fix.sh} +0 -0
- /package/.claude/skills/redis-coordination/{test-cancel-swarm.sh → demos/test-cancel-swarm.sh} +0 -0
- /package/.claude/skills/redis-coordination/{test-dlq.sh → demos/test-dlq.sh} +0 -0
- /package/.claude/skills/redis-coordination/{test-iteration-feedback.sh → demos/test-iteration-feedback.sh} +0 -0
- /package/.claude/skills/redis-coordination/{test-priority-wake-phase4-unix.sh → demos/test-priority-wake-phase4-unix.sh} +0 -0
- /package/.claude/skills/redis-coordination/{test-priority-wake-phase4.sh → demos/test-priority-wake-phase4.sh} +0 -0
- /package/.claude/skills/redis-coordination/{test-priority-wake.sh → demos/test-priority-wake.sh} +0 -0
- /package/.claude/skills/redis-coordination/{test-quick-fix.sh → demos/test-quick-fix.sh} +0 -0
- /package/.claude/skills/redis-coordination/{test-quorum-absolute.sh → demos/test-quorum-absolute.sh} +0 -0
- /package/.claude/skills/redis-coordination/{test-quorum-fallback.sh → demos/test-quorum-fallback.sh} +0 -0
- /package/.claude/skills/redis-coordination/{test-quorum-percentage.sh → demos/test-quorum-percentage.sh} +0 -0
- /package/.claude/skills/redis-coordination/{test-quorum-with-retry.sh → demos/test-quorum-with-retry.sh} +0 -0
- /package/.claude/skills/redis-coordination/{test-quorum.sh → demos/test-quorum.sh} +0 -0
- /package/.claude/skills/redis-coordination/{test-shutdown-handling.sh → demos/test-shutdown-handling.sh} +0 -0
- /package/.claude/skills/redis-coordination/{test-shutdown.sh → demos/test-shutdown.sh} +0 -0
- /package/.claude/skills/redis-coordination/{test-utils-unix.sh → demos/test-utils-unix.sh} +0 -0
- /package/.claude/skills/redis-coordination/{test-utils.sh → demos/test-utils.sh} +0 -0
- /package/.claude/skills/redis-coordination/{test-waiting-mode.sh → demos/test-waiting-mode.sh} +0 -0
|
@@ -0,0 +1,421 @@
|
|
|
1
|
+
# Loop 3 Output Processing Skill
|
|
2
|
+
|
|
3
|
+
**Version:** 1.0.0
|
|
4
|
+
**Status:** Production
|
|
5
|
+
**Purpose:** Guaranteed confidence extraction from Loop 3 implementer agents
|
|
6
|
+
|
|
7
|
+
---
|
|
8
|
+
|
|
9
|
+
## Overview
|
|
10
|
+
|
|
11
|
+
**Problem Solved:** Loop 3 agents (coders, researchers, developers) might document bash commands instead of executing them, leading to missing confidence scores.
|
|
12
|
+
|
|
13
|
+
**Solution:** Orchestrator-controlled output processing with:
|
|
14
|
+
- Multi-pattern confidence extraction
|
|
15
|
+
- Git-based deliverable verification
|
|
16
|
+
- Calculated confidence fallback
|
|
17
|
+
- Guaranteed Redis reporting
|
|
18
|
+
|
|
19
|
+
---
|
|
20
|
+
|
|
21
|
+
## Core Principle
|
|
22
|
+
|
|
23
|
+
```
|
|
24
|
+
Loop 3 Agents → Focus on implementation
|
|
25
|
+
This Skill → Extract confidence + verify deliverables
|
|
26
|
+
Orchestrator → Report to Redis + gate check
|
|
27
|
+
```
|
|
28
|
+
|
|
29
|
+
**Why This Works:**
|
|
30
|
+
- ✅ Agents implement features (what they do best)
|
|
31
|
+
- ✅ Skill extracts confidence (robust parsing)
|
|
32
|
+
- ✅ Orchestrator controls coordination (Redis state)
|
|
33
|
+
- ✅ No reliance on agent bash execution
|
|
34
|
+
|
|
35
|
+
---
|
|
36
|
+
|
|
37
|
+
## Architecture
|
|
38
|
+
|
|
39
|
+
### Processing Flow
|
|
40
|
+
|
|
41
|
+
```
|
|
42
|
+
1. Orchestrator spawns Loop 3 agent
|
|
43
|
+
2. Skill captures agent stdout/stderr
|
|
44
|
+
3. Skill parses confidence (multi-pattern)
|
|
45
|
+
4. Skill verifies deliverables (git status)
|
|
46
|
+
5. Skill calculates fallback confidence
|
|
47
|
+
6. Skill reports to Redis
|
|
48
|
+
7. Orchestrator uses for gate check
|
|
49
|
+
```
|
|
50
|
+
|
|
51
|
+
### Skill Components
|
|
52
|
+
|
|
53
|
+
```
|
|
54
|
+
.claude/skills/loop3-output-processing/
|
|
55
|
+
├── SKILL.md # This file
|
|
56
|
+
├── execute-and-extract.sh # Main wrapper script
|
|
57
|
+
├── parse-confidence.sh # Confidence pattern matching
|
|
58
|
+
├── verify-deliverables.sh # Git-based verification
|
|
59
|
+
├── calculate-confidence.sh # Fallback calculation
|
|
60
|
+
└── test-loop3-processing.sh # Integration tests
|
|
61
|
+
```
|
|
62
|
+
|
|
63
|
+
---
|
|
64
|
+
|
|
65
|
+
## Confidence Extraction Patterns
|
|
66
|
+
|
|
67
|
+
### Priority 1: Explicit Confidence Statement
|
|
68
|
+
```
|
|
69
|
+
Confidence: 0.85
|
|
70
|
+
confidence: 0.92
|
|
71
|
+
Confidence Score: 0.78
|
|
72
|
+
```
|
|
73
|
+
|
|
74
|
+
### Priority 2: Percentage Format
|
|
75
|
+
```
|
|
76
|
+
I'm 85% confident
|
|
77
|
+
Confidence: 92%
|
|
78
|
+
```
|
|
79
|
+
|
|
80
|
+
### Priority 3: Natural Language
|
|
81
|
+
```
|
|
82
|
+
I'm very confident (0.9)
|
|
83
|
+
High confidence: 0.85
|
|
84
|
+
```
|
|
85
|
+
|
|
86
|
+
### Priority 4: Calculated from Deliverables
|
|
87
|
+
```bash
|
|
88
|
+
# If no confidence found, calculate based on:
|
|
89
|
+
- Files created/modified (git status)
|
|
90
|
+
- Tests passing (if applicable)
|
|
91
|
+
- Build success (if applicable)
|
|
92
|
+
```
|
|
93
|
+
|
|
94
|
+
**Fallback Logic:**
|
|
95
|
+
- 0 files changed → 0.0
|
|
96
|
+
- 1-2 files, no tests → 0.50
|
|
97
|
+
- 3+ files, tests pass → 0.85
|
|
98
|
+
- Complete deliverables → 0.90
|
|
99
|
+
|
|
100
|
+
---
|
|
101
|
+
|
|
102
|
+
## Usage
|
|
103
|
+
|
|
104
|
+
### From Orchestrator
|
|
105
|
+
|
|
106
|
+
```bash
|
|
107
|
+
# Spawn Loop 3 agent with output processing
|
|
108
|
+
RESULT=$(./.claude/skills/loop3-output-processing/execute-and-extract.sh \
|
|
109
|
+
--agent-type "coder" \
|
|
110
|
+
--task-id "$TASK_ID" \
|
|
111
|
+
--agent-id "coder-1" \
|
|
112
|
+
--context "Implement authentication" \
|
|
113
|
+
--iteration 1)
|
|
114
|
+
|
|
115
|
+
CONFIDENCE=$(echo "$RESULT" | jq -r '.confidence')
|
|
116
|
+
FILES_CHANGED=$(echo "$RESULT" | jq -r '.files_changed')
|
|
117
|
+
DELIVERABLES=$(echo "$RESULT" | jq -r '.deliverables[]')
|
|
118
|
+
|
|
119
|
+
# Report to Redis (orchestrator does this, not agent)
|
|
120
|
+
redis-cli LPUSH "swarm:${TASK_ID}:coder-1:confidence" "$CONFIDENCE"
|
|
121
|
+
redis-cli LPUSH "swarm:${TASK_ID}:coder-1:done" "complete"
|
|
122
|
+
```
|
|
123
|
+
|
|
124
|
+
### Output Format
|
|
125
|
+
|
|
126
|
+
```json
|
|
127
|
+
{
|
|
128
|
+
"agent_id": "coder-1",
|
|
129
|
+
"confidence": 0.85,
|
|
130
|
+
"confidence_source": "explicit|calculated|fallback",
|
|
131
|
+
"files_changed": 5,
|
|
132
|
+
"deliverables": [
|
|
133
|
+
"src/auth/login.ts (A)",
|
|
134
|
+
"src/auth/register.ts (A)",
|
|
135
|
+
"tests/auth.test.ts (A)"
|
|
136
|
+
],
|
|
137
|
+
"tests_passed": true,
|
|
138
|
+
"iteration": 1,
|
|
139
|
+
"timestamp": "2025-10-20T15:30:00Z"
|
|
140
|
+
}
|
|
141
|
+
```
|
|
142
|
+
|
|
143
|
+
---
|
|
144
|
+
|
|
145
|
+
## Implementation
|
|
146
|
+
|
|
147
|
+
### execute-and-extract.sh
|
|
148
|
+
|
|
149
|
+
```bash
|
|
150
|
+
#!/bin/bash
|
|
151
|
+
set -euo pipefail
|
|
152
|
+
|
|
153
|
+
# Parse arguments
|
|
154
|
+
AGENT_TYPE=""
|
|
155
|
+
TASK_ID=""
|
|
156
|
+
AGENT_ID=""
|
|
157
|
+
CONTEXT=""
|
|
158
|
+
ITERATION=1
|
|
159
|
+
TIMEOUT=900
|
|
160
|
+
|
|
161
|
+
while [[ $# -gt 0 ]]; do
|
|
162
|
+
case $1 in
|
|
163
|
+
--agent-type) AGENT_TYPE="$2"; shift 2 ;;
|
|
164
|
+
--task-id) TASK_ID="$2"; shift 2 ;;
|
|
165
|
+
--agent-id) AGENT_ID="$2"; shift 2 ;;
|
|
166
|
+
--context) CONTEXT="$2"; shift 2 ;;
|
|
167
|
+
--iteration) ITERATION="$2"; shift 2 ;;
|
|
168
|
+
--timeout) TIMEOUT="$2"; shift 2 ;;
|
|
169
|
+
*) echo "Unknown: $1"; exit 1 ;;
|
|
170
|
+
esac
|
|
171
|
+
done
|
|
172
|
+
|
|
173
|
+
SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
|
|
174
|
+
|
|
175
|
+
# Capture git state before agent runs
|
|
176
|
+
BEFORE_GIT=$(git status --short)
|
|
177
|
+
|
|
178
|
+
# Spawn agent and capture output
|
|
179
|
+
AGENT_OUTPUT=$(timeout "$TIMEOUT" npx claude-flow-novice agent "$AGENT_TYPE" \
|
|
180
|
+
--task-id "$TASK_ID" \
|
|
181
|
+
--agent-id "$AGENT_ID" \
|
|
182
|
+
--context "$CONTEXT" 2>&1 || true)
|
|
183
|
+
|
|
184
|
+
# Capture git state after agent runs
|
|
185
|
+
AFTER_GIT=$(git status --short)
|
|
186
|
+
|
|
187
|
+
# Parse confidence from output
|
|
188
|
+
CONFIDENCE=$("$SCRIPT_DIR/parse-confidence.sh" "$AGENT_OUTPUT")
|
|
189
|
+
|
|
190
|
+
# Verify deliverables
|
|
191
|
+
DELIVERABLE_CHECK=$("$SCRIPT_DIR/verify-deliverables.sh" \
|
|
192
|
+
--before "$BEFORE_GIT" \
|
|
193
|
+
--after "$AFTER_GIT")
|
|
194
|
+
|
|
195
|
+
FILES_CHANGED=$(echo "$DELIVERABLE_CHECK" | jq -r '.files_changed')
|
|
196
|
+
DELIVERABLES=$(echo "$DELIVERABLE_CHECK" | jq -r '.deliverables')
|
|
197
|
+
|
|
198
|
+
# If confidence not found or too low, calculate fallback
|
|
199
|
+
if (( $(echo "$CONFIDENCE == 0.0" | bc -l) )) || [ -z "$CONFIDENCE" ]; then
|
|
200
|
+
CONFIDENCE=$("$SCRIPT_DIR/calculate-confidence.sh" \
|
|
201
|
+
--files-changed "$FILES_CHANGED" \
|
|
202
|
+
--deliverables "$DELIVERABLES")
|
|
203
|
+
CONFIDENCE_SOURCE="calculated"
|
|
204
|
+
elif (( $(echo "$CONFIDENCE > 0.0" | bc -l) )); then
|
|
205
|
+
CONFIDENCE_SOURCE="explicit"
|
|
206
|
+
else
|
|
207
|
+
CONFIDENCE_SOURCE="fallback"
|
|
208
|
+
fi
|
|
209
|
+
|
|
210
|
+
# Build output JSON
|
|
211
|
+
cat <<EOF
|
|
212
|
+
{
|
|
213
|
+
"agent_id": "$AGENT_ID",
|
|
214
|
+
"confidence": $CONFIDENCE,
|
|
215
|
+
"confidence_source": "$CONFIDENCE_SOURCE",
|
|
216
|
+
"files_changed": $FILES_CHANGED,
|
|
217
|
+
"deliverables": $DELIVERABLES,
|
|
218
|
+
"iteration": $ITERATION,
|
|
219
|
+
"timestamp": "$(date -u +%Y-%m-%dT%H:%M:%SZ)"
|
|
220
|
+
}
|
|
221
|
+
EOF
|
|
222
|
+
```
|
|
223
|
+
|
|
224
|
+
### parse-confidence.sh
|
|
225
|
+
|
|
226
|
+
```bash
|
|
227
|
+
#!/bin/bash
|
|
228
|
+
set -euo pipefail
|
|
229
|
+
|
|
230
|
+
OUTPUT="$1"
|
|
231
|
+
|
|
232
|
+
# Pattern 1: Explicit confidence (0.0-1.0)
|
|
233
|
+
if echo "$OUTPUT" | grep -oP '[Cc]onfidence[:\s]*([0-9.]+)' | grep -oP '([0-9.]+)' | head -1; then
|
|
234
|
+
exit 0
|
|
235
|
+
fi
|
|
236
|
+
|
|
237
|
+
# Pattern 2: Percentage (85%)
|
|
238
|
+
if PERCENT=$(echo "$OUTPUT" | grep -oP '([0-9]{1,3})%' | grep -oP '[0-9]+' | head -1); then
|
|
239
|
+
echo "scale=2; $PERCENT / 100" | bc
|
|
240
|
+
exit 0
|
|
241
|
+
fi
|
|
242
|
+
|
|
243
|
+
# Pattern 3: Natural language with score
|
|
244
|
+
if echo "$OUTPUT" | grep -oP '\(([0-9.]+)\)' | grep -oP '[0-9.]+' | head -1; then
|
|
245
|
+
exit 0
|
|
246
|
+
fi
|
|
247
|
+
|
|
248
|
+
# No confidence found
|
|
249
|
+
echo "0.0"
|
|
250
|
+
```
|
|
251
|
+
|
|
252
|
+
### verify-deliverables.sh
|
|
253
|
+
|
|
254
|
+
```bash
|
|
255
|
+
#!/bin/bash
|
|
256
|
+
set -euo pipefail
|
|
257
|
+
|
|
258
|
+
BEFORE=""
|
|
259
|
+
AFTER=""
|
|
260
|
+
|
|
261
|
+
while [[ $# -gt 0 ]]; do
|
|
262
|
+
case $1 in
|
|
263
|
+
--before) BEFORE="$2"; shift 2 ;;
|
|
264
|
+
--after) AFTER="$2"; shift 2 ;;
|
|
265
|
+
*) echo "Unknown: $1"; exit 1 ;;
|
|
266
|
+
esac
|
|
267
|
+
done
|
|
268
|
+
|
|
269
|
+
# Find new/modified files
|
|
270
|
+
CHANGED_FILES=$(comm -13 <(echo "$BEFORE" | sort) <(echo "$AFTER" | sort) || true)
|
|
271
|
+
FILE_COUNT=$(echo "$CHANGED_FILES" | grep -c '^' || echo "0")
|
|
272
|
+
|
|
273
|
+
# Build deliverables array
|
|
274
|
+
DELIVERABLES="["
|
|
275
|
+
FIRST=true
|
|
276
|
+
while IFS= read -r line; do
|
|
277
|
+
if [ -n "$line" ]; then
|
|
278
|
+
if [ "$FIRST" = true ]; then
|
|
279
|
+
FIRST=false
|
|
280
|
+
else
|
|
281
|
+
DELIVERABLES+=","
|
|
282
|
+
fi
|
|
283
|
+
DELIVERABLES+="\"$line\""
|
|
284
|
+
fi
|
|
285
|
+
done <<< "$CHANGED_FILES"
|
|
286
|
+
DELIVERABLES+="]"
|
|
287
|
+
|
|
288
|
+
# Output JSON
|
|
289
|
+
cat <<EOF
|
|
290
|
+
{
|
|
291
|
+
"files_changed": $FILE_COUNT,
|
|
292
|
+
"deliverables": $DELIVERABLES
|
|
293
|
+
}
|
|
294
|
+
EOF
|
|
295
|
+
```
|
|
296
|
+
|
|
297
|
+
### calculate-confidence.sh
|
|
298
|
+
|
|
299
|
+
```bash
|
|
300
|
+
#!/bin/bash
|
|
301
|
+
set -euo pipefail
|
|
302
|
+
|
|
303
|
+
FILES_CHANGED=0
|
|
304
|
+
DELIVERABLES="[]"
|
|
305
|
+
|
|
306
|
+
while [[ $# -gt 0 ]]; do
|
|
307
|
+
case $1 in
|
|
308
|
+
--files-changed) FILES_CHANGED="$2"; shift 2 ;;
|
|
309
|
+
--deliverables) DELIVERABLES="$2"; shift 2 ;;
|
|
310
|
+
*) echo "Unknown: $1"; exit 1 ;;
|
|
311
|
+
esac
|
|
312
|
+
done
|
|
313
|
+
|
|
314
|
+
# Calculate confidence based on deliverables
|
|
315
|
+
if (( FILES_CHANGED == 0 )); then
|
|
316
|
+
echo "0.0"
|
|
317
|
+
elif (( FILES_CHANGED <= 2 )); then
|
|
318
|
+
echo "0.50"
|
|
319
|
+
elif (( FILES_CHANGED <= 5 )); then
|
|
320
|
+
echo "0.75"
|
|
321
|
+
else
|
|
322
|
+
echo "0.85"
|
|
323
|
+
fi
|
|
324
|
+
```
|
|
325
|
+
|
|
326
|
+
---
|
|
327
|
+
|
|
328
|
+
## Benefits
|
|
329
|
+
|
|
330
|
+
| Aspect | Before (Template-Based) | After (Skill-Based) |
|
|
331
|
+
|--------|------------------------|---------------------|
|
|
332
|
+
| **Confidence Guarantee** | ❌ 0.0 if agent doesn't execute | ✅ Always calculated |
|
|
333
|
+
| **Deliverable Verification** | ❌ Agent-dependent | ✅ Git-based proof |
|
|
334
|
+
| **Parsing Robustness** | ❌ None | ✅ 4 fallback patterns |
|
|
335
|
+
| **Redis Coordination** | ❌ Agent reports (maybe) | ✅ Orchestrator reports |
|
|
336
|
+
| **Race Conditions** | ❌ Polling wait needed | ✅ Synchronous processing |
|
|
337
|
+
| **Testability** | ❌ Hard to test | ✅ Unit testable |
|
|
338
|
+
|
|
339
|
+
---
|
|
340
|
+
|
|
341
|
+
## Testing
|
|
342
|
+
|
|
343
|
+
### Unit Tests
|
|
344
|
+
|
|
345
|
+
```bash
|
|
346
|
+
# Test confidence parsing
|
|
347
|
+
./test-parse-confidence.sh
|
|
348
|
+
|
|
349
|
+
# Test deliverable verification
|
|
350
|
+
./test-verify-deliverables.sh
|
|
351
|
+
|
|
352
|
+
# Test confidence calculation
|
|
353
|
+
./test-calculate-confidence.sh
|
|
354
|
+
```
|
|
355
|
+
|
|
356
|
+
### Integration Test
|
|
357
|
+
|
|
358
|
+
```bash
|
|
359
|
+
# Test full Loop 3 processing
|
|
360
|
+
./test-loop3-processing.sh
|
|
361
|
+
```
|
|
362
|
+
|
|
363
|
+
**Expected Results:**
|
|
364
|
+
- ✅ Explicit confidence extracted correctly
|
|
365
|
+
- ✅ Percentage converted to decimal
|
|
366
|
+
- ✅ Fallback calculation works
|
|
367
|
+
- ✅ Deliverables verified via git
|
|
368
|
+
- ✅ JSON output valid
|
|
369
|
+
|
|
370
|
+
---
|
|
371
|
+
|
|
372
|
+
## Integration with Orchestrator
|
|
373
|
+
|
|
374
|
+
### Before (BUG #10 Pattern)
|
|
375
|
+
|
|
376
|
+
```bash
|
|
377
|
+
# Spawn agents, wait, poll for confidence
|
|
378
|
+
spawn_all_loop3_agents
|
|
379
|
+
sleep 5 # Hope agents report in time
|
|
380
|
+
CONFIDENCE=$(redis-cli LRANGE "swarm:${TASK_ID}:${AGENT_ID}:confidence" 0 0)
|
|
381
|
+
# Often 0.0 due to race condition
|
|
382
|
+
```
|
|
383
|
+
|
|
384
|
+
### After (Skill-Based)
|
|
385
|
+
|
|
386
|
+
```bash
|
|
387
|
+
# Process each agent with guaranteed extraction
|
|
388
|
+
for AGENT in $LOOP3_AGENTS; do
|
|
389
|
+
RESULT=$(./.claude/skills/loop3-output-processing/execute-and-extract.sh \
|
|
390
|
+
--agent-type "$AGENT" \
|
|
391
|
+
--task-id "$TASK_ID" \
|
|
392
|
+
--agent-id "${AGENT}-1")
|
|
393
|
+
|
|
394
|
+
CONFIDENCE=$(echo "$RESULT" | jq -r '.confidence')
|
|
395
|
+
redis-cli LPUSH "swarm:${TASK_ID}:${AGENT}-1:confidence" "$CONFIDENCE"
|
|
396
|
+
redis-cli LPUSH "swarm:${TASK_ID}:${AGENT}-1:done" "complete"
|
|
397
|
+
done
|
|
398
|
+
```
|
|
399
|
+
|
|
400
|
+
---
|
|
401
|
+
|
|
402
|
+
## Related Skills
|
|
403
|
+
|
|
404
|
+
- **Agent Output Processing** (`.claude/skills/agent-output-processing/SKILL.md`) - Universal pattern
|
|
405
|
+
- **Loop 2 Output Processing** (`.claude/skills/loop2-output-processing/SKILL.md`) - Validator skill
|
|
406
|
+
- **Redis Coordination** (`.claude/skills/redis-coordination/SKILL.md`) - State management
|
|
407
|
+
|
|
408
|
+
---
|
|
409
|
+
|
|
410
|
+
## Version History
|
|
411
|
+
|
|
412
|
+
### 1.0.0 (2025-10-20)
|
|
413
|
+
- Initial implementation
|
|
414
|
+
- Multi-pattern confidence extraction
|
|
415
|
+
- Git-based deliverable verification
|
|
416
|
+
- Fallback confidence calculation
|
|
417
|
+
- Integration with orchestrator
|
|
418
|
+
|
|
419
|
+
---
|
|
420
|
+
|
|
421
|
+
**Summary:** This skill guarantees confidence extraction from Loop 3 implementers by processing agent output with robust parsing, git-based verification, and fallback calculation. Eliminates BUG #10 race conditions.
|
|
@@ -0,0 +1,28 @@
|
|
|
1
|
+
#!/bin/bash
|
|
2
|
+
set -euo pipefail
|
|
3
|
+
|
|
4
|
+
FILES_CHANGED=0
|
|
5
|
+
DELIVERABLES="[]"
|
|
6
|
+
|
|
7
|
+
while [[ $# -gt 0 ]]; do
|
|
8
|
+
case $1 in
|
|
9
|
+
--files-changed) FILES_CHANGED="$2"; shift 2 ;;
|
|
10
|
+
--deliverables) DELIVERABLES="$2"; shift 2 ;;
|
|
11
|
+
*) echo "ERROR: Unknown parameter: $1" >&2; exit 1 ;;
|
|
12
|
+
esac
|
|
13
|
+
done
|
|
14
|
+
|
|
15
|
+
# Calculate confidence based on deliverables
|
|
16
|
+
if (( FILES_CHANGED == 0 )); then
|
|
17
|
+
# No files changed - agent did not deliver
|
|
18
|
+
echo "0.0"
|
|
19
|
+
elif (( FILES_CHANGED <= 2 )); then
|
|
20
|
+
# Minimal changes - low confidence
|
|
21
|
+
echo "0.50"
|
|
22
|
+
elif (( FILES_CHANGED <= 5 )); then
|
|
23
|
+
# Moderate changes - medium confidence
|
|
24
|
+
echo "0.75"
|
|
25
|
+
else
|
|
26
|
+
# Significant changes - high confidence
|
|
27
|
+
echo "0.85"
|
|
28
|
+
fi
|
|
@@ -0,0 +1,85 @@
|
|
|
1
|
+
#!/bin/bash
|
|
2
|
+
set -euo pipefail
|
|
3
|
+
|
|
4
|
+
# Parse arguments
|
|
5
|
+
AGENT_TYPE=""
|
|
6
|
+
TASK_ID=""
|
|
7
|
+
AGENT_ID=""
|
|
8
|
+
CONTEXT=""
|
|
9
|
+
ITERATION=1
|
|
10
|
+
TIMEOUT=900
|
|
11
|
+
|
|
12
|
+
while [[ $# -gt 0 ]]; do
|
|
13
|
+
case $1 in
|
|
14
|
+
--agent-type) AGENT_TYPE="$2"; shift 2 ;;
|
|
15
|
+
--task-id) TASK_ID="$2"; shift 2 ;;
|
|
16
|
+
--agent-id) AGENT_ID="$2"; shift 2 ;;
|
|
17
|
+
--context) CONTEXT="$2"; shift 2 ;;
|
|
18
|
+
--iteration) ITERATION="$2"; shift 2 ;;
|
|
19
|
+
--timeout) TIMEOUT="$2"; shift 2 ;;
|
|
20
|
+
*) echo "ERROR: Unknown parameter: $1" >&2; exit 1 ;;
|
|
21
|
+
esac
|
|
22
|
+
done
|
|
23
|
+
|
|
24
|
+
# Validate required parameters
|
|
25
|
+
if [ -z "$AGENT_TYPE" ] || [ -z "$TASK_ID" ] || [ -z "$AGENT_ID" ] || [ -z "$CONTEXT" ]; then
|
|
26
|
+
echo "ERROR: Missing required parameters" >&2
|
|
27
|
+
echo "Usage: $0 --agent-type TYPE --task-id ID --agent-id ID --context CONTEXT [--iteration N] [--timeout SECONDS]" >&2
|
|
28
|
+
exit 1
|
|
29
|
+
fi
|
|
30
|
+
|
|
31
|
+
SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
|
|
32
|
+
|
|
33
|
+
# Capture git state before agent runs
|
|
34
|
+
BEFORE_GIT=$(git status --short 2>/dev/null || echo "")
|
|
35
|
+
|
|
36
|
+
# Spawn agent and capture output
|
|
37
|
+
AGENT_OUTPUT=$(timeout "$TIMEOUT" npx claude-flow-novice agent "$AGENT_TYPE" \
|
|
38
|
+
--task-id "$TASK_ID" \
|
|
39
|
+
--agent-id "$AGENT_ID" \
|
|
40
|
+
--context "$CONTEXT" 2>&1 || true)
|
|
41
|
+
|
|
42
|
+
# Capture git state after agent runs
|
|
43
|
+
AFTER_GIT=$(git status --short 2>/dev/null || echo "")
|
|
44
|
+
|
|
45
|
+
# Parse confidence from output
|
|
46
|
+
CONFIDENCE=$("$SCRIPT_DIR/parse-confidence.sh" "$AGENT_OUTPUT")
|
|
47
|
+
|
|
48
|
+
# Verify deliverables
|
|
49
|
+
DELIVERABLE_CHECK=$("$SCRIPT_DIR/verify-deliverables.sh" \
|
|
50
|
+
--before "$BEFORE_GIT" \
|
|
51
|
+
--after "$AFTER_GIT")
|
|
52
|
+
|
|
53
|
+
FILES_CHANGED=$(echo "$DELIVERABLE_CHECK" | jq -r '.files_changed')
|
|
54
|
+
DELIVERABLES=$(echo "$DELIVERABLE_CHECK" | jq -r '.deliverables')
|
|
55
|
+
|
|
56
|
+
# If confidence not found or too low, calculate fallback
|
|
57
|
+
if (( $(echo "$CONFIDENCE == 0.0" | bc -l) )) || [ -z "$CONFIDENCE" ]; then
|
|
58
|
+
CONFIDENCE=$("$SCRIPT_DIR/calculate-confidence.sh" \
|
|
59
|
+
--files-changed "$FILES_CHANGED" \
|
|
60
|
+
--deliverables "$DELIVERABLES")
|
|
61
|
+
CONFIDENCE_SOURCE="calculated"
|
|
62
|
+
elif (( $(echo "$CONFIDENCE > 0.0" | bc -l) )); then
|
|
63
|
+
CONFIDENCE_SOURCE="explicit"
|
|
64
|
+
else
|
|
65
|
+
CONFIDENCE_SOURCE="fallback"
|
|
66
|
+
fi
|
|
67
|
+
|
|
68
|
+
# Build output JSON using jq to ensure proper formatting
|
|
69
|
+
jq -n \
|
|
70
|
+
--arg agent_id "$AGENT_ID" \
|
|
71
|
+
--argjson confidence "$CONFIDENCE" \
|
|
72
|
+
--arg confidence_source "$CONFIDENCE_SOURCE" \
|
|
73
|
+
--argjson files_changed "$FILES_CHANGED" \
|
|
74
|
+
--argjson deliverables "$DELIVERABLES" \
|
|
75
|
+
--arg iteration "$ITERATION" \
|
|
76
|
+
--arg timestamp "$(date -u +%Y-%m-%dT%H:%M:%SZ)" \
|
|
77
|
+
'{
|
|
78
|
+
agent_id: $agent_id,
|
|
79
|
+
confidence: $confidence,
|
|
80
|
+
confidence_source: $confidence_source,
|
|
81
|
+
files_changed: $files_changed,
|
|
82
|
+
deliverables: $deliverables,
|
|
83
|
+
iteration: ($iteration | tonumber),
|
|
84
|
+
timestamp: $timestamp
|
|
85
|
+
}'
|
|
@@ -0,0 +1,31 @@
|
|
|
1
|
+
#!/bin/bash
|
|
2
|
+
set -euo pipefail
|
|
3
|
+
|
|
4
|
+
OUTPUT="$1"
|
|
5
|
+
|
|
6
|
+
# Pattern 1: Explicit confidence (0.0-1.0)
|
|
7
|
+
if CONF=$(echo "$OUTPUT" | grep -oP '[Cc]onfidence[:\s]*([0-9.]+)' | grep -oP '([0-9.]+)' | head -1); then
|
|
8
|
+
echo "$CONF"
|
|
9
|
+
exit 0
|
|
10
|
+
fi
|
|
11
|
+
|
|
12
|
+
# Pattern 2: Percentage (85%)
|
|
13
|
+
if PERCENT=$(echo "$OUTPUT" | grep -oP '([0-9]{1,3})%' | grep -oP '[0-9]+' | head -1); then
|
|
14
|
+
echo "scale=2; $PERCENT / 100" | bc
|
|
15
|
+
exit 0
|
|
16
|
+
fi
|
|
17
|
+
|
|
18
|
+
# Pattern 3: Natural language with score in parentheses
|
|
19
|
+
if CONF=$(echo "$OUTPUT" | grep -oP '\(([0-9.]+)\)' | grep -oP '[0-9.]+' | head -1); then
|
|
20
|
+
echo "$CONF"
|
|
21
|
+
exit 0
|
|
22
|
+
fi
|
|
23
|
+
|
|
24
|
+
# Pattern 4: Score with colon
|
|
25
|
+
if CONF=$(echo "$OUTPUT" | grep -oP '[Ss]core[:\s]*([0-9.]+)' | grep -oP '([0-9.]+)' | head -1); then
|
|
26
|
+
echo "$CONF"
|
|
27
|
+
exit 0
|
|
28
|
+
fi
|
|
29
|
+
|
|
30
|
+
# No confidence found
|
|
31
|
+
echo "0.0"
|