moflo 4.8.31 → 4.8.33
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/package.json +13 -10
- package/src/@claude-flow/cli/dist/src/commands/doctor.js +1298 -1107
- package/src/@claude-flow/cli/dist/src/memory/memory-initializer.js +4 -7
- package/src/@claude-flow/cli/package.json +106 -106
- package/src/@claude-flow/neural/README.md +260 -0
- package/src/@claude-flow/neural/dist/algorithms/a2c.js +361 -0
- package/src/@claude-flow/neural/dist/algorithms/curiosity.js +392 -0
- package/src/@claude-flow/neural/dist/algorithms/decision-transformer.js +415 -0
- package/src/@claude-flow/neural/dist/algorithms/dqn.js +303 -0
- package/src/@claude-flow/neural/dist/algorithms/index.js +74 -0
- package/src/@claude-flow/neural/dist/algorithms/ppo.js +331 -0
- package/src/@claude-flow/neural/dist/algorithms/q-learning.js +259 -0
- package/src/@claude-flow/neural/dist/algorithms/sarsa.js +297 -0
- package/src/@claude-flow/neural/dist/application/index.js +7 -0
- package/src/@claude-flow/neural/dist/application/services/neural-application-service.js +161 -0
- package/src/@claude-flow/neural/dist/domain/entities/pattern.js +134 -0
- package/src/@claude-flow/neural/dist/domain/index.js +8 -0
- package/src/@claude-flow/neural/dist/domain/services/learning-service.js +195 -0
- package/src/@claude-flow/neural/dist/index.js +201 -0
- package/src/@claude-flow/neural/dist/modes/balanced.js +234 -0
- package/src/@claude-flow/neural/dist/modes/base.js +77 -0
- package/src/@claude-flow/neural/dist/modes/batch.js +316 -0
- package/src/@claude-flow/neural/dist/modes/edge.js +310 -0
- package/src/@claude-flow/neural/dist/modes/index.js +13 -0
- package/src/@claude-flow/neural/dist/modes/real-time.js +196 -0
- package/src/@claude-flow/neural/dist/modes/research.js +389 -0
- package/src/@claude-flow/neural/dist/pattern-learner.js +603 -0
- package/src/@claude-flow/neural/dist/reasoning-bank.js +993 -0
- package/src/@claude-flow/neural/dist/reasoningbank-adapter.js +463 -0
- package/src/@claude-flow/neural/dist/sona-integration.js +316 -0
- package/src/@claude-flow/neural/dist/sona-manager.js +695 -0
- package/src/@claude-flow/neural/dist/types.js +11 -0
- package/src/@claude-flow/neural/package.json +26 -0
- package/.claude/agents/browser/browser-agent.yaml +0 -182
- package/.claude/agents/database-specialist.yaml +0 -21
- package/.claude/agents/index.yaml +0 -17
- package/.claude/agents/project-coordinator.yaml +0 -15
- package/.claude/agents/python-specialist.yaml +0 -21
- package/.claude/agents/security-auditor.yaml +0 -20
- package/.claude/agents/typescript-specialist.yaml +0 -21
- package/.claude/checkpoints/1767754460.json +0 -8
- package/.claude/config/v3-dependency-optimization.json +0 -266
- package/.claude/config/v3-performance-targets.json +0 -251
- package/.claude/guidance/moflo-bootstrap.md +0 -129
- package/.claude/mcp.json +0 -13
- package/.claude/settings.json +0 -351
- package/.claude/settings.local.json +0 -18
- package/.claude/skills/agentdb-advanced/SKILL.md +0 -550
- package/.claude/skills/agentdb-learning/SKILL.md +0 -545
- package/.claude/skills/agentdb-memory-patterns/SKILL.md +0 -339
- package/.claude/skills/agentdb-optimization/SKILL.md +0 -509
- package/.claude/skills/agentdb-vector-search/SKILL.md +0 -339
- package/.claude/skills/browser/SKILL.md +0 -204
- package/.claude/skills/fl/SKILL.md +0 -583
- package/.claude/skills/flo/SKILL.md +0 -583
- package/.claude/skills/github-code-review/SKILL.md +0 -1140
- package/.claude/skills/github-multi-repo/SKILL.md +0 -874
- package/.claude/skills/github-project-management/SKILL.md +0 -1277
- package/.claude/skills/github-release-management/SKILL.md +0 -1081
- package/.claude/skills/github-workflow-automation/SKILL.md +0 -1065
- package/.claude/skills/hive-mind-advanced/SKILL.md +0 -712
- package/.claude/skills/hooks-automation/SKILL.md +0 -1201
- package/.claude/skills/pair-programming/SKILL.md +0 -1202
- package/.claude/skills/performance-analysis/SKILL.md +0 -563
- package/.claude/skills/reasoningbank-agentdb/SKILL.md +0 -446
- package/.claude/skills/reasoningbank-intelligence/SKILL.md +0 -201
- package/.claude/skills/skill-builder/SKILL.md +0 -910
- package/.claude/skills/sparc-methodology/SKILL.md +0 -1115
- package/.claude/skills/stream-chain/SKILL.md +0 -563
- package/.claude/skills/swarm-advanced/SKILL.md +0 -973
- package/.claude/skills/swarm-orchestration/SKILL.md +0 -179
- package/.claude/skills/v3-cli-modernization/SKILL.md +0 -872
- package/.claude/skills/v3-core-implementation/SKILL.md +0 -797
- package/.claude/skills/v3-ddd-architecture/SKILL.md +0 -442
- package/.claude/skills/v3-integration-deep/SKILL.md +0 -241
- package/.claude/skills/v3-mcp-optimization/SKILL.md +0 -777
- package/.claude/skills/v3-memory-unification/SKILL.md +0 -174
- package/.claude/skills/v3-performance-optimization/SKILL.md +0 -390
- package/.claude/skills/v3-security-overhaul/SKILL.md +0 -82
- package/.claude/skills/v3-swarm-coordination/SKILL.md +0 -340
- package/.claude/skills/verification-quality/SKILL.md +0 -649
- package/.claude/skills/worker-benchmarks/skill.md +0 -135
- package/.claude/skills/worker-integration/skill.md +0 -154
- package/.claude/workflow-state.json +0 -9
- package/src/@claude-flow/cli/dist/src/appliance/gguf-engine.d.ts +0 -91
- package/src/@claude-flow/cli/dist/src/appliance/ruvllm-bridge.d.ts +0 -102
- package/src/@claude-flow/cli/dist/src/appliance/rvfa-builder.d.ts +0 -44
- package/src/@claude-flow/cli/dist/src/appliance/rvfa-distribution.d.ts +0 -97
- package/src/@claude-flow/cli/dist/src/appliance/rvfa-format.d.ts +0 -111
- package/src/@claude-flow/cli/dist/src/appliance/rvfa-runner.d.ts +0 -69
- package/src/@claude-flow/cli/dist/src/appliance/rvfa-signing.d.ts +0 -123
- package/src/@claude-flow/cli/dist/src/benchmarks/pretrain/index.d.ts +0 -58
- package/src/@claude-flow/cli/dist/src/commands/agent.d.ts +0 -8
- package/src/@claude-flow/cli/dist/src/commands/analyze.d.ts +0 -19
- package/src/@claude-flow/cli/dist/src/commands/appliance-advanced.d.ts +0 -9
- package/src/@claude-flow/cli/dist/src/commands/appliance.d.ts +0 -8
- package/src/@claude-flow/cli/dist/src/commands/benchmark.d.ts +0 -10
- package/src/@claude-flow/cli/dist/src/commands/claims.d.ts +0 -10
- package/src/@claude-flow/cli/dist/src/commands/completions.d.ts +0 -10
- package/src/@claude-flow/cli/dist/src/commands/config.d.ts +0 -8
- package/src/@claude-flow/cli/dist/src/commands/daemon.d.ts +0 -8
- package/src/@claude-flow/cli/dist/src/commands/deployment.d.ts +0 -10
- package/src/@claude-flow/cli/dist/src/commands/diagnose.d.ts +0 -16
- package/src/@claude-flow/cli/dist/src/commands/doctor.d.ts +0 -10
- package/src/@claude-flow/cli/dist/src/commands/embeddings.d.ts +0 -18
- package/src/@claude-flow/cli/dist/src/commands/gate.d.ts +0 -23
- package/src/@claude-flow/cli/dist/src/commands/github.d.ts +0 -12
- package/src/@claude-flow/cli/dist/src/commands/guidance.d.ts +0 -8
- package/src/@claude-flow/cli/dist/src/commands/hive-mind.d.ts +0 -11
- package/src/@claude-flow/cli/dist/src/commands/hooks.d.ts +0 -8
- package/src/@claude-flow/cli/dist/src/commands/index.d.ts +0 -115
- package/src/@claude-flow/cli/dist/src/commands/init.d.ts +0 -8
- package/src/@claude-flow/cli/dist/src/commands/issues.d.ts +0 -21
- package/src/@claude-flow/cli/dist/src/commands/mcp.d.ts +0 -11
- package/src/@claude-flow/cli/dist/src/commands/memory.d.ts +0 -8
- package/src/@claude-flow/cli/dist/src/commands/migrate.d.ts +0 -8
- package/src/@claude-flow/cli/dist/src/commands/neural.d.ts +0 -10
- package/src/@claude-flow/cli/dist/src/commands/orc.d.ts +0 -21
- package/src/@claude-flow/cli/dist/src/commands/performance.d.ts +0 -10
- package/src/@claude-flow/cli/dist/src/commands/plugins.d.ts +0 -11
- package/src/@claude-flow/cli/dist/src/commands/process.d.ts +0 -10
- package/src/@claude-flow/cli/dist/src/commands/progress.d.ts +0 -11
- package/src/@claude-flow/cli/dist/src/commands/providers.d.ts +0 -10
- package/src/@claude-flow/cli/dist/src/commands/route.d.ts +0 -16
- package/src/@claude-flow/cli/dist/src/commands/ruvector/backup.d.ts +0 -11
- package/src/@claude-flow/cli/dist/src/commands/ruvector/benchmark.d.ts +0 -11
- package/src/@claude-flow/cli/dist/src/commands/ruvector/import.d.ts +0 -18
- package/src/@claude-flow/cli/dist/src/commands/ruvector/index.d.ts +0 -29
- package/src/@claude-flow/cli/dist/src/commands/ruvector/init.d.ts +0 -11
- package/src/@claude-flow/cli/dist/src/commands/ruvector/migrate.d.ts +0 -11
- package/src/@claude-flow/cli/dist/src/commands/ruvector/optimize.d.ts +0 -11
- package/src/@claude-flow/cli/dist/src/commands/ruvector/setup.d.ts +0 -18
- package/src/@claude-flow/cli/dist/src/commands/ruvector/status.d.ts +0 -11
- package/src/@claude-flow/cli/dist/src/commands/security.d.ts +0 -10
- package/src/@claude-flow/cli/dist/src/commands/session.d.ts +0 -8
- package/src/@claude-flow/cli/dist/src/commands/start.d.ts +0 -8
- package/src/@claude-flow/cli/dist/src/commands/status.d.ts +0 -8
- package/src/@claude-flow/cli/dist/src/commands/swarm.d.ts +0 -8
- package/src/@claude-flow/cli/dist/src/commands/task.d.ts +0 -8
- package/src/@claude-flow/cli/dist/src/commands/transfer-store.d.ts +0 -13
- package/src/@claude-flow/cli/dist/src/commands/update.d.ts +0 -8
- package/src/@claude-flow/cli/dist/src/commands/workflow.d.ts +0 -8
- package/src/@claude-flow/cli/dist/src/config/moflo-config.d.ts +0 -93
- package/src/@claude-flow/cli/dist/src/config-adapter.d.ts +0 -15
- package/src/@claude-flow/cli/dist/src/index.d.ts +0 -81
- package/src/@claude-flow/cli/dist/src/infrastructure/in-memory-repositories.d.ts +0 -68
- package/src/@claude-flow/cli/dist/src/init/claudemd-generator.d.ts +0 -30
- package/src/@claude-flow/cli/dist/src/init/executor.d.ts +0 -41
- package/src/@claude-flow/cli/dist/src/init/helpers-generator.d.ts +0 -51
- package/src/@claude-flow/cli/dist/src/init/index.d.ts +0 -13
- package/src/@claude-flow/cli/dist/src/init/mcp-generator.d.ts +0 -29
- package/src/@claude-flow/cli/dist/src/init/moflo-init.d.ts +0 -31
- package/src/@claude-flow/cli/dist/src/init/settings-generator.d.ts +0 -14
- package/src/@claude-flow/cli/dist/src/init/statusline-generator.d.ts +0 -28
- package/src/@claude-flow/cli/dist/src/init/types.d.ts +0 -285
- package/src/@claude-flow/cli/dist/src/mcp-client.d.ts +0 -92
- package/src/@claude-flow/cli/dist/src/mcp-server.d.ts +0 -161
- package/src/@claude-flow/cli/dist/src/mcp-tools/agent-tools.d.ts +0 -9
- package/src/@claude-flow/cli/dist/src/mcp-tools/agentdb-tools.d.ts +0 -30
- package/src/@claude-flow/cli/dist/src/mcp-tools/analyze-tools.d.ts +0 -38
- package/src/@claude-flow/cli/dist/src/mcp-tools/auto-install.d.ts +0 -83
- package/src/@claude-flow/cli/dist/src/mcp-tools/browser-tools.d.ts +0 -13
- package/src/@claude-flow/cli/dist/src/mcp-tools/claims-tools.d.ts +0 -12
- package/src/@claude-flow/cli/dist/src/mcp-tools/config-tools.d.ts +0 -8
- package/src/@claude-flow/cli/dist/src/mcp-tools/coordination-tools.d.ts +0 -13
- package/src/@claude-flow/cli/dist/src/mcp-tools/daa-tools.d.ts +0 -13
- package/src/@claude-flow/cli/dist/src/mcp-tools/embeddings-tools.d.ts +0 -9
- package/src/@claude-flow/cli/dist/src/mcp-tools/github-tools.d.ts +0 -13
- package/src/@claude-flow/cli/dist/src/mcp-tools/hive-mind-tools.d.ts +0 -8
- package/src/@claude-flow/cli/dist/src/mcp-tools/hooks-tools.d.ts +0 -44
- package/src/@claude-flow/cli/dist/src/mcp-tools/index.d.ts +0 -23
- package/src/@claude-flow/cli/dist/src/mcp-tools/memory-tools.d.ts +0 -14
- package/src/@claude-flow/cli/dist/src/mcp-tools/neural-tools.d.ts +0 -16
- package/src/@claude-flow/cli/dist/src/mcp-tools/performance-tools.d.ts +0 -16
- package/src/@claude-flow/cli/dist/src/mcp-tools/progress-tools.d.ts +0 -14
- package/src/@claude-flow/cli/dist/src/mcp-tools/security-tools.d.ts +0 -18
- package/src/@claude-flow/cli/dist/src/mcp-tools/session-tools.d.ts +0 -8
- package/src/@claude-flow/cli/dist/src/mcp-tools/swarm-tools.d.ts +0 -8
- package/src/@claude-flow/cli/dist/src/mcp-tools/system-tools.d.ts +0 -13
- package/src/@claude-flow/cli/dist/src/mcp-tools/task-tools.d.ts +0 -8
- package/src/@claude-flow/cli/dist/src/mcp-tools/terminal-tools.d.ts +0 -13
- package/src/@claude-flow/cli/dist/src/mcp-tools/transfer-tools.d.ts +0 -14
- package/src/@claude-flow/cli/dist/src/mcp-tools/types.d.ts +0 -31
- package/src/@claude-flow/cli/dist/src/mcp-tools/workflow-tools.d.ts +0 -8
- package/src/@claude-flow/cli/dist/src/memory/ewc-consolidation.d.ts +0 -271
- package/src/@claude-flow/cli/dist/src/memory/intelligence.d.ts +0 -285
- package/src/@claude-flow/cli/dist/src/memory/memory-bridge.d.ts +0 -413
- package/src/@claude-flow/cli/dist/src/memory/memory-initializer.d.ts +0 -405
- package/src/@claude-flow/cli/dist/src/memory/sona-optimizer.d.ts +0 -227
- package/src/@claude-flow/cli/dist/src/output.d.ts +0 -133
- package/src/@claude-flow/cli/dist/src/parser.d.ts +0 -51
- package/src/@claude-flow/cli/dist/src/plugins/manager.d.ts +0 -133
- package/src/@claude-flow/cli/dist/src/plugins/store/discovery.d.ts +0 -88
- package/src/@claude-flow/cli/dist/src/plugins/store/index.d.ts +0 -76
- package/src/@claude-flow/cli/dist/src/plugins/store/search.d.ts +0 -46
- package/src/@claude-flow/cli/dist/src/plugins/store/types.d.ts +0 -274
- package/src/@claude-flow/cli/dist/src/plugins/tests/demo-plugin-store.d.ts +0 -7
- package/src/@claude-flow/cli/dist/src/plugins/tests/standalone-test.d.ts +0 -12
- package/src/@claude-flow/cli/dist/src/plugins/tests/test-plugin-store.d.ts +0 -7
- package/src/@claude-flow/cli/dist/src/production/circuit-breaker.d.ts +0 -101
- package/src/@claude-flow/cli/dist/src/production/error-handler.d.ts +0 -92
- package/src/@claude-flow/cli/dist/src/production/index.d.ts +0 -23
- package/src/@claude-flow/cli/dist/src/production/monitoring.d.ts +0 -161
- package/src/@claude-flow/cli/dist/src/production/rate-limiter.d.ts +0 -80
- package/src/@claude-flow/cli/dist/src/production/retry.d.ts +0 -48
- package/src/@claude-flow/cli/dist/src/prompt.d.ts +0 -44
- package/src/@claude-flow/cli/dist/src/runtime/headless.d.ts +0 -60
- package/src/@claude-flow/cli/dist/src/ruvector/ast-analyzer.d.ts +0 -67
- package/src/@claude-flow/cli/dist/src/ruvector/coverage-router.d.ts +0 -160
- package/src/@claude-flow/cli/dist/src/ruvector/coverage-tools.d.ts +0 -33
- package/src/@claude-flow/cli/dist/src/ruvector/diff-classifier.d.ts +0 -175
- package/src/@claude-flow/cli/dist/src/ruvector/enhanced-model-router.d.ts +0 -146
- package/src/@claude-flow/cli/dist/src/ruvector/flash-attention.d.ts +0 -195
- package/src/@claude-flow/cli/dist/src/ruvector/graph-analyzer.d.ts +0 -187
- package/src/@claude-flow/cli/dist/src/ruvector/index.d.ts +0 -34
- package/src/@claude-flow/cli/dist/src/ruvector/lora-adapter.d.ts +0 -218
- package/src/@claude-flow/cli/dist/src/ruvector/model-router.d.ts +0 -220
- package/src/@claude-flow/cli/dist/src/ruvector/moe-router.d.ts +0 -206
- package/src/@claude-flow/cli/dist/src/ruvector/q-learning-router.d.ts +0 -211
- package/src/@claude-flow/cli/dist/src/ruvector/semantic-router.d.ts +0 -77
- package/src/@claude-flow/cli/dist/src/ruvector/vector-db.d.ts +0 -69
- package/src/@claude-flow/cli/dist/src/services/agent-router.d.ts +0 -63
- package/src/@claude-flow/cli/dist/src/services/agentic-flow-bridge.d.ts +0 -50
- package/src/@claude-flow/cli/dist/src/services/claim-service.d.ts +0 -204
- package/src/@claude-flow/cli/dist/src/services/container-worker-pool.d.ts +0 -197
- package/src/@claude-flow/cli/dist/src/services/daemon-lock.d.ts +0 -60
- package/src/@claude-flow/cli/dist/src/services/headless-worker-executor.d.ts +0 -304
- package/src/@claude-flow/cli/dist/src/services/index.d.ts +0 -13
- package/src/@claude-flow/cli/dist/src/services/learning-service.d.ts +0 -161
- package/src/@claude-flow/cli/dist/src/services/moflo-require.d.ts +0 -34
- package/src/@claude-flow/cli/dist/src/services/registry-api.d.ts +0 -58
- package/src/@claude-flow/cli/dist/src/services/ruvector-training.d.ts +0 -214
- package/src/@claude-flow/cli/dist/src/services/worker-daemon.d.ts +0 -225
- package/src/@claude-flow/cli/dist/src/services/worker-queue.d.ts +0 -194
- package/src/@claude-flow/cli/dist/src/services/workflow-gate.d.ts +0 -88
- package/src/@claude-flow/cli/dist/src/suggest.d.ts +0 -53
- package/src/@claude-flow/cli/dist/src/transfer/anonymization/index.d.ts +0 -25
- package/src/@claude-flow/cli/dist/src/transfer/deploy-seraphine.d.ts +0 -13
- package/src/@claude-flow/cli/dist/src/transfer/export.d.ts +0 -25
- package/src/@claude-flow/cli/dist/src/transfer/index.d.ts +0 -12
- package/src/@claude-flow/cli/dist/src/transfer/ipfs/client.d.ts +0 -109
- package/src/@claude-flow/cli/dist/src/transfer/ipfs/upload.d.ts +0 -95
- package/src/@claude-flow/cli/dist/src/transfer/models/seraphine.d.ts +0 -72
- package/src/@claude-flow/cli/dist/src/transfer/serialization/cfp.d.ts +0 -49
- package/src/@claude-flow/cli/dist/src/transfer/storage/gcs.d.ts +0 -82
- package/src/@claude-flow/cli/dist/src/transfer/storage/index.d.ts +0 -6
- package/src/@claude-flow/cli/dist/src/transfer/store/discovery.d.ts +0 -84
- package/src/@claude-flow/cli/dist/src/transfer/store/download.d.ts +0 -70
- package/src/@claude-flow/cli/dist/src/transfer/store/index.d.ts +0 -84
- package/src/@claude-flow/cli/dist/src/transfer/store/publish.d.ts +0 -76
- package/src/@claude-flow/cli/dist/src/transfer/store/registry.d.ts +0 -58
- package/src/@claude-flow/cli/dist/src/transfer/store/search.d.ts +0 -54
- package/src/@claude-flow/cli/dist/src/transfer/store/tests/standalone-test.d.ts +0 -12
- package/src/@claude-flow/cli/dist/src/transfer/store/types.d.ts +0 -193
- package/src/@claude-flow/cli/dist/src/transfer/test-seraphine.d.ts +0 -6
- package/src/@claude-flow/cli/dist/src/transfer/tests/test-store.d.ts +0 -7
- package/src/@claude-flow/cli/dist/src/transfer/types.d.ts +0 -245
- package/src/@claude-flow/cli/dist/src/types.d.ts +0 -198
- package/src/@claude-flow/cli/dist/src/update/checker.d.ts +0 -34
- package/src/@claude-flow/cli/dist/src/update/executor.d.ts +0 -32
- package/src/@claude-flow/cli/dist/src/update/index.d.ts +0 -33
- package/src/@claude-flow/cli/dist/src/update/rate-limiter.d.ts +0 -20
- package/src/@claude-flow/cli/dist/src/update/validator.d.ts +0 -17
- package/src/@claude-flow/guidance/dist/adversarial.d.ts +0 -284
- package/src/@claude-flow/guidance/dist/analyzer.d.ts +0 -530
- package/src/@claude-flow/guidance/dist/artifacts.d.ts +0 -283
- package/src/@claude-flow/guidance/dist/authority.d.ts +0 -290
- package/src/@claude-flow/guidance/dist/capabilities.d.ts +0 -209
- package/src/@claude-flow/guidance/dist/coherence.d.ts +0 -233
- package/src/@claude-flow/guidance/dist/compiler.d.ts +0 -87
- package/src/@claude-flow/guidance/dist/conformance-kit.d.ts +0 -225
- package/src/@claude-flow/guidance/dist/continue-gate.d.ts +0 -214
- package/src/@claude-flow/guidance/dist/crypto-utils.d.ts +0 -17
- package/src/@claude-flow/guidance/dist/evolution.d.ts +0 -282
- package/src/@claude-flow/guidance/dist/gates.d.ts +0 -79
- package/src/@claude-flow/guidance/dist/gateway.d.ts +0 -206
- package/src/@claude-flow/guidance/dist/generators.d.ts +0 -153
- package/src/@claude-flow/guidance/dist/headless.d.ts +0 -177
- package/src/@claude-flow/guidance/dist/hooks.d.ts +0 -109
- package/src/@claude-flow/guidance/dist/index.d.ts +0 -205
- package/src/@claude-flow/guidance/dist/ledger.d.ts +0 -162
- package/src/@claude-flow/guidance/dist/manifest-validator.d.ts +0 -289
- package/src/@claude-flow/guidance/dist/memory-gate.d.ts +0 -222
- package/src/@claude-flow/guidance/dist/meta-governance.d.ts +0 -265
- package/src/@claude-flow/guidance/dist/optimizer.d.ts +0 -104
- package/src/@claude-flow/guidance/dist/persistence.d.ts +0 -189
- package/src/@claude-flow/guidance/dist/proof.d.ts +0 -185
- package/src/@claude-flow/guidance/dist/retriever.d.ts +0 -116
- package/src/@claude-flow/guidance/dist/ruvbot-integration.d.ts +0 -370
- package/src/@claude-flow/guidance/dist/temporal.d.ts +0 -426
- package/src/@claude-flow/guidance/dist/trust.d.ts +0 -283
- package/src/@claude-flow/guidance/dist/truth-anchors.d.ts +0 -276
- package/src/@claude-flow/guidance/dist/types.d.ts +0 -378
- package/src/@claude-flow/guidance/dist/uncertainty.d.ts +0 -372
- package/src/@claude-flow/guidance/dist/wasm-kernel.d.ts +0 -48
- package/src/@claude-flow/memory/dist/agent-memory-scope.d.ts +0 -131
- package/src/@claude-flow/memory/dist/agent-memory-scope.test.d.ts +0 -8
- package/src/@claude-flow/memory/dist/agentdb-adapter.d.ts +0 -165
- package/src/@claude-flow/memory/dist/agentdb-backend.d.ts +0 -212
- package/src/@claude-flow/memory/dist/agentdb-backend.test.d.ts +0 -7
- package/src/@claude-flow/memory/dist/application/commands/delete-memory.command.d.ts +0 -65
- package/src/@claude-flow/memory/dist/application/commands/store-memory.command.d.ts +0 -48
- package/src/@claude-flow/memory/dist/application/index.d.ts +0 -12
- package/src/@claude-flow/memory/dist/application/queries/search-memory.query.d.ts +0 -72
- package/src/@claude-flow/memory/dist/application/services/memory-application-service.d.ts +0 -121
- package/src/@claude-flow/memory/dist/auto-memory-bridge.d.ts +0 -226
- package/src/@claude-flow/memory/dist/auto-memory-bridge.test.d.ts +0 -8
- package/src/@claude-flow/memory/dist/benchmark.test.d.ts +0 -2
- package/src/@claude-flow/memory/dist/cache-manager.d.ts +0 -134
- package/src/@claude-flow/memory/dist/controller-registry.d.ts +0 -216
- package/src/@claude-flow/memory/dist/controller-registry.test.d.ts +0 -14
- package/src/@claude-flow/memory/dist/database-provider.d.ts +0 -87
- package/src/@claude-flow/memory/dist/database-provider.test.d.ts +0 -7
- package/src/@claude-flow/memory/dist/domain/entities/memory-entry.d.ts +0 -143
- package/src/@claude-flow/memory/dist/domain/index.d.ts +0 -11
- package/src/@claude-flow/memory/dist/domain/repositories/memory-repository.interface.d.ts +0 -102
- package/src/@claude-flow/memory/dist/domain/services/memory-domain-service.d.ts +0 -105
- package/src/@claude-flow/memory/dist/hnsw-index.d.ts +0 -111
- package/src/@claude-flow/memory/dist/hnsw-lite.d.ts +0 -23
- package/src/@claude-flow/memory/dist/hybrid-backend.d.ts +0 -245
- package/src/@claude-flow/memory/dist/hybrid-backend.test.d.ts +0 -8
- package/src/@claude-flow/memory/dist/index.d.ts +0 -204
- package/src/@claude-flow/memory/dist/infrastructure/index.d.ts +0 -17
- package/src/@claude-flow/memory/dist/infrastructure/repositories/hybrid-memory-repository.d.ts +0 -66
- package/src/@claude-flow/memory/dist/learning-bridge.d.ts +0 -137
- package/src/@claude-flow/memory/dist/learning-bridge.test.d.ts +0 -8
- package/src/@claude-flow/memory/dist/memory-graph.d.ts +0 -100
- package/src/@claude-flow/memory/dist/memory-graph.test.d.ts +0 -8
- package/src/@claude-flow/memory/dist/migration.d.ts +0 -68
- package/src/@claude-flow/memory/dist/persistent-sona.d.ts +0 -144
- package/src/@claude-flow/memory/dist/query-builder.d.ts +0 -211
- package/src/@claude-flow/memory/dist/rvf-backend.d.ts +0 -51
- package/src/@claude-flow/memory/dist/rvf-learning-store.d.ts +0 -139
- package/src/@claude-flow/memory/dist/rvf-migration.d.ts +0 -45
- package/src/@claude-flow/memory/dist/sqlite-backend.d.ts +0 -121
- package/src/@claude-flow/memory/dist/sqljs-backend.d.ts +0 -127
- package/src/@claude-flow/memory/dist/types.d.ts +0 -484
- package/src/@claude-flow/shared/dist/core/config/defaults.d.ts +0 -41
- package/src/@claude-flow/shared/dist/core/config/index.d.ts +0 -8
- package/src/@claude-flow/shared/dist/core/config/loader.d.ts +0 -45
- package/src/@claude-flow/shared/dist/core/config/schema.d.ts +0 -1134
- package/src/@claude-flow/shared/dist/core/config/validator.d.ts +0 -92
- package/src/@claude-flow/shared/dist/core/event-bus.d.ts +0 -31
- package/src/@claude-flow/shared/dist/core/index.d.ts +0 -15
- package/src/@claude-flow/shared/dist/core/interfaces/agent.interface.d.ts +0 -200
- package/src/@claude-flow/shared/dist/core/interfaces/coordinator.interface.d.ts +0 -310
- package/src/@claude-flow/shared/dist/core/interfaces/event.interface.d.ts +0 -224
- package/src/@claude-flow/shared/dist/core/interfaces/index.d.ts +0 -10
- package/src/@claude-flow/shared/dist/core/interfaces/memory.interface.d.ts +0 -298
- package/src/@claude-flow/shared/dist/core/interfaces/task.interface.d.ts +0 -185
- package/src/@claude-flow/shared/dist/core/orchestrator/event-coordinator.d.ts +0 -35
- package/src/@claude-flow/shared/dist/core/orchestrator/health-monitor.d.ts +0 -60
- package/src/@claude-flow/shared/dist/core/orchestrator/index.d.ts +0 -46
- package/src/@claude-flow/shared/dist/core/orchestrator/lifecycle-manager.d.ts +0 -56
- package/src/@claude-flow/shared/dist/core/orchestrator/session-manager.d.ts +0 -83
- package/src/@claude-flow/shared/dist/core/orchestrator/task-manager.d.ts +0 -49
- package/src/@claude-flow/shared/dist/events/domain-events.d.ts +0 -282
- package/src/@claude-flow/shared/dist/events/event-store.d.ts +0 -126
- package/src/@claude-flow/shared/dist/events/event-store.test.d.ts +0 -8
- package/src/@claude-flow/shared/dist/events/example-usage.d.ts +0 -10
- package/src/@claude-flow/shared/dist/events/index.d.ts +0 -21
- package/src/@claude-flow/shared/dist/events/projections.d.ts +0 -177
- package/src/@claude-flow/shared/dist/events/rvf-event-log.d.ts +0 -82
- package/src/@claude-flow/shared/dist/events/state-reconstructor.d.ts +0 -101
- package/src/@claude-flow/shared/dist/events.d.ts +0 -80
- package/src/@claude-flow/shared/dist/hooks/example-usage.d.ts +0 -42
- package/src/@claude-flow/shared/dist/hooks/executor.d.ts +0 -100
- package/src/@claude-flow/shared/dist/hooks/hooks.test.d.ts +0 -9
- package/src/@claude-flow/shared/dist/hooks/index.d.ts +0 -52
- package/src/@claude-flow/shared/dist/hooks/registry.d.ts +0 -133
- package/src/@claude-flow/shared/dist/hooks/safety/bash-safety.d.ts +0 -105
- package/src/@claude-flow/shared/dist/hooks/safety/file-organization.d.ts +0 -144
- package/src/@claude-flow/shared/dist/hooks/safety/git-commit.d.ts +0 -158
- package/src/@claude-flow/shared/dist/hooks/safety/index.d.ts +0 -17
- package/src/@claude-flow/shared/dist/hooks/session-hooks.d.ts +0 -234
- package/src/@claude-flow/shared/dist/hooks/task-hooks.d.ts +0 -163
- package/src/@claude-flow/shared/dist/hooks/types.d.ts +0 -267
- package/src/@claude-flow/shared/dist/hooks/verify-exports.test.d.ts +0 -9
- package/src/@claude-flow/shared/dist/index.d.ts +0 -20
- package/src/@claude-flow/shared/dist/mcp/connection-pool.d.ts +0 -98
- package/src/@claude-flow/shared/dist/mcp/index.d.ts +0 -69
- package/src/@claude-flow/shared/dist/mcp/server.d.ts +0 -166
- package/src/@claude-flow/shared/dist/mcp/session-manager.d.ts +0 -136
- package/src/@claude-flow/shared/dist/mcp/tool-registry.d.ts +0 -178
- package/src/@claude-flow/shared/dist/mcp/transport/http.d.ts +0 -104
- package/src/@claude-flow/shared/dist/mcp/transport/index.d.ts +0 -102
- package/src/@claude-flow/shared/dist/mcp/transport/stdio.d.ts +0 -104
- package/src/@claude-flow/shared/dist/mcp/transport/websocket.d.ts +0 -133
- package/src/@claude-flow/shared/dist/mcp/types.d.ts +0 -438
- package/src/@claude-flow/shared/dist/plugin-interface.d.ts +0 -544
- package/src/@claude-flow/shared/dist/plugin-loader.d.ts +0 -139
- package/src/@claude-flow/shared/dist/plugin-registry.d.ts +0 -183
- package/src/@claude-flow/shared/dist/plugins/index.d.ts +0 -10
- package/src/@claude-flow/shared/dist/plugins/official/hive-mind-plugin.d.ts +0 -106
- package/src/@claude-flow/shared/dist/plugins/official/index.d.ts +0 -10
- package/src/@claude-flow/shared/dist/plugins/official/maestro-plugin.d.ts +0 -121
- package/src/@claude-flow/shared/dist/plugins/types.d.ts +0 -93
- package/src/@claude-flow/shared/dist/resilience/bulkhead.d.ts +0 -105
- package/src/@claude-flow/shared/dist/resilience/circuit-breaker.d.ts +0 -132
- package/src/@claude-flow/shared/dist/resilience/index.d.ts +0 -19
- package/src/@claude-flow/shared/dist/resilience/rate-limiter.d.ts +0 -168
- package/src/@claude-flow/shared/dist/resilience/retry.d.ts +0 -91
- package/src/@claude-flow/shared/dist/security/index.d.ts +0 -10
- package/src/@claude-flow/shared/dist/security/input-validation.d.ts +0 -73
- package/src/@claude-flow/shared/dist/security/secure-random.d.ts +0 -92
- package/src/@claude-flow/shared/dist/services/index.d.ts +0 -7
- package/src/@claude-flow/shared/dist/services/v3-progress.service.d.ts +0 -124
- package/src/@claude-flow/shared/dist/types/agent.types.d.ts +0 -137
- package/src/@claude-flow/shared/dist/types/index.d.ts +0 -11
- package/src/@claude-flow/shared/dist/types/mcp.types.d.ts +0 -266
- package/src/@claude-flow/shared/dist/types/memory.types.d.ts +0 -236
- package/src/@claude-flow/shared/dist/types/swarm.types.d.ts +0 -186
- package/src/@claude-flow/shared/dist/types/task.types.d.ts +0 -178
- package/src/@claude-flow/shared/dist/types.d.ts +0 -197
- package/src/@claude-flow/shared/dist/utils/secure-logger.d.ts +0 -69
|
@@ -0,0 +1,361 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Advantage Actor-Critic (A2C)
|
|
3
|
+
*
|
|
4
|
+
* Implements synchronous A2C algorithm with:
|
|
5
|
+
* - Shared actor-critic network
|
|
6
|
+
* - N-step returns
|
|
7
|
+
* - Entropy regularization
|
|
8
|
+
* - Advantage normalization
|
|
9
|
+
*
|
|
10
|
+
* Performance Target: <10ms per update step
|
|
11
|
+
*/
|
|
12
|
+
/**
 * Default A2C configuration.
 *
 * The A2CAlgorithm constructor spreads these values into a fresh object and
 * then applies the caller's overrides on top, so every instance owns its own
 * copy. The shared defaults are frozen so that an accidental write through
 * this export cannot silently change the defaults seen by later instances;
 * to customise a value, pass it to the constructor or spread this object
 * into a new one.
 */
export const DEFAULT_A2C_CONFIG = Object.freeze({
    algorithm: 'a2c',
    learningRate: 0.0007,
    gamma: 0.99,
    entropyCoef: 0.01,
    valueLossCoef: 0.5,
    maxGradNorm: 0.5,
    epochs: 1,
    miniBatchSize: 32,
    nSteps: 5,
    useGAE: true,
    gaeLambda: 0.95,
});
|
|
28
|
+
/**
 * A2C Algorithm Implementation
 *
 * A small actor-critic learner: one ReLU hidden layer shared by a softmax
 * policy head and a scalar value head. Experiences are buffered with
 * `addExperience()` and consumed in one batch by `update()`.
 */
export class A2CAlgorithm {
    config;
    // Shared network weights (indexed as [input * hiddenDim + hidden])
    sharedWeights;
    // Policy head weights (indexed as [hidden * numActions + action])
    policyHead;
    // Value head weights (one per hidden unit)
    valueHead;
    // Optimizer state: one momentum slot per weight
    sharedMomentum;
    policyMomentum;
    valueMomentum;
    // Experience buffer for n-step
    buffer = [];
    // Dimensions
    inputDim = 768;
    hiddenDim = 64;
    numActions = 4;
    // Statistics
    updateCount = 0;
    avgPolicyLoss = 0;
    avgValueLoss = 0;
    avgEntropy = 0;

    /**
     * @param {object} [config] - Overrides merged on top of DEFAULT_A2C_CONFIG.
     */
    constructor(config = {}) {
        this.config = { ...DEFAULT_A2C_CONFIG, ...config };
        // Initialize network with small random weights
        const scale = Math.sqrt(2 / this.inputDim);
        this.sharedWeights = new Float32Array(this.inputDim * this.hiddenDim);
        this.policyHead = new Float32Array(this.hiddenDim * this.numActions);
        this.valueHead = new Float32Array(this.hiddenDim);
        for (let i = 0; i < this.sharedWeights.length; i++) {
            this.sharedWeights[i] = (Math.random() - 0.5) * scale;
        }
        for (let i = 0; i < this.policyHead.length; i++) {
            this.policyHead[i] = (Math.random() - 0.5) * 0.1;
        }
        for (let i = 0; i < this.valueHead.length; i++) {
            this.valueHead[i] = (Math.random() - 0.5) * 0.1;
        }
        // Initialize momentum (zero-filled, same shapes as the weights)
        this.sharedMomentum = new Float32Array(this.sharedWeights.length);
        this.policyMomentum = new Float32Array(this.policyHead.length);
        this.valueMomentum = new Float32Array(this.valueHead.length);
    }

    /**
     * Add experience from trajectory.
     *
     * Each step's `stateAfter` is evaluated with the current network and the
     * step is pushed to the buffer together with the value estimate, the log
     * probability of the hashed action and the policy entropy.
     *
     * @param {{steps: Array<{stateAfter: ArrayLike<number>, action: string, reward: number}>}} trajectory
     */
    addExperience(trajectory) {
        for (const step of trajectory.steps) {
            const { probs, value, entropy } = this.evaluate(step.stateAfter);
            const action = this.hashAction(step.action);
            this.buffer.push({
                state: step.stateAfter,
                action,
                reward: step.reward,
                value,
                // 1e-8 keeps the log finite when the probability is 0
                logProb: Math.log(probs[action] + 1e-8),
                entropy,
            });
        }
    }

    /**
     * Perform A2C update over everything currently buffered, then clear the
     * buffer. Logs a warning when the update takes longer than 10ms.
     * Target: <10ms
     *
     * @returns {{policyLoss: number, valueLoss: number, entropy: number}}
     *   Per-experience averages for this batch; all zeros when the buffer is
     *   empty or holds fewer than `config.nSteps` experiences (no update is
     *   performed in that case).
     */
    update() {
        const startTime = performance.now();
        // Snapshot the batch size: the buffer is cleared before the
        // statistics are computed, so reading buffer.length later would be 0.
        const batchSize = this.buffer.length;
        // The explicit empty check prevents a divide-by-zero learning rate
        // (and NaN weights) when nSteps is configured as 0 or less.
        if (batchSize === 0 || batchSize < this.config.nSteps) {
            return { policyLoss: 0, valueLoss: 0, entropy: 0 };
        }
        // Compute returns and advantages
        const returns = this.computeReturns();
        const advantages = this.computeAdvantages(returns);
        // Initialize gradients
        const sharedGrad = new Float32Array(this.sharedWeights.length);
        const policyGrad = new Float32Array(this.policyHead.length);
        const valueGrad = new Float32Array(this.valueHead.length);
        let totalPolicyLoss = 0;
        let totalValueLoss = 0;
        let totalEntropy = 0;
        // Process all experiences
        for (let i = 0; i < batchSize; i++) {
            const exp = this.buffer[i];
            const advantage = advantages[i];
            // Re-run the network: weights may have changed since buffering
            const { probs, value, hidden } = this.forwardWithHidden(exp.state);
            const logProb = Math.log(probs[exp.action] + 1e-8);
            const valueError = value - returns[i];
            totalPolicyLoss += -logProb * advantage;
            totalValueLoss += valueError ** 2;
            totalEntropy += this.computeEntropy(probs);
            // Accumulate gradients
            this.accumulateGradients(sharedGrad, policyGrad, valueGrad, exp.state, hidden, exp.action, advantage, valueError);
        }
        // Add entropy bonus to policy gradient.
        // NOTE(review): this subtracts the same scalar from every policy
        // gradient entry rather than a per-weight entropy gradient; kept
        // as in the original implementation.
        const entropyShift = this.config.entropyCoef * totalEntropy / batchSize;
        for (let i = 0; i < policyGrad.length; i++) {
            policyGrad[i] -= entropyShift;
        }
        // Apply gradients
        this.applyGradients(sharedGrad, policyGrad, valueGrad, batchSize);
        // Clear buffer
        this.buffer = [];
        this.updateCount++;
        // `|| 0` maps a NaN average to 0
        this.avgPolicyLoss = totalPolicyLoss / batchSize || 0;
        this.avgValueLoss = totalValueLoss / batchSize || 0;
        this.avgEntropy = totalEntropy / batchSize || 0;
        const elapsed = performance.now() - startTime;
        if (elapsed > 10) {
            console.warn(`A2C update exceeded target: ${elapsed.toFixed(2)}ms > 10ms`);
        }
        return {
            policyLoss: this.avgPolicyLoss,
            valueLoss: this.avgValueLoss,
            entropy: this.avgEntropy,
        };
    }

    /**
     * Get action from policy: samples an action index from the softmax
     * distribution for `state`.
     *
     * @param {ArrayLike<number>} state
     * @returns {{action: number, value: number}} Sampled action index and the
     *   value estimate for the state.
     */
    getAction(state) {
        const { probs, value } = this.evaluate(state);
        const action = this.sampleAction(probs);
        return { action, value };
    }

    /**
     * Get statistics
     *
     * @returns {{updateCount: number, bufferSize: number, avgPolicyLoss: number, avgValueLoss: number, avgEntropy: number}}
     */
    getStats() {
        return {
            updateCount: this.updateCount,
            bufferSize: this.buffer.length,
            avgPolicyLoss: this.avgPolicyLoss,
            avgValueLoss: this.avgValueLoss,
            avgEntropy: this.avgEntropy,
        };
    }

    // ==========================================================================
    // Private Methods
    // ==========================================================================

    /**
     * Forward pass plus the entropy of the resulting action distribution.
     *
     * @param {ArrayLike<number>} state
     * @returns {{probs: Float32Array, value: number, entropy: number}}
     */
    evaluate(state) {
        const { probs, value } = this.forward(state);
        return { probs, value, entropy: this.computeEntropy(probs) };
    }

    /**
     * Forward pass returning only the policy distribution and value.
     *
     * @param {ArrayLike<number>} state
     * @returns {{probs: Float32Array, value: number}}
     */
    forward(state) {
        const { probs, value } = this.forwardWithHidden(state);
        return { probs, value };
    }

    /**
     * Forward pass that also exposes the hidden activations, which the
     * gradient computation needs.
     *
     * Only the first `min(state.length, inputDim)` entries of `state` are read.
     *
     * @param {ArrayLike<number>} state
     * @returns {{probs: Float32Array, value: number, hidden: Float32Array}}
     */
    forwardWithHidden(state) {
        const inputCount = Math.min(state.length, this.inputDim);
        // Shared hidden layer
        const hidden = new Float32Array(this.hiddenDim);
        for (let h = 0; h < this.hiddenDim; h++) {
            let sum = 0;
            for (let i = 0; i < inputCount; i++) {
                sum += state[i] * this.sharedWeights[i * this.hiddenDim + h];
            }
            hidden[h] = Math.max(0, sum); // ReLU
        }
        // Policy head
        const logits = new Float32Array(this.numActions);
        for (let a = 0; a < this.numActions; a++) {
            let sum = 0;
            for (let h = 0; h < this.hiddenDim; h++) {
                sum += hidden[h] * this.policyHead[h * this.numActions + a];
            }
            logits[a] = sum;
        }
        const probs = this.softmax(logits);
        // Value head
        let value = 0;
        for (let h = 0; h < this.hiddenDim; h++) {
            value += hidden[h] * this.valueHead[h];
        }
        return { probs, value, hidden };
    }

    /**
     * Shannon entropy (natural log) of a probability vector; zero or
     * negative entries are skipped.
     *
     * @param {ArrayLike<number>} probs
     * @returns {number}
     */
    computeEntropy(probs) {
        let entropy = 0;
        for (const p of probs) {
            if (p > 0) {
                entropy -= p * Math.log(p);
            }
        }
        return entropy;
    }

    /**
     * Discounted returns for the buffered experiences, computed backwards and
     * seeded with the value stored on the last buffered experience.
     *
     * @returns {number[]} One return per buffered experience.
     */
    computeReturns() {
        const returns = new Array(this.buffer.length).fill(0);
        let cumReturn = 0;
        // Bootstrap from last value if not terminal
        if (this.buffer.length > 0) {
            cumReturn = this.buffer[this.buffer.length - 1].value;
        }
        for (let t = this.buffer.length - 1; t >= 0; t--) {
            cumReturn = this.buffer[t].reward + this.config.gamma * cumReturn;
            returns[t] = cumReturn;
        }
        return returns;
    }

    /**
     * Normalized advantages for the buffered experiences. Uses GAE when
     * `config.useGAE` is set, otherwise `return - value`.
     *
     * @param {number[]} returns - Output of `computeReturns()`.
     * @returns {number[]}
     */
    computeAdvantages(returns) {
        if (this.config.useGAE) {
            return this.computeGAE();
        }
        // Simple advantage: return - value
        const advantages = this.buffer.map((exp, i) => returns[i] - exp.value);
        return this.normalizeAdvantages(advantages);
    }

    /**
     * Generalized advantage estimation over the buffer, normalized. The value
     * after the last buffered experience is taken as 0.
     *
     * @returns {number[]}
     */
    computeGAE() {
        const { gamma, gaeLambda } = this.config;
        const lastIndex = this.buffer.length - 1;
        const advantages = new Array(this.buffer.length).fill(0);
        let lastGae = 0;
        for (let t = lastIndex; t >= 0; t--) {
            const nextValue = t < lastIndex ? this.buffer[t + 1].value : 0;
            const delta = this.buffer[t].reward + gamma * nextValue - this.buffer[t].value;
            lastGae = delta + gamma * gaeLambda * lastGae;
            advantages[t] = lastGae;
        }
        return this.normalizeAdvantages(advantages);
    }

    /**
     * Shift to zero mean and scale by the population standard deviation.
     *
     * @param {number[]} advantages
     * @returns {number[]} A new array; the input is not modified.
     */
    normalizeAdvantages(advantages) {
        const count = advantages.length;
        const mean = advantages.reduce((acc, a) => acc + a, 0) / count;
        const variance = advantages.reduce((acc, a) => acc + (a - mean) ** 2, 0) / count;
        // 1e-8 avoids dividing by zero when all advantages are equal
        const std = Math.sqrt(variance) + 1e-8;
        return advantages.map((a) => (a - mean) / std);
    }

    /**
     * Add one experience's contribution to the three gradient accumulators.
     *
     * Gradients are accumulated in descent form (`applyGradients` subtracts
     * them), so the policy term carries a minus sign: the policy loss is
     * `-logProb * advantage`, and lowering it must raise the logit of an
     * action with positive advantage. Only the weights feeding the selected
     * action's logit are touched.
     *
     * @param {Float32Array} sharedGrad - Accumulator for the shared layer.
     * @param {Float32Array} policyGrad - Accumulator for the policy head.
     * @param {Float32Array} valueGrad - Accumulator for the value head.
     * @param {ArrayLike<number>} state - Input the experience was taken in.
     * @param {Float32Array} hidden - Hidden activations for `state`.
     * @param {number} action - Index of the action taken.
     * @param {number} advantage - Normalized advantage of the action.
     * @param {number} valueError - `value - return` for this experience.
     */
    accumulateGradients(sharedGrad, policyGrad, valueGrad, state, hidden, action, advantage, valueError) {
        const inputCount = Math.min(state.length, this.inputDim);
        const { valueLossCoef } = this.config;
        for (let h = 0; h < this.hiddenDim; h++) {
            const policyIndex = h * this.numActions + action;
            // Policy gradient (negative: see method comment)
            policyGrad[policyIndex] -= hidden[h] * advantage;
            // Value gradient
            valueGrad[h] += hidden[h] * valueError * valueLossCoef;
            // Shared layer gradient (backprop through both heads)
            if (hidden[h] > 0) { // ReLU gradient
                const policySignal = -advantage * this.policyHead[policyIndex];
                const valueSignal = valueError * this.valueHead[h] * valueLossCoef;
                const totalSignal = policySignal + valueSignal;
                for (let i = 0; i < inputCount; i++) {
                    sharedGrad[i * this.hiddenDim + h] += state[i] * totalSignal;
                }
            }
        }
    }

    /**
     * Apply the accumulated gradients with momentum (beta = 0.9). Each
     * gradient entry is clamped to `[-maxGradNorm, maxGradNorm]` and the
     * learning rate is divided by `batchSize`.
     *
     * @param {Float32Array} sharedGrad
     * @param {Float32Array} policyGrad
     * @param {Float32Array} valueGrad
     * @param {number} batchSize - Number of experiences the gradients sum over.
     */
    applyGradients(sharedGrad, policyGrad, valueGrad, batchSize) {
        const lr = this.config.learningRate / batchSize;
        const beta = 0.9;
        const limit = this.config.maxGradNorm;
        const step = (weights, momentum, grads) => {
            for (let i = 0; i < weights.length; i++) {
                const grad = Math.max(Math.min(grads[i], limit), -limit);
                momentum[i] = beta * momentum[i] + (1 - beta) * grad;
                weights[i] -= lr * momentum[i];
            }
        };
        // Apply to shared weights
        step(this.sharedWeights, this.sharedMomentum, sharedGrad);
        // Apply to policy head
        step(this.policyHead, this.policyMomentum, policyGrad);
        // Apply to value head
        step(this.valueHead, this.valueMomentum, valueGrad);
    }

    /**
     * Softmax; the maximum logit is subtracted before exponentiating.
     *
     * @param {Float32Array} logits
     * @returns {Float32Array} Probabilities, same length as `logits`.
     */
    softmax(logits) {
        const max = Math.max(...logits);
        const exps = new Float32Array(logits.length);
        let sum = 0;
        for (let i = 0; i < logits.length; i++) {
            exps[i] = Math.exp(logits[i] - max);
            sum += exps[i];
        }
        for (let i = 0; i < exps.length; i++) {
            exps[i] /= sum;
        }
        return exps;
    }

    /**
     * Sample an index from a probability vector by inverse CDF.
     *
     * @param {ArrayLike<number>} probs
     * @returns {number} Sampled index; falls back to the last index when the
     *   cumulative sum never exceeds the random draw.
     */
    sampleAction(probs) {
        const r = Math.random();
        let cumSum = 0;
        for (let i = 0; i < probs.length; i++) {
            cumSum += probs[i];
            if (r < cumSum) {
                return i;
            }
        }
        return probs.length - 1;
    }

    /**
     * Map an action string onto an action index in `[0, numActions)` with a
     * rolling base-31 hash of its UTF-16 code units.
     *
     * @param {string} action
     * @returns {number}
     */
    hashAction(action) {
        let hash = 0;
        for (let i = 0; i < action.length; i++) {
            hash = (hash * 31 + action.charCodeAt(i)) % this.numActions;
        }
        return hash;
    }
}
|
|
355
|
+
/**
 * Factory function: builds an A2C learner.
 *
 * @param {object} [config] - Passed unchanged to the A2CAlgorithm constructor.
 * @returns {A2CAlgorithm} The newly constructed instance.
 */
export function createA2C(config) {
    const learner = new A2CAlgorithm(config);
    return learner;
}
|
|
361
|
+
//# sourceMappingURL=a2c.js.map
|