jfl 0.4.4 → 0.6.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/commands/context-hub.d.ts +1 -0
- package/dist/commands/context-hub.d.ts.map +1 -1
- package/dist/commands/context-hub.js +1064 -41
- package/dist/commands/context-hub.js.map +1 -1
- package/dist/commands/eval.d.ts +1 -1
- package/dist/commands/eval.d.ts.map +1 -1
- package/dist/commands/eval.js +192 -1
- package/dist/commands/eval.js.map +1 -1
- package/dist/commands/findings.d.ts +6 -0
- package/dist/commands/findings.d.ts.map +1 -0
- package/dist/commands/findings.js +203 -0
- package/dist/commands/findings.js.map +1 -0
- package/dist/commands/hud.d.ts.map +1 -1
- package/dist/commands/hud.js +47 -9
- package/dist/commands/hud.js.map +1 -1
- package/dist/commands/ide.d.ts +27 -0
- package/dist/commands/ide.d.ts.map +1 -0
- package/dist/commands/ide.js +546 -0
- package/dist/commands/ide.js.map +1 -0
- package/dist/commands/onboard.d.ts.map +1 -1
- package/dist/commands/onboard.js +212 -2
- package/dist/commands/onboard.js.map +1 -1
- package/dist/commands/openclaw.d.ts +3 -0
- package/dist/commands/openclaw.d.ts.map +1 -1
- package/dist/commands/openclaw.js +76 -2
- package/dist/commands/openclaw.js.map +1 -1
- package/dist/commands/peter.d.ts +3 -0
- package/dist/commands/peter.d.ts.map +1 -1
- package/dist/commands/peter.js +1168 -58
- package/dist/commands/peter.js.map +1 -1
- package/dist/commands/pi-fleet.d.ts +18 -0
- package/dist/commands/pi-fleet.d.ts.map +1 -0
- package/dist/commands/pi-fleet.js +382 -0
- package/dist/commands/pi-fleet.js.map +1 -0
- package/dist/commands/pi.d.ts.map +1 -1
- package/dist/commands/pi.js +18 -3
- package/dist/commands/pi.js.map +1 -1
- package/dist/commands/scope.d.ts.map +1 -1
- package/dist/commands/scope.js +90 -1
- package/dist/commands/scope.js.map +1 -1
- package/dist/commands/services.d.ts.map +1 -1
- package/dist/commands/services.js +18 -0
- package/dist/commands/services.js.map +1 -1
- package/dist/commands/setup.d.ts +12 -0
- package/dist/commands/setup.d.ts.map +1 -0
- package/dist/commands/setup.js +322 -0
- package/dist/commands/setup.js.map +1 -0
- package/dist/commands/status.d.ts.map +1 -1
- package/dist/commands/status.js +22 -4
- package/dist/commands/status.js.map +1 -1
- package/dist/commands/train.d.ts +33 -0
- package/dist/commands/train.d.ts.map +1 -0
- package/dist/commands/train.js +510 -0
- package/dist/commands/train.js.map +1 -0
- package/dist/commands/verify.d.ts +14 -0
- package/dist/commands/verify.d.ts.map +1 -0
- package/dist/commands/verify.js +276 -0
- package/dist/commands/verify.js.map +1 -0
- package/dist/commands/viz.d.ts.map +1 -1
- package/dist/commands/viz.js +417 -0
- package/dist/commands/viz.js.map +1 -1
- package/dist/dashboard-static/assets/index-CW9ZxqX8.css +1 -0
- package/dist/dashboard-static/assets/index-DNN__p4K.js +121 -0
- package/dist/dashboard-static/index.html +2 -2
- package/dist/index.js +324 -64
- package/dist/index.js.map +1 -1
- package/dist/lib/agent-config.d.ts +52 -0
- package/dist/lib/agent-config.d.ts.map +1 -0
- package/dist/lib/agent-config.js +231 -0
- package/dist/lib/agent-config.js.map +1 -0
- package/dist/lib/agent-generator.d.ts +10 -0
- package/dist/lib/agent-generator.d.ts.map +1 -1
- package/dist/lib/agent-generator.js +64 -10
- package/dist/lib/agent-generator.js.map +1 -1
- package/dist/lib/agent-session.d.ts +104 -0
- package/dist/lib/agent-session.d.ts.map +1 -0
- package/dist/lib/agent-session.js +635 -0
- package/dist/lib/agent-session.js.map +1 -0
- package/dist/lib/eval-snapshot.d.ts +47 -0
- package/dist/lib/eval-snapshot.d.ts.map +1 -0
- package/dist/lib/eval-snapshot.js +315 -0
- package/dist/lib/eval-snapshot.js.map +1 -0
- package/dist/lib/eval-store.d.ts +5 -0
- package/dist/lib/eval-store.d.ts.map +1 -1
- package/dist/lib/eval-store.js +33 -3
- package/dist/lib/eval-store.js.map +1 -1
- package/dist/lib/findings-engine.d.ts +51 -0
- package/dist/lib/findings-engine.d.ts.map +1 -0
- package/dist/lib/findings-engine.js +338 -0
- package/dist/lib/findings-engine.js.map +1 -0
- package/dist/lib/flow-engine.d.ts +8 -0
- package/dist/lib/flow-engine.d.ts.map +1 -1
- package/dist/lib/flow-engine.js +84 -2
- package/dist/lib/flow-engine.js.map +1 -1
- package/dist/lib/hub-client.d.ts +1 -0
- package/dist/lib/hub-client.d.ts.map +1 -1
- package/dist/lib/hub-client.js +33 -6
- package/dist/lib/hub-client.js.map +1 -1
- package/dist/lib/ide-panes.d.ts +58 -0
- package/dist/lib/ide-panes.d.ts.map +1 -0
- package/dist/lib/ide-panes.js +508 -0
- package/dist/lib/ide-panes.js.map +1 -0
- package/dist/lib/memory-db.js +4 -4
- package/dist/lib/memory-db.js.map +1 -1
- package/dist/lib/memory-indexer.d.ts.map +1 -1
- package/dist/lib/memory-indexer.js +3 -0
- package/dist/lib/memory-indexer.js.map +1 -1
- package/dist/lib/memory-search.d.ts +148 -4
- package/dist/lib/memory-search.d.ts.map +1 -1
- package/dist/lib/memory-search.js +496 -58
- package/dist/lib/memory-search.js.map +1 -1
- package/dist/lib/meta-orchestrator.d.ts +104 -0
- package/dist/lib/meta-orchestrator.d.ts.map +1 -0
- package/dist/lib/meta-orchestrator.js +373 -0
- package/dist/lib/meta-orchestrator.js.map +1 -0
- package/dist/lib/peer-agent-generator.d.ts.map +1 -1
- package/dist/lib/peer-agent-generator.js +43 -19
- package/dist/lib/peer-agent-generator.js.map +1 -1
- package/dist/lib/pi-sky/bridge.d.ts +55 -0
- package/dist/lib/pi-sky/bridge.d.ts.map +1 -0
- package/dist/lib/pi-sky/bridge.js +264 -0
- package/dist/lib/pi-sky/bridge.js.map +1 -0
- package/dist/lib/pi-sky/cost-monitor.d.ts +21 -0
- package/dist/lib/pi-sky/cost-monitor.d.ts.map +1 -0
- package/dist/lib/pi-sky/cost-monitor.js +126 -0
- package/dist/lib/pi-sky/cost-monitor.js.map +1 -0
- package/dist/lib/pi-sky/eval-sweep.d.ts +27 -0
- package/dist/lib/pi-sky/eval-sweep.d.ts.map +1 -0
- package/dist/lib/pi-sky/eval-sweep.js +141 -0
- package/dist/lib/pi-sky/eval-sweep.js.map +1 -0
- package/dist/lib/pi-sky/event-router.d.ts +32 -0
- package/dist/lib/pi-sky/event-router.d.ts.map +1 -0
- package/dist/lib/pi-sky/event-router.js +176 -0
- package/dist/lib/pi-sky/event-router.js.map +1 -0
- package/dist/lib/pi-sky/experiment.d.ts +9 -0
- package/dist/lib/pi-sky/experiment.d.ts.map +1 -0
- package/dist/lib/pi-sky/experiment.js +83 -0
- package/dist/lib/pi-sky/experiment.js.map +1 -0
- package/dist/lib/pi-sky/index.d.ts +16 -0
- package/dist/lib/pi-sky/index.d.ts.map +1 -0
- package/dist/lib/pi-sky/index.js +16 -0
- package/dist/lib/pi-sky/index.js.map +1 -0
- package/dist/lib/pi-sky/stratus-gate.d.ts +28 -0
- package/dist/lib/pi-sky/stratus-gate.d.ts.map +1 -0
- package/dist/lib/pi-sky/stratus-gate.js +61 -0
- package/dist/lib/pi-sky/stratus-gate.js.map +1 -0
- package/dist/lib/pi-sky/swarm.d.ts +28 -0
- package/dist/lib/pi-sky/swarm.d.ts.map +1 -0
- package/dist/lib/pi-sky/swarm.js +208 -0
- package/dist/lib/pi-sky/swarm.js.map +1 -0
- package/dist/lib/pi-sky/types.d.ts +139 -0
- package/dist/lib/pi-sky/types.d.ts.map +1 -0
- package/dist/lib/pi-sky/types.js +2 -0
- package/dist/lib/pi-sky/types.js.map +1 -0
- package/dist/lib/pi-sky/voice-bridge.d.ts +20 -0
- package/dist/lib/pi-sky/voice-bridge.d.ts.map +1 -0
- package/dist/lib/pi-sky/voice-bridge.js +91 -0
- package/dist/lib/pi-sky/voice-bridge.js.map +1 -0
- package/dist/lib/policy-head.d.ts +40 -0
- package/dist/lib/policy-head.d.ts.map +1 -0
- package/dist/lib/policy-head.js +234 -0
- package/dist/lib/policy-head.js.map +1 -0
- package/dist/lib/predictor.d.ts +10 -0
- package/dist/lib/predictor.d.ts.map +1 -1
- package/dist/lib/predictor.js +46 -7
- package/dist/lib/predictor.js.map +1 -1
- package/dist/lib/replay-buffer.d.ts +93 -0
- package/dist/lib/replay-buffer.d.ts.map +1 -0
- package/dist/lib/replay-buffer.js +302 -0
- package/dist/lib/replay-buffer.js.map +1 -0
- package/dist/lib/sentinel-rl.d.ts +97 -0
- package/dist/lib/sentinel-rl.d.ts.map +1 -0
- package/dist/lib/sentinel-rl.js +430 -0
- package/dist/lib/sentinel-rl.js.map +1 -0
- package/dist/lib/session-lock.d.ts +61 -0
- package/dist/lib/session-lock.d.ts.map +1 -0
- package/dist/lib/session-lock.js +438 -0
- package/dist/lib/session-lock.js.map +1 -0
- package/dist/lib/setup/agent-generator.d.ts +18 -0
- package/dist/lib/setup/agent-generator.d.ts.map +1 -0
- package/dist/lib/setup/agent-generator.js +114 -0
- package/dist/lib/setup/agent-generator.js.map +1 -0
- package/dist/lib/setup/context-analyzer.d.ts +16 -0
- package/dist/lib/setup/context-analyzer.d.ts.map +1 -0
- package/dist/lib/setup/context-analyzer.js +112 -0
- package/dist/lib/setup/context-analyzer.js.map +1 -0
- package/dist/lib/setup/doc-auditor.d.ts +54 -0
- package/dist/lib/setup/doc-auditor.d.ts.map +1 -0
- package/dist/lib/setup/doc-auditor.js +629 -0
- package/dist/lib/setup/doc-auditor.js.map +1 -0
- package/dist/lib/setup/domain-generator.d.ts +7 -0
- package/dist/lib/setup/domain-generator.d.ts.map +1 -0
- package/dist/lib/setup/domain-generator.js +58 -0
- package/dist/lib/setup/domain-generator.js.map +1 -0
- package/dist/lib/setup/smart-eval-generator.d.ts +38 -0
- package/dist/lib/setup/smart-eval-generator.d.ts.map +1 -0
- package/dist/lib/setup/smart-eval-generator.js +378 -0
- package/dist/lib/setup/smart-eval-generator.js.map +1 -0
- package/dist/lib/setup/smart-recommender.d.ts +63 -0
- package/dist/lib/setup/smart-recommender.d.ts.map +1 -0
- package/dist/lib/setup/smart-recommender.js +329 -0
- package/dist/lib/setup/smart-recommender.js.map +1 -0
- package/dist/lib/setup/spec-generator.d.ts +63 -0
- package/dist/lib/setup/spec-generator.d.ts.map +1 -0
- package/dist/lib/setup/spec-generator.js +310 -0
- package/dist/lib/setup/spec-generator.js.map +1 -0
- package/dist/lib/setup/violation-agent-generator.d.ts +32 -0
- package/dist/lib/setup/violation-agent-generator.d.ts.map +1 -0
- package/dist/lib/setup/violation-agent-generator.js +255 -0
- package/dist/lib/setup/violation-agent-generator.js.map +1 -0
- package/dist/lib/stratus-client.d.ts +1 -0
- package/dist/lib/stratus-client.d.ts.map +1 -1
- package/dist/lib/stratus-client.js +24 -2
- package/dist/lib/stratus-client.js.map +1 -1
- package/dist/lib/telemetry-agent-v2.d.ts +128 -0
- package/dist/lib/telemetry-agent-v2.d.ts.map +1 -0
- package/dist/lib/telemetry-agent-v2.js +1042 -0
- package/dist/lib/telemetry-agent-v2.js.map +1 -0
- package/dist/lib/telemetry-agent.d.ts.map +1 -1
- package/dist/lib/telemetry-agent.js +27 -6
- package/dist/lib/telemetry-agent.js.map +1 -1
- package/dist/lib/telemetry-digest.d.ts.map +1 -1
- package/dist/lib/telemetry-digest.js +27 -5
- package/dist/lib/telemetry-digest.js.map +1 -1
- package/dist/lib/telemetry.d.ts.map +1 -1
- package/dist/lib/telemetry.js +29 -4
- package/dist/lib/telemetry.js.map +1 -1
- package/dist/lib/text-preprocessing.d.ts +83 -0
- package/dist/lib/text-preprocessing.d.ts.map +1 -0
- package/dist/lib/text-preprocessing.js +261 -0
- package/dist/lib/text-preprocessing.js.map +1 -0
- package/dist/lib/training-buffer.d.ts +86 -0
- package/dist/lib/training-buffer.d.ts.map +1 -0
- package/dist/lib/training-buffer.js +139 -0
- package/dist/lib/training-buffer.js.map +1 -0
- package/dist/lib/tuple-miner.d.ts +30 -0
- package/dist/lib/tuple-miner.d.ts.map +1 -0
- package/dist/lib/tuple-miner.js +427 -0
- package/dist/lib/tuple-miner.js.map +1 -0
- package/dist/lib/vm-backend.d.ts +72 -0
- package/dist/lib/vm-backend.d.ts.map +1 -0
- package/dist/lib/vm-backend.js +175 -0
- package/dist/lib/vm-backend.js.map +1 -0
- package/dist/lib/workspace/backend.d.ts +53 -0
- package/dist/lib/workspace/backend.d.ts.map +1 -0
- package/dist/lib/workspace/backend.js +37 -0
- package/dist/lib/workspace/backend.js.map +1 -0
- package/dist/lib/workspace/cmux-adapter.d.ts +46 -0
- package/dist/lib/workspace/cmux-adapter.d.ts.map +1 -0
- package/dist/lib/workspace/cmux-adapter.js +261 -0
- package/dist/lib/workspace/cmux-adapter.js.map +1 -0
- package/dist/lib/workspace/data-pipeline.d.ts +35 -0
- package/dist/lib/workspace/data-pipeline.d.ts.map +1 -0
- package/dist/lib/workspace/data-pipeline.js +463 -0
- package/dist/lib/workspace/data-pipeline.js.map +1 -0
- package/dist/lib/workspace/engine.d.ts +64 -0
- package/dist/lib/workspace/engine.d.ts.map +1 -0
- package/dist/lib/workspace/engine.js +397 -0
- package/dist/lib/workspace/engine.js.map +1 -0
- package/dist/lib/workspace/notifications.d.ts +14 -0
- package/dist/lib/workspace/notifications.d.ts.map +1 -0
- package/dist/lib/workspace/notifications.js +41 -0
- package/dist/lib/workspace/notifications.js.map +1 -0
- package/dist/lib/workspace/surface-registry.d.ts +49 -0
- package/dist/lib/workspace/surface-registry.d.ts.map +1 -0
- package/dist/lib/workspace/surface-registry.js +217 -0
- package/dist/lib/workspace/surface-registry.js.map +1 -0
- package/dist/lib/workspace/surface-type.d.ts +153 -0
- package/dist/lib/workspace/surface-type.d.ts.map +1 -0
- package/dist/lib/workspace/surface-type.js +9 -0
- package/dist/lib/workspace/surface-type.js.map +1 -0
- package/dist/lib/workspace/surfaces/agent-overview.d.ts +16 -0
- package/dist/lib/workspace/surfaces/agent-overview.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/agent-overview.js +116 -0
- package/dist/lib/workspace/surfaces/agent-overview.js.map +1 -0
- package/dist/lib/workspace/surfaces/agent.d.ts +16 -0
- package/dist/lib/workspace/surfaces/agent.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/agent.js +112 -0
- package/dist/lib/workspace/surfaces/agent.js.map +1 -0
- package/dist/lib/workspace/surfaces/claude.d.ts +15 -0
- package/dist/lib/workspace/surfaces/claude.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/claude.js +23 -0
- package/dist/lib/workspace/surfaces/claude.js.map +1 -0
- package/dist/lib/workspace/surfaces/dashboard.d.ts +21 -0
- package/dist/lib/workspace/surfaces/dashboard.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/dashboard.js +32 -0
- package/dist/lib/workspace/surfaces/dashboard.js.map +1 -0
- package/dist/lib/workspace/surfaces/eval.d.ts +15 -0
- package/dist/lib/workspace/surfaces/eval.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/eval.js +42 -0
- package/dist/lib/workspace/surfaces/eval.js.map +1 -0
- package/dist/lib/workspace/surfaces/event-stream.d.ts +16 -0
- package/dist/lib/workspace/surfaces/event-stream.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/event-stream.js +40 -0
- package/dist/lib/workspace/surfaces/event-stream.js.map +1 -0
- package/dist/lib/workspace/surfaces/flow.d.ts +16 -0
- package/dist/lib/workspace/surfaces/flow.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/flow.js +49 -0
- package/dist/lib/workspace/surfaces/flow.js.map +1 -0
- package/dist/lib/workspace/surfaces/index.d.ts +16 -0
- package/dist/lib/workspace/surfaces/index.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/index.js +16 -0
- package/dist/lib/workspace/surfaces/index.js.map +1 -0
- package/dist/lib/workspace/surfaces/portfolio.d.ts +16 -0
- package/dist/lib/workspace/surfaces/portfolio.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/portfolio.js +102 -0
- package/dist/lib/workspace/surfaces/portfolio.js.map +1 -0
- package/dist/lib/workspace/surfaces/service.d.ts +16 -0
- package/dist/lib/workspace/surfaces/service.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/service.js +45 -0
- package/dist/lib/workspace/surfaces/service.js.map +1 -0
- package/dist/lib/workspace/surfaces/shell.d.ts +15 -0
- package/dist/lib/workspace/surfaces/shell.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/shell.js +19 -0
- package/dist/lib/workspace/surfaces/shell.js.map +1 -0
- package/dist/lib/workspace/surfaces/telemetry.d.ts +16 -0
- package/dist/lib/workspace/surfaces/telemetry.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/telemetry.js +48 -0
- package/dist/lib/workspace/surfaces/telemetry.js.map +1 -0
- package/dist/lib/workspace/surfaces/topology.d.ts +15 -0
- package/dist/lib/workspace/surfaces/topology.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/topology.js +19 -0
- package/dist/lib/workspace/surfaces/topology.js.map +1 -0
- package/dist/lib/workspace/surfaces/training.d.ts +16 -0
- package/dist/lib/workspace/surfaces/training.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/training.js +22 -0
- package/dist/lib/workspace/surfaces/training.js.map +1 -0
- package/dist/lib/workspace/tmux-adapter.d.ts +27 -0
- package/dist/lib/workspace/tmux-adapter.d.ts.map +1 -0
- package/dist/lib/workspace/tmux-adapter.js +106 -0
- package/dist/lib/workspace/tmux-adapter.js.map +1 -0
- package/dist/mcp/context-hub-mcp.js +7 -24
- package/dist/mcp/context-hub-mcp.js.map +1 -1
- package/dist/types/flows.d.ts +2 -0
- package/dist/types/flows.d.ts.map +1 -1
- package/dist/types/ide.d.ts +49 -0
- package/dist/types/ide.d.ts.map +1 -0
- package/dist/types/ide.js +5 -0
- package/dist/types/ide.js.map +1 -0
- package/dist/types/platform-digest.d.ts +228 -0
- package/dist/types/platform-digest.d.ts.map +1 -0
- package/dist/types/platform-digest.js +5 -0
- package/dist/types/platform-digest.js.map +1 -0
- package/dist/types/telemetry-digest.d.ts +2 -0
- package/dist/types/telemetry-digest.d.ts.map +1 -1
- package/dist/utils/ensure-project.d.ts +1 -0
- package/dist/utils/ensure-project.d.ts.map +1 -1
- package/dist/utils/ensure-project.js +19 -7
- package/dist/utils/ensure-project.js.map +1 -1
- package/dist/utils/jfl-config.d.ts +1 -0
- package/dist/utils/jfl-config.d.ts.map +1 -1
- package/dist/utils/jfl-config.js +19 -1
- package/dist/utils/jfl-config.js.map +1 -1
- package/dist/utils/jfl-paths.d.ts +5 -0
- package/dist/utils/jfl-paths.d.ts.map +1 -1
- package/dist/utils/jfl-paths.js +25 -3
- package/dist/utils/jfl-paths.js.map +1 -1
- package/package.json +3 -2
- package/packages/pi/AGENTS.md +112 -0
- package/packages/pi/extensions/agent-grid.ts +191 -0
- package/packages/pi/extensions/agent-names.ts +178 -0
- package/packages/pi/extensions/autoresearch.ts +427 -0
- package/packages/pi/extensions/bookmarks.ts +85 -0
- package/packages/pi/extensions/context.ts +184 -0
- package/packages/pi/extensions/crm-tool.ts +61 -0
- package/packages/pi/extensions/eval-tool.ts +224 -0
- package/packages/pi/extensions/eval.ts +60 -0
- package/packages/pi/extensions/footer.ts +239 -0
- package/packages/pi/extensions/hub-resolver.ts +63 -0
- package/packages/pi/extensions/hud-tool.ts +145 -0
- package/packages/pi/extensions/index.ts +405 -0
- package/packages/pi/extensions/journal.ts +224 -0
- package/packages/pi/extensions/map-bridge.ts +178 -0
- package/packages/pi/extensions/memory-tool.ts +73 -0
- package/packages/pi/extensions/notifications.ts +73 -0
- package/packages/pi/extensions/peter-parker.ts +202 -0
- package/packages/pi/extensions/policy-head-tool.ts +276 -0
- package/packages/pi/extensions/portfolio-bridge.ts +90 -0
- package/packages/pi/extensions/session.ts +142 -0
- package/packages/pi/extensions/shortcuts.ts +259 -0
- package/packages/pi/extensions/stratus-bridge.ts +115 -0
- package/packages/pi/extensions/synopsis-tool.ts +83 -0
- package/packages/pi/extensions/tool-renderers.ts +353 -0
- package/packages/pi/extensions/training-buffer-tool.ts +368 -0
- package/packages/pi/extensions/types.ts +163 -0
- package/packages/pi/package-lock.json +346 -0
- package/packages/pi/package.json +44 -0
- package/packages/pi/skills/agent-browser/SKILL.md +116 -0
- package/packages/pi/skills/brand-architect/SKILL.md +240 -0
- package/packages/pi/skills/brand-architect/config.yaml +137 -0
- package/packages/pi/skills/campaign-hud/config.yaml +112 -0
- package/packages/pi/skills/content-creator/SKILL.md +294 -0
- package/packages/pi/skills/context/SKILL.md +65 -0
- package/packages/pi/skills/debug/MULTI_AGENT.md +360 -0
- package/packages/pi/skills/debug/SKILL.md +554 -0
- package/packages/pi/skills/end/SKILL.md +1782 -0
- package/packages/pi/skills/eval/SKILL.md +75 -0
- package/packages/pi/skills/fly-deploy/SKILL.md +676 -0
- package/packages/pi/skills/founder-video/SKILL.md +467 -0
- package/packages/pi/skills/hud/SKILL.md +160 -0
- package/packages/pi/skills/orchestrate/SKILL.md +74 -0
- package/packages/pi/skills/pi-agents/SKILL.md +78 -0
- package/packages/pi/skills/react-best-practices/AGENTS.md +2249 -0
- package/packages/pi/skills/react-best-practices/README.md +123 -0
- package/packages/pi/skills/react-best-practices/SKILL.md +125 -0
- package/packages/pi/skills/react-best-practices/metadata.json +15 -0
- package/packages/pi/skills/react-best-practices/rules/_sections.md +46 -0
- package/packages/pi/skills/react-best-practices/rules/_template.md +28 -0
- package/packages/pi/skills/react-best-practices/rules/advanced-event-handler-refs.md +55 -0
- package/packages/pi/skills/react-best-practices/rules/advanced-use-latest.md +49 -0
- package/packages/pi/skills/react-best-practices/rules/async-api-routes.md +38 -0
- package/packages/pi/skills/react-best-practices/rules/async-defer-await.md +80 -0
- package/packages/pi/skills/react-best-practices/rules/async-dependencies.md +36 -0
- package/packages/pi/skills/react-best-practices/rules/async-parallel.md +28 -0
- package/packages/pi/skills/react-best-practices/rules/async-suspense-boundaries.md +99 -0
- package/packages/pi/skills/react-best-practices/rules/bundle-barrel-imports.md +59 -0
- package/packages/pi/skills/react-best-practices/rules/bundle-conditional.md +31 -0
- package/packages/pi/skills/react-best-practices/rules/bundle-defer-third-party.md +49 -0
- package/packages/pi/skills/react-best-practices/rules/bundle-dynamic-imports.md +35 -0
- package/packages/pi/skills/react-best-practices/rules/bundle-preload.md +50 -0
- package/packages/pi/skills/react-best-practices/rules/client-event-listeners.md +74 -0
- package/packages/pi/skills/react-best-practices/rules/client-swr-dedup.md +56 -0
- package/packages/pi/skills/react-best-practices/rules/js-batch-dom-css.md +82 -0
- package/packages/pi/skills/react-best-practices/rules/js-cache-function-results.md +80 -0
- package/packages/pi/skills/react-best-practices/rules/js-cache-property-access.md +28 -0
- package/packages/pi/skills/react-best-practices/rules/js-cache-storage.md +70 -0
- package/packages/pi/skills/react-best-practices/rules/js-combine-iterations.md +32 -0
- package/packages/pi/skills/react-best-practices/rules/js-early-exit.md +50 -0
- package/packages/pi/skills/react-best-practices/rules/js-hoist-regexp.md +45 -0
- package/packages/pi/skills/react-best-practices/rules/js-index-maps.md +37 -0
- package/packages/pi/skills/react-best-practices/rules/js-length-check-first.md +49 -0
- package/packages/pi/skills/react-best-practices/rules/js-min-max-loop.md +82 -0
- package/packages/pi/skills/react-best-practices/rules/js-set-map-lookups.md +24 -0
- package/packages/pi/skills/react-best-practices/rules/js-tosorted-immutable.md +57 -0
- package/packages/pi/skills/react-best-practices/rules/rendering-activity.md +26 -0
- package/packages/pi/skills/react-best-practices/rules/rendering-animate-svg-wrapper.md +47 -0
- package/packages/pi/skills/react-best-practices/rules/rendering-conditional-render.md +40 -0
- package/packages/pi/skills/react-best-practices/rules/rendering-content-visibility.md +38 -0
- package/packages/pi/skills/react-best-practices/rules/rendering-hoist-jsx.md +46 -0
- package/packages/pi/skills/react-best-practices/rules/rendering-hydration-no-flicker.md +82 -0
- package/packages/pi/skills/react-best-practices/rules/rendering-svg-precision.md +28 -0
- package/packages/pi/skills/react-best-practices/rules/rerender-defer-reads.md +39 -0
- package/packages/pi/skills/react-best-practices/rules/rerender-dependencies.md +45 -0
- package/packages/pi/skills/react-best-practices/rules/rerender-derived-state.md +29 -0
- package/packages/pi/skills/react-best-practices/rules/rerender-functional-setstate.md +74 -0
- package/packages/pi/skills/react-best-practices/rules/rerender-lazy-state-init.md +58 -0
- package/packages/pi/skills/react-best-practices/rules/rerender-memo.md +44 -0
- package/packages/pi/skills/react-best-practices/rules/rerender-transitions.md +40 -0
- package/packages/pi/skills/react-best-practices/rules/server-after-nonblocking.md +73 -0
- package/packages/pi/skills/react-best-practices/rules/server-cache-lru.md +41 -0
- package/packages/pi/skills/react-best-practices/rules/server-cache-react.md +26 -0
- package/packages/pi/skills/react-best-practices/rules/server-parallel-fetching.md +79 -0
- package/packages/pi/skills/react-best-practices/rules/server-serialization.md +38 -0
- package/packages/pi/skills/remotion-best-practices/SKILL.md +43 -0
- package/packages/pi/skills/remotion-best-practices/rules/3d.md +86 -0
- package/packages/pi/skills/remotion-best-practices/rules/animations.md +29 -0
- package/packages/pi/skills/remotion-best-practices/rules/assets/charts-bar-chart.tsx +173 -0
- package/packages/pi/skills/remotion-best-practices/rules/assets/text-animations-typewriter.tsx +100 -0
- package/packages/pi/skills/remotion-best-practices/rules/assets/text-animations-word-highlight.tsx +108 -0
- package/packages/pi/skills/remotion-best-practices/rules/assets.md +78 -0
- package/packages/pi/skills/remotion-best-practices/rules/audio.md +172 -0
- package/packages/pi/skills/remotion-best-practices/rules/calculate-metadata.md +104 -0
- package/packages/pi/skills/remotion-best-practices/rules/can-decode.md +75 -0
- package/packages/pi/skills/remotion-best-practices/rules/charts.md +58 -0
- package/packages/pi/skills/remotion-best-practices/rules/compositions.md +146 -0
- package/packages/pi/skills/remotion-best-practices/rules/display-captions.md +126 -0
- package/packages/pi/skills/remotion-best-practices/rules/extract-frames.md +229 -0
- package/packages/pi/skills/remotion-best-practices/rules/fonts.md +152 -0
- package/packages/pi/skills/remotion-best-practices/rules/get-audio-duration.md +58 -0
- package/packages/pi/skills/remotion-best-practices/rules/get-video-dimensions.md +68 -0
- package/packages/pi/skills/remotion-best-practices/rules/get-video-duration.md +58 -0
- package/packages/pi/skills/remotion-best-practices/rules/gifs.md +138 -0
- package/packages/pi/skills/remotion-best-practices/rules/images.md +130 -0
- package/packages/pi/skills/remotion-best-practices/rules/import-srt-captions.md +67 -0
- package/packages/pi/skills/remotion-best-practices/rules/lottie.md +68 -0
- package/packages/pi/skills/remotion-best-practices/rules/measuring-dom-nodes.md +35 -0
- package/packages/pi/skills/remotion-best-practices/rules/measuring-text.md +143 -0
- package/packages/pi/skills/remotion-best-practices/rules/sequencing.md +106 -0
- package/packages/pi/skills/remotion-best-practices/rules/tailwind.md +11 -0
- package/packages/pi/skills/remotion-best-practices/rules/text-animations.md +20 -0
- package/packages/pi/skills/remotion-best-practices/rules/timing.md +179 -0
- package/packages/pi/skills/remotion-best-practices/rules/transcribe-captions.md +19 -0
- package/packages/pi/skills/remotion-best-practices/rules/transitions.md +122 -0
- package/packages/pi/skills/remotion-best-practices/rules/trimming.md +53 -0
- package/packages/pi/skills/remotion-best-practices/rules/videos.md +171 -0
- package/packages/pi/skills/search/SKILL.md +220 -0
- package/packages/pi/skills/spec/SKILL.md +377 -0
- package/packages/pi/skills/startup/SKILL.md +315 -0
- package/packages/pi/skills/web-architect/SKILL.md +309 -0
- package/packages/pi/skills/x-algorithm/SKILL.md +305 -0
- package/packages/pi/teams/dev-team.yaml +63 -0
- package/packages/pi/teams/gtm-team.yaml +79 -0
- package/packages/pi/themes/jfl.theme.json +76 -0
- package/packages/pi/tsconfig.json +21 -0
- package/scripts/collect-tuples.sh +124 -0
- package/scripts/destroy-fleet.sh +37 -0
- package/scripts/jfl-ide.sh +48 -0
- package/scripts/session/session-cleanup.sh +4 -11
- package/scripts/session/session-init.sh +6 -0
- package/scripts/session/session-sync.sh +25 -0
- package/scripts/setup-branch-protection.sh +106 -0
- package/scripts/spawn-fleet.sh +144 -0
- package/scripts/train/requirements.txt +5 -0
- package/scripts/train/train-policy-head.py +477 -0
- package/scripts/train/v2/dataset.py +81 -0
- package/scripts/train/v2/domain.json +18 -0
- package/scripts/train/v2/eval.py +196 -0
- package/scripts/train/v2/generate_data.py +219 -0
- package/scripts/train/v2/infer.py +188 -0
- package/scripts/train/v2/model.py +112 -0
- package/scripts/train/v2/precompute.py +132 -0
- package/scripts/train/v2/train.py +302 -0
- package/scripts/train/v2/transform_buffer.py +227 -0
- package/scripts/train/v2/validate_data.py +115 -0
- package/scripts/train-policy-head.py +434 -0
- package/scripts/vm-swarm/README.md +301 -0
- package/scripts/vm-swarm/collect-tuples.sh +331 -0
- package/scripts/vm-swarm/create-base-template.sh +339 -0
- package/scripts/vm-swarm/kill-fleet.sh +204 -0
- package/scripts/vm-swarm/monitor-fleet.sh +346 -0
- package/scripts/vm-swarm/spawn-fleet.sh +304 -0
- package/template/.claude/settings.json +2 -15
- package/template/.github/workflows/jfl-eval.yml +6 -1
- package/template/.github/workflows/jfl-review.yml +4 -0
- package/template/scripts/session/session-cleanup.sh +2 -11
- package/template/scripts/session/session-end-hub.sh +72 -0
- package/template/scripts/session/session-end.sh +69 -6
- package/template/scripts/session/session-init.sh +55 -30
- package/template/scripts/session/session-lock.sh +464 -0
- package/template/scripts/session/session-start-hub.sh +105 -0
- package/template/templates/service-agent/workflows/jfl-eval.yml +19 -0
- package/dist/dashboard-static/assets/index-B6kRK9Rq.js +0 -116
- package/dist/dashboard-static/assets/index-BpdKJPLu.css +0 -1
|
@@ -0,0 +1,434 @@
|
|
|
1
|
+
#!/usr/bin/env python3
|
|
2
|
+
"""
|
|
3
|
+
Train policy head from training buffer tuples.
|
|
4
|
+
|
|
5
|
+
Reads .jfl/training-buffer.jsonl, embeds via Stratus, trains a 768→256→256→1
|
|
6
|
+
Q-network that predicts reward given (state_embedding, action_embedding).
|
|
7
|
+
|
|
8
|
+
Usage:
|
|
9
|
+
python3 scripts/train-policy-head.py [--buffer PATH] [--epochs N] [--lr RATE]
|
|
10
|
+
|
|
11
|
+
STRATUS_API_KEY must be set in environment.
|
|
12
|
+
|
|
13
|
+
Output:
|
|
14
|
+
.jfl/policy-weights.json — trained weights for inference
|
|
15
|
+
.jfl/policy-embeddings.json — cached embeddings (skip re-embedding on retrain)
|
|
16
|
+
"""
|
|
17
|
+
|
|
18
|
+
import json
|
|
19
|
+
import os
|
|
20
|
+
import sys
|
|
21
|
+
import time
|
|
22
|
+
import urllib.request
|
|
23
|
+
import argparse
|
|
24
|
+
from pathlib import Path
|
|
25
|
+
|
|
26
|
+
import numpy as np
|
|
27
|
+
|
|
28
|
+
STRATUS_API_KEY = os.environ.get("STRATUS_API_KEY", "")
|
|
29
|
+
STRATUS_URL = os.environ.get("STRATUS_API_URL", "https://api.stratus.run")
|
|
30
|
+
EMBED_DIM = 768
|
|
31
|
+
HIDDEN_DIM = 256
|
|
32
|
+
EMBED_BATCH_SIZE = 20
|
|
33
|
+
|
|
34
|
+
|
|
35
|
+
def load_buffer(path: str) -> list[dict]:
|
|
36
|
+
entries = []
|
|
37
|
+
with open(path) as f:
|
|
38
|
+
for line in f:
|
|
39
|
+
line = line.strip()
|
|
40
|
+
if not line:
|
|
41
|
+
continue
|
|
42
|
+
try:
|
|
43
|
+
entries.append(json.loads(line))
|
|
44
|
+
except Exception:
|
|
45
|
+
pass
|
|
46
|
+
return entries
|
|
47
|
+
|
|
48
|
+
|
|
49
|
+
def format_state_text(entry: dict) -> str:
|
|
50
|
+
s = entry["state"]
|
|
51
|
+
dims = ", ".join(f"{k}={v:.4f}" for k, v in s.get("dimension_scores", {}).items())
|
|
52
|
+
deltas = ", ".join(
|
|
53
|
+
f"{'+' if d >= 0 else ''}{d:.4f}" for d in s.get("recent_deltas", [])
|
|
54
|
+
)
|
|
55
|
+
return (
|
|
56
|
+
f"Agent: {s.get('agent', '?')}\n"
|
|
57
|
+
f"Composite: {s.get('composite_score', 0):.4f}\n"
|
|
58
|
+
f"Tests: {s.get('tests_passing', 0)}/{s.get('tests_total', 0)}\n"
|
|
59
|
+
f"Trajectory: {s.get('trajectory_length', 0)}\n"
|
|
60
|
+
f"Dimensions: {dims or 'none'}\n"
|
|
61
|
+
f"Recent deltas: {deltas or 'none'}"
|
|
62
|
+
)
|
|
63
|
+
|
|
64
|
+
|
|
65
|
+
def format_action_text(entry: dict) -> str:
|
|
66
|
+
a = entry["action"]
|
|
67
|
+
files = ", ".join(a.get("files_affected", [])[:5])
|
|
68
|
+
return (
|
|
69
|
+
f"Type: {a.get('type', '?')}\n"
|
|
70
|
+
f"Description: {a.get('description', '')[:150]}\n"
|
|
71
|
+
f"Scope: {a.get('scope', '?')}\n"
|
|
72
|
+
f"Files: {files or 'none'}"
|
|
73
|
+
)
|
|
74
|
+
|
|
75
|
+
|
|
76
|
+
def embed_batch(texts: list[str]) -> list[list[float]]:
|
|
77
|
+
data = json.dumps({"model": "stratus-x1ac-base", "input": texts}).encode()
|
|
78
|
+
req = urllib.request.Request(
|
|
79
|
+
f"{STRATUS_URL}/v1/embeddings",
|
|
80
|
+
data=data,
|
|
81
|
+
headers={
|
|
82
|
+
"Authorization": f"Bearer {STRATUS_API_KEY}",
|
|
83
|
+
"Content-Type": "application/json",
|
|
84
|
+
},
|
|
85
|
+
)
|
|
86
|
+
try:
|
|
87
|
+
resp = urllib.request.urlopen(req, timeout=60)
|
|
88
|
+
result = json.loads(resp.read())
|
|
89
|
+
return [d["embedding"] for d in result["data"]]
|
|
90
|
+
except Exception as e:
|
|
91
|
+
print(f" Embedding error: {e}", file=sys.stderr)
|
|
92
|
+
return [[0.0] * EMBED_DIM] * len(texts)
|
|
93
|
+
|
|
94
|
+
|
|
95
|
+
def embed_all(texts: list[str], label: str = "") -> np.ndarray:
|
|
96
|
+
all_embeddings = []
|
|
97
|
+
total = len(texts)
|
|
98
|
+
for i in range(0, total, EMBED_BATCH_SIZE):
|
|
99
|
+
batch = texts[i : i + EMBED_BATCH_SIZE]
|
|
100
|
+
embs = embed_batch(batch)
|
|
101
|
+
all_embeddings.extend(embs)
|
|
102
|
+
done = min(i + EMBED_BATCH_SIZE, total)
|
|
103
|
+
print(f" {label}: {done}/{total} embedded", end="\r")
|
|
104
|
+
print(f" {label}: {total}/{total} embedded ")
|
|
105
|
+
return np.array(all_embeddings, dtype=np.float64)
|
|
106
|
+
|
|
107
|
+
|
|
108
|
+
# --- Neural Network ---
|
|
109
|
+
|
|
110
|
+
|
|
111
|
+
def xavier_init(fan_in: int, fan_out: int) -> np.ndarray:
|
|
112
|
+
std = np.sqrt(2.0 / fan_in) * 0.1 # Small init for stability
|
|
113
|
+
return (np.random.randn(fan_in, fan_out) * std).astype(np.float64)
|
|
114
|
+
|
|
115
|
+
|
|
116
|
+
def relu(x: np.ndarray) -> np.ndarray:
|
|
117
|
+
return np.maximum(0, x)
|
|
118
|
+
|
|
119
|
+
|
|
120
|
+
def relu_grad(x: np.ndarray) -> np.ndarray:
|
|
121
|
+
return (x > 0).astype(np.float64)
|
|
122
|
+
|
|
123
|
+
|
|
124
|
+
class PolicyHead:
|
|
125
|
+
def __init__(self, input_dim: int = EMBED_DIM * 2, hidden_dim: int = HIDDEN_DIM):
|
|
126
|
+
self.W1 = xavier_init(input_dim, hidden_dim)
|
|
127
|
+
self.b1 = np.zeros(hidden_dim, dtype=np.float64)
|
|
128
|
+
self.W2 = xavier_init(hidden_dim, hidden_dim)
|
|
129
|
+
self.b2 = np.zeros(hidden_dim, dtype=np.float64)
|
|
130
|
+
self.W3 = xavier_init(hidden_dim, 1)
|
|
131
|
+
self.b3 = np.zeros(1, dtype=np.float64)
|
|
132
|
+
|
|
133
|
+
# Adam state
|
|
134
|
+
self.params = [self.W1, self.b1, self.W2, self.b2, self.W3, self.b3]
|
|
135
|
+
self.m = [np.zeros_like(p) for p in self.params]
|
|
136
|
+
self.v = [np.zeros_like(p) for p in self.params]
|
|
137
|
+
self.t = 0
|
|
138
|
+
|
|
139
|
+
def forward(self, x: np.ndarray) -> tuple:
|
|
140
|
+
z1 = x @ self.W1 + self.b1
|
|
141
|
+
a1 = relu(z1)
|
|
142
|
+
z2 = a1 @ self.W2 + self.b2
|
|
143
|
+
a2 = relu(z2)
|
|
144
|
+
z3 = a2 @ self.W3 + self.b3
|
|
145
|
+
return z3, (x, z1, a1, z2, a2)
|
|
146
|
+
|
|
147
|
+
def backward(self, pred: np.ndarray, target: np.ndarray, cache: tuple) -> list:
|
|
148
|
+
x, z1, a1, z2, a2 = cache
|
|
149
|
+
batch_size = x.shape[0]
|
|
150
|
+
|
|
151
|
+
# MSE gradient
|
|
152
|
+
dz3 = (pred - target) / batch_size # (B, 1)
|
|
153
|
+
|
|
154
|
+
dW3 = a2.T @ dz3
|
|
155
|
+
db3 = dz3.sum(axis=0)
|
|
156
|
+
|
|
157
|
+
da2 = dz3 @ self.W3.T
|
|
158
|
+
dz2 = da2 * relu_grad(z2)
|
|
159
|
+
|
|
160
|
+
dW2 = a1.T @ dz2
|
|
161
|
+
db2 = dz2.sum(axis=0)
|
|
162
|
+
|
|
163
|
+
da1 = dz2 @ self.W2.T
|
|
164
|
+
dz1 = da1 * relu_grad(z1)
|
|
165
|
+
|
|
166
|
+
dW1 = x.T @ dz1
|
|
167
|
+
db1 = dz1.sum(axis=0)
|
|
168
|
+
|
|
169
|
+
return [dW1, db1, dW2, db2, dW3, db3]
|
|
170
|
+
|
|
171
|
+
def adam_step(self, grads: list, lr: float = 1e-4, beta1=0.9, beta2=0.999, eps=1e-8, max_grad_norm=1.0):
|
|
172
|
+
# Clip individual gradient values first
|
|
173
|
+
grads = [np.clip(g, -5.0, 5.0) for g in grads]
|
|
174
|
+
|
|
175
|
+
# Global gradient norm clipping
|
|
176
|
+
total_norm = 0.0
|
|
177
|
+
for g in grads:
|
|
178
|
+
total_norm += float(np.sum(g.astype(np.float64) ** 2))
|
|
179
|
+
total_norm = np.sqrt(total_norm)
|
|
180
|
+
if total_norm > max_grad_norm:
|
|
181
|
+
scale = max_grad_norm / (total_norm + eps)
|
|
182
|
+
grads = [g * scale for g in grads]
|
|
183
|
+
|
|
184
|
+
self.t += 1
|
|
185
|
+
for i, (param, grad) in enumerate(zip(self.params, grads)):
|
|
186
|
+
if np.any(np.isnan(grad)):
|
|
187
|
+
continue
|
|
188
|
+
self.m[i] = beta1 * self.m[i] + (1 - beta1) * grad
|
|
189
|
+
self.v[i] = beta2 * self.v[i] + (1 - beta2) * (grad ** 2)
|
|
190
|
+
m_hat = self.m[i] / (1 - beta1 ** self.t)
|
|
191
|
+
v_hat = self.v[i] / (1 - beta2 ** self.t)
|
|
192
|
+
update = lr * m_hat / (np.sqrt(v_hat) + eps)
|
|
193
|
+
param -= np.clip(update, -0.1, 0.1)
|
|
194
|
+
# Sync references
|
|
195
|
+
self.W1, self.b1, self.W2, self.b2, self.W3, self.b3 = self.params
|
|
196
|
+
|
|
197
|
+
def save(self, path: str, metadata: dict):
|
|
198
|
+
weights = {
|
|
199
|
+
"version": 1,
|
|
200
|
+
"architecture": f"{self.W1.shape[0]}-{self.W1.shape[1]}-{self.W2.shape[1]}-{self.W3.shape[1]}",
|
|
201
|
+
"embed_dim": EMBED_DIM,
|
|
202
|
+
"mode": "embedding",
|
|
203
|
+
"trained_at": time.strftime("%Y-%m-%dT%H:%M:%SZ", time.gmtime()),
|
|
204
|
+
**metadata,
|
|
205
|
+
"layers": {
|
|
206
|
+
"W1": self.W1.tolist(),
|
|
207
|
+
"b1": self.b1.tolist(),
|
|
208
|
+
"W2": self.W2.tolist(),
|
|
209
|
+
"b2": self.b2.tolist(),
|
|
210
|
+
"W3": self.W3.tolist(),
|
|
211
|
+
"b3": self.b3.tolist(),
|
|
212
|
+
},
|
|
213
|
+
}
|
|
214
|
+
with open(path, "w") as f:
|
|
215
|
+
json.dump(weights, f)
|
|
216
|
+
|
|
217
|
+
|
|
218
|
+
def train(
|
|
219
|
+
entries: list[dict],
|
|
220
|
+
epochs: int = 50,
|
|
221
|
+
lr: float = 1e-4,
|
|
222
|
+
batch_size: int = 32,
|
|
223
|
+
cache_path: str | None = None,
|
|
224
|
+
) -> tuple:
|
|
225
|
+
print(f"\n Training policy head on {len(entries)} tuples\n")
|
|
226
|
+
|
|
227
|
+
# Check for cached embeddings
|
|
228
|
+
state_embs = None
|
|
229
|
+
action_embs = None
|
|
230
|
+
if cache_path and os.path.exists(cache_path):
|
|
231
|
+
print(" Loading cached embeddings...")
|
|
232
|
+
with open(cache_path) as f:
|
|
233
|
+
cache = json.load(f)
|
|
234
|
+
if cache.get("count") == len(entries):
|
|
235
|
+
state_embs = np.array(cache["state_embeddings"], dtype=np.float64)
|
|
236
|
+
action_embs = np.array(cache["action_embeddings"], dtype=np.float64)
|
|
237
|
+
print(f" Loaded {len(state_embs)} cached embeddings")
|
|
238
|
+
|
|
239
|
+
if state_embs is None:
|
|
240
|
+
# Embed states and actions
|
|
241
|
+
state_texts = [format_state_text(e) for e in entries]
|
|
242
|
+
action_texts = [format_action_text(e) for e in entries]
|
|
243
|
+
|
|
244
|
+
state_embs = embed_all(state_texts, "States")
|
|
245
|
+
action_embs = embed_all(action_texts, "Actions")
|
|
246
|
+
|
|
247
|
+
# Cache embeddings
|
|
248
|
+
if cache_path:
|
|
249
|
+
os.makedirs(os.path.dirname(cache_path), exist_ok=True)
|
|
250
|
+
with open(cache_path, "w") as f:
|
|
251
|
+
json.dump(
|
|
252
|
+
{
|
|
253
|
+
"count": len(entries),
|
|
254
|
+
"state_embeddings": state_embs.tolist(),
|
|
255
|
+
"action_embeddings": action_embs.tolist(),
|
|
256
|
+
},
|
|
257
|
+
f,
|
|
258
|
+
)
|
|
259
|
+
print(f" Cached embeddings to {cache_path}")
|
|
260
|
+
|
|
261
|
+
# Prepare training data
|
|
262
|
+
# Input: concat(state_embedding, action_embedding) = 1536 dims
|
|
263
|
+
X = np.concatenate([state_embs, action_embs], axis=1)
|
|
264
|
+
|
|
265
|
+
# L2 normalize each input vector for stable training
|
|
266
|
+
norms = np.linalg.norm(X, axis=1, keepdims=True)
|
|
267
|
+
norms = np.maximum(norms, 1e-8)
|
|
268
|
+
X = X / norms
|
|
269
|
+
|
|
270
|
+
# Target: composite_delta (reward)
|
|
271
|
+
y = np.array(
|
|
272
|
+
[float(e["reward"].get("composite_delta", 0)) for e in entries],
|
|
273
|
+
dtype=np.float64,
|
|
274
|
+
).reshape(-1, 1)
|
|
275
|
+
|
|
276
|
+
# Normalize targets to [-1, 1] range for stable training
|
|
277
|
+
y_mean = y.mean()
|
|
278
|
+
y_std = max(y.std(), 1e-6)
|
|
279
|
+
y_norm = (y - y_mean) / y_std
|
|
280
|
+
|
|
281
|
+
input_dim = X.shape[1]
|
|
282
|
+
print(f" Input dim: {input_dim} ({EMBED_DIM} state + {EMBED_DIM} action)")
|
|
283
|
+
print(f" Target range: [{y.min():.4f}, {y.max():.4f}] (mean={y_mean:.4f})")
|
|
284
|
+
print()
|
|
285
|
+
|
|
286
|
+
# Train/val split (90/10)
|
|
287
|
+
n = len(X)
|
|
288
|
+
indices = np.random.permutation(n)
|
|
289
|
+
split = int(n * 0.9)
|
|
290
|
+
train_idx, val_idx = indices[:split], indices[split:]
|
|
291
|
+
|
|
292
|
+
X_train, y_train = X[train_idx], y_norm[train_idx]
|
|
293
|
+
X_val, y_val = X[val_idx], y_norm[val_idx]
|
|
294
|
+
|
|
295
|
+
model = PolicyHead(input_dim=input_dim)
|
|
296
|
+
best_val_loss = float("inf")
|
|
297
|
+
best_epoch = 0
|
|
298
|
+
|
|
299
|
+
for epoch in range(epochs):
|
|
300
|
+
# Shuffle training data
|
|
301
|
+
perm = np.random.permutation(len(X_train))
|
|
302
|
+
X_train = X_train[perm]
|
|
303
|
+
y_train = y_train[perm]
|
|
304
|
+
|
|
305
|
+
epoch_loss = 0.0
|
|
306
|
+
n_batches = 0
|
|
307
|
+
|
|
308
|
+
for i in range(0, len(X_train), batch_size):
|
|
309
|
+
X_batch = X_train[i : i + batch_size]
|
|
310
|
+
y_batch = y_train[i : i + batch_size]
|
|
311
|
+
|
|
312
|
+
pred, cache = model.forward(X_batch)
|
|
313
|
+
loss = float(((pred - y_batch) ** 2).mean())
|
|
314
|
+
if np.isnan(loss) or np.isinf(loss):
|
|
315
|
+
continue
|
|
316
|
+
epoch_loss += loss
|
|
317
|
+
n_batches += 1
|
|
318
|
+
|
|
319
|
+
grads = model.backward(pred, y_batch, cache)
|
|
320
|
+
model.adam_step(grads, lr=lr)
|
|
321
|
+
|
|
322
|
+
avg_loss = epoch_loss / max(n_batches, 1)
|
|
323
|
+
|
|
324
|
+
# Validation
|
|
325
|
+
val_pred, _ = model.forward(X_val)
|
|
326
|
+
val_loss = ((val_pred - y_val) ** 2).mean()
|
|
327
|
+
|
|
328
|
+
if val_loss < best_val_loss:
|
|
329
|
+
best_val_loss = val_loss
|
|
330
|
+
best_epoch = epoch + 1
|
|
331
|
+
|
|
332
|
+
if (epoch + 1) % 10 == 0 or epoch == 0:
|
|
333
|
+
print(
|
|
334
|
+
f" Epoch {epoch+1:3d}/{epochs}: "
|
|
335
|
+
f"train_loss={avg_loss:.6f} val_loss={val_loss:.6f}"
|
|
336
|
+
f"{' ★ best' if epoch + 1 == best_epoch else ''}"
|
|
337
|
+
)
|
|
338
|
+
|
|
339
|
+
# Final metrics
|
|
340
|
+
all_pred, _ = model.forward(X)
|
|
341
|
+
all_pred_denorm = all_pred * y_std + y_mean
|
|
342
|
+
mse = ((all_pred_denorm - y) ** 2).mean()
|
|
343
|
+
|
|
344
|
+
# Direction accuracy: did we predict positive/negative correctly?
|
|
345
|
+
pred_dir = (all_pred_denorm > 0).flatten()
|
|
346
|
+
actual_dir = (y > 0).flatten()
|
|
347
|
+
direction_acc = (pred_dir == actual_dir).mean()
|
|
348
|
+
|
|
349
|
+
# Rank correlation (Spearman) — implemented without scipy
|
|
350
|
+
def spearman_corr(x: np.ndarray, y: np.ndarray) -> float:
|
|
351
|
+
n = len(x)
|
|
352
|
+
if n < 3:
|
|
353
|
+
return 0.0
|
|
354
|
+
rank_x = np.argsort(np.argsort(x))
|
|
355
|
+
rank_y = np.argsort(np.argsort(y))
|
|
356
|
+
d = rank_x - rank_y
|
|
357
|
+
return float(1 - 6 * np.sum(d**2) / (n * (n**2 - 1)))
|
|
358
|
+
|
|
359
|
+
try:
|
|
360
|
+
rank_corr = spearman_corr(all_pred_denorm.flatten(), y.flatten())
|
|
361
|
+
except Exception:
|
|
362
|
+
rank_corr = 0.0
|
|
363
|
+
|
|
364
|
+
print(f"\n Final MSE: {mse:.6f}")
|
|
365
|
+
print(f" Direction accuracy: {direction_acc:.1%}")
|
|
366
|
+
print(f" Rank correlation: {rank_corr:.4f}")
|
|
367
|
+
print(f" Best epoch: {best_epoch}")
|
|
368
|
+
|
|
369
|
+
metadata = {
|
|
370
|
+
"trained_on": len(entries),
|
|
371
|
+
"train_size": len(X_train),
|
|
372
|
+
"val_size": len(X_val),
|
|
373
|
+
"epochs": epochs,
|
|
374
|
+
"learning_rate": lr,
|
|
375
|
+
"best_epoch": best_epoch,
|
|
376
|
+
"final_mse": float(mse),
|
|
377
|
+
"direction_accuracy": float(direction_acc),
|
|
378
|
+
"rank_correlation": float(rank_corr),
|
|
379
|
+
"target_mean": float(y_mean),
|
|
380
|
+
"target_std": float(y_std),
|
|
381
|
+
}
|
|
382
|
+
|
|
383
|
+
return model, metadata
|
|
384
|
+
|
|
385
|
+
|
|
386
|
+
def main():
|
|
387
|
+
parser = argparse.ArgumentParser(description="Train policy head from training buffer")
|
|
388
|
+
parser.add_argument("--buffer", default=".jfl/training-buffer.jsonl", help="Training buffer path")
|
|
389
|
+
parser.add_argument("--output", default=".jfl/policy-weights.json", help="Output weights path")
|
|
390
|
+
parser.add_argument("--cache", default=".jfl/policy-embeddings.json", help="Embeddings cache path")
|
|
391
|
+
parser.add_argument("--epochs", type=int, default=50, help="Training epochs")
|
|
392
|
+
parser.add_argument("--lr", type=float, default=3e-4, help="Learning rate")
|
|
393
|
+
parser.add_argument("--batch-size", type=int, default=32, help="Batch size")
|
|
394
|
+
args = parser.parse_args()
|
|
395
|
+
|
|
396
|
+
if not STRATUS_API_KEY:
|
|
397
|
+
print("Error: STRATUS_API_KEY not set", file=sys.stderr)
|
|
398
|
+
print(" export STRATUS_API_KEY=stratus_sk_live_...", file=sys.stderr)
|
|
399
|
+
sys.exit(1)
|
|
400
|
+
|
|
401
|
+
if not os.path.exists(args.buffer):
|
|
402
|
+
print(f"Error: Training buffer not found: {args.buffer}", file=sys.stderr)
|
|
403
|
+
print(" Run: jfl eval mine --all --telemetry", file=sys.stderr)
|
|
404
|
+
sys.exit(1)
|
|
405
|
+
|
|
406
|
+
entries = load_buffer(args.buffer)
|
|
407
|
+
if len(entries) < 3:
|
|
408
|
+
print(f"Error: Need at least 3 tuples, got {len(entries)}", file=sys.stderr)
|
|
409
|
+
sys.exit(1)
|
|
410
|
+
|
|
411
|
+
print(f"\n Policy Head Trainer")
|
|
412
|
+
print(f" {'─' * 40}")
|
|
413
|
+
print(f" Buffer: {args.buffer} ({len(entries)} tuples)")
|
|
414
|
+
print(f" Epochs: {args.epochs}, LR: {args.lr}, Batch: {args.batch_size}")
|
|
415
|
+
print(f" Stratus: {STRATUS_URL}")
|
|
416
|
+
|
|
417
|
+
model, metadata = train(
|
|
418
|
+
entries,
|
|
419
|
+
epochs=args.epochs,
|
|
420
|
+
lr=args.lr,
|
|
421
|
+
batch_size=args.batch_size,
|
|
422
|
+
cache_path=args.cache,
|
|
423
|
+
)
|
|
424
|
+
|
|
425
|
+
model.save(args.output, metadata)
|
|
426
|
+
size_kb = os.path.getsize(args.output) / 1024
|
|
427
|
+
print(f"\n Saved: {args.output} ({size_kb:.0f}KB)")
|
|
428
|
+
print(f" Direction accuracy: {metadata['direction_accuracy']:.1%}")
|
|
429
|
+
print(f" Rank correlation: {metadata['rank_correlation']:.4f}")
|
|
430
|
+
print()
|
|
431
|
+
|
|
432
|
+
|
|
433
|
+
if __name__ == "__main__":
|
|
434
|
+
main()
|