jfl 0.4.4 → 0.6.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/commands/context-hub.d.ts +1 -0
- package/dist/commands/context-hub.d.ts.map +1 -1
- package/dist/commands/context-hub.js +1064 -41
- package/dist/commands/context-hub.js.map +1 -1
- package/dist/commands/eval.d.ts +1 -1
- package/dist/commands/eval.d.ts.map +1 -1
- package/dist/commands/eval.js +192 -1
- package/dist/commands/eval.js.map +1 -1
- package/dist/commands/findings.d.ts +6 -0
- package/dist/commands/findings.d.ts.map +1 -0
- package/dist/commands/findings.js +203 -0
- package/dist/commands/findings.js.map +1 -0
- package/dist/commands/hud.d.ts.map +1 -1
- package/dist/commands/hud.js +47 -9
- package/dist/commands/hud.js.map +1 -1
- package/dist/commands/ide.d.ts +27 -0
- package/dist/commands/ide.d.ts.map +1 -0
- package/dist/commands/ide.js +546 -0
- package/dist/commands/ide.js.map +1 -0
- package/dist/commands/onboard.d.ts.map +1 -1
- package/dist/commands/onboard.js +212 -2
- package/dist/commands/onboard.js.map +1 -1
- package/dist/commands/openclaw.d.ts +3 -0
- package/dist/commands/openclaw.d.ts.map +1 -1
- package/dist/commands/openclaw.js +76 -2
- package/dist/commands/openclaw.js.map +1 -1
- package/dist/commands/peter.d.ts +3 -0
- package/dist/commands/peter.d.ts.map +1 -1
- package/dist/commands/peter.js +1168 -58
- package/dist/commands/peter.js.map +1 -1
- package/dist/commands/pi-fleet.d.ts +18 -0
- package/dist/commands/pi-fleet.d.ts.map +1 -0
- package/dist/commands/pi-fleet.js +382 -0
- package/dist/commands/pi-fleet.js.map +1 -0
- package/dist/commands/pi.d.ts.map +1 -1
- package/dist/commands/pi.js +18 -3
- package/dist/commands/pi.js.map +1 -1
- package/dist/commands/scope.d.ts.map +1 -1
- package/dist/commands/scope.js +90 -1
- package/dist/commands/scope.js.map +1 -1
- package/dist/commands/services.d.ts.map +1 -1
- package/dist/commands/services.js +18 -0
- package/dist/commands/services.js.map +1 -1
- package/dist/commands/setup.d.ts +12 -0
- package/dist/commands/setup.d.ts.map +1 -0
- package/dist/commands/setup.js +322 -0
- package/dist/commands/setup.js.map +1 -0
- package/dist/commands/status.d.ts.map +1 -1
- package/dist/commands/status.js +22 -4
- package/dist/commands/status.js.map +1 -1
- package/dist/commands/train.d.ts +33 -0
- package/dist/commands/train.d.ts.map +1 -0
- package/dist/commands/train.js +510 -0
- package/dist/commands/train.js.map +1 -0
- package/dist/commands/verify.d.ts +14 -0
- package/dist/commands/verify.d.ts.map +1 -0
- package/dist/commands/verify.js +276 -0
- package/dist/commands/verify.js.map +1 -0
- package/dist/commands/viz.d.ts.map +1 -1
- package/dist/commands/viz.js +417 -0
- package/dist/commands/viz.js.map +1 -1
- package/dist/dashboard-static/assets/index-CW9ZxqX8.css +1 -0
- package/dist/dashboard-static/assets/index-DNN__p4K.js +121 -0
- package/dist/dashboard-static/index.html +2 -2
- package/dist/index.js +324 -64
- package/dist/index.js.map +1 -1
- package/dist/lib/agent-config.d.ts +52 -0
- package/dist/lib/agent-config.d.ts.map +1 -0
- package/dist/lib/agent-config.js +231 -0
- package/dist/lib/agent-config.js.map +1 -0
- package/dist/lib/agent-generator.d.ts +10 -0
- package/dist/lib/agent-generator.d.ts.map +1 -1
- package/dist/lib/agent-generator.js +64 -10
- package/dist/lib/agent-generator.js.map +1 -1
- package/dist/lib/agent-session.d.ts +104 -0
- package/dist/lib/agent-session.d.ts.map +1 -0
- package/dist/lib/agent-session.js +635 -0
- package/dist/lib/agent-session.js.map +1 -0
- package/dist/lib/eval-snapshot.d.ts +47 -0
- package/dist/lib/eval-snapshot.d.ts.map +1 -0
- package/dist/lib/eval-snapshot.js +315 -0
- package/dist/lib/eval-snapshot.js.map +1 -0
- package/dist/lib/eval-store.d.ts +5 -0
- package/dist/lib/eval-store.d.ts.map +1 -1
- package/dist/lib/eval-store.js +33 -3
- package/dist/lib/eval-store.js.map +1 -1
- package/dist/lib/findings-engine.d.ts +51 -0
- package/dist/lib/findings-engine.d.ts.map +1 -0
- package/dist/lib/findings-engine.js +338 -0
- package/dist/lib/findings-engine.js.map +1 -0
- package/dist/lib/flow-engine.d.ts +8 -0
- package/dist/lib/flow-engine.d.ts.map +1 -1
- package/dist/lib/flow-engine.js +84 -2
- package/dist/lib/flow-engine.js.map +1 -1
- package/dist/lib/hub-client.d.ts +1 -0
- package/dist/lib/hub-client.d.ts.map +1 -1
- package/dist/lib/hub-client.js +33 -6
- package/dist/lib/hub-client.js.map +1 -1
- package/dist/lib/ide-panes.d.ts +58 -0
- package/dist/lib/ide-panes.d.ts.map +1 -0
- package/dist/lib/ide-panes.js +508 -0
- package/dist/lib/ide-panes.js.map +1 -0
- package/dist/lib/memory-db.js +4 -4
- package/dist/lib/memory-db.js.map +1 -1
- package/dist/lib/memory-indexer.d.ts.map +1 -1
- package/dist/lib/memory-indexer.js +3 -0
- package/dist/lib/memory-indexer.js.map +1 -1
- package/dist/lib/memory-search.d.ts +148 -4
- package/dist/lib/memory-search.d.ts.map +1 -1
- package/dist/lib/memory-search.js +496 -58
- package/dist/lib/memory-search.js.map +1 -1
- package/dist/lib/meta-orchestrator.d.ts +104 -0
- package/dist/lib/meta-orchestrator.d.ts.map +1 -0
- package/dist/lib/meta-orchestrator.js +373 -0
- package/dist/lib/meta-orchestrator.js.map +1 -0
- package/dist/lib/peer-agent-generator.d.ts.map +1 -1
- package/dist/lib/peer-agent-generator.js +43 -19
- package/dist/lib/peer-agent-generator.js.map +1 -1
- package/dist/lib/pi-sky/bridge.d.ts +55 -0
- package/dist/lib/pi-sky/bridge.d.ts.map +1 -0
- package/dist/lib/pi-sky/bridge.js +264 -0
- package/dist/lib/pi-sky/bridge.js.map +1 -0
- package/dist/lib/pi-sky/cost-monitor.d.ts +21 -0
- package/dist/lib/pi-sky/cost-monitor.d.ts.map +1 -0
- package/dist/lib/pi-sky/cost-monitor.js +126 -0
- package/dist/lib/pi-sky/cost-monitor.js.map +1 -0
- package/dist/lib/pi-sky/eval-sweep.d.ts +27 -0
- package/dist/lib/pi-sky/eval-sweep.d.ts.map +1 -0
- package/dist/lib/pi-sky/eval-sweep.js +141 -0
- package/dist/lib/pi-sky/eval-sweep.js.map +1 -0
- package/dist/lib/pi-sky/event-router.d.ts +32 -0
- package/dist/lib/pi-sky/event-router.d.ts.map +1 -0
- package/dist/lib/pi-sky/event-router.js +176 -0
- package/dist/lib/pi-sky/event-router.js.map +1 -0
- package/dist/lib/pi-sky/experiment.d.ts +9 -0
- package/dist/lib/pi-sky/experiment.d.ts.map +1 -0
- package/dist/lib/pi-sky/experiment.js +83 -0
- package/dist/lib/pi-sky/experiment.js.map +1 -0
- package/dist/lib/pi-sky/index.d.ts +16 -0
- package/dist/lib/pi-sky/index.d.ts.map +1 -0
- package/dist/lib/pi-sky/index.js +16 -0
- package/dist/lib/pi-sky/index.js.map +1 -0
- package/dist/lib/pi-sky/stratus-gate.d.ts +28 -0
- package/dist/lib/pi-sky/stratus-gate.d.ts.map +1 -0
- package/dist/lib/pi-sky/stratus-gate.js +61 -0
- package/dist/lib/pi-sky/stratus-gate.js.map +1 -0
- package/dist/lib/pi-sky/swarm.d.ts +28 -0
- package/dist/lib/pi-sky/swarm.d.ts.map +1 -0
- package/dist/lib/pi-sky/swarm.js +208 -0
- package/dist/lib/pi-sky/swarm.js.map +1 -0
- package/dist/lib/pi-sky/types.d.ts +139 -0
- package/dist/lib/pi-sky/types.d.ts.map +1 -0
- package/dist/lib/pi-sky/types.js +2 -0
- package/dist/lib/pi-sky/types.js.map +1 -0
- package/dist/lib/pi-sky/voice-bridge.d.ts +20 -0
- package/dist/lib/pi-sky/voice-bridge.d.ts.map +1 -0
- package/dist/lib/pi-sky/voice-bridge.js +91 -0
- package/dist/lib/pi-sky/voice-bridge.js.map +1 -0
- package/dist/lib/policy-head.d.ts +40 -0
- package/dist/lib/policy-head.d.ts.map +1 -0
- package/dist/lib/policy-head.js +234 -0
- package/dist/lib/policy-head.js.map +1 -0
- package/dist/lib/predictor.d.ts +10 -0
- package/dist/lib/predictor.d.ts.map +1 -1
- package/dist/lib/predictor.js +46 -7
- package/dist/lib/predictor.js.map +1 -1
- package/dist/lib/replay-buffer.d.ts +93 -0
- package/dist/lib/replay-buffer.d.ts.map +1 -0
- package/dist/lib/replay-buffer.js +302 -0
- package/dist/lib/replay-buffer.js.map +1 -0
- package/dist/lib/sentinel-rl.d.ts +97 -0
- package/dist/lib/sentinel-rl.d.ts.map +1 -0
- package/dist/lib/sentinel-rl.js +430 -0
- package/dist/lib/sentinel-rl.js.map +1 -0
- package/dist/lib/session-lock.d.ts +61 -0
- package/dist/lib/session-lock.d.ts.map +1 -0
- package/dist/lib/session-lock.js +438 -0
- package/dist/lib/session-lock.js.map +1 -0
- package/dist/lib/setup/agent-generator.d.ts +18 -0
- package/dist/lib/setup/agent-generator.d.ts.map +1 -0
- package/dist/lib/setup/agent-generator.js +114 -0
- package/dist/lib/setup/agent-generator.js.map +1 -0
- package/dist/lib/setup/context-analyzer.d.ts +16 -0
- package/dist/lib/setup/context-analyzer.d.ts.map +1 -0
- package/dist/lib/setup/context-analyzer.js +112 -0
- package/dist/lib/setup/context-analyzer.js.map +1 -0
- package/dist/lib/setup/doc-auditor.d.ts +54 -0
- package/dist/lib/setup/doc-auditor.d.ts.map +1 -0
- package/dist/lib/setup/doc-auditor.js +629 -0
- package/dist/lib/setup/doc-auditor.js.map +1 -0
- package/dist/lib/setup/domain-generator.d.ts +7 -0
- package/dist/lib/setup/domain-generator.d.ts.map +1 -0
- package/dist/lib/setup/domain-generator.js +58 -0
- package/dist/lib/setup/domain-generator.js.map +1 -0
- package/dist/lib/setup/smart-eval-generator.d.ts +38 -0
- package/dist/lib/setup/smart-eval-generator.d.ts.map +1 -0
- package/dist/lib/setup/smart-eval-generator.js +378 -0
- package/dist/lib/setup/smart-eval-generator.js.map +1 -0
- package/dist/lib/setup/smart-recommender.d.ts +63 -0
- package/dist/lib/setup/smart-recommender.d.ts.map +1 -0
- package/dist/lib/setup/smart-recommender.js +329 -0
- package/dist/lib/setup/smart-recommender.js.map +1 -0
- package/dist/lib/setup/spec-generator.d.ts +63 -0
- package/dist/lib/setup/spec-generator.d.ts.map +1 -0
- package/dist/lib/setup/spec-generator.js +310 -0
- package/dist/lib/setup/spec-generator.js.map +1 -0
- package/dist/lib/setup/violation-agent-generator.d.ts +32 -0
- package/dist/lib/setup/violation-agent-generator.d.ts.map +1 -0
- package/dist/lib/setup/violation-agent-generator.js +255 -0
- package/dist/lib/setup/violation-agent-generator.js.map +1 -0
- package/dist/lib/stratus-client.d.ts +1 -0
- package/dist/lib/stratus-client.d.ts.map +1 -1
- package/dist/lib/stratus-client.js +24 -2
- package/dist/lib/stratus-client.js.map +1 -1
- package/dist/lib/telemetry-agent-v2.d.ts +128 -0
- package/dist/lib/telemetry-agent-v2.d.ts.map +1 -0
- package/dist/lib/telemetry-agent-v2.js +1042 -0
- package/dist/lib/telemetry-agent-v2.js.map +1 -0
- package/dist/lib/telemetry-agent.d.ts.map +1 -1
- package/dist/lib/telemetry-agent.js +27 -6
- package/dist/lib/telemetry-agent.js.map +1 -1
- package/dist/lib/telemetry-digest.d.ts.map +1 -1
- package/dist/lib/telemetry-digest.js +27 -5
- package/dist/lib/telemetry-digest.js.map +1 -1
- package/dist/lib/telemetry.d.ts.map +1 -1
- package/dist/lib/telemetry.js +29 -4
- package/dist/lib/telemetry.js.map +1 -1
- package/dist/lib/text-preprocessing.d.ts +83 -0
- package/dist/lib/text-preprocessing.d.ts.map +1 -0
- package/dist/lib/text-preprocessing.js +261 -0
- package/dist/lib/text-preprocessing.js.map +1 -0
- package/dist/lib/training-buffer.d.ts +86 -0
- package/dist/lib/training-buffer.d.ts.map +1 -0
- package/dist/lib/training-buffer.js +139 -0
- package/dist/lib/training-buffer.js.map +1 -0
- package/dist/lib/tuple-miner.d.ts +30 -0
- package/dist/lib/tuple-miner.d.ts.map +1 -0
- package/dist/lib/tuple-miner.js +427 -0
- package/dist/lib/tuple-miner.js.map +1 -0
- package/dist/lib/vm-backend.d.ts +72 -0
- package/dist/lib/vm-backend.d.ts.map +1 -0
- package/dist/lib/vm-backend.js +175 -0
- package/dist/lib/vm-backend.js.map +1 -0
- package/dist/lib/workspace/backend.d.ts +53 -0
- package/dist/lib/workspace/backend.d.ts.map +1 -0
- package/dist/lib/workspace/backend.js +37 -0
- package/dist/lib/workspace/backend.js.map +1 -0
- package/dist/lib/workspace/cmux-adapter.d.ts +46 -0
- package/dist/lib/workspace/cmux-adapter.d.ts.map +1 -0
- package/dist/lib/workspace/cmux-adapter.js +261 -0
- package/dist/lib/workspace/cmux-adapter.js.map +1 -0
- package/dist/lib/workspace/data-pipeline.d.ts +35 -0
- package/dist/lib/workspace/data-pipeline.d.ts.map +1 -0
- package/dist/lib/workspace/data-pipeline.js +463 -0
- package/dist/lib/workspace/data-pipeline.js.map +1 -0
- package/dist/lib/workspace/engine.d.ts +64 -0
- package/dist/lib/workspace/engine.d.ts.map +1 -0
- package/dist/lib/workspace/engine.js +397 -0
- package/dist/lib/workspace/engine.js.map +1 -0
- package/dist/lib/workspace/notifications.d.ts +14 -0
- package/dist/lib/workspace/notifications.d.ts.map +1 -0
- package/dist/lib/workspace/notifications.js +41 -0
- package/dist/lib/workspace/notifications.js.map +1 -0
- package/dist/lib/workspace/surface-registry.d.ts +49 -0
- package/dist/lib/workspace/surface-registry.d.ts.map +1 -0
- package/dist/lib/workspace/surface-registry.js +217 -0
- package/dist/lib/workspace/surface-registry.js.map +1 -0
- package/dist/lib/workspace/surface-type.d.ts +153 -0
- package/dist/lib/workspace/surface-type.d.ts.map +1 -0
- package/dist/lib/workspace/surface-type.js +9 -0
- package/dist/lib/workspace/surface-type.js.map +1 -0
- package/dist/lib/workspace/surfaces/agent-overview.d.ts +16 -0
- package/dist/lib/workspace/surfaces/agent-overview.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/agent-overview.js +116 -0
- package/dist/lib/workspace/surfaces/agent-overview.js.map +1 -0
- package/dist/lib/workspace/surfaces/agent.d.ts +16 -0
- package/dist/lib/workspace/surfaces/agent.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/agent.js +112 -0
- package/dist/lib/workspace/surfaces/agent.js.map +1 -0
- package/dist/lib/workspace/surfaces/claude.d.ts +15 -0
- package/dist/lib/workspace/surfaces/claude.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/claude.js +23 -0
- package/dist/lib/workspace/surfaces/claude.js.map +1 -0
- package/dist/lib/workspace/surfaces/dashboard.d.ts +21 -0
- package/dist/lib/workspace/surfaces/dashboard.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/dashboard.js +32 -0
- package/dist/lib/workspace/surfaces/dashboard.js.map +1 -0
- package/dist/lib/workspace/surfaces/eval.d.ts +15 -0
- package/dist/lib/workspace/surfaces/eval.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/eval.js +42 -0
- package/dist/lib/workspace/surfaces/eval.js.map +1 -0
- package/dist/lib/workspace/surfaces/event-stream.d.ts +16 -0
- package/dist/lib/workspace/surfaces/event-stream.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/event-stream.js +40 -0
- package/dist/lib/workspace/surfaces/event-stream.js.map +1 -0
- package/dist/lib/workspace/surfaces/flow.d.ts +16 -0
- package/dist/lib/workspace/surfaces/flow.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/flow.js +49 -0
- package/dist/lib/workspace/surfaces/flow.js.map +1 -0
- package/dist/lib/workspace/surfaces/index.d.ts +16 -0
- package/dist/lib/workspace/surfaces/index.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/index.js +16 -0
- package/dist/lib/workspace/surfaces/index.js.map +1 -0
- package/dist/lib/workspace/surfaces/portfolio.d.ts +16 -0
- package/dist/lib/workspace/surfaces/portfolio.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/portfolio.js +102 -0
- package/dist/lib/workspace/surfaces/portfolio.js.map +1 -0
- package/dist/lib/workspace/surfaces/service.d.ts +16 -0
- package/dist/lib/workspace/surfaces/service.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/service.js +45 -0
- package/dist/lib/workspace/surfaces/service.js.map +1 -0
- package/dist/lib/workspace/surfaces/shell.d.ts +15 -0
- package/dist/lib/workspace/surfaces/shell.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/shell.js +19 -0
- package/dist/lib/workspace/surfaces/shell.js.map +1 -0
- package/dist/lib/workspace/surfaces/telemetry.d.ts +16 -0
- package/dist/lib/workspace/surfaces/telemetry.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/telemetry.js +48 -0
- package/dist/lib/workspace/surfaces/telemetry.js.map +1 -0
- package/dist/lib/workspace/surfaces/topology.d.ts +15 -0
- package/dist/lib/workspace/surfaces/topology.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/topology.js +19 -0
- package/dist/lib/workspace/surfaces/topology.js.map +1 -0
- package/dist/lib/workspace/surfaces/training.d.ts +16 -0
- package/dist/lib/workspace/surfaces/training.d.ts.map +1 -0
- package/dist/lib/workspace/surfaces/training.js +22 -0
- package/dist/lib/workspace/surfaces/training.js.map +1 -0
- package/dist/lib/workspace/tmux-adapter.d.ts +27 -0
- package/dist/lib/workspace/tmux-adapter.d.ts.map +1 -0
- package/dist/lib/workspace/tmux-adapter.js +106 -0
- package/dist/lib/workspace/tmux-adapter.js.map +1 -0
- package/dist/mcp/context-hub-mcp.js +7 -24
- package/dist/mcp/context-hub-mcp.js.map +1 -1
- package/dist/types/flows.d.ts +2 -0
- package/dist/types/flows.d.ts.map +1 -1
- package/dist/types/ide.d.ts +49 -0
- package/dist/types/ide.d.ts.map +1 -0
- package/dist/types/ide.js +5 -0
- package/dist/types/ide.js.map +1 -0
- package/dist/types/platform-digest.d.ts +228 -0
- package/dist/types/platform-digest.d.ts.map +1 -0
- package/dist/types/platform-digest.js +5 -0
- package/dist/types/platform-digest.js.map +1 -0
- package/dist/types/telemetry-digest.d.ts +2 -0
- package/dist/types/telemetry-digest.d.ts.map +1 -1
- package/dist/utils/ensure-project.d.ts +1 -0
- package/dist/utils/ensure-project.d.ts.map +1 -1
- package/dist/utils/ensure-project.js +19 -7
- package/dist/utils/ensure-project.js.map +1 -1
- package/dist/utils/jfl-config.d.ts +1 -0
- package/dist/utils/jfl-config.d.ts.map +1 -1
- package/dist/utils/jfl-config.js +19 -1
- package/dist/utils/jfl-config.js.map +1 -1
- package/dist/utils/jfl-paths.d.ts +5 -0
- package/dist/utils/jfl-paths.d.ts.map +1 -1
- package/dist/utils/jfl-paths.js +25 -3
- package/dist/utils/jfl-paths.js.map +1 -1
- package/package.json +3 -2
- package/packages/pi/AGENTS.md +112 -0
- package/packages/pi/extensions/agent-grid.ts +191 -0
- package/packages/pi/extensions/agent-names.ts +178 -0
- package/packages/pi/extensions/autoresearch.ts +427 -0
- package/packages/pi/extensions/bookmarks.ts +85 -0
- package/packages/pi/extensions/context.ts +184 -0
- package/packages/pi/extensions/crm-tool.ts +61 -0
- package/packages/pi/extensions/eval-tool.ts +224 -0
- package/packages/pi/extensions/eval.ts +60 -0
- package/packages/pi/extensions/footer.ts +239 -0
- package/packages/pi/extensions/hub-resolver.ts +63 -0
- package/packages/pi/extensions/hud-tool.ts +145 -0
- package/packages/pi/extensions/index.ts +405 -0
- package/packages/pi/extensions/journal.ts +224 -0
- package/packages/pi/extensions/map-bridge.ts +178 -0
- package/packages/pi/extensions/memory-tool.ts +73 -0
- package/packages/pi/extensions/notifications.ts +73 -0
- package/packages/pi/extensions/peter-parker.ts +202 -0
- package/packages/pi/extensions/policy-head-tool.ts +276 -0
- package/packages/pi/extensions/portfolio-bridge.ts +90 -0
- package/packages/pi/extensions/session.ts +142 -0
- package/packages/pi/extensions/shortcuts.ts +259 -0
- package/packages/pi/extensions/stratus-bridge.ts +115 -0
- package/packages/pi/extensions/synopsis-tool.ts +83 -0
- package/packages/pi/extensions/tool-renderers.ts +353 -0
- package/packages/pi/extensions/training-buffer-tool.ts +368 -0
- package/packages/pi/extensions/types.ts +163 -0
- package/packages/pi/package-lock.json +346 -0
- package/packages/pi/package.json +44 -0
- package/packages/pi/skills/agent-browser/SKILL.md +116 -0
- package/packages/pi/skills/brand-architect/SKILL.md +240 -0
- package/packages/pi/skills/brand-architect/config.yaml +137 -0
- package/packages/pi/skills/campaign-hud/config.yaml +112 -0
- package/packages/pi/skills/content-creator/SKILL.md +294 -0
- package/packages/pi/skills/context/SKILL.md +65 -0
- package/packages/pi/skills/debug/MULTI_AGENT.md +360 -0
- package/packages/pi/skills/debug/SKILL.md +554 -0
- package/packages/pi/skills/end/SKILL.md +1782 -0
- package/packages/pi/skills/eval/SKILL.md +75 -0
- package/packages/pi/skills/fly-deploy/SKILL.md +676 -0
- package/packages/pi/skills/founder-video/SKILL.md +467 -0
- package/packages/pi/skills/hud/SKILL.md +160 -0
- package/packages/pi/skills/orchestrate/SKILL.md +74 -0
- package/packages/pi/skills/pi-agents/SKILL.md +78 -0
- package/packages/pi/skills/react-best-practices/AGENTS.md +2249 -0
- package/packages/pi/skills/react-best-practices/README.md +123 -0
- package/packages/pi/skills/react-best-practices/SKILL.md +125 -0
- package/packages/pi/skills/react-best-practices/metadata.json +15 -0
- package/packages/pi/skills/react-best-practices/rules/_sections.md +46 -0
- package/packages/pi/skills/react-best-practices/rules/_template.md +28 -0
- package/packages/pi/skills/react-best-practices/rules/advanced-event-handler-refs.md +55 -0
- package/packages/pi/skills/react-best-practices/rules/advanced-use-latest.md +49 -0
- package/packages/pi/skills/react-best-practices/rules/async-api-routes.md +38 -0
- package/packages/pi/skills/react-best-practices/rules/async-defer-await.md +80 -0
- package/packages/pi/skills/react-best-practices/rules/async-dependencies.md +36 -0
- package/packages/pi/skills/react-best-practices/rules/async-parallel.md +28 -0
- package/packages/pi/skills/react-best-practices/rules/async-suspense-boundaries.md +99 -0
- package/packages/pi/skills/react-best-practices/rules/bundle-barrel-imports.md +59 -0
- package/packages/pi/skills/react-best-practices/rules/bundle-conditional.md +31 -0
- package/packages/pi/skills/react-best-practices/rules/bundle-defer-third-party.md +49 -0
- package/packages/pi/skills/react-best-practices/rules/bundle-dynamic-imports.md +35 -0
- package/packages/pi/skills/react-best-practices/rules/bundle-preload.md +50 -0
- package/packages/pi/skills/react-best-practices/rules/client-event-listeners.md +74 -0
- package/packages/pi/skills/react-best-practices/rules/client-swr-dedup.md +56 -0
- package/packages/pi/skills/react-best-practices/rules/js-batch-dom-css.md +82 -0
- package/packages/pi/skills/react-best-practices/rules/js-cache-function-results.md +80 -0
- package/packages/pi/skills/react-best-practices/rules/js-cache-property-access.md +28 -0
- package/packages/pi/skills/react-best-practices/rules/js-cache-storage.md +70 -0
- package/packages/pi/skills/react-best-practices/rules/js-combine-iterations.md +32 -0
- package/packages/pi/skills/react-best-practices/rules/js-early-exit.md +50 -0
- package/packages/pi/skills/react-best-practices/rules/js-hoist-regexp.md +45 -0
- package/packages/pi/skills/react-best-practices/rules/js-index-maps.md +37 -0
- package/packages/pi/skills/react-best-practices/rules/js-length-check-first.md +49 -0
- package/packages/pi/skills/react-best-practices/rules/js-min-max-loop.md +82 -0
- package/packages/pi/skills/react-best-practices/rules/js-set-map-lookups.md +24 -0
- package/packages/pi/skills/react-best-practices/rules/js-tosorted-immutable.md +57 -0
- package/packages/pi/skills/react-best-practices/rules/rendering-activity.md +26 -0
- package/packages/pi/skills/react-best-practices/rules/rendering-animate-svg-wrapper.md +47 -0
- package/packages/pi/skills/react-best-practices/rules/rendering-conditional-render.md +40 -0
- package/packages/pi/skills/react-best-practices/rules/rendering-content-visibility.md +38 -0
- package/packages/pi/skills/react-best-practices/rules/rendering-hoist-jsx.md +46 -0
- package/packages/pi/skills/react-best-practices/rules/rendering-hydration-no-flicker.md +82 -0
- package/packages/pi/skills/react-best-practices/rules/rendering-svg-precision.md +28 -0
- package/packages/pi/skills/react-best-practices/rules/rerender-defer-reads.md +39 -0
- package/packages/pi/skills/react-best-practices/rules/rerender-dependencies.md +45 -0
- package/packages/pi/skills/react-best-practices/rules/rerender-derived-state.md +29 -0
- package/packages/pi/skills/react-best-practices/rules/rerender-functional-setstate.md +74 -0
- package/packages/pi/skills/react-best-practices/rules/rerender-lazy-state-init.md +58 -0
- package/packages/pi/skills/react-best-practices/rules/rerender-memo.md +44 -0
- package/packages/pi/skills/react-best-practices/rules/rerender-transitions.md +40 -0
- package/packages/pi/skills/react-best-practices/rules/server-after-nonblocking.md +73 -0
- package/packages/pi/skills/react-best-practices/rules/server-cache-lru.md +41 -0
- package/packages/pi/skills/react-best-practices/rules/server-cache-react.md +26 -0
- package/packages/pi/skills/react-best-practices/rules/server-parallel-fetching.md +79 -0
- package/packages/pi/skills/react-best-practices/rules/server-serialization.md +38 -0
- package/packages/pi/skills/remotion-best-practices/SKILL.md +43 -0
- package/packages/pi/skills/remotion-best-practices/rules/3d.md +86 -0
- package/packages/pi/skills/remotion-best-practices/rules/animations.md +29 -0
- package/packages/pi/skills/remotion-best-practices/rules/assets/charts-bar-chart.tsx +173 -0
- package/packages/pi/skills/remotion-best-practices/rules/assets/text-animations-typewriter.tsx +100 -0
- package/packages/pi/skills/remotion-best-practices/rules/assets/text-animations-word-highlight.tsx +108 -0
- package/packages/pi/skills/remotion-best-practices/rules/assets.md +78 -0
- package/packages/pi/skills/remotion-best-practices/rules/audio.md +172 -0
- package/packages/pi/skills/remotion-best-practices/rules/calculate-metadata.md +104 -0
- package/packages/pi/skills/remotion-best-practices/rules/can-decode.md +75 -0
- package/packages/pi/skills/remotion-best-practices/rules/charts.md +58 -0
- package/packages/pi/skills/remotion-best-practices/rules/compositions.md +146 -0
- package/packages/pi/skills/remotion-best-practices/rules/display-captions.md +126 -0
- package/packages/pi/skills/remotion-best-practices/rules/extract-frames.md +229 -0
- package/packages/pi/skills/remotion-best-practices/rules/fonts.md +152 -0
- package/packages/pi/skills/remotion-best-practices/rules/get-audio-duration.md +58 -0
- package/packages/pi/skills/remotion-best-practices/rules/get-video-dimensions.md +68 -0
- package/packages/pi/skills/remotion-best-practices/rules/get-video-duration.md +58 -0
- package/packages/pi/skills/remotion-best-practices/rules/gifs.md +138 -0
- package/packages/pi/skills/remotion-best-practices/rules/images.md +130 -0
- package/packages/pi/skills/remotion-best-practices/rules/import-srt-captions.md +67 -0
- package/packages/pi/skills/remotion-best-practices/rules/lottie.md +68 -0
- package/packages/pi/skills/remotion-best-practices/rules/measuring-dom-nodes.md +35 -0
- package/packages/pi/skills/remotion-best-practices/rules/measuring-text.md +143 -0
- package/packages/pi/skills/remotion-best-practices/rules/sequencing.md +106 -0
- package/packages/pi/skills/remotion-best-practices/rules/tailwind.md +11 -0
- package/packages/pi/skills/remotion-best-practices/rules/text-animations.md +20 -0
- package/packages/pi/skills/remotion-best-practices/rules/timing.md +179 -0
- package/packages/pi/skills/remotion-best-practices/rules/transcribe-captions.md +19 -0
- package/packages/pi/skills/remotion-best-practices/rules/transitions.md +122 -0
- package/packages/pi/skills/remotion-best-practices/rules/trimming.md +53 -0
- package/packages/pi/skills/remotion-best-practices/rules/videos.md +171 -0
- package/packages/pi/skills/search/SKILL.md +220 -0
- package/packages/pi/skills/spec/SKILL.md +377 -0
- package/packages/pi/skills/startup/SKILL.md +315 -0
- package/packages/pi/skills/web-architect/SKILL.md +309 -0
- package/packages/pi/skills/x-algorithm/SKILL.md +305 -0
- package/packages/pi/teams/dev-team.yaml +63 -0
- package/packages/pi/teams/gtm-team.yaml +79 -0
- package/packages/pi/themes/jfl.theme.json +76 -0
- package/packages/pi/tsconfig.json +21 -0
- package/scripts/collect-tuples.sh +124 -0
- package/scripts/destroy-fleet.sh +37 -0
- package/scripts/jfl-ide.sh +48 -0
- package/scripts/session/session-cleanup.sh +4 -11
- package/scripts/session/session-init.sh +6 -0
- package/scripts/session/session-sync.sh +25 -0
- package/scripts/setup-branch-protection.sh +106 -0
- package/scripts/spawn-fleet.sh +144 -0
- package/scripts/train/requirements.txt +5 -0
- package/scripts/train/train-policy-head.py +477 -0
- package/scripts/train/v2/dataset.py +81 -0
- package/scripts/train/v2/domain.json +18 -0
- package/scripts/train/v2/eval.py +196 -0
- package/scripts/train/v2/generate_data.py +219 -0
- package/scripts/train/v2/infer.py +188 -0
- package/scripts/train/v2/model.py +112 -0
- package/scripts/train/v2/precompute.py +132 -0
- package/scripts/train/v2/train.py +302 -0
- package/scripts/train/v2/transform_buffer.py +227 -0
- package/scripts/train/v2/validate_data.py +115 -0
- package/scripts/train-policy-head.py +434 -0
- package/scripts/vm-swarm/README.md +301 -0
- package/scripts/vm-swarm/collect-tuples.sh +331 -0
- package/scripts/vm-swarm/create-base-template.sh +339 -0
- package/scripts/vm-swarm/kill-fleet.sh +204 -0
- package/scripts/vm-swarm/monitor-fleet.sh +346 -0
- package/scripts/vm-swarm/spawn-fleet.sh +304 -0
- package/template/.claude/settings.json +2 -15
- package/template/.github/workflows/jfl-eval.yml +6 -1
- package/template/.github/workflows/jfl-review.yml +4 -0
- package/template/scripts/session/session-cleanup.sh +2 -11
- package/template/scripts/session/session-end-hub.sh +72 -0
- package/template/scripts/session/session-end.sh +69 -6
- package/template/scripts/session/session-init.sh +55 -30
- package/template/scripts/session/session-lock.sh +464 -0
- package/template/scripts/session/session-start-hub.sh +105 -0
- package/template/templates/service-agent/workflows/jfl-eval.yml +19 -0
- package/dist/dashboard-static/assets/index-B6kRK9Rq.js +0 -116
- package/dist/dashboard-static/assets/index-BpdKJPLu.css +0 -1
|
@@ -0,0 +1,112 @@
|
|
|
1
|
+
"""
|
|
2
|
+
v2 Policy Head — Transformer-based action selector.
|
|
3
|
+
|
|
4
|
+
Architecture from Drew's Stratus tutorial:
|
|
5
|
+
(current_state_emb, goal_emb) -> state_proj + goal_proj -> fusion -> TransformerEncoder -> classifier -> action logits
|
|
6
|
+
|
|
7
|
+
~8.7M params, ~17MB checkpoint. Replaces v1 MLP reward predictor.
|
|
8
|
+
"""
|
|
9
|
+
|
|
10
|
+
import torch
|
|
11
|
+
import torch.nn as nn
|
|
12
|
+
import torch.nn.functional as F
|
|
13
|
+
|
|
14
|
+
|
|
15
|
+
class PolicyHead(nn.Module):
    """Transformer-based classifier that scores tools for a (state, goal) pair.

    Pipeline: each embedding is linearly projected to ``hidden_dim``, the two
    projections are concatenated and fused back down to ``hidden_dim``, the
    fused vector is run through a ``TransformerEncoder`` as a length-1
    sequence, layer-normalised, and finally mapped to ``num_tools`` logits.

    Args:
        embedding_dim: Size of the last dimension of both input embeddings.
        hidden_dim: Width of the projections, the transformer (``d_model``)
            and the classifier's hidden layer. The feed-forward width inside
            each encoder layer is ``hidden_dim * 4``.
        num_tools: Number of output classes (logits per example).
        num_layers: Number of stacked encoder layers.
        num_heads: Attention heads per encoder layer.
        dropout: Dropout probability used in the fusion block, the encoder
            layers and the classifier.
    """

    def __init__(
        self,
        embedding_dim: int = 768,
        hidden_dim: int = 512,
        num_tools: int = 12,
        num_layers: int = 4,
        num_heads: int = 8,
        dropout: float = 0.1,
    ):
        super().__init__()

        self.embedding_dim = embedding_dim
        self.hidden_dim = hidden_dim
        self.num_tools = num_tools

        # Separate projections so state and goal get their own learned mapping.
        self.state_proj = nn.Linear(embedding_dim, hidden_dim)
        self.goal_proj = nn.Linear(embedding_dim, hidden_dim)

        # Concatenated (state, goal) -> single hidden_dim vector.
        self.fusion = nn.Sequential(
            nn.Linear(hidden_dim * 2, hidden_dim),
            nn.GELU(),
            nn.Dropout(dropout),
        )

        encoder_layer = nn.TransformerEncoderLayer(
            d_model=hidden_dim,
            nhead=num_heads,
            dim_feedforward=hidden_dim * 4,
            dropout=dropout,
            activation="gelu",
            batch_first=True,
        )
        self.transformer = nn.TransformerEncoder(
            encoder_layer,
            num_layers=num_layers,
        )

        self.norm = nn.LayerNorm(hidden_dim)
        self.classifier = nn.Sequential(
            nn.Linear(hidden_dim, hidden_dim),
            nn.GELU(),
            nn.Dropout(dropout),
            nn.Linear(hidden_dim, num_tools),
        )

        self._init_weights()

    def _init_weights(self):
        """Re-initialise every Linear and LayerNorm found via ``self.modules()``.

        Linear weights get Xavier-uniform init with zero bias; LayerNorm gets
        unit weight and zero bias. Because ``self.modules()`` recurses, this
        also covers Linear/LayerNorm submodules nested in the encoder layers.
        """
        for module in self.modules():
            if isinstance(module, nn.Linear):
                nn.init.xavier_uniform_(module.weight)
                if module.bias is not None:
                    nn.init.zeros_(module.bias)
            elif isinstance(module, nn.LayerNorm):
                nn.init.ones_(module.weight)
                nn.init.zeros_(module.bias)

    def forward(
        self,
        current_state_emb: torch.Tensor,
        goal_state_emb: torch.Tensor,
    ) -> torch.Tensor:
        """Compute unnormalised tool logits.

        Args:
            current_state_emb: Tensor whose last dimension is
                ``embedding_dim``; the ``unsqueeze(1)`` below together with
                ``batch_first=True`` means a ``(batch, embedding_dim)`` input
                is expected.
            goal_state_emb: Tensor with the same shape as
                ``current_state_emb``.

        Returns:
            Logits with last dimension ``num_tools``.
        """
        state_h = self.state_proj(current_state_emb)
        goal_h = self.goal_proj(goal_state_emb)

        fused = self.fusion(torch.cat([state_h, goal_h], dim=-1))

        # The encoder wants a sequence axis; feed the fused vector as a
        # single-token sequence and drop the axis again afterwards.
        x = fused.unsqueeze(1)
        x = self.transformer(x)
        x = x.squeeze(1)

        x = self.norm(x)
        logits = self.classifier(x)

        return logits

    def predict(
        self,
        current_state_emb: torch.Tensor,
        goal_state_emb: torch.Tensor,
        top_k: int = 3,
    ) -> dict:
        """Run inference and return softmax probabilities plus the top-k tools.

        The forward pass runs in eval mode with gradients disabled. The
        train/eval flag of every submodule is restored afterwards, so calling
        this in the middle of a training loop does not leave dropout switched
        off for the following training steps.

        Args:
            current_state_emb: Same as in ``forward``.
            goal_state_emb: Same as in ``forward``.
            top_k: How many highest-probability tools to return; capped at
                ``num_tools``.

        Returns:
            Dict with ``"top_k_indices"`` and ``"top_k_probs"`` (both from
            ``torch.topk`` over the last dimension) and ``"all_probs"`` (the
            full softmax distribution).
        """
        # Snapshot per-module flags rather than a single bool so that a
        # caller who deliberately froze some submodule in eval mode gets
        # exactly that configuration back.
        previous_modes = [(module, module.training) for module in self.modules()]
        self.eval()
        try:
            with torch.no_grad():
                # Call the module (not .forward) so registered hooks still run.
                logits = self(current_state_emb, goal_state_emb)
                probs = F.softmax(logits, dim=-1)
                top_probs, top_indices = torch.topk(
                    probs, k=min(top_k, self.num_tools), dim=-1
                )
        finally:
            for module, was_training in previous_modes:
                module.training = was_training

        return {
            "top_k_indices": top_indices,
            "top_k_probs": top_probs,
            "all_probs": probs,
        }

    @property
    def num_parameters(self) -> int:
        """Total element count of all parameters with ``requires_grad=True``."""
        return sum(p.numel() for p in self.parameters() if p.requires_grad)
|
|
@@ -0,0 +1,132 @@
|
|
|
1
|
+
"""
|
|
2
|
+
Pre-compute Stratus embeddings for all unique texts in v2 training data.
|
|
3
|
+
Caches embeddings as .npz files to avoid re-computation during training.
|
|
4
|
+
"""
|
|
5
|
+
|
|
6
|
+
import json
|
|
7
|
+
import os
|
|
8
|
+
import sys
|
|
9
|
+
import argparse
|
|
10
|
+
import numpy as np
|
|
11
|
+
|
|
12
|
+
def get_stratus_embedder(api_url: str, api_key: str):
    """Return a function that embeds a batch of texts via the Stratus HTTP API.

    Args:
        api_url: Base URL of the API; trailing slashes are ignored.
        api_key: Bearer token sent in the ``Authorization`` header.

    Returns:
        ``embed_batch(texts)`` which POSTs ``texts`` to ``<api_url>/v1/embeddings``
        and returns one embedding (list of floats) per input text.
    """
    # Kept function-local, as in the original, so importing this module does
    # not require ``requests``.
    import requests

    # A base URL ending in "/" would otherwise produce ".../​/v1/embeddings".
    base_url = api_url.rstrip("/")
    endpoint = f"{base_url}/v1/embeddings"
    headers = {
        "Authorization": f"Bearer {api_key}",
        "Content-Type": "application/json",
    }

    def embed_batch(texts: list[str]) -> list[list[float]]:
        """Embed ``texts`` with one request.

        Raises:
            requests.HTTPError: On a non-2xx response (via ``raise_for_status``).
            ValueError: If the response does not contain exactly one embedding
                per input text.
        """
        response = requests.post(
            endpoint,
            headers=headers,
            json={
                "model": "stratus-x1ac-base",
                "input": texts,
            },
            timeout=30,
        )
        response.raise_for_status()
        data = response.json()
        vectors = [d["embedding"] for d in data["data"]]
        # Callers pair texts and vectors positionally; a short or long response
        # would silently drop or misalign entries, so fail loudly instead.
        if len(vectors) != len(texts):
            raise ValueError(
                f"Embedding API returned {len(vectors)} embeddings for {len(texts)} texts"
            )
        return vectors

    return embed_batch
|
|
33
|
+
|
|
34
|
+
def collect_unique_texts(data_path: str) -> tuple[list[str], list[str]]:
    """Collect the distinct state and goal texts from a JSONL file.

    Each non-blank line is parsed as a JSON object and must contain the keys
    ``"current_state"`` and ``"goal"``.

    Args:
        data_path: Path to the JSONL file.

    Returns:
        ``(states, goals)`` - two sorted lists of unique values.

    Raises:
        json.JSONDecodeError: If a non-blank line is not valid JSON.
        KeyError: If a record lacks ``current_state`` or ``goal``.
    """
    states = set()
    goals = set()

    # JSON text is UTF-8; do not depend on the platform's default codec.
    with open(data_path, encoding="utf-8") as f:
        for line in f:
            line = line.strip()
            if not line:
                continue  # tolerate blank lines between records
            ex = json.loads(line)
            states.add(ex["current_state"])
            goals.add(ex["goal"])

    return sorted(states), sorted(goals)
|
|
48
|
+
|
|
49
|
+
def precompute_embeddings(
    data_dir: str,
    api_url: str,
    api_key: str,
    batch_size: int = 32,
):
    """Embed every unique state/goal text under ``data_dir`` and cache the result.

    Reads ``train.jsonl``, ``val.jsonl`` and ``test.jsonl`` (missing splits are
    skipped), embeds the union of their texts in batches, and writes
    ``embeddings_cache.npz`` and ``text_to_idx.json`` into ``data_dir``.
    A batch whose request raises is reported and left out of the cache.

    Args:
        data_dir: Directory holding the JSONL splits; outputs are written here.
        api_url: Base URL passed to the embedder factory.
        api_key: API key passed to the embedder factory.
        batch_size: Number of texts sent per embedding request.

    Returns:
        ``(text_to_idx, embeddings_matrix)`` - the text -> row mapping and the
        float32 array of embeddings in that row order.
    """
    embed = get_stratus_embedder(api_url, api_key)

    state_texts = set()
    goal_texts = set()
    for split in ("train", "val", "test"):
        split_path = os.path.join(data_dir, f"{split}.jsonl")
        if os.path.exists(split_path):
            split_states, split_goals = collect_unique_texts(split_path)
            state_texts.update(split_states)
            goal_texts.update(split_goals)
        else:
            print(f" Skipping {split} (file not found)")

    # A text used both as state and goal is embedded once.
    unique_texts = sorted(state_texts | goal_texts)
    total = len(unique_texts)
    print(f"Unique texts to embed: {total} ({len(state_texts)} states, {len(goal_texts)} goals)")

    vectors_by_text = {}
    for start in range(0, total, batch_size):
        chunk = unique_texts[start : start + batch_size]
        try:
            vectors = embed(chunk)
            for text, vector in zip(chunk, vectors):
                vectors_by_text[text] = vector
        except Exception as e:
            # Best effort: report the failed batch and move on to the next one.
            print(f" Error embedding batch {start}-{start + len(chunk)}: {e}")
        else:
            print(f" Embedded {min(start + batch_size, total)}/{total} texts")

    # Row order is the sorted order of the texts that were actually embedded.
    ordered_texts = sorted(vectors_by_text)
    text_to_idx = {text: row for row, text in enumerate(ordered_texts)}
    rows = [vectors_by_text[text] for text in ordered_texts]
    embeddings_matrix = np.array(rows, dtype=np.float32)

    cache_path = os.path.join(data_dir, "embeddings_cache.npz")
    np.savez(
        cache_path,
        embeddings=embeddings_matrix,
        texts=np.array(ordered_texts, dtype=object),
    )
    print(f"Saved embedding cache: {cache_path} ({embeddings_matrix.shape})")

    index_path = os.path.join(data_dir, "text_to_idx.json")
    with open(index_path, "w") as f:
        json.dump(text_to_idx, f)
    print(f"Saved text index: {index_path} ({len(text_to_idx)} entries)")

    return text_to_idx, embeddings_matrix
|
|
104
|
+
|
|
105
|
+
|
|
106
|
+
def main():
    """CLI entry point: validate the environment, then pre-compute embeddings.

    Reads ``STRATUS_API_URL`` (default ``https://api.stratus.run``) and
    ``STRATUS_API_KEY`` from the environment. Exits with status 1 when the key
    is unset/empty or the data directory does not exist.
    """
    cli = argparse.ArgumentParser(description="Pre-compute Stratus embeddings for v2 training data")
    cli.add_argument("--data-dir", default=".jfl/v2-data", help="Directory with train/val/test JSONL files")
    cli.add_argument("--batch-size", type=int, default=32, help="Embedding batch size")
    args = cli.parse_args()

    env = os.environ
    api_url = env.get("STRATUS_API_URL", "https://api.stratus.run")
    api_key = env.get("STRATUS_API_KEY", "")

    # Check the key first, then the directory; report the first problem only.
    problem = None
    if not api_key:
        problem = "STRATUS_API_KEY not set"
    elif not os.path.exists(args.data_dir):
        problem = f"Data directory not found: {args.data_dir}"
    if problem is not None:
        print(problem)
        sys.exit(1)

    precompute_embeddings(
        data_dir=args.data_dir,
        api_url=api_url,
        api_key=api_key,
        batch_size=args.batch_size,
    )
|
|
129
|
+
|
|
130
|
+
|
|
131
|
+
if __name__ == "__main__":
    # Run the CLI only when executed as a script, not when imported.
    main()
|
|
@@ -0,0 +1,302 @@
|
|
|
1
|
+
"""
|
|
2
|
+
v2 Policy Head Training Loop.
|
|
3
|
+
|
|
4
|
+
CrossEntropyLoss with label smoothing, cosine annealing with warmup,
|
|
5
|
+
early stopping. Produces .pt checkpoint with model weights, config, and tool index.
|
|
6
|
+
"""
|
|
7
|
+
|
|
8
|
+
import json
|
|
9
|
+
import os
|
|
10
|
+
import sys
|
|
11
|
+
import time
|
|
12
|
+
import math
|
|
13
|
+
import argparse
|
|
14
|
+
|
|
15
|
+
import numpy as np
|
|
16
|
+
import torch
|
|
17
|
+
import torch.nn as nn
|
|
18
|
+
import torch.optim as optim
|
|
19
|
+
from torch.utils.data import DataLoader
|
|
20
|
+
|
|
21
|
+
from model import PolicyHead
|
|
22
|
+
from dataset import PolicyHeadDataset, load_embedding_cache
|
|
23
|
+
|
|
24
|
+
|
|
25
|
+
def load_tool_index(domain_path: str) -> dict[str, int]:
    """Map each tool name in a domain file to its position in the ``tools`` list.

    Args:
        domain_path: Path to a JSON file with a top-level ``"tools"`` list whose
            items each have a ``"name"`` key.

    Returns:
        ``{tool_name: index}`` where ``index`` is the tool's position in the list.

    Raises:
        KeyError: If ``"tools"`` or a tool's ``"name"`` is missing.
    """
    # JSON is UTF-8 by specification; do not rely on the platform default codec.
    with open(domain_path, encoding="utf-8") as f:
        domain = json.load(f)
    return {tool["name"]: i for i, tool in enumerate(domain["tools"])}
|
|
29
|
+
|
|
30
|
+
|
|
31
|
+
def get_lr_scheduler(optimizer, warmup_steps: int, total_steps: int):
    """Create a ``LambdaLR`` with linear warmup followed by cosine decay to zero.

    The multiplier rises linearly from 0 to 1 over ``warmup_steps`` scheduler
    steps, then follows half a cosine from 1 down to 0 at ``total_steps``.
    Steps beyond ``total_steps`` keep the multiplier at 0.

    Args:
        optimizer: Optimizer whose learning rate is scaled.
        warmup_steps: Number of warmup steps.
        total_steps: Step at which the multiplier reaches 0.

    Returns:
        The configured ``torch.optim.lr_scheduler.LambdaLR``.
    """
    # Guard against division by zero when total_steps <= warmup_steps.
    decay_steps = max(1, total_steps - warmup_steps)

    def lr_lambda(step):
        if step < warmup_steps:
            return float(step) / float(max(1, warmup_steps))
        # Clamp to 1.0: without it the cosine turns upward again once step
        # exceeds total_steps and the learning rate climbs back toward its peak.
        progress = min(1.0, float(step - warmup_steps) / float(decay_steps))
        return max(0.0, 0.5 * (1.0 + math.cos(progress * math.pi)))

    return optim.lr_scheduler.LambdaLR(optimizer, lr_lambda)
|
|
39
|
+
|
|
40
|
+
|
|
41
|
+
def train_epoch(model, dataloader, criterion, optimizer, scheduler, device):
    """Run one optimisation pass over ``dataloader``.

    Every batch is a mapping with ``"state_emb"``, ``"goal_emb"`` and
    ``"label"`` entries. For each batch: forward, loss, backward, gradient-norm
    clipping at 1.0, optimizer step, scheduler step (the scheduler advances
    per batch, not per epoch).

    Returns:
        ``(mean_loss, accuracy)`` over all examples seen; ``(0.0, 0.0)`` when
        the dataloader yields nothing.
    """
    model.train()
    loss_sum = 0.0
    num_correct = 0
    num_seen = 0

    for batch in dataloader:
        states = batch["state_emb"].to(device)
        goals = batch["goal_emb"].to(device)
        targets = batch["label"].to(device)

        optimizer.zero_grad()
        logits = model(states, goals)
        loss = criterion(logits, targets)
        loss.backward()

        torch.nn.utils.clip_grad_norm_(model.parameters(), max_norm=1.0)
        optimizer.step()
        scheduler.step()

        # Weight the batch loss by its size so the epoch mean is per-example.
        batch_count = targets.size(0)
        loss_sum += loss.item() * batch_count
        num_correct += (logits.argmax(dim=-1) == targets).sum().item()
        num_seen += batch_count

    denominator = max(num_seen, 1)  # avoids dividing by zero on an empty loader
    return loss_sum / denominator, num_correct / denominator
|
|
68
|
+
|
|
69
|
+
|
|
70
|
+
@torch.no_grad()
def evaluate(model, dataloader, criterion, device):
    """Score ``model`` on ``dataloader`` without tracking gradients.

    Puts the model in eval mode and reads ``"state_emb"``, ``"goal_emb"`` and
    ``"label"`` from every batch.

    Returns:
        ``(mean_loss, accuracy)`` over all examples seen; ``(0.0, 0.0)`` when
        the dataloader yields nothing.
    """
    model.eval()
    loss_sum = 0.0
    num_correct = 0
    num_seen = 0

    for batch in dataloader:
        states = batch["state_emb"].to(device)
        goals = batch["goal_emb"].to(device)
        targets = batch["label"].to(device)

        logits = model(states, goals)
        batch_loss = criterion(logits, targets).item()

        # Weight the batch loss by its size so the final mean is per-example.
        batch_count = targets.size(0)
        loss_sum += batch_loss * batch_count
        num_correct += (logits.argmax(dim=-1) == targets).sum().item()
        num_seen += batch_count

    denominator = max(num_seen, 1)  # avoids dividing by zero on an empty loader
    return loss_sum / denominator, num_correct / denominator
|
|
91
|
+
|
|
92
|
+
|
|
93
|
+
def train(args):
    """Run the full v2 policy-head training job described by ``args``.

    Steps, in order: pick a device (CUDA, then MPS, then CPU); load the tool
    index from ``args.domain``; load the embedding cache and the train/val
    datasets from ``args.data_dir``; build the model, optionally warm-started
    from ``args.warm_start``; train with AdamW, label-smoothed cross entropy
    and a warmup + cosine schedule for at most ``args.epochs`` epochs, stopping
    early after ``args.patience`` epochs without a new best model.

    "Best" means strictly higher validation accuracy when a validation loader
    is available, otherwise strictly lower training loss.

    Files written to ``args.output_dir``:
        best_policy_head.pt: weights, config and tool index of the best epoch.
        policy-head-v2.json: metadata for the TypeScript bridge.

    Args:
        args: Namespace providing ``domain``, ``data_dir``, ``output_dir``,
            ``warm_start``, ``epochs``, ``batch_size``, ``lr``,
            ``weight_decay``, ``warmup_steps``, ``patience``,
            ``label_smoothing``, ``hidden_dim``, ``num_layers``, ``num_heads``
            and ``dropout``.

    Exits the process with status 1 when ``train.jsonl`` is missing.
    """
    # Device
    if torch.cuda.is_available():
        device = "cuda"
    elif hasattr(torch.backends, "mps") and torch.backends.mps.is_available():
        device = "mps"
    else:
        device = "cpu"
    print(f"Device: {device}")

    # Domain
    domain_path = args.domain
    tool_to_index = load_tool_index(domain_path)
    index_to_tool = {v: k for k, v in tool_to_index.items()}
    num_tools = len(tool_to_index)
    print(f"Tools: {num_tools}")

    # Embeddings cache
    embeddings_matrix, text_to_idx = load_embedding_cache(args.data_dir)
    if embeddings_matrix is not None:
        print(f"Embedding cache: {embeddings_matrix.shape[0]} texts, {embeddings_matrix.shape[1]}-dim")
    else:
        print("WARNING: No embedding cache found. Training with zero vectors.")
        print(" Run: python precompute.py --data-dir", args.data_dir)

    # Datasets
    train_path = os.path.join(args.data_dir, "train.jsonl")
    val_path = os.path.join(args.data_dir, "val.jsonl")

    if not os.path.exists(train_path):
        print(f"Training data not found: {train_path}")
        sys.exit(1)

    train_ds = PolicyHeadDataset(train_path, tool_to_index, embeddings_matrix, text_to_idx)
    val_ds = PolicyHeadDataset(val_path, tool_to_index, embeddings_matrix, text_to_idx) if os.path.exists(val_path) else None

    # No worker processes on MPS; otherwise at most four.
    num_workers = 0 if device == "mps" else min(4, os.cpu_count() or 1)
    train_loader = DataLoader(train_ds, batch_size=args.batch_size, shuffle=True, num_workers=num_workers)
    val_loader = DataLoader(val_ds, batch_size=args.batch_size, shuffle=False, num_workers=num_workers) if val_ds else None

    print(f"Train: {len(train_ds)} examples")
    if val_ds:
        print(f"Val: {len(val_ds)} examples")

    # Model
    embedding_dim = embeddings_matrix.shape[1] if embeddings_matrix is not None else 768
    model = PolicyHead(
        embedding_dim=embedding_dim,
        hidden_dim=args.hidden_dim,
        num_tools=num_tools,
        num_layers=args.num_layers,
        num_heads=args.num_heads,
        dropout=args.dropout,
    ).to(device)

    print(f"Parameters: {model.num_parameters:,}")

    # Warm start
    if args.warm_start and os.path.exists(args.warm_start):
        print(f"Warm-starting from: {args.warm_start}")
        state_dict = torch.load(args.warm_start, map_location=device, weights_only=True)
        # Accept both a bare state dict and a full checkpoint wrapping one.
        if "model_state_dict" in state_dict:
            state_dict = state_dict["model_state_dict"]
        # Build the model's own state dict once instead of once per key.
        own_state = model.state_dict()
        # Only tensors whose name and shape match are loaded; the rest keep
        # their fresh initialisation.
        compatible = {
            k: v
            for k, v in state_dict.items()
            if k in own_state and v.shape == own_state[k].shape
        }
        model.load_state_dict(compatible, strict=False)
        print(f" Loaded {len(compatible)}/{len(state_dict)} layers")

    # Loss, optimizer, scheduler
    criterion = nn.CrossEntropyLoss(label_smoothing=args.label_smoothing)
    optimizer = optim.AdamW(
        model.parameters(),
        lr=args.lr,
        weight_decay=args.weight_decay,
    )
    # The scheduler is stepped once per batch, so the horizon is in batches.
    total_steps = len(train_loader) * args.epochs
    scheduler = get_lr_scheduler(optimizer, args.warmup_steps, total_steps)

    # Training loop
    os.makedirs(args.output_dir, exist_ok=True)
    best_val_acc = 0.0
    best_val_loss = float("inf")
    patience_counter = 0

    print(f"\nStarting training for {args.epochs} epochs...")
    print(f"{'Epoch':>5} {'Train Loss':>12} {'Train Acc':>10} {'Val Loss':>10} {'Val Acc':>9} {'LR':>10} {'Time':>8}")
    print("-" * 75)

    for epoch in range(1, args.epochs + 1):
        t0 = time.time()

        train_loss, train_acc = train_epoch(model, train_loader, criterion, optimizer, scheduler, device)

        val_loss, val_acc = (0.0, 0.0)
        if val_loader:
            val_loss, val_acc = evaluate(model, val_loader, criterion, device)

        elapsed = time.time() - t0
        lr = scheduler.get_last_lr()[0]

        print(
            f"{epoch:5d} {train_loss:12.4f} {train_acc:9.1%} {val_loss:10.4f} {val_acc:8.1%} {lr:10.2e} {elapsed:7.1f}s"
        )

        # Save best model
        is_best = False
        if val_loader:
            if val_acc > best_val_acc:
                best_val_acc = val_acc
                best_val_loss = val_loss
                is_best = True
        elif train_loss < best_val_loss:
            # Without validation data the "val" trackers hold training metrics.
            best_val_loss = train_loss
            best_val_acc = train_acc
            is_best = True

        if is_best:
            patience_counter = 0
            checkpoint = {
                "epoch": epoch,
                "model_state_dict": model.state_dict(),
                "val_accuracy": best_val_acc,
                "val_loss": best_val_loss,
                "num_tools": num_tools,
                "tool_to_index": tool_to_index,
                "index_to_tool": index_to_tool,
                "config": {
                    "embedding_dim": embedding_dim,
                    "hidden_dim": args.hidden_dim,
                    "num_layers": args.num_layers,
                    "num_heads": args.num_heads,
                    "dropout": args.dropout,
                },
            }
            ckpt_path = os.path.join(args.output_dir, "best_policy_head.pt")
            torch.save(checkpoint, ckpt_path)
            print(f" ✅ New best model (val_acc={best_val_acc:.1%})")
        else:
            patience_counter += 1

        # Early stopping
        if patience_counter >= args.patience:
            print(f"\n Early stopping at epoch {epoch} (no improvement for {args.patience} epochs)")
            break

    print(f"\nTraining complete. Best val accuracy: {best_val_acc:.1%}")

    ckpt_path = os.path.join(args.output_dir, "best_policy_head.pt")
    if os.path.exists(ckpt_path):
        size_mb = os.path.getsize(ckpt_path) / 1024 / 1024
        print(f"Checkpoint: {ckpt_path} ({size_mb:.1f} MB)")

    # Write metadata for TypeScript bridge
    meta = {
        "version": 2,
        # Derived from the actual configuration; equals
        # "transformer-4layer-512h" for the default --num-layers/--hidden-dim.
        "architecture": f"transformer-{args.num_layers}layer-{args.hidden_dim}h",
        "embedding_dim": embedding_dim,
        "hidden_dim": args.hidden_dim,
        "num_tools": num_tools,
        "num_layers": args.num_layers,
        "num_heads": args.num_heads,
        "trained_at": time.strftime("%Y-%m-%dT%H:%M:%SZ", time.gmtime()),
        "trained_on": len(train_ds),
        "val_accuracy": best_val_acc,
        "val_loss": best_val_loss,
        "device": device,
        "parameters": model.num_parameters,
        "tool_to_index": tool_to_index,
        # JSON object keys must be strings, so the integer indices are stringified.
        "index_to_tool": {str(k): v for k, v in index_to_tool.items()},
        "checkpoint_path": os.path.abspath(ckpt_path),
    }
    meta_path = os.path.join(args.output_dir, "policy-head-v2.json")
    with open(meta_path, "w") as f:
        json.dump(meta, f, indent=2)
    print(f"Metadata: {meta_path}")
|
|
270
|
+
|
|
271
|
+
|
|
272
|
+
def main():
    """CLI entry point: parse options, resolve the domain file, start training.

    When ``--domain`` is omitted, ``domain.json`` next to this script is used.
    Exits with status 1 if the domain file does not exist.
    """
    parser = argparse.ArgumentParser(description="Train v2 policy head (transformer action selector)")

    # Declared as data so each option reads as one row; order is preserved.
    option_specs = (
        ("--data-dir", {"default": ".jfl/v2-data", "help": "Directory with train/val/test JSONL + embeddings"}),
        ("--domain", {"default": None, "help": "Path to domain.json"}),
        ("--output-dir", {"default": ".jfl/checkpoints", "help": "Output directory for checkpoints"}),
        ("--warm-start", {"default": None, "help": "Path to pretrained checkpoint for warm start"}),
        ("--epochs", {"type": int, "default": 50, "help": "Max training epochs"}),
        ("--batch-size", {"type": int, "default": 64, "help": "Batch size"}),
        ("--lr", {"type": float, "default": 3e-4, "help": "Learning rate"}),
        ("--weight-decay", {"type": float, "default": 0.01, "help": "Weight decay"}),
        ("--warmup-steps", {"type": int, "default": 100, "help": "Warmup steps for LR scheduler"}),
        ("--patience", {"type": int, "default": 7, "help": "Early stopping patience"}),
        ("--label-smoothing", {"type": float, "default": 0.1, "help": "Label smoothing for CrossEntropyLoss"}),
        ("--hidden-dim", {"type": int, "default": 512, "help": "Hidden dimension"}),
        ("--num-layers", {"type": int, "default": 4, "help": "Transformer encoder layers"}),
        ("--num-heads", {"type": int, "default": 8, "help": "Attention heads"}),
        ("--dropout", {"type": float, "default": 0.1, "help": "Dropout rate"}),
    )
    for flag, spec in option_specs:
        parser.add_argument(flag, **spec)
    args = parser.parse_args()

    if args.domain is None:
        script_dir = os.path.dirname(os.path.abspath(__file__))
        args.domain = os.path.join(script_dir, "domain.json")

    if not os.path.exists(args.domain):
        print(f"Domain file not found: {args.domain}")
        sys.exit(1)

    train(args)
|
|
299
|
+
|
|
300
|
+
|
|
301
|
+
if __name__ == "__main__":
    # Run the CLI only when executed as a script, not when imported.
    main()
|