jfl 0.4.4 → 0.6.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (533)
  1. package/dist/commands/context-hub.d.ts +1 -0
  2. package/dist/commands/context-hub.d.ts.map +1 -1
  3. package/dist/commands/context-hub.js +1064 -41
  4. package/dist/commands/context-hub.js.map +1 -1
  5. package/dist/commands/eval.d.ts +1 -1
  6. package/dist/commands/eval.d.ts.map +1 -1
  7. package/dist/commands/eval.js +192 -1
  8. package/dist/commands/eval.js.map +1 -1
  9. package/dist/commands/findings.d.ts +6 -0
  10. package/dist/commands/findings.d.ts.map +1 -0
  11. package/dist/commands/findings.js +203 -0
  12. package/dist/commands/findings.js.map +1 -0
  13. package/dist/commands/hud.d.ts.map +1 -1
  14. package/dist/commands/hud.js +47 -9
  15. package/dist/commands/hud.js.map +1 -1
  16. package/dist/commands/ide.d.ts +27 -0
  17. package/dist/commands/ide.d.ts.map +1 -0
  18. package/dist/commands/ide.js +546 -0
  19. package/dist/commands/ide.js.map +1 -0
  20. package/dist/commands/onboard.d.ts.map +1 -1
  21. package/dist/commands/onboard.js +212 -2
  22. package/dist/commands/onboard.js.map +1 -1
  23. package/dist/commands/openclaw.d.ts +3 -0
  24. package/dist/commands/openclaw.d.ts.map +1 -1
  25. package/dist/commands/openclaw.js +76 -2
  26. package/dist/commands/openclaw.js.map +1 -1
  27. package/dist/commands/peter.d.ts +3 -0
  28. package/dist/commands/peter.d.ts.map +1 -1
  29. package/dist/commands/peter.js +1168 -58
  30. package/dist/commands/peter.js.map +1 -1
  31. package/dist/commands/pi-fleet.d.ts +18 -0
  32. package/dist/commands/pi-fleet.d.ts.map +1 -0
  33. package/dist/commands/pi-fleet.js +382 -0
  34. package/dist/commands/pi-fleet.js.map +1 -0
  35. package/dist/commands/pi.d.ts.map +1 -1
  36. package/dist/commands/pi.js +18 -3
  37. package/dist/commands/pi.js.map +1 -1
  38. package/dist/commands/scope.d.ts.map +1 -1
  39. package/dist/commands/scope.js +90 -1
  40. package/dist/commands/scope.js.map +1 -1
  41. package/dist/commands/services.d.ts.map +1 -1
  42. package/dist/commands/services.js +18 -0
  43. package/dist/commands/services.js.map +1 -1
  44. package/dist/commands/setup.d.ts +12 -0
  45. package/dist/commands/setup.d.ts.map +1 -0
  46. package/dist/commands/setup.js +322 -0
  47. package/dist/commands/setup.js.map +1 -0
  48. package/dist/commands/status.d.ts.map +1 -1
  49. package/dist/commands/status.js +22 -4
  50. package/dist/commands/status.js.map +1 -1
  51. package/dist/commands/train.d.ts +33 -0
  52. package/dist/commands/train.d.ts.map +1 -0
  53. package/dist/commands/train.js +510 -0
  54. package/dist/commands/train.js.map +1 -0
  55. package/dist/commands/verify.d.ts +14 -0
  56. package/dist/commands/verify.d.ts.map +1 -0
  57. package/dist/commands/verify.js +276 -0
  58. package/dist/commands/verify.js.map +1 -0
  59. package/dist/commands/viz.d.ts.map +1 -1
  60. package/dist/commands/viz.js +417 -0
  61. package/dist/commands/viz.js.map +1 -1
  62. package/dist/dashboard-static/assets/index-CW9ZxqX8.css +1 -0
  63. package/dist/dashboard-static/assets/index-DNN__p4K.js +121 -0
  64. package/dist/dashboard-static/index.html +2 -2
  65. package/dist/index.js +324 -64
  66. package/dist/index.js.map +1 -1
  67. package/dist/lib/agent-config.d.ts +52 -0
  68. package/dist/lib/agent-config.d.ts.map +1 -0
  69. package/dist/lib/agent-config.js +231 -0
  70. package/dist/lib/agent-config.js.map +1 -0
  71. package/dist/lib/agent-generator.d.ts +10 -0
  72. package/dist/lib/agent-generator.d.ts.map +1 -1
  73. package/dist/lib/agent-generator.js +64 -10
  74. package/dist/lib/agent-generator.js.map +1 -1
  75. package/dist/lib/agent-session.d.ts +104 -0
  76. package/dist/lib/agent-session.d.ts.map +1 -0
  77. package/dist/lib/agent-session.js +635 -0
  78. package/dist/lib/agent-session.js.map +1 -0
  79. package/dist/lib/eval-snapshot.d.ts +47 -0
  80. package/dist/lib/eval-snapshot.d.ts.map +1 -0
  81. package/dist/lib/eval-snapshot.js +315 -0
  82. package/dist/lib/eval-snapshot.js.map +1 -0
  83. package/dist/lib/eval-store.d.ts +5 -0
  84. package/dist/lib/eval-store.d.ts.map +1 -1
  85. package/dist/lib/eval-store.js +33 -3
  86. package/dist/lib/eval-store.js.map +1 -1
  87. package/dist/lib/findings-engine.d.ts +51 -0
  88. package/dist/lib/findings-engine.d.ts.map +1 -0
  89. package/dist/lib/findings-engine.js +338 -0
  90. package/dist/lib/findings-engine.js.map +1 -0
  91. package/dist/lib/flow-engine.d.ts +8 -0
  92. package/dist/lib/flow-engine.d.ts.map +1 -1
  93. package/dist/lib/flow-engine.js +84 -2
  94. package/dist/lib/flow-engine.js.map +1 -1
  95. package/dist/lib/hub-client.d.ts +1 -0
  96. package/dist/lib/hub-client.d.ts.map +1 -1
  97. package/dist/lib/hub-client.js +33 -6
  98. package/dist/lib/hub-client.js.map +1 -1
  99. package/dist/lib/ide-panes.d.ts +58 -0
  100. package/dist/lib/ide-panes.d.ts.map +1 -0
  101. package/dist/lib/ide-panes.js +508 -0
  102. package/dist/lib/ide-panes.js.map +1 -0
  103. package/dist/lib/memory-db.js +4 -4
  104. package/dist/lib/memory-db.js.map +1 -1
  105. package/dist/lib/memory-indexer.d.ts.map +1 -1
  106. package/dist/lib/memory-indexer.js +3 -0
  107. package/dist/lib/memory-indexer.js.map +1 -1
  108. package/dist/lib/memory-search.d.ts +148 -4
  109. package/dist/lib/memory-search.d.ts.map +1 -1
  110. package/dist/lib/memory-search.js +496 -58
  111. package/dist/lib/memory-search.js.map +1 -1
  112. package/dist/lib/meta-orchestrator.d.ts +104 -0
  113. package/dist/lib/meta-orchestrator.d.ts.map +1 -0
  114. package/dist/lib/meta-orchestrator.js +373 -0
  115. package/dist/lib/meta-orchestrator.js.map +1 -0
  116. package/dist/lib/peer-agent-generator.d.ts.map +1 -1
  117. package/dist/lib/peer-agent-generator.js +43 -19
  118. package/dist/lib/peer-agent-generator.js.map +1 -1
  119. package/dist/lib/pi-sky/bridge.d.ts +55 -0
  120. package/dist/lib/pi-sky/bridge.d.ts.map +1 -0
  121. package/dist/lib/pi-sky/bridge.js +264 -0
  122. package/dist/lib/pi-sky/bridge.js.map +1 -0
  123. package/dist/lib/pi-sky/cost-monitor.d.ts +21 -0
  124. package/dist/lib/pi-sky/cost-monitor.d.ts.map +1 -0
  125. package/dist/lib/pi-sky/cost-monitor.js +126 -0
  126. package/dist/lib/pi-sky/cost-monitor.js.map +1 -0
  127. package/dist/lib/pi-sky/eval-sweep.d.ts +27 -0
  128. package/dist/lib/pi-sky/eval-sweep.d.ts.map +1 -0
  129. package/dist/lib/pi-sky/eval-sweep.js +141 -0
  130. package/dist/lib/pi-sky/eval-sweep.js.map +1 -0
  131. package/dist/lib/pi-sky/event-router.d.ts +32 -0
  132. package/dist/lib/pi-sky/event-router.d.ts.map +1 -0
  133. package/dist/lib/pi-sky/event-router.js +176 -0
  134. package/dist/lib/pi-sky/event-router.js.map +1 -0
  135. package/dist/lib/pi-sky/experiment.d.ts +9 -0
  136. package/dist/lib/pi-sky/experiment.d.ts.map +1 -0
  137. package/dist/lib/pi-sky/experiment.js +83 -0
  138. package/dist/lib/pi-sky/experiment.js.map +1 -0
  139. package/dist/lib/pi-sky/index.d.ts +16 -0
  140. package/dist/lib/pi-sky/index.d.ts.map +1 -0
  141. package/dist/lib/pi-sky/index.js +16 -0
  142. package/dist/lib/pi-sky/index.js.map +1 -0
  143. package/dist/lib/pi-sky/stratus-gate.d.ts +28 -0
  144. package/dist/lib/pi-sky/stratus-gate.d.ts.map +1 -0
  145. package/dist/lib/pi-sky/stratus-gate.js +61 -0
  146. package/dist/lib/pi-sky/stratus-gate.js.map +1 -0
  147. package/dist/lib/pi-sky/swarm.d.ts +28 -0
  148. package/dist/lib/pi-sky/swarm.d.ts.map +1 -0
  149. package/dist/lib/pi-sky/swarm.js +208 -0
  150. package/dist/lib/pi-sky/swarm.js.map +1 -0
  151. package/dist/lib/pi-sky/types.d.ts +139 -0
  152. package/dist/lib/pi-sky/types.d.ts.map +1 -0
  153. package/dist/lib/pi-sky/types.js +2 -0
  154. package/dist/lib/pi-sky/types.js.map +1 -0
  155. package/dist/lib/pi-sky/voice-bridge.d.ts +20 -0
  156. package/dist/lib/pi-sky/voice-bridge.d.ts.map +1 -0
  157. package/dist/lib/pi-sky/voice-bridge.js +91 -0
  158. package/dist/lib/pi-sky/voice-bridge.js.map +1 -0
  159. package/dist/lib/policy-head.d.ts +40 -0
  160. package/dist/lib/policy-head.d.ts.map +1 -0
  161. package/dist/lib/policy-head.js +234 -0
  162. package/dist/lib/policy-head.js.map +1 -0
  163. package/dist/lib/predictor.d.ts +10 -0
  164. package/dist/lib/predictor.d.ts.map +1 -1
  165. package/dist/lib/predictor.js +46 -7
  166. package/dist/lib/predictor.js.map +1 -1
  167. package/dist/lib/replay-buffer.d.ts +93 -0
  168. package/dist/lib/replay-buffer.d.ts.map +1 -0
  169. package/dist/lib/replay-buffer.js +302 -0
  170. package/dist/lib/replay-buffer.js.map +1 -0
  171. package/dist/lib/sentinel-rl.d.ts +97 -0
  172. package/dist/lib/sentinel-rl.d.ts.map +1 -0
  173. package/dist/lib/sentinel-rl.js +430 -0
  174. package/dist/lib/sentinel-rl.js.map +1 -0
  175. package/dist/lib/session-lock.d.ts +61 -0
  176. package/dist/lib/session-lock.d.ts.map +1 -0
  177. package/dist/lib/session-lock.js +438 -0
  178. package/dist/lib/session-lock.js.map +1 -0
  179. package/dist/lib/setup/agent-generator.d.ts +18 -0
  180. package/dist/lib/setup/agent-generator.d.ts.map +1 -0
  181. package/dist/lib/setup/agent-generator.js +114 -0
  182. package/dist/lib/setup/agent-generator.js.map +1 -0
  183. package/dist/lib/setup/context-analyzer.d.ts +16 -0
  184. package/dist/lib/setup/context-analyzer.d.ts.map +1 -0
  185. package/dist/lib/setup/context-analyzer.js +112 -0
  186. package/dist/lib/setup/context-analyzer.js.map +1 -0
  187. package/dist/lib/setup/doc-auditor.d.ts +54 -0
  188. package/dist/lib/setup/doc-auditor.d.ts.map +1 -0
  189. package/dist/lib/setup/doc-auditor.js +629 -0
  190. package/dist/lib/setup/doc-auditor.js.map +1 -0
  191. package/dist/lib/setup/domain-generator.d.ts +7 -0
  192. package/dist/lib/setup/domain-generator.d.ts.map +1 -0
  193. package/dist/lib/setup/domain-generator.js +58 -0
  194. package/dist/lib/setup/domain-generator.js.map +1 -0
  195. package/dist/lib/setup/smart-eval-generator.d.ts +38 -0
  196. package/dist/lib/setup/smart-eval-generator.d.ts.map +1 -0
  197. package/dist/lib/setup/smart-eval-generator.js +378 -0
  198. package/dist/lib/setup/smart-eval-generator.js.map +1 -0
  199. package/dist/lib/setup/smart-recommender.d.ts +63 -0
  200. package/dist/lib/setup/smart-recommender.d.ts.map +1 -0
  201. package/dist/lib/setup/smart-recommender.js +329 -0
  202. package/dist/lib/setup/smart-recommender.js.map +1 -0
  203. package/dist/lib/setup/spec-generator.d.ts +63 -0
  204. package/dist/lib/setup/spec-generator.d.ts.map +1 -0
  205. package/dist/lib/setup/spec-generator.js +310 -0
  206. package/dist/lib/setup/spec-generator.js.map +1 -0
  207. package/dist/lib/setup/violation-agent-generator.d.ts +32 -0
  208. package/dist/lib/setup/violation-agent-generator.d.ts.map +1 -0
  209. package/dist/lib/setup/violation-agent-generator.js +255 -0
  210. package/dist/lib/setup/violation-agent-generator.js.map +1 -0
  211. package/dist/lib/stratus-client.d.ts +1 -0
  212. package/dist/lib/stratus-client.d.ts.map +1 -1
  213. package/dist/lib/stratus-client.js +24 -2
  214. package/dist/lib/stratus-client.js.map +1 -1
  215. package/dist/lib/telemetry-agent-v2.d.ts +128 -0
  216. package/dist/lib/telemetry-agent-v2.d.ts.map +1 -0
  217. package/dist/lib/telemetry-agent-v2.js +1042 -0
  218. package/dist/lib/telemetry-agent-v2.js.map +1 -0
  219. package/dist/lib/telemetry-agent.d.ts.map +1 -1
  220. package/dist/lib/telemetry-agent.js +27 -6
  221. package/dist/lib/telemetry-agent.js.map +1 -1
  222. package/dist/lib/telemetry-digest.d.ts.map +1 -1
  223. package/dist/lib/telemetry-digest.js +27 -5
  224. package/dist/lib/telemetry-digest.js.map +1 -1
  225. package/dist/lib/telemetry.d.ts.map +1 -1
  226. package/dist/lib/telemetry.js +29 -4
  227. package/dist/lib/telemetry.js.map +1 -1
  228. package/dist/lib/text-preprocessing.d.ts +83 -0
  229. package/dist/lib/text-preprocessing.d.ts.map +1 -0
  230. package/dist/lib/text-preprocessing.js +261 -0
  231. package/dist/lib/text-preprocessing.js.map +1 -0
  232. package/dist/lib/training-buffer.d.ts +86 -0
  233. package/dist/lib/training-buffer.d.ts.map +1 -0
  234. package/dist/lib/training-buffer.js +139 -0
  235. package/dist/lib/training-buffer.js.map +1 -0
  236. package/dist/lib/tuple-miner.d.ts +30 -0
  237. package/dist/lib/tuple-miner.d.ts.map +1 -0
  238. package/dist/lib/tuple-miner.js +427 -0
  239. package/dist/lib/tuple-miner.js.map +1 -0
  240. package/dist/lib/vm-backend.d.ts +72 -0
  241. package/dist/lib/vm-backend.d.ts.map +1 -0
  242. package/dist/lib/vm-backend.js +175 -0
  243. package/dist/lib/vm-backend.js.map +1 -0
  244. package/dist/lib/workspace/backend.d.ts +53 -0
  245. package/dist/lib/workspace/backend.d.ts.map +1 -0
  246. package/dist/lib/workspace/backend.js +37 -0
  247. package/dist/lib/workspace/backend.js.map +1 -0
  248. package/dist/lib/workspace/cmux-adapter.d.ts +46 -0
  249. package/dist/lib/workspace/cmux-adapter.d.ts.map +1 -0
  250. package/dist/lib/workspace/cmux-adapter.js +261 -0
  251. package/dist/lib/workspace/cmux-adapter.js.map +1 -0
  252. package/dist/lib/workspace/data-pipeline.d.ts +35 -0
  253. package/dist/lib/workspace/data-pipeline.d.ts.map +1 -0
  254. package/dist/lib/workspace/data-pipeline.js +463 -0
  255. package/dist/lib/workspace/data-pipeline.js.map +1 -0
  256. package/dist/lib/workspace/engine.d.ts +64 -0
  257. package/dist/lib/workspace/engine.d.ts.map +1 -0
  258. package/dist/lib/workspace/engine.js +397 -0
  259. package/dist/lib/workspace/engine.js.map +1 -0
  260. package/dist/lib/workspace/notifications.d.ts +14 -0
  261. package/dist/lib/workspace/notifications.d.ts.map +1 -0
  262. package/dist/lib/workspace/notifications.js +41 -0
  263. package/dist/lib/workspace/notifications.js.map +1 -0
  264. package/dist/lib/workspace/surface-registry.d.ts +49 -0
  265. package/dist/lib/workspace/surface-registry.d.ts.map +1 -0
  266. package/dist/lib/workspace/surface-registry.js +217 -0
  267. package/dist/lib/workspace/surface-registry.js.map +1 -0
  268. package/dist/lib/workspace/surface-type.d.ts +153 -0
  269. package/dist/lib/workspace/surface-type.d.ts.map +1 -0
  270. package/dist/lib/workspace/surface-type.js +9 -0
  271. package/dist/lib/workspace/surface-type.js.map +1 -0
  272. package/dist/lib/workspace/surfaces/agent-overview.d.ts +16 -0
  273. package/dist/lib/workspace/surfaces/agent-overview.d.ts.map +1 -0
  274. package/dist/lib/workspace/surfaces/agent-overview.js +116 -0
  275. package/dist/lib/workspace/surfaces/agent-overview.js.map +1 -0
  276. package/dist/lib/workspace/surfaces/agent.d.ts +16 -0
  277. package/dist/lib/workspace/surfaces/agent.d.ts.map +1 -0
  278. package/dist/lib/workspace/surfaces/agent.js +112 -0
  279. package/dist/lib/workspace/surfaces/agent.js.map +1 -0
  280. package/dist/lib/workspace/surfaces/claude.d.ts +15 -0
  281. package/dist/lib/workspace/surfaces/claude.d.ts.map +1 -0
  282. package/dist/lib/workspace/surfaces/claude.js +23 -0
  283. package/dist/lib/workspace/surfaces/claude.js.map +1 -0
  284. package/dist/lib/workspace/surfaces/dashboard.d.ts +21 -0
  285. package/dist/lib/workspace/surfaces/dashboard.d.ts.map +1 -0
  286. package/dist/lib/workspace/surfaces/dashboard.js +32 -0
  287. package/dist/lib/workspace/surfaces/dashboard.js.map +1 -0
  288. package/dist/lib/workspace/surfaces/eval.d.ts +15 -0
  289. package/dist/lib/workspace/surfaces/eval.d.ts.map +1 -0
  290. package/dist/lib/workspace/surfaces/eval.js +42 -0
  291. package/dist/lib/workspace/surfaces/eval.js.map +1 -0
  292. package/dist/lib/workspace/surfaces/event-stream.d.ts +16 -0
  293. package/dist/lib/workspace/surfaces/event-stream.d.ts.map +1 -0
  294. package/dist/lib/workspace/surfaces/event-stream.js +40 -0
  295. package/dist/lib/workspace/surfaces/event-stream.js.map +1 -0
  296. package/dist/lib/workspace/surfaces/flow.d.ts +16 -0
  297. package/dist/lib/workspace/surfaces/flow.d.ts.map +1 -0
  298. package/dist/lib/workspace/surfaces/flow.js +49 -0
  299. package/dist/lib/workspace/surfaces/flow.js.map +1 -0
  300. package/dist/lib/workspace/surfaces/index.d.ts +16 -0
  301. package/dist/lib/workspace/surfaces/index.d.ts.map +1 -0
  302. package/dist/lib/workspace/surfaces/index.js +16 -0
  303. package/dist/lib/workspace/surfaces/index.js.map +1 -0
  304. package/dist/lib/workspace/surfaces/portfolio.d.ts +16 -0
  305. package/dist/lib/workspace/surfaces/portfolio.d.ts.map +1 -0
  306. package/dist/lib/workspace/surfaces/portfolio.js +102 -0
  307. package/dist/lib/workspace/surfaces/portfolio.js.map +1 -0
  308. package/dist/lib/workspace/surfaces/service.d.ts +16 -0
  309. package/dist/lib/workspace/surfaces/service.d.ts.map +1 -0
  310. package/dist/lib/workspace/surfaces/service.js +45 -0
  311. package/dist/lib/workspace/surfaces/service.js.map +1 -0
  312. package/dist/lib/workspace/surfaces/shell.d.ts +15 -0
  313. package/dist/lib/workspace/surfaces/shell.d.ts.map +1 -0
  314. package/dist/lib/workspace/surfaces/shell.js +19 -0
  315. package/dist/lib/workspace/surfaces/shell.js.map +1 -0
  316. package/dist/lib/workspace/surfaces/telemetry.d.ts +16 -0
  317. package/dist/lib/workspace/surfaces/telemetry.d.ts.map +1 -0
  318. package/dist/lib/workspace/surfaces/telemetry.js +48 -0
  319. package/dist/lib/workspace/surfaces/telemetry.js.map +1 -0
  320. package/dist/lib/workspace/surfaces/topology.d.ts +15 -0
  321. package/dist/lib/workspace/surfaces/topology.d.ts.map +1 -0
  322. package/dist/lib/workspace/surfaces/topology.js +19 -0
  323. package/dist/lib/workspace/surfaces/topology.js.map +1 -0
  324. package/dist/lib/workspace/surfaces/training.d.ts +16 -0
  325. package/dist/lib/workspace/surfaces/training.d.ts.map +1 -0
  326. package/dist/lib/workspace/surfaces/training.js +22 -0
  327. package/dist/lib/workspace/surfaces/training.js.map +1 -0
  328. package/dist/lib/workspace/tmux-adapter.d.ts +27 -0
  329. package/dist/lib/workspace/tmux-adapter.d.ts.map +1 -0
  330. package/dist/lib/workspace/tmux-adapter.js +106 -0
  331. package/dist/lib/workspace/tmux-adapter.js.map +1 -0
  332. package/dist/mcp/context-hub-mcp.js +7 -24
  333. package/dist/mcp/context-hub-mcp.js.map +1 -1
  334. package/dist/types/flows.d.ts +2 -0
  335. package/dist/types/flows.d.ts.map +1 -1
  336. package/dist/types/ide.d.ts +49 -0
  337. package/dist/types/ide.d.ts.map +1 -0
  338. package/dist/types/ide.js +5 -0
  339. package/dist/types/ide.js.map +1 -0
  340. package/dist/types/platform-digest.d.ts +228 -0
  341. package/dist/types/platform-digest.d.ts.map +1 -0
  342. package/dist/types/platform-digest.js +5 -0
  343. package/dist/types/platform-digest.js.map +1 -0
  344. package/dist/types/telemetry-digest.d.ts +2 -0
  345. package/dist/types/telemetry-digest.d.ts.map +1 -1
  346. package/dist/utils/ensure-project.d.ts +1 -0
  347. package/dist/utils/ensure-project.d.ts.map +1 -1
  348. package/dist/utils/ensure-project.js +19 -7
  349. package/dist/utils/ensure-project.js.map +1 -1
  350. package/dist/utils/jfl-config.d.ts +1 -0
  351. package/dist/utils/jfl-config.d.ts.map +1 -1
  352. package/dist/utils/jfl-config.js +19 -1
  353. package/dist/utils/jfl-config.js.map +1 -1
  354. package/dist/utils/jfl-paths.d.ts +5 -0
  355. package/dist/utils/jfl-paths.d.ts.map +1 -1
  356. package/dist/utils/jfl-paths.js +25 -3
  357. package/dist/utils/jfl-paths.js.map +1 -1
  358. package/package.json +3 -2
  359. package/packages/pi/AGENTS.md +112 -0
  360. package/packages/pi/extensions/agent-grid.ts +191 -0
  361. package/packages/pi/extensions/agent-names.ts +178 -0
  362. package/packages/pi/extensions/autoresearch.ts +427 -0
  363. package/packages/pi/extensions/bookmarks.ts +85 -0
  364. package/packages/pi/extensions/context.ts +184 -0
  365. package/packages/pi/extensions/crm-tool.ts +61 -0
  366. package/packages/pi/extensions/eval-tool.ts +224 -0
  367. package/packages/pi/extensions/eval.ts +60 -0
  368. package/packages/pi/extensions/footer.ts +239 -0
  369. package/packages/pi/extensions/hub-resolver.ts +63 -0
  370. package/packages/pi/extensions/hud-tool.ts +145 -0
  371. package/packages/pi/extensions/index.ts +405 -0
  372. package/packages/pi/extensions/journal.ts +224 -0
  373. package/packages/pi/extensions/map-bridge.ts +178 -0
  374. package/packages/pi/extensions/memory-tool.ts +73 -0
  375. package/packages/pi/extensions/notifications.ts +73 -0
  376. package/packages/pi/extensions/peter-parker.ts +202 -0
  377. package/packages/pi/extensions/policy-head-tool.ts +276 -0
  378. package/packages/pi/extensions/portfolio-bridge.ts +90 -0
  379. package/packages/pi/extensions/session.ts +142 -0
  380. package/packages/pi/extensions/shortcuts.ts +259 -0
  381. package/packages/pi/extensions/stratus-bridge.ts +115 -0
  382. package/packages/pi/extensions/synopsis-tool.ts +83 -0
  383. package/packages/pi/extensions/tool-renderers.ts +353 -0
  384. package/packages/pi/extensions/training-buffer-tool.ts +368 -0
  385. package/packages/pi/extensions/types.ts +163 -0
  386. package/packages/pi/package-lock.json +346 -0
  387. package/packages/pi/package.json +44 -0
  388. package/packages/pi/skills/agent-browser/SKILL.md +116 -0
  389. package/packages/pi/skills/brand-architect/SKILL.md +240 -0
  390. package/packages/pi/skills/brand-architect/config.yaml +137 -0
  391. package/packages/pi/skills/campaign-hud/config.yaml +112 -0
  392. package/packages/pi/skills/content-creator/SKILL.md +294 -0
  393. package/packages/pi/skills/context/SKILL.md +65 -0
  394. package/packages/pi/skills/debug/MULTI_AGENT.md +360 -0
  395. package/packages/pi/skills/debug/SKILL.md +554 -0
  396. package/packages/pi/skills/end/SKILL.md +1782 -0
  397. package/packages/pi/skills/eval/SKILL.md +75 -0
  398. package/packages/pi/skills/fly-deploy/SKILL.md +676 -0
  399. package/packages/pi/skills/founder-video/SKILL.md +467 -0
  400. package/packages/pi/skills/hud/SKILL.md +160 -0
  401. package/packages/pi/skills/orchestrate/SKILL.md +74 -0
  402. package/packages/pi/skills/pi-agents/SKILL.md +78 -0
  403. package/packages/pi/skills/react-best-practices/AGENTS.md +2249 -0
  404. package/packages/pi/skills/react-best-practices/README.md +123 -0
  405. package/packages/pi/skills/react-best-practices/SKILL.md +125 -0
  406. package/packages/pi/skills/react-best-practices/metadata.json +15 -0
  407. package/packages/pi/skills/react-best-practices/rules/_sections.md +46 -0
  408. package/packages/pi/skills/react-best-practices/rules/_template.md +28 -0
  409. package/packages/pi/skills/react-best-practices/rules/advanced-event-handler-refs.md +55 -0
  410. package/packages/pi/skills/react-best-practices/rules/advanced-use-latest.md +49 -0
  411. package/packages/pi/skills/react-best-practices/rules/async-api-routes.md +38 -0
  412. package/packages/pi/skills/react-best-practices/rules/async-defer-await.md +80 -0
  413. package/packages/pi/skills/react-best-practices/rules/async-dependencies.md +36 -0
  414. package/packages/pi/skills/react-best-practices/rules/async-parallel.md +28 -0
  415. package/packages/pi/skills/react-best-practices/rules/async-suspense-boundaries.md +99 -0
  416. package/packages/pi/skills/react-best-practices/rules/bundle-barrel-imports.md +59 -0
  417. package/packages/pi/skills/react-best-practices/rules/bundle-conditional.md +31 -0
  418. package/packages/pi/skills/react-best-practices/rules/bundle-defer-third-party.md +49 -0
  419. package/packages/pi/skills/react-best-practices/rules/bundle-dynamic-imports.md +35 -0
  420. package/packages/pi/skills/react-best-practices/rules/bundle-preload.md +50 -0
  421. package/packages/pi/skills/react-best-practices/rules/client-event-listeners.md +74 -0
  422. package/packages/pi/skills/react-best-practices/rules/client-swr-dedup.md +56 -0
  423. package/packages/pi/skills/react-best-practices/rules/js-batch-dom-css.md +82 -0
  424. package/packages/pi/skills/react-best-practices/rules/js-cache-function-results.md +80 -0
  425. package/packages/pi/skills/react-best-practices/rules/js-cache-property-access.md +28 -0
  426. package/packages/pi/skills/react-best-practices/rules/js-cache-storage.md +70 -0
  427. package/packages/pi/skills/react-best-practices/rules/js-combine-iterations.md +32 -0
  428. package/packages/pi/skills/react-best-practices/rules/js-early-exit.md +50 -0
  429. package/packages/pi/skills/react-best-practices/rules/js-hoist-regexp.md +45 -0
  430. package/packages/pi/skills/react-best-practices/rules/js-index-maps.md +37 -0
  431. package/packages/pi/skills/react-best-practices/rules/js-length-check-first.md +49 -0
  432. package/packages/pi/skills/react-best-practices/rules/js-min-max-loop.md +82 -0
  433. package/packages/pi/skills/react-best-practices/rules/js-set-map-lookups.md +24 -0
  434. package/packages/pi/skills/react-best-practices/rules/js-tosorted-immutable.md +57 -0
  435. package/packages/pi/skills/react-best-practices/rules/rendering-activity.md +26 -0
  436. package/packages/pi/skills/react-best-practices/rules/rendering-animate-svg-wrapper.md +47 -0
  437. package/packages/pi/skills/react-best-practices/rules/rendering-conditional-render.md +40 -0
  438. package/packages/pi/skills/react-best-practices/rules/rendering-content-visibility.md +38 -0
  439. package/packages/pi/skills/react-best-practices/rules/rendering-hoist-jsx.md +46 -0
  440. package/packages/pi/skills/react-best-practices/rules/rendering-hydration-no-flicker.md +82 -0
  441. package/packages/pi/skills/react-best-practices/rules/rendering-svg-precision.md +28 -0
  442. package/packages/pi/skills/react-best-practices/rules/rerender-defer-reads.md +39 -0
  443. package/packages/pi/skills/react-best-practices/rules/rerender-dependencies.md +45 -0
  444. package/packages/pi/skills/react-best-practices/rules/rerender-derived-state.md +29 -0
  445. package/packages/pi/skills/react-best-practices/rules/rerender-functional-setstate.md +74 -0
  446. package/packages/pi/skills/react-best-practices/rules/rerender-lazy-state-init.md +58 -0
  447. package/packages/pi/skills/react-best-practices/rules/rerender-memo.md +44 -0
  448. package/packages/pi/skills/react-best-practices/rules/rerender-transitions.md +40 -0
  449. package/packages/pi/skills/react-best-practices/rules/server-after-nonblocking.md +73 -0
  450. package/packages/pi/skills/react-best-practices/rules/server-cache-lru.md +41 -0
  451. package/packages/pi/skills/react-best-practices/rules/server-cache-react.md +26 -0
  452. package/packages/pi/skills/react-best-practices/rules/server-parallel-fetching.md +79 -0
  453. package/packages/pi/skills/react-best-practices/rules/server-serialization.md +38 -0
  454. package/packages/pi/skills/remotion-best-practices/SKILL.md +43 -0
  455. package/packages/pi/skills/remotion-best-practices/rules/3d.md +86 -0
  456. package/packages/pi/skills/remotion-best-practices/rules/animations.md +29 -0
  457. package/packages/pi/skills/remotion-best-practices/rules/assets/charts-bar-chart.tsx +173 -0
  458. package/packages/pi/skills/remotion-best-practices/rules/assets/text-animations-typewriter.tsx +100 -0
  459. package/packages/pi/skills/remotion-best-practices/rules/assets/text-animations-word-highlight.tsx +108 -0
  460. package/packages/pi/skills/remotion-best-practices/rules/assets.md +78 -0
  461. package/packages/pi/skills/remotion-best-practices/rules/audio.md +172 -0
  462. package/packages/pi/skills/remotion-best-practices/rules/calculate-metadata.md +104 -0
  463. package/packages/pi/skills/remotion-best-practices/rules/can-decode.md +75 -0
  464. package/packages/pi/skills/remotion-best-practices/rules/charts.md +58 -0
  465. package/packages/pi/skills/remotion-best-practices/rules/compositions.md +146 -0
  466. package/packages/pi/skills/remotion-best-practices/rules/display-captions.md +126 -0
  467. package/packages/pi/skills/remotion-best-practices/rules/extract-frames.md +229 -0
  468. package/packages/pi/skills/remotion-best-practices/rules/fonts.md +152 -0
  469. package/packages/pi/skills/remotion-best-practices/rules/get-audio-duration.md +58 -0
  470. package/packages/pi/skills/remotion-best-practices/rules/get-video-dimensions.md +68 -0
  471. package/packages/pi/skills/remotion-best-practices/rules/get-video-duration.md +58 -0
  472. package/packages/pi/skills/remotion-best-practices/rules/gifs.md +138 -0
  473. package/packages/pi/skills/remotion-best-practices/rules/images.md +130 -0
  474. package/packages/pi/skills/remotion-best-practices/rules/import-srt-captions.md +67 -0
  475. package/packages/pi/skills/remotion-best-practices/rules/lottie.md +68 -0
  476. package/packages/pi/skills/remotion-best-practices/rules/measuring-dom-nodes.md +35 -0
  477. package/packages/pi/skills/remotion-best-practices/rules/measuring-text.md +143 -0
  478. package/packages/pi/skills/remotion-best-practices/rules/sequencing.md +106 -0
  479. package/packages/pi/skills/remotion-best-practices/rules/tailwind.md +11 -0
  480. package/packages/pi/skills/remotion-best-practices/rules/text-animations.md +20 -0
  481. package/packages/pi/skills/remotion-best-practices/rules/timing.md +179 -0
  482. package/packages/pi/skills/remotion-best-practices/rules/transcribe-captions.md +19 -0
  483. package/packages/pi/skills/remotion-best-practices/rules/transitions.md +122 -0
  484. package/packages/pi/skills/remotion-best-practices/rules/trimming.md +53 -0
  485. package/packages/pi/skills/remotion-best-practices/rules/videos.md +171 -0
  486. package/packages/pi/skills/search/SKILL.md +220 -0
  487. package/packages/pi/skills/spec/SKILL.md +377 -0
  488. package/packages/pi/skills/startup/SKILL.md +315 -0
  489. package/packages/pi/skills/web-architect/SKILL.md +309 -0
  490. package/packages/pi/skills/x-algorithm/SKILL.md +305 -0
  491. package/packages/pi/teams/dev-team.yaml +63 -0
  492. package/packages/pi/teams/gtm-team.yaml +79 -0
  493. package/packages/pi/themes/jfl.theme.json +76 -0
  494. package/packages/pi/tsconfig.json +21 -0
  495. package/scripts/collect-tuples.sh +124 -0
  496. package/scripts/destroy-fleet.sh +37 -0
  497. package/scripts/jfl-ide.sh +48 -0
  498. package/scripts/session/session-cleanup.sh +4 -11
  499. package/scripts/session/session-init.sh +6 -0
  500. package/scripts/session/session-sync.sh +25 -0
  501. package/scripts/setup-branch-protection.sh +106 -0
  502. package/scripts/spawn-fleet.sh +144 -0
  503. package/scripts/train/requirements.txt +5 -0
  504. package/scripts/train/train-policy-head.py +477 -0
  505. package/scripts/train/v2/dataset.py +81 -0
  506. package/scripts/train/v2/domain.json +18 -0
  507. package/scripts/train/v2/eval.py +196 -0
  508. package/scripts/train/v2/generate_data.py +219 -0
  509. package/scripts/train/v2/infer.py +188 -0
  510. package/scripts/train/v2/model.py +112 -0
  511. package/scripts/train/v2/precompute.py +132 -0
  512. package/scripts/train/v2/train.py +302 -0
  513. package/scripts/train/v2/transform_buffer.py +227 -0
  514. package/scripts/train/v2/validate_data.py +115 -0
  515. package/scripts/train-policy-head.py +434 -0
  516. package/scripts/vm-swarm/README.md +301 -0
  517. package/scripts/vm-swarm/collect-tuples.sh +331 -0
  518. package/scripts/vm-swarm/create-base-template.sh +339 -0
  519. package/scripts/vm-swarm/kill-fleet.sh +204 -0
  520. package/scripts/vm-swarm/monitor-fleet.sh +346 -0
  521. package/scripts/vm-swarm/spawn-fleet.sh +304 -0
  522. package/template/.claude/settings.json +2 -15
  523. package/template/.github/workflows/jfl-eval.yml +6 -1
  524. package/template/.github/workflows/jfl-review.yml +4 -0
  525. package/template/scripts/session/session-cleanup.sh +2 -11
  526. package/template/scripts/session/session-end-hub.sh +72 -0
  527. package/template/scripts/session/session-end.sh +69 -6
  528. package/template/scripts/session/session-init.sh +55 -30
  529. package/template/scripts/session/session-lock.sh +464 -0
  530. package/template/scripts/session/session-start-hub.sh +105 -0
  531. package/template/templates/service-agent/workflows/jfl-eval.yml +19 -0
  532. package/dist/dashboard-static/assets/index-B6kRK9Rq.js +0 -116
  533. package/dist/dashboard-static/assets/index-BpdKJPLu.css +0 -1
@@ -0,0 +1,112 @@
1
+ """
2
+ v2 Policy Head — Transformer-based action selector.
3
+
4
+ Architecture from Drew's Stratus tutorial:
5
+ (current_state_emb, goal_emb) -> state_proj + goal_proj -> fusion -> TransformerEncoder -> classifier -> action logits
6
+
7
+ ~8.7M params, ~17MB checkpoint. Replaces v1 MLP reward predictor.
8
+ """
9
+
10
+ import torch
11
+ import torch.nn as nn
12
+ import torch.nn.functional as F
13
+
14
+
15
class PolicyHead(nn.Module):
    """Transformer-based action selector over a fixed set of tools.

    Pipeline: the state and goal embeddings are projected separately to
    ``hidden_dim``, concatenated and fused back down to ``hidden_dim``, passed
    through a ``TransformerEncoder`` as a length-1 sequence, layer-normalised
    and classified into ``num_tools`` logits.

    Args:
        embedding_dim: Size of the last dimension of both input embeddings.
        hidden_dim: Width of the projections, encoder and classifier.
        num_tools: Number of output classes (one logit per tool).
        num_layers: Number of stacked encoder layers.
        num_heads: Attention heads per encoder layer.
        dropout: Dropout probability used in fusion, encoder and classifier.
    """

    def __init__(
        self,
        embedding_dim: int = 768,
        hidden_dim: int = 512,
        num_tools: int = 12,
        num_layers: int = 4,
        num_heads: int = 8,
        dropout: float = 0.1,
    ):
        super().__init__()

        self.embedding_dim = embedding_dim
        self.hidden_dim = hidden_dim
        self.num_tools = num_tools

        # Independent projections so state and goal get their own weights.
        self.state_proj = nn.Linear(embedding_dim, hidden_dim)
        self.goal_proj = nn.Linear(embedding_dim, hidden_dim)

        # Concatenated [state, goal] (2 * hidden_dim) -> hidden_dim.
        self.fusion = nn.Sequential(
            nn.Linear(hidden_dim * 2, hidden_dim),
            nn.GELU(),
            nn.Dropout(dropout),
        )

        encoder_layer = nn.TransformerEncoderLayer(
            d_model=hidden_dim,
            nhead=num_heads,
            dim_feedforward=hidden_dim * 4,
            dropout=dropout,
            activation="gelu",
            batch_first=True,
        )
        self.transformer = nn.TransformerEncoder(
            encoder_layer,
            num_layers=num_layers,
        )

        self.norm = nn.LayerNorm(hidden_dim)
        self.classifier = nn.Sequential(
            nn.Linear(hidden_dim, hidden_dim),
            nn.GELU(),
            nn.Dropout(dropout),
            nn.Linear(hidden_dim, num_tools),
        )

        self._init_weights()

    def _init_weights(self):
        """Xavier-initialise every Linear and reset every LayerNorm to identity."""
        for module in self.modules():
            if isinstance(module, nn.Linear):
                nn.init.xavier_uniform_(module.weight)
                if module.bias is not None:
                    nn.init.zeros_(module.bias)
            elif isinstance(module, nn.LayerNorm):
                nn.init.ones_(module.weight)
                nn.init.zeros_(module.bias)

    def forward(
        self,
        current_state_emb: torch.Tensor,
        goal_state_emb: torch.Tensor,
    ) -> torch.Tensor:
        """Return unnormalised action logits.

        Both inputs must have ``embedding_dim`` as their last dimension; the
        ``unsqueeze(1)`` / ``squeeze(1)`` pair below treats dimension 0 as the
        batch, i.e. inputs are expected as ``(batch, embedding_dim)``.

        Returns:
            Tensor whose last dimension is ``num_tools``.
        """
        state_h = self.state_proj(current_state_emb)
        goal_h = self.goal_proj(goal_state_emb)

        fused = self.fusion(torch.cat([state_h, goal_h], dim=-1))

        # The encoder is batch_first, so insert a sequence axis of length 1.
        x = fused.unsqueeze(1)
        x = self.transformer(x)
        x = x.squeeze(1)

        x = self.norm(x)
        logits = self.classifier(x)

        return logits

    def predict(
        self,
        current_state_emb: torch.Tensor,
        goal_state_emb: torch.Tensor,
        top_k: int = 3,
    ) -> dict:
        """Run inference and return the ``top_k`` most probable tools.

        The forward pass runs in eval mode with gradients disabled. The
        module's previous train/eval mode is restored afterwards, so calling
        this in the middle of a training loop does not leave dropout
        switched off for the remaining steps.

        Args:
            current_state_emb: Same contract as in :meth:`forward`.
            goal_state_emb: Same contract as in :meth:`forward`.
            top_k: Number of candidates to return; capped at ``num_tools``.

        Returns:
            Dict with ``"top_k_indices"``, ``"top_k_probs"`` (both from
            ``torch.topk`` over the last dimension) and ``"all_probs"`` (the
            softmax over all tools).
        """
        was_training = self.training
        self.eval()
        try:
            with torch.no_grad():
                logits = self.forward(current_state_emb, goal_state_emb)
                probs = F.softmax(logits, dim=-1)
                top_probs, top_indices = torch.topk(probs, k=min(top_k, self.num_tools), dim=-1)
        finally:
            # Undo the temporary eval() even if the forward pass raised.
            self.train(was_training)

        return {
            "top_k_indices": top_indices,
            "top_k_probs": top_probs,
            "all_probs": probs,
        }

    @property
    def num_parameters(self) -> int:
        """Total number of elements across parameters that require gradients."""
        return sum(p.numel() for p in self.parameters() if p.requires_grad)
@@ -0,0 +1,132 @@
1
+ """
2
+ Pre-compute Stratus embeddings for all unique texts in v2 training data.
3
+ Caches embeddings as .npz files to avoid re-computation during training.
4
+ """
5
+
6
+ import json
7
+ import os
8
+ import sys
9
+ import argparse
10
+ import numpy as np
11
+
12
def get_stratus_embedder(api_url: str, api_key: str):
    """Build a callable that embeds batches of text through the Stratus API.

    Args:
        api_url: Base URL of the service; ``/v1/embeddings`` is appended.
        api_key: Token sent as a ``Bearer`` authorization header.

    Returns:
        A function taking a list of strings and returning one embedding per
        entry of the response's ``"data"`` list, in response order. It raises
        whatever ``requests`` raises on transport errors or non-2xx statuses.
    """
    # Imported lazily so the module can be loaded without `requests` installed.
    import requests

    endpoint = f"{api_url}/v1/embeddings"
    request_headers = {
        "Authorization": f"Bearer {api_key}",
        "Content-Type": "application/json",
    }

    def embed_batch(texts: list[str]) -> list[list[float]]:
        payload = {
            "model": "stratus-x1ac-base",
            "input": texts,
        }
        reply = requests.post(
            endpoint,
            headers=request_headers,
            json=payload,
            timeout=30,
        )
        reply.raise_for_status()

        vectors = []
        for item in reply.json()["data"]:
            vectors.append(item["embedding"])
        return vectors

    return embed_batch
33
+
34
def collect_unique_texts(data_path: str) -> tuple[list[str], list[str]]:
    """Collect the distinct state and goal texts from one JSONL file.

    Each non-blank line must be a JSON object with ``"current_state"`` and
    ``"goal"`` keys. Blank or whitespace-only lines are skipped.

    Args:
        data_path: Path to the JSONL file.

    Returns:
        ``(states, goals)``: two sorted lists of unique values.

    Raises:
        json.JSONDecodeError: If a non-blank line is not valid JSON.
        KeyError: If an example lacks one of the two required keys.
    """
    states = set()
    goals = set()

    # Read as UTF-8 explicitly: the platform default encoding (e.g. cp1252 on
    # Windows) would corrupt or reject non-ASCII text in the examples.
    with open(data_path, encoding="utf-8") as f:
        for raw_line in f:
            line = raw_line.strip()
            if not line:
                continue
            example = json.loads(line)
            states.add(example["current_state"])
            goals.add(example["goal"])

    return sorted(states), sorted(goals)
48
+
49
def precompute_embeddings(
    data_dir: str,
    api_url: str,
    api_key: str,
    batch_size: int = 32,
):
    """Embed every unique text in the dataset splits and cache the result.

    Reads ``train.jsonl``, ``val.jsonl`` and ``test.jsonl`` from ``data_dir``
    (missing splits are skipped), embeds the union of their state and goal
    texts in batches, then writes two files into ``data_dir``:

    * ``embeddings_cache.npz`` with arrays ``embeddings`` (float32) and
      ``texts`` (object array of the embedded strings, in row order);
    * ``text_to_idx.json`` mapping each embedded text to its row index.

    Embedding is best-effort: a batch that fails is reported and skipped so
    one bad request does not discard the rest of the run. Texts from skipped
    batches are absent from the cache, and a summary warning is printed when
    that happens.

    Args:
        data_dir: Directory holding the JSONL splits; also the output location.
        api_url: Base URL of the embedding service.
        api_key: API token for the embedding service.
        batch_size: Number of texts sent per request; must be at least 1.

    Returns:
        ``(text_to_idx, embeddings_matrix)``.

    Raises:
        ValueError: If ``batch_size`` is smaller than 1.
    """
    # A negative step would make range() empty and silently write an empty cache.
    if batch_size < 1:
        raise ValueError(f"batch_size must be >= 1, got {batch_size}")

    embedder = get_stratus_embedder(api_url, api_key)

    all_states = set()
    all_goals = set()

    for split in ["train", "val", "test"]:
        path = os.path.join(data_dir, f"{split}.jsonl")
        if not os.path.exists(path):
            print(f" Skipping {split} (file not found)")
            continue
        states, goals = collect_unique_texts(path)
        all_states.update(states)
        all_goals.update(goals)

    # A text used both as a state and as a goal is embedded only once.
    all_texts = sorted(all_states | all_goals)
    print(f"Unique texts to embed: {len(all_texts)} ({len(all_states)} states, {len(all_goals)} goals)")

    text_to_embedding = {}
    for i in range(0, len(all_texts), batch_size):
        batch = all_texts[i : i + batch_size]
        try:
            embeddings = embedder(batch)
            # zip() would silently drop the tail on a short response and could
            # pair texts with the wrong vectors; treat a mismatch as a failure.
            if len(embeddings) != len(batch):
                raise ValueError(f"expected {len(batch)} embeddings, got {len(embeddings)}")
        except Exception as e:
            # Deliberately broad: any failure skips just this batch.
            print(f" Error embedding batch {i}-{i + len(batch)}: {e}")
            continue

        text_to_embedding.update(zip(batch, embeddings))

        done = min(i + batch_size, len(all_texts))
        print(f" Embedded {done}/{len(all_texts)} texts")

    missing = len(all_texts) - len(text_to_embedding)
    if missing:
        print(f" WARNING: {missing}/{len(all_texts)} texts were not embedded; the cache is incomplete")

    texts_list = sorted(text_to_embedding.keys())
    text_to_idx = {t: i for i, t in enumerate(texts_list)}
    embeddings_matrix = np.array([text_to_embedding[t] for t in texts_list], dtype=np.float32)

    cache_path = os.path.join(data_dir, "embeddings_cache.npz")
    np.savez(
        cache_path,
        embeddings=embeddings_matrix,
        texts=np.array(texts_list, dtype=object),
    )
    print(f"Saved embedding cache: {cache_path} ({embeddings_matrix.shape})")

    index_path = os.path.join(data_dir, "text_to_idx.json")
    with open(index_path, "w") as f:
        json.dump(text_to_idx, f)
    print(f"Saved text index: {index_path} ({len(text_to_idx)} entries)")

    return text_to_idx, embeddings_matrix
104
+
105
+
106
def main():
    """Command-line entry point for the embedding pre-computation step.

    Parses ``--data-dir`` and ``--batch-size``, reads the service location and
    credentials from ``STRATUS_API_URL`` / ``STRATUS_API_KEY``, and exits with
    status 1 when the key is unset or the data directory does not exist.
    """
    cli = argparse.ArgumentParser(description="Pre-compute Stratus embeddings for v2 training data")
    cli.add_argument("--data-dir", default=".jfl/v2-data", help="Directory with train/val/test JSONL files")
    cli.add_argument("--batch-size", type=int, default=32, help="Embedding batch size")
    opts = cli.parse_args()

    stratus_url = os.environ.get("STRATUS_API_URL", "https://api.stratus.run")
    stratus_key = os.environ.get("STRATUS_API_KEY", "")

    # The missing key is reported first, then the missing directory.
    problem = None
    if not stratus_key:
        problem = "STRATUS_API_KEY not set"
    elif not os.path.exists(opts.data_dir):
        problem = f"Data directory not found: {opts.data_dir}"

    if problem is not None:
        print(problem)
        sys.exit(1)

    precompute_embeddings(
        data_dir=opts.data_dir,
        api_url=stratus_url,
        api_key=stratus_key,
        batch_size=opts.batch_size,
    )


if __name__ == "__main__":
    main()
@@ -0,0 +1,302 @@
1
+ """
2
+ v2 Policy Head Training Loop.
3
+
4
+ CrossEntropyLoss with label smoothing, cosine annealing with warmup,
5
+ early stopping. Produces .pt checkpoint with model weights, config, and tool index.
6
+ """
7
+
8
+ import json
9
+ import os
10
+ import sys
11
+ import time
12
+ import math
13
+ import argparse
14
+
15
+ import numpy as np
16
+ import torch
17
+ import torch.nn as nn
18
+ import torch.optim as optim
19
+ from torch.utils.data import DataLoader
20
+
21
+ from model import PolicyHead
22
+ from dataset import PolicyHeadDataset, load_embedding_cache
23
+
24
+
25
def load_tool_index(domain_path: str) -> dict[str, int]:
    """Map each tool name in a domain file to its position in the tool list.

    The file must be a JSON object with a ``"tools"`` list whose items each
    carry a ``"name"`` key. The index is the item's position in that list.

    Args:
        domain_path: Path to the domain JSON file.

    Returns:
        ``{tool_name: index}``. If a name appears more than once, the last
        occurrence's index is kept.
    """
    # Read as UTF-8 explicitly instead of relying on the platform default.
    with open(domain_path, encoding="utf-8") as f:
        domain = json.load(f)
    return {tool["name"]: i for i, tool in enumerate(domain["tools"])}
29
+
30
+
31
def get_lr_scheduler(optimizer, warmup_steps: int, total_steps: int):
    """Create a ``LambdaLR`` with linear warmup followed by cosine decay.

    The multiplier rises linearly from 0 to 1 over ``warmup_steps`` steps and
    then follows half a cosine period down to 0 at ``total_steps``.

    Args:
        optimizer: Optimizer whose base learning rates are scaled.
        warmup_steps: Number of scheduler steps spent warming up.
        total_steps: Scheduler step at which the cosine reaches zero.

    Returns:
        The configured ``torch.optim.lr_scheduler.LambdaLR``.
    """
    # Denominators are clamped to 1 so degenerate settings never divide by zero.
    warmup_span = float(max(1, warmup_steps))
    decay_span = float(max(1, total_steps - warmup_steps))

    def lr_lambda(step):
        if step >= warmup_steps:
            progress = float(step - warmup_steps) / decay_span
            cosine = 0.5 * (1.0 + math.cos(progress * math.pi))
            return max(0.0, cosine)
        return float(step) / warmup_span

    return optim.lr_scheduler.LambdaLR(optimizer, lr_lambda)
39
+
40
+
41
def train_epoch(model, dataloader, criterion, optimizer, scheduler, device):
    """Run one optimisation pass over ``dataloader``.

    Every batch is a mapping with ``"state_emb"``, ``"goal_emb"`` and
    ``"label"`` tensors. Gradients are clipped to a global norm of 1.0, and
    the scheduler is advanced once per batch, not once per epoch.

    Returns:
        ``(mean_loss, accuracy)`` over all examples seen, where the mean is
        weighted by batch size. Both are 0 for an empty dataloader.
    """
    model.train()

    running_loss = 0.0
    n_correct = 0
    n_seen = 0

    for batch in dataloader:
        states = batch["state_emb"].to(device)
        goals = batch["goal_emb"].to(device)
        targets = batch["label"].to(device)
        batch_len = targets.size(0)

        optimizer.zero_grad()
        logits = model(states, goals)
        loss = criterion(logits, targets)
        loss.backward()

        torch.nn.utils.clip_grad_norm_(model.parameters(), max_norm=1.0)
        optimizer.step()
        scheduler.step()

        # Weight the batch mean by its size so a short final batch is not over-counted.
        running_loss += loss.item() * batch_len
        n_correct += (logits.argmax(dim=-1) == targets).sum().item()
        n_seen += batch_len

    denom = max(n_seen, 1)
    return running_loss / denom, n_correct / denom
68
+
69
+
70
def evaluate(model, dataloader, criterion, device):
    """Score ``model`` on ``dataloader`` without updating any weights.

    Puts the model in eval mode and runs with gradients disabled. Every batch
    is a mapping with ``"state_emb"``, ``"goal_emb"`` and ``"label"`` tensors.

    Returns:
        ``(mean_loss, accuracy)`` over all examples seen, where the mean is
        weighted by batch size. Both are 0 for an empty dataloader.
    """
    with torch.no_grad():
        model.eval()

        running_loss = 0.0
        n_correct = 0
        n_seen = 0

        for batch in dataloader:
            states = batch["state_emb"].to(device)
            goals = batch["goal_emb"].to(device)
            targets = batch["label"].to(device)
            batch_len = targets.size(0)

            logits = model(states, goals)
            batch_loss = criterion(logits, targets).item()

            running_loss += batch_loss * batch_len
            n_correct += (logits.argmax(dim=-1) == targets).sum().item()
            n_seen += batch_len

        denom = max(n_seen, 1)
        return running_loss / denom, n_correct / denom
91
+
92
+
93
def train(args):
    """Run the full v2 policy-head training job described by ``args``.

    Steps: pick a device (CUDA, then MPS, then CPU), load the tool index and
    the embedding cache, build the datasets and loaders, optionally warm-start
    from an existing checkpoint, then train with AdamW, label-smoothed
    cross-entropy and a per-step warmup + cosine schedule. The best model is
    written to ``<output_dir>/best_policy_head.pt`` and a JSON description of
    the run to ``<output_dir>/policy-head-v2.json``.

    Model selection uses validation accuracy when a non-empty validation set
    exists. Otherwise it falls back to the lowest training loss, and the
    ``val_*`` fields then hold training metrics. Training stops early after
    ``args.patience`` consecutive epochs without a new best.

    Args:
        args: Namespace providing ``domain``, ``data_dir``, ``output_dir``,
            ``warm_start``, ``epochs``, ``batch_size``, ``lr``,
            ``weight_decay``, ``warmup_steps``, ``patience``,
            ``label_smoothing``, ``hidden_dim``, ``num_layers``,
            ``num_heads`` and ``dropout``.

    Exits the process with status 1 if ``train.jsonl`` is missing.
    """
    # Device
    if torch.cuda.is_available():
        device = "cuda"
    elif hasattr(torch.backends, "mps") and torch.backends.mps.is_available():
        device = "mps"
    else:
        device = "cpu"
    print(f"Device: {device}")

    # Domain
    domain_path = args.domain
    tool_to_index = load_tool_index(domain_path)
    index_to_tool = {v: k for k, v in tool_to_index.items()}
    num_tools = len(tool_to_index)
    print(f"Tools: {num_tools}")

    # Embeddings cache
    embeddings_matrix, text_to_idx = load_embedding_cache(args.data_dir)
    if embeddings_matrix is not None:
        print(f"Embedding cache: {embeddings_matrix.shape[0]} texts, {embeddings_matrix.shape[1]}-dim")
    else:
        print("WARNING: No embedding cache found. Training with zero vectors.")
        print(" Run: python precompute.py --data-dir", args.data_dir)

    # Datasets
    train_path = os.path.join(args.data_dir, "train.jsonl")
    val_path = os.path.join(args.data_dir, "val.jsonl")

    if not os.path.exists(train_path):
        print(f"Training data not found: {train_path}")
        sys.exit(1)

    train_ds = PolicyHeadDataset(train_path, tool_to_index, embeddings_matrix, text_to_idx)
    val_ds = PolicyHeadDataset(val_path, tool_to_index, embeddings_matrix, text_to_idx) if os.path.exists(val_path) else None

    # No worker processes on MPS; elsewhere use at most 4.
    num_workers = 0 if device == "mps" else min(4, os.cpu_count() or 1)
    train_loader = DataLoader(train_ds, batch_size=args.batch_size, shuffle=True, num_workers=num_workers)
    # Truthiness (not `is not None`) is intentional here and below: it is what
    # the original code tests, so a missing validation set is treated as absent.
    val_loader = DataLoader(val_ds, batch_size=args.batch_size, shuffle=False, num_workers=num_workers) if val_ds else None

    print(f"Train: {len(train_ds)} examples")
    if val_ds:
        print(f"Val: {len(val_ds)} examples")

    # Model
    embedding_dim = embeddings_matrix.shape[1] if embeddings_matrix is not None else 768
    model = PolicyHead(
        embedding_dim=embedding_dim,
        hidden_dim=args.hidden_dim,
        num_tools=num_tools,
        num_layers=args.num_layers,
        num_heads=args.num_heads,
        dropout=args.dropout,
    ).to(device)

    print(f"Parameters: {model.num_parameters:,}")

    # Warm start
    if args.warm_start and os.path.exists(args.warm_start):
        print(f"Warm-starting from: {args.warm_start}")
        state_dict = torch.load(args.warm_start, map_location=device, weights_only=True)
        if "model_state_dict" in state_dict:
            state_dict = state_dict["model_state_dict"]
        # Snapshot once: Module.state_dict() builds a fresh mapping per call.
        own_state = model.state_dict()
        # Keep only tensors whose name and shape match, so a checkpoint trained
        # with a different tool count or width can still seed the shared layers.
        compatible = {
            k: v
            for k, v in state_dict.items()
            if k in own_state and v.shape == own_state[k].shape
        }
        model.load_state_dict(compatible, strict=False)
        print(f" Loaded {len(compatible)}/{len(state_dict)} layers")

    # Loss, optimizer, scheduler
    criterion = nn.CrossEntropyLoss(label_smoothing=args.label_smoothing)
    optimizer = optim.AdamW(
        model.parameters(),
        lr=args.lr,
        weight_decay=args.weight_decay,
    )
    # The scheduler steps once per batch, so its horizon is batches * epochs.
    total_steps = len(train_loader) * args.epochs
    scheduler = get_lr_scheduler(optimizer, args.warmup_steps, total_steps)

    # Training loop
    os.makedirs(args.output_dir, exist_ok=True)
    best_val_acc = 0.0
    best_val_loss = float("inf")
    patience_counter = 0

    print(f"\nStarting training for {args.epochs} epochs...")
    print(f"{'Epoch':>5} {'Train Loss':>12} {'Train Acc':>10} {'Val Loss':>10} {'Val Acc':>9} {'LR':>10} {'Time':>8}")
    print("-" * 75)

    for epoch in range(1, args.epochs + 1):
        t0 = time.time()

        train_loss, train_acc = train_epoch(model, train_loader, criterion, optimizer, scheduler, device)

        val_loss, val_acc = (0.0, 0.0)
        if val_loader:
            val_loss, val_acc = evaluate(model, val_loader, criterion, device)

        elapsed = time.time() - t0
        lr = scheduler.get_last_lr()[0]

        print(
            f"{epoch:5d} {train_loss:12.4f} {train_acc:9.1%} {val_loss:10.4f} {val_acc:8.1%} {lr:10.2e} {elapsed:7.1f}s"
        )

        # Save best model
        is_best = False
        if val_loader:
            if val_acc > best_val_acc:
                best_val_acc = val_acc
                best_val_loss = val_loss
                is_best = True
        elif train_loss < best_val_loss:
            # No validation data: select on training loss and reuse the val_* slots.
            best_val_loss = train_loss
            best_val_acc = train_acc
            is_best = True

        if is_best:
            patience_counter = 0
            checkpoint = {
                "epoch": epoch,
                "model_state_dict": model.state_dict(),
                "val_accuracy": best_val_acc,
                "val_loss": best_val_loss,
                "num_tools": num_tools,
                "tool_to_index": tool_to_index,
                "index_to_tool": index_to_tool,
                "config": {
                    "embedding_dim": embedding_dim,
                    "hidden_dim": args.hidden_dim,
                    "num_layers": args.num_layers,
                    "num_heads": args.num_heads,
                    "dropout": args.dropout,
                },
            }
            ckpt_path = os.path.join(args.output_dir, "best_policy_head.pt")
            torch.save(checkpoint, ckpt_path)
            print(f" ✅ New best model (val_acc={best_val_acc:.1%})")
        else:
            patience_counter += 1

        # Early stopping
        if patience_counter >= args.patience:
            print(f"\n Early stopping at epoch {epoch} (no improvement for {args.patience} epochs)")
            break

    print(f"\nTraining complete. Best val accuracy: {best_val_acc:.1%}")

    ckpt_path = os.path.join(args.output_dir, "best_policy_head.pt")
    if os.path.exists(ckpt_path):
        size_mb = os.path.getsize(ckpt_path) / 1024 / 1024
        print(f"Checkpoint: {ckpt_path} ({size_mb:.1f} MB)")

    # Write metadata for TypeScript bridge
    meta = {
        "version": 2,
        # Derived from the actual hyper-parameters so it cannot contradict the
        # num_layers / hidden_dim fields; defaults give "transformer-4layer-512h".
        "architecture": f"transformer-{args.num_layers}layer-{args.hidden_dim}h",
        "embedding_dim": embedding_dim,
        "hidden_dim": args.hidden_dim,
        "num_tools": num_tools,
        "num_layers": args.num_layers,
        "num_heads": args.num_heads,
        "trained_at": time.strftime("%Y-%m-%dT%H:%M:%SZ", time.gmtime()),
        "trained_on": len(train_ds),
        "val_accuracy": best_val_acc,
        "val_loss": best_val_loss,
        "device": device,
        "parameters": model.num_parameters,
        "tool_to_index": tool_to_index,
        # JSON object keys must be strings, so stringify the integer indices.
        "index_to_tool": {str(k): v for k, v in index_to_tool.items()},
        "checkpoint_path": os.path.abspath(ckpt_path),
    }
    meta_path = os.path.join(args.output_dir, "policy-head-v2.json")
    with open(meta_path, "w") as f:
        json.dump(meta, f, indent=2)
    print(f"Metadata: {meta_path}")
270
+
271
+
272
def main():
    """Command-line entry point for v2 policy-head training.

    Builds the argument parser, defaults ``--domain`` to the ``domain.json``
    that sits next to this script, exits with status 1 when that file is
    missing, and otherwise hands the parsed namespace to ``train``.
    """
    parser = argparse.ArgumentParser(description="Train v2 policy head (transformer action selector)")

    # (flag, add_argument keyword arguments), registered in this order.
    option_specs = [
        ("--data-dir", {"default": ".jfl/v2-data", "help": "Directory with train/val/test JSONL + embeddings"}),
        ("--domain", {"default": None, "help": "Path to domain.json"}),
        ("--output-dir", {"default": ".jfl/checkpoints", "help": "Output directory for checkpoints"}),
        ("--warm-start", {"default": None, "help": "Path to pretrained checkpoint for warm start"}),
        ("--epochs", {"type": int, "default": 50, "help": "Max training epochs"}),
        ("--batch-size", {"type": int, "default": 64, "help": "Batch size"}),
        ("--lr", {"type": float, "default": 3e-4, "help": "Learning rate"}),
        ("--weight-decay", {"type": float, "default": 0.01, "help": "Weight decay"}),
        ("--warmup-steps", {"type": int, "default": 100, "help": "Warmup steps for LR scheduler"}),
        ("--patience", {"type": int, "default": 7, "help": "Early stopping patience"}),
        ("--label-smoothing", {"type": float, "default": 0.1, "help": "Label smoothing for CrossEntropyLoss"}),
        ("--hidden-dim", {"type": int, "default": 512, "help": "Hidden dimension"}),
        ("--num-layers", {"type": int, "default": 4, "help": "Transformer encoder layers"}),
        ("--num-heads", {"type": int, "default": 8, "help": "Attention heads"}),
        ("--dropout", {"type": float, "default": 0.1, "help": "Dropout rate"}),
    ]
    for flag, spec in option_specs:
        parser.add_argument(flag, **spec)

    args = parser.parse_args()

    if args.domain is None:
        script_dir = os.path.dirname(os.path.abspath(__file__))
        args.domain = os.path.join(script_dir, "domain.json")

    if not os.path.exists(args.domain):
        print(f"Domain file not found: {args.domain}")
        sys.exit(1)

    train(args)


if __name__ == "__main__":
    main()