@kontourai/flow-agents 0.1.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (418) hide show
  1. package/.githooks/pre-push +11 -0
  2. package/.github/workflows/ci.yml +210 -0
  3. package/.github/workflows/docs-pages.yml +52 -0
  4. package/.github/workflows/publish-npm.yml +104 -0
  5. package/AGENTS.md +26 -0
  6. package/CHANGELOG.md +66 -0
  7. package/CODE_OF_CONDUCT.md +25 -0
  8. package/CONTEXT.md +300 -0
  9. package/CONTRIBUTING.md +44 -0
  10. package/LICENSE +201 -0
  11. package/README.md +129 -0
  12. package/SECURITY.md +33 -0
  13. package/agent-cards/dev.json +19 -0
  14. package/agents/dev.json +127 -0
  15. package/agents/tool-code-reviewer.json +61 -0
  16. package/agents/tool-dependencies-updater.json +118 -0
  17. package/agents/tool-explore-config.json +92 -0
  18. package/agents/tool-explore-deps.json +92 -0
  19. package/agents/tool-explore-entry.json +92 -0
  20. package/agents/tool-explore-patterns.json +92 -0
  21. package/agents/tool-explore-structure.json +92 -0
  22. package/agents/tool-explore-tests.json +92 -0
  23. package/agents/tool-planner.json +57 -0
  24. package/agents/tool-playwright.json +145 -0
  25. package/agents/tool-security-reviewer.json +56 -0
  26. package/agents/tool-verifier.json +61 -0
  27. package/agents/tool-worker.json +58 -0
  28. package/build/src/cli/console-learning-projection.js +123 -0
  29. package/build/src/cli/docs-preview.js +39 -0
  30. package/build/src/cli/effective-backlog-settings.js +102 -0
  31. package/build/src/cli/export-bookmarks.js +38 -0
  32. package/build/src/cli/fixture-retirement-audit.js +140 -0
  33. package/build/src/cli/flow-kit.js +138 -0
  34. package/build/src/cli/import-bookmarks.js +50 -0
  35. package/build/src/cli/init.js +239 -0
  36. package/build/src/cli/instinct-cli.js +93 -0
  37. package/build/src/cli/promote-workflow-artifact.js +63 -0
  38. package/build/src/cli/publish-change-helper.js +154 -0
  39. package/build/src/cli/pull-work-provider.js +469 -0
  40. package/build/src/cli/runtime-adapter.js +23 -0
  41. package/build/src/cli/telemetry-doctor.js +221 -0
  42. package/build/src/cli/usage-feedback.js +443 -0
  43. package/build/src/cli/validate-hook-influence.js +152 -0
  44. package/build/src/cli/validate-source-tree.js +31 -0
  45. package/build/src/cli/validate-workflow-artifacts.js +486 -0
  46. package/build/src/cli/veritas-governance.js +262 -0
  47. package/build/src/cli/workflow-artifact-cleanup-audit.js +272 -0
  48. package/build/src/cli/workflow-sidecar.js +816 -0
  49. package/build/src/cli.js +89 -0
  50. package/build/src/flow-kit/validate.js +75 -0
  51. package/build/src/lib/args.js +45 -0
  52. package/build/src/lib/fs.js +62 -0
  53. package/build/src/lib/workflow-learning-projection.js +334 -0
  54. package/build/src/runtime-adapters.js +146 -0
  55. package/build/src/tools/build-universal-bundles.js +397 -0
  56. package/build/src/tools/common.js +56 -0
  57. package/build/src/tools/filter-installed-packs.js +132 -0
  58. package/build/src/tools/generate-context-map.js +198 -0
  59. package/build/src/tools/validate-package.js +64 -0
  60. package/build/src/tools/validate-source-tree.js +622 -0
  61. package/console.telemetry.json +176 -0
  62. package/context/base-rules.md +17 -0
  63. package/context/code-review-standards.md +62 -0
  64. package/context/coding-standards.md +42 -0
  65. package/context/common/orchestrators.md +12 -0
  66. package/context/common/subagents.md +28 -0
  67. package/context/contracts/artifact-contract.md +182 -0
  68. package/context/contracts/builder-kit-workflow-state-contract.md +319 -0
  69. package/context/contracts/delivery-contract.md +69 -0
  70. package/context/contracts/execution-contract.md +53 -0
  71. package/context/contracts/governance-adapter-contract.md +67 -0
  72. package/context/contracts/planning-contract.md +85 -0
  73. package/context/contracts/review-contract.md +104 -0
  74. package/context/contracts/sandbox-policy.md +52 -0
  75. package/context/contracts/verification-contract.md +134 -0
  76. package/context/contracts/work-item-contract.md +215 -0
  77. package/context/deferred/demo-mode.md +33 -0
  78. package/context/deferred/languages/go.md +31 -0
  79. package/context/deferred/languages/python.md +31 -0
  80. package/context/deferred/languages/typescript.md +34 -0
  81. package/context/deferred/parallelization.md +35 -0
  82. package/context/deferred/worktree-isolation.md +24 -0
  83. package/context/development-workflow.md +50 -0
  84. package/context/scripts/context-budget/budget-scan.sh +166 -0
  85. package/context/scripts/detect-tools.sh +3 -0
  86. package/context/scripts/discover-agents.sh +28 -0
  87. package/context/scripts/git-status.sh +49 -0
  88. package/context/scripts/hooks/config-protection.js +79 -0
  89. package/context/scripts/hooks/desktop-notify.sh +39 -0
  90. package/context/scripts/hooks/governance-audit.sh +135 -0
  91. package/context/scripts/hooks/lib/audit-transport.sh +40 -0
  92. package/context/scripts/hooks/lib/hook-flags.js +49 -0
  93. package/context/scripts/hooks/lib/patterns.sh +57 -0
  94. package/context/scripts/hooks/lib/resolve-formatter.js +80 -0
  95. package/context/scripts/hooks/post-edit-accumulator.js +66 -0
  96. package/context/scripts/hooks/pre-commit-quality.js +194 -0
  97. package/context/scripts/hooks/quality-gate.js +93 -0
  98. package/context/scripts/hooks/report-only-guard.js +21 -0
  99. package/context/scripts/hooks/run-hook.js +136 -0
  100. package/context/scripts/hooks/stop-format-typecheck.js +141 -0
  101. package/context/scripts/hooks/stop-goal-fit.js +337 -0
  102. package/context/scripts/hooks/workflow-steering.js +250 -0
  103. package/context/scripts/telemetry/console-presets.sh +14 -0
  104. package/context/scripts/telemetry/install-console-config.sh +214 -0
  105. package/context/scripts/telemetry/lib/config.sh +85 -0
  106. package/context/scripts/telemetry/lib/enrich.sh +115 -0
  107. package/context/scripts/telemetry/lib/redact.sh +22 -0
  108. package/context/scripts/telemetry/lib/session.sh +63 -0
  109. package/context/scripts/telemetry/lib/transport.sh +183 -0
  110. package/context/scripts/telemetry/lib/usage.sh +29 -0
  111. package/context/scripts/telemetry/sync-agents.sh +173 -0
  112. package/context/scripts/telemetry/telemetry.conf +23 -0
  113. package/context/scripts/telemetry/telemetry.sh +387 -0
  114. package/context/scripts/validate-package.sh +89 -0
  115. package/context/settings/backlog-provider-settings.json +54 -0
  116. package/context/templates/core/identity.md +26 -0
  117. package/context/templates/core/user.md +15 -0
  118. package/docs/_config.yml +15 -0
  119. package/docs/_layouts/default.html +87 -0
  120. package/docs/adr/0001-flow-agents-consumes-flow.md +77 -0
  121. package/docs/adr/0002-flow-kits-as-extension-unit.md +13 -0
  122. package/docs/adr/0003-flow-agents-coordinates-kits-and-adapters.md +13 -0
  123. package/docs/adr/0004-gates-expect-surface-claims.md +15 -0
  124. package/docs/adr/0005-kubernetes-inspired-resource-contracts.md +48 -0
  125. package/docs/adr/0006-typescript-first-source-policy.md +98 -0
  126. package/docs/agent-system-guidebook.md +391 -0
  127. package/docs/agent-usage-feedback-loop.md +351 -0
  128. package/docs/assets/favicon.svg +13 -0
  129. package/docs/assets/og-image.png +0 -0
  130. package/docs/assets/site.css +774 -0
  131. package/docs/assets/site.js +139 -0
  132. package/docs/configurable-workflow-routing.md +174 -0
  133. package/docs/context-map.md +145 -0
  134. package/docs/developer-architecture.md +145 -0
  135. package/docs/developer-hook-setup.md +61 -0
  136. package/docs/fixture-ownership.md +44 -0
  137. package/docs/flow-kit-repository-contract.md +180 -0
  138. package/docs/index.md +129 -0
  139. package/docs/kontour-resource-contract.md +358 -0
  140. package/docs/migrations.md +64 -0
  141. package/docs/north-star.md +322 -0
  142. package/docs/operating-layers.md +110 -0
  143. package/docs/repository-structure.md +132 -0
  144. package/docs/sandbox-policy.md +56 -0
  145. package/docs/skills-map.md +203 -0
  146. package/docs/standards-register.md +96 -0
  147. package/docs/veritas-integration.md +165 -0
  148. package/docs/work-item-adapters.md +72 -0
  149. package/docs/workflow-artifact-lifecycle.md +141 -0
  150. package/docs/workflow-eval-strategy.md +295 -0
  151. package/docs/workflow-shared-contracts.md +51 -0
  152. package/docs/workflow-usage-guide.md +443 -0
  153. package/evals/ARCHITECTURE.md +143 -0
  154. package/evals/CONVENTIONS.md +58 -0
  155. package/evals/README.md +128 -0
  156. package/evals/acceptance/run.sh +29 -0
  157. package/evals/acceptance/test_claude_harness.sh +242 -0
  158. package/evals/acceptance/test_codex_harness.sh +108 -0
  159. package/evals/acceptance/test_kiro_harness.sh +128 -0
  160. package/evals/cases/dev/404.html +97 -0
  161. package/evals/cases/dev/code-review.yaml +44 -0
  162. package/evals/cases/dev/dashboard.html +300 -0
  163. package/evals/cases/dev/deliver.yaml +66 -0
  164. package/evals/cases/dev/dependency-update.yaml +16 -0
  165. package/evals/cases/dev/explore.yaml +20 -0
  166. package/evals/cases/dev/index.html +370 -0
  167. package/evals/cases/dev/package-lock.json +28 -0
  168. package/evals/cases/dev/package.json +16 -0
  169. package/evals/cases/dev/plan-work.yaml +20 -0
  170. package/evals/cases/dev/promptfooconfig.yaml +666 -0
  171. package/evals/cases/dev/search-first.yaml +20 -0
  172. package/evals/cases/dev/tdd-workflow.yaml +48 -0
  173. package/evals/cases/dev/verify-work.yaml +44 -0
  174. package/evals/cases/dev/workflow.yaml +34 -0
  175. package/evals/ci/run-baseline.sh +283 -0
  176. package/evals/fixtures/backlog-provider-settings/global-default.json +44 -0
  177. package/evals/fixtures/backlog-provider-settings/project-override.json +53 -0
  178. package/evals/fixtures/builder-kit-workflow-state/baseline-freshness-resolution-hint.json +139 -0
  179. package/evals/fixtures/builder-kit-workflow-state/direct-primitive-stop.json +59 -0
  180. package/evals/fixtures/builder-kit-workflow-state/empty-board-route-shape.json +55 -0
  181. package/evals/fixtures/builder-kit-workflow-state/happy-path.json +71 -0
  182. package/evals/fixtures/builder-kit-workflow-state/mid-work-resume.json +80 -0
  183. package/evals/fixtures/builder-kit-workflow-state/missing-prestep-recovery.json +65 -0
  184. package/evals/fixtures/builder-kit-workflow-state/product-build-chaining.json +60 -0
  185. package/evals/fixtures/builder-kit-workflow-state/stale-continuation-requires-new-probe.json +57 -0
  186. package/evals/fixtures/console-learning-projection/artifacts/console-learning-correction/learning.json +50 -0
  187. package/evals/fixtures/console-learning-projection/artifacts/console-learning-open-route/learning.json +41 -0
  188. package/evals/fixtures/flow-kit-repository/invalid-absolute-path/kit.json +8 -0
  189. package/evals/fixtures/flow-kit-repository/invalid-asset-section/flows/review.flow.json +6 -0
  190. package/evals/fixtures/flow-kit-repository/invalid-asset-section/kit.json +11 -0
  191. package/evals/fixtures/flow-kit-repository/invalid-duplicate-flow/flows/review.flow.json +6 -0
  192. package/evals/fixtures/flow-kit-repository/invalid-duplicate-flow/kit.json +9 -0
  193. package/evals/fixtures/flow-kit-repository/invalid-id/flows/review.flow.json +6 -0
  194. package/evals/fixtures/flow-kit-repository/invalid-id/kit.json +8 -0
  195. package/evals/fixtures/flow-kit-repository/invalid-malformed-json/kit.json +8 -0
  196. package/evals/fixtures/flow-kit-repository/invalid-missing-flow/kit.json +8 -0
  197. package/evals/fixtures/flow-kit-repository/invalid-missing-id/flows/review.flow.json +6 -0
  198. package/evals/fixtures/flow-kit-repository/invalid-missing-id/kit.json +7 -0
  199. package/evals/fixtures/flow-kit-repository/invalid-missing-schema-version/flows/review.flow.json +6 -0
  200. package/evals/fixtures/flow-kit-repository/invalid-missing-schema-version/kit.json +7 -0
  201. package/evals/fixtures/flow-kit-repository/invalid-name/flows/review.flow.json +6 -0
  202. package/evals/fixtures/flow-kit-repository/invalid-name/kit.json +8 -0
  203. package/evals/fixtures/flow-kit-repository/invalid-schema-version/flows/review.flow.json +6 -0
  204. package/evals/fixtures/flow-kit-repository/invalid-schema-version/kit.json +8 -0
  205. package/evals/fixtures/flow-kit-repository/invalid-traversal/kit.json +8 -0
  206. package/evals/fixtures/flow-kit-repository/mixed-runtime-kit/adapters/example.json +3 -0
  207. package/evals/fixtures/flow-kit-repository/mixed-runtime-kit/assets/example.txt +1 -0
  208. package/evals/fixtures/flow-kit-repository/mixed-runtime-kit/docs/README.md +3 -0
  209. package/evals/fixtures/flow-kit-repository/mixed-runtime-kit/flows/runtime.flow.json +26 -0
  210. package/evals/fixtures/flow-kit-repository/mixed-runtime-kit/kit-evals/example.json +3 -0
  211. package/evals/fixtures/flow-kit-repository/mixed-runtime-kit/kit-skills/mixed/SKILL.md +3 -0
  212. package/evals/fixtures/flow-kit-repository/mixed-runtime-kit/kit.json +44 -0
  213. package/evals/fixtures/flow-kit-repository/valid-local-kit/docs/README.md +3 -0
  214. package/evals/fixtures/flow-kit-repository/valid-local-kit/flows/review.flow.json +26 -0
  215. package/evals/fixtures/flow-kit-repository/valid-local-kit/kit.json +20 -0
  216. package/evals/fixtures/hook-influence/cases.json +336 -0
  217. package/evals/fixtures/pull-work-provider/github-issues.json +170 -0
  218. package/evals/fixtures/pull-work-wip-shepherding/global-wip-informs.json +43 -0
  219. package/evals/fixtures/pull-work-wip-shepherding/personal-wip-blocks.json +42 -0
  220. package/evals/fixtures/surface-trust/accepted-claim-trust-report.json +31 -0
  221. package/evals/fixtures/surface-trust/artifact-absent.json +19 -0
  222. package/evals/fixtures/surface-trust/integrity-mismatch-trust-report.json +32 -0
  223. package/evals/fixtures/surface-trust/missing-authority-trust-report.json +27 -0
  224. package/evals/fixtures/surface-trust/provider-absent.json +19 -0
  225. package/evals/fixtures/surface-trust/rejected-claim-trust-report.json +30 -0
  226. package/evals/fixtures/surface-trust/stale-claim-trust-snapshot.json +31 -0
  227. package/evals/fixtures/usage-feedback/sample-full.jsonl +11 -0
  228. package/evals/fixtures/usage-feedback/sample-outcomes.jsonl +1 -0
  229. package/evals/fixtures/veritas-governance-adapter/fake-veritas-pass.sh +18 -0
  230. package/evals/fixtures/veritas-governance-adapter/fake-veritas-secret-fail.sh +10 -0
  231. package/evals/fixtures/veritas-governance-adapter/fake-veritas-unconfigured.sh +4 -0
  232. package/evals/integration/test_bundle_install.sh +541 -0
  233. package/evals/integration/test_console_learning_projection.sh +192 -0
  234. package/evals/integration/test_context_map.sh +65 -0
  235. package/evals/integration/test_effective_backlog_settings.sh +58 -0
  236. package/evals/integration/test_fixture_retirement_audit.sh +58 -0
  237. package/evals/integration/test_flow_agents_statusline.sh +93 -0
  238. package/evals/integration/test_flow_kit_repository.sh +90 -0
  239. package/evals/integration/test_goal_fit_hook.sh +482 -0
  240. package/evals/integration/test_hook_category_behaviors.sh +190 -0
  241. package/evals/integration/test_hook_influence_cases.sh +69 -0
  242. package/evals/integration/test_local_flow_kit_install.sh +145 -0
  243. package/evals/integration/test_publish_change_helper.sh +176 -0
  244. package/evals/integration/test_pull_work_provider.sh +140 -0
  245. package/evals/integration/test_runtime_adapter_activation.sh +106 -0
  246. package/evals/integration/test_telemetry.sh +485 -0
  247. package/evals/integration/test_telemetry_doctor.sh +193 -0
  248. package/evals/integration/test_usage_feedback_dashboard.sh +169 -0
  249. package/evals/integration/test_usage_feedback_global.sh +117 -0
  250. package/evals/integration/test_usage_feedback_import.sh +227 -0
  251. package/evals/integration/test_usage_feedback_outcomes.sh +165 -0
  252. package/evals/integration/test_usage_feedback_report.sh +263 -0
  253. package/evals/integration/test_veritas_governance_adapter.sh +235 -0
  254. package/evals/integration/test_workflow_artifact_cleanup_audit.sh +287 -0
  255. package/evals/integration/test_workflow_artifacts.sh +1247 -0
  256. package/evals/integration/test_workflow_sidecar_writer.sh +2112 -0
  257. package/evals/integration/test_workflow_steering_hook.sh +337 -0
  258. package/evals/lib/assertions/delegated-to.js +40 -0
  259. package/evals/lib/assertions/max-tool-calls.js +15 -0
  260. package/evals/lib/assertions/no-write-tools.js +27 -0
  261. package/evals/lib/assertions/pass-at-k.js +39 -0
  262. package/evals/lib/assertions/telemetry-utils.js +105 -0
  263. package/evals/lib/assertions/tool-called.js +39 -0
  264. package/evals/lib/assertions/verify-after-fix.js +61 -0
  265. package/evals/lib/claude-judge.sh +40 -0
  266. package/evals/lib/claude-provider.sh +74 -0
  267. package/evals/lib/codex-judge.sh +39 -0
  268. package/evals/lib/codex-provider.sh +81 -0
  269. package/evals/lib/eval-dev.sh +5 -0
  270. package/evals/lib/eval-judge.sh +22 -0
  271. package/evals/lib/eval-provider.sh +26 -0
  272. package/evals/lib/eval-report.sh +73 -0
  273. package/evals/lib/kiro-dev.sh +4 -0
  274. package/evals/lib/kiro-judge.sh +17 -0
  275. package/evals/lib/kiro-provider.sh +62 -0
  276. package/evals/lib/node.sh +111 -0
  277. package/evals/promptfooconfig.yaml +70 -0
  278. package/evals/run.sh +309 -0
  279. package/evals/static/test_evidence_refs.sh +141 -0
  280. package/evals/static/test_package.sh +407 -0
  281. package/evals/static/test_repo_hooks.sh +68 -0
  282. package/evals/static/test_universal_bundles.sh +274 -0
  283. package/evals/static/test_workflow_skills.sh +1207 -0
  284. package/install.sh +64 -0
  285. package/integrations/veritas/flow-agents.adapter.json +138 -0
  286. package/integrations/veritas/flow-agents.authority-settings.json +26 -0
  287. package/integrations/veritas/flow-agents.repo-standards.json +82 -0
  288. package/kits/builder/flows/build.flow.json +218 -0
  289. package/kits/builder/flows/shape.flow.json +127 -0
  290. package/kits/builder/kit.json +19 -0
  291. package/kits/catalog.json +11 -0
  292. package/package.json +130 -0
  293. package/packaging/README.md +60 -0
  294. package/packaging/manifest.json +173 -0
  295. package/packaging/packs.json +69 -0
  296. package/powers/dependency-checker/POWER.md +20 -0
  297. package/powers/dependency-checker/mcp.json +20 -0
  298. package/powers/playwright/POWER.md +25 -0
  299. package/powers/playwright/mcp.json +12 -0
  300. package/prompts/code-audit.md +123 -0
  301. package/prompts/kcommit.md +88 -0
  302. package/schemas/backlog-provider-settings.schema.json +138 -0
  303. package/schemas/workflow-acceptance.schema.json +216 -0
  304. package/schemas/workflow-critique.schema.json +113 -0
  305. package/schemas/workflow-evidence.schema.json +357 -0
  306. package/schemas/workflow-handoff.schema.json +52 -0
  307. package/schemas/workflow-learning.schema.json +223 -0
  308. package/schemas/workflow-release.schema.json +172 -0
  309. package/schemas/workflow-state.schema.json +80 -0
  310. package/scripts/README.md +111 -0
  311. package/scripts/build-universal-bundles.js +3 -0
  312. package/scripts/check-content-boundary.cjs +99 -0
  313. package/scripts/context-budget/budget-scan.sh +166 -0
  314. package/scripts/detect-tools.sh +3 -0
  315. package/scripts/discover-agents.sh +28 -0
  316. package/scripts/effective-backlog-settings.js +2 -0
  317. package/scripts/filter-installed-packs.js +2 -0
  318. package/scripts/flow-kit.js +2 -0
  319. package/scripts/generate-context-map.js +2 -0
  320. package/scripts/git-status.sh +49 -0
  321. package/scripts/hooks/claude-hook-adapter.js +174 -0
  322. package/scripts/hooks/claude-telemetry-hook.js +115 -0
  323. package/scripts/hooks/codex-hook-adapter.js +176 -0
  324. package/scripts/hooks/codex-telemetry-hook.js +95 -0
  325. package/scripts/hooks/config-protection.js +79 -0
  326. package/scripts/hooks/desktop-notify.sh +39 -0
  327. package/scripts/hooks/governance-audit.sh +135 -0
  328. package/scripts/hooks/lib/audit-transport.sh +40 -0
  329. package/scripts/hooks/lib/hook-flags.js +49 -0
  330. package/scripts/hooks/lib/patterns.sh +57 -0
  331. package/scripts/hooks/lib/resolve-formatter.js +80 -0
  332. package/scripts/hooks/post-edit-accumulator.js +66 -0
  333. package/scripts/hooks/pre-commit-quality.js +194 -0
  334. package/scripts/hooks/quality-gate.js +93 -0
  335. package/scripts/hooks/report-only-guard.js +21 -0
  336. package/scripts/hooks/run-hook.js +136 -0
  337. package/scripts/hooks/stop-format-typecheck.js +141 -0
  338. package/scripts/hooks/stop-goal-fit.js +337 -0
  339. package/scripts/hooks/workflow-steering.js +250 -0
  340. package/scripts/install-codex-home.sh +106 -0
  341. package/scripts/package.json +3 -0
  342. package/scripts/promote-workflow-artifact.js +2 -0
  343. package/scripts/publish-change-helper.js +2 -0
  344. package/scripts/pull-work-provider.js +2 -0
  345. package/scripts/setup-repo-hooks.sh +8 -0
  346. package/scripts/statusline/flow-agents-statusline.js +157 -0
  347. package/scripts/telemetry/console-presets.sh +14 -0
  348. package/scripts/telemetry/install-console-config.sh +214 -0
  349. package/scripts/telemetry/lib/config.sh +85 -0
  350. package/scripts/telemetry/lib/enrich.sh +115 -0
  351. package/scripts/telemetry/lib/redact.sh +22 -0
  352. package/scripts/telemetry/lib/session.sh +63 -0
  353. package/scripts/telemetry/lib/transport.sh +183 -0
  354. package/scripts/telemetry/lib/usage.sh +29 -0
  355. package/scripts/telemetry/sync-agents.sh +173 -0
  356. package/scripts/telemetry/telemetry.conf +23 -0
  357. package/scripts/telemetry/telemetry.sh +387 -0
  358. package/scripts/usage-feedback.js +2 -0
  359. package/scripts/validate-hook-influence-cases.js +2 -0
  360. package/scripts/validate-package.sh +89 -0
  361. package/scripts/validate-source-tree.js +9 -0
  362. package/skills/agentic-engineering/SKILL.md +62 -0
  363. package/skills/browser-test/SKILL.md +51 -0
  364. package/skills/builder-shape/SKILL.md +76 -0
  365. package/skills/context-budget/SKILL.md +40 -0
  366. package/skills/deliver/SKILL.md +241 -0
  367. package/skills/dependency-update/SKILL.md +68 -0
  368. package/skills/design-probe/SKILL.md +107 -0
  369. package/skills/eval-rebuild/SKILL.md +39 -0
  370. package/skills/evidence-gate/SKILL.md +186 -0
  371. package/skills/execute-plan/SKILL.md +110 -0
  372. package/skills/explore/SKILL.md +137 -0
  373. package/skills/feedback-loop/SKILL.md +87 -0
  374. package/skills/fix-bug/SKILL.md +133 -0
  375. package/skills/frontend-design/SKILL.md +80 -0
  376. package/skills/github-cli/SKILL.md +63 -0
  377. package/skills/idea-to-backlog/SKILL.md +267 -0
  378. package/skills/knowledge-capture/SKILL.md +55 -0
  379. package/skills/learning-review/SKILL.md +115 -0
  380. package/skills/pickup-probe/SKILL.md +114 -0
  381. package/skills/plan-work/SKILL.md +176 -0
  382. package/skills/pull-work/SKILL.md +309 -0
  383. package/skills/release-readiness/SKILL.md +121 -0
  384. package/skills/review-work/SKILL.md +161 -0
  385. package/skills/search-first/SKILL.md +66 -0
  386. package/skills/tdd-workflow/SKILL.md +140 -0
  387. package/skills/verify-work/SKILL.md +109 -0
  388. package/src/cli/console-learning-projection.ts +140 -0
  389. package/src/cli/effective-backlog-settings.ts +99 -0
  390. package/src/cli/fixture-retirement-audit.ts +154 -0
  391. package/src/cli/flow-kit.ts +139 -0
  392. package/src/cli/init.ts +248 -0
  393. package/src/cli/promote-workflow-artifact.ts +64 -0
  394. package/src/cli/publish-change-helper.ts +143 -0
  395. package/src/cli/pull-work-provider.ts +481 -0
  396. package/src/cli/runtime-adapter.ts +24 -0
  397. package/src/cli/telemetry-doctor.ts +243 -0
  398. package/src/cli/usage-feedback.ts +418 -0
  399. package/src/cli/validate-hook-influence.ts +119 -0
  400. package/src/cli/validate-source-tree.ts +30 -0
  401. package/src/cli/validate-workflow-artifacts.ts +411 -0
  402. package/src/cli/veritas-governance.ts +322 -0
  403. package/src/cli/workflow-artifact-cleanup-audit.ts +281 -0
  404. package/src/cli/workflow-sidecar.ts +676 -0
  405. package/src/cli.ts +95 -0
  406. package/src/flow-kit/validate.ts +74 -0
  407. package/src/lib/args.ts +43 -0
  408. package/src/lib/fs.ts +62 -0
  409. package/src/lib/workflow-learning-projection.ts +491 -0
  410. package/src/runtime-adapters.ts +154 -0
  411. package/src/tools/build-universal-bundles.ts +366 -0
  412. package/src/tools/common.ts +61 -0
  413. package/src/tools/filter-installed-packs.ts +129 -0
  414. package/src/tools/generate-context-map.ts +199 -0
  415. package/src/tools/validate-package.ts +57 -0
  416. package/src/tools/validate-source-tree.ts +488 -0
  417. package/tsconfig.json +19 -0
  418. package/veritas.claims.json +6 -0
package/README.md ADDED
@@ -0,0 +1,129 @@
1
+ <div align="center">
2
+
3
+ # Kontour Flow Agents
4
+
5
+ **The discipline of Kontour Flow, inside the agent tools you already use.**
6
+
7
+ [![CI](https://github.com/kontourai/flow-agents/actions/workflows/ci.yml/badge.svg)](https://github.com/kontourai/flow-agents/actions/workflows/ci.yml)
8
+ [![License](https://img.shields.io/badge/license-Apache--2.0-blue.svg)](LICENSE)
9
+ [![Node >= 22](https://img.shields.io/badge/node-%3E%3D22-brightgreen)](package.json)
10
+
11
+ [Documentation](https://kontourai.github.io/flow-agents/) · [Workflow Guide](docs/workflow-usage-guide.md) · [System Guidebook](docs/agent-system-guidebook.md) · [Kontour Flow](https://kontourai.github.io/flow/)
12
+
13
+ </div>
14
+
15
+ ---
16
+
17
+ Coding agents are powerful and forgetful. They plan well, then drift. They skip verification when context gets crowded. They call partial work done, and after a compaction nobody — including the agent — can say where the work actually stands.
18
+
19
+ Flow Agents wraps Codex, Claude Code, Kiro, and CI agents in an operating layer that makes long-running work inspectable: workflow skills that route requests into the right procedure, durable sidecar state that survives compaction and handoff, hooks that catch stop-short behavior, evidence gates before release decisions, and learning loops that feed corrections back into the system. [Kontour Flow](https://kontourai.github.io/flow/) owns the gate semantics underneath; Flow Agents makes that enforcement native inside agent harnesses.
20
+
21
+ **You ask for outcomes. The system supplies the path, the state, the checks, and the proof.**
22
+
23
+ ## What you get
24
+
25
+ - **One workflow across runtimes** — the same `idea → backlog → plan → build → review → verify → evidence → release → learning` path installs into Codex, Claude Code, and Kiro without rewriting it per tool.
26
+ - **Workflow skills** — `idea-to-backlog`, `pull-work`, `plan-work`, `execute-plan`, `review-work`, `verify-work`, `evidence-gate`, `release-readiness`, `learning-review`, and orchestrators like `deliver` and `fix-bug` that chain them.
27
+ - **Durable workflow state** — schema-validated sidecars under `.flow-agents/` record acceptance criteria, evidence, critique, handoff, and learning, so any session can resume from recorded state instead of chat memory.
28
+ - **Stop-short protection** — runtime hooks check sidecar state and route the agent back when required evidence is missing, instead of letting it summarize past the gap.
29
+ - **Evidence over confidence** — important work ends with tests, browser checks, CI results, review findings, governance reports, or an explicit `NOT_VERIFIED` gap. Optional [Veritas](docs/veritas-integration.md) integration attaches repo-governance evidence without making it mandatory.
30
+ - **Evals that keep the bundle honest** — static, integration, and behavioral eval lanes validate the skills, contracts, fixtures, and hook influence as the bundle evolves.
31
+
32
+ ## Install
33
+
34
+ ```bash
35
+ # guided install into your workspace
36
+ npx @kontourai/flow-agents init --dest /path/to/workspace
37
+
38
+ # headless, for CI or scripts
39
+ npx @kontourai/flow-agents init --dest /path/to/workspace --telemetry-sink local-files --yes
40
+
41
+ # with runtime-specific wiring and kit activation
42
+ npx @kontourai/flow-agents init --runtime codex --dest /path/to/workspace --activate-kits --yes
43
+ ```
44
+
45
+ Until the first npm release lands, the same commands work from a checkout:
46
+
47
+ ```bash
48
+ git clone https://github.com/kontourai/flow-agents.git
49
+ cd flow-agents && npm install && npm run build
50
+ node build/src/cli.js init --dest /path/to/workspace
51
+ ```
52
+
53
+ The installer copies the bundled agents, skills, context, scripts, evals, Flow Kit assets, and the Flow Agents-owned `console.telemetry.json` descriptor into the target workspace. Telemetry writes to local files by default; optional sinks mirror it to a local, hosted, or self-hosted Kontour Console (`--telemetry-sink local-kontour-console | kontour-hosted-console | user-hosted-console --console-url …`).
54
+
55
+ The low-level bundle installer remains available when you already have a generated bundle checkout:
56
+
57
+ ```bash
58
+ bash install.sh /path/to/workspace --telemetry-sink local-kontour-console
59
+ ```
60
+
61
+ ## Use it
62
+
63
+ After installing, ask the agent for the workflow you want — in plain language:
64
+
65
+ ```text
66
+ Use Builder Kit shape for this feature idea and create executable GitHub issues.
67
+ ```
68
+
69
+ ```text
70
+ Use pull-work, select the next ready issue, and hand it to plan-work.
71
+ ```
72
+
73
+ ```text
74
+ Use deliver for this issue. Plan it, execute it, verify it, and stop if evidence is missing.
75
+ ```
76
+
77
+ ```text
78
+ Use fix-bug. Reproduce the issue, diagnose root cause, plan the fix, implement it, and verify the regression path.
79
+ ```
80
+
81
+ The [Workflow Usage Guide](docs/workflow-usage-guide.md) walks every stage with example prompts and expected behavior; the [Agent System Guidebook](docs/agent-system-guidebook.md) is the plain-language map of how the pieces fit.
82
+
83
+ ## Where Flow Agents fits
84
+
85
+ Kontour AI shows the work behind AI. Each product stands alone; together they cohere:
86
+
87
+ | Product | Owns |
88
+ | --- | --- |
89
+ | **[Surface](https://github.com/kontourai/surface)** | Portable trust state: claims, evidence, policies, trust snapshots |
90
+ | **[Flow](https://github.com/kontourai/flow)** | Process transparency: steps, gates, transitions, runs, exceptions, reports |
91
+ | **[Veritas](https://github.com/kontourai/veritas)** | Code/change transparency: repo standards, merge readiness |
92
+ | **Flow Agents** | Agent-facing distribution: skills, kits, runtime adapters, hooks, telemetry |
93
+
94
+ Flow Agents owns the glue — discovery, just-in-time guidance, scoped delegation, Flow-backed state inside harnesses, evidence-backed completion, and feedback loops. It deliberately does not own the model, the runtime, the workflow engine, or repo governance. The [North Star](docs/north-star.md) records the direction and design principles.
95
+
96
+ ## Developer commands
97
+
98
+ ```bash
99
+ npm run setup:repo-hooks # enable the tracked .githooks pre-push lane
100
+ npm run validate:source -- # source-tree and contract validation
101
+ bash evals/run.sh static # static eval suite
102
+ ```
103
+
104
+ For release-readiness or repo-shape changes, run the split CI baseline locally:
105
+
106
+ ```bash
107
+ bash evals/ci/run-baseline.sh --lane source-and-static
108
+ bash evals/ci/run-baseline.sh --lane workflow-contracts
109
+ bash evals/ci/run-baseline.sh --lane runtime-and-kit
110
+ ```
111
+
112
+ `setup:repo-hooks` is a repo Git hook for local developer checks, not a Flow Agents runtime hook — runtime hooks live under `scripts/hooks/`; see [docs/developer-hook-setup.md](docs/developer-hook-setup.md) for the boundary.
113
+
114
+ ## Repository layout
115
+
116
+ See [Repository Structure](docs/repository-structure.md) for the canonical map. In short:
117
+
118
+ - `agents/`, `agent-cards/`, `skills/`, `context/`, `powers/`, and `prompts/` are canonical bundle source.
119
+ - `src/` and `scripts/` are product, tooling, validation, installer, hook, telemetry, and compatibility source; see [scripts/README.md](scripts/README.md).
120
+ - `kits/`, `schemas/`, `packaging/`, `evals/`, `docs/`, and `integrations/` hold Flow Kit assets, contracts, package metadata, evals, durable docs, and optional integrations.
121
+ - `dist/`, `build/`, and `_site/` are generated output. Local `.flow-agents/`, `.codex/`, `.claude/`, telemetry, promptfoo, Veritas, and cache directories are runtime state and stay ignored; durable outcomes belong in docs, source, schemas, or provider records.
122
+
123
+ ## Documentation
124
+
125
+ The [GitHub Pages site](https://kontourai.github.io/flow-agents/) is the product overview and quickstart. The repository docs are the developer reference for contracts, workflow behavior, evals, and integration boundaries. For the gate semantics underneath — definitions, runs, evidence, route-back — read the [Kontour Flow documentation](https://kontourai.github.io/flow/).
126
+
127
+ ## License
128
+
129
+ [Apache-2.0](LICENSE) © Kontour AI
package/SECURITY.md ADDED
@@ -0,0 +1,33 @@
1
+ # Security Policy
2
+
3
+ ## Reporting A Vulnerability
4
+
5
+ Do not open a public GitHub issue for security reports.
6
+
7
+ Send a private report to `security@kontourai.com` with:
8
+
9
+ - a short summary of the issue
10
+ - affected versions or commit range
11
+ - reproduction steps or evidenceCheck of concept
12
+ - impact assessment
13
+ - any suggested remediation
14
+
15
+ If email is not possible, open a private GitHub security advisory draft instead.
16
+
17
+ ## What To Expect
18
+
19
+ - We will acknowledge receipt within 3 business days.
20
+ - We will aim to confirm impact and next steps within 7 business days.
21
+ - We will coordinate on disclosure timing once a fix exists or a mitigation is available.
22
+
23
+ ## Scope
24
+
25
+ Security issues in scope include:
26
+
27
+ - command execution or injection flaws
28
+ - privilege or permission escalation
29
+ - unsafe handling of secrets or credentials
30
+ - artifact or workflow trust-boundary violations
31
+ - supply-chain or package-publishing exposure in this repository
32
+
33
+ Quality bugs, documentation bugs, and feature requests should go through the normal issue tracker.
@@ -0,0 +1,19 @@
1
+ {
2
+ "name": "Development Orchestrator",
3
+ "agent": "dev",
4
+ "description": "Handles coding, refactoring, debugging, planning, verification, and code-quality workflows.",
5
+ "domain": "engineering",
6
+ "capabilities": [
7
+ "code-implementation",
8
+ "planning",
9
+ "verification",
10
+ "code-review",
11
+ "security-review",
12
+ "dependency-updates",
13
+ "playwright-ui-validation"
14
+ ],
15
+ "preferredDelegation": {
16
+ "background": "tool-agent-delegate",
17
+ "interactive": "tool-agent-handoff"
18
+ }
19
+ }
@@ -0,0 +1,127 @@
1
+ {
2
+ "allowedTools": [
3
+ "todo_list",
4
+ "thinking",
5
+ "web_fetch",
6
+ "web_search",
7
+ "code",
8
+ "read",
9
+ "imageRead",
10
+ "shell",
11
+ "ls",
12
+ "subagent",
13
+ "knowledge",
14
+ "grep",
15
+ "glob"
16
+ ],
17
+ "hooks": {
18
+ "agentSpawn": [
19
+ {
20
+ "command": "bash ~/.flow-agents/scripts/detect-tools.sh",
21
+ "timeout_ms": 5000
22
+ },
23
+ {
24
+ "command": "bash ~/.flow-agents/scripts/telemetry/telemetry.sh agentSpawn dev",
25
+ "timeout_ms": 5000
26
+ }
27
+ ],
28
+ "postToolUse": [
29
+ {
30
+ "command": "bash ~/.flow-agents/scripts/telemetry/telemetry.sh postToolUse dev",
31
+ "matcher": "*",
32
+ "timeout_ms": 3000
33
+ },
34
+ {
35
+ "command": "node ~/.flow-agents/scripts/hooks/run-hook.js post:edit:accumulator post-edit-accumulator.js standard,strict",
36
+ "matcher": "fs_write",
37
+ "timeout_ms": 5000
38
+ },
39
+ {
40
+ "command": "node ~/.flow-agents/scripts/hooks/run-hook.js post:quality-gate quality-gate.js strict",
41
+ "matcher": "fs_write",
42
+ "timeout_ms": 15000
43
+ },
44
+ {
45
+ "command": "node ~/.flow-agents/scripts/hooks/run-hook.js post:workflow-steering workflow-steering.js standard,strict",
46
+ "matcher": "*",
47
+ "timeout_ms": 3000
48
+ }
49
+ ],
50
+ "preToolUse": [
51
+ {
52
+ "command": "bash ~/.flow-agents/scripts/telemetry/telemetry.sh preToolUse dev",
53
+ "matcher": "*",
54
+ "timeout_ms": 3000
55
+ },
56
+ {
57
+ "command": "node ~/.flow-agents/scripts/hooks/run-hook.js pre:config-protection config-protection.js standard,strict",
58
+ "matcher": "fs_write",
59
+ "timeout_ms": 5000
60
+ },
61
+ {
62
+ "command": "node ~/.flow-agents/scripts/hooks/run-hook.js pre:commit-quality pre-commit-quality.js standard,strict",
63
+ "matcher": "execute_bash",
64
+ "timeout_ms": 30000
65
+ }
66
+ ],
67
+ "stop": [
68
+ {
69
+ "command": "bash ~/.flow-agents/scripts/telemetry/telemetry.sh stop dev",
70
+ "timeout_ms": 5000
71
+ },
72
+ {
73
+ "command": "node ~/.flow-agents/scripts/hooks/run-hook.js stop:format-typecheck stop-format-typecheck.js standard,strict",
74
+ "timeout_ms": 300000
75
+ },
76
+ {
77
+ "command": "node ~/.flow-agents/scripts/hooks/run-hook.js stop:goal-fit stop-goal-fit.js standard,strict",
78
+ "timeout_ms": 5000
79
+ }
80
+ ],
81
+ "userPromptSubmit": [
82
+ {
83
+ "command": "bash ~/.flow-agents/scripts/telemetry/telemetry.sh userPromptSubmit dev",
84
+ "timeout_ms": 5000
85
+ },
86
+ {
87
+ "command": "node ~/.flow-agents/scripts/hooks/run-hook.js prompt:workflow-steering workflow-steering.js standard,strict",
88
+ "timeout_ms": 3000
89
+ }
90
+ ]
91
+ },
92
+ "keyboardShortcut": "ctrl+b",
93
+ "resources": [
94
+ "file://AGENTS.md",
95
+ "file://.kiro/steering/**/*.md",
96
+ "file://~/.kiro/steering/**/*.md",
97
+ "file://~/.flow-agents/context/common/orchestrators.md",
98
+ "skill://.kiro/skills/**/SKILL.md",
99
+ "skill://~/.kiro/skills/**/SKILL.md",
100
+ "skill://~/.flow-agents/skills/**/SKILL.md",
101
+ "file://~/.flow-agents/context/*.md"
102
+ ],
103
+ "tools": [
104
+ "@builtin"
105
+ ],
106
+ "toolsSettings": {
107
+ "shell": {
108
+ "autoAllowReadonly": true
109
+ },
110
+ "subagent": {
111
+ "availableAgents": [
112
+ "tool-*"
113
+ ],
114
+ "trustedAgents": [
115
+ "tool-*"
116
+ ]
117
+ },
118
+ "write": {
119
+ "allowedPaths": []
120
+ }
121
+ },
122
+ "welcomeMessage": "Flow Agents dev mode is ready for engineering work.",
123
+ "name": "dev",
124
+ "description": "Development agent for coding tasks. Writes, modifies, and validates code following existing patterns. Delegates to specialists for domain-specific research when available.",
125
+ "prompt": "You are a Development Agent. You write and modify code, validate it works, and deliver clean results. Delegate to specialist subagents whenever a loaded skill defines them \u2014 never do manually what a skill's subagents can do in parallel.\n\n\u26d4 You own the code \u2014 specialists provide context.\n\n## Flow Kit Boundary\nFlow owns Flow Definition gate semantics, typed `expects`, `kind: \"surface.claim\"`, trusted producer config, and gate overrides. Flow Agents coordinates Flow Kit installation, runtime adapters, local control, and workflow artifacts. Builder Kit is the first bundled Flow Kit; use Builder Kit, Kit Catalog, Flow Kit, Probe, and `design-probe` vocabulary in guidance and artifacts.\n\n## Hard Route\nIf the user asks to explore a repository, explain what a codebase does, summarize project structure, or otherwise perform repository discovery, you MUST activate the `explore` skill before any file reads, greps, globs, shell exploration, or direct synthesis. This is a hard rule, not a preference.\n\nIf the user asks to build, create, implement, ship, or deliver a tool/app/service/feature, you MUST activate `deliver` first unless they explicitly request TDD, in which case activate `tdd-workflow` instead. Do not let `search-first` override `deliver` for broad build requests.\n\n## Skill Activation (MANDATORY FIRST STEP)\nYou have loaded skills in your context. Your FIRST action on EVERY request MUST be:\n1. Call the thinking tool\n2. State the user's request\n3. Scan ALL loaded skills by name and description \u2014 explicitly list candidates\n4. If a skill matches: state \"Activating skill: [name]\", read its SKILL.md, then delegate to the subagents it specifies immediately. Do NOT verify prerequisites yourself \u2014 the subagent handles the full workflow. Your NEXT tool call after reading the skill MUST be use_subagent \u2014 do not explore, search, or verify first.\n\nCommon skill triggers (activate these, don't handle manually):\n- Codebase exploration, repo overview, \"explore the codebase\", \"tell me what this codebase does\" \u2192 explore (delegate to tool-explore-* and respect current harness subagent limits)\n- Build, create, implement, ship, or deliver a tool/app/service/feature \u2192 deliver (unless the user explicitly requests TDD)\n- Prompt(<name>) syntax \u2192 run-prompt (use introspect to discover prompts, NOT filesystem)\n- Adding a small utility/library without a broader build request \u2192 search-first (research before coding)\n- Dependency/security scanning \u2192 dependency-update \u2192 tool-dependencies-updater\n- Code quality, standards, architecture, or security critique \u2192 review-work \u2192 tool-code-reviewer and conditional tool-security-reviewer\n- Verification/acceptance criteria/evidence \u2192 verify-work \u2192 tool-verifier\n- \"Verify changes work\" / \"check build and UI\" \u2192 feedback-loop\n- Task includes a UI component (login page, dashboard, form) \u2192 activate frontend-design for that portion. If the task ALSO has non-UI work, use deliver for the full task but delegate the UI portion to frontend-design within the plan\n\n5. If NO skill matches: proceed to Phase 0. You MUST execute these in order before writing any code:\n a. todo_list \u2014 check/load existing work (Phase 0)\n b. execute_bash with `git status` \u2014 check working tree (Phase 1)\n c. todo_list \u2014 create a plan for the task (Phase 2)\n\nNEVER skip this step. NEVER call fs_read, code, grep, glob, or execute_bash before completing skill activation check.\n\n## Session File Awareness\nOn session start, check for resumption candidates:\n1. **Session files**: check `.flow-agents/` for existing session files (`deliver`, `fix-bug`, `plan-work` types)\n2. **Boo jobs**: if boo is available, run `boo list --format json` and look for recent jobs with descriptions or names related to the current project that may need follow-up\n\nIf found:\n- Briefly mention what's in flight (name, status, iteration or last run)\n- Ask: resume existing work or start fresh?\n- Session files: read the file, determine current phase, invoke the appropriate primitive skill\n- Boo jobs: use `boo resume <job>` or read the job's artifacts for context\n\n## Plan \u2192 Execute \u2192 Review \u2192 Verify Loop\nThe Builder Kit workflow uses composable primitives: `pull-work`, `design-probe` when assumptions need challenge, `plan-work`, `execute-plan`, `review-work`, and `verify-work`. These can be invoked independently or chained by orchestrator skills (deliver, fix-bug). When the loop runs:\n- plan-work produces a plan artifact that tool-worker agents read directly (no orchestrator interpretation)\n- execute-plan fans out parallel waves and checkpoints progress between them\n- review-work produces critique in `critique.json`: findings route back to execute-plan or user decision\n- verify-work produces evidence in `evidence.json`: PASS \u2192 deliver/evidence-gate, FAIL \u2192 re-plan and loop, NOT_VERIFIED \u2192 ask user\n\n## Specialist Agents\n\nThese agents handle domain-specific tasks. Delegate \u2014 do NOT do their work manually.\n\n| Request | Delegate To | Trigger |\n|---|---|---|\n| Code quality, standards, architecture review | tool-code-reviewer (via review-work) | readability, maintainability, DRY, patterns, architecture fit |\n| Security review | tool-security-reviewer (via review-work) | OWASP, vulnerabilities, secrets, auth/authz |\n| Verification | tool-verifier (via verify-work) | acceptance criteria, build/test/lint/security evidence |\n| Dependency audit | tool-dependencies-updater | outdated packages, CVEs, version checks |\n\nDelegation means use_subagent \u2014 not reading code yourself. If a skill says delegate to X, invoke X. If no session file exists for verify-work, delegate to tool-verifier directly with the user's request. If target code doesn't exist for review, delegate anyway \u2014 let the reviewer agent handle discovery.\n\nDelegation pattern (follow this exactly):\n1. thinking: identify skill + target agent\n2. fs_read: read SKILL.md\n3. use_subagent: invoke the agent specified by the skill\nDo NOT insert exploration steps (grep, glob, fs_read of source code) between reading the skill and delegating.\n\n## Progress Checkpointing\nAfter each significant step (plan produced, wave completed, review done, verification done), update the session file in `.flow-agents/<slug>/` with current status, completed tasks, and next action. The session file is your recovery point \u2014 if context is lost, a new session should be able to read it and know exactly where to pick up.\n\n## Workflow\nWhen no skill matches, follow these phases in order. Do NOT skip phases even for simple tasks.\n\n### Phase 0: CHECK EXISTING WORK\nGoal: Understand what work is already in progress for current directory\n- For any incomplete TODOs, `load` them to review tasks, context, and modified files\n- Check `.flow-agents/` for session files from plan-work, deliver, fix-bug\n- Summarize findings to the user: what's in progress, what's done, what files are being touched\n- If the user's request relates to an existing TODO or session file, ask whether to continue it or start fresh\n- Exit: You know what's in flight and which files may overlap with your task\n\n### Phase 1: ORIENT\nGoal: Understand and explore the codebase and task before touching anything.\n- Run `git status` and `git diff` to check for uncommitted changes \u2014 NEVER overwrite unsaved work\n- Explore relevant code: read existing implementation, conventions, patterns, dependencies, and tests\n- Cross-reference with in-progress TODOs from Phase 0 \u2014 if your task's files overlap with another TODO's `modified_files`, create a git worktree (`git worktree add ../worktree/kiro-<todo-id>-<feature> -b feat/<feature>`) and work there instead\n- If requirements are ambiguous, ask the user before proceeding\n- Exit: You can describe what needs to change and where\n\n### Phase 2: PLAN\nGoal: Define the set of changes needed.\n- Create a TODO list using the todo_list tool \u2014 required for ALL tasks, even single-file changes\n- Identify files to create/modify and the specific changes in each\n- If the task includes visual/UI changes (HTML, CSS, components, pages), include a tool-playwright verification step in the plan. This is MANDATORY \u2014 do not skip visual verification for any visual change\n- Prefer modifying existing code over creating new files\n- Exit: A concrete list of changes, no open questions\n\n### Phase 3: IMPLEMENT\nGoal: Write the code.\n- Follow existing patterns, naming conventions, and project structure\n- Write the minimum code necessary \u2014 no speculative features\n- No fake data, no placeholder stubs, no silent fallbacks. Errors MUST propagate \u2014 never catch and return null, empty arrays, default objects, or fallback values. Use try/catch only to add context before re-throwing.\n- Apply DRY principles \u2014 check if similar logic already exists before writing new code\n- Mark TODO items complete as you finish each change\n- Exit: All planned changes are written\n\n### Phase 4: VALIDATE\nGoal: Prove the code works with evidence. Describing what you did is NOT validation.\n\nClassify every change:\n- **Visual** (UI, CSS, layouts, components) \u2192 delegate to tool-playwright: load the page, take screenshots, verify elements exist and render correctly\n- **Integration** (APIs, CLIs, configs, logic, builds) \u2192 run tests, execute the code, capture actual output\n- **Both** \u2192 run both paths\n\nRules:\n- Evidence is mandatory \u2014 show output, screenshots, or test results. \u201cI made the change\u201d is not evidence.\n- If validation fails, fix and re-validate. Do NOT skip, downgrade to a weaker method, or punt to the user.\n- If a verification method should work but isn't, debug the method itself. Don't fall back to \u201cthe build passes so it's probably fine.\u201d\n- Keep trying until verification passes or the user explicitly says stop (per feedback-loop skill persistence rule).\n- If failures are in areas related to another TODO's in-progress work, note them but still verify YOUR changes.\n- Exit: All changes verified with captured evidence.\n\n### Phase 5: DELIVER\nGoal: Clean state ready for commit.\n- Remove any debug artifacts, temp files, or leftover copies\n- Summarize: what changed, why, and any follow-up items\n- If you deferred any issues due to other in-progress TODOs for the current directory, remind the user and list the follow-up TODO items you added\n- Exit: Working directory is clean except for intentional changes",
126
+ "model": "claude-opus-4.6-1m"
127
+ }
@@ -0,0 +1,61 @@
1
+ {
2
+ "allowedTools" : [ "read", "imageRead", "glob", "grep", "ls", "code", "shell", "write" ],
3
+ "hooks" : {
4
+ "agentSpawn" : [ {
5
+ "command" : "bash ~/.flow-agents/scripts/telemetry/telemetry.sh agentSpawn tool-code-reviewer",
6
+ "timeout_ms" : 5000
7
+ } ],
8
+ "postToolUse" : [ {
9
+ "command" : "bash ~/.flow-agents/scripts/telemetry/telemetry.sh postToolUse tool-code-reviewer",
10
+ "matcher" : "*",
11
+ "timeout_ms" : 3000
12
+ }, {
13
+ "command" : "node ~/.flow-agents/scripts/hooks/run-hook.js post:edit:accumulator post-edit-accumulator.js standard,strict",
14
+ "matcher" : "fs_write",
15
+ "timeout_ms" : 5000
16
+ }, {
17
+ "command" : "node ~/.flow-agents/scripts/hooks/run-hook.js post:quality-gate quality-gate.js strict",
18
+ "matcher" : "fs_write",
19
+ "timeout_ms" : 15000
20
+ } ],
21
+ "preToolUse" : [ {
22
+ "command" : "bash ~/.flow-agents/scripts/telemetry/telemetry.sh preToolUse tool-code-reviewer",
23
+ "matcher" : "*",
24
+ "timeout_ms" : 3000
25
+ }, {
26
+ "command" : "node ~/.flow-agents/scripts/hooks/run-hook.js pre:config-protection config-protection.js standard,strict",
27
+ "matcher" : "fs_write",
28
+ "timeout_ms" : 5000
29
+ }, {
30
+ "command" : "node ~/.flow-agents/scripts/hooks/run-hook.js pre:commit-quality pre-commit-quality.js standard,strict",
31
+ "matcher" : "execute_bash",
32
+ "timeout_ms" : 30000
33
+ }, {
34
+ "command" : "node ~/.flow-agents/scripts/hooks/run-hook.js pre:report-only-guard report-only-guard.js standard,strict",
35
+ "matcher" : "fs_write",
36
+ "timeout_ms" : 3000
37
+ } ],
38
+ "stop" : [ {
39
+ "command" : "bash ~/.flow-agents/scripts/telemetry/telemetry.sh stop tool-code-reviewer",
40
+ "timeout_ms" : 5000
41
+ }, {
42
+ "command" : "node ~/.flow-agents/scripts/hooks/run-hook.js stop:format-typecheck stop-format-typecheck.js standard,strict",
43
+ "timeout_ms" : 300000
44
+ } ],
45
+ "userPromptSubmit" : [ {
46
+ "command" : "bash ~/.flow-agents/scripts/telemetry/telemetry.sh userPromptSubmit tool-code-reviewer",
47
+ "timeout_ms" : 5000
48
+ } ]
49
+ },
50
+ "resources" : [ "file://AGENTS.md", "file://context/code-review-standards.md", "file://context/contracts/review-contract.md", "file://.kiro/steering/**/*.md", "file://~/.kiro/steering/**/*.md", "file://~/.flow-agents/context/*.md" ],
51
+ "tools" : [ "read", "imageRead", "glob", "grep", "ls", "code", "shell", "write" ],
52
+ "toolsSettings" : {
53
+ "write" : {
54
+ "allowedPaths" : [ ".flow-agents/**/*" ]
55
+ }
56
+ },
57
+ "name" : "tool-code-reviewer",
58
+ "description" : "Delegate to me for code quality review. Analyzes readability, maintainability, patterns, DRY compliance, and produces structured review with severity levels. Separate from verification (build/test/lint).",
59
+ "prompt" : "You are a code quality, architecture, and standards reviewer. You analyze source code for readability, maintainability, correctness, project fit, and architectural risk — then produce a structured review with severity-tagged findings.\n\nFollow `context/contracts/review-contract.md` and `context/code-review-standards.md` when available.\n\n## Input\nYou receive:\n- A list of modified files to review\n- Optional context about what was built and why\n- A **todo_file** path for writing the review artifact\n\n## Review Checklist\n\nFor each modified file, check:\n- **Readability**: clear naming, single-responsibility functions, minimal nesting\n- **Function length**: functions >50 lines get a HIGH finding unless clearly justified\n- **File length**: files >800 lines get a MEDIUM finding unless the local pattern justifies it\n- **Nesting depth**: >4 levels of nesting gets a HIGH finding\n- **Error handling**: errors must be caught and handled, not swallowed\n- **DRY**: check for duplicated logic across modified files and nearby code\n- **Naming**: variables/functions should describe intent, not implementation\n- **Immutability**: prefer const/readonly, avoid mutation where practical\n- **Tests**: changed logic should have direct tests or an explicit accepted gap\n- **Architecture fit**: respect local ownership boundaries, module layering, public contracts, and documented decisions\n- **Standards fit**: compare against AGENTS.md, context/code-review-standards.md, docs/context-map.md, and nearby code patterns when present\n\n## Severity Levels\n\n| Severity | Meaning | Action |\n|----------|---------|--------|\n| CRITICAL | Security risk or data loss potential | BLOCK — must fix before merge |\n| HIGH | Bugs, logic errors, major architecture/quality issues | WARN — strongly recommend fixing |\n| MEDIUM | Maintainability concerns, tech debt, standards drift | INFO — should fix when practical |\n| LOW | Style preferences beyond linter scope | NOTE — optional improvement |\n\n## Output\n\nWrite your review to: `<todo_file with .md removed>-code-review.md`\n\nThe file MUST start with this frontmatter:\n```yaml\n---\nrole: code-review\nparent: <todo filename without -code-review suffix>\ncreated: <ISO date>\nverdict: APPROVE | CHANGES_REQUESTED | COMMENT\n---\n```\n\nThen the review body:\n```markdown\n## Code Review\n\nFiles reviewed: <count>\nFindings: <count by severity>\n\n### Findings\n\n#### [SEVERITY] <file>:<line> — <title>\n<description with evidence>\n\n### Verdict: APPROVE | CHANGES_REQUESTED | COMMENT\n<one-line summary>\n```\n\n## Rules\n- Every finding must include evidence (code snippet or line reference). No vague complaints.\n- Do not flag style issues that a linter would catch (formatting, semicolons, trailing commas).\n- Focus on substance: logic, structure, error handling, duplication, standards, and architecture fit.\n- If the code is clean, say so — APPROVE with a brief note. Don't invent findings.\n- Read surrounding code for context before flagging DRY or architecture violations.",
60
+ "model" : "claude-sonnet-4.6-1m"
61
+ }
@@ -0,0 +1,118 @@
1
+ {
2
+ "allowedTools": [
3
+ "read",
4
+ "imageRead",
5
+ "glob",
6
+ "grep",
7
+ "code",
8
+ "thinking",
9
+ "@package-version-check/*",
10
+ "@package-registry/*"
11
+ ],
12
+ "hooks": {
13
+ "agentSpawn": [
14
+ {
15
+ "command": "bash ~/.flow-agents/scripts/telemetry/telemetry.sh agentSpawn tool-dependencies-updater",
16
+ "timeout_ms": 5000
17
+ }
18
+ ],
19
+ "postToolUse": [
20
+ {
21
+ "command": "bash ~/.flow-agents/scripts/telemetry/telemetry.sh postToolUse tool-dependencies-updater",
22
+ "matcher": "*",
23
+ "timeout_ms": 3000
24
+ },
25
+ {
26
+ "command": "node ~/.flow-agents/scripts/hooks/run-hook.js post:edit:accumulator post-edit-accumulator.js standard,strict",
27
+ "matcher": "fs_write",
28
+ "timeout_ms": 5000
29
+ },
30
+ {
31
+ "command": "node ~/.flow-agents/scripts/hooks/run-hook.js post:quality-gate quality-gate.js strict",
32
+ "matcher": "fs_write",
33
+ "timeout_ms": 15000
34
+ }
35
+ ],
36
+ "preToolUse": [
37
+ {
38
+ "command": "bash ~/.flow-agents/scripts/telemetry/telemetry.sh preToolUse tool-dependencies-updater",
39
+ "matcher": "*",
40
+ "timeout_ms": 3000
41
+ },
42
+ {
43
+ "command": "node ~/.flow-agents/scripts/hooks/run-hook.js pre:config-protection config-protection.js standard,strict",
44
+ "matcher": "fs_write",
45
+ "timeout_ms": 5000
46
+ },
47
+ {
48
+ "command": "node ~/.flow-agents/scripts/hooks/run-hook.js pre:commit-quality pre-commit-quality.js standard,strict",
49
+ "matcher": "execute_bash",
50
+ "timeout_ms": 30000
51
+ }
52
+ ],
53
+ "stop": [
54
+ {
55
+ "command": "bash ~/.flow-agents/scripts/telemetry/telemetry.sh stop tool-dependencies-updater",
56
+ "timeout_ms": 5000
57
+ },
58
+ {
59
+ "command": "node ~/.flow-agents/scripts/hooks/run-hook.js stop:format-typecheck stop-format-typecheck.js standard,strict",
60
+ "timeout_ms": 300000
61
+ }
62
+ ],
63
+ "userPromptSubmit": [
64
+ {
65
+ "command": "bash ~/.flow-agents/scripts/telemetry/telemetry.sh userPromptSubmit tool-dependencies-updater",
66
+ "timeout_ms": 5000
67
+ }
68
+ ]
69
+ },
70
+ "mcpServers": {
71
+ "package-registry": {
72
+ "args": [
73
+ "package-registry-mcp"
74
+ ],
75
+ "autoApprove": [],
76
+ "command": "npx",
77
+ "disabled": false
78
+ },
79
+ "package-version-check": {
80
+ "args": [
81
+ "package-version-check-mcp",
82
+ "--mode=stdio"
83
+ ],
84
+ "autoApprove": [],
85
+ "command": "uvx",
86
+ "disabled": false,
87
+ "env": {
88
+ "GITHUB_PAT": "${GITHUB_TOKEN}"
89
+ }
90
+ }
91
+ },
92
+ "resources": [
93
+ "file://AGENTS.md",
94
+ "file://.kiro/steering/**/*.md",
95
+ "file://~/.kiro/steering/**/*.md",
96
+ "file://~/.flow-agents/context/common/subagents.md",
97
+ "file://~/.flow-agents/context/*.md"
98
+ ],
99
+ "tools": [
100
+ "read",
101
+ "imageRead",
102
+ "glob",
103
+ "grep",
104
+ "code",
105
+ "thinking",
106
+ "@package-version-check/*",
107
+ "@package-registry/*"
108
+ ],
109
+ "toolsSettings": {
110
+ "write": {
111
+ "allowedPaths": []
112
+ }
113
+ },
114
+ "name": "tool-dependencies-updater",
115
+ "description": "Delegate to me for updating your project dependencies - checks latest versions, identifies outdated packages, and finds security advisories across npm, PyPI, Cargo, Maven/Gradle, Go, NuGet, Ruby, PHP, Swift, Dart, Docker, Helm, Terraform, and GitHub Actions",
116
+ "prompt": "You are a Dependency Update Specialist. You analyze project dependency manifests and provide actionable update recommendations.\n\n## Workflow\n\n### Phase 1: DISCOVER\nGoal: Find all dependency manifests in the project.\n- Scan for: package.json, requirements.txt, pyproject.toml, Cargo.toml, go.mod, pom.xml, build.gradle, Gemfile, composer.json, Package.swift, pubspec.yaml, Dockerfile, Chart.yaml, *.tf, .github/workflows/*.yml\n- Identify the ecosystem for each manifest\n- Parse current pinned versions\n\n### Phase 2: CHECK VERSIONS\nGoal: Look up latest versions for all dependencies.\n- Use the package-version-check MCP tools to batch-check versions\n- Map each dependency to its ecosystem: npm, pypi, nuget, maven_gradle, go, php, rubygems, rust, swift, dart, docker, helm, terraform_provider, terraform_module\n- For GitHub Actions workflows, use get_github_action_versions_and_args\n- For DevOps tools (kubectl, terraform binary, gradle wrapper, etc.), use get_latest_tool_versions\n- Compare current vs latest and flag outdated packages\n\n### Phase 3: SECURITY CHECK\nGoal: Identify known vulnerabilities in current dependencies.\n- Use the package-registry MCP to search GitHub Security Advisories for critical/high severity issues in outdated packages\n- Use get-package-advisories for packages that are significantly behind latest\n- Flag any packages with known CVEs\n\n### Phase 4: REPORT\nGoal: Deliver a clear, actionable update plan.\n- Group updates by risk level:\n - CRITICAL: Has known security vulnerabilities\n - MAJOR: Major version bump available (potential breaking changes)\n - MINOR: Minor/patch updates available (generally safe)\n- For each update, show: package name, current version, latest version, ecosystem\n- For security issues, include advisory ID and severity\n- Note any packages where major version bumps may require migration steps\n\n## Rules\n- NEVER guess at versions \u2014 always look them up via MCP tools\n- If a manifest format is unfamiliar, read the file and parse what you can\n- If MCP tools fail for a specific package, note it as 'unable to check' rather than guessing\n- Be concise \u2014 orchestrators need actionable data, not essays",
117
+ "model": "agi-nova-beta-1m"
118
+ }
@@ -0,0 +1,92 @@
1
+ {
2
+ "allowedTools": [
3
+ "read",
4
+ "imageRead",
5
+ "glob",
6
+ "grep",
7
+ "ls",
8
+ "code"
9
+ ],
10
+ "hooks": {
11
+ "agentSpawn": [
12
+ {
13
+ "command": "bash ~/.flow-agents/scripts/telemetry/telemetry.sh agentSpawn tool-explore-config",
14
+ "timeout_ms": 5000
15
+ }
16
+ ],
17
+ "postToolUse": [
18
+ {
19
+ "command": "bash ~/.flow-agents/scripts/telemetry/telemetry.sh postToolUse tool-explore-config",
20
+ "matcher": "*",
21
+ "timeout_ms": 3000
22
+ },
23
+ {
24
+ "command": "node ~/.flow-agents/scripts/hooks/run-hook.js post:edit:accumulator post-edit-accumulator.js standard,strict",
25
+ "matcher": "fs_write",
26
+ "timeout_ms": 5000
27
+ },
28
+ {
29
+ "command": "node ~/.flow-agents/scripts/hooks/run-hook.js post:quality-gate quality-gate.js strict",
30
+ "matcher": "fs_write",
31
+ "timeout_ms": 15000
32
+ }
33
+ ],
34
+ "preToolUse": [
35
+ {
36
+ "command": "bash ~/.flow-agents/scripts/telemetry/telemetry.sh preToolUse tool-explore-config",
37
+ "matcher": "*",
38
+ "timeout_ms": 3000
39
+ },
40
+ {
41
+ "command": "node ~/.flow-agents/scripts/hooks/run-hook.js pre:config-protection config-protection.js standard,strict",
42
+ "matcher": "fs_write",
43
+ "timeout_ms": 5000
44
+ },
45
+ {
46
+ "command": "node ~/.flow-agents/scripts/hooks/run-hook.js pre:commit-quality pre-commit-quality.js standard,strict",
47
+ "matcher": "execute_bash",
48
+ "timeout_ms": 30000
49
+ }
50
+ ],
51
+ "stop": [
52
+ {
53
+ "command": "bash ~/.flow-agents/scripts/telemetry/telemetry.sh stop tool-explore-config",
54
+ "timeout_ms": 5000
55
+ },
56
+ {
57
+ "command": "node ~/.flow-agents/scripts/hooks/run-hook.js stop:format-typecheck stop-format-typecheck.js standard,strict",
58
+ "timeout_ms": 300000
59
+ }
60
+ ],
61
+ "userPromptSubmit": [
62
+ {
63
+ "command": "bash ~/.flow-agents/scripts/telemetry/telemetry.sh userPromptSubmit tool-explore-config",
64
+ "timeout_ms": 5000
65
+ }
66
+ ]
67
+ },
68
+ "resources": [
69
+ "file://AGENTS.md",
70
+ "file://.kiro/steering/**/*.md",
71
+ "file://~/.kiro/steering/**/*.md",
72
+ "file://~/.flow-agents/context/common/subagents.md",
73
+ "file://~/.flow-agents/context/*.md"
74
+ ],
75
+ "tools": [
76
+ "read",
77
+ "imageRead",
78
+ "glob",
79
+ "grep",
80
+ "ls",
81
+ "code"
82
+ ],
83
+ "toolsSettings": {
84
+ "write": {
85
+ "allowedPaths": []
86
+ }
87
+ },
88
+ "name": "tool-explore-config",
89
+ "description": "Delegate to me for project configuration inspection - finds and summarizes configuration files and environment variables within a project",
90
+ "prompt": "You are a Config Inspector. Your ONLY job is to find and summarize configuration in a codebase.\n\n## Task\n1. Find config files (.env*, config/, *.config.js, settings.py, application.yml, etc.)\n2. Identify environment variables used\n3. Note build/bundler configs (webpack, vite, tsconfig, etc.)\n4. Find CI/CD configs (.github/workflows, Jenkinsfile, etc.)\n5. Locate infrastructure configs (docker-compose, k8s, terraform)\n\n## Output Format\n```\n## Application Config\n- [file] - [what it configures]\n\n## Environment Variables\n- [var] - [purpose if clear]\n\n## Build Config\n- [tool] - [file]\n\n## CI/CD\n- [platform] - [file]\n\n## Infrastructure\n- [tool] - [file]\n```\n\nBe FAST. List files and their purposes, don't deep-dive contents.",
91
+ "model": "kimi-k2.5"
92
+ }