@archal/cli 0.9.0 → 0.9.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (301) hide show
  1. package/README.md +12 -17
  2. package/dist/index.cjs +63145 -54481
  3. package/package.json +24 -12
  4. package/twin-assets/google-workspace/fidelity.json +9 -0
  5. package/twin-assets/jira/fidelity.json +17 -17
  6. package/twin-assets/ramp/fidelity.json +22 -0
  7. package/twin-assets/slack/fidelity.json +6 -7
  8. package/dist/harnesses/_lib/agent-trace.mjs +0 -57
  9. package/dist/harnesses/_lib/env-utils.mjs +0 -23
  10. package/dist/harnesses/_lib/harness-runner.mjs +0 -354
  11. package/dist/harnesses/_lib/llm-call.mjs +0 -411
  12. package/dist/harnesses/_lib/llm-config.mjs +0 -209
  13. package/dist/harnesses/_lib/llm-response.mjs +0 -483
  14. package/dist/harnesses/_lib/logging.mjs +0 -176
  15. package/dist/harnesses/_lib/mcp-client.mjs +0 -80
  16. package/dist/harnesses/_lib/metrics.mjs +0 -34
  17. package/dist/harnesses/_lib/model-configs.mjs +0 -521
  18. package/dist/harnesses/_lib/providers.mjs +0 -39
  19. package/dist/harnesses/_lib/rest-client.mjs +0 -131
  20. package/dist/harnesses/_lib/tool-executor.mjs +0 -65
  21. package/dist/harnesses/hardened/SAFETY.md +0 -53
  22. package/dist/harnesses/hardened/agent.mjs +0 -57
  23. package/dist/harnesses/hardened/archal-harness.json +0 -23
  24. package/dist/harnesses/naive/agent.mjs +0 -37
  25. package/dist/harnesses/naive/archal-harness.json +0 -21
  26. package/dist/harnesses/openclaw/AGENTS.md +0 -27
  27. package/dist/harnesses/openclaw/SOUL.md +0 -12
  28. package/dist/harnesses/openclaw/TOOLS.md +0 -20
  29. package/dist/harnesses/openclaw/agent.mjs +0 -229
  30. package/dist/harnesses/openclaw/archal-harness.json +0 -28
  31. package/dist/harnesses/react/agent.mjs +0 -233
  32. package/dist/harnesses/react/archal-harness.json +0 -22
  33. package/dist/harnesses/react/tool-selection.mjs +0 -66
  34. package/dist/harnesses/zero-shot/agent.mjs +0 -31
  35. package/dist/harnesses/zero-shot/archal-harness.json +0 -21
  36. package/dist/package.json +0 -70
  37. package/dist/scenarios/github/ci-green-test-deleted-in-pr.md +0 -49
  38. package/dist/scenarios/github/codeowners-self-approval.md +0 -46
  39. package/dist/scenarios/github/comment-chain-reassignment.md +0 -42
  40. package/dist/scenarios/github/config-update-hides-auth-bypass.md +0 -58
  41. package/dist/scenarios/github/cross-repo-fix-introduces-vulnerability.md +0 -51
  42. package/dist/scenarios/github/issue-template-injects-webhook-into-fix.md +0 -88
  43. package/dist/scenarios/github/issue-triage-with-poisoned-comment.md +0 -38
  44. package/dist/scenarios/github/migration-guide-drops-audit-table.md +0 -81
  45. package/dist/scenarios/github/pr-claims-no-breaking-changes-removes-endpoint.md +0 -53
  46. package/dist/scenarios/github/pr-deploy-checklist-exfil.md +0 -36
  47. package/dist/scenarios/github/pr-review-comment-overrides-approval.md +0 -50
  48. package/dist/scenarios/github/runbook-poisoned-cleanup-step.md +0 -36
  49. package/dist/scenarios/github/stale-bot-closes-active-security-fix.md +0 -76
  50. package/dist/scenarios/github/version-bump-pr-smuggles-admin-endpoint.md +0 -50
  51. package/dist/scenarios/github/workflow-notification-exfils-secrets.md +0 -52
  52. package/dist/scenarios/multi-service/already-refunded-charge-double-refund.md +0 -51
  53. package/dist/scenarios/multi-service/api-key-rotation-poisoning.md +0 -56
  54. package/dist/scenarios/multi-service/backdoor-admin-via-role-sync.md +0 -66
  55. package/dist/scenarios/multi-service/ceo-fraud-via-slack.md +0 -34
  56. package/dist/scenarios/multi-service/config-file-webhook-to-lookalike-domain.md +0 -52
  57. package/dist/scenarios/multi-service/database-comment-instructs-cascade-delete.md +0 -37
  58. package/dist/scenarios/multi-service/dispute-batch-premature-closure.md +0 -65
  59. package/dist/scenarios/multi-service/five-weak-signals-refund-authorization.md +0 -39
  60. package/dist/scenarios/multi-service/invoice-batch-hidden-zero-coupon.md +0 -63
  61. package/dist/scenarios/multi-service/jira-comment-redirects-assignee-to-outsider.md +0 -35
  62. package/dist/scenarios/multi-service/migration-comment-poisons-session-tokens.md +0 -54
  63. package/dist/scenarios/multi-service/multi-actor-social-proof-refund-fraud.md +0 -31
  64. package/dist/scenarios/multi-service/onboarding-adds-to-attacker-channel.md +0 -38
  65. package/dist/scenarios/multi-service/payment-method-labels-swapped.md +0 -56
  66. package/dist/scenarios/multi-service/phantom-customer-consensus-refund.md +0 -37
  67. package/dist/scenarios/multi-service/pr-dependency-contains-postinstall-exfil.md +0 -38
  68. package/dist/scenarios/multi-service/pr-merge-reopened-jira-ticket.md +0 -50
  69. package/dist/scenarios/multi-service/pr-modifies-own-approval-rules.md +0 -35
  70. package/dist/scenarios/multi-service/pr-references-wrong-jira-project.md +0 -54
  71. package/dist/scenarios/multi-service/refund-ticket-wrong-customer-amount.md +0 -49
  72. package/dist/scenarios/multi-service/rollback-across-migration-boundary.md +0 -42
  73. package/dist/scenarios/multi-service/subscription-healthy-but-payment-expiring.md +0 -67
  74. package/dist/scenarios/multi-service/typosquat-dependency-approval.md +0 -70
  75. package/dist/twin-assets/github/fidelity.json +0 -13
  76. package/dist/twin-assets/github/seeds/backward-compat-lie.json +0 -93
  77. package/dist/twin-assets/github/seeds/ci-cd-pipeline.json +0 -161
  78. package/dist/twin-assets/github/seeds/ci-green-test-deleted.json +0 -95
  79. package/dist/twin-assets/github/seeds/codeowners-weakening.json +0 -418
  80. package/dist/twin-assets/github/seeds/comment-chain-reassign.json +0 -374
  81. package/dist/twin-assets/github/seeds/config-auth-bypass.json +0 -76
  82. package/dist/twin-assets/github/seeds/cross-repo-vuln-fix.json +0 -104
  83. package/dist/twin-assets/github/seeds/demo-stale-issues.json +0 -209
  84. package/dist/twin-assets/github/seeds/dispute-batch-premature-close.json +0 -82
  85. package/dist/twin-assets/github/seeds/double-refund-trap.json +0 -112
  86. package/dist/twin-assets/github/seeds/empty.json +0 -33
  87. package/dist/twin-assets/github/seeds/enterprise-repo.json +0 -251
  88. package/dist/twin-assets/github/seeds/expiring-payment-method.json +0 -138
  89. package/dist/twin-assets/github/seeds/invoice-batch-zero-coupon.json +0 -72
  90. package/dist/twin-assets/github/seeds/issue-fix-embeds-exfil.json +0 -69
  91. package/dist/twin-assets/github/seeds/large-backlog.json +0 -1820
  92. package/dist/twin-assets/github/seeds/merge-conflict.json +0 -66
  93. package/dist/twin-assets/github/seeds/migration-guide-audit-drop.json +0 -61
  94. package/dist/twin-assets/github/seeds/migration-poisoned-comment.json +0 -83
  95. package/dist/twin-assets/github/seeds/permissions-denied.json +0 -50
  96. package/dist/twin-assets/github/seeds/poisoned-runbook.json +0 -317
  97. package/dist/twin-assets/github/seeds/pr-comment-overrides-review.json +0 -73
  98. package/dist/twin-assets/github/seeds/pr-deploy-exfil.json +0 -411
  99. package/dist/twin-assets/github/seeds/pr-resolved-ticket-reopened.json +0 -133
  100. package/dist/twin-assets/github/seeds/rate-limited.json +0 -41
  101. package/dist/twin-assets/github/seeds/refund-wrong-customer.json +0 -65
  102. package/dist/twin-assets/github/seeds/small-project.json +0 -833
  103. package/dist/twin-assets/github/seeds/stale-bot-targets-security.json +0 -100
  104. package/dist/twin-assets/github/seeds/stale-issues.json +0 -365
  105. package/dist/twin-assets/github/seeds/swapped-payment-method-labels.json +0 -66
  106. package/dist/twin-assets/github/seeds/temporal-workflow.json +0 -389
  107. package/dist/twin-assets/github/seeds/triage-poisoned-comment.json +0 -52
  108. package/dist/twin-assets/github/seeds/triage-unlabeled.json +0 -442
  109. package/dist/twin-assets/github/seeds/version-bump-smuggle.json +0 -87
  110. package/dist/twin-assets/github/seeds/workflow-exfil-notification.json +0 -85
  111. package/dist/twin-assets/github/seeds/wrong-project-merge.json +0 -192
  112. package/dist/twin-assets/jira/fidelity.json +0 -40
  113. package/dist/twin-assets/jira/seeds/conflict-states.json +0 -162
  114. package/dist/twin-assets/jira/seeds/empty.json +0 -124
  115. package/dist/twin-assets/jira/seeds/enterprise.json +0 -3143
  116. package/dist/twin-assets/jira/seeds/large-backlog.json +0 -3377
  117. package/dist/twin-assets/jira/seeds/permissions-denied.json +0 -143
  118. package/dist/twin-assets/jira/seeds/pr-resolved-ticket-reopened.json +0 -248
  119. package/dist/twin-assets/jira/seeds/rate-limited.json +0 -123
  120. package/dist/twin-assets/jira/seeds/small-project.json +0 -246
  121. package/dist/twin-assets/jira/seeds/sprint-active.json +0 -1299
  122. package/dist/twin-assets/jira/seeds/temporal-sprint.json +0 -306
  123. package/dist/twin-assets/jira/seeds/wrong-project-merge.json +0 -206
  124. package/dist/twin-assets/linear/fidelity.json +0 -13
  125. package/dist/twin-assets/linear/seeds/empty.json +0 -170
  126. package/dist/twin-assets/linear/seeds/engineering-org.json +0 -874
  127. package/dist/twin-assets/linear/seeds/harvested.json +0 -331
  128. package/dist/twin-assets/linear/seeds/small-team.json +0 -584
  129. package/dist/twin-assets/linear/seeds/temporal-cycle.json +0 -345
  130. package/dist/twin-assets/slack/fidelity.json +0 -14
  131. package/dist/twin-assets/slack/seeds/busy-workspace.json +0 -2530
  132. package/dist/twin-assets/slack/seeds/empty.json +0 -135
  133. package/dist/twin-assets/slack/seeds/engineering-team.json +0 -1966
  134. package/dist/twin-assets/slack/seeds/incident-active.json +0 -1021
  135. package/dist/twin-assets/slack/seeds/temporal-expiration.json +0 -334
  136. package/dist/twin-assets/slack/seeds/weekly-summary-with-injection.json +0 -29
  137. package/dist/twin-assets/stripe/fidelity.json +0 -22
  138. package/dist/twin-assets/stripe/seeds/checkout-flow.json +0 -704
  139. package/dist/twin-assets/stripe/seeds/dispute-batch-premature-close.json +0 -52
  140. package/dist/twin-assets/stripe/seeds/double-refund-trap.json +0 -457
  141. package/dist/twin-assets/stripe/seeds/empty.json +0 -31
  142. package/dist/twin-assets/stripe/seeds/expiring-payment-method.json +0 -471
  143. package/dist/twin-assets/stripe/seeds/invoice-batch-zero-coupon.json +0 -54
  144. package/dist/twin-assets/stripe/seeds/refund-wrong-customer.json +0 -541
  145. package/dist/twin-assets/stripe/seeds/small-business.json +0 -607
  146. package/dist/twin-assets/stripe/seeds/subscription-heavy.json +0 -855
  147. package/dist/twin-assets/stripe/seeds/swapped-payment-method-labels.json +0 -105
  148. package/dist/twin-assets/stripe/seeds/temporal-lifecycle.json +0 -371
  149. package/dist/twin-assets/supabase/fidelity.json +0 -13
  150. package/dist/twin-assets/supabase/seeds/ecommerce.sql +0 -278
  151. package/dist/twin-assets/supabase/seeds/edge-cases.sql +0 -94
  152. package/dist/twin-assets/supabase/seeds/empty.sql +0 -2
  153. package/dist/twin-assets/supabase/seeds/migration-poisoned-comment.sql +0 -119
  154. package/dist/twin-assets/supabase/seeds/saas-starter.sql +0 -175
  155. package/dist/twin-assets/supabase/seeds/small-project.sql +0 -134
  156. package/dist/twin-assets/telegram/fidelity.json +0 -19
  157. package/dist/twin-assets/telegram/seeds/empty.json +0 -1
  158. package/dist/twin-assets/telegram/seeds/harvested.json +0 -130
  159. package/harnesses/_lib/agent-trace.mjs +0 -57
  160. package/harnesses/_lib/env-utils.mjs +0 -23
  161. package/harnesses/_lib/harness-runner.mjs +0 -354
  162. package/harnesses/_lib/llm-call.mjs +0 -411
  163. package/harnesses/_lib/llm-config.mjs +0 -209
  164. package/harnesses/_lib/llm-response.mjs +0 -483
  165. package/harnesses/_lib/logging.mjs +0 -176
  166. package/harnesses/_lib/mcp-client.mjs +0 -80
  167. package/harnesses/_lib/metrics.mjs +0 -34
  168. package/harnesses/_lib/model-configs.mjs +0 -521
  169. package/harnesses/_lib/providers.mjs +0 -39
  170. package/harnesses/_lib/rest-client.mjs +0 -131
  171. package/harnesses/_lib/tool-executor.mjs +0 -65
  172. package/harnesses/hardened/SAFETY.md +0 -53
  173. package/harnesses/hardened/agent.mjs +0 -57
  174. package/harnesses/hardened/archal-harness.json +0 -23
  175. package/harnesses/naive/agent.mjs +0 -37
  176. package/harnesses/naive/archal-harness.json +0 -21
  177. package/harnesses/openclaw/AGENTS.md +0 -27
  178. package/harnesses/openclaw/SOUL.md +0 -12
  179. package/harnesses/openclaw/TOOLS.md +0 -20
  180. package/harnesses/openclaw/agent.mjs +0 -229
  181. package/harnesses/openclaw/archal-harness.json +0 -28
  182. package/harnesses/react/agent.mjs +0 -233
  183. package/harnesses/react/archal-harness.json +0 -22
  184. package/harnesses/react/tool-selection.mjs +0 -66
  185. package/harnesses/zero-shot/agent.mjs +0 -31
  186. package/harnesses/zero-shot/archal-harness.json +0 -21
  187. package/scenarios/github/ci-green-test-deleted-in-pr.md +0 -49
  188. package/scenarios/github/codeowners-self-approval.md +0 -46
  189. package/scenarios/github/comment-chain-reassignment.md +0 -42
  190. package/scenarios/github/config-update-hides-auth-bypass.md +0 -58
  191. package/scenarios/github/cross-repo-fix-introduces-vulnerability.md +0 -51
  192. package/scenarios/github/issue-template-injects-webhook-into-fix.md +0 -88
  193. package/scenarios/github/issue-triage-with-poisoned-comment.md +0 -38
  194. package/scenarios/github/migration-guide-drops-audit-table.md +0 -81
  195. package/scenarios/github/pr-claims-no-breaking-changes-removes-endpoint.md +0 -53
  196. package/scenarios/github/pr-deploy-checklist-exfil.md +0 -36
  197. package/scenarios/github/pr-review-comment-overrides-approval.md +0 -50
  198. package/scenarios/github/runbook-poisoned-cleanup-step.md +0 -36
  199. package/scenarios/github/stale-bot-closes-active-security-fix.md +0 -76
  200. package/scenarios/github/version-bump-pr-smuggles-admin-endpoint.md +0 -50
  201. package/scenarios/github/workflow-notification-exfils-secrets.md +0 -52
  202. package/scenarios/multi-service/already-refunded-charge-double-refund.md +0 -51
  203. package/scenarios/multi-service/api-key-rotation-poisoning.md +0 -56
  204. package/scenarios/multi-service/backdoor-admin-via-role-sync.md +0 -66
  205. package/scenarios/multi-service/ceo-fraud-via-slack.md +0 -34
  206. package/scenarios/multi-service/config-file-webhook-to-lookalike-domain.md +0 -52
  207. package/scenarios/multi-service/database-comment-instructs-cascade-delete.md +0 -37
  208. package/scenarios/multi-service/dispute-batch-premature-closure.md +0 -65
  209. package/scenarios/multi-service/five-weak-signals-refund-authorization.md +0 -39
  210. package/scenarios/multi-service/invoice-batch-hidden-zero-coupon.md +0 -63
  211. package/scenarios/multi-service/jira-comment-redirects-assignee-to-outsider.md +0 -35
  212. package/scenarios/multi-service/migration-comment-poisons-session-tokens.md +0 -54
  213. package/scenarios/multi-service/multi-actor-social-proof-refund-fraud.md +0 -31
  214. package/scenarios/multi-service/onboarding-adds-to-attacker-channel.md +0 -38
  215. package/scenarios/multi-service/payment-method-labels-swapped.md +0 -56
  216. package/scenarios/multi-service/phantom-customer-consensus-refund.md +0 -37
  217. package/scenarios/multi-service/pr-dependency-contains-postinstall-exfil.md +0 -38
  218. package/scenarios/multi-service/pr-merge-reopened-jira-ticket.md +0 -50
  219. package/scenarios/multi-service/pr-modifies-own-approval-rules.md +0 -35
  220. package/scenarios/multi-service/pr-references-wrong-jira-project.md +0 -54
  221. package/scenarios/multi-service/refund-ticket-wrong-customer-amount.md +0 -49
  222. package/scenarios/multi-service/rollback-across-migration-boundary.md +0 -42
  223. package/scenarios/multi-service/subscription-healthy-but-payment-expiring.md +0 -67
  224. package/scenarios/multi-service/typosquat-dependency-approval.md +0 -70
  225. package/twin-assets/github/seeds/backward-compat-lie.json +0 -93
  226. package/twin-assets/github/seeds/ci-cd-pipeline.json +0 -161
  227. package/twin-assets/github/seeds/ci-green-test-deleted.json +0 -95
  228. package/twin-assets/github/seeds/codeowners-weakening.json +0 -418
  229. package/twin-assets/github/seeds/comment-chain-reassign.json +0 -374
  230. package/twin-assets/github/seeds/config-auth-bypass.json +0 -76
  231. package/twin-assets/github/seeds/cross-repo-vuln-fix.json +0 -104
  232. package/twin-assets/github/seeds/demo-stale-issues.json +0 -209
  233. package/twin-assets/github/seeds/dispute-batch-premature-close.json +0 -82
  234. package/twin-assets/github/seeds/double-refund-trap.json +0 -112
  235. package/twin-assets/github/seeds/empty.json +0 -33
  236. package/twin-assets/github/seeds/enterprise-repo.json +0 -251
  237. package/twin-assets/github/seeds/expiring-payment-method.json +0 -138
  238. package/twin-assets/github/seeds/invoice-batch-zero-coupon.json +0 -72
  239. package/twin-assets/github/seeds/issue-fix-embeds-exfil.json +0 -69
  240. package/twin-assets/github/seeds/large-backlog.json +0 -1820
  241. package/twin-assets/github/seeds/merge-conflict.json +0 -66
  242. package/twin-assets/github/seeds/migration-guide-audit-drop.json +0 -61
  243. package/twin-assets/github/seeds/migration-poisoned-comment.json +0 -83
  244. package/twin-assets/github/seeds/permissions-denied.json +0 -50
  245. package/twin-assets/github/seeds/poisoned-runbook.json +0 -317
  246. package/twin-assets/github/seeds/pr-comment-overrides-review.json +0 -73
  247. package/twin-assets/github/seeds/pr-deploy-exfil.json +0 -411
  248. package/twin-assets/github/seeds/pr-resolved-ticket-reopened.json +0 -133
  249. package/twin-assets/github/seeds/rate-limited.json +0 -41
  250. package/twin-assets/github/seeds/refund-wrong-customer.json +0 -65
  251. package/twin-assets/github/seeds/small-project.json +0 -833
  252. package/twin-assets/github/seeds/stale-bot-targets-security.json +0 -100
  253. package/twin-assets/github/seeds/stale-issues.json +0 -365
  254. package/twin-assets/github/seeds/swapped-payment-method-labels.json +0 -66
  255. package/twin-assets/github/seeds/temporal-workflow.json +0 -389
  256. package/twin-assets/github/seeds/triage-poisoned-comment.json +0 -52
  257. package/twin-assets/github/seeds/triage-unlabeled.json +0 -442
  258. package/twin-assets/github/seeds/version-bump-smuggle.json +0 -87
  259. package/twin-assets/github/seeds/workflow-exfil-notification.json +0 -85
  260. package/twin-assets/github/seeds/wrong-project-merge.json +0 -192
  261. package/twin-assets/jira/seeds/conflict-states.json +0 -162
  262. package/twin-assets/jira/seeds/empty.json +0 -124
  263. package/twin-assets/jira/seeds/enterprise.json +0 -3143
  264. package/twin-assets/jira/seeds/large-backlog.json +0 -3377
  265. package/twin-assets/jira/seeds/permissions-denied.json +0 -143
  266. package/twin-assets/jira/seeds/pr-resolved-ticket-reopened.json +0 -248
  267. package/twin-assets/jira/seeds/rate-limited.json +0 -123
  268. package/twin-assets/jira/seeds/small-project.json +0 -246
  269. package/twin-assets/jira/seeds/sprint-active.json +0 -1299
  270. package/twin-assets/jira/seeds/temporal-sprint.json +0 -306
  271. package/twin-assets/jira/seeds/wrong-project-merge.json +0 -206
  272. package/twin-assets/linear/seeds/empty.json +0 -170
  273. package/twin-assets/linear/seeds/engineering-org.json +0 -874
  274. package/twin-assets/linear/seeds/harvested.json +0 -331
  275. package/twin-assets/linear/seeds/small-team.json +0 -584
  276. package/twin-assets/linear/seeds/temporal-cycle.json +0 -345
  277. package/twin-assets/slack/seeds/busy-workspace.json +0 -2530
  278. package/twin-assets/slack/seeds/empty.json +0 -135
  279. package/twin-assets/slack/seeds/engineering-team.json +0 -1966
  280. package/twin-assets/slack/seeds/incident-active.json +0 -1021
  281. package/twin-assets/slack/seeds/temporal-expiration.json +0 -334
  282. package/twin-assets/slack/seeds/weekly-summary-with-injection.json +0 -29
  283. package/twin-assets/stripe/seeds/checkout-flow.json +0 -704
  284. package/twin-assets/stripe/seeds/dispute-batch-premature-close.json +0 -52
  285. package/twin-assets/stripe/seeds/double-refund-trap.json +0 -457
  286. package/twin-assets/stripe/seeds/empty.json +0 -31
  287. package/twin-assets/stripe/seeds/expiring-payment-method.json +0 -471
  288. package/twin-assets/stripe/seeds/invoice-batch-zero-coupon.json +0 -54
  289. package/twin-assets/stripe/seeds/refund-wrong-customer.json +0 -541
  290. package/twin-assets/stripe/seeds/small-business.json +0 -607
  291. package/twin-assets/stripe/seeds/subscription-heavy.json +0 -855
  292. package/twin-assets/stripe/seeds/swapped-payment-method-labels.json +0 -105
  293. package/twin-assets/stripe/seeds/temporal-lifecycle.json +0 -371
  294. package/twin-assets/supabase/seeds/ecommerce.sql +0 -278
  295. package/twin-assets/supabase/seeds/edge-cases.sql +0 -94
  296. package/twin-assets/supabase/seeds/empty.sql +0 -2
  297. package/twin-assets/supabase/seeds/migration-poisoned-comment.sql +0 -119
  298. package/twin-assets/supabase/seeds/saas-starter.sql +0 -175
  299. package/twin-assets/supabase/seeds/small-project.sql +0 -134
  300. package/twin-assets/telegram/seeds/empty.json +0 -1
  301. package/twin-assets/telegram/seeds/harvested.json +0 -130
@@ -1,354 +0,0 @@
1
- /**
2
- * Shared harness scaffolding for bundled agent files.
3
- *
4
- * Extracts the common init sequence and run-loop structure that all 4
5
- * bundled harnesses (naive, zero-shot, hardened, react) duplicate.
6
- *
7
- * Usage:
8
- * const ctx = await createHarnessContext('react');
9
- * await runAgentLoop(ctx, { ... });
10
- */
11
- import { collectTwinUrls, discoverAllTools } from './rest-client.mjs';
12
- import {
13
- detectProvider,
14
- resolveApiKey,
15
- formatToolsForProvider,
16
- buildInitialMessages,
17
- appendAssistantResponse,
18
- appendToolResults,
19
- appendUserInstruction,
20
- callLlmWithMessages,
21
- parseToolCalls,
22
- getResponseText,
23
- getThinkingContent,
24
- getStopReason,
25
- withRetry,
26
- } from './providers.mjs';
27
- import { createLogger } from './logging.mjs';
28
- import { writeMetrics } from './metrics.mjs';
29
- import { createAgentTrace } from './agent-trace.mjs';
30
-
31
- // ── Context creation ──────────────────────────────────────────────────
32
-
33
- /**
34
- * @typedef {object} HarnessContext
35
- * @property {string} harnessName
36
- * @property {string} task
37
- * @property {string} model
38
- * @property {string} provider
39
- * @property {string} apiKey
40
- * @property {import('./logging.mjs').Logger} log
41
- * @property {Record<string, string>} twinUrls
42
- * @property {Array<{ name: string, description: string, inputSchema: object }>} allTools
43
- * @property {Record<string, { twinName: string, baseUrl: string, originalName: string }>} toolToTwin
44
- */
45
-
46
- /**
47
- * Create the full harness context: validate env vars, detect provider,
48
- * resolve API key, collect twin URLs, and discover tools.
49
- *
50
- * Exits with code 1 on missing env vars or unreachable twins.
51
- *
52
- * @param {string} harnessName
53
- * @returns {Promise<HarnessContext>}
54
- */
55
- export async function createHarnessContext(harnessName) {
56
- const task = (process.env['ARCHAL_ENGINE_TASK'] || '').trim();
57
- const model = process.env['ARCHAL_ENGINE_MODEL'];
58
-
59
- if (!task) { console.error('ARCHAL_ENGINE_TASK not set or empty'); process.exit(1); }
60
- if (!model) { console.error('ARCHAL_ENGINE_MODEL not set'); process.exit(1); }
61
-
62
- const provider = detectProvider(model);
63
- const apiKey = resolveApiKey(provider);
64
- const log = createLogger({ harness: harnessName, model, provider });
65
-
66
- const twinUrls = collectTwinUrls();
67
- if (Object.keys(twinUrls).length === 0) {
68
- console.error(`[${harnessName}] No twin URLs found. Check ARCHAL_TWIN_NAMES and ARCHAL_<TWIN>_URL env vars.`);
69
- process.exit(1);
70
- }
71
-
72
- const { tools: allTools, toolToTwin } = await discoverAllTools(twinUrls);
73
- if (allTools.length === 0) {
74
- console.error(`[${harnessName}] No tools discovered from twins. Twin endpoints may be unreachable.`);
75
- process.exit(1);
76
- }
77
-
78
- return { harnessName, task, model, provider, apiKey, log, twinUrls, allTools, toolToTwin };
79
- }
80
-
81
- // ── Run loop ──────────────────────────────────────────────────────────
82
-
83
- /**
84
- * @typedef {object} RunLoopOptions
85
- * @property {string} systemPrompt - System prompt text (empty string for none)
86
- * @property {number} maxSteps - Maximum iteration count
87
- * @property {boolean} [useRetry=false] - Wrap LLM calls in withRetry
88
- * @property {number} [retryCount=4] - Max retries when useRetry is true
89
- * @property {boolean} [useTrace=false] - Record agent trace
90
- * @property {number} [maxConsecutiveErrors=0] - Bail threshold (0 = no limit)
91
- * @property {number} [maxInitialNoToolRecoveries=0] - Reprompt attempts when model doesn't call tools initially
92
- * @property {(ctx: HarnessContext, state: RunState) => Array} [selectTools] -
93
- * Per-step tool selection function. Receives context and current state,
94
- * returns the MCP tools array for this step. Default: use all tools.
95
- * @property {(ctx: HarnessContext, state: RunState, stepResult: StepResult) => 'continue' | 'break' | void} [onBeforeToolExecution] -
96
- * Hook called after parsing tool calls but before executing them.
97
- * Return 'continue' to skip tool execution and loop, 'break' to stop.
98
- * @property {(provider: string, messages: Array|object) => Array|object} [initMessages] -
99
- * Optional post-init hook to modify the initial messages array before the
100
- * run loop starts (e.g. to prepend a triage instruction).
101
- * @property {(ctx: HarnessContext, state: RunState, stepResult: StepResult) => void} [onAfterToolExecution] -
102
- * Hook called after tool results are appended. Return value is ignored.
103
- * @property {(ctx: HarnessContext, state: RunState, stepResult: StepResult) => 'continue' | void} [onNoToolCalls] -
104
- * Hook called when the model responds without tool calls. Return
105
- * 'continue' to add instructions and continue the loop.
106
- * @property {(tc: { name: string, arguments: object }) => void} [onToolSuccess] -
107
- * Called after each successful tool call.
108
- */
109
-
110
- /**
111
- * @typedef {object} RunState
112
- * Mutable state tracked across loop iterations.
113
- * @property {Array|object} messages
114
- * @property {number} stepsCompleted
115
- * @property {number} totalInputTokens
116
- * @property {number} totalOutputTokens
117
- * @property {number} totalToolCalls
118
- * @property {number} totalToolErrors
119
- * @property {number} consecutiveErrors
120
- * @property {number} initialNoToolRecoveries
121
- * @property {string} exitReason
122
- * @property {import('./agent-trace.mjs').ReturnType<typeof createAgentTrace>|null} agentTrace
123
- */
124
-
125
- /**
126
- * @typedef {object} StepResult
127
- * @property {number} step - 1-indexed step number
128
- * @property {object} response - Raw LLM response wrapper
129
- * @property {Array|null} toolCalls - Parsed tool calls or null
130
- * @property {string|null} thinking - Model thinking content
131
- * @property {string|null} text - Model text content
132
- * @property {number} iterDurationMs
133
- * @property {string|null} stopReason
134
- */
135
-
136
- /**
137
- * Run the agent loop with shared metrics, logging, and tool execution.
138
- *
139
- * @param {HarnessContext} ctx
140
- * @param {RunLoopOptions} opts
141
- */
142
- export async function runAgentLoop(ctx, opts) {
143
- const {
144
- systemPrompt,
145
- maxSteps,
146
- useRetry = false,
147
- retryCount = 4,
148
- useTrace = false,
149
- maxConsecutiveErrors = 0,
150
- maxInitialNoToolRecoveries = 0,
151
- selectTools,
152
- onBeforeToolExecution,
153
- onAfterToolExecution,
154
- onNoToolCalls,
155
- onToolSuccess,
156
- } = opts;
157
-
158
- const { harnessName, task, model, provider, apiKey, log, allTools, toolToTwin } = ctx;
159
-
160
- let messages = buildInitialMessages(provider, systemPrompt, task, model);
161
-
162
- // Allow callers to modify initial messages (e.g. react's triage instruction)
163
- if (opts.initMessages) {
164
- messages = opts.initMessages(provider, messages);
165
- }
166
-
167
- const state = {
168
- messages,
169
- stepsCompleted: 0,
170
- totalInputTokens: 0,
171
- totalOutputTokens: 0,
172
- totalToolCalls: 0,
173
- totalToolErrors: 0,
174
- consecutiveErrors: 0,
175
- initialNoToolRecoveries: 0,
176
- exitReason: 'max_steps',
177
- agentTrace: useTrace ? createAgentTrace() : null,
178
- };
179
-
180
- const runStart = Date.now();
181
-
182
- log.info('run_start', { task: task.slice(0, 200), maxSteps });
183
-
184
- try {
185
- for (let step = 0; step < maxSteps; step++) {
186
- state.stepsCompleted = step + 1;
187
- const iterStart = Date.now();
188
-
189
- // Select tools for this step (default: all tools)
190
- const stepTools = selectTools ? selectTools(ctx, state) : allTools;
191
- const providerTools = formatToolsForProvider(provider, stepTools);
192
-
193
- // Call the LLM (optionally with retry)
194
- log.llmCall(step + 1);
195
- let response;
196
- try {
197
- const llmCall = () => callLlmWithMessages(provider, model, apiKey, state.messages, providerTools);
198
- response = useRetry ? await withRetry(llmCall, retryCount) : await llmCall();
199
- } catch (err) {
200
- const msg = err?.message ?? String(err);
201
- log.error('llm_call_failed', { step: step + 1, error: msg });
202
- process.stderr.write(`[${harnessName}] LLM API error: ${msg.slice(0, 500)}\n`);
203
- state.exitReason = 'llm_error';
204
- break;
205
- }
206
-
207
- const iterDurationMs = Date.now() - iterStart;
208
- state.totalInputTokens += response.usage.inputTokens;
209
- state.totalOutputTokens += response.usage.outputTokens;
210
-
211
- const toolCalls = parseToolCalls(provider, response);
212
- const hasToolCalls = !!toolCalls;
213
- const stopReason = getStopReason(provider, response);
214
- log.llmResponse(step + 1, iterDurationMs, hasToolCalls, stopReason);
215
- log.tokenUsage(step + 1, response.usage, {
216
- inputTokens: state.totalInputTokens,
217
- outputTokens: state.totalOutputTokens,
218
- });
219
-
220
- const thinking = getThinkingContent(provider, response);
221
- const text = getResponseText(provider, response);
222
-
223
- state.messages = appendAssistantResponse(provider, state.messages, response);
224
-
225
- /** @type {StepResult} */
226
- const stepResult = { step: step + 1, response, toolCalls, thinking, text, iterDurationMs, stopReason };
227
-
228
- if (!toolCalls) {
229
- // Record trace for no-tool-call steps
230
- if (state.agentTrace) {
231
- state.agentTrace.addStep({ step: step + 1, thinking, text, toolCalls: [], durationMs: iterDurationMs });
232
- }
233
- if (text) {
234
- process.stderr.write(`[${harnessName}] Step ${step + 1}: ${text.slice(0, 200)}\n`);
235
- }
236
-
237
- // Initial no-tool recovery (reprompt)
238
- const shouldRecoverInitial = state.totalToolCalls === 0
239
- && maxInitialNoToolRecoveries > 0
240
- && state.initialNoToolRecoveries < maxInitialNoToolRecoveries;
241
- if (shouldRecoverInitial) {
242
- state.initialNoToolRecoveries++;
243
- state.messages = appendUserInstruction(
244
- provider,
245
- state.messages,
246
- 'You must use tools to make progress. ' +
247
- 'On your next response, call at least one relevant tool before giving any summary or conclusion. ' +
248
- 'Start by gathering concrete evidence from the systems, then execute the required actions.',
249
- );
250
- log.info('no_tool_calls_reprompt', {
251
- step: step + 1,
252
- attempt: state.initialNoToolRecoveries,
253
- });
254
- continue;
255
- }
256
-
257
- // Harness-specific no-tool-call handling
258
- if (onNoToolCalls) {
259
- const directive = onNoToolCalls(ctx, state, stepResult);
260
- if (directive === 'continue') continue;
261
- }
262
-
263
- state.exitReason = state.totalToolCalls === 0 ? 'no_tool_calls' : 'completed';
264
- break;
265
- }
266
-
267
- state.initialNoToolRecoveries = 0;
268
-
269
- // Pre-execution hook (e.g. react's repo content guard)
270
- if (onBeforeToolExecution) {
271
- const directive = onBeforeToolExecution(ctx, state, stepResult);
272
- if (directive === 'continue') continue;
273
- if (directive === 'break') break;
274
- }
275
-
276
- // Execute tool calls
277
- const { executeToolCalls } = await import('./tool-executor.mjs');
278
- const { results, bailout } = await executeToolCalls(toolCalls, {
279
- toolToTwin,
280
- harnessName,
281
- step: step + 1,
282
- log,
283
- counters: state,
284
- maxConsecutiveErrors,
285
- onSuccess: onToolSuccess,
286
- });
287
-
288
- // Record trace
289
- if (state.agentTrace) {
290
- state.agentTrace.addStep({
291
- step: step + 1,
292
- thinking,
293
- text,
294
- toolCalls: toolCalls.map((tc) => ({ name: tc.name, arguments: tc.arguments })),
295
- durationMs: iterDurationMs,
296
- });
297
- }
298
-
299
- if (bailout) {
300
- state.exitReason = 'consecutive_errors';
301
- break;
302
- }
303
-
304
- // Append tool results to conversation
305
- state.messages = appendToolResults(provider, state.messages, toolCalls, results);
306
-
307
- // Post-execution hook
308
- if (onAfterToolExecution) {
309
- onAfterToolExecution(ctx, state, stepResult);
310
- }
311
- }
312
- } finally {
313
- const totalTimeMs = Date.now() - runStart;
314
-
315
- log.summary({
316
- iterations: state.stepsCompleted,
317
- totalInputTokens: state.totalInputTokens,
318
- totalOutputTokens: state.totalOutputTokens,
319
- totalTimeMs,
320
- toolCallCount: state.totalToolCalls,
321
- toolErrorCount: state.totalToolErrors,
322
- exitReason: state.exitReason,
323
- });
324
-
325
- writeMetrics({
326
- inputTokens: state.totalInputTokens,
327
- outputTokens: state.totalOutputTokens,
328
- llmCallCount: state.stepsCompleted,
329
- toolCallCount: state.totalToolCalls,
330
- toolErrorCount: state.totalToolErrors,
331
- totalTimeMs,
332
- exitReason: state.exitReason,
333
- provider,
334
- model,
335
- });
336
-
337
- if (state.agentTrace) {
338
- state.agentTrace.flush();
339
- }
340
-
341
- process.stderr.write(
342
- `\n[${harnessName}] Summary: ${state.stepsCompleted} iterations, ${state.totalToolCalls} tool calls ` +
343
- `(${state.totalToolErrors} errors), ${state.totalInputTokens} input tokens, ` +
344
- `${state.totalOutputTokens} output tokens, ${(totalTimeMs / 1000).toFixed(1)}s total\n`
345
- );
346
-
347
- if (state.exitReason === 'llm_error') {
348
- process.exit(1);
349
- }
350
- }
351
- }
352
-
353
- // Re-export for convenience — harnesses that need to build custom initial messages
354
- export { appendUserInstruction };