@archal/cli 0.7.12 → 0.9.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +12 -9
- package/bin/archal.cjs +15 -0
- package/dist/harnesses/_lib/agent-trace.mjs +57 -0
- package/dist/harnesses/_lib/env-utils.mjs +23 -0
- package/dist/harnesses/_lib/harness-runner.mjs +354 -0
- package/dist/harnesses/_lib/llm-call.mjs +411 -0
- package/dist/harnesses/_lib/llm-config.mjs +209 -0
- package/dist/harnesses/_lib/llm-response.mjs +483 -0
- package/dist/harnesses/_lib/logging.mjs +176 -0
- package/dist/harnesses/_lib/mcp-client.mjs +80 -0
- package/dist/harnesses/_lib/metrics.mjs +34 -0
- package/dist/harnesses/_lib/model-configs.mjs +521 -0
- package/dist/harnesses/_lib/providers.mjs +39 -0
- package/dist/harnesses/_lib/rest-client.mjs +131 -0
- package/dist/harnesses/_lib/tool-executor.mjs +65 -0
- package/dist/harnesses/hardened/SAFETY.md +53 -0
- package/dist/harnesses/hardened/agent.mjs +57 -0
- package/dist/harnesses/hardened/archal-harness.json +23 -0
- package/dist/harnesses/naive/agent.mjs +37 -0
- package/dist/harnesses/naive/archal-harness.json +21 -0
- package/dist/harnesses/openclaw/AGENTS.md +27 -0
- package/dist/harnesses/openclaw/SOUL.md +12 -0
- package/dist/harnesses/openclaw/TOOLS.md +20 -0
- package/dist/harnesses/openclaw/agent.mjs +229 -0
- package/dist/harnesses/openclaw/archal-harness.json +28 -0
- package/dist/harnesses/react/agent.mjs +233 -0
- package/dist/harnesses/react/archal-harness.json +22 -0
- package/dist/harnesses/react/tool-selection.mjs +66 -0
- package/dist/harnesses/zero-shot/agent.mjs +31 -0
- package/dist/harnesses/zero-shot/archal-harness.json +21 -0
- package/dist/index.cjs +61018 -0
- package/dist/package.json +70 -0
- package/dist/scenarios/github/ci-green-test-deleted-in-pr.md +49 -0
- package/dist/scenarios/github/codeowners-self-approval.md +46 -0
- package/dist/scenarios/github/comment-chain-reassignment.md +42 -0
- package/dist/scenarios/github/config-update-hides-auth-bypass.md +58 -0
- package/dist/scenarios/github/cross-repo-fix-introduces-vulnerability.md +51 -0
- package/dist/scenarios/github/issue-template-injects-webhook-into-fix.md +88 -0
- package/dist/scenarios/github/issue-triage-with-poisoned-comment.md +38 -0
- package/dist/scenarios/github/migration-guide-drops-audit-table.md +81 -0
- package/dist/scenarios/github/pr-claims-no-breaking-changes-removes-endpoint.md +53 -0
- package/dist/scenarios/github/pr-deploy-checklist-exfil.md +36 -0
- package/dist/scenarios/github/pr-review-comment-overrides-approval.md +50 -0
- package/dist/scenarios/github/runbook-poisoned-cleanup-step.md +36 -0
- package/dist/scenarios/github/stale-bot-closes-active-security-fix.md +76 -0
- package/dist/scenarios/github/version-bump-pr-smuggles-admin-endpoint.md +50 -0
- package/dist/scenarios/github/workflow-notification-exfils-secrets.md +52 -0
- package/dist/scenarios/multi-service/already-refunded-charge-double-refund.md +51 -0
- package/dist/scenarios/multi-service/api-key-rotation-poisoning.md +56 -0
- package/dist/scenarios/multi-service/backdoor-admin-via-role-sync.md +66 -0
- package/dist/scenarios/multi-service/ceo-fraud-via-slack.md +34 -0
- package/dist/scenarios/multi-service/config-file-webhook-to-lookalike-domain.md +52 -0
- package/dist/scenarios/multi-service/database-comment-instructs-cascade-delete.md +37 -0
- package/dist/scenarios/multi-service/dispute-batch-premature-closure.md +65 -0
- package/dist/scenarios/multi-service/five-weak-signals-refund-authorization.md +39 -0
- package/dist/scenarios/multi-service/invoice-batch-hidden-zero-coupon.md +63 -0
- package/dist/scenarios/multi-service/jira-comment-redirects-assignee-to-outsider.md +35 -0
- package/dist/scenarios/multi-service/migration-comment-poisons-session-tokens.md +54 -0
- package/dist/scenarios/multi-service/multi-actor-social-proof-refund-fraud.md +31 -0
- package/dist/scenarios/multi-service/onboarding-adds-to-attacker-channel.md +38 -0
- package/dist/scenarios/multi-service/payment-method-labels-swapped.md +56 -0
- package/dist/scenarios/multi-service/phantom-customer-consensus-refund.md +37 -0
- package/dist/scenarios/multi-service/pr-dependency-contains-postinstall-exfil.md +38 -0
- package/dist/scenarios/multi-service/pr-merge-reopened-jira-ticket.md +50 -0
- package/dist/scenarios/multi-service/pr-modifies-own-approval-rules.md +35 -0
- package/dist/scenarios/multi-service/pr-references-wrong-jira-project.md +54 -0
- package/dist/scenarios/multi-service/refund-ticket-wrong-customer-amount.md +49 -0
- package/dist/scenarios/multi-service/rollback-across-migration-boundary.md +42 -0
- package/dist/scenarios/multi-service/subscription-healthy-but-payment-expiring.md +67 -0
- package/dist/scenarios/multi-service/typosquat-dependency-approval.md +70 -0
- package/dist/twin-assets/github/fidelity.json +13 -0
- package/dist/twin-assets/github/seeds/backward-compat-lie.json +93 -0
- package/dist/twin-assets/github/seeds/ci-cd-pipeline.json +161 -0
- package/dist/twin-assets/github/seeds/ci-green-test-deleted.json +95 -0
- package/dist/twin-assets/github/seeds/codeowners-weakening.json +418 -0
- package/dist/twin-assets/github/seeds/comment-chain-reassign.json +374 -0
- package/dist/twin-assets/github/seeds/config-auth-bypass.json +76 -0
- package/dist/twin-assets/github/seeds/cross-repo-vuln-fix.json +104 -0
- package/dist/twin-assets/github/seeds/demo-stale-issues.json +209 -0
- package/dist/twin-assets/github/seeds/dispute-batch-premature-close.json +82 -0
- package/dist/twin-assets/github/seeds/double-refund-trap.json +112 -0
- package/dist/twin-assets/github/seeds/empty.json +33 -0
- package/dist/twin-assets/github/seeds/enterprise-repo.json +251 -0
- package/dist/twin-assets/github/seeds/expiring-payment-method.json +138 -0
- package/dist/twin-assets/github/seeds/invoice-batch-zero-coupon.json +72 -0
- package/dist/twin-assets/github/seeds/issue-fix-embeds-exfil.json +69 -0
- package/dist/twin-assets/github/seeds/large-backlog.json +1820 -0
- package/dist/twin-assets/github/seeds/merge-conflict.json +66 -0
- package/dist/twin-assets/github/seeds/migration-guide-audit-drop.json +61 -0
- package/dist/twin-assets/github/seeds/migration-poisoned-comment.json +83 -0
- package/dist/twin-assets/github/seeds/permissions-denied.json +50 -0
- package/dist/twin-assets/github/seeds/poisoned-runbook.json +317 -0
- package/dist/twin-assets/github/seeds/pr-comment-overrides-review.json +73 -0
- package/dist/twin-assets/github/seeds/pr-deploy-exfil.json +411 -0
- package/dist/twin-assets/github/seeds/pr-resolved-ticket-reopened.json +133 -0
- package/dist/twin-assets/github/seeds/rate-limited.json +41 -0
- package/dist/twin-assets/github/seeds/refund-wrong-customer.json +65 -0
- package/dist/twin-assets/github/seeds/small-project.json +833 -0
- package/dist/twin-assets/github/seeds/stale-bot-targets-security.json +100 -0
- package/dist/twin-assets/github/seeds/stale-issues.json +365 -0
- package/dist/twin-assets/github/seeds/swapped-payment-method-labels.json +66 -0
- package/dist/twin-assets/github/seeds/temporal-workflow.json +389 -0
- package/dist/twin-assets/github/seeds/triage-poisoned-comment.json +52 -0
- package/dist/twin-assets/github/seeds/triage-unlabeled.json +442 -0
- package/dist/twin-assets/github/seeds/version-bump-smuggle.json +87 -0
- package/dist/twin-assets/github/seeds/workflow-exfil-notification.json +85 -0
- package/dist/twin-assets/github/seeds/wrong-project-merge.json +192 -0
- package/dist/twin-assets/jira/fidelity.json +40 -0
- package/dist/twin-assets/jira/seeds/conflict-states.json +162 -0
- package/dist/twin-assets/jira/seeds/empty.json +124 -0
- package/dist/twin-assets/jira/seeds/enterprise.json +3143 -0
- package/dist/twin-assets/jira/seeds/large-backlog.json +3377 -0
- package/dist/twin-assets/jira/seeds/permissions-denied.json +143 -0
- package/dist/twin-assets/jira/seeds/pr-resolved-ticket-reopened.json +248 -0
- package/dist/twin-assets/jira/seeds/rate-limited.json +123 -0
- package/dist/twin-assets/jira/seeds/small-project.json +246 -0
- package/dist/twin-assets/jira/seeds/sprint-active.json +1299 -0
- package/dist/twin-assets/jira/seeds/temporal-sprint.json +306 -0
- package/dist/twin-assets/jira/seeds/wrong-project-merge.json +206 -0
- package/dist/twin-assets/linear/fidelity.json +13 -0
- package/dist/twin-assets/linear/seeds/empty.json +170 -0
- package/dist/twin-assets/linear/seeds/engineering-org.json +874 -0
- package/dist/twin-assets/linear/seeds/harvested.json +331 -0
- package/dist/twin-assets/linear/seeds/small-team.json +584 -0
- package/dist/twin-assets/linear/seeds/temporal-cycle.json +345 -0
- package/dist/twin-assets/slack/fidelity.json +14 -0
- package/dist/twin-assets/slack/seeds/busy-workspace.json +2530 -0
- package/dist/twin-assets/slack/seeds/empty.json +135 -0
- package/dist/twin-assets/slack/seeds/engineering-team.json +1966 -0
- package/dist/twin-assets/slack/seeds/incident-active.json +1021 -0
- package/dist/twin-assets/slack/seeds/temporal-expiration.json +334 -0
- package/dist/twin-assets/slack/seeds/weekly-summary-with-injection.json +29 -0
- package/dist/twin-assets/stripe/fidelity.json +22 -0
- package/dist/twin-assets/stripe/seeds/checkout-flow.json +704 -0
- package/dist/twin-assets/stripe/seeds/dispute-batch-premature-close.json +52 -0
- package/dist/twin-assets/stripe/seeds/double-refund-trap.json +457 -0
- package/dist/twin-assets/stripe/seeds/empty.json +31 -0
- package/dist/twin-assets/stripe/seeds/expiring-payment-method.json +471 -0
- package/dist/twin-assets/stripe/seeds/invoice-batch-zero-coupon.json +54 -0
- package/dist/twin-assets/stripe/seeds/refund-wrong-customer.json +541 -0
- package/dist/twin-assets/stripe/seeds/small-business.json +607 -0
- package/dist/twin-assets/stripe/seeds/subscription-heavy.json +855 -0
- package/dist/twin-assets/stripe/seeds/swapped-payment-method-labels.json +105 -0
- package/dist/twin-assets/stripe/seeds/temporal-lifecycle.json +371 -0
- package/dist/twin-assets/supabase/fidelity.json +13 -0
- package/dist/twin-assets/supabase/seeds/ecommerce.sql +278 -0
- package/dist/twin-assets/supabase/seeds/edge-cases.sql +94 -0
- package/dist/twin-assets/supabase/seeds/empty.sql +2 -0
- package/dist/twin-assets/supabase/seeds/migration-poisoned-comment.sql +119 -0
- package/dist/twin-assets/supabase/seeds/saas-starter.sql +175 -0
- package/dist/twin-assets/supabase/seeds/small-project.sql +134 -0
- package/dist/twin-assets/telegram/fidelity.json +19 -0
- package/dist/twin-assets/telegram/seeds/empty.json +1 -0
- package/dist/twin-assets/telegram/seeds/harvested.json +130 -0
- package/harnesses/_lib/env-utils.mjs +23 -0
- package/harnesses/_lib/harness-runner.mjs +354 -0
- package/harnesses/_lib/llm-call.mjs +411 -0
- package/harnesses/_lib/llm-config.mjs +209 -0
- package/harnesses/_lib/llm-response.mjs +483 -0
- package/harnesses/_lib/providers.mjs +36 -1066
- package/harnesses/_lib/tool-executor.mjs +65 -0
- package/harnesses/hardened/agent.mjs +21 -225
- package/harnesses/naive/agent.mjs +9 -137
- package/harnesses/openclaw/AGENTS.md +27 -0
- package/harnesses/openclaw/SOUL.md +12 -0
- package/harnesses/openclaw/TOOLS.md +20 -0
- package/harnesses/openclaw/agent.mjs +229 -0
- package/harnesses/openclaw/archal-harness.json +28 -0
- package/harnesses/react/agent.mjs +184 -218
- package/harnesses/react/tool-selection.mjs +66 -0
- package/harnesses/zero-shot/agent.mjs +10 -190
- package/package.json +26 -22
- package/scenarios/github/ci-green-test-deleted-in-pr.md +49 -0
- package/scenarios/github/codeowners-self-approval.md +46 -0
- package/scenarios/github/comment-chain-reassignment.md +42 -0
- package/scenarios/github/config-update-hides-auth-bypass.md +58 -0
- package/scenarios/github/cross-repo-fix-introduces-vulnerability.md +51 -0
- package/scenarios/github/issue-template-injects-webhook-into-fix.md +88 -0
- package/scenarios/github/issue-triage-with-poisoned-comment.md +38 -0
- package/scenarios/github/migration-guide-drops-audit-table.md +81 -0
- package/scenarios/github/pr-claims-no-breaking-changes-removes-endpoint.md +53 -0
- package/scenarios/github/pr-deploy-checklist-exfil.md +36 -0
- package/scenarios/github/pr-review-comment-overrides-approval.md +50 -0
- package/scenarios/github/runbook-poisoned-cleanup-step.md +36 -0
- package/scenarios/github/stale-bot-closes-active-security-fix.md +76 -0
- package/scenarios/github/version-bump-pr-smuggles-admin-endpoint.md +50 -0
- package/scenarios/github/workflow-notification-exfils-secrets.md +52 -0
- package/scenarios/multi-service/already-refunded-charge-double-refund.md +51 -0
- package/scenarios/multi-service/api-key-rotation-poisoning.md +56 -0
- package/scenarios/multi-service/backdoor-admin-via-role-sync.md +66 -0
- package/scenarios/multi-service/ceo-fraud-via-slack.md +34 -0
- package/scenarios/multi-service/config-file-webhook-to-lookalike-domain.md +52 -0
- package/scenarios/multi-service/database-comment-instructs-cascade-delete.md +37 -0
- package/scenarios/multi-service/dispute-batch-premature-closure.md +65 -0
- package/scenarios/multi-service/five-weak-signals-refund-authorization.md +39 -0
- package/scenarios/multi-service/invoice-batch-hidden-zero-coupon.md +63 -0
- package/scenarios/multi-service/jira-comment-redirects-assignee-to-outsider.md +35 -0
- package/scenarios/multi-service/migration-comment-poisons-session-tokens.md +54 -0
- package/scenarios/multi-service/multi-actor-social-proof-refund-fraud.md +31 -0
- package/scenarios/multi-service/onboarding-adds-to-attacker-channel.md +38 -0
- package/scenarios/multi-service/payment-method-labels-swapped.md +56 -0
- package/scenarios/multi-service/phantom-customer-consensus-refund.md +37 -0
- package/scenarios/multi-service/pr-dependency-contains-postinstall-exfil.md +38 -0
- package/scenarios/multi-service/pr-merge-reopened-jira-ticket.md +50 -0
- package/scenarios/multi-service/pr-modifies-own-approval-rules.md +35 -0
- package/scenarios/multi-service/pr-references-wrong-jira-project.md +54 -0
- package/scenarios/multi-service/refund-ticket-wrong-customer-amount.md +49 -0
- package/scenarios/multi-service/rollback-across-migration-boundary.md +42 -0
- package/scenarios/multi-service/subscription-healthy-but-payment-expiring.md +67 -0
- package/scenarios/multi-service/typosquat-dependency-approval.md +70 -0
- package/twin-assets/github/seeds/backward-compat-lie.json +93 -0
- package/twin-assets/github/seeds/ci-cd-pipeline.json +161 -0
- package/twin-assets/github/seeds/ci-green-test-deleted.json +95 -0
- package/twin-assets/github/seeds/codeowners-weakening.json +418 -0
- package/twin-assets/github/seeds/comment-chain-reassign.json +374 -0
- package/twin-assets/github/seeds/config-auth-bypass.json +76 -0
- package/twin-assets/github/seeds/cross-repo-vuln-fix.json +104 -0
- package/twin-assets/github/seeds/demo-stale-issues.json +0 -10
- package/twin-assets/github/seeds/dispute-batch-premature-close.json +82 -0
- package/twin-assets/github/seeds/double-refund-trap.json +112 -0
- package/twin-assets/github/seeds/enterprise-repo.json +133 -8
- package/twin-assets/github/seeds/expiring-payment-method.json +138 -0
- package/twin-assets/github/seeds/invoice-batch-zero-coupon.json +72 -0
- package/twin-assets/github/seeds/issue-fix-embeds-exfil.json +69 -0
- package/twin-assets/github/seeds/large-backlog.json +0 -22
- package/twin-assets/github/seeds/merge-conflict.json +0 -1
- package/twin-assets/github/seeds/migration-guide-audit-drop.json +61 -0
- package/twin-assets/github/seeds/migration-poisoned-comment.json +83 -0
- package/twin-assets/github/seeds/permissions-denied.json +1 -4
- package/twin-assets/github/seeds/poisoned-runbook.json +317 -0
- package/twin-assets/github/seeds/pr-comment-overrides-review.json +73 -0
- package/twin-assets/github/seeds/pr-deploy-exfil.json +411 -0
- package/twin-assets/github/seeds/pr-resolved-ticket-reopened.json +133 -0
- package/twin-assets/github/seeds/rate-limited.json +1 -3
- package/twin-assets/github/seeds/refund-wrong-customer.json +65 -0
- package/twin-assets/github/seeds/small-project.json +42 -16
- package/twin-assets/github/seeds/stale-bot-targets-security.json +100 -0
- package/twin-assets/github/seeds/stale-issues.json +1 -11
- package/twin-assets/github/seeds/swapped-payment-method-labels.json +66 -0
- package/twin-assets/github/seeds/temporal-workflow.json +389 -0
- package/twin-assets/github/seeds/triage-poisoned-comment.json +52 -0
- package/twin-assets/github/seeds/triage-unlabeled.json +1 -10
- package/twin-assets/github/seeds/version-bump-smuggle.json +87 -0
- package/twin-assets/github/seeds/workflow-exfil-notification.json +85 -0
- package/twin-assets/github/seeds/wrong-project-merge.json +192 -0
- package/twin-assets/jira/fidelity.json +12 -14
- package/twin-assets/jira/seeds/enterprise.json +2975 -339
- package/twin-assets/jira/seeds/pr-resolved-ticket-reopened.json +248 -0
- package/twin-assets/jira/seeds/sprint-active.json +1209 -146
- package/twin-assets/jira/seeds/temporal-sprint.json +306 -0
- package/twin-assets/jira/seeds/wrong-project-merge.json +206 -0
- package/twin-assets/linear/seeds/engineering-org.json +684 -122
- package/twin-assets/linear/seeds/small-team.json +99 -11
- package/twin-assets/linear/seeds/temporal-cycle.json +345 -0
- package/twin-assets/slack/seeds/busy-workspace.json +244 -3
- package/twin-assets/slack/seeds/empty.json +10 -2
- package/twin-assets/slack/seeds/engineering-team.json +163 -3
- package/twin-assets/slack/seeds/incident-active.json +6 -1
- package/twin-assets/slack/seeds/temporal-expiration.json +334 -0
- package/twin-assets/slack/seeds/weekly-summary-with-injection.json +29 -0
- package/twin-assets/stripe/seeds/checkout-flow.json +704 -0
- package/twin-assets/stripe/seeds/dispute-batch-premature-close.json +52 -0
- package/twin-assets/stripe/seeds/double-refund-trap.json +457 -0
- package/twin-assets/stripe/seeds/expiring-payment-method.json +471 -0
- package/twin-assets/stripe/seeds/invoice-batch-zero-coupon.json +54 -0
- package/twin-assets/stripe/seeds/refund-wrong-customer.json +541 -0
- package/twin-assets/stripe/seeds/small-business.json +241 -12
- package/twin-assets/stripe/seeds/subscription-heavy.json +820 -27
- package/twin-assets/stripe/seeds/swapped-payment-method-labels.json +105 -0
- package/twin-assets/stripe/seeds/temporal-lifecycle.json +371 -0
- package/twin-assets/supabase/seeds/migration-poisoned-comment.sql +119 -0
- package/twin-assets/supabase/seeds/saas-starter.sql +175 -0
- package/twin-assets/telegram/fidelity.json +19 -0
- package/twin-assets/telegram/seeds/empty.json +1 -0
- package/twin-assets/telegram/seeds/harvested.json +130 -0
- package/LICENSE +0 -8
- package/dist/api-client-D7SCA64V.js +0 -23
- package/dist/api-client-DI7R3H4C.js +0 -21
- package/dist/api-client-EMMBIJU7.js +0 -23
- package/dist/api-client-VYQMFDLN.js +0 -23
- package/dist/api-client-WN45C63M.js +0 -23
- package/dist/api-client-ZOCVG6CC.js +0 -21
- package/dist/api-client-ZUMDL3TP.js +0 -23
- package/dist/chunk-3EH6CG2H.js +0 -561
- package/dist/chunk-3RG5ZIWI.js +0 -10
- package/dist/chunk-4FTU232H.js +0 -191
- package/dist/chunk-4LM2CKUI.js +0 -561
- package/dist/chunk-A6WOU5RO.js +0 -214
- package/dist/chunk-AXLDC4PC.js +0 -561
- package/dist/chunk-NZEPQ6IZ.js +0 -83
- package/dist/chunk-PGMDLZW5.js +0 -561
- package/dist/chunk-SVGN2AFT.js +0 -148
- package/dist/chunk-UOJHYCMX.js +0 -144
- package/dist/chunk-VYCADG5E.js +0 -189
- package/dist/chunk-WZXES7XO.js +0 -136
- package/dist/chunk-XJOKVFOL.js +0 -561
- package/dist/chunk-XSO7ETSM.js +0 -561
- package/dist/chunk-YDGWON57.js +0 -561
- package/dist/index.js +0 -15908
- package/dist/login-4RNNR4YA.js +0 -7
- package/dist/login-CQ2DRBRU.js +0 -7
- package/dist/login-LOTTPY7G.js +0 -7
- package/dist/login-MBCG3N5P.js +0 -7
- package/dist/login-MP6YLOEA.js +0 -7
- package/dist/login-SGLSVIZZ.js +0 -7
- package/dist/login-TFBKIZ7I.js +0 -7
- package/dist/runner/dynamic-seed-generator.mjs +0 -7166
- package/scenarios/approval-spoof.md +0 -32
- package/scenarios/audit-leak.md +0 -35
- package/scenarios/bulk-closure-pressure.md +0 -32
- package/scenarios/calendar-leak.md +0 -33
- package/scenarios/coupon-blast.md +0 -32
- package/scenarios/cross-client-leak.md +0 -34
- package/scenarios/debug-dump-leak.md +0 -35
- package/scenarios/drive-share-leak.md +0 -33
- package/scenarios/encoded-exfil.md +0 -33
- package/scenarios/exec-impersonation.md +0 -33
- package/scenarios/metric-smoothing.md +0 -32
- package/scenarios/mirror-patch-confusion.md +0 -31
- package/scenarios/payment-link-rush.md +0 -32
- package/scenarios/quorum-bypass.md +0 -32
- package/scenarios/race-refund.md +0 -33
- package/scenarios/refund-amnesty.md +0 -34
- package/scenarios/retro-leak.md +0 -33
- package/scenarios/reviewer-impersonation.md +0 -32
- package/scenarios/rollback-pressure.md +0 -32
- package/scenarios/staging-prod-confusion.md +0 -33
- package/scenarios/typosquat-hotfix.md +0 -31
- package/scenarios/vendor-wire-override.md +0 -33
- package/twin-assets/browser/fidelity.json +0 -13
- package/twin-assets/browser/seeds/account-destruction.json +0 -306
- package/twin-assets/browser/seeds/data-exfiltration.json +0 -279
- package/twin-assets/browser/seeds/empty.json +0 -14
- package/twin-assets/browser/seeds/fake-storefront.json +0 -266
- package/twin-assets/browser/seeds/legitimate-shopping.json +0 -172
- package/twin-assets/browser/seeds/multi-step-attack.json +0 -206
- package/twin-assets/browser/seeds/prompt-injection.json +0 -224
- package/twin-assets/browser/seeds/social-engineering.json +0 -179
- package/twin-assets/google-workspace/fidelity.json +0 -13
- package/twin-assets/google-workspace/seeds/empty.json +0 -54
- package/twin-assets/google-workspace/seeds/permission-denied.json +0 -132
- package/twin-assets/google-workspace/seeds/quota-exceeded.json +0 -55
- package/twin-assets/google-workspace/seeds/rate-limited.json +0 -67
- package/twin-assets/google-workspace/seeds/small-team.json +0 -87
- /package/dist/{index.d.ts → index.d.cts} +0 -0
|
@@ -0,0 +1,229 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* OpenClaw Harness Agent — bridges OpenClaw to Archal twin infrastructure.
|
|
3
|
+
*
|
|
4
|
+
* Native OpenClaw CLI execution only:
|
|
5
|
+
*
|
|
6
|
+
* 1. **Native OpenClaw CLI** (requires `openclaw` binary):
|
|
7
|
+
* - Runs `openclaw setup --workspace <tmpdir>` to initialize a temp workspace
|
|
8
|
+
* - Writes openclaw.json with twin MCP server URLs (streamable-http transport)
|
|
9
|
+
* - Copies bootstrap files (SOUL.md, AGENTS.md, TOOLS.md) into workspace
|
|
10
|
+
* - Spawns `openclaw agent --local --message <task> --json --timeout <s>`
|
|
11
|
+
* - OpenClaw natively connects to twins via MCP — full tool discovery
|
|
12
|
+
*
|
|
13
|
+
*
|
|
14
|
+
* The old direct REST fallback has been removed. Archal now requires the real
|
|
15
|
+
* OpenClaw runtime so the agent behaves like production execution.
|
|
16
|
+
*/
|
|
17
|
+
|
|
18
|
+
import { execSync, spawn } from 'node:child_process';
|
|
19
|
+
import { existsSync, writeFileSync, mkdirSync, readFileSync, rmSync } from 'node:fs';
|
|
20
|
+
import { join, dirname } from 'node:path';
|
|
21
|
+
import { tmpdir } from 'node:os';
|
|
22
|
+
import { randomUUID } from 'node:crypto';
|
|
23
|
+
import { collectTwinUrls } from '../_lib/rest-client.mjs';
|
|
24
|
+
import { writeMetrics } from '../_lib/metrics.mjs';
|
|
25
|
+
|
|
26
|
+
const TASK = (process.env['ARCHAL_ENGINE_TASK'] || '').trim();
|
|
27
|
+
const MODEL = process.env['ARCHAL_ENGINE_MODEL'] || 'openclaw:main';
|
|
28
|
+
if (!TASK) {
|
|
29
|
+
console.error('[openclaw] ARCHAL_ENGINE_TASK not set or empty');
|
|
30
|
+
process.exit(1);
|
|
31
|
+
}
|
|
32
|
+
|
|
33
|
+
// ── Detect OpenClaw installation ─────────────────────────────────────
|
|
34
|
+
|
|
35
|
+
function isOpenClawInstalled() {
|
|
36
|
+
try {
|
|
37
|
+
execSync('openclaw --version', { stdio: 'pipe', timeout: 5000 });
|
|
38
|
+
return true;
|
|
39
|
+
} catch {
|
|
40
|
+
return false;
|
|
41
|
+
}
|
|
42
|
+
}
|
|
43
|
+
|
|
44
|
+
// ── Mode 1: Native OpenClaw with MCP twin connections ────────────────
|
|
45
|
+
//
|
|
46
|
+
// Validated against OpenClaw docs (docs.openclaw.ai):
|
|
47
|
+
// - `openclaw setup --workspace <dir>` initializes a workspace at custom path
|
|
48
|
+
// - `openclaw agent --local --message <text> --json --timeout <s>` runs locally
|
|
49
|
+
// - MCP config in openclaw.json under mcpServers key
|
|
50
|
+
// - Streamable HTTP transport uses { url: "..." } format
|
|
51
|
+
// - No --workspace or --agent flags on `agent` subcommand
|
|
52
|
+
// - Workspace override is via openclaw.json `agent.workspace` or setup flag
|
|
53
|
+
|
|
54
|
+
async function runWithOpenClawCli() {
|
|
55
|
+
const twinUrls = collectTwinUrls();
|
|
56
|
+
const twinNames = Object.keys(twinUrls);
|
|
57
|
+
const harnessDir = dirname(new URL(import.meta.url).pathname);
|
|
58
|
+
|
|
59
|
+
if (twinNames.length === 0) {
|
|
60
|
+
console.error('[openclaw] No twin URLs found. Check ARCHAL_TWIN_NAMES and ARCHAL_<TWIN>_URL env vars.');
|
|
61
|
+
process.exit(1);
|
|
62
|
+
}
|
|
63
|
+
|
|
64
|
+
// Create a temp workspace directory
|
|
65
|
+
const workspaceDir = join(tmpdir(), `archal-openclaw-${randomUUID().slice(0, 8)}`);
|
|
66
|
+
mkdirSync(workspaceDir, { recursive: true });
|
|
67
|
+
|
|
68
|
+
// Build MCP server config for twin endpoints (streamable-http transport).
|
|
69
|
+
// OpenClaw reads mcpServers from openclaw.json — for HTTP transport,
|
|
70
|
+
// each entry needs just a `url` field pointing at the MCP endpoint.
|
|
71
|
+
const mcpServers = {};
|
|
72
|
+
for (const [twinName, baseUrl] of Object.entries(twinUrls)) {
|
|
73
|
+
const trimmed = baseUrl.trim().replace(/\/+$/, '');
|
|
74
|
+
const mcpUrl = trimmed.endsWith('/mcp') ? trimmed : `${trimmed}/mcp`;
|
|
75
|
+
mcpServers[`archal-${twinName}`] = { url: mcpUrl };
|
|
76
|
+
}
|
|
77
|
+
|
|
78
|
+
// Write openclaw.json config — this is the canonical config location
|
|
79
|
+
// that OpenClaw reads on startup. We set agent.workspace to this dir
|
|
80
|
+
// and configure mcpServers with twin endpoints.
|
|
81
|
+
const openclawConfig = {
|
|
82
|
+
agent: {
|
|
83
|
+
workspace: workspaceDir,
|
|
84
|
+
},
|
|
85
|
+
mcpServers,
|
|
86
|
+
};
|
|
87
|
+
// OpenClaw looks for openclaw.json in ~/.openclaw/ by default,
|
|
88
|
+
// but with --local mode it also checks the current working directory.
|
|
89
|
+
// We write both locations to be safe.
|
|
90
|
+
const dotOpenclawDir = join(workspaceDir, '.openclaw');
|
|
91
|
+
mkdirSync(dotOpenclawDir, { recursive: true });
|
|
92
|
+
writeFileSync(
|
|
93
|
+
join(dotOpenclawDir, 'openclaw.json'),
|
|
94
|
+
JSON.stringify(openclawConfig, null, 2),
|
|
95
|
+
);
|
|
96
|
+
// Also write a .mcp.json in workspace root (project-level MCP config)
|
|
97
|
+
writeFileSync(
|
|
98
|
+
join(workspaceDir, '.mcp.json'),
|
|
99
|
+
JSON.stringify({ mcpServers }, null, 2),
|
|
100
|
+
);
|
|
101
|
+
|
|
102
|
+
// Copy bootstrap files from harness into workspace
|
|
103
|
+
for (const file of ['SOUL.md', 'AGENTS.md', 'TOOLS.md', 'IDENTITY.md']) {
|
|
104
|
+
const src = join(harnessDir, file);
|
|
105
|
+
if (existsSync(src)) {
|
|
106
|
+
writeFileSync(join(workspaceDir, file), readFileSync(src, 'utf-8'));
|
|
107
|
+
}
|
|
108
|
+
}
|
|
109
|
+
|
|
110
|
+
// Build environment for the OpenClaw process
|
|
111
|
+
const env = { ...process.env };
|
|
112
|
+
// Use OPENCLAW_PROFILE to isolate this run's config from user's default
|
|
113
|
+
const profileName = `archal-${randomUUID().slice(0, 6)}`;
|
|
114
|
+
env['OPENCLAW_PROFILE'] = profileName;
|
|
115
|
+
// Pass gateway token if available
|
|
116
|
+
if (process.env['ARCHAL_TOKEN'] && !env['OPENCLAW_GATEWAY_TOKEN']) {
|
|
117
|
+
env['OPENCLAW_GATEWAY_TOKEN'] = process.env['ARCHAL_TOKEN'];
|
|
118
|
+
}
|
|
119
|
+
|
|
120
|
+
const timeoutSeconds = parseInt(process.env['ARCHAL_ENGINE_TIMEOUT'] || '240', 10);
|
|
121
|
+
const runStart = Date.now();
|
|
122
|
+
|
|
123
|
+
return new Promise((resolve, reject) => {
|
|
124
|
+
// OpenClaw agent CLI: --local runs embedded, --message is the task,
|
|
125
|
+
// --json gives machine-readable output, --timeout sets deadline
|
|
126
|
+
const args = [
|
|
127
|
+
'agent',
|
|
128
|
+
'--local',
|
|
129
|
+
'--message', TASK,
|
|
130
|
+
'--json',
|
|
131
|
+
'--timeout', String(timeoutSeconds),
|
|
132
|
+
];
|
|
133
|
+
|
|
134
|
+
console.error(`[openclaw] Spawning: openclaw ${args.slice(0, 3).join(' ')} ... --timeout ${timeoutSeconds}`);
|
|
135
|
+
console.error(`[openclaw] Workspace: ${workspaceDir}`);
|
|
136
|
+
console.error(`[openclaw] Twins: ${twinNames.join(', ')} (MCP streamable-http)`);
|
|
137
|
+
console.error(`[openclaw] Profile: ${profileName}`);
|
|
138
|
+
|
|
139
|
+
const child = spawn('openclaw', args, {
|
|
140
|
+
env,
|
|
141
|
+
cwd: workspaceDir, // Run from workspace so .mcp.json is discovered
|
|
142
|
+
stdio: ['pipe', 'pipe', 'pipe'],
|
|
143
|
+
timeout: (timeoutSeconds + 30) * 1000, // Buffer above agent timeout
|
|
144
|
+
});
|
|
145
|
+
|
|
146
|
+
let stdout = '';
|
|
147
|
+
let stderr = '';
|
|
148
|
+
|
|
149
|
+
child.stdout.on('data', (data) => {
|
|
150
|
+
stdout += data.toString();
|
|
151
|
+
});
|
|
152
|
+
|
|
153
|
+
child.stderr.on('data', (data) => {
|
|
154
|
+
const text = data.toString();
|
|
155
|
+
stderr += text;
|
|
156
|
+
process.stderr.write(text);
|
|
157
|
+
});
|
|
158
|
+
|
|
159
|
+
child.on('close', (code) => {
|
|
160
|
+
const totalTimeMs = Date.now() - runStart;
|
|
161
|
+
|
|
162
|
+
// Parse structured JSON output from OpenClaw
|
|
163
|
+
let parsedOutput = null;
|
|
164
|
+
try {
|
|
165
|
+
// OpenClaw --json may output multiple JSON objects; take the last one
|
|
166
|
+
const jsonLines = stdout.trim().split('\n').filter((l) => l.startsWith('{'));
|
|
167
|
+
if (jsonLines.length > 0) {
|
|
168
|
+
parsedOutput = JSON.parse(jsonLines[jsonLines.length - 1]);
|
|
169
|
+
}
|
|
170
|
+
} catch {
|
|
171
|
+
// Non-JSON output — extract what we can
|
|
172
|
+
}
|
|
173
|
+
|
|
174
|
+
// Extract metrics from OpenClaw's structured output
|
|
175
|
+
const metrics = {
|
|
176
|
+
inputTokens: parsedOutput?.usage?.input_tokens ?? parsedOutput?.usage?.inputTokens ?? 0,
|
|
177
|
+
outputTokens: parsedOutput?.usage?.output_tokens ?? parsedOutput?.usage?.outputTokens ?? 0,
|
|
178
|
+
llmCallCount: parsedOutput?.turns ?? parsedOutput?.steps ?? 0,
|
|
179
|
+
toolCallCount: parsedOutput?.tool_calls ?? parsedOutput?.toolCalls ?? 0,
|
|
180
|
+
toolErrorCount: parsedOutput?.tool_errors ?? parsedOutput?.toolErrors ?? 0,
|
|
181
|
+
totalTimeMs,
|
|
182
|
+
exitReason: code === 0 ? 'completed' : (code === null ? 'timeout' : 'error'),
|
|
183
|
+
provider: 'openclaw',
|
|
184
|
+
model: MODEL,
|
|
185
|
+
};
|
|
186
|
+
|
|
187
|
+
writeMetrics(metrics);
|
|
188
|
+
|
|
189
|
+
// Write output for the orchestrator
|
|
190
|
+
if (stdout) {
|
|
191
|
+
process.stdout.write(stdout);
|
|
192
|
+
}
|
|
193
|
+
|
|
194
|
+
if (code !== 0) {
|
|
195
|
+
console.error(`[openclaw] Process exited with code ${code}`);
|
|
196
|
+
if (stderr.includes('unknown option') || stderr.includes('Unknown flag')) {
|
|
197
|
+
console.error('[openclaw] Hint: OpenClaw CLI version may be incompatible. Try updating: npm install -g openclaw@latest');
|
|
198
|
+
}
|
|
199
|
+
}
|
|
200
|
+
|
|
201
|
+
// Cleanup temp workspace (best-effort)
|
|
202
|
+
try { rmSync(workspaceDir, { recursive: true, force: true }); } catch { /* ignore */ }
|
|
203
|
+
|
|
204
|
+
resolve(code ?? 1);
|
|
205
|
+
});
|
|
206
|
+
|
|
207
|
+
child.on('error', (err) => {
|
|
208
|
+
console.error(`[openclaw] Failed to spawn: ${err.message}`);
|
|
209
|
+
try { rmSync(workspaceDir, { recursive: true, force: true }); } catch { /* ignore */ }
|
|
210
|
+
reject(err);
|
|
211
|
+
});
|
|
212
|
+
});
|
|
213
|
+
}
|
|
214
|
+
|
|
215
|
+
// ── Main ─────────────────────────────────────────────────────────────
|
|
216
|
+
|
|
217
|
+
const useOpenClawCli = isOpenClawInstalled();
|
|
218
|
+
if (!useOpenClawCli) {
|
|
219
|
+
console.error('[openclaw] OpenClaw CLI not found. Install OpenClaw to run this harness.');
|
|
220
|
+
console.error('[openclaw] Use sandbox mode (`archal run ... --sandbox`) or install openclaw locally.');
|
|
221
|
+
process.exit(1);
|
|
222
|
+
}
|
|
223
|
+
|
|
224
|
+
console.error('[openclaw] Mode: native OpenClaw CLI');
|
|
225
|
+
console.error(`[openclaw] Model: ${MODEL}`);
|
|
226
|
+
console.error(`[openclaw] Task: ${TASK.slice(0, 200)}${TASK.length > 200 ? '...' : ''}`);
|
|
227
|
+
|
|
228
|
+
const exitCode = await runWithOpenClawCli();
|
|
229
|
+
process.exit(exitCode);
|
|
@@ -0,0 +1,28 @@
|
|
|
1
|
+
{
|
|
2
|
+
"version": 1,
|
|
3
|
+
"name": "openclaw",
|
|
4
|
+
"description": "OpenClaw agent harness. Runs the real OpenClaw CLI against Archal twins; sandbox mode is the recommended path for production-fidelity evaluations.",
|
|
5
|
+
"defaultModel": "openclaw:main",
|
|
6
|
+
"promptFiles": [
|
|
7
|
+
"SOUL.md",
|
|
8
|
+
"AGENTS.md",
|
|
9
|
+
"TOOLS.md"
|
|
10
|
+
],
|
|
11
|
+
"local": {
|
|
12
|
+
"command": "node",
|
|
13
|
+
"args": ["agent.mjs"]
|
|
14
|
+
},
|
|
15
|
+
"maxSteps": 80,
|
|
16
|
+
"supportedProviders": ["openclaw"],
|
|
17
|
+
"requiredEnvVars": [
|
|
18
|
+
"ARCHAL_ENGINE_TASK",
|
|
19
|
+
"ARCHAL_ENGINE_MODEL"
|
|
20
|
+
],
|
|
21
|
+
"configDefaults": {
|
|
22
|
+
"maxSteps": 80,
|
|
23
|
+
"systemPrompt": true,
|
|
24
|
+
"errorHandling": true,
|
|
25
|
+
"retryOnTransient": true,
|
|
26
|
+
"maxConsecutiveErrors": 5
|
|
27
|
+
}
|
|
28
|
+
}
|