npm - @agent-native/core - Versions diffs - 0.52.0 → 0.54.0 - Mend

@agent-native/core 0.52.0 → 0.54.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (267) hide show

package/README.md +41 -95
package/blueprints/action/crud.md +98 -0
package/blueprints/channel/discord.md +74 -0
package/blueprints/provider/stripe.md +87 -0
package/blueprints/sandbox/docker.md +78 -0
package/dist/action.d.ts +64 -1
package/dist/action.d.ts.map +1 -1
package/dist/action.js +73 -2
package/dist/action.js.map +1 -1
package/dist/agent/index.d.ts +1 -0
package/dist/agent/index.d.ts.map +1 -1
package/dist/agent/index.js +1 -0
package/dist/agent/index.js.map +1 -1
package/dist/agent/observational-memory/compactor.d.ts +43 -0
package/dist/agent/observational-memory/compactor.d.ts.map +1 -0
package/dist/agent/observational-memory/compactor.js +50 -0
package/dist/agent/observational-memory/compactor.js.map +1 -0
package/dist/agent/observational-memory/config.d.ts +37 -0
package/dist/agent/observational-memory/config.d.ts.map +1 -0
package/dist/agent/observational-memory/config.js +48 -0
package/dist/agent/observational-memory/config.js.map +1 -0
package/dist/agent/observational-memory/index.d.ts +26 -0
package/dist/agent/observational-memory/index.d.ts.map +1 -0
package/dist/agent/observational-memory/index.js +25 -0
package/dist/agent/observational-memory/index.js.map +1 -0
package/dist/agent/observational-memory/internal-run.d.ts +37 -0
package/dist/agent/observational-memory/internal-run.d.ts.map +1 -0
package/dist/agent/observational-memory/internal-run.js +59 -0
package/dist/agent/observational-memory/internal-run.js.map +1 -0
package/dist/agent/observational-memory/message-text.d.ts +13 -0
package/dist/agent/observational-memory/message-text.d.ts.map +1 -0
package/dist/agent/observational-memory/message-text.js +46 -0
package/dist/agent/observational-memory/message-text.js.map +1 -0
package/dist/agent/observational-memory/migrations.d.ts +13 -0
package/dist/agent/observational-memory/migrations.d.ts.map +1 -0
package/dist/agent/observational-memory/migrations.js +43 -0
package/dist/agent/observational-memory/migrations.js.map +1 -0
package/dist/agent/observational-memory/observer.d.ts +37 -0
package/dist/agent/observational-memory/observer.d.ts.map +1 -0
package/dist/agent/observational-memory/observer.js +82 -0
package/dist/agent/observational-memory/observer.js.map +1 -0
package/dist/agent/observational-memory/plugin.d.ts +16 -0
package/dist/agent/observational-memory/plugin.d.ts.map +1 -0
package/dist/agent/observational-memory/plugin.js +26 -0
package/dist/agent/observational-memory/plugin.js.map +1 -0
package/dist/agent/observational-memory/prompts.d.ts +27 -0
package/dist/agent/observational-memory/prompts.d.ts.map +1 -0
package/dist/agent/observational-memory/prompts.js +42 -0
package/dist/agent/observational-memory/prompts.js.map +1 -0
package/dist/agent/observational-memory/read.d.ts +45 -0
package/dist/agent/observational-memory/read.d.ts.map +1 -0
package/dist/agent/observational-memory/read.js +97 -0
package/dist/agent/observational-memory/read.js.map +1 -0
package/dist/agent/observational-memory/reflector.d.ts +31 -0
package/dist/agent/observational-memory/reflector.d.ts.map +1 -0
package/dist/agent/observational-memory/reflector.js +76 -0
package/dist/agent/observational-memory/reflector.js.map +1 -0
package/dist/agent/observational-memory/schema.d.ts +267 -0
package/dist/agent/observational-memory/schema.d.ts.map +1 -0
package/dist/agent/observational-memory/schema.js +48 -0
package/dist/agent/observational-memory/schema.js.map +1 -0
package/dist/agent/observational-memory/store.d.ts +52 -0
package/dist/agent/observational-memory/store.d.ts.map +1 -0
package/dist/agent/observational-memory/store.js +197 -0
package/dist/agent/observational-memory/store.js.map +1 -0
package/dist/agent/observational-memory/types.d.ts +61 -0
package/dist/agent/observational-memory/types.d.ts.map +1 -0
package/dist/agent/observational-memory/types.js +9 -0
package/dist/agent/observational-memory/types.js.map +1 -0
package/dist/agent/processors.d.ts +146 -0
package/dist/agent/processors.d.ts.map +1 -0
package/dist/agent/processors.js +122 -0
package/dist/agent/processors.js.map +1 -0
package/dist/agent/production-agent.d.ts +25 -0
package/dist/agent/production-agent.d.ts.map +1 -1
package/dist/agent/production-agent.js +341 -1
package/dist/agent/production-agent.js.map +1 -1
package/dist/agent/run-loop-with-resume.d.ts.map +1 -1
package/dist/agent/run-loop-with-resume.js +48 -0
package/dist/agent/run-loop-with-resume.js.map +1 -1
package/dist/agent/run-store.d.ts +17 -0
package/dist/agent/run-store.d.ts.map +1 -1
package/dist/agent/run-store.js +55 -0
package/dist/agent/run-store.js.map +1 -1
package/dist/agent/runtime-context.d.ts +30 -0
package/dist/agent/runtime-context.d.ts.map +1 -1
package/dist/agent/runtime-context.js +54 -1
package/dist/agent/runtime-context.js.map +1 -1
package/dist/agent/tool-call-journal.d.ts +99 -0
package/dist/agent/tool-call-journal.d.ts.map +1 -0
package/dist/agent/tool-call-journal.js +212 -0
package/dist/agent/tool-call-journal.js.map +1 -0
package/dist/agent/types.d.ts +35 -0
package/dist/agent/types.d.ts.map +1 -1
package/dist/agent/types.js.map +1 -1
package/dist/cli/add.d.ts +109 -0
package/dist/cli/add.d.ts.map +1 -0
package/dist/cli/add.js +352 -0
package/dist/cli/add.js.map +1 -0
package/dist/cli/connect.d.ts +2 -2
package/dist/cli/connect.d.ts.map +1 -1
package/dist/cli/connect.js +92 -24
package/dist/cli/connect.js.map +1 -1
package/dist/cli/eval.d.ts +17 -0
package/dist/cli/eval.d.ts.map +1 -0
package/dist/cli/eval.js +121 -0
package/dist/cli/eval.js.map +1 -0
package/dist/cli/index.js +44 -3
package/dist/cli/index.js.map +1 -1
package/dist/cli/mcp.d.ts.map +1 -1
package/dist/cli/mcp.js +11 -5
package/dist/cli/mcp.js.map +1 -1
package/dist/cli/plan-local.d.ts +66 -5
package/dist/cli/plan-local.d.ts.map +1 -1
package/dist/cli/plan-local.js +622 -21
package/dist/cli/plan-local.js.map +1 -1
package/dist/cli/skills.d.ts +2 -2
package/dist/cli/skills.d.ts.map +1 -1
package/dist/cli/skills.js +108 -62
package/dist/cli/skills.js.map +1 -1
package/dist/client/AssistantChat.d.ts.map +1 -1
package/dist/client/AssistantChat.js +118 -92
package/dist/client/AssistantChat.js.map +1 -1
package/dist/client/agent-chat-adapter.d.ts.map +1 -1
package/dist/client/agent-chat-adapter.js +16 -0
package/dist/client/agent-chat-adapter.js.map +1 -1
package/dist/client/chat/tool-call-display.d.ts +20 -1
package/dist/client/chat/tool-call-display.d.ts.map +1 -1
package/dist/client/chat/tool-call-display.js +32 -7
package/dist/client/chat/tool-call-display.js.map +1 -1
package/dist/client/sse-event-processor.d.ts +13 -0
package/dist/client/sse-event-processor.d.ts.map +1 -1
package/dist/client/sse-event-processor.js +21 -0
package/dist/client/sse-event-processor.js.map +1 -1
package/dist/coding-tools/run-code.d.ts.map +1 -1
package/dist/coding-tools/run-code.js +18 -2
package/dist/coding-tools/run-code.js.map +1 -1
package/dist/db/client.d.ts +4 -2
package/dist/db/client.d.ts.map +1 -1
package/dist/db/client.js +6 -4
package/dist/db/client.js.map +1 -1
package/dist/deploy/route-discovery.d.ts.map +1 -1
package/dist/deploy/route-discovery.js +1 -0
package/dist/deploy/route-discovery.js.map +1 -1
package/dist/eval/agent-runner.d.ts +63 -0
package/dist/eval/agent-runner.d.ts.map +1 -0
package/dist/eval/agent-runner.js +142 -0
package/dist/eval/agent-runner.js.map +1 -0
package/dist/eval/define-eval.d.ts +29 -0
package/dist/eval/define-eval.d.ts.map +1 -0
package/dist/eval/define-eval.js +43 -0
package/dist/eval/define-eval.js.map +1 -0
package/dist/eval/index.d.ts +18 -0
package/dist/eval/index.d.ts.map +1 -0
package/dist/eval/index.js +17 -0
package/dist/eval/index.js.map +1 -0
package/dist/eval/report.d.ts +8 -0
package/dist/eval/report.d.ts.map +1 -0
package/dist/eval/report.js +44 -0
package/dist/eval/report.js.map +1 -0
package/dist/eval/runner.d.ts +67 -0
package/dist/eval/runner.d.ts.map +1 -0
package/dist/eval/runner.js +256 -0
package/dist/eval/runner.js.map +1 -0
package/dist/eval/scorer.d.ts +83 -0
package/dist/eval/scorer.d.ts.map +1 -0
package/dist/eval/scorer.js +195 -0
package/dist/eval/scorer.js.map +1 -0
package/dist/eval/types.d.ts +162 -0
package/dist/eval/types.d.ts.map +1 -0
package/dist/eval/types.js +20 -0
package/dist/eval/types.js.map +1 -0
package/dist/extensions/fetch-tool.d.ts.map +1 -1
package/dist/extensions/fetch-tool.js +80 -15
package/dist/extensions/fetch-tool.js.map +1 -1
package/dist/extensions/web-content.d.ts +61 -0
package/dist/extensions/web-content.d.ts.map +1 -0
package/dist/extensions/web-content.js +468 -0
package/dist/extensions/web-content.js.map +1 -0
package/dist/extensions/web-search-tool.js +3 -3
package/dist/extensions/web-search-tool.js.map +1 -1
package/dist/mcp/build-server.d.ts.map +1 -1
package/dist/mcp/build-server.js +4 -1
package/dist/mcp/build-server.js.map +1 -1
package/dist/observability/traces.d.ts.map +1 -1
package/dist/observability/traces.js +100 -1
package/dist/observability/traces.js.map +1 -1
package/dist/observability/tracing.d.ts +73 -0
package/dist/observability/tracing.d.ts.map +1 -0
package/dist/observability/tracing.js +126 -0
package/dist/observability/tracing.js.map +1 -0
package/dist/onboarding/default-steps.d.ts.map +1 -1
package/dist/onboarding/default-steps.js +4 -1
package/dist/onboarding/default-steps.js.map +1 -1
package/dist/provider-api/actions/query-staged-dataset.d.ts +1 -1
package/dist/provider-api/corpus-jobs.d.ts +80 -0
package/dist/provider-api/corpus-jobs.d.ts.map +1 -1
package/dist/provider-api/corpus-jobs.js +219 -22
package/dist/provider-api/corpus-jobs.js.map +1 -1
package/dist/provider-api/index.d.ts +24 -32
package/dist/provider-api/index.d.ts.map +1 -1
package/dist/provider-api/index.js +28 -1
package/dist/provider-api/index.js.map +1 -1
package/dist/scripts/agent-engines/list-agent-engines.d.ts.map +1 -1
package/dist/scripts/agent-engines/list-agent-engines.js +10 -3
package/dist/scripts/agent-engines/list-agent-engines.js.map +1 -1
package/dist/server/action-discovery.d.ts.map +1 -1
package/dist/server/action-discovery.js +4 -0
package/dist/server/action-discovery.js.map +1 -1
package/dist/server/agent-chat-plugin.d.ts +9 -0
package/dist/server/agent-chat-plugin.d.ts.map +1 -1
package/dist/server/agent-chat-plugin.js +119 -111
package/dist/server/agent-chat-plugin.js.map +1 -1
package/dist/server/agent-teams.d.ts +62 -0
package/dist/server/agent-teams.d.ts.map +1 -1
package/dist/server/agent-teams.js +99 -2
package/dist/server/agent-teams.js.map +1 -1
package/dist/server/better-auth-instance.d.ts +7 -0
package/dist/server/better-auth-instance.d.ts.map +1 -1
package/dist/server/better-auth-instance.js +90 -0
package/dist/server/better-auth-instance.js.map +1 -1
package/dist/server/core-routes-plugin.d.ts.map +1 -1
package/dist/server/core-routes-plugin.js +7 -4
package/dist/server/core-routes-plugin.js.map +1 -1
package/dist/server/credential-provider.d.ts.map +1 -1
package/dist/server/credential-provider.js +2 -0
package/dist/server/credential-provider.js.map +1 -1
package/dist/server/deep-link.d.ts +7 -0
package/dist/server/deep-link.d.ts.map +1 -1
package/dist/server/deep-link.js +13 -2
package/dist/server/deep-link.js.map +1 -1
package/dist/server/framework-request-handler.d.ts.map +1 -1
package/dist/server/framework-request-handler.js +33 -1
package/dist/server/framework-request-handler.js.map +1 -1
package/dist/server/index.d.ts +2 -1
package/dist/server/index.d.ts.map +1 -1
package/dist/server/index.js +2 -1
package/dist/server/index.js.map +1 -1
package/dist/templates/default/.agents/skills/actions/SKILL.md +52 -1
package/dist/templates/default/.agents/skills/security/SKILL.md +22 -0
package/dist/templates/workspace-core/.agents/skills/actions/SKILL.md +52 -1
package/dist/templates/workspace-core/.agents/skills/external-agents/SKILL.md +16 -4
package/dist/templates/workspace-core/.agents/skills/harness-agents/SKILL.md +20 -0
package/dist/templates/workspace-core/.agents/skills/observability/SKILL.md +31 -0
package/dist/templates/workspace-core/.agents/skills/security/SKILL.md +22 -0
package/docs/content/actions.md +50 -0
package/docs/content/agent-teams.md +32 -0
package/docs/content/blueprint-installer.md +73 -0
package/docs/content/durable-resume.md +49 -0
package/docs/content/evals.md +141 -0
package/docs/content/external-agents.md +2 -2
package/docs/content/human-approval.md +101 -0
package/docs/content/observability.md +21 -0
package/docs/content/observational-memory.md +63 -0
package/docs/content/plan-plugin.md +5 -0
package/docs/content/pr-visual-recap.md +9 -5
package/docs/content/processors.md +99 -0
package/docs/content/sandbox-adapters.md +134 -0
package/docs/content/template-plan.md +97 -21
package/package.json +10 -1
package/src/templates/default/.agents/skills/actions/SKILL.md +52 -1
package/src/templates/default/.agents/skills/security/SKILL.md +22 -0
package/src/templates/workspace-core/.agents/skills/actions/SKILL.md +52 -1
package/src/templates/workspace-core/.agents/skills/external-agents/SKILL.md +16 -4
package/src/templates/workspace-core/.agents/skills/harness-agents/SKILL.md +20 -0
package/src/templates/workspace-core/.agents/skills/observability/SKILL.md +31 -0
package/src/templates/workspace-core/.agents/skills/security/SKILL.md +22 -0

package/src/templates/default/.agents/skills/actions/SKILL.md CHANGED Viewed

@@ -112,7 +112,10 @@ action trio instead:
   docs/spec URLs, placeholders, and examples without exposing secrets.
 - `provider-api-docs`: fetches public provider docs/spec/changelog URLs when
   the exact endpoint, filter operator, payload shape, or pagination contract is
-  uncertain. Registered docs URLs are curated starting points.
+  uncertain. Registered docs URLs are curated starting points. Use
+  `responseMode: "markdown"` for clean readable docs, or
+  `responseMode: "matches"` with `search: { query | terms | regex }` for
+  compact snippets instead of flooding context with raw HTML.
 - `provider-api-request`: makes a constrained authenticated HTTP request to the
   provider host, injects configured credentials, blocks private/internal URLs,
   and redacts secrets.
@@ -151,6 +154,12 @@ pagination status, truncation, failed pages, and uncovered gaps. They must not
 turn default limits, sampled rows, truncated excerpts, or aborted calls into a
 confident "none found", "all records", or exhaustive conclusion.
+For public web pages and docs, prefer the token-efficient path: `web-search`
+to find likely URLs, `web-request` or `provider-api-docs` with clean
+`responseMode` output to read a page, and `run-code` with `webRead()` /
+`webFetch()` when you need to grep, aggregate, or compare many pages before
+returning a small result.
 ### The `http` Option
 Controls how the action is exposed as an HTTP endpoint:
@@ -195,6 +204,48 @@ run: async (args) => {
 }
 ```
+### Validating Return Values (`outputSchema`)
+`schema` validates inputs; `outputSchema` validates what the action **returns**. Pass any Standard Schema-compatible schema (Zod, Valibot, ArkType) and the framework validates the result _after_ `run()` resolves — input is validated before `run`, output after.
+```ts
+export default defineAction({
+  description: "Summarize a thread.",
+  schema: z.object({ threadId: z.string() }),
+  outputSchema: z.object({ summary: z.string(), messageCount: z.number() }),
+  outputErrorStrategy: "warn", // default; "strict" | "fallback"
+  // outputFallback: { summary: "", messageCount: 0 }, // used only by "fallback"
+  run: async ({ threadId }) => {
+    /* ... */
+  },
+});
+```
+- `"warn"` (default) — `console.warn` the issues and return the **original** result unchanged. Non-breaking.
+- `"strict"` — throw a clear error so a buggy action surfaces loudly.
+- `"fallback"` — return `outputFallback` in place of the invalid result.
+On success the validated value is returned, so coercion/defaults on `outputSchema` apply. Omit `outputSchema` and behavior is byte-for-byte unchanged (no wrapping).
+### Human-in-the-Loop Approval (`needsApproval`)
+For high-consequence, outward-facing, hard-to-undo actions (sending an email, charging a card, deleting an account), set `needsApproval` so the agent **cannot** run the action without a human approving the specific call:
+```ts
+export default defineAction({
+  description: "Send an email via Gmail.",
+  schema: z.object({ to: z.string(), subject: z.string(), body: z.string() }),
+  needsApproval: true, // boolean, or (args, ctx) => boolean | Promise<boolean>
+  run: async (args) => {
+    /* ...actually send... */
+  },
+});
+```
+When the gate is truthy and the call isn't yet approved, the loop emits an `approval_required` event and **stops the turn — `run()` never executes**. A predicate gates conditionally (e.g. only external recipients) and **fails closed**: a throw is treated as "approval required". The human approves via the chat UI's Approve affordance, which re-issues the turn with the call's `approvalKey`, and only then does the action run.
+**Keep approvals rare** — the default is off and almost every action should leave it off. The canonical example is Mail's `send-email` (`needsApproval: true`). See the `security` skill and the Human Approval doc.
 ## Frontend Hooks
 The frontend calls actions using React Query hooks from `@agent-native/core/client`. Components should not hand-write `fetch("/_agent-native/actions/...")`; add or reuse a client hook/helper instead. Use `callAction` from the same package for imperative cases that do not fit a hook, such as debounced search, prefetching, or non-React event handlers.

package/src/templates/default/.agents/skills/security/SKILL.md CHANGED Viewed

@@ -139,6 +139,28 @@ export default defineEventHandler(async (event) => {
 - Never create unprotected routes that modify data.
+## Human-in-the-Loop Approval for High-Consequence Actions
+For a small set of outward-facing, hard-to-undo operations — sending an email, charging a card, deleting an account, posting publicly — auth and access control are necessary but not sufficient: you also do not want the **agent** to perform them autonomously. Set `needsApproval` on the `defineAction` so the agent cannot run the action without a human approving the specific call.
+```ts
+export default defineAction({
+  description: "Send an email via Gmail.",
+  schema: z.object({ to: z.string(), subject: z.string(), body: z.string() }),
+  needsApproval: true, // or (args, ctx) => boolean | Promise<boolean>
+  run: async (args) => {
+    /* ...actually send... */
+  },
+});
+```
+When the gate is truthy and the call is not yet approved, the loop emits an `approval_required` event and **stops the turn — `run()` never executes**. The human approves via the chat UI's Approve affordance, which re-issues the turn with the call's stable `approvalKey`; only then does the action run. A predicate gates conditionally (e.g. only external recipients) and **fails closed** — a throw is treated as "approval required".
+Rules:
+- Reach for `needsApproval` only for genuinely high-consequence operations. The default is off, and the framework intentionally keeps approvals rare — over-gating turns the agent into a click-through wizard. The canonical (and intentionally lone) framework example is Mail's `send-email`.
+- `needsApproval` is **not** a substitute for `accessFilter` / `assertAccess` or for hiding sensitive operations from the model with `agentTool: false` / `toolCallable: false`. It is the layer for "a human must explicitly bless this specific outward-facing call," not for scoping data. See the `actions` skill for the full surface.
 ## Custom HTTP Routes Must Apply Access Control Themselves
 This is the single most-failed rule in the codebase. Auto-mounted action routes (`/_agent-native/actions/...`) get a request context wired up automatically. **Hand-written `/api/*` Nitro routes do not.** If your handler queries an ownable resource (any table with `...ownableColumns()`), you MUST:

package/src/templates/workspace-core/.agents/skills/actions/SKILL.md CHANGED Viewed

@@ -112,7 +112,10 @@ action trio instead:
   docs/spec URLs, placeholders, and examples without exposing secrets.
 - `provider-api-docs`: fetches public provider docs/spec/changelog URLs when
   the exact endpoint, filter operator, payload shape, or pagination contract is
-  uncertain. Registered docs URLs are curated starting points.
+  uncertain. Registered docs URLs are curated starting points. Use
+  `responseMode: "markdown"` for clean readable docs, or
+  `responseMode: "matches"` with `search: { query | terms | regex }` for
+  compact snippets instead of flooding context with raw HTML.
 - `provider-api-request`: makes a constrained authenticated HTTP request to the
   provider host, injects configured credentials, blocks private/internal URLs,
   and redacts secrets.
@@ -151,6 +154,12 @@ pagination status, truncation, failed pages, and uncovered gaps. They must not
 turn default limits, sampled rows, truncated excerpts, or aborted calls into a
 confident "none found", "all records", or exhaustive conclusion.
+For public web pages and docs, prefer the token-efficient path: `web-search`
+to find likely URLs, `web-request` or `provider-api-docs` with clean
+`responseMode` output to read a page, and `run-code` with `webRead()` /
+`webFetch()` when you need to grep, aggregate, or compare many pages before
+returning a small result.
 ### The `http` Option
 Controls how the action is exposed as an HTTP endpoint:
@@ -195,6 +204,48 @@ run: async (args) => {
 }
 ```
+### Validating Return Values (`outputSchema`)
+`schema` validates inputs; `outputSchema` validates what the action **returns**. Pass any Standard Schema-compatible schema (Zod, Valibot, ArkType) and the framework validates the result _after_ `run()` resolves — input is validated before `run`, output after.
+```ts
+export default defineAction({
+  description: "Summarize a thread.",
+  schema: z.object({ threadId: z.string() }),
+  outputSchema: z.object({ summary: z.string(), messageCount: z.number() }),
+  outputErrorStrategy: "warn", // default; "strict" | "fallback"
+  // outputFallback: { summary: "", messageCount: 0 }, // used only by "fallback"
+  run: async ({ threadId }) => {
+    /* ... */
+  },
+});
+```
+- `"warn"` (default) — `console.warn` the issues and return the **original** result unchanged. Non-breaking.
+- `"strict"` — throw a clear error so a buggy action surfaces loudly.
+- `"fallback"` — return `outputFallback` in place of the invalid result.
+On success the validated value is returned, so coercion/defaults on `outputSchema` apply. Omit `outputSchema` and behavior is byte-for-byte unchanged (no wrapping).
+### Human-in-the-Loop Approval (`needsApproval`)
+For high-consequence, outward-facing, hard-to-undo actions (sending an email, charging a card, deleting an account), set `needsApproval` so the agent **cannot** run the action without a human approving the specific call:
+```ts
+export default defineAction({
+  description: "Send an email via Gmail.",
+  schema: z.object({ to: z.string(), subject: z.string(), body: z.string() }),
+  needsApproval: true, // boolean, or (args, ctx) => boolean | Promise<boolean>
+  run: async (args) => {
+    /* ...actually send... */
+  },
+});
+```
+When the gate is truthy and the call isn't yet approved, the loop emits an `approval_required` event and **stops the turn — `run()` never executes**. A predicate gates conditionally (e.g. only external recipients) and **fails closed**: a throw is treated as "approval required". The human approves via the chat UI's Approve affordance, which re-issues the turn with the call's `approvalKey`, and only then does the action run.
+**Keep approvals rare** — the default is off and almost every action should leave it off. The canonical example is Mail's `send-email` (`needsApproval: true`). See the `security` skill and the Human Approval doc.
 ## Frontend Hooks
 The frontend calls actions using React Query hooks from `@agent-native/core/client`. Components should not hand-write `fetch("/_agent-native/actions/...")`; add or reuse a client hook/helper instead. Use `callAction` from the same package for imperative cases that do not fit a hook, such as debounced search, prefetching, or non-React event handlers.

package/src/templates/workspace-core/.agents/skills/external-agents/SKILL.md CHANGED Viewed

@@ -197,7 +197,7 @@ path is obvious.
 `defineAction` accepts an optional `link` builder. When set, every MCP/A2A
 result for that tool auto-appends a markdown `[label →](absoluteUrl)` block and
 a structured `_meta["agent-native/openLink"] = { label, view, webUrl,
-desktopUrl }`; `tools/list` adds
+desktopUrl, vscodeUrl }`; `tools/list` adds
 `annotations["agent-native/producesOpenLink"]` plus a description suffix so the
 external agent knows the tool yields an openable link.
@@ -285,9 +285,11 @@ ngrok/prod testing caveats are documented in
 `buildDeepLink(...)` returns the app-relative path
 `/_agent-native/open?app=…&view=…&<recordId>=…`. The MCP layer turns that into
-an absolute web URL (`toAbsoluteOpenUrl`, using the request origin) and a
-desktop `agentnative://open?…` URL (`toDesktopOpenUrl`). When the user clicks
-it in any browser or inline webview, `GET /_agent-native/open`
+an absolute web URL (`toAbsoluteOpenUrl`, using the request origin), a
+desktop `agentnative://open?…` URL (`toDesktopOpenUrl`), and a VS Code
+extension URL (`toVsCodeOpenUrl`) for
+`vscode://builderio.agent-native/open?url=…`. When the user clicks the web
+link in any browser or inline webview, `GET /_agent-native/open`
 (`createOpenRouteHandler`, mounted by the core routes plugin, gated by
 `disableOpenRoute`, customizable via `resolveOpenPath`):
@@ -416,3 +418,13 @@ before telling the user they are unauthenticated.
 - **a2a-protocol** — the `ask-agent` meta-tool and JSON-RPC peer calls
 - **adding-a-feature** — the four-area checklist (add a `link` builder when a
   feature produces a navigable resource)
+## Blueprint installer
+To add a whole new integration the agent-native way, run `agent-native add <kind>
+<name|url>`. It prints a curated Markdown blueprint to stdout — pipe it into the
+external coding agent you connected (`agent-native add provider stripe |
+claude`) and it applies the changes against the live repo. A URL emits a
+generic research-and-integrate blueprint instead. Seeded kinds:
+`provider` / `channel` / `sandbox` / `action`. Add your own by dropping a
+`.md` in `packages/core/blueprints/<kind>/`. See the Blueprint Installer doc.

package/src/templates/workspace-core/.agents/skills/harness-agents/SKILL.md CHANGED Viewed

@@ -80,6 +80,26 @@ existing run routes as `goalId=agent-harness`.
   Preserve `defineAction` auth, request context, timeouts, truncation, and
   read-only metadata.
+## Code Execution Sandbox
+- The `run-code` tool executes through a pluggable `SandboxAdapter`
+  (`packages/core/src/coding-tools/sandbox/`). The default
+  `LocalChildProcessAdapter` spawns a locked-down local Node child process;
+  swap it via `AGENT_NATIVE_SANDBOX` or `registerSandboxAdapter()` for a
+  Docker/remote/durable backend (the lever to exceed the hosted ~40s code-exec
+  ceiling). An adapter only runs the already-prepared, non-secret module source
+  — it never sees app secrets. See the Sandbox Adapters doc; `agent-native add
+  sandbox docker` emits a full Docker-adapter recipe.
+## Sub-Agent Delegation Depth
+- Sub-agent spawning is capped server-side (default depth `2`) so delegation
+  chains can't fan out indefinitely. Override at deploy time with
+  `AGENT_NATIVE_MAX_SUBAGENT_DEPTH` (`0` disables sub-agents; clamped to `16`).
+  Enforcement is ambient via `evaluateSubagentDepth` in
+  `packages/core/src/server/agent-teams.ts` — independent of any tool-level
+  guard. See the Agent Teams doc for the depth model.
 ## Don't
 - Don't add Claude Code, Codex, Cursor, Mastra, or Pi as an `AgentEngine`.

package/src/templates/workspace-core/.agents/skills/observability/SKILL.md CHANGED Viewed

@@ -75,6 +75,26 @@ const criteria: EvalCriteria = {
 };
 ```
+#### Evals (CI gate)
+The three layers above score *real production runs* after the fact. For an active, deterministic gate, use the first-class `*.eval.ts` primitive from `@agent-native/core/eval` (source: `packages/core/src/eval/*`). It runs the actual agent loop against fixed inputs and exits non-zero below threshold, so it gates CI/deploys.
+```ts
+// evals/faq.eval.ts
+import { defineEval, contains, llmJudge } from "@agent-native/core/eval";
+export default defineEval({
+  name: "answers the FAQ",
+  input: { prompt: "What is your return policy?" },
+  threshold: 0.7,
+  scorers: [contains("30 days"), llmJudge({ criteria: "accuracy" })],
+});
+```
+- Built-in scorers: `exactMatch` / `contains` / `usesTool` (pure JS) and `llmJudge` (provider-agnostic judge).
+- Custom scorers: `createScorer` with the 4-step `preprocess → analyze → generateScore → generateReason` pipeline (only `generateScore` is required).
+- Run as a gate: `agent-native eval [pattern] [--json] [--threshold N]` — discovers `**/*.eval.ts` and `evals/*.ts`, runs the agent, and exits non-zero if any eval is below its threshold. An app with no eval files exits `0`. Complements (does not replace) the post-hoc scoring in `evals.ts`. See the Evals doc.
 ### 4. Experiments
 A/B testing with sticky user-level assignment:
@@ -200,3 +220,14 @@ await putSetting("observability-config", {
 ```
 The framework emits `gen_ai.*` semantic convention spans compatible with Langfuse, Datadog, Grafana, New Relic, and any OTel-compatible backend.
+## Live OpenTelemetry Spans (Optional)
+Separate from the `exporters` config above (which ships the in-house traces to an OTLP endpoint), the agent loop can also emit **live OpenTelemetry spans** for every run, model call, and tool call, so a host that already runs an OTel collector sees agent activity alongside its other distributed traces.
+This layer is optional and **no-op by default**:
+- `@opentelemetry/api` is an **optional dependency**. If it isn't installed, the span helpers degrade to silent no-ops — they never throw into the agent loop.
+- Even with the API package installed, spans stay no-ops at first, because `@opentelemetry/api` ships only a default no-op tracer. Spans become real only once the **host registers a `TracerProvider`** (via `@opentelemetry/sdk-node` or similar). The framework deliberately does not depend on the heavy SDK/exporter packages and never registers a provider itself — instrumentation is opt-in by the embedding app.
+The loop emits `agent.run` (with `agent.run_id`, `agent.thread_id`, `agent.user_id`, `agent.model`), `tool.call` (`tool.name` + status), and `llm.call` spans, each finished with OK/ERROR status. This is purely additive to the in-house `agent_trace_spans` / `agent_trace_summaries` tables. Source: `packages/core/src/observability/tracing.ts` + `traces.ts`. See the Observability doc for the full table.

package/src/templates/workspace-core/.agents/skills/security/SKILL.md CHANGED Viewed

@@ -139,6 +139,28 @@ export default defineEventHandler(async (event) => {
 - Never create unprotected routes that modify data.
+## Human-in-the-Loop Approval for High-Consequence Actions
+For a small set of outward-facing, hard-to-undo operations — sending an email, charging a card, deleting an account, posting publicly — auth and access control are necessary but not sufficient: you also do not want the **agent** to perform them autonomously. Set `needsApproval` on the `defineAction` so the agent cannot run the action without a human approving the specific call.
+```ts
+export default defineAction({
+  description: "Send an email via Gmail.",
+  schema: z.object({ to: z.string(), subject: z.string(), body: z.string() }),
+  needsApproval: true, // or (args, ctx) => boolean | Promise<boolean>
+  run: async (args) => {
+    /* ...actually send... */
+  },
+});
+```
+When the gate is truthy and the call is not yet approved, the loop emits an `approval_required` event and **stops the turn — `run()` never executes**. The human approves via the chat UI's Approve affordance, which re-issues the turn with the call's stable `approvalKey`; only then does the action run. A predicate gates conditionally (e.g. only external recipients) and **fails closed** — a throw is treated as "approval required".
+Rules:
+- Reach for `needsApproval` only for genuinely high-consequence operations. The default is off, and the framework intentionally keeps approvals rare — over-gating turns the agent into a click-through wizard. The canonical (and intentionally lone) framework example is Mail's `send-email`.
+- `needsApproval` is **not** a substitute for `accessFilter` / `assertAccess` or for hiding sensitive operations from the model with `agentTool: false` / `toolCallable: false`. It is the layer for "a human must explicitly bless this specific outward-facing call," not for scoping data. See the `actions` skill for the full surface.
 ## Custom HTTP Routes Must Apply Access Control Themselves
 This is the single most-failed rule in the codebase. Auto-mounted action routes (`/_agent-native/actions/...`) get a request context wired up automatically. **Hand-written `/api/*` Nitro routes do not.** If your handler queries an ownable resource (any table with `...ownableColumns()`), you MUST: