npm - @wrongstack/core - Versions diffs - 0.148.0 → 0.155.0 - Mend

@wrongstack/core 0.148.0 → 0.155.0

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (50)

package/dist/{agent-bridge-r9y6gdn4.d.ts → agent-bridge-BbZU5TPN.d.ts} +1 -1
package/dist/{agent-subagent-runner-1GeQE_L0.d.ts → agent-subagent-runner-Bsueu0J2.d.ts} +2 -2
package/dist/{brain-Cp_3GIS2.d.ts → brain-CS_B0vIE.d.ts} +2 -0
package/dist/coordination/index.d.ts +7 -7
package/dist/coordination/index.js +143 -6
package/dist/coordination/index.js.map +1 -1
package/dist/defaults/index.d.ts +13 -13
package/dist/defaults/index.js +223 -65
package/dist/defaults/index.js.map +1 -1
package/dist/execution/index.d.ts +6 -6
package/dist/execution/index.js +143 -6
package/dist/execution/index.js.map +1 -1
package/dist/extension/index.d.ts +2 -2
package/dist/{goal-preamble-CYJLg0wk.d.ts → goal-preamble-CbV8pXLD.d.ts} +3 -3
package/dist/{index-CPweVoFM.d.ts → index-B5wz-GXm.d.ts} +1 -1
package/dist/{index-BZdezm3g.d.ts → index-CI1hRfPt.d.ts} +2 -2
package/dist/index.d.ts +22 -22
package/dist/index.js +233 -70
package/dist/index.js.map +1 -1
package/dist/infrastructure/index.d.ts +3 -3
package/dist/infrastructure/index.js +11 -2
package/dist/infrastructure/index.js.map +1 -1
package/dist/kernel/index.d.ts +3 -3
package/dist/kernel/index.js.map +1 -1
package/dist/{mcp-servers-Bl5LTvQg.d.ts → mcp-servers-CPERR2De.d.ts} +8 -1
package/dist/{multi-agent-coordinator-QWEzJDlm.d.ts → multi-agent-coordinator-BSKSFNhv.d.ts} +1 -1
package/dist/{null-fleet-bus-BUyfqh23.d.ts → null-fleet-bus-CGOez8Le.d.ts} +4 -4
package/dist/observability/index.d.ts +1 -1
package/dist/{parallel-eternal-engine-C75QuhAI.d.ts → parallel-eternal-engine-CYoTKjsz.d.ts} +4 -4
package/dist/{path-resolver-DRjQBkoO.d.ts → path-resolver-DuhlmPil.d.ts} +1 -1
package/dist/{plan-templates-CkKNPU3I.d.ts → plan-templates-DbH7lg-t.d.ts} +2 -2
package/dist/{provider-runner-BNpuIyOL.d.ts → provider-runner-Cocq0O9E.d.ts} +1 -1
package/dist/sdd/index.d.ts +3 -3
package/dist/sdd/index.js +143 -6
package/dist/sdd/index.js.map +1 -1
package/dist/{secret-vault-DoISxaKO.d.ts → secret-vault-BJDY28ev.d.ts} +7 -1
package/dist/{secret-vault-BTcC_T5v.d.ts → secret-vault-w8MbUe2Q.d.ts} +1 -1
package/dist/security/index.d.ts +2 -2
package/dist/security/index.js +59 -22
package/dist/security/index.js.map +1 -1
package/dist/storage/index.d.ts +5 -5
package/dist/storage/index.js +76 -42
package/dist/storage/index.js.map +1 -1
package/dist/types/index.d.ts +11 -11
package/dist/types/index.js +59 -22
package/dist/types/index.js.map +1 -1
package/dist/utils/index.d.ts +65 -1
package/dist/utils/index.js +61 -2
package/dist/utils/index.js.map +1 -1
package/package.json +1 -1

package/dist/sdd/index.js CHANGED Viewed

@@ -2987,6 +2987,7 @@ var SubagentBudget = class _SubagentBudget {
 function makeAgentSubagentRunner(opts) {
   const format = opts.formatTaskInput ?? defaultFormatTaskInput;
   return async (task, ctx) => {
+    const taskStartedAt = Date.now();
     const factoryResult = await opts.factory(ctx.config);
     const { agent, events } = factoryResult;
     const detachFleet = opts.fleetBus?.attach(ctx.subagentId, events, task.id);
@@ -3083,7 +3084,7 @@ function makeAgentSubagentRunner(opts) {
       }),
       events.on("provider.text_delta", (e) => {
         ctx.budget.markActivity();
-        streamingTextAcc = (streamingTextAcc + e.text).slice(-200);
+        streamingTextAcc = (streamingTextAcc + e.text).slice(-2e3);
       })
     );
     const onParentAbort = () => aborter.abort();
@@ -3091,6 +3092,15 @@ function makeAgentSubagentRunner(opts) {
     let result;
     try {
       result = await agent.run(format(task, ctx.config), { signal: aborter.signal });
+      events.emit("subagent.task_completed", {
+        subagentId: ctx.subagentId,
+        taskId: task.id,
+        status: result.status === "done" ? "success" : "failed",
+        iterations: result.iterations,
+        toolCalls: ctx.budget.usage().toolCalls,
+        durationMs: Date.now() - taskStartedAt,
+        finalText: result.finalText?.trim() || void 0
+      });
     } finally {
       detachFleet?.();
       ctx.signal.removeEventListener("abort", onParentAbort);
@@ -4175,15 +4185,44 @@ Working rules:
       id: "e2e",
       name: "E2E",
       role: "e2e",
-      tools: [...TOOLS.build, "fetch"],
+      tools: [
+        ...TOOLS.build,
+        "fetch",
+        "playwright_navigate",
+        "playwright_screenshot",
+        "playwright_click",
+        "playwright_type",
+        "playwright_evaluate",
+        "playwright_select_option",
+        "playwright_hover",
+        "playwright_fill_form",
+        "playwright_wait_for",
+        "playwright_press_key",
+        "playwright_drag"
+      ],
       prompt: `You are the E2E agent. Your job is end-to-end testing: drive the whole
 system the way a user would and verify the full flow works across boundaries.
 Scope:
 - Author end-to-end scenarios that exercise real user journeys
 - Drive UI/CLI/API across process and network boundaries
+- Use Playwright browser tools (navigate, click, type, screenshot, evaluate)
+  to automate web UI flows \u2014 open pages, interact with forms, capture evidence
 - Set up and tear down realistic test state
-- Capture failures with enough detail to reproduce (screenshots, logs)
+- Capture failures with enough detail to reproduce (screenshots, logs, page HTML)
+Playwright tools available (require the "playwright" MCP server to be enabled):
+  playwright_navigate(url)     \u2014 open a page at the given URL
+  playwright_screenshot()      \u2014 capture a full-page or viewport screenshot
+  playwright_click(selector)   \u2014 click on an element matching a CSS selector
+  playwright_type(selector, text) \u2014 type text into a focused input element
+  playwright_evaluate(script)  \u2014 run arbitrary JavaScript in the page context
+  playwright_select_option(selector, value) \u2014 pick a <select> dropdown option
+  playwright_hover(selector)   \u2014 hover the mouse over an element
+  playwright_fill_form(fields) \u2014 fill multiple form fields in one call
+  playwright_wait_for(selector) \u2014 block until an element appears on the page
+  playwright_press_key(key)    \u2014 press a keyboard key (Enter, Tab, Escape, \u2026)
+  playwright_drag(from, to)    \u2014 drag an element from one selector to another
 Input format you accept:
 { "task": "scenario | smoke | journey", "flow": "<user journey>", "surface": "ui | cli | api" }
@@ -4197,8 +4236,10 @@ Output: Markdown e2e report:
 Working rules:
 - Test the real flow end to end; don't stub the thing under test
 - Make scenarios deterministic \u2014 control time, randomness, and external state
-- On failure, capture artifacts (logs/screenshots) for reproduction
-- Keep scenarios independent so one failure doesn't cascade`
+- On failure, capture artifacts (screenshots, page HTML, logs) for reproduction
+- Keep scenarios independent so one failure doesn't cascade
+- For browser tests: playwright_navigate first, then interact, then playwright_screenshot as evidence
+- If playwright tools are unavailable, report it and fall back to API/CLI testing`
     },
     budget: HEAVY_BUDGET,
     capability: {
@@ -4211,10 +4252,106 @@ Working rules:
         "user journey",
         "smoke test",
         "playwright",
+        "browser",
+        "screenshot",
+        "web ui",
+        "headless",
         "cypress",
         "full flow",
         "browser test",
-        "acceptance test"
+        "acceptance test",
+        "navigate",
+        "click",
+        "form fill",
+        "dom",
+        "page load"
+      ]
+    }
+  },
+  {
+    config: {
+      id: "browser",
+      name: "Browser",
+      role: "browser",
+      tools: [
+        ...TOOLS.read,
+        "fetch",
+        "playwright_navigate",
+        "playwright_screenshot",
+        "playwright_click",
+        "playwright_type",
+        "playwright_evaluate",
+        "playwright_select_option",
+        "playwright_hover",
+        "playwright_fill_form",
+        "playwright_wait_for",
+        "playwright_press_key",
+        "playwright_drag"
+      ],
+      prompt: `You are the Browser agent. Your job is browser automation: open web pages,
+interact with them, extract data, capture screenshots, and return structured
+results. You are a read-focused agent \u2014 you drive the browser, not the filesystem.
+Scope:
+- Navigate to URLs and wait for pages to load
+- Take full-page or element screenshots as evidence
+- Click buttons, fill forms, select options, type text \u2014 full user simulation
+- Extract page content: text, HTML, element attributes, data tables
+- Evaluate JavaScript in the page context to extract structured data
+- Verify visual state (element visibility, text content, attribute values)
+Playwright tools available (require the "playwright" MCP server to be enabled):
+  playwright_navigate(url)          \u2014 open a page at the given URL
+  playwright_screenshot()           \u2014 capture a full-page or viewport screenshot
+  playwright_click(selector)        \u2014 click on an element matching a CSS selector
+  playwright_type(selector, text)   \u2014 type text into a focused input element
+  playwright_evaluate(script)       \u2014 run arbitrary JavaScript in the page context
+  playwright_select_option(selector, value) \u2014 pick a <select> dropdown option
+  playwright_hover(selector)        \u2014 hover the mouse over an element
+  playwright_fill_form(fields)      \u2014 fill multiple form fields in one call
+  playwright_wait_for(selector)     \u2014 block until an element appears on the page
+  playwright_press_key(key)         \u2014 press a keyboard key (Enter, Tab, Escape, \u2026)
+  playwright_drag(from, to)         \u2014 drag an element from one selector to another
+Input format you accept:
+{ "task": "navigate | screenshot | extract | interact | verify", "url": "<url>", "steps": ["step1", "step2"] }
+Output: Structured markdown report:
+- ## Page (URL, title, load status)
+- ## Actions Taken (step-by-step with timestamps)
+- ## Results (extracted data, element states, verification results)
+- ## Screenshots (list attached screenshot references)
+- ## Errors (any failures with stack traces)
+Working rules:
+- Always playwright_navigate first before any interaction
+- Always playwright_wait_for after navigation to ensure the page is ready
+- playwright_screenshot is your primary evidence \u2014 use it before and after interactions
+- Use playwright_evaluate for structured data extraction (JSON, text content)
+- If a selector fails, try alternative selectors before giving up
+- Report exact CSS selectors used \u2014 they're part of the evidence
+- If playwright tools are unavailable, report the error immediately \u2014 do not guess`
+    },
+    budget: MEDIUM_BUDGET,
+    capability: {
+      phase: "verify",
+      summary: "Browser automation: opens pages, clicks, types, screenshots, extracts data via Playwright headless Chromium.",
+      keywords: [
+        "browser",
+        "screenshot",
+        "navigate",
+        "web page",
+        "scrape",
+        "crawl",
+        "headless",
+        "chrome",
+        "open url",
+        "capture",
+        "page title",
+        "extract data",
+        "fill form",
+        "click button",
+        "take screenshot"
       ]
     }
   },