npm - @desplega.ai/agent-swarm - Versions diffs - 1.74.4 → 1.76.0 - Mend

@desplega.ai/agent-swarm 1.74.4 → 1.76.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (88) hide show

package/README.md +1 -1
package/openapi.json +1264 -46
package/package.json +2 -2
package/src/be/db.ts +563 -9
package/src/be/memory/edges-store.ts +69 -0
package/src/be/memory/providers/sqlite-store.ts +4 -0
package/src/be/memory/raters/explicit-self.ts +22 -0
package/src/be/memory/raters/implicit-citation.ts +44 -0
package/src/be/memory/raters/llm-client.ts +172 -0
package/src/be/memory/raters/llm-summarizer.ts +218 -0
package/src/be/memory/raters/llm.ts +375 -0
package/src/be/memory/raters/noop.ts +14 -0
package/src/be/memory/raters/registry.ts +86 -0
package/src/be/memory/raters/retrieval.ts +88 -0
package/src/be/memory/raters/run-server-raters.ts +97 -0
package/src/be/memory/raters/store.ts +228 -0
package/src/be/memory/raters/types.ts +101 -0
package/src/be/memory/reranker.ts +32 -2
package/src/be/memory/retrieval-store.ts +116 -0
package/src/be/memory/types.ts +3 -0
package/src/be/migrations/051_memory_posteriors_and_retrieval.sql +67 -0
package/src/be/migrations/052_memory_edges.sql +36 -0
package/src/be/migrations/053_agent_waiting_for_credentials_status.sql +61 -0
package/src/be/migrations/054_agent_harness_provider.sql +21 -0
package/src/be/migrations/055_agent_cred_status.sql +15 -0
package/src/be/migrations/056_drop_agent_tasks_source_check.sql +139 -0
package/src/be/migrations/057_inbox_item_state.sql +27 -0
package/src/be/migrations/058_task_templates.sql +31 -0
package/src/be/swarm-config-guard.ts +24 -0
package/src/commands/credential-wait.ts +186 -0
package/src/commands/provider-credentials.ts +434 -0
package/src/commands/runner.ts +253 -21
package/src/hooks/hook.ts +143 -66
package/src/http/agents.ts +191 -1
package/src/http/config.ts +11 -1
package/src/http/core.ts +5 -0
package/src/http/inbox-state.ts +89 -0
package/src/http/index.ts +10 -0
package/src/http/memory.ts +230 -1
package/src/http/sessions.ts +86 -0
package/src/http/status.ts +665 -0
package/src/http/task-templates.ts +51 -0
package/src/http/tasks.ts +85 -5
package/src/http/users.ts +134 -0
package/src/prompts/memories.ts +62 -0
package/src/providers/claude-adapter.ts +22 -0
package/src/providers/claude-managed-adapter.ts +24 -0
package/src/providers/codex-adapter.ts +43 -1
package/src/providers/devin-adapter.ts +18 -0
package/src/providers/index.ts +7 -0
package/src/providers/opencode-adapter.ts +60 -0
package/src/providers/pi-mono-adapter.ts +71 -0
package/src/providers/types.ts +34 -0
package/src/server.ts +2 -0
package/src/slack/handlers.ts +0 -1
package/src/tests/agents-harness-provider.test.ts +333 -0
package/src/tests/credential-check.test.ts +367 -0
package/src/tests/credential-status-api.test.ts +223 -0
package/src/tests/credential-status-routing.test.ts +150 -0
package/src/tests/credential-wait.test.ts +282 -0
package/src/tests/harness-provider-resolution.test.ts +242 -0
package/src/tests/jira-sync.test.ts +1 -1
package/src/tests/memory-edges.test.ts +722 -0
package/src/tests/memory-rate-endpoint.test.ts +330 -0
package/src/tests/memory-rate-tool.test.ts +252 -0
package/src/tests/memory-rater-e2e.test.ts +578 -0
package/src/tests/memory-rater-implicit-citation.test.ts +304 -0
package/src/tests/memory-rater-llm-summarizer.test.ts +317 -0
package/src/tests/memory-rater-llm.test.ts +964 -0
package/src/tests/memory-rater-store.test.ts +249 -0
package/src/tests/memory-reranker.test.ts +161 -2
package/src/tests/migration-runner-regressions.test.ts +17 -2
package/src/tests/mocks/mock-llm-rater-client.ts +35 -0
package/src/tests/run-server-raters.test.ts +291 -0
package/src/tests/sessions.test.ts +141 -0
package/src/tests/status.test.ts +843 -0
package/src/tests/stop-hook-task-resolution.test.ts +98 -0
package/src/tests/template-recommendations.test.ts +148 -0
package/src/tests/tool-annotations.test.ts +2 -2
package/src/tests/use-dismissible-card.test.ts +140 -0
package/src/tools/memory-rate.ts +166 -0
package/src/tools/memory-search.ts +18 -0
package/src/tools/store-progress.ts +37 -0
package/src/tools/swarm-config/set-config.ts +17 -1
package/src/tools/tool-config.ts +1 -0
package/src/types.ts +122 -1
package/src/utils/harness-provider.ts +32 -0
package/tsconfig.json +0 -2

package/src/http/memory.ts CHANGED Viewed

@@ -3,10 +3,19 @@ import { z } from "zod";
 import { chunkContent } from "../be/chunking";
 import { getEmbeddingProvider, getMemoryStore } from "../be/memory";
 import { CANDIDATE_SET_MULTIPLIER } from "../be/memory/constants";
+import { listEdgesForAgent } from "../be/memory/edges-store";
+import { recordRetrievals } from "../be/memory/raters/retrieval";
+import { applyRating, ExplicitSelfDuplicateError } from "../be/memory/raters/store";
+import {
+  type RatingEvent,
+  REFERENCES_SOURCE_MAX_LENGTH,
+  sanitizeReferencesSource,
+} from "../be/memory/raters/types";
 import { rerank } from "../be/memory/reranker";
+import { getRetrievalsForAgent, hasRetrievalForTask } from "../be/memory/retrieval-store";
 import { AgentMemoryScopeSchema, AgentMemorySourceSchema } from "../types";
 import { route } from "./route-def";
-import { json, jsonError } from "./utils";
+import { json, jsonError, parseQueryParams } from "./utils";
 // ─── Route Definitions ───────────────────────────────────────────────────────
@@ -115,6 +124,105 @@ const deleteMemoryById = route({
   },
 });
+// Memory rater v1.5 — worker-facing rating endpoints. Plan:
+// thoughts/taras/plans/2026-05-05-memory-rater-v1.5/step-3.md
+//
+// `source` is restricted to `llm` and `explicit-self` at the HTTP boundary —
+// `implicit-citation` runs in-process server-side via applyRating directly
+// and must never arrive over HTTP (defence against worker spoofing).
+// `referencesSource` (step-6 §4) — Q2 free-form contract: ≤512 chars,
+// control-char strip, NUL byte rejection. Convention `<source>:<identifier>`
+// (e.g. github:owner/repo#N, linear:KEY-N, customer:<slug>) is documented
+// only in the OpenAPI description — server does NOT validate prefixes and
+// does NOT enforce a closed enum. When sanitization rejects the input, the
+// transform records a custom issue via `ctx.addIssue` and returns `z.NEVER`
+// (it does not throw), so the request fails with a clear 400.
+const ReferencesSourceSchema = z // validates, then sanitizes, the optional `referencesSource` field
+  .string()
+  .min(1)
+  .max(REFERENCES_SOURCE_MAX_LENGTH) // length cap is checked on the raw value, before sanitization runs
+  .transform((value, ctx) => {
+    const cleaned = sanitizeReferencesSource(value);
+    if (cleaned === null) { // null is treated as the sanitizer's rejection result
+      ctx.addIssue({
+        code: z.ZodIssueCode.custom,
+        message: "referencesSource must not contain NUL bytes or strip to empty",
+      });
+      return z.NEVER; // return-type sentinel only; the issue added above is what fails the parse
+    }
+    return cleaned; // consumers of the parsed value get the sanitized string, not the raw input
+  })
+  .describe(
+    'Optional external source ID this memory references. Free-form string, convention "<source>:<identifier>" (e.g. "github:owner/repo#N", "linear:KEY-N", "customer:<slug>", "slack:<channel>:<ts>", "agentmail:<thread-id>"). Pick any prefix that fits — no closed enum. When present, an edge from this memory to the external source is created/updated.',
+  );
+const RateEventSchema = z.object({ // shape of one entry in the `events` array of POST /api/memory/rate
+  memoryId: z.string().min(1), // required, non-empty
+  signal: z.number().min(-1).max(1), // bounded to [-1, 1]
+  weight: z.number().min(0).max(1), // bounded to [0, 1]
+  source: z.enum(["llm", "explicit-self"]), // `implicit-citation` is deliberately not accepted over HTTP
+  reasoning: z.string().max(500).optional(), // optional free text, at most 500 characters
+  taskId: z.string().uuid().optional(), // optional here; the rate handler additionally requires it for explicit-self events
+  referencesSource: ReferencesSourceSchema.optional(), // sanitized by ReferencesSourceSchema when present
+});
+const rateMemory = route({ // POST /api/memory/rate — submit a batch of rating events
+  method: "post",
+  path: "/api/memory/rate",
+  pattern: ["api", "memory", "rate"],
+  summary: "Submit RatingEvents to update memory usefulness posteriors",
+  tags: ["Memory"],
+  auth: { apiKey: true, agentId: true }, // the handler also rejects requests without an agent id (400)
+  body: z.object({
+    events: z.array(RateEventSchema).min(1).max(50), // between 1 and 50 events per request
+  }),
+  responses: {
+    200: { description: "Ratings applied; per-event rejections returned in body" },
+    400: { description: "Validation error or explicit-self R6 spam-guard rejection" },
+    409: { description: "Duplicate explicit-self rating for (taskId, memoryId)" },
+  },
+});
+const getRetrievals = route({ // GET /api/memory/retrievals — list retrieved memories for a task or session
+  method: "get",
+  path: "/api/memory/retrievals",
+  pattern: ["api", "memory", "retrievals"],
+  summary: "List memories retrieved for a task or session (rater input)",
+  tags: ["Memory"],
+  auth: { apiKey: true, agentId: true },
+  query: z
+    .object({
+      taskId: z.string().uuid().optional(), // must be a UUID when supplied
+      sessionId: z.string().optional(), // any string when supplied
+    })
+    .refine((q) => q.taskId || q.sessionId, { // truthiness check: an empty `sessionId` on its own does not satisfy it
+      message: "taskId or sessionId required",
+    }),
+  responses: {
+    200: { description: "Retrieval rows joined with agent_memory" },
+    400: { description: "Missing taskId/sessionId or X-Agent-ID" },
+  },
+});
+// Memory rater v1.5 step-6 — the edges-list endpoint that powers the
+// homepage demo ("this memory references PR #377"). Auth by X-Agent-ID +
+// Bearer with defence-in-depth: the joined `agent_memory` row must either
+// be swarm-scope or owned by the requesting agent. Plan §7.
+const getMemoryEdges = route({ // GET /api/memory/edges — list references-source edges for one memory
+  method: "get",
+  path: "/api/memory/edges",
+  pattern: ["api", "memory", "edges"],
+  summary: "List references-source edges for a memory",
+  tags: ["Memory"],
+  auth: { apiKey: true, agentId: true },
+  query: z.object({
+    memoryId: z.string().min(1), // required, non-empty
+  }),
+  responses: {
+    200: { description: "Edges with computed usefulness scores" },
+    400: { description: "Missing memoryId or X-Agent-ID" },
+  },
+});
 // ─── Handler ─────────────────────────────────────────────────────────────────
 export async function handleMemory(
@@ -211,6 +319,27 @@ export async function handleMemory(
       });
       const ranked = rerank(candidates, { limit: Math.min(limit, 20) });
+      // Retrieval bridge — when caller passed `X-Source-Task-ID`, record one
+      // `memory_retrieval` row per returned memory so server-side raters
+      // (ImplicitCitationRater, fired from store-progress on task completion)
+      // know which memories were surfaced. Best-effort: a logging failure must
+      // never poison search.
+      const sourceTaskIdHeader = req.headers["x-source-task-id"];
+      const sourceTaskId = Array.isArray(sourceTaskIdHeader)
+        ? sourceTaskIdHeader[0]
+        : sourceTaskIdHeader;
+      if (sourceTaskId) {
+        try {
+          recordRetrievals(
+            sourceTaskId,
+            myAgentId,
+            ranked.map((r) => ({ memoryId: r.id, similarity: r.similarity })),
+          );
+        } catch (err) {
+          console.error("[memory-search] recordRetrievals failed:", (err as Error).message);
+        }
+      }
       json(res, {
         results: ranked.map((r) => ({
           id: r.id,
@@ -389,5 +518,105 @@ export async function handleMemory(
     return true;
   }
+  if (rateMemory.match(req.method, pathSegments)) {
+    if (!myAgentId) {
+      jsonError(res, "Missing X-Agent-ID header", 400);
+      return true;
+    }
+    const parsed = await rateMemory.parse(req, res, pathSegments, new URLSearchParams());
+    if (!parsed) return true;
+    const { events } = parsed.body;
+    // R6 spam guard: explicit-self requires a matching memory_retrieval row.
+    // Reject the whole batch on first offender so the worker sees a clear 400.
+    for (const evt of events) {
+      if (evt.source !== "explicit-self") continue;
+      if (!evt.taskId) {
+        jsonError(res, `explicit-self rating for memoryId=${evt.memoryId} requires taskId`, 400);
+        return true;
+      }
+      if (!hasRetrievalForTask(evt.taskId, evt.memoryId)) {
+        jsonError(
+          res,
+          `explicit-self rating rejected: memoryId=${evt.memoryId} not present in memory_retrieval for task=${evt.taskId}`,
+          400,
+        );
+        return true;
+      }
+    }
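+    // applyRating's ctx carries a single taskId for the batch. Group events by
+    // taskId so each call gets a single coherent ctx (and one transaction).
+    // NOTE(review): groups are applied one after another, so if a later group
+    // throws ExplicitSelfDuplicateError the 409 is sent after earlier groups
+    // may already have been applied — confirm that partial application is intended.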
+    const groups = new Map<string | undefined, typeof events>();
+    for (const evt of events) {
+      const list = groups.get(evt.taskId) ?? [];
+      list.push(evt);
+      groups.set(evt.taskId, list);
+    }
+    let applied = 0;
+    const rejected: { memoryId: string; reason: string }[] = [];
+    try {
+      for (const [taskId, batch] of groups) {
+        const ratingEvents: RatingEvent[] = batch.map((e) => ({
+          memoryId: e.memoryId,
+          signal: e.signal,
+          weight: e.weight,
+          source: e.source,
+          reasoning: e.reasoning,
+          ...(e.referencesSource !== undefined ? { referencesSource: e.referencesSource } : {}),
+        }));
+        const result = applyRating(ratingEvents, { taskId });
+        applied += result.applied;
+        for (const r of result.rejected) {
+          rejected.push({ memoryId: r.event.memoryId, reason: r.reason });
+        }
+      }
+    } catch (err) {
+      if (err instanceof ExplicitSelfDuplicateError) {
+        jsonError(res, `Duplicate explicit-self rating for memoryId=${err.event.memoryId}`, 409);
+        return true;
+      }
+      throw err;
+    }
+    json(res, { applied, rejected });
+    return true;
+  }
+  if (getRetrievals.match(req.method, pathSegments)) {
+    if (!myAgentId) {
+      jsonError(res, "Missing X-Agent-ID header", 400);
+      return true;
+    }
+    const queryParams = parseQueryParams(req.url || "");
+    const parsed = await getRetrievals.parse(req, res, pathSegments, queryParams);
+    if (!parsed) return true;
+    const { taskId, sessionId } = parsed.query;
+    const rows = getRetrievalsForAgent(myAgentId, { taskId, sessionId });
+    json(res, { results: rows });
+    return true;
+  }
+  if (getMemoryEdges.match(req.method, pathSegments)) {
+    if (!myAgentId) {
+      jsonError(res, "Missing X-Agent-ID header", 400);
+      return true;
+    }
+    const queryParams = parseQueryParams(req.url || "");
+    const parsed = await getMemoryEdges.parse(req, res, pathSegments, queryParams);
+    if (!parsed) return true;
+    const { memoryId } = parsed.query;
+    const edges = listEdgesForAgent(myAgentId, memoryId);
+    json(res, { edges });
+    return true;
+  }
   return false;
 }

package/src/http/sessions.ts ADDED Viewed

@@ -0,0 +1,86 @@
+import type { IncomingMessage, ServerResponse } from "node:http";
+import { z } from "zod";
+import { getRootTaskChain, getTaskById, listRecentSessions } from "../be/db";
+import { route } from "./route-def";
+import { json, jsonError } from "./utils";
+// ─── Route Definitions ───────────────────────────────────────────────────────
+// GET /api/sessions — lists recent task sessions. Every query parameter is
+// optional. `limit` and `offset` are coerced from their string form and must
+// be non-negative integers, so a negative value is rejected during validation
+// instead of being forwarded to the session query.
+const listSessions = route({
+  method: "get",
+  path: "/api/sessions",
+  pattern: ["api", "sessions"],
+  summary: "List recent task sessions (root tasks + chain summary)",
+  tags: ["Sessions"],
+  query: z.object({
+    /** Maximum number of sessions to return; non-negative integer. */
+    limit: z.coerce.number().int().nonnegative().optional(),
+    /** Number of sessions to skip; non-negative integer. */
+    offset: z.coerce.number().int().nonnegative().optional(),
+    /** Comma-separated source filter (e.g. `ui,slack`). Omit to include all. */
+    source: z.string().optional(),
+    /** Case-insensitive substring match against the root task's text. */
+    q: z.string().optional(),
+  }),
+  responses: {
+    200: { description: "Recent sessions ordered by chain-wide last activity" },
+    400: { description: "Invalid query parameters" },
+    401: { description: "Unauthorized" },
+  },
+  auth: { apiKey: true },
+});
+const getSession = route({ // GET /api/sessions/{rootTaskId} — one session: root task plus its chain
+  method: "get",
+  path: "/api/sessions/{rootTaskId}",
+  pattern: ["api", "sessions", null], // presumably `null` matches any single segment (the rootTaskId) — confirm against route-def
+  summary: "Get a session — root task + the entire descendant chain",
+  tags: ["Sessions"],
+  params: z.object({ rootTaskId: z.string() }), // any string is accepted; no format check at this layer
+  responses: {
+    200: { description: "Root task + chain (ordered by createdAt)" },
+    401: { description: "Unauthorized" },
+    404: { description: "Root task not found" },
+  },
+  auth: { apiKey: true },
+});
+// ─── Handler ─────────────────────────────────────────────────────────────────
+/**
+ * Serves the `/api/sessions` routes (session list and single-session lookup).
+ *
+ * @param req - Incoming request; its method is matched against each route.
+ * @param res - Response that the JSON payload or error is written to.
+ * @param pathSegments - Request path split into segments, used for route matching.
+ * @param queryParams - Parsed query string handed to the route parser.
+ * @returns `true` when one of the session routes matched the request,
+ *   `false` when none did and the caller should try other handlers.
+ */
+export async function handleSessions(
+  req: IncomingMessage,
+  res: ServerResponse,
+  pathSegments: string[],
+  queryParams: URLSearchParams,
+): Promise<boolean> {
+  if (listSessions.match(req.method, pathSegments)) {
+    const parsed = await listSessions.parse(req, res, pathSegments, queryParams);
+    // A falsy result means parsing failed; presumably `parse` has already responded.
+    if (!parsed) return true;
+    const { limit, offset, source, q } = parsed.query;
+    // Split the comma-separated filter and drop blank entries.
+    const requested = (source ?? "")
+      .split(",")
+      .map((s) => s.trim())
+      .filter(Boolean);
+    // A filter with no usable entries (e.g. `source=,` or only whitespace) is
+    // treated like an omitted filter, matching how an empty `source=` behaves,
+    // rather than being passed on as an empty list.
+    const sources = requested.length > 0 ? requested : undefined;
+    const sessions = listRecentSessions({ limit, offset, source: sources, q });
+    json(res, { sessions });
+    return true;
+  }
+  if (getSession.match(req.method, pathSegments)) {
+    const parsed = await getSession.parse(req, res, pathSegments, queryParams);
+    if (!parsed) return true;
+    const { rootTaskId } = parsed.params;
+    // Look the task up first so an unknown id yields a 404 instead of an empty chain.
+    const root = getTaskById(rootTaskId);
+    if (!root) {
+      jsonError(res, "Root task not found", 404);
+      return true;
+    }
+    const chain = getRootTaskChain(rootTaskId);
+    json(res, { root, chain });
+    return true;
+  }
+  return false;
+}