npm - @bluecopa/harness - Versions diffs - 0.1.0-snapshot.129 → 0.1.0-snapshot.130 - Mend

@bluecopa/harness 0.1.0-snapshot.129 → 0.1.0-snapshot.130

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (5)

package/dist/arc/create-arc-agent.js +100 -77
package/dist/arc/create-arc-agent.js.map +1 -1
package/dist/arc/profile-builder.js +2 -3
package/dist/arc/profile-builder.js.map +1 -1
package/package.json +1 -1

package/dist/arc/create-arc-agent.js CHANGED

@@ -2601,7 +2601,7 @@ function createProcess(request, config) {
       }
     }
   };
-  const seedPromise = buildSeedMessages(request.contextEpisodeIds ?? [], config.episodeStore);
+  const seedPromise = buildSessionContext(config.episodeStore, config.taskId, request.expectedFiles);
   const startTime = Date.now();
   void (async () => {
     const traceMarkers = [];
@@ -2945,37 +2945,70 @@ async function getNextEpisodeIndex(store, taskId) {
   const episodes = await store.getEpisodesByTask(taskId);
   return episodes.length;
 }
-async function buildSeedMessages(episodeIds, episodeStore) {
-  if (episodeIds.length === 0) return [];
-  const messages = [];
-  for (const id of episodeIds) {
-    const episode = await episodeStore.getEpisode(id);
-    if (!episode) continue;
-    const blocks = [
-      `Action: ${episode.threadAction}`,
-      `Status: ${episode.success ? "success" : "failed"}`,
-      `Summary:
-${episode.summary}`
-    ];
-    if (episode.structuredOutput && Object.keys(episode.structuredOutput).length > 0) {
-      const structuredOutput = JSON.stringify(episode.structuredOutput, null, 2);
-      const truncated = structuredOutput.length > 2e3 ? structuredOutput.slice(0, 2e3) + "\n... [truncated]" : structuredOutput;
-      blocks.push(`Structured output:
-${truncated}`);
-    }
-    if (episode.artifactKeys && episode.artifactKeys.length > 0) {
-      blocks.push(`Artifact handles:
-${episode.artifactKeys.join(", ")}`);
+async function buildSessionContext(episodeStore, taskId, expectedFiles) {
+  const episodes = await episodeStore.getEpisodesByTask(taskId);
+  if (episodes.length === 0) return [];
+  const normalizedExpected = new Set(
+    (expectedFiles ?? []).map((f) => f.trim().replace(/\\/g, "/").replace(/^\.\//, ""))
+  );
+  const overlappingIds = /* @__PURE__ */ new Set();
+  for (const ep of episodes) {
+    const epFiles = [...ep.filesModified ?? [], ...ep.filesRead ?? []].map(
+      (f) => f.trim().replace(/\\/g, "/").replace(/^\.\//, "")
+    );
+    if (epFiles.some((f) => normalizedExpected.has(f) || [...normalizedExpected].some((e) => f.endsWith(`/${e}`) || e.endsWith(`/${f}`)))) {
+      overlappingIds.add(ep.id);
     }
-    blocks.push('Use ReadEpisode with detail: "trace" or "artifacts" only if you need more than this summary.');
+  }
+  const recentEpisodes = episodes.slice(-5);
+  const recentIds = new Set(recentEpisodes.map((e) => e.id));
+  const oldEpisodes = episodes.filter((e) => !recentIds.has(e.id) && !overlappingIds.has(e.id));
+  const overlapEpisodes = episodes.filter((e) => overlappingIds.has(e.id) && !recentIds.has(e.id));
+  const messages = [];
+  if (oldEpisodes.length > 0) {
+    const groupSummary = [
+      `Grouped summary of ${oldEpisodes.length} earlier episodes:`,
+      `  Successful: ${oldEpisodes.filter((e) => e.success).length}`,
+      `  Failed: ${oldEpisodes.filter((e) => !e.success).length}`,
+      `  Files modified: ${[...new Set(oldEpisodes.flatMap((e) => e.filesModified))].slice(0, 10).join(", ")}${oldEpisodes.flatMap((e) => e.filesModified).length > 10 ? "..." : ""}`,
+      `  Actions: ${oldEpisodes.map((e) => e.threadAction.slice(0, 40)).slice(0, 5).join("; ")}${oldEpisodes.length > 5 ? "..." : ""}`
+    ].join("\n");
+    messages.push({ role: "system", content: groupSummary });
+  }
+  for (const episode of overlapEpisodes) {
+    messages.push({
+      role: "system",
+      content: formatEpisodeDetail(episode, "file-overlap")
+    });
+  }
+  for (const episode of recentEpisodes) {
     messages.push({
       role: "system",
-      content: `Context from prior episode (${id}):
-${blocks.join("\n\n")}`
+      content: formatEpisodeDetail(episode, "recent")
     });
   }
   return messages;
 }
+function formatEpisodeDetail(episode, tag) {
+  const blocks = [
+    `Episode E${episode.index} [${episode.id}] (${tag}, ${episode.success ? "ok" : "failed"}):`,
+    `Action: ${episode.threadAction}`,
+    `Summary:
+${episode.summary}`
+  ];
+  if (episode.structuredOutput && Object.keys(episode.structuredOutput).length > 0) {
+    const structuredOutput = JSON.stringify(episode.structuredOutput, null, 2);
+    const truncated = structuredOutput.length > 2e3 ? structuredOutput.slice(0, 2e3) + "\n... [truncated]" : structuredOutput;
+    blocks.push(`Structured output:
+${truncated}`);
+  }
+  if (episode.artifactKeys && episode.artifactKeys.length > 0) {
+    blocks.push(`Artifact handles:
+${episode.artifactKeys.join(", ")}`);
+  }
+  blocks.push("Use ReadEpisode for more detail if needed.");
+  return blocks.join("\n\n");
+}
 function normalizeSeedContext(ctx) {
   if (!ctx) return [];
   if (typeof ctx === "string") {
@@ -3484,6 +3517,39 @@ var ProcessManager = class {
     const existingId = this.actionIndex.get(normalizeAction(action));
     return existingId ? this.processes.get(existingId) : void 0;
   }
+  /**
+   * Auto-inject contextEpisodeIds for file ownership.
+   * Returns a new request with any missing episode IDs added.
+   * This eliminates the need for the LLM to track episode IDs manually.
+   */
+  autoInjectFileOwnership(request) {
+    if (!isExclusiveRequest(request)) return request;
+    const currentOwnedFiles = ownedFiles(request);
+    const currentContextEpisodeIds = new Set(request.contextEpisodeIds ?? []);
+    const injectedIds = [];
+    for (const proc of this.processes.values()) {
+      if (proc.status !== "completed" || !proc.result) continue;
+      const procRequest = this.processRequests.get(proc.id);
+      if (!isExclusiveRequest(procRequest)) continue;
+      const procEpisodeId = proc.result.episode.id;
+      if (currentContextEpisodeIds.has(procEpisodeId)) continue;
+      const procOwnedFiles = /* @__PURE__ */ new Set([
+        ...ownedFiles(procRequest),
+        ...(proc.result.episode.filesModified ?? []).map(normalizeExpectedPath)
+      ]);
+      const hasOverlap = currentOwnedFiles.some(
+        (currentFile) => [...procOwnedFiles].some((ownedFile) => pathsOverlap(currentFile, ownedFile))
+      );
+      if (hasOverlap) {
+        injectedIds.push(procEpisodeId);
+      }
+    }
+    if (injectedIds.length === 0) return request;
+    return {
+      ...request,
+      contextEpisodeIds: [...request.contextEpisodeIds ?? [], ...injectedIds]
+    };
+  }
   findDispatchConflict(request) {
     const existing = this.findByAction(request.action ?? "");
     if (existing && (existing.status === "running" || existing.status === "pending")) {
@@ -3494,7 +3560,7 @@ var ProcessManager = class {
     }
     const currentExclusive = isExclusiveRequest(request);
     const currentOwnedFiles = ownedFiles(request);
-    const currentContextEpisodeIds = new Set(request.contextEpisodeIds ?? []);
+    new Set(request.contextEpisodeIds ?? []);
     for (const proc of this.processes.values()) {
       if (proc.status !== "running" && proc.status !== "pending") continue;
       const procRequest = this.processRequests.get(proc.id);
@@ -3511,30 +3577,6 @@ var ProcessManager = class {
         return { kind: "exclusive_running", process: proc };
       }
     }
-    if (currentExclusive) {
-      for (const proc of this.processes.values()) {
-        if (proc.status !== "completed" || !proc.result) continue;
-        const procRequest = this.processRequests.get(proc.id);
-        if (!isExclusiveRequest(procRequest)) continue;
-        const procEpisodeId = proc.result.episode.id;
-        if (currentContextEpisodeIds.has(procEpisodeId)) continue;
-        const procOwnedFiles = /* @__PURE__ */ new Set([
-          ...ownedFiles(procRequest),
-          ...(proc.result.episode.filesModified ?? []).map(normalizeExpectedPath)
-        ]);
-        const overlappingFiles = currentOwnedFiles.filter(
-          (currentFile) => [...procOwnedFiles].some((ownedFile) => pathsOverlap(currentFile, ownedFile))
-        );
-        if (overlappingFiles.length > 0) {
-          return {
-            kind: "missing_context_for_edit_retry",
-            process: proc,
-            files: overlappingFiles,
-            episodeId: procEpisodeId
-          };
-        }
-      }
-    }
     return null;
   }
   validateDispatchRequest(request) {
@@ -3618,13 +3660,6 @@ var ProcessManager = class {
         message: `FILE OWNERSHIP CONFLICT \u2014 process ${conflict.process.id} currently owns ${conflict.files.join(", ")}. Wait for it to finish before dispatching overlapping work.`
       };
     }
-    if (conflict.kind === "missing_context_for_edit_retry") {
-      return {
-        allow: false,
-        reason: `missing contextEpisodeIds for follow-up edit on files owned by episode ${conflict.episodeId}`,
-        message: `EDIT RETRY MUST CHAIN CONTEXT \u2014 overlapping files ${conflict.files.join(", ")} were already edited in process ${conflict.process.id} (episodeId: ${conflict.episodeId}). Dispatch exactly one follow-up edit thread with contextEpisodeIds: ["${conflict.episodeId}"] instead of starting a fresh edit thread.`
-      };
-    }
     return {
       allow: false,
       reason: `exclusive edit/verify conflict with process ${conflict.process.id}`,
@@ -3875,15 +3910,6 @@ var ProcessManager = class {
     const { loopConfig } = this.config;
     return async (action) => {
       if (action.name === "ReadEpisode") {
-        const allowedEpisodeIds = new Set(request.contextEpisodeIds ?? []);
-        const requestedEpisodeId = String(action.args.id ?? "");
-        if (!allowedEpisodeIds.has(requestedEpisodeId)) {
-          return {
-            success: false,
-            output: "",
-            error: `ReadEpisode is limited to contextEpisodeIds for this thread. Allowed episode IDs: ${[...allowedEpisodeIds].join(", ") || "(none)"}`
-          };
-        }
         const output = await renderEpisodeReadResult({
           episodeStore: loopConfig.episodeStore,
           args: action.args,
@@ -4064,7 +4090,7 @@ var OrchestratorTurnRunner = class {
       const toolCallId = call.toolCallId ?? randomUUID();
       this.config.trace({ type: "tool_call", tool: call.toolName });
       if (call.toolName === "Thread") {
-        const request = this.toProcessRequest(call.args);
+        const rawRequest = this.toProcessRequest(call.args);
         if (exclusiveThreadIndex !== -1 && index !== exclusiveThreadIndex) {
           const resultText2 = "SAME-TURN EDIT SERIALIZATION \u2014 a bounded edit or verification thread is already being dispatched in this turn. Let that single owner thread read, edit, and verify before dispatching any other threads.";
           toolResultMessages.push({
@@ -4072,9 +4098,10 @@ var OrchestratorTurnRunner = class {
             content: resultText2,
             toolResults: [{ toolCallId, toolName: "Thread", result: resultText2 }]
           });
-          yield { type: "thread_rejected", action: request.action ?? "", reason: "same-turn exclusive edit/verify work must run alone" };
+          yield { type: "thread_rejected", action: rawRequest.action ?? "", reason: "same-turn exclusive edit/verify work must run alone" };
           continue;
         }
+        const request = this.config.processManager.autoInjectFileOwnership(rawRequest);
         const validation = this.config.processManager.validateDispatchRequest(request);
         if (!validation.allow) {
           toolResultMessages.push({
@@ -4445,9 +4472,7 @@ ${failureSummary}`;
         (toolResult) => toolResult.toolName === "DownloadRawFile" && !toolResult.isError
       )
     );
-    const hints = [
-      `To give a dependent thread the full data from this thread, pass contextEpisodeIds: ["${episode.id}"]`
-    ];
+    const hints = [];
     const structuredOutputText = this.formatStructuredOutput(episode.structuredOutput);
     if (structuredOutputText) {
       hints.push("Prefer the structured output above as the canonical handoff artifact for dependent threads.");
@@ -4478,7 +4503,7 @@ ${structuredOutputText}` : null,
   buildRetryHint(process2) {
     const files = process2.result?.episode.filesModified?.filter(Boolean) ?? [];
     const fileList = files.length > 0 ? files.join(", ") : "(same file scope)";
-    return `If you retry this edit, dispatch exactly one follow-up edit thread for ${fileList} and include contextEpisodeIds: ["${process2.result?.episode.id}"].`;
+    return `If you retry this edit, dispatch exactly one follow-up edit thread for ${fileList}. File ownership is auto-chained.`;
   }
   formatStructuredOutput(structuredOutput) {
     if (!structuredOutput || Object.keys(structuredOutput).length === 0) {
@@ -4515,7 +4540,7 @@ var DEFAULT_ORCHESTRATOR_PROMPT = `You are an orchestrator agent. You accomplish
 Dispatch when the task requires tool use (search, code, file I/O, web access). Examples:
 - "Research X and Y" \u2192 2 parallel research threads
-- "Read file A, then modify it" \u2192 1 read thread, then 1 write thread with contextEpisodeIds
+- "Read file A, then modify it" \u2192 1 read thread, then 1 write thread
 - "Create a report with data from 3 sources" \u2192 3 parallel data threads, then 1 synthesis thread
 ## When NOT to dispatch
@@ -4541,13 +4566,11 @@ Dispatch at most 3 threads per turn. If more are needed, dispatch the first batc
 Research and read-only work may parallelize.
 Do not split one small edit into multiple edit threads.
 For a bounded edit, dispatch exactly one editor thread that reads, edits, and verifies the change.
-If a prior edit already touched the same files, dispatch a single follow-up edit thread with that episode in contextEpisodeIds.
+File ownership is auto-chained by the harness \u2014 you don't need to track episode IDs manually.
 ## Context passing
-Threads automatically receive the user's current message and any attachment metadata as seed context. You do NOT need to copy-paste URLs, file contents, or pasted data into the action text \u2014 threads can read this directly from their context.
-Use contextEpisodeIds to chain dependent threads: research threads first (parallel), then implementation threads with their episodeIds.
+Threads automatically receive the user's current message, attachment metadata, and compressed session history as seed context. You do NOT need to copy-paste URLs, file contents, or pasted data into the action text \u2014 threads can read this directly from their context.
 ## Completion