npm - @bluecopa/harness - Versions diffs - 1.0.0 → 2.0.1-snapshot.1 - Mend

@bluecopa/harness 1.0.0 → 2.0.1-snapshot.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (84) hide show

package/README.md +212 -117
package/dist/arc/index.d.ts +1107 -0
package/dist/arc/index.js +4986 -0
package/dist/arc/index.js.map +1 -0
package/dist/observability/otel.d.ts +36 -0
package/dist/observability/otel.js +73 -0
package/dist/observability/otel.js.map +1 -0
package/dist/shared-types-vZuVoy_H.d.ts +147 -0
package/dist/skills/index.d.ts +67 -0
package/dist/skills/index.js +282 -0
package/dist/skills/index.js.map +1 -0
package/package.json +25 -1
package/AGENTS.md +0 -18
package/docs/guides/observability.md +0 -32
package/docs/guides/providers.md +0 -51
package/docs/guides/skills.md +0 -25
package/docs/security/skill-sandbox-threat-model.md +0 -20
package/src/agent/create-agent.ts +0 -884
package/src/agent/create-tools.ts +0 -33
package/src/agent/step-executor.ts +0 -15
package/src/agent/types.ts +0 -57
package/src/context/llm-compaction-strategy.ts +0 -37
package/src/context/prepare-step.ts +0 -65
package/src/context/token-tracker.ts +0 -26
package/src/extracted/manifest.json +0 -10
package/src/extracted/prompts/compaction.md +0 -5
package/src/extracted/prompts/system.md +0 -5
package/src/extracted/tools.json +0 -82
package/src/hooks/hook-runner.ts +0 -22
package/src/hooks/tool-wrappers.ts +0 -64
package/src/interfaces/compaction-strategy.ts +0 -18
package/src/interfaces/hooks.ts +0 -24
package/src/interfaces/sandbox-provider.ts +0 -29
package/src/interfaces/session-store.ts +0 -48
package/src/interfaces/tool-provider.ts +0 -70
package/src/loop/bridge.ts +0 -363
package/src/loop/context-store.ts +0 -207
package/src/loop/lcm-tool-loop.ts +0 -163
package/src/loop/vercel-agent-loop.ts +0 -279
package/src/observability/context.ts +0 -17
package/src/observability/metrics.ts +0 -27
package/src/observability/otel.ts +0 -105
package/src/observability/tracing.ts +0 -13
package/src/optimization/agent-evaluator.ts +0 -40
package/src/optimization/config-serializer.ts +0 -16
package/src/optimization/optimization-runner.ts +0 -39
package/src/optimization/trace-collector.ts +0 -33
package/src/permissions/permission-manager.ts +0 -34
package/src/providers/composite-tool-provider.ts +0 -72
package/src/providers/control-plane-e2b-executor.ts +0 -218
package/src/providers/e2b-tool-provider.ts +0 -68
package/src/providers/local-tool-provider.ts +0 -190
package/src/providers/skill-sandbox-provider.ts +0 -46
package/src/sessions/file-session-store.ts +0 -61
package/src/sessions/in-memory-session-store.ts +0 -39
package/src/sessions/session-manager.ts +0 -44
package/src/skills/skill-loader.ts +0 -52
package/src/skills/skill-manager.ts +0 -175
package/src/skills/skill-router.ts +0 -99
package/src/skills/skill-types.ts +0 -26
package/src/subagents/subagent-manager.ts +0 -22
package/src/subagents/task-tool.ts +0 -13
package/tests/integration/agent-loop-basic.spec.ts +0 -56
package/tests/integration/agent-skill-default-from-sandbox.spec.ts +0 -66
package/tests/integration/concurrency-single-turn.spec.ts +0 -35
package/tests/integration/otel-metrics-emission.spec.ts +0 -62
package/tests/integration/otel-trace-propagation.spec.ts +0 -48
package/tests/integration/parity-benchmark.spec.ts +0 -45
package/tests/integration/provider-local-smoke.spec.ts +0 -63
package/tests/integration/session-resume.spec.ts +0 -30
package/tests/integration/skill-install-rollback.spec.ts +0 -64
package/tests/integration/skill-sandbox-file-blob.spec.ts +0 -54
package/tests/integration/skills-progressive-disclosure.spec.ts +0 -61
package/tests/integration/streaming-compaction-boundary.spec.ts +0 -43
package/tests/integration/structured-messages-agent.spec.ts +0 -265
package/tests/integration/subagent-isolation.spec.ts +0 -24
package/tests/security/skill-sandbox-isolation.spec.ts +0 -51
package/tests/unit/create-tools-schema-parity.spec.ts +0 -22
package/tests/unit/extracted-manifest.spec.ts +0 -41
package/tests/unit/interfaces-contract.spec.ts +0 -101
package/tests/unit/structured-messages.spec.ts +0 -176
package/tests/unit/token-tracker.spec.ts +0 -22
package/tsconfig.json +0 -14
package/vitest.config.ts +0 -7

package/dist/arc/index.d.ts ADDED Viewed

@@ -0,0 +1,1107 @@
+import { A as AnyTool, T as ToolProvider, a as ToolResult, M as ModelFactory, b as ToolResultArtifact } from '../shared-types-vZuVoy_H.js';
+export { c as ActionType, B as BashOptions, d as BatchOp, e as BatchResult, G as GlobOptions, f as GrepOptions, R as ReadOptions, g as TextEditorRequest, h as ThreadStatus, i as ToolProviderCapabilities, W as WebFetchOptions } from '../shared-types-vZuVoy_H.js';
+import { HarnessTelemetry } from '../observability/otel.js';
+import 'ai';
+/** Long-running job orchestration primitives. Generic; no coding-agent assumptions. */
+type JobKind = "local" | "remote"; // Same two literals that discriminate JobTransport.kind.
+/** Where a job runs. Discriminated on `kind`: only the "remote" variant carries `host` (required) plus optional `user` and `keyPath`, so remote-only fields never exist on local transports. */
+type JobTransport = {
+    kind: "local";
+} | {
+    kind: "remote";
+    host: string;
+    user?: string | undefined;
+    keyPath?: string | undefined;
+};
+interface JobSpec { // Describes one job: id, label, command, optional cwd/env, transport, start time and optional origin.
+    id: string;
+    label: string;
+    command: string;
+    cwd?: string | undefined;
+    env?: Record<string, string> | undefined;
+    transport: JobTransport;
+    startedAt: number; // NOTE(review): presumably an epoch timestamp; the unit is not visible here — confirm.
+    startedBy?: { // Optional origin of the job: a tuple id and/or a turn number.
+        tupleId?: string | undefined;
+        turn?: number | undefined;
+    } | undefined;
+}
+type JobState = "running" | "exited" | "failed" | "killed" | "unknown"; // Values reported on JobStatus.state.
+interface JobStatus { // Status record for a job: its spec, current state, process ids, timing fields and output fields.
+    spec: JobSpec;
+    state: JobState;
+    /** Local supervisor PID. */
+    pid?: number | undefined;
+    /** Remote parent PID (only set when transport.kind === "remote"). */
+    remotePid?: number | undefined;
+    exitCode?: number | undefined;
+    /** Mirrors spec.startedAt; kept on the status for convenience when reading status without spec unpacking. */
+    startedAt: number;
+    endedAt?: number | undefined;
+    lastSeenAliveAt: number;
+    tailLines: string[]; // NOTE(review): presumably the most recent output lines (cf. JobRegistry.tail) — confirm.
+    bytesWritten: number; // NOTE(review): presumably total output bytes captured so far — confirm.
+}
+type JobEvent = { // Discriminated on `type`. "job_output" carries only the job id, a chunk and `at`; every other variant carries a full JobStatus.
+    type: "job_started";
+    status: JobStatus;
+} | {
+    type: "job_output";
+    id: string;
+    chunk: string;
+    at: number;
+} | {
+    type: "job_exited";
+    status: JobStatus;
+} | {
+    type: "job_failed";
+    status: JobStatus;
+    error: string;
+} | {
+    type: "job_killed";
+    status: JobStatus;
+    reason: string;
+};
+interface JobStartOptions { // Input to JobRegistry.start(); unlike JobSpec, `transport` is optional and there is no `id` or `startedAt`.
+    label: string;
+    command: string;
+    transport?: JobTransport | undefined;
+    cwd?: string | undefined;
+    env?: Record<string, string> | undefined;
+}
+interface JobRegistry { // Contract for starting, inspecting, cancelling and observing jobs. Every method returns a Promise except subscribe() and snapshot().
+    start(opts: JobStartOptions, startedBy?: JobSpec["startedBy"]): Promise<JobStatus>;
+    check(id: string): Promise<JobStatus | null>; // NOTE(review): null presumably means the id is unknown — confirm.
+    cancel(id: string, signal?: "TERM" | "KILL"): Promise<JobStatus | null>;
+    list(): Promise<JobStatus[]>;
+    tail(id: string, lines?: number): Promise<string[]>;
+    waitFor(id: string, signal?: AbortSignal): Promise<JobStatus>;
+    subscribe(handler: (e: JobEvent) => void): () => void; // NOTE(review): the returned function is presumably the unsubscribe callback — confirm.
+    /** Cheap synchronous snapshot — suitable for orchestrator context each turn. */
+    snapshot(): JobStatus[];
+    /** Remove completed/killed/failed jobs older than `olderThanMs` (default 24h). Returns count removed. NOTE(review): JobState has no "completed" member; presumably "exited" is meant — confirm. */
+    prune(olderThanMs?: number): Promise<number>;
+}
+interface ToolCallInfo { // One tool call: its id, the tool name and the argument record.
+    toolCallId: string;
+    toolName: string;
+    args: Record<string, unknown>;
+    /** Provider-specific metadata preserved across round-trips (e.g., Gemini thought signatures). */
+    providerMetadata?: Record<string, unknown>;
+}
+interface ToolResultInfo { // Result of one tool call; carries the same toolCallId/toolName fields as ToolCallInfo.
+    toolCallId: string;
+    toolName: string;
+    result: string; // The result is always carried as a string.
+    isError?: boolean;
+    durationMs?: number;
+}
+type ContentPart = { // Discriminated on `type`: a text part, or an image part holding binary data plus a MIME type string.
+    type: "text";
+    text: string;
+} | {
+    type: "image";
+    image: Buffer | Uint8Array;
+    mimeType: string;
+};
+interface AgentMessage { // A message: role, string or multi-part content, and optional tool calls/results.
+    role: "system" | "user" | "assistant" | "tool";
+    content: string | ContentPart[];
+    toolCalls?: ToolCallInfo[];
+    toolResults?: ToolResultInfo[];
+    /** Provider-specific metadata preserved across round-trips (e.g., Gemini thought signatures). */
+    providerMetadata?: Record<string, unknown>;
+}
+/**
+ * Tool registry: the Tool contract and schema extraction.
+ *
+ * Agent tool definitions (Bash, Read, Write, etc.) live in the consumer
+ * (truecode). The harness only provides the Tool contract and helpers.
+ */
+type ToolExecutionMode = "serial" | "parallel"; // Values given directly, or returned per call, by Tool.executionMode.
+/** A registered tool: schema for the model, execute for the worker. Only `name` is required; every other member is optional. */
+interface Tool {
+    name: string;
+    /** AI SDK tool schema. Optional for ARC-internal tools (ReadEpisode, LCM_*, ScratchPad_*). */
+    schema?: AnyTool | undefined;
+    /** Worker execution mode for batched tool calls: either a fixed mode or a function choosing the mode from the call's args. Defaults to serial. */
+    executionMode?: ToolExecutionMode | ((args: Record<string, unknown>) => ToolExecutionMode);
+    /** Execute using the ToolProvider. If not set, tool is handled externally (e.g. ARC tools). */
+    execute?: (provider: ToolProvider, args: Record<string, unknown>, workDir: string) => Promise<ToolResult>;
+    /**
+     * When true, this tool may yield the worker loop if the operation is incomplete.
+     * After execution, the worker checks if the target thread is still running.
+     * If it is and `waitForThread` is available on the ToolProvider, the worker
+     * suspends (does not count a step) until the thread completes.
+     * The tool args must include a `threadId` field for the worker to track.
+     */
+    yieldsOnIncomplete?: boolean | undefined;
+}
+/**
+ * Serialized attachment form suitable for JSON persistence. Unlike the in-flight
+ * `ContentPart` (which carries a `Buffer`), the stored form keeps image bytes
+ * base64-encoded so messages round-trip cleanly through session snapshots.
+ * Converted to a real `ContentPart` only when building AgentMessage[] for the model.
+ */
+interface StoredAttachment {
+    type: "image"; // Only image attachments are representable in this form.
+    imageBase64: string; // Image bytes, base64-encoded.
+    mimeType: string;
+}
+interface StoredMessage { // Persisted message form: `content` is always a string and `role` has no "system" member (compare AgentMessage).
+    id: string;
+    conversationId: string;
+    index: number; // NOTE(review): presumably the position within its conversation (cf. MessageStore.getMessage) — confirm.
+    role: "user" | "assistant" | "tool";
+    content: string;
+    toolCalls?: ToolCallInfo[];
+    toolResults?: ToolResultInfo[];
+    /** Multimodal image attachments. Persisted as base64; converted to ContentPart[] at model-call time. */
+    attachments?: StoredAttachment[];
+    timestamp: number;
+}
+interface GrepResult { // One match returned by MessageStore.grep: which message matched, plus excerpt and context strings.
+    messageId: string;
+    conversationId: string;
+    messageIndex: number;
+    excerpt: string;
+    matchContext: string;
+}
+interface MessageStore { // Synchronous message-storage contract: append, lookup, pattern search, and (de)serialization.
+    append(message: StoredMessage): void;
+    getConversation(conversationId: string): StoredMessage[];
+    getMessage(conversationId: string, index: number): StoredMessage | null;
+    grep(pattern: string, opts?: { // NOTE(review): whether `pattern` is a regex or a plain substring is not visible here — confirm.
+        conversationId?: string;
+        maxResults?: number;
+    }): GrepResult[];
+    /** Serialize all messages for session persistence. */
+    serialize(): StoredMessage[];
+    /** Load serialized messages into this store (for session hydration). */
+    loadFrom(messages: StoredMessage[]): void;
+}
+declare class MemoryMessageStore implements MessageStore { // MessageStore implementation; only the declaration is visible here, not the method bodies.
+    private messages;
+    private byConversation;
+    append(message: StoredMessage): void;
+    getConversation(conversationId: string): StoredMessage[];
+    getMessage(conversationId: string, index: number): StoredMessage | null;
+    serialize(): StoredMessage[];
+    loadFrom(messages: StoredMessage[]): void;
+    static hydrate(messages: StoredMessage[]): MemoryMessageStore; // Static factory: takes serialized messages and returns a store instance.
+    grep(pattern: string, opts?: {
+        conversationId?: string;
+        maxResults?: number;
+    }): GrepResult[];
+}
+interface SummaryNode { // One node handled by SummaryDAG: summary text, source ids, depth and a token count.
+    id: string;
+    depth: number; // NOTE(review): presumably 0 for leaves and higher for compacted parents — confirm.
+    sourceIds: string[];
+    sourceConversationIds: string[];
+    summary: string;
+    artifacts: string[];
+    operations: string[];
+    outcome: string;
+    tokenCount: number;
+    createdAt: number;
+}
+interface CompactionOpts { // Options for SummaryDAG.compact(); both thresholds are optional.
+    /** Minimum number of uncovered children before compaction triggers (default: 4) */
+    minChildren?: number;
+    /** Soft token budget — compact when total tokens at a depth exceed this (default: 8000) */
+    softTokenBudget?: number;
+}
+interface SummaryDAG { // Synchronous contract over SummaryNode values: add leaves, compact, query nodes/lineage/frontier, (de)serialize.
+    addLeaf(node: SummaryNode): void;
+    compact(opts?: CompactionOpts): SummaryNode[]; // NOTE(review): presumably returns the nodes created by this compaction — confirm.
+    getNode(id: string): SummaryNode | null;
+    getLineage(id: string, visited?: Set<string>): string[];
+    getFrontier(budget: number): { // NOTE(review): `budget` is presumably a token budget — confirm.
+        frontier: SummaryNode[];
+        coveredIds: Set<string>;
+    };
+    getAllNodes(): SummaryNode[];
+    /** Serialize DAG state for session persistence. */
+    serialize(): {
+        nodes: SummaryNode[];
+        coveredBy: [string, string][]; // NOTE(review): the meaning/order of each id pair is not visible here — confirm.
+    };
+    /** Load serialized DAG state into this instance (for session hydration). */
+    loadFrom(data: {
+        nodes: SummaryNode[];
+        coveredBy: [string, string][];
+    }): void;
+}
+declare class MemorySummaryDAG implements SummaryDAG { // SummaryDAG implementation; only the declaration is visible here, not the method bodies.
+    private nodes;
+    /** Tracks which source IDs have been covered by a parent node */
+    private coveredBy;
+    serialize(): {
+        nodes: SummaryNode[];
+        coveredBy: [string, string][];
+    };
+    loadFrom(data: {
+        nodes: SummaryNode[];
+        coveredBy: [string, string][];
+    }): void;
+    static hydrate(data: { // Static factory: accepts the same shape that serialize() returns.
+        nodes: SummaryNode[];
+        coveredBy: [string, string][];
+    }): MemorySummaryDAG;
+    addLeaf(node: SummaryNode): void;
+    compact(opts?: CompactionOpts): SummaryNode[];
+    getNode(id: string): SummaryNode | null;
+    getLineage(id: string, visited?: Set<string>): string[];
+    getFrontier(budget: number): {
+        frontier: SummaryNode[];
+        coveredIds: Set<string>;
+    };
+    getAllNodes(): SummaryNode[];
+}
+interface GhostCue { // Reference to a summary (summaryId, depth) together with conversation ids and a label.
+    summaryId: string; // NOTE(review): presumably a SummaryNode.id — confirm.
+    conversationIds: string[];
+    depth: number;
+    label: string;
+}
+interface AssembledContext { // Assembled context: messages, ghost cues and a token estimate, plus two optional text sections.
+    messages: AgentMessage[];
+    ghostCues: GhostCue[];
+    tokenEstimate: number;
+    /** Structured sections for downstream consumers (avoids string matching) */
+    frontierText?: string;
+    ghostCueText?: string;
+}
+type HookEventName = 'PreToolUse' | 'PostToolUse' | 'BeforeWorker' | 'AfterWorker'; // Event names usable as HookContext.event.
+interface HookContext { // Payload handed to a HookCallback; only `event` is required.
+    event: HookEventName;
+    toolName?: string;
+    input?: Record<string, unknown>;
+    output?: ToolResult;
+    metadata?: Record<string, unknown>;
+}
+interface HookDecision { // A hook's verdict: an `allow` flag plus an optional reason.
+    allow: boolean;
+    reason?: string;
+}
+type HookCallback = (context: HookContext) => Promise<HookDecision | void>; // May resolve to a decision or to nothing.
+declare class HookRunner { // register() attaches a callback to an event name; run() takes a context and resolves to one HookDecision.
+    private readonly hooks;
+    register(event: HookContext['event'], callback: HookCallback): void;
+    run(context: HookContext): Promise<HookDecision>; // NOTE(review): how multiple callbacks' decisions are combined is not visible here — confirm.
+}
+/** Raw worker transcript, append-only storage */
+interface Transcript {
+    id: string;
+    tupleId: string; // NOTE(review): presumably the id of the Tuple whose worker produced this transcript — confirm.
+    instruction: string;
+    messages: AgentMessage[];
+    timestamp: number;
+}
+/** Artifact produced by a worker dispatch */
+interface Artifact {
+    id: string;
+    tupleId: string;
+    /** File path or returned value */
+    output: string | null;
+    /** Full textual worker result, preserved even when expected file artifacts are missing */
+    textOutput?: string | undefined;
+    status: "complete" | "incomplete" | "failed" | "interrupted"; // Same four literals as WorkerResult.status.
+    /** One-line summary from worker's final message */
+    summary: string;
+    stepsUsed: number;
+    /** Tool calls with results (for orchestrator reasoning) */
+    actions?: string[];
+    /** The dispatch instruction that produced this artifact */
+    instruction?: string;
+}
+interface ExpectedArtifact { // One entry of ExpectedOutputContract.artifacts: a type tag with optional path and description.
+    type: "file" | "directory" | "value" | "unknown";
+    path?: string | undefined;
+    description?: string | undefined;
+}
+interface ExpectedOutputContract { // Type of Tuple.expectedOutput; only `artifacts` is required.
+    artifacts: ExpectedArtifact[];
+    successCriteria?: string[] | undefined;
+    verification?: string | undefined;
+    description?: string | undefined;
+}
+/** Worker model tier for dispatch routing. */
+type DispatchTier = "fast" | "medium" | "strong"; // Also the key type of ArcConfig.workerModelMap and ArcConfig.workerStepBudgets.
+/** Worker instruction tuple */
+interface Tuple {
+    id: string;
+    instruction: string;
+    /** Artifact IDs to provide as input */
+    inputs: string[];
+    /** Structured contract for what the worker should produce */
+    expectedOutput: ExpectedOutputContract;
+    /** Tool names available to worker */
+    tools: string[];
+    /** Step budget */
+    steps: number;
+    /** Worker model tier. When omitted, the dispatch uses the default step budget and the strong worker model. */
+    tier?: DispatchTier | undefined;
+    /** Semantic role label for this worker (e.g. "Debugger", "Researcher", "Sysadmin").
+     *  Shown in the TUI instead of the generic tier name to give the user a clear
+     *  mental model of what the worker is doing. */
+    role?: string | undefined;
+    /** Public orchestrator rationale that preceded this dispatch */
+    orchestratorContext?: string | undefined;
+    /** Prior tuple this dispatch is continuing from, when ARC resumes internally. */
+    continuationOf?: string | undefined;
+    /** Why ARC created this continuation dispatch. Same two literals as the `reason` of the "worker_continuation" ArcEvent. */
+    continuationReason?: "step_budget" | "user_steering" | undefined;
+    /** Compact user-facing checkpoint summary for continuation UI. */
+    continuationSummary?: string | undefined;
+}
+interface DispatchRecord { // Record of one dispatch: the tuple, its artifact, a transcript reference, progress events and a completion time.
+    tuple: Tuple;
+    artifact: Artifact;
+    /** Reference to transcript in TranscriptStore — NOT the full transcript body. */
+    transcriptId: string;
+    progress: WorkerProgressEvent[];
+    completedAt: number;
+    /** Worker execution result (artifacts, actions, status) */
+    workerResult?: WorkerResult | undefined;
+}
+interface OodaSnapshot { // Type of OrchestratorContext.ooda: four string lists plus a block of counters.
+    observations: string[];
+    beliefs: string[];
+    disprovenApproaches: string[];
+    blockers: string[];
+    decisionPressure: { // Fields with the same names also appear directly on OrchestratorContext.
+        turn: number;
+        maxTurns: number;
+        turnsRemaining: number;
+        dispatchCount: number;
+        allIncomplete: boolean;
+    };
+}
+type ReadEpisodeDetail = "summary" | "trace" | "artifacts"; // Used by ReadEpisodeArgs.detail and by the "read_episode" ArcEvent.
+interface ReadEpisodeArgs { // Arguments for reading an episode; only `id` is required.
+    id: string;
+    detail?: ReadEpisodeDetail | undefined;
+    artifactKey?: string | undefined;
+    maxTokens?: number | undefined;
+}
+interface TraceToolCall { // Tool call as recorded in orchestrator trace events; unlike ToolCallInfo, `toolCallId` is optional.
+    toolName: string;
+    toolCallId?: string | undefined;
+    args: Record<string, unknown>;
+}
+type ArcTraceEvent = { // Discriminated on `scope` + `phase`. Orchestrator variants carry `turn`; worker variants carry `tupleId` and, except "worker_result", `step`.
+    scope: "orchestrator";
+    phase: "context_assembled";
+    turn: number;
+    totalChars: number;
+    estimatedTokens: number;
+    sections: Record<string, { // Per-section size figures, keyed by a string (presumably the section name — confirm).
+        chars: number;
+        estimatedTokens: number;
+    }>;
+} | {
+    scope: "orchestrator";
+    phase: "model_input";
+    turn: number;
+    model: string;
+    system: string;
+    /** Full AgentMessage context before SDK conversion. */
+    messages: AgentMessage[];
+    /** Full SDK-facing messages after conversion. */
+    modelMessages: unknown[];
+    toolNames: string[];
+} | {
+    scope: "orchestrator";
+    phase: "model_output";
+    turn: number;
+    text: string;
+    toolCalls: TraceToolCall[];
+} | {
+    scope: "orchestrator";
+    phase: "public_rationale_missing";
+    turn: number;
+    toolCalls: TraceToolCall[];
+} | {
+    scope: "orchestrator";
+    phase: "tool_call";
+    turn: number;
+    toolName: string;
+    args: Record<string, unknown>;
+} | {
+    scope: "orchestrator";
+    phase: "tool_result";
+    turn: number;
+    toolName: string;
+    args: Record<string, unknown>;
+    result: unknown;
+} | {
+    scope: "worker";
+    phase: "model_input";
+    tupleId: string;
+    step: number;
+    model: string;
+    system: string;
+    messages: AgentMessage[];
+    toolNames: string[];
+} | {
+    scope: "worker";
+    phase: "model_output";
+    tupleId: string;
+    step: number;
+    action: unknown;
+} | {
+    scope: "worker";
+    phase: "public_rationale_missing";
+    tupleId: string;
+    step: number;
+    toolNames: string[];
+} | {
+    scope: "worker";
+    phase: "textual_tool_call_rescued";
+    tupleId: string;
+    step: number;
+    toolNames: string[];
+} | {
+    scope: "worker";
+    phase: "tool_call";
+    tupleId: string;
+    step: number;
+    toolCallId: string;
+    toolName: string;
+    args: Record<string, unknown>;
+} | {
+    scope: "worker";
+    phase: "tool_result";
+    tupleId: string;
+    step: number;
+    toolCallId: string;
+    toolName: string;
+    result: unknown;
+    resultText: string;
+} | {
+    scope: "worker";
+    phase: "worker_result";
+    tupleId: string;
+    result: unknown;
+};
+interface TranscriptStore { // Async storage contract for Transcript records: append, fetch all, fetch by id (null when nothing is returned for that id).
+    append(transcript: Transcript): Promise<void>;
+    getAll(): Promise<Transcript[]>;
+    get(id: string): Promise<Transcript | null>;
+}
+interface VectorIndex { // Async text index contract: add, search, load/save and size.
+    add(id: string, text: string): Promise<void>;
+    search(query: string, k: number): Promise<string[]>; // NOTE(review): presumably resolves to up to `k` document ids — confirm.
+    load(): Promise<void>;
+    save(): Promise<void>;
+    /** Number of documents currently indexed. Used to detect empty index on session resume. */
+    size(): Promise<number>;
+}
+interface ArtifactStore { // Async storage contract for Artifact values addressed by a string id.
+    set(id: string, artifact: Artifact): Promise<void>;
+    get(id: string): Promise<Artifact | null>;
+    getAll(): Promise<Record<string, Artifact>>; // NOTE(review): the record is presumably keyed by artifact id — confirm.
+}
+interface ScratchPad { // Async string key/value contract: write, read, list and clear.
+    write(key: string, content: string): Promise<void>;
+    read(key: string): Promise<string | null>;
+    list(): Promise<string[]>; // NOTE(review): presumably resolves to the stored keys — confirm.
+    clear(): Promise<void>;
+}
+/** Serialized session state — everything needed to hydrate an ArcLoop. */
+interface SessionSnapshot {
+    messages: StoredMessage[];
+    dispatches: DispatchRecord[];
+    dagNodes: SummaryNode[]; // Same element type as the `nodes` member returned by SummaryDAG.serialize().
+    dagCoveredBy: [string, string][]; // Same shape as the `coveredBy` member returned by SummaryDAG.serialize().
+    turn: number;
+    dispatchCount: number;
+    orchestratorMessageIndex: number;
+}
+/** Lightweight session metadata for listing/picking. */
+interface SessionMeta {
+    id: string;
+    slug: string;
+    createdAt: number;
+    lastActiveAt: number;
+    taskCount?: number; // The only optional member of this interface.
+    summary: string;
+}
+interface SessionStore { // Async persistence contract: snapshots and metadata are loaded/saved separately by session id; list() resolves to metadata only.
+    load(id: string): Promise<SessionSnapshot | null>;
+    save(id: string, snapshot: SessionSnapshot): Promise<void>;
+    getMeta(id: string): Promise<SessionMeta | null>;
+    saveMeta(id: string, meta: SessionMeta): Promise<void>;
+    list(): Promise<SessionMeta[]>;
+}
+/** What the orchestrator sees each turn */
+interface OrchestratorContext {
+    task: string;
+    artifacts: Record<string, Artifact>; // NOTE(review): presumably keyed by artifact id — confirm.
+    lastResult: Artifact | null;
+    /** Rolling window of recent orchestrator messages */
+    recentTurns: AgentMessage[];
+    /** Current turn number */
+    turn: number;
+    /** Max turns allowed */
+    maxTurns: number;
+    /** Turns remaining after the current turn */
+    turnsRemaining: number;
+    /** Number of dispatches so far */
+    dispatchCount: number;
+    /** Artifact status counts across all completed dispatches */
+    artifactStatusCounts: Record<Artifact["status"], number>;
+    /** True when no dispatch artifact has reached complete status */
+    allIncomplete: boolean;
+    /** Completed dispatches in chronological order */
+    dispatches: DispatchRecord[];
+    /** Current observe/orient state rendered into the orchestrator prompt */
+    ooda: OodaSnapshot;
+    /** LCM message store (all conversations) */
+    messageStore?: MessageStore | undefined;
+    /** LCM summary DAG */
+    summaryDAG?: SummaryDAG | undefined;
+}
+interface ArcConfig { // Configuration object; required members are task, workDir, model, workerModel and toolProvider.
+    task: string;
+    /**
+     * Image attachments to inject alongside the initial task when the orchestrator
+     * model is multimodal. Subsequent task attachments flow through pushTask instead.
+     */
+    initialAttachments?: StoredAttachment[] | undefined;
+    workDir: string;
+    /** Model ID for the orchestrator */
+    model: string;
+    /** Model ID for workers */
+    workerModel: string;
+    /** Optional per-tier worker model overrides. Falls back to workerModel when a tier is missing. */
+    workerModelMap?: Partial<Record<DispatchTier, string>> | undefined;
+    /** Optional per-tier worker step budgets. Falls back to ARC defaults when unset. */
+    workerStepBudgets?: Partial<Record<DispatchTier, number>> | undefined;
+    /** Optional cheap model for post-dispatch completion gating. Falls back to workerModelMap.fast, then workerModel. */
+    doneGateModel?: string | undefined;
+    createModel?: ModelFactory; // Optional model factory; the ModelFactory type is imported from the shared-types module.
+    toolProvider: ToolProvider;
+    /** Agent-provided tool definitions (Bash, Read, Write, etc.) with schemas, execute, and artifact metadata. Harness adds ARC framework tools internally. */
+    tools?: Map<string, Tool> | undefined;
+    /** Max orchestrator turns before stopping (default: 12) */
+    maxTurns?: number;
+    /** Max steps per untiered worker (default: 30). Explicit tiers use workerStepBudgets/default tier budgets. */
+    maxStepsPerWorker?: number;
+    /** Rolling window size for orchestrator context (default: 10) */
+    orchestratorWindowSize?: number;
+    /** Directory where agent memory lives (default: workDir/.arc) */
+    memDir?: string;
+    /** Injected vector index (default: in-memory for tests) */
+    vectorIndex?: VectorIndex;
+    /** Injected scratch pad for inter-worker note sharing (default: in-memory for tests) */
+    scratchPad?: ScratchPad;
+    /** Injected transcript store (default: in-memory) */
+    transcriptStore?: TranscriptStore;
+    /** Injected artifact store (default: in-memory) */
+    artifactStore?: ArtifactStore;
+    /** Custom orchestrator system prompt (appended to default) */
+    orchestratorSystemPromptSuffix?: string | undefined;
+    /** Custom worker system prompt (appended to default) */
+    workerSystemPromptSuffix?: string | undefined;
+    /** Custom messages after the core task/budget block */
+    formatOrchestratorContext?: ((context: OrchestratorContext) => AgentMessage[]) | undefined;
+    /** Provider options passed to generateText (e.g. reasoningEffort for OpenAI). */
+    providerOptions?: Record<string, unknown> | undefined;
+    /** Optional hook runner for PreToolUse/PostToolUse/BeforeWorker/AfterWorker events */
+    hookRunner?: HookRunner | undefined;
+    /** Optional telemetry collector for profiling spans and metrics. */
+    telemetry?: HarnessTelemetry | undefined;
+    /** Callback for AskUser orchestrator tool. If provided, AskUser is available to the orchestrator. */
+    askUser?: ((question: string, options?: string[]) => Promise<string>) | undefined;
+    /** Session store for persistence across restarts. */
+    sessionStore?: SessionStore | undefined;
+    /** Session ID to resume. If provided with sessionStore, loop hydrates from saved state. */
+    sessionId?: string | undefined;
+    /** Job registry for long-running process orchestration. Default: MemoryJobRegistry. */
+    jobRegistry?: JobRegistry | undefined;
+    /** Per model-call timeout in milliseconds. Applied to both orchestrator and worker generateText. Default: 180000 (3 min). */
+    modelCallTimeoutMs?: number | undefined;
+}
+type ArcEvent = { // Discriminated on `type`. "trace" wraps an ArcTraceEvent, "job_event" wraps a JobEvent, "worker_progress" wraps a WorkerProgressEvent.
+    type: "orchestrator_turn";
+    turn: number;
+    contextTokens: number;
+} | {
+    type: "trace";
+    trace: ArcTraceEvent;
+} | {
+    type: "dispatch";
+    tupleId: string;
+    instruction: string;
+} | {
+    type: "dispatch_full";
+    tuple: Tuple;
+} | {
+    type: "worker_continuation";
+    tupleId: string;
+    fromTupleId: string;
+    reason: "step_budget" | "user_steering"; // Same two literals as Tuple.continuationReason.
+    summary: string;
+} | {
+    type: "worker_progress";
+    tupleId: string;
+    progress: WorkerProgressEvent;
+} | {
+    type: "worker_complete";
+    tupleId: string;
+    status: Artifact["status"];
+    summary: string;
+    stepsUsed: number;
+    actions?: string[] | undefined;
+} | {
+    type: "recall";
+    query: string;
+    answer: string;
+} | {
+    type: "read_episode";
+    id: string;
+    detail: ReadEpisodeDetail;
+    output: string;
+} | {
+    type: "ask_user";
+    question: string;
+    options?: string[] | undefined;
+} | {
+    type: "interrupt_status";
+    summary: string;
+} | {
+    type: "orchestrator_usage";
+    turn: number;
+    inputTokens?: number;
+    outputTokens?: number;
+} | {
+    type: "done";
+    output: string;
+} | {
+    type: "session_saved";
+    sessionId: string;
+} | {
+    type: "text_delta";
+    text: string;
+} | {
+    type: "reasoning_delta";
+    text: string;
+} | {
+    type: "job_event";
+    event: JobEvent;
+} | {
+    type: "interjection_queued";
+    position: number;
+    text: string;
+} | {
+    type: "interjection_delivered";
+    position: number;
+    turn: number;
+};
+type WorkerProgressEvent = { // Discriminated on `kind`. Every variant except "worker_result" carries `step`.
+    kind: "model_start";
+    step: number;
+    maxSteps: number;
+} | {
+    kind: "model_complete";
+    step: number;
+    actionType: "final" | "tool" | "tool_batch";
+    durationMs: number;
+    toolNames?: string[] | undefined;
+    publicRationale?: string | undefined;
+    missingPublicRationale?: boolean | undefined;
+    outputSummary?: string | undefined;
+    inputTokens?: number | undefined;
+    outputTokens?: number | undefined;
+} | {
+    kind: "model_error";
+    step: number;
+    durationMs: number;
+    error: string;
+} | {
+    kind: "tool_start";
+    step: number;
+    toolCallId: string;
+    toolName: string;
+    argsSummary?: string | undefined;
+} | {
+    kind: "tool_complete";
+    step: number;
+    toolCallId: string;
+    toolName: string;
+    success: boolean;
+    durationMs: number;
+    outputSummary: string;
+    output?: string | undefined;
+    artifact?: ToolResultArtifact | undefined;
+    exitCode?: unknown; // Typed as unknown, so consumers must narrow before treating it as a number.
+    metadata?: Record<string, unknown> | undefined;
+} | {
+    kind: "tool_error";
+    step: number;
+    toolCallId: string;
+    toolName: string;
+    durationMs: number;
+    error: string;
+} | {
+    kind: "worker_result";
+    status: "complete" | "incomplete" | "failed" | "interrupted"; // Same four literals as Artifact.status.
+    stepsUsed: number;
+    summary: string;
+} | {
+    kind: "yield_start";
+    step: number;
+    toolCallId: string;
+    toolName: string;
+    threadId: string;
+} | {
+    kind: "yield_resume";
+    step: number;
+    toolCallId: string;
+    toolName: string;
+    threadId: string;
+};
+interface RunWorkerConfig { // Configuration for one worker run; required members are instruction, inputArtifacts, tools, toolRegistry, maxSteps, toolProvider, createModel, model and workDir.
+    /** Original top-level task */
+    task?: string | undefined;
+    instruction: string;
+    /** Structured contract for this dispatch */
+    expectedOutput?: ExpectedOutputContract | undefined;
+    /** LCM-assembled context for this worker */
+    lcmContext?: AssembledContext | undefined;
+    /** Artifact ID -> file content */
+    inputArtifacts: Map<string, string>;
+    tools: Record<string, AnyTool>; // NOTE(review): presumably keyed by tool name — confirm.
+    /** Tool registry with execute/artifact metadata for dispatch and episode projection */
+    toolRegistry: Map<string, Tool>;
+    maxSteps: number;
+    toolProvider: ToolProvider;
+    createModel: ModelFactory; // Required here, whereas ArcConfig.createModel is optional.
+    model: string;
+    workDir: string;
+    signal?: AbortSignal | undefined;
+    /** Extra text prefixed to worker system prompt */
+    systemPromptPrefix?: string | undefined;
+    /** Semantic role label for TUI display (e.g. "Debugger", "Researcher"). */
+    role?: string | undefined;
+    /** Extra text appended to worker system prompt */
+    systemPromptSuffix?: string | undefined;
+    /** Provider options passed to generateText (e.g. reasoning config). */
+    providerOptions?: Record<string, unknown> | undefined;
+    /** Public orchestrator rationale that preceded this dispatch */
+    orchestratorContext?: string | undefined;
+    /** Tuple id for full-fidelity trace events */
+    tupleId?: string | undefined;
+    /** Optional diagnostic hook for streaming worker internals to the caller */
+    onProgress?: ((event: WorkerProgressEvent) => void) | undefined;
+    /** Optional full-fidelity trace hook for raw model/tool IO */
+    onTrace?: ((event: ArcTraceEvent) => void) | undefined;
+    /** Optional hook runner for PreToolUse/PostToolUse events */
+    hookRunner?: HookRunner | undefined;
+    /** Optional telemetry collector for profiling spans and metrics. */
+    telemetry?: HarnessTelemetry | undefined;
+    /** Current sub-dispatch depth (0 = top-level worker). Used to enforce max depth. */
+    dispatchDepth?: number | undefined;
+    /** Existing messages to resume from (for continuations). When set, the worker
+     *  appends `instruction` as a user message to these messages instead of building
+     *  a fresh initial prompt. */
+    resumeMessages?: AgentMessage[] | undefined;
+    /** Steps already consumed before this resume (for accurate step counting). */
+    stepsAlreadyUsed?: number | undefined;
+    /** Per model-call timeout in milliseconds. Default: 180000 (3 min). */
+    modelCallTimeoutMs?: number | undefined;
+}
+interface WorkerResult { // Outcome of one worker run.
+    transcript: AgentMessage[];
+    output: string | null; // NOTE(review): presumably null when the worker produced no final output — confirm
+    status: "complete" | "incomplete" | "failed" | "interrupted"; // same four states as the `worker_result` event variant declared earlier in this file
+    stepsUsed: number;
+    /** Last message content for summary */
+    lastMessage: string;
+    /** All tool calls with results for orchestrator visibility */
+    actions: string[];
+    /** Artifacts touched during execution (from ToolResult.artifact) */
+    artifacts: ToolResultArtifact[];
+}
+interface ArcRunResult { // Resolved value of ArcLoop.run().
+    output: string;
+    events: ArcEvent[]; // NOTE(review): presumably the events observed during the run, in order — confirm
+}
+type PushResult = { // Return value of ArcLoop.pushTask(): reports how the pushed message was routed.
+    delivered: "as_task"; // the loop was idle, so the message becomes the next task
+} | {
+    delivered: "as_interjection"; // the loop was running, so the message was queued as a user interjection
+    position: number; // NOTE(review): presumably the message's position in the pending-interjection queue — confirm
+} | {
+    delivered: "dropped"; // the message was not delivered
+    reason: "in_ask_user"; // an askUser prompt is pending; the caller should resolve that promise directly
+};
+interface PushTaskOptions { // Optional second argument to ArcLoop.pushTask().
+    /** Multimodal attachments to attach to the resulting user message. */
+    attachments?: StoredAttachment[];
+}
+declare class ArcLoop { // Orchestration loop: stream() yields ArcEvents, run() drives one task to its first `done` event, pushTask() delivers messages, interrupt() cancels the current turn.
+    private config;
+    private readonly transcriptStore;
+    private readonly vectorIndex;
+    private readonly scratchPad;
+    private readonly artifactStore;
+    private readonly jobRegistry;
+    /** Non-output job events queued for orchestrator turn-boundary injection. */
+    private pendingJobEvents;
+    /** Events that need to flow out of the async generator stream (job events, interjection lifecycle). */
+    private pendingArcEvents;
+    private jobUnsubscribe;
+    private readonly telemetry;
+    private messageStore;
+    private summaryDAG;
+    private readonly createModel;
+    private readonly windowSize;
+    private readonly model;
+    private readonly doneGateModel;
+    /** Full orchestrator system prompt (base + optional suffix). */
+    private readonly orchestratorSystem;
+    /** Orchestrator tool schemas (for the model) */
+    private readonly orchestratorToolSchemas;
+    /** Orchestrator tool registry (for execute) — excludes dispatch/done (control flow) */
+    private readonly orchestratorToolRegistry;
+    /** ARC framework tools that are always available to workers. */
+    private readonly workerArcTools;
+    /** Dispatcher deps + mutable state — shared with dispatcher.ts functions */
+    private readonly dispatchDeps;
+    private readonly dispatchState;
+    private orchestratorMessageIndex;
+    private turn;
+    private maxTurns;
+    private readonly inFlightDispatches;
+    private readonly historySearchesThisTask;
+    private readonly historyReadsThisTask;
+    private readonly historyExpansionsThisTask;
+    private readonly historyExpansionSummaryCache;
+    private lastSessionCheckpointAt;
+    /** Per-turn abort controller — cancelled by interrupt(), refreshed each turn. */
+    private turnController;
+    /** Resolver for the next task — set when the loop is waiting between tasks. */
+    private taskResolve;
+    private pendingInterjections; // NOTE(review): presumably the queue that pushTask() fills while the loop is running — confirm
+    /** Image attachments for the currently active task. Injected into orchestrator prompts. */
+    private currentTaskAttachments;
+    /** Consecutive dispatch rounds where every dispatch ended in failed/incomplete. Forces done at threshold. */
+    private consecutiveFailedDispatchRounds;
+    private askUserPending; // NOTE(review): presumably set while an askUser prompt is outstanding (pushTask() then reports "dropped") — confirm
+    private readonly modelCallTimeoutMs;
+    constructor(config: ArcConfig);
+    /**
+     * Replace agent-provided worker tools for future dispatches.
+     * Already-running workers keep the tool set they started with.
+     */
+    refreshWorkerTools(tools: Map<string, Tool>): void;
+    /** Drain events from asynchronous sources (job registry, interjections) into the generator stream. */
+    private drainPendingArcEvents;
+    private drainPendingJobEvents;
+    private drainPendingInterjections;
+    /** Release subscriptions and free resources held by this loop. */
+    dispose(): void;
+    /**
+     * Interrupt the current turn — cancels in-flight model calls and workers.
+     * The orchestrator loop stays alive and will prompt for user steering.
+     */
+    interrupt(): void;
+    private refreshTurnSignal;
+    /** True when the loop is waiting for the next task (between done boundaries). */
+    get idle(): boolean;
+    /** Serialize current loop state for UI-level checkpoints. */
+    getSessionSnapshot(): SessionSnapshot;
+    /** Restore loop state from a prior UI-level checkpoint. */
+    restoreSessionSnapshot(snapshot: SessionSnapshot | null): void;
+    /**
+     * Deliver a message to the orchestrator regardless of loop state.
+     * - Idle (waiting for next task): resolves waitForNextTask → becomes next task.
+     * - Running: queued as [user interjection], drained at next turn boundary.
+     * - Inside askUser: dropped; caller should resolve the askUser promise directly.
+     *
+     * @param msg The message text to deliver.
+     * @param options Optional extras such as attachments (see PushTaskOptions).
+     * @returns A PushResult whose `delivered` field tells which of the three routes above was taken.
+     */
+    pushTask(msg: string, options?: PushTaskOptions): PushResult;
+    private wrappedAskUser;
+    private waitForNextTask;
+    /** Save session snapshot + update meta if a session store is configured. */
+    private saveSession;
+    private buildSessionSnapshot;
+    private checkpointSession;
+    private checkpointAfterDispatchEvent;
+    private clearCompletedInFlightDispatches;
+    /** Reset per-task state while keeping full conversation history. */
+    private resetForNewTask;
+    /**
+     * Stream events from the orchestration loop.
+     */
+    stream(signal?: AbortSignal): AsyncGenerator<ArcEvent>;
+    /**
+     * Run a single task to completion (for headless/test use).
+     * Breaks after the first `done` event — does not wait for follow-up tasks.
+     *
+     * @returns A promise for an ArcRunResult (an `output` string plus an `events` list).
+     */
+    run(signal?: AbortSignal): Promise<ArcRunResult>;
+    private runDispatchCalls;
+    private continueStepBudgetDispatches;
+    private buildContinuationDispatchArgs;
+    private runDoneGate;
+    private completeCurrentTask;
+    /** Append a message to the LCM message store (single source of truth) */
+    private appendOrchestratorMessage;
+    private findEpisodeRecordBySummaryId;
+    private searchHistoryWithGuardrails;
+    private readHistoryWithGuardrails;
+    private expandHistoryWithGuardrails;
+    private summarizeHistoryExpansion;
+    private buildContext;
+    private buildOrchestratorMessages;
+    private buildTaskContextText;
+    private buildAttachmentMessage;
+    private readEpisode;
+    /**
+     * Handle a turn interrupt without routing every follow-up through the
+     * orchestrator. Status questions are answered from the saved worker record;
+     * steering/continue become an internal worker continuation.
+     */
+    private handleInterrupt;
+    private formatInterruptStatus;
+}
+/**
+ * Episode projection: minimal formatting for orchestrator context.
+ *
+ * The worker collects artifacts and actions during execution.
+ * This module just formats DispatchRecords for the orchestrator prompt.
+ */
+/**
+ * Format a single dispatch record for the orchestrator prompt.
+ *
+ * @param record The dispatch record to render.
+ * @param options Optional formatting controls. NOTE(review): `compact` presumably
+ *   selects a shorter rendering and `maxChars` presumably caps the output length —
+ *   confirm against the implementation.
+ * @returns The formatted text for the prompt.
+ */
+declare function formatDispatchForPrompt(record: DispatchRecord, options?: {
+    compact?: boolean;
+    maxChars?: number;
+}): string;
+declare function cloneForTrace<T>(value: T): T; // Returns a value of the same type as its argument. NOTE(review): presumably a copy that is safe to attach to trace events — confirm against the implementation.
+/** Default budget for dispatches that do not request a tier. */
+declare const DEFAULT_MAX_STEPS_PER_WORKER = 30;
+/** Per-tier initial budgets. Strong is intentionally larger for implementation loops. */
+declare const DEFAULT_WORKER_STEP_BUDGETS: Record<DispatchTier, number>;
+/** Hard ceiling on worker steps after RequestMoreSteps extensions.
+ *  With the values declared here, a worker starting from the default budget (30)
+ *  reaches this ceiling after two extensions of the recommended size (15). */
+declare const ABSOLUTE_MAX_WORKER_STEPS = 60;
+/** Recommended extension size when workers need to keep their current context. */
+declare const REQUEST_MORE_STEPS_INCREMENT = 15;
+/** In-memory transcript store for testing.
+ *  Implements TranscriptStore with `append`, `getAll` and `get`; every method
+ *  returns a promise, and `get` may resolve to null.
+ *  NOTE(review): null presumably means "no transcript with that id" — confirm. */
+declare class MemoryTranscriptStore implements TranscriptStore {
+    private transcripts;
+    private byId;
+    append(transcript: Transcript): Promise<void>;
+    getAll(): Promise<Transcript[]>;
+    get(id: string): Promise<Transcript | null>;
+}
+/** In-memory vector index for testing (no actual embeddings).
+ *  `add` registers a text under an id; `search` takes a query and a count `k`
+ *  and resolves to a list of strings.
+ *  NOTE(review): `search` presumably returns at most `k` entry ids, and `load`/`save`
+ *  presumably exist only to satisfy VectorIndex — confirm against the implementation. */
+declare class MemoryVectorIndex implements VectorIndex {
+    private entries;
+    add(id: string, text: string): Promise<void>;
+    search(query: string, k: number): Promise<string[]>;
+    load(): Promise<void>;
+    save(): Promise<void>;
+    size(): Promise<number>;
+}
+/** In-memory scratch pad for testing.
+ *  String content stored under string keys: `write` and `read` by key, plus `list` and `clear`.
+ *  `read` may resolve to null.
+ *  NOTE(review): null presumably means the key was never written, and `list`
+ *  presumably returns the stored keys — confirm. */
+declare class MemoryScratchPad implements ScratchPad {
+    private entries;
+    write(key: string, content: string): Promise<void>;
+    read(key: string): Promise<string | null>;
+    list(): Promise<string[]>;
+    clear(): Promise<void>;
+}
+/** In-memory artifact store for testing.
+ *  Implements ArtifactStore: `set` stores an Artifact under an id, `get` resolves to
+ *  an Artifact or null, and `getAll` resolves to a record keyed by string.
+ *  NOTE(review): the `getAll` keys are presumably artifact ids, and null from `get`
+ *  presumably means an unknown id — confirm. */
+declare class MemoryArtifactStore implements ArtifactStore {
+    private artifacts;
+    set(id: string, artifact: Artifact): Promise<void>;
+    get(id: string): Promise<Artifact | null>;
+    getAll(): Promise<Record<string, Artifact>>;
+}
+/** In-memory session store for testing.
+ *  Implements SessionStore. Snapshots (`load`/`save`) and metadata (`getMeta`/`saveMeta`)
+ *  are handled by separate method pairs, each keyed by id; `list` resolves to SessionMeta entries.
+ *  `load` and `getMeta` may resolve to null.
+ *  NOTE(review): null presumably means nothing was saved under that id — confirm. */
+declare class MemorySessionStore implements SessionStore {
+    private snapshots;
+    private metas;
+    load(id: string): Promise<SessionSnapshot | null>;
+    save(id: string, snapshot: SessionSnapshot): Promise<void>;
+    getMeta(id: string): Promise<SessionMeta | null>;
+    saveMeta(id: string, meta: SessionMeta): Promise<void>;
+    list(): Promise<SessionMeta[]>;
+}
+/**
+ * File-based transcript store.
+ * Stores transcripts as individual JSON files in a directory.
+ *
+ * NOTE(review): the private `indexPath`, `index`, `loaded` and `ensureLoaded` members
+ * suggest an on-disk index that is loaded lazily on first use — confirm against
+ * the implementation.
+ */
+declare class FsTranscriptStore implements TranscriptStore {
+    private readonly dir;
+    private readonly indexPath;
+    private index;
+    private loaded;
+    constructor(dir: string); // `dir`: the directory that holds the transcript JSON files
+    append(transcript: Transcript): Promise<void>;
+    getAll(): Promise<Transcript[]>;
+    get(id: string): Promise<Transcript | null>;
+    private ensureLoaded;
+}
+/**
+ * File-based artifact store.
+ * Stores artifacts in a single JSON file.
+ *
+ * NOTE(review): the private `loaded`, `ensureLoaded` and `save` members suggest the
+ * file is read lazily on first use and rewritten on changes — confirm against
+ * the implementation.
+ */
+declare class FsArtifactStore implements ArtifactStore {
+    private readonly filePath;
+    private artifacts;
+    private loaded;
+    constructor(filePath: string); // `filePath`: the single JSON file that holds all artifacts
+    set(id: string, artifact: Artifact): Promise<void>;
+    get(id: string): Promise<Artifact | null>;
+    getAll(): Promise<Record<string, Artifact>>;
+    private ensureLoaded;
+    private save;
+}
+/**
+ * In-memory reference implementation of JobRegistry.
+ *
+ * Jobs here never actually spawn processes — callers use `simulateOutput` /
+ * `simulateExit` to drive state. Intended for tests
+ * and agents that don't need filesystem-backed persistence.
+ *
+ * NOTE(review): this class declares no `simulateFailure` method; a failure is
+ * presumably simulated by calling `simulateExit` with a non-zero exit code — confirm.
+ */
+declare class MemoryJobRegistry implements JobRegistry {
+    private jobs;
+    private handlers;
+    private seq;
+    start(opts: JobStartOptions, startedBy?: JobSpec["startedBy"]): Promise<JobStatus>;
+    check(id: string): Promise<JobStatus | null>;
+    cancel(id: string, _signal?: "TERM" | "KILL"): Promise<JobStatus | null>; // NOTE(review): the underscore prefix suggests `_signal` is ignored by this implementation — confirm
+    list(): Promise<JobStatus[]>;
+    tail(id: string, lines?: number): Promise<string[]>;
+    waitFor(id: string, signal?: AbortSignal): Promise<JobStatus>;
+    subscribe(handler: (e: JobEvent) => void): () => void; // NOTE(review): the returned function presumably unsubscribes the handler — confirm
+    snapshot(): JobStatus[];
+    prune(_olderThanMs?: number): Promise<number>; // NOTE(review): the underscore prefix suggests `_olderThanMs` is ignored by this implementation — confirm
+    simulateOutput(id: string, chunk: string): void; // test driver: supplies an output chunk for job `id`
+    simulateExit(id: string, exitCode: number): void; // test driver: marks job `id` as exited with `exitCode`
+    private emit;
+}
+export { ABSOLUTE_MAX_WORKER_STEPS, AnyTool, type ArcConfig, type ArcEvent, ArcLoop, type ArcRunResult, type ArcTraceEvent, type Artifact, type ArtifactStore, DEFAULT_MAX_STEPS_PER_WORKER, DEFAULT_WORKER_STEP_BUDGETS, type DispatchRecord, type DispatchTier, type ExpectedArtifact, type ExpectedOutputContract, FsArtifactStore, FsTranscriptStore, type JobEvent, type JobKind, type JobRegistry, type JobSpec, type JobStartOptions, type JobState, type JobStatus, type JobTransport, MemoryArtifactStore, MemoryJobRegistry, MemoryMessageStore, MemoryScratchPad, MemorySessionStore, MemorySummaryDAG, MemoryTranscriptStore, MemoryVectorIndex, type MessageStore, ModelFactory, type OodaSnapshot, type OrchestratorContext, type PushResult, REQUEST_MORE_STEPS_INCREMENT, type ReadEpisodeArgs, type ReadEpisodeDetail, type RunWorkerConfig, type ScratchPad, type SessionMeta, type SessionSnapshot, type SessionStore, type StoredAttachment, type StoredMessage, type SummaryDAG, type SummaryNode, type Tool, type ToolExecutionMode, ToolProvider, ToolResult, ToolResultArtifact, type TraceToolCall, type Transcript, type TranscriptStore, type Tuple, type VectorIndex, type WorkerProgressEvent, type WorkerResult, cloneForTrace, formatDispatchForPrompt };