npm - sneakoscope - Versions diffs - 2.0.15 → 2.0.16 - Mend

sneakoscope 2.0.15 → 2.0.16

This diff compares publicly available versions of the package as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.

Files changed (30)

package/README.md +1 -1
package/crates/sks-core/Cargo.lock +1 -1
package/crates/sks-core/Cargo.toml +1 -1
package/crates/sks-core/src/main.rs +1 -1
package/dist/.sks-build-stamp.json +4 -4
package/dist/bin/sks.js +1 -1
package/dist/cli/command-registry.js +1 -1
package/dist/core/agents/agent-orchestrator.js +66 -3
package/dist/core/agents/agent-scheduler.js +204 -86
package/dist/core/agents/agent-schema.js +1 -1
package/dist/core/agents/native-cli-session-swarm.js +87 -21
package/dist/core/agents/parallel-runtime-proof.js +217 -0
package/dist/core/codex-control/codex-task-runner.js +32 -4
package/dist/core/codex-control/model-call-concurrency.js +106 -0
package/dist/core/commands/naruto-command.js +48 -5
package/dist/core/commands/team-command.js +0 -176
package/dist/core/db-safety.js +34 -6
package/dist/core/fsx.js +1 -1
package/dist/core/git/git-worktree-capability.js +18 -0
package/dist/core/git/git-worktree-manager.js +80 -0
package/dist/core/git/git-worktree-pool.js +4 -0
package/dist/core/mad-db/mad-db-capability.js +33 -1
package/dist/core/mad-db/mad-db-ledger.js +14 -0
package/dist/core/mad-db/mad-db-policy-resolver.js +2 -0
package/dist/core/naruto/naruto-concurrency-governor.js +14 -1
package/dist/core/version.js +1 -1
package/dist/core/zellij/zellij-slot-telemetry.js +56 -1
package/dist/scripts/release-speed-summary.js +2 -0
package/package.json +25 -1
package/schemas/agents/parallel-runtime-proof.schema.json +48 -0

package/README.md CHANGED Viewed

@@ -16,7 +16,7 @@ Set up this agent project with Sneakoscope Codex. Use [[mandarange/Sneakoscope-C
 ## Current Release
-SKS **2.0.15** is the ultra-stabilized Research synthesis release. It keeps the 2.0.14 stage-aware runtime, then hardens final synthesis so non-mock Research uses an evidence-bound Codex/GPT writer, rejects repeated or template-like reports, records source/claim density, and produces handoffs that Team or Naruto can consume directly.
+SKS **2.0.16** is the real parallelism closure release. It proves Naruto/agent runtime concurrency with PID, launch overlap, wall-clock speedup, active/headless worker, model-call, worktree allocation, and incremental Zellij telemetry evidence while keeping Naruto as the execution SSOT.
 What changed:

package/crates/sks-core/Cargo.lock CHANGED Viewed

@@ -76,7 +76,7 @@ dependencies = [
 [[package]]
 name = "sks-core"
-version = "2.0.15"
+version = "2.0.16"
 dependencies = [
  "serde_json",
 ]

package/crates/sks-core/Cargo.toml CHANGED Viewed

@@ -1,6 +1,6 @@
 [package]
 name = "sks-core"
-version = "2.0.15"
+version = "2.0.16"
 edition = "2021"
 [dependencies]

package/crates/sks-core/src/main.rs CHANGED Viewed

@@ -4,7 +4,7 @@ use std::io::{self, Read, Seek, SeekFrom};
 fn main() {
     let mut args = std::env::args().skip(1);
     match args.next().as_deref() {
-        Some("--version") => println!("sks-rs 2.0.15"),
+        Some("--version") => println!("sks-rs 2.0.16"),
         Some("compact-info") => {
             let mut input = String::new();
             let _ = io::stdin().read_to_string(&mut input);

package/dist/.sks-build-stamp.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "schema": "sks.dist-build-stamp.v1",
   "package_name": "sneakoscope",
-  "package_version": "2.0.15",
-  "source_digest": "18f7432c59dd0bbd8090697c2cd4e0c4681d05923e3086f4a96cdc4e0b420280",
-  "source_file_count": 2160,
-  "built_at_source_time": 1780893056447
+  "package_version": "2.0.16",
+  "source_digest": "cafc32cad87d3b6c7aeb0ec0e8e56258f830b35e71fd919440a8c1b95b78432a",
+  "source_file_count": 2187,
+  "built_at_source_time": 1780927200051
 }

package/dist/bin/sks.js CHANGED Viewed

@@ -1,5 +1,5 @@
 #!/usr/bin/env node
-const FAST_PACKAGE_VERSION = '2.0.15';
+const FAST_PACKAGE_VERSION = '2.0.16';
 const args = process.argv.slice(2);
 try {
     if (args[0] === '--agent' && args[1] === 'worker') {

package/dist/cli/command-registry.js CHANGED Viewed

@@ -119,7 +119,7 @@ export const COMMANDS = {
     commit: entry('stable', 'Create a simple git commit', 'dist/commands/commit.js', directCommand(() => import('../commands/commit.js'), 'dist/commands/commit.js')),
     'commit-and-push': entry('stable', 'Create a simple git commit and push', 'dist/commands/commit-and-push.js', directCommand(() => import('../commands/commit-and-push.js'), 'dist/commands/commit-and-push.js')),
     dfix: entry('stable', 'Run DFix diagnose/plan/patch/verify loop', 'dist/core/commands/dfix-command.js', commandArgsCommand(() => import('../core/commands/dfix-command.js'), 'dfixCommand', 'dist/core/commands/dfix-command.js')),
-    team: entry('beta', 'Create and observe Team missions', 'dist/core/commands/team-command.js', argsCommand(() => import('../core/commands/team-command.js'), 'team', 'dist/core/commands/team-command.js')),
+    team: entry('beta', 'Deprecated Team alias; create redirects to Naruto, observe legacy Team missions', 'dist/core/commands/team-command.js', argsCommand(() => import('../core/commands/team-command.js'), 'team', 'dist/core/commands/team-command.js')),
     agent: entry('beta', 'Run native multi-session agent missions', 'dist/core/commands/agent-command.js', argsCommand(() => import('../core/commands/agent-command.js'), 'agentCommand', 'dist/core/commands/agent-command.js')),
     'with-local-llm': entry('beta', 'Enable or inspect local Ollama worker backend', 'dist/core/commands/local-model-command.js', argsCommand(() => import('../core/commands/local-model-command.js'), 'localModelCommand', 'dist/core/commands/local-model-command.js')),
     naruto: entry('labs', 'Run $Naruto shadow-clone swarm (up to 100 parallel sessions)', 'dist/core/commands/naruto-command.js', argsCommand(() => import('../core/commands/naruto-command.js'), 'narutoCommand', 'dist/core/commands/naruto-command.js')),

package/dist/core/agents/agent-orchestrator.js CHANGED Viewed

@@ -54,7 +54,7 @@ import { CODEX_AGENT_WORKER_RESULT_SCHEMA_ID, codexAgentWorkerResultSchema } fro
 import { resolveLocalCollaborationPolicy, localCollaborationParticipated } from '../local-llm/local-collaboration-policy.js';
 import { runFinalGptReviewStage } from '../pipeline/final-gpt-review-stage.js';
 import { selectFinalGptPatchSource } from '../pipeline/final-gpt-patch-stage.js';
-import { allocateWorkerWorktree } from '../git/git-worktree-manager.js';
+import { allocateWorkerWorktree, allocateWorkerWorktreesBatch } from '../git/git-worktree-manager.js';
 import { exportGitWorktreeDiff } from '../git/git-worktree-diff.js';
 import { buildGitWorktreePatchEnvelope } from '../git/git-worktree-patch-envelope.js';
 import { checkpointWorkerWorktree } from '../git/git-worktree-checkpoint.js';
@@ -63,6 +63,7 @@ import { createGitIntegrationWorktree } from '../git/git-integration-worktree.js
 import { applyGitWorktreeMergeQueue } from '../git/git-worktree-merge-queue.js';
 import { crossRebaseIdleWorktrees } from '../git/git-worktree-cross-rebase.js';
 import { gitOutputLine, runGitCommand } from '../git/git-worktree-runner.js';
+import { writeParallelRuntimeProof } from './parallel-runtime-proof.js';
 export async function runNativeAgentOrchestrator(opts = {}) {
     const root = path.resolve(opts.root || process.cwd());
     const prompt = String(opts.prompt || 'Native agent run');
@@ -289,9 +290,46 @@ export async function runNativeAgentOrchestrator(opts = {}) {
         diffs: [],
         checkpoints: [],
         cleanup: [],
+        prewarmed_allocations: [],
         blockers: []
     };
     await writeJsonAtomic(path.join(ledgerRoot, 'agent-git-worktree-runtime.json'), gitWorktreeRuntime);
+    const preparedWorktreeAllocations = new Map();
+    if (gitWorktreePolicy?.mode === 'git-worktree') {
+        const writeSlices = uniqueWritableSlicesForWorktrees(partition.slices, Math.max(1, targetActiveSlots));
+        if (writeSlices.length) {
+            const prewarmed = await allocateWorkerWorktreesBatch({
+                root: gitWorktreePolicy.main_repo_root || root,
+                missionId,
+                workers: writeSlices.map((slice, index) => ({
+                    workerId: String(slice.owner_agent_id || slice.owner || `worker-${index + 1}`),
+                    slotId: String(slice.owner_agent_id || slice.owner || `slot-${index + 1}`),
+                    generationIndex: 1
+                })),
+                maxParallel: Math.min(targetActiveSlots, Number(process.env.SKS_NARUTO_GIT_WORKTREE_CAP || targetActiveSlots))
+            }).catch((err) => {
+                gitWorktreeRuntime.blockers.push('git_worktree_batch_prewarm_failed:' + (err instanceof Error ? err.message : String(err)));
+                gitWorktreeRuntime.ok = false;
+                return [];
+            });
+            gitWorktreeRuntime.prewarmed_allocations = prewarmed.map((allocation) => ({
+                worker_id: allocation.worker_id,
+                slot_id: allocation.slot_id,
+                ok: allocation.ok,
+                worktree_path: allocation.worktree_path,
+                branch: allocation.branch,
+                blockers: allocation.blockers
+            }));
+            for (const allocation of prewarmed) {
+                if (allocation.ok)
+                    preparedWorktreeAllocations.set(String(allocation.worker_id), allocation);
+                else
+                    gitWorktreeRuntime.blockers.push(...allocation.blockers);
+            }
+            gitWorktreeRuntime.ok = gitWorktreeRuntime.blockers.length === 0;
+            await writeJsonAtomic(path.join(ledgerRoot, 'agent-git-worktree-runtime.json'), gitWorktreeRuntime);
+        }
+    }
     const nativeCliSwarm = createNativeCliSessionSwarmRecorder(ledgerRoot, {
         missionId,
         requestedAgents: Number(opts.agents || roster.agent_count || targetActiveSlots),
@@ -329,7 +367,8 @@ export async function runNativeAgentOrchestrator(opts = {}) {
                 agent,
                 slice,
                 policy: gitWorktreePolicy,
-                runtime: gitWorktreeRuntime
+                runtime: gitWorktreeRuntime,
+                preparedAllocation: preparedWorktreeAllocations.get(String(agent.id || '')) || null
             });
             const runtimeAgent = workerWorktree ? { ...agent, worktree: workerWorktree.context } : agent;
             const runtimeSlice = workerWorktree ? { ...slice, worktree: workerWorktree.context } : slice;
@@ -432,6 +471,13 @@ export async function runNativeAgentOrchestrator(opts = {}) {
         }
     });
     await nativeCliSwarm.finalize();
+    const parallelRuntimeProof = await writeParallelRuntimeProof(ledgerRoot, missionId, {
+        requestedWorkers: Number(opts.agents || roster.agent_count || targetActiveSlots),
+        targetActiveSlots,
+        visiblePanes: visualLaneCount,
+        expectedWorkerRuntimeMs: targetActiveSlots >= 10 ? 8000 : targetActiveSlots >= 2 ? 2000 : 25,
+        minActiveWorkers: Math.min(targetActiveSlots, desiredWorkItemCount)
+    });
     const results = scheduler.results;
     const nativeCliSessionProof = await writeNativeCliSessionProof(ledgerRoot, {
         requestedAgents: Number(opts.agents || roster.agent_count || targetActiveSlots),
@@ -600,6 +646,7 @@ export async function runNativeAgentOrchestrator(opts = {}) {
         gpt_final_arbiter: gptFinalArbiter,
         final_gpt_patch_stage: finalGptPatchStage,
         patch_swarm: patchSwarm,
+        parallel_runtime_proof: parallelRuntimeProof,
         proof
     };
 }
@@ -620,6 +667,22 @@ function withFinalGptPatchEnvelopes(results, patchEnvelopes = []) {
         next[0] = { ...next[0], patch_envelopes: patchEnvelopes };
     return next;
 }
+function uniqueWritableSlicesForWorktrees(slices = [], limit) {
+    const selected = [];
+    const seenOwners = new Set();
+    for (const slice of Array.isArray(slices) ? slices : []) {
+        if (!Array.isArray(slice?.write_paths) || slice.write_paths.length === 0)
+            continue;
+        const owner = String(slice.owner_agent_id || slice.owner || slice.id || '');
+        if (!owner || seenOwners.has(owner))
+            continue;
+        seenOwners.add(owner);
+        selected.push(slice);
+        if (selected.length >= Math.max(1, limit))
+            break;
+    }
+    return selected;
+}
 function applyNarutoWorkGraphToPartition(partition, graph, roster, targetActiveSlots, parentPrompt = '') {
     const activeRoster = (Array.isArray(roster?.roster) ? roster.roster : []).slice(0, Math.max(1, targetActiveSlots));
     const activeAgentIds = new Set(activeRoster.map((row) => String(row.id || '')).filter(Boolean));
@@ -873,7 +936,7 @@ async function prepareWorkerGitWorktree(input) {
     if (!sliceHasWritePaths && !agentWriteCapable)
         return null;
     const generationIndex = Math.max(1, Math.floor(Number(input.agent.generation_index || 1)));
-    const allocation = await allocateWorkerWorktree({
+    const allocation = input.preparedAllocation || await allocateWorkerWorktree({
         repoRoot: input.policy.main_repo_root || input.root,
         missionId: input.missionId,
         workerId: String(input.agent.id || input.slice.id || 'worker'),

package/dist/core/agents/agent-scheduler.js CHANGED Viewed

@@ -4,6 +4,7 @@ import { MAX_AGENT_COUNT } from './agent-schema.js';
 import { appendAgentWorkQueueEvent, completeWorkItem, createAgentWorkQueue, enqueueFollowUpWorkItems, leaseNextWorkItem, pendingWorkItems, writeAgentWorkQueue } from './agent-work-queue.js';
 import { closeWorkerSlotsAfterDrain, createAgentWorkerSlots, markWorkerSlotGenerationClosed, openWorkerSlotGeneration, writeAgentWorkerSlots } from './agent-worker-slot.js';
 import { closeAgentSessionGeneration, createAgentSessionGeneration, writeAgentSessionGeneration } from './agent-session-generation.js';
+import { appendParallelRuntimeEvent } from './parallel-runtime-proof.js';
 export const AGENT_SCHEDULER_SCHEMA = 'sks.agent-scheduler.v1';
 export const AGENT_SCHEDULER_EVENT_SCHEMA = 'sks.agent-scheduler-event.v1';
 export async function runAgentScheduler(input) {
@@ -19,6 +20,10 @@ export async function runAgentScheduler(input) {
     });
     const active = new Map();
     const results = [];
+    const schedulerStartedAt = Date.now();
+    let batchCounter = 0;
+    let batchLaunchSpanTotalMs = 0;
+    let batchDispatchInProgress = false;
     let state = buildState(input.missionId, targetActiveSlots, queue, slots, active, {
         status: 'initializing',
         refillDelayMs: input.refillDelayMs || 0,
@@ -27,7 +32,7 @@ export async function runAgentScheduler(input) {
     await writeAll(input.root, state, slots, queue, active, { event_type: 'scheduler_initialized' }, input.onSchedulerEvent);
     await refillSlots(null);
     while (active.size > 0 || pendingWorkItems(queue).length > 0) {
-        if (active.size === 0 && pendingWorkItems(queue).length > 0) {
+        if (!batchDispatchInProgress && active.size === 0 && pendingWorkItems(queue).length > 0) {
             state.blockers.push('scheduler_pending_queue_without_active_sessions');
             state.status = 'blocked';
             await writeAll(input.root, state, slots, queue, active, { event_type: 'scheduler_blocked', pending_count: pendingWorkItems(queue).length }, input.onSchedulerEvent);
@@ -94,6 +99,7 @@ export async function runAgentScheduler(input) {
     state.all_generations_closed = true;
     if (!state.pending_queue_drained)
         state.blockers.push('scheduler_pending_queue_not_drained');
+    updateUtilizationMetrics();
     await writeAll(input.root, state, slots, queue, active, { event_type: 'scheduler_drained' }, input.onSchedulerEvent);
     return {
         schema: 'sks.agent-scheduler-result.v1',
@@ -105,9 +111,179 @@ export async function runAgentScheduler(input) {
     };
     async function refillSlots(backfill) {
         state.status = 'running';
+        const launches = collectLaunchBatch();
+        if (!launches.length)
+            return;
+        batchDispatchInProgress = true;
+        const batchId = `batch-${Date.now().toString(36)}-${batchCounter++}`;
+        const batchStart = Date.now();
         const launchEvents = [];
-        while (active.size < targetActiveSlots && pendingWorkItems(queue).length > 0) {
-            const slotIndex = slots.findIndex((slot) => slot.status === 'idle');
+        try {
+            for (const launch of launches)
+                slots[launch.slotIndex] = launch.openedSlot;
+            await Promise.all(launches.map((launch) => writeAgentSessionGeneration(input.root, launch.generation)));
+            await writeAll(input.root, state, slots, queue, active, {
+                event_type: 'batch_dispatch_started',
+                batch_id: batchId,
+                launch_count: launches.length,
+                session_ids: launches.map((launch) => launch.generation.session_id)
+            }, input.onSchedulerEvent);
+            await appendParallelRuntimeEvent(input.root, input.missionId, {
+                event_type: 'batch_dispatch_started',
+                slot_id: null,
+                generation_index: null,
+                session_id: null,
+                pid: null,
+                backend: 'scheduler',
+                placement: 'unknown',
+                batch_id: batchId,
+                meta: { launch_count: launches.length, active_count_before: active.size }
+            }).catch(() => undefined);
+            for (const launch of launches) {
+                const { slot, openedSlot, generation, agent, workItem } = launch;
+                await appendParallelRuntimeEvent(input.root, input.missionId, {
+                    event_type: 'slot_reserved',
+                    slot_id: slot.slot_id,
+                    generation_index: generation.generation_index,
+                    session_id: generation.session_id,
+                    pid: null,
+                    backend: 'scheduler',
+                    placement: 'unknown',
+                    batch_id: batchId,
+                    meta: { work_item_id: workItem.id }
+                }).catch(() => undefined);
+                await appendParallelRuntimeEvent(input.root, input.missionId, {
+                    event_type: 'worker_launch_invoked',
+                    slot_id: slot.slot_id,
+                    generation_index: generation.generation_index,
+                    session_id: generation.session_id,
+                    pid: null,
+                    backend: 'scheduler',
+                    placement: 'unknown',
+                    batch_id: batchId,
+                    meta: { work_item_id: workItem.id }
+                }).catch(() => undefined);
+                const promise = Promise.resolve()
+                    .then(() => input.launchSession({ agent, workItem, generation, slot: openedSlot, queue, state }))
+                    .then((result) => ({
+                    result,
+                    session_id: generation.session_id,
+                    slot_id: slot.slot_id,
+                    generation_index: generation.generation_index,
+                    terminal_close_report_path: path.join(generation.artifact_dir, 'agent-terminal-close-report.json')
+                }))
+                    .catch((err) => ({
+                    result: {
+                        schema: 'sks.agent-result.v1',
+                        mission_id: input.missionId,
+                        agent_id: agent.id,
+                        session_id: generation.session_id,
+                        persona_id: agent.persona_id,
+                        task_slice_id: workItem.id,
+                        status: 'failed',
+                        backend: 'fake',
+                        summary: err instanceof Error ? err.message : String(err),
+                        findings: [],
+                        proposed_changes: [],
+                        changed_files: [],
+                        lease_compliance: { ok: true, violations: [] },
+                        artifacts: [],
+                        blockers: ['scheduler_launch_failed'],
+                        confidence: 'failed',
+                        handoff_notes: '',
+                        unverified: [],
+                        writes: [],
+                        recursion_guard: { ok: true, violations: [] },
+                        verification: { status: 'failed', checks: [] },
+                        source_intelligence_refs: input.sourceIntelligenceRefs || null,
+                        goal_mode_ref: input.goalModeRef || null
+                    },
+                    session_id: generation.session_id,
+                    slot_id: slot.slot_id,
+                    generation_index: generation.generation_index,
+                    error: err instanceof Error ? err.message : String(err),
+                    terminal_close_report_path: path.join(generation.artifact_dir, 'agent-terminal-close-report.json')
+                }));
+                active.set(generation.session_id, { slot_id: slot.slot_id, work_item_id: workItem.id, session_id: generation.session_id, promise });
+            }
+            await appendAgentWorkQueueEvent(input.root, 'batch_work_items_dispatched', {
+                batch_id: batchId,
+                launch_count: launches.length,
+                session_ids: launches.map((launch) => launch.generation.session_id),
+                work_item_ids: launches.map((launch) => launch.workItem.id)
+            });
+            for (const launch of launches)
+                await appendAgentWorkQueueEvent(input.root, 'work_item_dispatched', { work_item_id: launch.workItem.id, session_id: launch.generation.session_id, slot_id: launch.slot.slot_id });
+            if (backfill) {
+                const firstLaunch = launches[0];
+                const refillLatencyMs = Math.max(0, Date.now() - backfill.closed_at_ms);
+                state.backfill_count += 1;
+                state.refill_latency_events_ms.push(refillLatencyMs);
+                state.refill_latency_p95_ms = percentile95(state.refill_latency_events_ms);
+                launchEvents.push({
+                    event_type: 'backfill_event',
+                    closed_session_id: backfill.closed_session_id,
+                    new_session_id: firstLaunch?.generation.session_id || null,
+                    slot_id: firstLaunch?.slot.slot_id || null,
+                    batch_id: batchId,
+                    launch_count: launches.length,
+                    active_count_before: backfill.active_count_before,
+                    active_count_after: active.size,
+                    refill_latency_ms: refillLatencyMs
+                });
+                backfill = null;
+            }
+            else {
+                for (const launch of launches)
+                    launchEvents.push({
+                        event_type: 'session_launched',
+                        session_id: launch.generation.session_id,
+                        slot_id: launch.slot.slot_id,
+                        work_item_id: launch.workItem.id,
+                        active_count_after: active.size
+                    });
+            }
+            if (input.refillDelayMs && input.refillDelayMs > 0)
+                await delay(input.refillDelayMs);
+            const launchSpanMs = Math.max(0, Date.now() - batchStart);
+            batchLaunchSpanTotalMs += launchSpanMs;
+            state.batch_dispatch_count += 1;
+            state.largest_batch_size = Math.max(state.largest_batch_size, launches.length);
+            if (state.first_batch_launch_span_ms === 0)
+                state.first_batch_launch_span_ms = launchSpanMs;
+            state.average_batch_launch_span_ms = Math.round(batchLaunchSpanTotalMs / Math.max(1, state.batch_dispatch_count));
+            updateUtilizationMetrics();
+            await appendParallelRuntimeEvent(input.root, input.missionId, {
+                event_type: 'batch_dispatch_completed',
+                slot_id: null,
+                generation_index: null,
+                session_id: null,
+                pid: null,
+                backend: 'scheduler',
+                placement: 'unknown',
+                batch_id: batchId,
+                meta: { launch_count: launches.length, launch_span_ms: launchSpanMs, active_count_after: active.size }
+            }).catch(() => undefined);
+            await writeAll(input.root, state, slots, queue, active, {
+                event_type: 'batch_dispatch_completed',
+                batch_id: batchId,
+                launch_count: launches.length,
+                launch_span_ms: launchSpanMs,
+                active_count_after: active.size,
+                session_ids: launches.map((launch) => launch.generation.session_id)
+            }, input.onSchedulerEvent);
+        }
+        finally {
+            batchDispatchInProgress = false;
+        }
+        for (const event of launchEvents)
+            await appendJsonl(path.join(input.root, 'agent-scheduler-events.jsonl'), { schema: AGENT_SCHEDULER_EVENT_SCHEMA, ts: nowIso(), ...event });
+    }
+    function collectLaunchBatch() {
+        const launches = [];
+        const reservedSlots = new Set();
+        while (active.size + launches.length < targetActiveSlots && pendingWorkItems(queue).length > 0) {
+            const slotIndex = slots.findIndex((slot, index) => slot.status === 'idle' && !reservedSlots.has(index));
             if (slotIndex < 0)
                 break;
             const slot = slots[slotIndex];
@@ -133,90 +309,18 @@ export async function runAgentScheduler(input) {
                 goalModeRef: workItem.goal_mode_ref
             });
             workItem.running_session_id = generation.session_id;
-            await writeAgentSessionGeneration(input.root, generation);
-            const agent = buildAgentForGeneration(slot, generation, workItem);
             const openedSlot = openWorkerSlotGeneration(slot, generation);
-            slots[slotIndex] = openedSlot;
-            await writeAll(input.root, state, slots, queue, active, {
-                event_type: 'session_launch_started',
-                session_id: generation.session_id,
-                slot_id: slot.slot_id,
-                generation_index: generation.generation_index,
-                work_item_id: workItem.id
-            }, input.onSchedulerEvent);
-            const promise = Promise.resolve()
-                .then(() => input.launchSession({ agent, workItem, generation, slot: openedSlot, queue, state }))
-                .then((result) => ({
-                result,
-                session_id: generation.session_id,
-                slot_id: slot.slot_id,
-                generation_index: generation.generation_index,
-                terminal_close_report_path: path.join(generation.artifact_dir, 'agent-terminal-close-report.json')
-            }))
-                .catch((err) => ({
-                result: {
-                    schema: 'sks.agent-result.v1',
-                    mission_id: input.missionId,
-                    agent_id: agent.id,
-                    session_id: generation.session_id,
-                    persona_id: agent.persona_id,
-                    task_slice_id: workItem.id,
-                    status: 'failed',
-                    backend: 'fake',
-                    summary: err instanceof Error ? err.message : String(err),
-                    findings: [],
-                    proposed_changes: [],
-                    changed_files: [],
-                    lease_compliance: { ok: true, violations: [] },
-                    artifacts: [],
-                    blockers: ['scheduler_launch_failed'],
-                    confidence: 'failed',
-                    handoff_notes: '',
-                    unverified: [],
-                    writes: [],
-                    recursion_guard: { ok: true, violations: [] },
-                    verification: { status: 'failed', checks: [] },
-                    source_intelligence_refs: input.sourceIntelligenceRefs || null,
-                    goal_mode_ref: input.goalModeRef || null
-                },
-                session_id: generation.session_id,
-                slot_id: slot.slot_id,
-                generation_index: generation.generation_index,
-                error: err instanceof Error ? err.message : String(err),
-                terminal_close_report_path: path.join(generation.artifact_dir, 'agent-terminal-close-report.json')
-            }));
-            active.set(generation.session_id, { slot_id: slot.slot_id, work_item_id: workItem.id, session_id: generation.session_id, promise });
-            await appendAgentWorkQueueEvent(input.root, 'work_item_dispatched', { work_item_id: workItem.id, session_id: generation.session_id, slot_id: slot.slot_id });
-            if (backfill) {
-                const refillLatencyMs = Math.max(0, Date.now() - backfill.closed_at_ms);
-                state.backfill_count += 1;
-                state.refill_latency_events_ms.push(refillLatencyMs);
-                state.refill_latency_p95_ms = percentile95(state.refill_latency_events_ms);
-                launchEvents.push({
-                    event_type: 'backfill_event',
-                    closed_session_id: backfill.closed_session_id,
-                    new_session_id: generation.session_id,
-                    slot_id: slot.slot_id,
-                    active_count_before: backfill.active_count_before,
-                    active_count_after: active.size,
-                    refill_latency_ms: refillLatencyMs
-                });
-                backfill = null;
-            }
-            else {
-                launchEvents.push({
-                    event_type: 'session_launched',
-                    session_id: generation.session_id,
-                    slot_id: slot.slot_id,
-                    work_item_id: workItem.id,
-                    active_count_after: active.size
-                });
-            }
-            if (input.refillDelayMs && input.refillDelayMs > 0)
-                await delay(input.refillDelayMs);
+            const agent = buildAgentForGeneration(slot, generation, workItem);
+            launches.push({ slotIndex, slot, openedSlot, generation, agent, workItem, provisionalSessionId });
+            reservedSlots.add(slotIndex);
         }
-        for (const event of launchEvents)
-            await writeAll(input.root, state, slots, queue, active, event, input.onSchedulerEvent);
+        return launches;
+    }
+    function updateUtilizationMetrics() {
+        state.wall_time_ms = Math.max(0, Date.now() - schedulerStartedAt);
+        state.active_slot_time_ms = Math.max(state.active_slot_time_ms, state.completed_count * state.wall_time_ms);
+        const denominator = Math.max(1, state.wall_time_ms * targetActiveSlots);
+        state.scheduler_utilization = Number(Math.min(1, state.active_slot_time_ms / denominator).toFixed(3));
     }
 }
 export function normalizeTargetActiveSlots(value, maxActiveSlots = MAX_AGENT_COUNT) {
@@ -261,7 +365,14 @@ function buildState(missionId, targetActiveSlots, queue, slots, active, opts) {
         pending_queue_drained: pendingCount === 0,
         all_slots_closed_after_drain: slots.length > 0 && slots.every((slot) => slot.status === 'closed'),
         all_generations_closed: false,
-        blockers: [...(previous?.blockers || [])]
+        blockers: [...(previous?.blockers || [])],
+        batch_dispatch_count: previous?.batch_dispatch_count || 0,
+        largest_batch_size: previous?.largest_batch_size || 0,
+        first_batch_launch_span_ms: previous?.first_batch_launch_span_ms || 0,
+        average_batch_launch_span_ms: previous?.average_batch_launch_span_ms || 0,
+        scheduler_utilization: previous?.scheduler_utilization || 0,
+        active_slot_time_ms: previous?.active_slot_time_ms || 0,
+        wall_time_ms: previous?.wall_time_ms || 0
     };
 }
 async function writeAll(root, currentState, slots, queue, active, event, onSchedulerEvent) {
@@ -289,6 +400,13 @@ async function writeAll(root, currentState, slots, queue, active, event, onSched
     currentState.blocked = nextState.blocked;
     currentState.pending_queue_drained = nextState.pending_queue_drained;
     currentState.all_slots_closed_after_drain = nextState.all_slots_closed_after_drain;
+    currentState.batch_dispatch_count = nextState.batch_dispatch_count;
+    currentState.largest_batch_size = nextState.largest_batch_size;
+    currentState.first_batch_launch_span_ms = nextState.first_batch_launch_span_ms;
+    currentState.average_batch_launch_span_ms = nextState.average_batch_launch_span_ms;
+    currentState.scheduler_utilization = nextState.scheduler_utilization;
+    currentState.active_slot_time_ms = nextState.active_slot_time_ms;
+    currentState.wall_time_ms = nextState.wall_time_ms;
     await writeAgentWorkQueue(root, queue);
     await writeAgentWorkerSlots(root, slots);
     await writeJsonAtomic(path.join(root, 'agent-scheduler-state.json'), currentState);

package/dist/core/agents/agent-schema.js CHANGED Viewed

@@ -13,7 +13,7 @@ export const DEFAULT_AGENT_CONCURRENCY = 5;
 // ceiling to up to 100 concurrent clone sessions. Only the naruto path opts into this
 // cap; every other roster/scheduler caller keeps MAX_AGENT_COUNT as the default.
 export const MAX_NARUTO_AGENT_COUNT = 100;
-export const DEFAULT_NARUTO_CLONES = 12;
+export const DEFAULT_NARUTO_CLONES = 32;
 export const AGENT_BACKENDS = ['fake', 'process', 'codex-sdk', 'zellij', 'ollama', 'local-llm'];
 export function normalizeAgentBackend(input) {
     const value = String(input || 'codex-sdk');