npm - @lnilluv/pi-ralph-loop - Versions diffs - 0.3.0 → 1.0.0 - Mend

@lnilluv/pi-ralph-loop 0.3.0 → 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (46) hide show

package/.github/workflows/release.yml +8 -39
package/README.md +50 -160
package/package.json +2 -2
package/scripts/version-helper.ts +210 -0
package/src/index.ts +1085 -188
package/src/ralph-draft-context.ts +618 -0
package/src/ralph-draft-llm.ts +297 -0
package/src/ralph-draft.ts +33 -0
package/src/ralph.ts +917 -102
package/src/runner-rpc.ts +434 -0
package/src/runner-state.ts +822 -0
package/src/runner.ts +957 -0
package/src/secret-paths.ts +66 -0
package/src/shims.d.ts +0 -3
package/tests/fixtures/parity/migrate/OPEN_QUESTIONS.md +3 -0
package/tests/fixtures/parity/migrate/RALPH.md +27 -0
package/tests/fixtures/parity/migrate/golden/MIGRATED.md +15 -0
package/tests/fixtures/parity/migrate/legacy/source.md +6 -0
package/tests/fixtures/parity/migrate/legacy/source.yaml +3 -0
package/tests/fixtures/parity/migrate/scripts/show-legacy.sh +10 -0
package/tests/fixtures/parity/migrate/scripts/verify.sh +15 -0
package/tests/fixtures/parity/research/OPEN_QUESTIONS.md +3 -0
package/tests/fixtures/parity/research/RALPH.md +45 -0
package/tests/fixtures/parity/research/claim-evidence-checklist.md +15 -0
package/tests/fixtures/parity/research/expected-outputs.md +22 -0
package/tests/fixtures/parity/research/scripts/show-snapshots.sh +13 -0
package/tests/fixtures/parity/research/scripts/verify.sh +55 -0
package/tests/fixtures/parity/research/snapshots/app-factory-ai-cli.md +11 -0
package/tests/fixtures/parity/research/snapshots/docs-factory-ai-cli-features-missions.md +11 -0
package/tests/fixtures/parity/research/snapshots/factory-ai-news-missions.md +11 -0
package/tests/fixtures/parity/research/source-manifest.md +20 -0
package/tests/index.test.ts +3529 -0
package/tests/parity/README.md +9 -0
package/tests/parity/harness.py +526 -0
package/tests/parity-harness.test.ts +42 -0
package/tests/parity-research-fixture.test.ts +34 -0
package/tests/ralph-draft-context.test.ts +672 -0
package/tests/ralph-draft-llm.test.ts +434 -0
package/tests/ralph-draft.test.ts +168 -0
package/tests/ralph.test.ts +1389 -19
package/tests/runner-event-contract.test.ts +235 -0
package/tests/runner-rpc.test.ts +358 -0
package/tests/runner-state.test.ts +553 -0
package/tests/runner.test.ts +1347 -0
package/tests/secret-paths.test.ts +55 -0
package/tests/version-helper.test.ts +75 -0

package/src/index.ts CHANGED Viewed

@@ -1,56 +1,147 @@
-import { minimatch } from "minimatch";
-import { existsSync, mkdirSync, readFileSync, writeFileSync } from "node:fs";
-import { basename, dirname, join, relative } from "node:path";
-import type { ExtensionAPI } from "@mariozechner/pi-coding-agent";
+import { createHash, randomUUID } from "node:crypto";
+import { existsSync, mkdirSync, readFileSync, readdirSync, writeFileSync } from "node:fs";
+import { basename, dirname, join, relative, resolve } from "node:path";
+import type { ExtensionAPI, ExtensionCommandContext, SessionEntry, AgentEndEvent as PiAgentEndEvent, ToolResultEvent as PiToolResultEvent } from "@mariozechner/pi-coding-agent";
 import {
   buildMissionBrief,
-  classifyIdleState,
-  generateDraft,
   inspectExistingTarget,
-  inspectRepo,
   parseCommandArgs,
   parseRalphMarkdown,
   planTaskDraftTarget,
   renderIterationPrompt,
   renderRalphBody,
-  shouldResetFailCount,
+  resolveCommandRun,
+  replaceArgsPlaceholders,
+  runtimeArgEntriesToMap,
   shouldStopForCompletionPromise,
   shouldWarnForBashFailure,
   shouldValidateExistingDraft,
   validateDraftContent,
   validateFrontmatter as validateFrontmatterMessage,
+  validateRuntimeArgs,
   createSiblingTarget,
   findBlockedCommandPattern,
 } from "./ralph.ts";
-import type { CommandDef, CommandOutput, DraftTarget, Frontmatter } from "./ralph.ts";
+import { matchesProtectedPath } from "./secret-paths.ts";
+import type { CommandDef, CommandOutput, DraftPlan, DraftTarget, Frontmatter, RuntimeArgs } from "./ralph.ts";
+import { createDraftPlan as createDraftPlanService } from "./ralph-draft.ts";
+import type { StrengthenDraftRuntime } from "./ralph-draft-llm.ts";
+import { runRalphLoop } from "./runner.ts";
+import {
+  checkStopSignal,
+  createStopSignal,
+  listActiveLoopRegistryEntries,
+  readActiveLoopRegistry,
+  readIterationRecords,
+  readStatusFile,
+  recordActiveLoopStopRequest,
+  writeActiveLoopRegistryEntry,
+  type ActiveLoopRegistryEntry,
+} from "./runner-state.ts";
+type ProgressState = boolean | "unknown"; // Tri-state: true = change detected, false = none detected, "unknown" = could not be verified.
+type IterationSummary = { // One entry per loop iteration; stored in LoopState.iterationSummaries and rendered by the summarize* helpers.
+  iteration: number;
+  duration: number; // Whole seconds when built by sanitizeIterationSummary (rounded from durationMs).
+  progress: ProgressState;
+  changedFiles: string[]; // presumably task-dir-relative paths from the snapshot diff — verify against the producer.
+  noProgressStreak: number;
+  snapshotTruncated?: boolean; // Feeds the "snapshot truncated" note in summarizeSnapshotCoverage.
+  snapshotErrorCount?: number; // Feeds the "N files unreadable" note in summarizeSnapshotCoverage.
+};
 type LoopState = {
   active: boolean;
   ralphPath: string;
+  taskDir: string;
+  cwd: string;
   iteration: number;
   maxIterations: number;
   timeout: number;
   completionPromise?: string;
   stopRequested: boolean;
-  iterationSummaries: Array<{ iteration: number; duration: number }>;
+  noProgressStreak: number;
+  iterationSummaries: IterationSummary[];
   guardrails: { blockCommands: string[]; protectedFiles: string[] };
-  loopSessionFile?: string;
+  observedTaskDirWrites: Set<string>;
+  loopToken?: string;
 };
 type PersistedLoopState = {
   active: boolean;
-  sessionFile?: string;
+  loopToken?: string;
+  cwd?: string;
+  taskDir?: string;
   iteration?: number;
   maxIterations?: number;
-  iterationSummaries?: Array<{ iteration: number; duration: number }>;
+  noProgressStreak?: number;
+  iterationSummaries?: IterationSummary[];
   guardrails?: { blockCommands: string[]; protectedFiles: string[] };
   stopRequested?: boolean;
 };
-function parseRalphMd(filePath: string) {
-  return parseRalphMarkdown(readFileSync(filePath, "utf8"));
-}
+type ActiveLoopState = PersistedLoopState & { active: true; loopToken: string; envMalformed?: boolean }; // Persisted state narrowed to an active loop; envMalformed is set to true by createFailClosedLoopState.
+type ActiveIterationState = ActiveLoopState & { iteration: number }; // Active state whose iteration is a number; produced by resolveActiveIterationState.
+const RALPH_RUNNER_TASK_DIR_ENV = "RALPH_RUNNER_TASK_DIR"; // When set and non-blank, resolveActiveLoopState derives state from the environment instead of the session.
+const RALPH_RUNNER_CWD_ENV = "RALPH_RUNNER_CWD"; // Read (trimmed) by readEnvLoopState; must be non-empty.
+const RALPH_RUNNER_LOOP_TOKEN_ENV = "RALPH_RUNNER_LOOP_TOKEN"; // Read (trimmed) by readEnvLoopState; must be non-empty.
+const RALPH_RUNNER_CURRENT_ITERATION_ENV = "RALPH_RUNNER_CURRENT_ITERATION"; // Integer string; readEnvLoopState requires a value >= 0.
+const RALPH_RUNNER_MAX_ITERATIONS_ENV = "RALPH_RUNNER_MAX_ITERATIONS"; // Integer string; readEnvLoopState requires a value > 0.
+const RALPH_RUNNER_NO_PROGRESS_STREAK_ENV = "RALPH_RUNNER_NO_PROGRESS_STREAK"; // Integer string; readEnvLoopState requires a value >= 0.
+const RALPH_RUNNER_GUARDRAILS_ENV = "RALPH_RUNNER_GUARDRAILS"; // JSON object with string-array fields blockCommands and protectedFiles (see parseLoopContractGuardrails).
+type CommandContext = ExtensionCommandContext; // Local alias for the host's command context type.
+type CommandSessionEntry = SessionEntry; // Local alias for the host's session entry type.
+type DraftPlanFactory = ( // Async factory for a DraftPlan; draftFromTask calls it with (task, target, ctx.cwd, runtime).
+  task: string,
+  target: DraftTarget,
+  cwd: string,
+  runtime?: StrengthenDraftRuntime,
+) => Promise<DraftPlan>;
+type RegisterRalphCommandServices = { // Optional service overrides; presumably injection points for tests — confirm at the registration site.
+  createDraftPlan?: DraftPlanFactory;
+  runRalphLoopFn?: typeof runRalphLoop;
+};
+type StopTargetSource = "session" | "registry" | "status"; // Where a StopTarget was discovered.
+type StopTarget = { // Identifies one loop that a stop request can be addressed to.
+  cwd: string;
+  taskDir: string;
+  ralphPath: string;
+  loopToken: string;
+  currentIteration: number;
+  maxIterations: number;
+  startedAt: string; // resolveSessionStopTarget fills this with its `now` argument.
+  source: StopTargetSource;
+};
+type ToolEvent = { // Loosely typed tool event; every field is optional. Consumers are outside this view.
+  toolName?: string;
+  toolCallId?: string;
+  input?: {
+    path?: string;
+    command?: string;
+  };
+  isError?: boolean;
+  success?: boolean;
+};
-function validateFrontmatter(fm: Frontmatter, ctx: any): boolean {
+type AgentEndEvent = PiAgentEndEvent; // Local alias for the host's agent-end event type.
+type ToolResultEvent = PiToolResultEvent; // Local alias for the host's tool-result event type.
+type BeforeAgentStartEvent = { // Only the systemPrompt field is modelled here.
+  systemPrompt: string;
+};
+type EventContext = Pick<CommandContext, "sessionManager">; // Event handlers only get the session manager slice of the command context.
+function validateFrontmatter(fm: Frontmatter, ctx: Pick<CommandContext, "ui">): boolean {
   const error = validateFrontmatterMessage(fm);
   if (error) {
     ctx.ui.notify(error, "error");
@@ -59,17 +150,30 @@ function validateFrontmatter(fm: Frontmatter, ctx: any): boolean {
   return true;
 }
-export async function runCommands(commands: CommandDef[], blockPatterns: string[], pi: ExtensionAPI): Promise<CommandOutput[]> {
+export async function runCommands(
+  commands: CommandDef[],
+  blockPatterns: string[],
+  pi: ExtensionAPI,
+  runtimeArgs: RuntimeArgs = {},
+  cwd?: string,
+  taskDir?: string,
+): Promise<CommandOutput[]> {
+  const repoCwd = cwd ?? process.cwd();
   const results: CommandOutput[] = [];
   for (const cmd of commands) {
-    const blockedPattern = findBlockedCommandPattern(cmd.run, blockPatterns);
+    const semanticRun = replaceArgsPlaceholders(cmd.run, runtimeArgs);
+    const blockedPattern = findBlockedCommandPattern(semanticRun, blockPatterns);
+    const resolvedRun = resolveCommandRun(cmd.run, runtimeArgs);
     if (blockedPattern) {
+      pi.appendEntry?.("ralph-blocked-command", { name: cmd.name, command: semanticRun, blockedPattern, cwd: repoCwd, taskDir });
       results.push({ name: cmd.name, output: `[blocked by guardrail: ${blockedPattern}]` });
       continue;
     }
+    const commandCwd = semanticRun.trim().startsWith("./") ? taskDir ?? repoCwd : repoCwd;
     try {
-      const result = await pi.exec("bash", ["-c", cmd.run], { timeout: cmd.timeout * 1000 });
+      const result = await pi.exec("bash", ["-c", resolvedRun], { timeout: cmd.timeout * 1000, cwd: commandCwd });
       results.push(
         result.killed
           ? { name: cmd.name, output: `[timed out after ${cmd.timeout}s]` }
@@ -83,22 +187,99 @@ export async function runCommands(commands: CommandDef[], blockPatterns: string[
   return results;
 }
+const SNAPSHOT_IGNORED_DIR_NAMES = new Set([ // Directory names that captureTaskDirectorySnapshot never descends into.
+  ".git",
+  "node_modules",
+  ".next",
+  ".turbo",
+  ".cache",
+  "coverage",
+  "dist",
+  "build",
+  ".ralph-runner",
+]);
+const SNAPSHOT_MAX_FILES = 200; // Snapshot is marked truncated once this many files have been recorded.
+const SNAPSHOT_MAX_BYTES = 2 * 1024 * 1024; // 2 MiB cap on the total bytes read for one snapshot.
+const SNAPSHOT_POST_IDLE_POLL_INTERVAL_MS = 20; // Delay between re-snapshots in assessTaskDirectoryProgress.
+const SNAPSHOT_POST_IDLE_POLL_WINDOW_MS = 100; // Total time assessTaskDirectoryProgress keeps re-snapshotting.
+const RALPH_PROGRESS_FILE = "RALPH_PROGRESS.md"; // Excluded from snapshots, alongside the RALPH file itself.
+type WorkspaceSnapshot = { // Result of captureTaskDirectorySnapshot.
+  files: Map<string, string>; // Forward-slash relative path -> "<byteLength>:<sha1 hex>" fingerprint.
+  truncated: boolean; // True when the file-count or byte cap stopped the walk early.
+  errorCount: number; // Number of directories/files that could not be read.
+};
+type ProgressAssessment = { // Result of assessTaskDirectoryProgress.
+  progress: ProgressState;
+  changedFiles: string[];
+  snapshotTruncated: boolean;
+  snapshotErrorCount: number;
+};
+type IterationCompletion = { // Value a pending iteration's Deferred settles with; producers are outside this view.
+  messages: PiAgentEndEvent["messages"];
+  observedTaskDirWrites: Set<string>;
+  error?: Error;
+};
+type Deferred<T> = { // Promise plus externally callable settle functions; built by createDeferred.
+  promise: Promise<T>;
+  resolve(value: T): void;
+  reject(reason?: unknown): void;
+  settled: boolean; // Flipped to true by the first resolve/reject call.
+};
+type PendingIterationState = { // Bookkeeping for an in-flight iteration; consumers are outside this view.
+  prompt: string;
+  completion: Deferred<IterationCompletion>;
+  toolCallPaths: Map<string, string>; // presumably toolCallId -> file path — verify against the tool-event handlers.
+  observedTaskDirWrites: Set<string>;
+};
+/**
+ * Builds a promise together with externally callable settle functions.
+ *
+ * The first call to `resolve` or `reject` settles the promise and flips `settled`;
+ * every later call is ignored. Neither function relies on `this`, so both may be
+ * passed around detached from the returned object.
+ */
+function createDeferred<T>(): Deferred<T> {
+  const settle: { fulfil?: (value: T) => void; fail?: (reason?: unknown) => void } = {};
+  const promise = new Promise<T>((fulfil, fail) => {
+    settle.fulfil = fulfil;
+    settle.fail = fail;
+  });
+  // Returns true only for the single call that wins the right to settle.
+  const claim = (): boolean => {
+    if (handle.settled) return false;
+    handle.settled = true;
+    return true;
+  };
+  const handle: Deferred<T> = {
+    promise,
+    resolve: (value: T) => {
+      if (claim()) settle.fulfil?.(value);
+    },
+    reject: (reason?: unknown) => {
+      if (claim()) settle.fail?.(reason);
+    },
+    settled: false,
+  };
+  return handle;
+}
 function defaultLoopState(): LoopState {
   return {
     active: false,
     ralphPath: "",
+    taskDir: "",
     iteration: 0,
     maxIterations: 50,
     timeout: 300,
     completionPromise: undefined,
     stopRequested: false,
+    noProgressStreak: 0,
     iterationSummaries: [],
     guardrails: { blockCommands: [], protectedFiles: [] },
-    loopSessionFile: undefined,
+    observedTaskDirWrites: new Set(),
+    loopToken: undefined,
+    cwd: "",
   };
 }
-function readPersistedLoopState(ctx: any): PersistedLoopState | undefined {
+function readPersistedLoopState(ctx: Pick<CommandContext, "sessionManager">): PersistedLoopState | undefined {
   const entries = ctx.sessionManager.getEntries();
   for (let i = entries.length - 1; i >= 0; i--) {
     const entry = entries[i];
@@ -113,6 +294,419 @@ function persistLoopState(pi: ExtensionAPI, data: PersistedLoopState) {
   pi.appendEntry("ralph-loop-state", data);
 }
+/**
+ * Projects the in-memory loop state onto the shape that is persisted to the session.
+ *
+ * @param state Live loop state to copy from.
+ * @param overrides Fields that replace the copied values; applied last.
+ * @returns A new object; `guardrails` is a fresh wrapper around the same arrays.
+ */
+function toPersistedLoopState(state: LoopState, overrides: Partial<PersistedLoopState> = {}): PersistedLoopState {
+  const { blockCommands, protectedFiles } = state.guardrails;
+  const base: PersistedLoopState = {
+    active: state.active,
+    loopToken: state.loopToken,
+    cwd: state.cwd,
+    taskDir: state.taskDir,
+    iteration: state.iteration,
+    maxIterations: state.maxIterations,
+    noProgressStreak: state.noProgressStreak,
+    iterationSummaries: state.iterationSummaries,
+    guardrails: { blockCommands, protectedFiles },
+    stopRequested: state.stopRequested,
+  };
+  return { ...base, ...overrides };
+}
+/**
+ * Returns the persisted session loop state only when it describes an active loop
+ * that carries a non-empty loop token; otherwise `undefined`.
+ */
+function readActiveLoopState(ctx: Pick<CommandContext, "sessionManager">): ActiveLoopState | undefined {
+  const persisted = readPersistedLoopState(ctx);
+  if (!persisted || persisted.active !== true) return undefined;
+  const token = persisted.loopToken;
+  const hasToken = typeof token === "string" && token.length > 0;
+  return hasToken ? (persisted as ActiveLoopState) : undefined;
+}
+/** Keeps only the string elements of `value`; anything that is not an array yields `[]`. */
+function sanitizeStringArray(value: unknown): string[] {
+  if (!Array.isArray(value)) return [];
+  const strings: string[] = [];
+  for (const item of value) {
+    if (typeof item === "string") strings.push(item);
+  }
+  return strings;
+}
+/**
+ * Coerces an untrusted value into a guardrails object.
+ * Non-object input, and fields that are not arrays, become empty lists.
+ */
+function sanitizeGuardrails(value: unknown): { blockCommands: string[]; protectedFiles: string[] } {
+  const isObject = typeof value === "object" && value !== null;
+  const source = (isObject ? value : {}) as { blockCommands?: unknown; protectedFiles?: unknown };
+  const blockCommands = sanitizeStringArray(source.blockCommands);
+  const protectedFiles = sanitizeStringArray(source.protectedFiles);
+  return { blockCommands, protectedFiles };
+}
+/** Passes booleans through unchanged; every other value collapses to `"unknown"`. */
+function sanitizeProgressState(value: unknown): ProgressState {
+  if (typeof value === "boolean") return value;
+  return "unknown";
+}
+/**
+ * Converts one untrusted iteration record into an IterationSummary.
+ *
+ * @param record Raw record; must be an object whose `loopToken` equals `loopToken`
+ *   and whose `iteration` is a finite number.
+ * @param loopToken Token of the loop the record has to belong to.
+ * @returns The summary, or `undefined` when the record is rejected. `duration` is
+ *   `durationMs` rounded to whole seconds; missing or non-finite numbers default to 0
+ *   (or stay `undefined` for `snapshotErrorCount`).
+ */
+function sanitizeIterationSummary(record: unknown, loopToken: string): IterationSummary | undefined {
+  if (typeof record !== "object" || record === null) return undefined;
+  const raw = record as Record<string, unknown>;
+  const finite = (candidate: unknown): number | undefined =>
+    typeof candidate === "number" && Number.isFinite(candidate) ? candidate : undefined;
+  if (raw.loopToken !== loopToken) return undefined;
+  const iteration = finite(raw.iteration);
+  if (iteration === undefined) return undefined;
+  const truncatedFlag = raw.snapshotTruncated;
+  return {
+    iteration,
+    duration: Math.round((finite(raw.durationMs) ?? 0) / 1000),
+    progress: sanitizeProgressState(raw.progress),
+    changedFiles: sanitizeStringArray(raw.changedFiles),
+    noProgressStreak: finite(raw.noProgressStreak) ?? 0,
+    snapshotTruncated: typeof truncatedFlag === "boolean" ? truncatedFlag : undefined,
+    snapshotErrorCount: finite(raw.snapshotErrorCount),
+  };
+}
+/**
+ * Parses a base-10 integer from an environment-style string.
+ * Surrounding whitespace is ignored; anything that is not an optional minus sign
+ * followed by digits, or that is outside the safe-integer range, yields `undefined`.
+ */
+function parseLoopContractInteger(raw: string | undefined): number | undefined {
+  const candidate = typeof raw === "string" ? raw.trim() : "";
+  // The empty string fails the pattern, which also covers the non-string case.
+  if (!/^-?\d+$/.test(candidate)) return undefined;
+  const value = Number(candidate);
+  if (!Number.isSafeInteger(value)) return undefined;
+  return value;
+}
+/**
+ * Parses the JSON guardrails contract.
+ *
+ * @param raw JSON text expected to encode `{ blockCommands: string[], protectedFiles: string[] }`.
+ * @returns Copies of both lists, or `undefined` when `raw` is not a string, is not
+ *   valid JSON, or either field is missing or contains a non-string element.
+ */
+function parseLoopContractGuardrails(raw: string | undefined): { blockCommands: string[]; protectedFiles: string[] } | undefined {
+  if (typeof raw !== "string") return undefined;
+  let decoded: unknown;
+  try {
+    decoded = JSON.parse(raw);
+  } catch {
+    return undefined;
+  }
+  if (typeof decoded !== "object" || decoded === null) return undefined;
+  const { blockCommands, protectedFiles } = decoded as { blockCommands?: unknown; protectedFiles?: unknown };
+  const allStrings = (candidate: unknown): candidate is string[] =>
+    Array.isArray(candidate) && candidate.every((element) => typeof element === "string");
+  if (!allStrings(blockCommands) || !allStrings(protectedFiles)) return undefined;
+  return { blockCommands: [...blockCommands], protectedFiles: [...protectedFiles] };
+}
+/** Type guard: true when `value` is an array containing no non-string element. */
+function isStringArray(value: unknown): value is string[] {
+  if (!Array.isArray(value)) return false;
+  return !value.some((item) => typeof item !== "string");
+}
+/** Order-sensitive equality: same length and the same string at every index. */
+function areStringArraysEqual(left: string[], right: string[]): boolean {
+  if (left.length !== right.length) return false;
+  return !left.some((item, index) => right[index] !== item);
+}
+/**
+ * Builds the state used when the runner's loop contract cannot be trusted.
+ *
+ * The result is flagged `envMalformed`, has an empty loop token and zeroed counters,
+ * and carries guardrails that match every command (`.*`) and every file (`**​/*`).
+ *
+ * @param taskDir Task directory; also queried for a pending stop signal.
+ * @param cwd Working directory; falls back to `taskDir` when missing or empty.
+ */
+function createFailClosedLoopState(taskDir: string, cwd?: string): ActiveLoopState {
+  const effectiveCwd = cwd?.length ? cwd : taskDir;
+  const denyAll = { blockCommands: [".*"], protectedFiles: ["**/*"] };
+  const failClosed: ActiveLoopState = {
+    active: true,
+    loopToken: "",
+    cwd: effectiveCwd,
+    taskDir,
+    iteration: 0,
+    maxIterations: 0,
+    noProgressStreak: 0,
+    iterationSummaries: [],
+    guardrails: denyAll,
+    stopRequested: checkStopSignal(taskDir),
+    envMalformed: true,
+  };
+  return failClosed;
+}
+function readEnvLoopState(taskDir: string): ActiveLoopState | undefined { // Rebuilds the active loop state from the RALPH_RUNNER_* environment variables; undefined when any of them is missing or invalid.
+  const cwd = process.env[RALPH_RUNNER_CWD_ENV]?.trim();
+  const loopToken = process.env[RALPH_RUNNER_LOOP_TOKEN_ENV]?.trim();
+  const currentIteration = parseLoopContractInteger(process.env[RALPH_RUNNER_CURRENT_ITERATION_ENV]);
+  const maxIterations = parseLoopContractInteger(process.env[RALPH_RUNNER_MAX_ITERATIONS_ENV]);
+  const noProgressStreak = parseLoopContractInteger(process.env[RALPH_RUNNER_NO_PROGRESS_STREAK_ENV]);
+  const guardrails = parseLoopContractGuardrails(process.env[RALPH_RUNNER_GUARDRAILS_ENV]);
+  if ( // All-or-nothing: a single bad field rejects the whole contract.
+    !cwd ||
+    !loopToken ||
+    currentIteration === undefined ||
+    currentIteration < 0 ||
+    maxIterations === undefined ||
+    maxIterations <= 0 ||
+    noProgressStreak === undefined ||
+    noProgressStreak < 0 ||
+    !guardrails
+  ) {
+    return undefined;
+  }
+  const iterationSummaries = readIterationRecords(taskDir) // Only records carrying this loop's token survive sanitizing.
+    .map((record) => sanitizeIterationSummary(record, loopToken))
+    .filter((summary): summary is IterationSummary => summary !== undefined);
+  return {
+    active: true,
+    loopToken,
+    cwd,
+    taskDir,
+    iteration: currentIteration,
+    maxIterations,
+    noProgressStreak,
+    iterationSummaries,
+    guardrails,
+    stopRequested: checkStopSignal(taskDir), // Stop flag comes from the task directory, not from the environment.
+  };
+}
+function readDurableLoopState(taskDir: string, envState: ActiveLoopState): ActiveLoopState | undefined { // Cross-checks the env-derived state against the status file in taskDir; undefined on any mismatch.
+  const envGuardrails = envState.guardrails;
+  if (!envGuardrails) return undefined;
+  const durableStatus = readStatusFile(taskDir);
+  if (!durableStatus || typeof durableStatus !== "object") return undefined;
+  const status = durableStatus as Record<string, unknown>;
+  const guardrails = status.guardrails as Record<string, unknown> | undefined;
+  if ( // Shape validation of the status file; it must also name this exact taskDir.
+    typeof status.loopToken !== "string" ||
+    status.loopToken.length === 0 ||
+    typeof status.cwd !== "string" ||
+    status.cwd.length === 0 ||
+    typeof status.currentIteration !== "number" ||
+    !Number.isInteger(status.currentIteration) ||
+    status.currentIteration < 0 ||
+    typeof status.maxIterations !== "number" ||
+    !Number.isInteger(status.maxIterations) ||
+    status.maxIterations <= 0 ||
+    typeof status.taskDir !== "string" ||
+    status.taskDir !== taskDir ||
+    !guardrails ||
+    !isStringArray(guardrails.blockCommands) ||
+    !isStringArray(guardrails.protectedFiles)
+  ) {
+    return undefined;
+  }
+  const durableLoopToken = status.loopToken;
+  const durableCwd = status.cwd;
+  const durableGuardrails = guardrails as { blockCommands: string[]; protectedFiles: string[] };
+  if ( // Env and status file must agree on token, cwd, iteration counters and guardrails (order-sensitive).
+    durableLoopToken !== envState.loopToken ||
+    durableCwd !== envState.cwd ||
+    status.currentIteration !== envState.iteration ||
+    status.maxIterations !== envState.maxIterations ||
+    !areStringArraysEqual(durableGuardrails.blockCommands, envGuardrails.blockCommands) ||
+    !areStringArraysEqual(durableGuardrails.protectedFiles, envGuardrails.protectedFiles)
+  ) {
+    return undefined;
+  }
+  const iterationSummaries = readIterationRecords(taskDir)
+    .map((record) => sanitizeIterationSummary(record, durableLoopToken))
+    .filter((summary): summary is IterationSummary => summary !== undefined);
+  return {
+    active: true,
+    loopToken: durableLoopToken,
+    cwd: durableCwd,
+    taskDir,
+    iteration: status.currentIteration,
+    maxIterations: status.maxIterations,
+    noProgressStreak: envState.noProgressStreak, // The streak is taken from the env state; it is not compared with the status file here.
+    iterationSummaries,
+    guardrails: { // Fresh copies so callers cannot mutate the parsed status object.
+      blockCommands: [...durableGuardrails.blockCommands],
+      protectedFiles: [...durableGuardrails.protectedFiles],
+    },
+    stopRequested: checkStopSignal(taskDir),
+  };
+}
+/**
+ * Resolves the active loop state for the current process.
+ *
+ * Without a runner task directory in the environment, the session's persisted state
+ * is used. With one, the environment contract must parse and must be confirmed by
+ * the durable status file; if either step fails, a fail-closed state is returned.
+ */
+function resolveActiveLoopState(ctx: Pick<CommandContext, "sessionManager">): ActiveLoopState | undefined {
+  const runnerTaskDir = process.env[RALPH_RUNNER_TASK_DIR_ENV]?.trim();
+  if (!runnerTaskDir) return readActiveLoopState(ctx);
+  const fromEnv = readEnvLoopState(runnerTaskDir);
+  if (!fromEnv) {
+    const rawCwd = process.env[RALPH_RUNNER_CWD_ENV]?.trim();
+    return createFailClosedLoopState(runnerTaskDir, rawCwd ? rawCwd : undefined);
+  }
+  const confirmed = readDurableLoopState(runnerTaskDir, fromEnv);
+  return confirmed ?? createFailClosedLoopState(runnerTaskDir, fromEnv.cwd);
+}
+/** Like resolveActiveLoopState, but only returns a state whose `iteration` is a number. */
+function resolveActiveIterationState(ctx: Pick<CommandContext, "sessionManager">): ActiveIterationState | undefined {
+  const resolved = resolveActiveLoopState(ctx);
+  const hasIteration = resolved !== undefined && typeof resolved.iteration === "number";
+  return hasIteration ? (resolved as ActiveIterationState) : undefined;
+}
+/** Composes the `<loopToken>:<iteration>` key identifying one iteration of one loop. */
+function getLoopIterationKey(loopToken: string, iteration: number): string {
+  return loopToken + ":" + iteration;
+}
+/** Rewrites every backslash in `filePath` to a forward slash. */
+function normalizeSnapshotPath(filePath: string): string {
+  return filePath.replace(/\\/g, "/");
+}
+/**
+ * Fingerprints the files under the task directory that contains `ralphPath`.
+ *
+ * Directories are walked depth-first in name order. Directories named in
+ * SNAPSHOT_IGNORED_DIR_NAMES, entries that are not regular files, the RALPH file
+ * itself and the progress-memory file are skipped. Each recorded file maps its
+ * forward-slash relative path to `<byteLength>:<sha1 hex>`.
+ *
+ * The walk stops and marks the snapshot `truncated` once SNAPSHOT_MAX_FILES files
+ * are recorded or reading the next file would exceed SNAPSHOT_MAX_BYTES. Unreadable
+ * directories and files are counted in `errorCount` instead of throwing.
+ *
+ * @param ralphPath Path of the RALPH file; its parent directory is the snapshot root.
+ * @returns The fingerprints plus truncation and error indicators.
+ */
+function captureTaskDirectorySnapshot(ralphPath: string): WorkspaceSnapshot {
+  const taskDir = dirname(ralphPath);
+  const progressMemoryPath = join(taskDir, RALPH_PROGRESS_FILE);
+  const files = new Map<string, string>();
+  let truncated = false;
+  let bytesRead = 0;
+  let errorCount = 0;
+  const walk = (dirPath: string) => {
+    let entries;
+    try {
+      // Sorted so the traversal (and therefore which files survive truncation) is stable.
+      entries = readdirSync(dirPath, { withFileTypes: true }).sort((a, b) => a.name.localeCompare(b.name));
+    } catch {
+      errorCount += 1;
+      return;
+    }
+    for (const entry of entries) {
+      if (truncated) return;
+      const fullPath = join(dirPath, entry.name);
+      if (entry.isDirectory()) {
+        if (SNAPSHOT_IGNORED_DIR_NAMES.has(entry.name)) continue;
+        walk(fullPath);
+        continue;
+      }
+      if (!entry.isFile() || fullPath === ralphPath || fullPath === progressMemoryPath) continue;
+      if (files.size >= SNAPSHOT_MAX_FILES) {
+        truncated = true;
+        return;
+      }
+      const relPath = normalizeSnapshotPath(relative(taskDir, fullPath));
+      // Reject only a leading ".." path segment. A plain prefix test would also drop
+      // legitimate names such as "..notes.md", hiding their changes from progress detection.
+      if (!relPath || relPath === ".." || relPath.startsWith("../")) continue;
+      let content;
+      try {
+        content = readFileSync(fullPath);
+      } catch {
+        errorCount += 1;
+        continue;
+      }
+      if (bytesRead + content.byteLength > SNAPSHOT_MAX_BYTES) {
+        truncated = true;
+        return;
+      }
+      bytesRead += content.byteLength;
+      files.set(relPath, `${content.byteLength}:${createHash("sha1").update(content).digest("hex")}`);
+    }
+  };
+  if (existsSync(taskDir)) walk(taskDir);
+  return { files, truncated, errorCount };
+}
+/**
+ * Lists the paths that differ between two snapshots: files that were removed or
+ * whose fingerprint changed, followed by files that are new, sorted with
+ * `localeCompare`.
+ */
+function diffTaskDirectorySnapshots(before: WorkspaceSnapshot, after: WorkspaceSnapshot): string[] {
+  const removedOrModified = [...before.files]
+    .filter(([filePath, fingerprint]) => after.files.get(filePath) !== fingerprint)
+    .map(([filePath]) => filePath);
+  const added = [...after.files.keys()].filter((filePath) => !before.files.has(filePath));
+  return [...removedOrModified, ...added].sort((a, b) => a.localeCompare(b));
+}
+/**
+ * Maps a reported file path to its location relative to the task directory.
+ *
+ * @param taskDir Task directory; resolved to an absolute path before comparison.
+ * @param cwd Base directory that a relative `filePath` is resolved against.
+ * @param filePath Path to classify; may be absolute or relative to `cwd`.
+ * @returns The forward-slash relative path when the file lies strictly inside
+ *   `taskDir`; `undefined` for an empty argument, the task directory itself, or
+ *   anything outside it.
+ */
+function resolveTaskDirObservedPath(taskDir: string, cwd: string, filePath: string): string | undefined {
+  if (!taskDir || !cwd || !filePath) return undefined;
+  const absoluteTarget = resolve(cwd, filePath);
+  const rawRelative = relative(resolve(taskDir), absoluteTarget);
+  // When the two paths share no root (e.g. different Windows drives), path.relative hands
+  // back the absolute target unchanged; that location is outside the task directory.
+  if (rawRelative === absoluteTarget) return undefined;
+  const relPath = normalizeSnapshotPath(rawRelative);
+  if (!relPath || relPath === ".") return undefined;
+  // Only a leading ".." path segment escapes the task directory; a file that is merely
+  // named "..notes.md" is still inside it and must be reported.
+  if (relPath === ".." || relPath.startsWith("../")) return undefined;
+  return relPath;
+}
+/** Returns a promise that resolves (with no value) after `ms` milliseconds. */
+function delay(ms: number): Promise<void> {
+  return new Promise<void>((wake) => {
+    setTimeout(() => wake(), ms);
+  });
+}
+async function assessTaskDirectoryProgress( // Decides whether the task directory changed relative to the `before` snapshot.
+  ralphPath: string,
+  before: WorkspaceSnapshot,
+  observedTaskDirWrites: ReadonlySet<string>,
+): Promise<ProgressAssessment> {
+  let after = captureTaskDirectorySnapshot(ralphPath);
+  let changedFiles = diffTaskDirectorySnapshots(before, after);
+  let snapshotTruncated = before.truncated || after.truncated;
+  let snapshotErrorCount = before.errorCount + after.errorCount;
+  if (changedFiles.length > 0) { // Fast path: the first snapshot already shows a difference.
+    return { progress: true, changedFiles, snapshotTruncated, snapshotErrorCount };
+  }
+  for (let remainingMs = SNAPSHOT_POST_IDLE_POLL_WINDOW_MS; remainingMs > 0; remainingMs -= SNAPSHOT_POST_IDLE_POLL_INTERVAL_MS) { // No change yet: re-snapshot every poll interval until the window elapses.
+    await delay(Math.min(SNAPSHOT_POST_IDLE_POLL_INTERVAL_MS, remainingMs));
+    after = captureTaskDirectorySnapshot(ralphPath);
+    changedFiles = diffTaskDirectorySnapshots(before, after);
+    snapshotTruncated ||= after.truncated;
+    snapshotErrorCount += after.errorCount; // NOTE(review): sums the errors of every snapshot taken, so one unreadable file is counted once per poll.
+    if (changedFiles.length > 0) {
+      return { progress: true, changedFiles, snapshotTruncated, snapshotErrorCount };
+    }
+  }
+  if (observedTaskDirWrites.size > 0) { // Writes were observed but no diff is visible: report "unknown" rather than false.
+    return { progress: "unknown", changedFiles: [], snapshotTruncated, snapshotErrorCount };
+  }
+  return {
+    progress: snapshotTruncated || snapshotErrorCount > 0 ? "unknown" : false, // Incomplete coverage cannot prove that nothing changed.
+    changedFiles,
+    snapshotTruncated,
+    snapshotErrorCount,
+  };
+}
+/**
+ * Renders a short, comma-separated list of changed files: `"none"` when empty, at
+ * most the first five paths, and a `(+N more)` suffix for the remainder.
+ */
+function summarizeChangedFiles(changedFiles: string[]): string {
+  const total = changedFiles.length;
+  if (total === 0) return "none";
+  const shown = changedFiles.slice(0, 5);
+  const hiddenCount = total - shown.length;
+  const listing = shown.join(", ");
+  return hiddenCount === 0 ? listing : `${listing} (+${hiddenCount} more)`;
+}
+/**
+ * Describes why a snapshot may be incomplete. Returns an empty string when the
+ * snapshot was neither truncated nor affected by read errors.
+ */
+function summarizeSnapshotCoverage(truncated: boolean, errorCount: number): string {
+  const truncationNote = truncated ? "snapshot truncated" : "";
+  let errorNote = "";
+  if (errorCount > 0) {
+    errorNote = errorCount === 1 ? "1 file unreadable" : `${errorCount} files unreadable`;
+  }
+  return [truncationNote, errorNote].filter((note) => note.length > 0).join(", ");
+}
+/**
+ * One-phrase description of an iteration's progress: confirmed (with the changed
+ * files), none, or unknown (with the coverage caveat when there is one).
+ */
+function summarizeIterationProgress(summary: Pick<IterationSummary, "progress" | "changedFiles" | "snapshotTruncated" | "snapshotErrorCount">): string {
+  switch (summary.progress) {
+    case true:
+      return `durable progress (${summarizeChangedFiles(summary.changedFiles)})`;
+    case false:
+      return "no durable progress";
+    default: {
+      const caveat = summarizeSnapshotCoverage(summary.snapshotTruncated ?? false, summary.snapshotErrorCount ?? 0);
+      if (!caveat) return "durable progress unknown";
+      return `durable progress unknown (${caveat})`;
+    }
+  }
+}
+/**
+ * Builds the feedback sentence about the previous iteration.
+ *
+ * @param summary Summary of the last iteration; `undefined` yields an empty string.
+ * @param fallbackNoProgressStreak Streak to report when the summary carries none.
+ */
+function summarizeLastIterationFeedback(summary: IterationSummary | undefined, fallbackNoProgressStreak: number): string {
+  if (summary === undefined) return "";
+  const streak = summary.noProgressStreak ?? fallbackNoProgressStreak;
+  switch (summary.progress) {
+    case true:
+      return `Last iteration durable progress: ${summarizeChangedFiles(summary.changedFiles)}.`;
+    case false:
+      return `Last iteration made no durable progress. No-progress streak: ${streak}.`;
+    default: {
+      const coverage = summarizeSnapshotCoverage(summary.snapshotTruncated ?? false, summary.snapshotErrorCount ?? 0);
+      const detail = coverage ? ` (${coverage})` : "";
+      return `Last iteration durable progress could not be verified${detail}. No-progress streak remains ${streak}.`;
+    }
+  }
+}
 function writeDraftFile(ralphPath: string, content: string) {
   mkdirSync(dirname(ralphPath), { recursive: true });
   writeFileSync(ralphPath, content, "utf8");
@@ -123,14 +717,14 @@ function displayPath(cwd: string, filePath: string): string {
   return rel && !rel.startsWith("..") ? `./${rel}` : filePath;
 }
-async function promptForTask(ctx: any, title: string, placeholder: string): Promise<string | undefined> {
+async function promptForTask(ctx: Pick<CommandContext, "hasUI" | "ui">, title: string, placeholder: string): Promise<string | undefined> {
   if (!ctx.hasUI) return undefined;
   const value = await ctx.ui.input(title, placeholder);
   const trimmed = value?.trim();
   return trimmed ? trimmed : undefined;
 }
-async function reviewDraft(plan: ReturnType<typeof generateDraft>, mode: "run" | "draft", ctx: any): Promise<{ action: "start" | "save" | "cancel"; content: string }> {
+async function reviewDraft(plan: DraftPlan, mode: "run" | "draft", ctx: Pick<CommandContext, "ui">): Promise<{ action: "start" | "save" | "cancel"; content: string }> {
   let content = plan.content;
   while (true) {
@@ -162,7 +756,7 @@ async function reviewDraft(plan: ReturnType<typeof generateDraft>, mode: "run" |
   }
 }
-async function editExistingDraft(ralphPath: string, ctx: any, saveMessage = "Saved RALPH.md") {
+async function editExistingDraft(ralphPath: string, ctx: Pick<CommandContext, "cwd" | "hasUI" | "ui">, saveMessage = "Saved RALPH.md") {
   if (!ctx.hasUI) {
     ctx.ui.notify(`Use ${displayPath(ctx.cwd, ralphPath)} in an interactive session to edit the draft.`, "warning");
     return;
@@ -194,7 +788,7 @@ async function editExistingDraft(ralphPath: string, ctx: any, saveMessage = "Sav
 async function chooseRecoveryMode(
   input: string,
   dirPath: string,
-  ctx: any,
+  ctx: Pick<CommandContext, "cwd" | "ui">,
   allowTaskFallback = true,
 ): Promise<"draft-path" | "task" | "cancel"> {
   const options = allowTaskFallback ? ["Draft in that folder", "Treat as task text", "Cancel"] : ["Draft in that folder", "Cancel"];
@@ -204,7 +798,7 @@ async function chooseRecoveryMode(
   return "cancel";
 }
-async function chooseConflictTarget(commandName: "ralph" | "ralph-draft", task: string, target: DraftTarget, ctx: any): Promise<{ action: "run-existing" | "open-existing" | "draft-target" | "cancel"; target?: DraftTarget }> {
+async function chooseConflictTarget(commandName: "ralph" | "ralph-draft", task: string, target: DraftTarget, ctx: Pick<CommandContext, "cwd" | "ui">): Promise<{ action: "run-existing" | "open-existing" | "draft-target" | "cancel"; target?: DraftTarget }> {
   const hasExistingDraft = existsSync(target.ralphPath);
   const title = hasExistingDraft
     ? `Found an existing RALPH at ${displayPath(ctx.cwd, target.ralphPath)} for “${task}”.`
@@ -225,8 +819,23 @@ async function chooseConflictTarget(commandName: "ralph" | "ralph-draft", task:
   return { action: "draft-target", target: createSiblingTarget(ctx.cwd, target.slug) };
 }
-async function draftFromTask(commandName: "ralph" | "ralph-draft", task: string, target: DraftTarget, ctx: any): Promise<string | undefined> {
-  const plan = generateDraft(task, target, inspectRepo(ctx.cwd));
+/**
+ * Extracts the model and model registry needed for draft strengthening.
+ * Returns `undefined` unless the context provides both.
+ */
+function getDraftStrengtheningRuntime(ctx: Pick<CommandContext, "model" | "modelRegistry">): StrengthenDraftRuntime | undefined {
+  const { model, modelRegistry } = ctx;
+  return model && modelRegistry ? { model, modelRegistry } : undefined;
+}
+async function draftFromTask(
+  commandName: "ralph" | "ralph-draft",
+  task: string,
+  target: DraftTarget,
+  ctx: Pick<CommandContext, "cwd" | "ui">,
+  draftPlanFactory: DraftPlanFactory,
+  runtime?: StrengthenDraftRuntime,
+): Promise<string | undefined> {
+  const plan = await draftPlanFactory(task, target, ctx.cwd, runtime);
   const review = await reviewDraft(plan, commandName === "ralph" ? "run" : "draft", ctx);
   if (review.action === "cancel") return undefined;
@@ -238,41 +847,223 @@ async function draftFromTask(commandName: "ralph" | "ralph-draft", task: string,
   return target.ralphPath;
 }
+function resolveSessionStopTarget(ctx: Pick<CommandContext, "cwd" | "sessionManager">, now: string): { // Picks a stop target for this session: in-memory loop first, then the state read from ctx.
+  target?: StopTarget;
+  persistedSessionState?: ActiveLoopState;
+} {
+  if (loopState.active) { // A loop is marked active in memory; describe it from loopState.
+    return {
+      target: {
+        cwd: loopState.cwd || ctx.cwd, // Falls back to the command's cwd when loopState has none.
+        taskDir: loopState.taskDir,
+        ralphPath: loopState.ralphPath,
+        loopToken: loopState.loopToken ?? "", // Empty string when no token is set.
+        currentIteration: loopState.iteration,
+        maxIterations: loopState.maxIterations,
+        startedAt: now, // Caller-supplied timestamp.
+        source: "session",
+      },
+    };
+  }
+  const persistedSessionState = readActiveLoopState(ctx); // No active in-memory loop: consult readActiveLoopState instead.
+  if (
+    !persistedSessionState ||
+    typeof persistedSessionState.taskDir !== "string" ||
+    persistedSessionState.taskDir.length === 0 ||
+    typeof persistedSessionState.loopToken !== "string" ||
+    persistedSessionState.loopToken.length === 0 ||
+    typeof persistedSessionState.iteration !== "number" ||
+    typeof persistedSessionState.maxIterations !== "number"
+  ) {
+    return { persistedSessionState }; // Missing or incomplete fields: return the state without a target.
+  }
+  return {
+    persistedSessionState,
+    target: {
+      cwd: typeof persistedSessionState.cwd === "string" && persistedSessionState.cwd.length > 0 ? persistedSessionState.cwd : ctx.cwd,
+      taskDir: persistedSessionState.taskDir,
+      ralphPath: join(persistedSessionState.taskDir, "RALPH.md"), // Derived from taskDir rather than read from the state.
+      loopToken: persistedSessionState.loopToken,
+      currentIteration: persistedSessionState.iteration,
+      maxIterations: persistedSessionState.maxIterations,
+      startedAt: now, // Caller-supplied timestamp.
+      source: "session",
+    },
+  };
+}
+function materializeRegistryStopTarget(entry: ActiveLoopRegistryEntry): StopTarget { // Copies a registry entry's fields into a StopTarget.
+  return {
+    cwd: entry.cwd,
+    taskDir: entry.taskDir,
+    ralphPath: entry.ralphPath,
+    loopToken: entry.loopToken,
+    currentIteration: entry.currentIteration,
+    maxIterations: entry.maxIterations,
+    startedAt: entry.startedAt,
+    source: "registry", // Tags the target as registry-sourced (session targets use "session").
+  };
+}
+function applyStopTarget( // Requests a stop for the target: stop signal, registry entry, stop-request record, session state, then a UI notice.
+  pi: ExtensionAPI,
+  ctx: Pick<CommandContext, "cwd" | "ui">,
+  target: StopTarget,
+  now: string,
+  persistedSessionState?: ActiveLoopState,
+): void {
+  createStopSignal(target.taskDir);
+  const registryCwd = target.cwd;
+  const existingEntry = readActiveLoopRegistry(registryCwd).find((entry) => entry.taskDir === target.taskDir); // Entry already registered for this task directory, if any.
+  const registryEntry: ActiveLoopRegistryEntry = existingEntry
+    ? {
+        ...existingEntry, // Keep stored fields; only taskDir, ralphPath, cwd and updatedAt are overwritten below.
+        taskDir: target.taskDir,
+        ralphPath: target.ralphPath,
+        cwd: registryCwd,
+        updatedAt: now,
+      }
+    : { // No entry yet: build one from the target.
+        taskDir: target.taskDir,
+        ralphPath: target.ralphPath,
+        cwd: registryCwd,
+        loopToken: target.loopToken,
+        status: "running",
+        currentIteration: target.currentIteration,
+        maxIterations: target.maxIterations,
+        startedAt: target.startedAt,
+        updatedAt: now,
+      };
+  writeActiveLoopRegistryEntry(registryCwd, registryEntry);
+  recordActiveLoopStopRequest(registryCwd, target.taskDir, now);
+  if (target.source === "session") { // Only session-sourced targets also touch loopState and the persisted session state.
+    loopState.stopRequested = true;
+    if (loopState.active) {
+      persistLoopState(pi, toPersistedLoopState(loopState, { active: true, stopRequested: true }));
+    } else if (persistedSessionState?.active) { // No active in-memory loop: re-persist the supplied state with stopRequested set.
+      persistLoopState(pi, { ...persistedSessionState, stopRequested: true });
+    }
+  }
+  ctx.ui.notify("Ralph loop stopping after current iteration…", "info");
+}
 let loopState: LoopState = defaultLoopState();
+const RALPH_EXTENSION_REGISTERED = Symbol.for("pi-ralph-loop.registered");
-export default function (pi: ExtensionAPI) {
+export default function (pi: ExtensionAPI, services: RegisterRalphCommandServices = {}) {
+  const registeredPi = pi as ExtensionAPI & Record<symbol, boolean | undefined>;
+  if (registeredPi[RALPH_EXTENSION_REGISTERED]) return;
+  registeredPi[RALPH_EXTENSION_REGISTERED] = true;
   const failCounts = new Map<string, number>();
-  const isLoopSession = (ctx: any): boolean => {
-    const state = readPersistedLoopState(ctx);
-    const sessionFile = ctx.sessionManager.getSessionFile();
-    return state?.active === true && state.sessionFile === sessionFile;
+  const pendingIterations = new Map<string, PendingIterationState>();
+  const draftPlanFactory = services.createDraftPlan ?? createDraftPlanService;
+  const isLoopSession = (ctx: Pick<CommandContext, "sessionManager">): boolean => resolveActiveLoopState(ctx) !== undefined;
+  const appendLoopProofEntry = (customType: string, data: Record<string, unknown>): void => { // Appends an entry via pi.appendEntry without letting a failure propagate.
+    try {
+      pi.appendEntry?.(customType, data); // Optional call: skipped when appendEntry is not defined.
+    } catch (err) {
+      const message = err instanceof Error ? err.message : String(err);
+      try {
+        process.stderr.write(`Ralph proof logging failed for ${customType}: ${message}\n`); // Report the failure on stderr instead of rethrowing.
+      } catch {
+        // Best-effort surfacing only.
+      }
+    }
+  };
+  const getPendingIteration = (ctx: Pick<CommandContext, "sessionManager">): PendingIterationState | undefined => { // Looks up the pending state for the active iteration resolved from ctx.
+    const state = resolveActiveIterationState(ctx);
+    return state ? pendingIterations.get(getLoopIterationKey(state.loopToken, state.iteration)) : undefined; // undefined when no active iteration state resolves or nothing is stored under its key.
+  };
+  const registerPendingIteration = (loopToken: string, iteration: number, prompt: string): PendingIterationState => { // Creates fresh pending state and stores it under the loop-token/iteration key.
+    const pending: PendingIterationState = {
+      prompt,
+      completion: createDeferred<IterationCompletion>(), // Resolved later by resolvePendingIteration.
+      toolCallPaths: new Map(),
+      observedTaskDirWrites: new Set(),
+    };
+    pendingIterations.set(getLoopIterationKey(loopToken, iteration), pending);
+    return pending;
+  };
+  const clearPendingIteration = (loopToken: string, iteration: number) => { // Removes the pending state stored for the given loop token and iteration.
+    pendingIterations.delete(getLoopIterationKey(loopToken, iteration));
+  };
+  const resolvePendingIteration = (ctx: EventContext, event: AgentEndEvent) => { // Resolves the pending iteration's completion from an agent_end event.
+    const state = resolveActiveIterationState(ctx);
+    if (!state) return;
+    const pendingKey = getLoopIterationKey(state.loopToken, state.iteration);
+    const pending = pendingIterations.get(pendingKey);
+    if (!pending) return; // Nothing registered for this iteration.
+    pendingIterations.delete(pendingKey); // Drop the map entry before resolving its deferred.
+    const rawError = (event as { error?: unknown }).error;
+    const error = rawError instanceof Error ? rawError : rawError ? new Error(String(rawError)) : undefined; // Wrap truthy non-Error values in an Error; falsy values become undefined.
+    pending.completion.resolve({
+      messages: event.messages ?? [],
+      observedTaskDirWrites: new Set(pending.observedTaskDirWrites), // Hands out a copy of the set.
+      error,
+    });
+  };
+  const recordPendingToolPath = (ctx: EventContext, event: ToolEvent) => { // Remembers the path of a write/edit tool call, keyed by tool call id.
+    const pending = getPendingIteration(ctx);
+    if (!pending) return;
+    if (event.toolName !== "write" && event.toolName !== "edit") return; // Other tools are ignored.
+    const toolCallId = typeof event.toolCallId === "string" ? event.toolCallId : undefined;
+    const filePath = event.input?.path ?? "";
+    if (toolCallId && filePath) pending.toolCallPaths.set(toolCallId, filePath); // Stored only when both an id and a non-empty path exist.
+  };
+  const recordSuccessfulTaskDirWrite = (ctx: EventContext, event: ToolEvent) => { // Adds a finished write/edit to the pending iteration's observed task-directory writes.
+    const pending = getPendingIteration(ctx);
+    if (!pending) return;
+    if (event.toolName !== "write" && event.toolName !== "edit") return; // Other tools are ignored.
+    const toolCallId = typeof event.toolCallId === "string" ? event.toolCallId : undefined;
+    const filePath = toolCallId ? pending.toolCallPaths.get(toolCallId) : undefined;
+    if (toolCallId) pending.toolCallPaths.delete(toolCallId); // The remembered path is removed whether or not the call succeeded.
+    if (event.isError === true || event.success === false || !filePath) return; // Failed calls and calls with no remembered path are not recorded.
+    const persisted = resolveActiveLoopState(ctx);
+    const taskDirPath = persisted?.taskDir ?? loopState.taskDir; // Prefer the resolved active state; fall back to in-memory loopState.
+    const cwd = persisted?.cwd ?? loopState.cwd;
+    const relPath = resolveTaskDirObservedPath(taskDirPath ?? "", cwd ?? taskDirPath ?? "", filePath);
+    if (relPath && relPath !== RALPH_PROGRESS_FILE) pending.observedTaskDirWrites.add(relPath); // A result equal to RALPH_PROGRESS_FILE is not recorded.
   };
-  async function startRalphLoop(ralphPath: string, ctx: any) {
+  async function startRalphLoop(ralphPath: string, ctx: CommandContext, runLoopFn: typeof runRalphLoop = runRalphLoop, runtimeArgs: RuntimeArgs = {}) {
     let name: string;
     try {
       const raw = readFileSync(ralphPath, "utf8");
-      if (shouldValidateExistingDraft(raw)) {
-        const draftError = validateDraftContent(raw);
-        if (draftError) {
-          ctx.ui.notify(`Invalid RALPH.md: ${draftError}`, "error");
-          return;
-        }
+      const draftError = validateDraftContent(raw);
+      if (draftError) {
+        ctx.ui.notify(`Invalid RALPH.md: ${draftError}`, "error");
+        return;
       }
-      const { frontmatter } = parseRalphMd(ralphPath);
+      const parsed = parseRalphMarkdown(raw);
+      const { frontmatter } = parsed;
       if (!validateFrontmatter(frontmatter, ctx)) return;
-      name = basename(dirname(ralphPath));
+      const runtimeValidationError = validateRuntimeArgs(frontmatter, parsed.body, frontmatter.commands, runtimeArgs);
+      if (runtimeValidationError) {
+        ctx.ui.notify(runtimeValidationError, "error");
+        return;
+      }
+      const taskDir = dirname(ralphPath);
+      name = basename(taskDir);
       loopState = {
         active: true,
         ralphPath,
+        taskDir,
+        cwd: ctx.cwd,
         iteration: 0,
         maxIterations: frontmatter.maxIterations,
         timeout: frontmatter.timeout,
         completionPromise: frontmatter.completionPromise,
         stopRequested: false,
+        noProgressStreak: 0,
         iterationSummaries: [],
         guardrails: { blockCommands: frontmatter.guardrails.blockCommands, protectedFiles: frontmatter.guardrails.protectedFiles },
-        loopSessionFile: undefined,
+        observedTaskDirWrites: new Set(),
+        loopToken: randomUUID(),
       };
     } catch (err) {
       ctx.ui.notify(String(err), "error");
@@ -281,143 +1072,118 @@ export default function (pi: ExtensionAPI) {
     ctx.ui.notify(`Ralph loop started: ${name} (max ${loopState.maxIterations} iterations)`, "info");
     try {
-      iterationLoop: for (let i = 1; i <= loopState.maxIterations; i++) {
-        if (loopState.stopRequested) break;
-        const persistedBefore = readPersistedLoopState(ctx);
-        if (persistedBefore?.active && persistedBefore.stopRequested) {
-          loopState.stopRequested = true;
-          ctx.ui.notify("Ralph loop stopping after current iteration…", "info");
-          break;
-        }
+      const result = await runLoopFn({
+        ralphPath,
+        cwd: ctx.cwd,
+        timeout: loopState.timeout,
+        maxIterations: loopState.maxIterations,
+        guardrails: loopState.guardrails,
+        runtimeArgs,
+        modelPattern: ctx.model ? `${ctx.model.provider}/${ctx.model.id}` : undefined,
+        thinkingLevel: ctx.model?.reasoning ? "high" : undefined,
+        runCommandsFn: async (commands, blocked, commandPi, cwd, taskDir) => runCommands(commands, blocked, commandPi as ExtensionAPI, runtimeArgs, cwd, taskDir),
+        onStatusChange(status) {
+          ctx.ui.setStatus("ralph", status === "running" || status === "initializing" ? `🔁 ${name}: running` : undefined);
+        },
+        onNotify(message, level) {
+          ctx.ui.notify(message, level);
+        },
+        onIterationComplete(record) {
+          loopState.iteration = record.iteration;
+          loopState.noProgressStreak = record.noProgressStreak;
+          const summary: IterationSummary = {
+            iteration: record.iteration,
+            duration: record.durationMs ? Math.round(record.durationMs / 1000) : 0,
+            progress: record.progress,
+            changedFiles: record.changedFiles,
+            noProgressStreak: record.noProgressStreak,
+          };
+          loopState.iterationSummaries.push(summary);
+          pi.appendEntry("ralph-iteration", {
+            iteration: record.iteration,
+            duration: summary.duration,
+            ralphPath: loopState.ralphPath,
+            progress: record.progress,
+            changedFiles: record.changedFiles,
+            noProgressStreak: record.noProgressStreak,
+          });
+          persistLoopState(pi, toPersistedLoopState(loopState, { active: true, stopRequested: false }));
+        },
+        pi,
+      });
-        loopState.iteration = i;
-        const iterStart = Date.now();
-        const { frontmatter: fm, body: rawBody } = parseRalphMd(loopState.ralphPath);
-        if (!validateFrontmatter(fm, ctx)) {
-          ctx.ui.notify(`Invalid RALPH.md on iteration ${i}, stopping loop`, "error");
+      // Map runner result to UI notifications
+      const total = loopState.iterationSummaries.reduce((a, s) => a + s.duration, 0);
+      switch (result.status) {
+        case "complete":
+          ctx.ui.notify(`Ralph loop complete: completion promise matched on iteration ${result.iterations.length} (${total}s total)`, "info");
           break;
-        }
-        loopState.maxIterations = fm.maxIterations;
-        loopState.timeout = fm.timeout;
-        loopState.completionPromise = fm.completionPromise;
-        loopState.guardrails = { blockCommands: fm.guardrails.blockCommands, protectedFiles: fm.guardrails.protectedFiles };
-        const outputs = await runCommands(fm.commands, fm.guardrails.blockCommands, pi);
-        const body = renderRalphBody(rawBody, outputs, { iteration: i, name });
-        const prompt = renderIterationPrompt(body, i, loopState.maxIterations);
-        const prevPersisted = readPersistedLoopState(ctx);
-        if (prevPersisted?.active && prevPersisted.sessionFile === ctx.sessionManager.getSessionFile()) {
-          persistLoopState(pi, { ...prevPersisted, active: false });
-        }
-        ctx.ui.setStatus("ralph", `🔁 ${name}: iteration ${i}/${loopState.maxIterations}`);
-        const prevSessionFile = loopState.loopSessionFile;
-        const { cancelled } = await ctx.newSession();
-        if (cancelled) {
-          ctx.ui.notify("Session switch cancelled, stopping loop", "warning");
+        case "max-iterations":
+          ctx.ui.notify(`Ralph loop reached max iterations: ${result.iterations.length} iterations, ${total}s total`, "info");
           break;
-        }
-        loopState.loopSessionFile = ctx.sessionManager.getSessionFile();
-        if (shouldResetFailCount(prevSessionFile, loopState.loopSessionFile)) failCounts.delete(prevSessionFile!);
-        if (loopState.loopSessionFile) failCounts.set(loopState.loopSessionFile, 0);
-        persistLoopState(pi, {
-          active: true,
-          sessionFile: loopState.loopSessionFile,
-          iteration: loopState.iteration,
-          maxIterations: loopState.maxIterations,
-          iterationSummaries: loopState.iterationSummaries,
-          guardrails: { blockCommands: loopState.guardrails.blockCommands, protectedFiles: loopState.guardrails.protectedFiles },
-          stopRequested: false,
-        });
-        pi.sendUserMessage(prompt);
-        const timeoutMs = fm.timeout * 1000;
-        let timedOut = false;
-        let idleError: Error | undefined;
-        let timer: ReturnType<typeof setTimeout> | undefined;
-        try {
-          await Promise.race([
-            ctx.waitForIdle().catch((e: any) => {
-              idleError = e instanceof Error ? e : new Error(String(e));
-              throw e;
-            }),
-            new Promise<never>((_, reject) => {
-              timer = setTimeout(() => {
-                timedOut = true;
-                reject(new Error("timeout"));
-              }, timeoutMs);
-            }),
-          ]);
-        } catch {
-          // handled below
-        }
-        if (timer) clearTimeout(timer);
-        const idleState = classifyIdleState(timedOut, idleError);
-        if (idleState === "timeout") {
-          ctx.ui.notify(`Iteration ${i} timed out after ${fm.timeout}s, stopping loop`, "warning");
+        case "no-progress-exhaustion":
+          ctx.ui.notify(`Ralph loop exhausted without verified progress: ${result.iterations.length} iterations, ${total}s total`, "warning");
           break;
-        }
-        if (idleState === "error") {
-          ctx.ui.notify(`Iteration ${i} agent error: ${idleError!.message}, stopping loop`, "error");
+        case "stopped":
+          ctx.ui.notify(`Ralph loop stopped: ${result.iterations.length} iterations, ${total}s total`, "info");
           break;
-        }
-        const elapsed = Math.round((Date.now() - iterStart) / 1000);
-        loopState.iterationSummaries.push({ iteration: i, duration: elapsed });
-        pi.appendEntry("ralph-iteration", { iteration: i, duration: elapsed, ralphPath: loopState.ralphPath });
-        const persistedAfter = readPersistedLoopState(ctx);
-        if (persistedAfter?.active && persistedAfter.stopRequested) {
-          loopState.stopRequested = true;
-          ctx.ui.notify("Ralph loop stopping after current iteration…", "info");
+        case "timeout":
+          ctx.ui.notify(`Ralph loop stopped after a timeout: ${result.iterations.length} iterations, ${total}s total`, "warning");
+          break;
+        case "error":
+          ctx.ui.notify(`Ralph loop failed: ${result.iterations.length} iterations, ${total}s total`, "error");
+          break;
+        default:
+          ctx.ui.notify(`Ralph loop ended: ${result.status} (${total}s total)`, "info");
           break;
-        }
-        if (fm.completionPromise) {
-          const entries = ctx.sessionManager.getEntries();
-          for (const entry of entries) {
-            if (entry.type === "message" && entry.message?.role === "assistant") {
-              const text = entry.message.content?.filter((b: any) => b.type === "text")?.map((b: any) => b.text)?.join("") ?? "";
-              if (shouldStopForCompletionPromise(text, fm.completionPromise)) {
-                ctx.ui.notify(`Completion promise matched on iteration ${i}`, "info");
-                break iterationLoop;
-              }
-            }
-          }
-        }
-        ctx.ui.notify(`Iteration ${i} complete (${elapsed}s)`, "info");
       }
-      const total = loopState.iterationSummaries.reduce((a, s) => a + s.duration, 0);
-      ctx.ui.notify(`Ralph loop done: ${loopState.iteration} iterations, ${total}s total`, "info");
     } catch (err) {
       const message = err instanceof Error ? err.message : String(err);
       ctx.ui.notify(`Ralph loop failed: ${message}`, "error");
     } finally {
       failCounts.clear();
+      pendingIterations.clear();
       loopState.active = false;
       loopState.stopRequested = false;
-      loopState.loopSessionFile = undefined;
+      loopState.loopToken = undefined;
       ctx.ui.setStatus("ralph", undefined);
-      persistLoopState(pi, { active: false });
+      persistLoopState(pi, toPersistedLoopState(loopState, { active: false, stopRequested: false }));
     }
   }
-  async function handleDraftCommand(commandName: "ralph" | "ralph-draft", args: string, ctx: any): Promise<string | undefined> {
+  let runtimeArgsForStart: RuntimeArgs = {};
+  async function handleDraftCommand(commandName: "ralph" | "ralph-draft", args: string, ctx: CommandContext): Promise<string | undefined> {
     const parsed = parseCommandArgs(args);
+    if (parsed.error) {
+      ctx.ui.notify(parsed.error, "error");
+      return undefined;
+    }
+    const runtimeArgsResult = runtimeArgEntriesToMap(parsed.runtimeArgs);
+    if (runtimeArgsResult.error) {
+      ctx.ui.notify(runtimeArgsResult.error, "error");
+      return undefined;
+    }
+    const runtimeArgs = runtimeArgsResult.runtimeArgs;
+    if (parsed.runtimeArgs.length > 0 && (commandName === "ralph-draft" || parsed.mode !== "path")) {
+      ctx.ui.notify("--arg is only supported with /ralph --path", "error");
+      return undefined;
+    }
+    runtimeArgsForStart = runtimeArgs;
+    const draftRuntime = getDraftStrengtheningRuntime(ctx);
     const resolveTaskForFolder = async (target: DraftTarget): Promise<string | undefined> => {
       const task = await promptForTask(ctx, "What should Ralph work on in this folder?", "reverse engineer this app");
       if (!task) return undefined;
-      return draftFromTask(commandName, task, target, ctx);
+      return draftFromTask(commandName, task, target, ctx, draftPlanFactory, draftRuntime);
     };
-    const handleExistingInspection = async (input: string, explicitPath = false): Promise<string | undefined> => {
+    const handleExistingInspection = async (input: string, explicitPath = false, runtimeArgsProvided = false): Promise<string | undefined> => {
       const inspection = inspectExistingTarget(input, ctx.cwd, explicitPath);
+      if (runtimeArgsProvided && inspection.kind !== "run") {
+        ctx.ui.notify("--arg is only supported with /ralph --path to an existing RALPH.md", "error");
+        return undefined;
+      }
       switch (inspection.kind) {
         case "run":
           if (commandName === "ralph") return inspection.ralphPath;
@@ -466,14 +1232,14 @@ export default function (pi: ExtensionAPI) {
         }
         planned = { kind: "draft", target: decision.target! };
       }
-      return draftFromTask(commandName, task, planned.target, ctx);
+      return draftFromTask(commandName, task, planned.target, ctx, draftPlanFactory, draftRuntime);
     };
     if (parsed.mode === "task") {
       return handleTaskFlow(parsed.value);
     }
     if (parsed.mode === "path") {
-      return handleExistingInspection(parsed.value || ".", true);
+      return handleExistingInspection(parsed.value || ".", true, parsed.runtimeArgs.length > 0);
     }
     if (!parsed.value) {
       const inspection = inspectExistingTarget(".", ctx.cwd);
@@ -491,49 +1257,107 @@ export default function (pi: ExtensionAPI) {
     return handleExistingInspection(parsed.value);
   }
-  pi.on("tool_call", async (event: any, ctx: any) => {
-    if (!isLoopSession(ctx)) return;
-    const persisted = readPersistedLoopState(ctx);
+  pi.on("tool_call", async (event: ToolEvent, ctx: EventContext) => {
+    const persisted = resolveActiveLoopState(ctx);
     if (!persisted) return;
+    if (persisted.envMalformed && (event.toolName === "bash" || event.toolName === "write" || event.toolName === "edit")) {
+      return { block: true, reason: "ralph: invalid loop contract" };
+    }
     if (event.toolName === "bash") {
       const cmd = (event.input as { command?: string }).command ?? "";
       const blockedPattern = findBlockedCommandPattern(cmd, persisted.guardrails?.blockCommands ?? []);
-      if (blockedPattern) return { block: true, reason: `ralph: blocked (${blockedPattern})` };
+      if (blockedPattern) {
+        appendLoopProofEntry("ralph-blocked-command", {
+          loopToken: persisted.loopToken,
+          iteration: persisted.iteration,
+          command: cmd,
+          blockedPattern,
+        });
+        return { block: true, reason: `ralph: blocked (${blockedPattern})` };
+      }
     }
     if (event.toolName === "write" || event.toolName === "edit") {
       const filePath = (event.input as { path?: string }).path ?? "";
-      for (const glob of persisted.guardrails?.protectedFiles ?? []) {
-        if (minimatch(filePath, glob, { matchBase: true })) return { block: true, reason: `ralph: ${filePath} is protected` };
+      if (matchesProtectedPath(filePath, persisted.guardrails?.protectedFiles ?? [], persisted.cwd)) {
+        appendLoopProofEntry("ralph-blocked-write", {
+          loopToken: persisted.loopToken,
+          iteration: persisted.iteration,
+          toolName: event.toolName,
+          path: filePath,
+          reason: `ralph: ${filePath} is protected`,
+        });
+        return { block: true, reason: `ralph: ${filePath} is protected` };
       }
     }
+    recordPendingToolPath(ctx, event);
   });
-  pi.on("before_agent_start", async (event: any, ctx: any) => {
-    if (!isLoopSession(ctx)) return;
-    const persisted = readPersistedLoopState(ctx);
+  pi.on("tool_execution_start", async (event: ToolEvent, ctx: EventContext) => {
+    recordPendingToolPath(ctx, event);
+  });
+  pi.on("tool_execution_end", async (event: ToolEvent, ctx: EventContext) => {
+    recordSuccessfulTaskDirWrite(ctx, event);
+  });
+  pi.on("agent_end", async (event: AgentEndEvent, ctx: EventContext) => {
+    resolvePendingIteration(ctx, event);
+  });
+  pi.on("before_agent_start", async (event: BeforeAgentStartEvent, ctx: EventContext) => {
+    const persisted = resolveActiveLoopState(ctx);
+    if (!persisted) return;
     const summaries = persisted?.iterationSummaries ?? [];
     if (summaries.length === 0) return;
-    const history = summaries.map((s) => `- Iteration ${s.iteration}: ${s.duration}s`).join("\n");
+    const history = summaries
+      .map((summary) => {
+        const status = summarizeIterationProgress(summary);
+        return `- Iteration ${summary.iteration}: ${summary.duration}s — ${status}; no-progress streak: ${summary.noProgressStreak ?? persisted?.noProgressStreak ?? 0}`;
+      })
+      .join("\n");
+    const lastSummary = summaries[summaries.length - 1];
+    const lastFeedback = summarizeLastIterationFeedback(lastSummary, persisted?.noProgressStreak ?? 0);
+    const taskDirLabel = persisted?.taskDir ? displayPath(persisted.cwd ?? persisted.taskDir, persisted.taskDir) : "the Ralph task directory";
+    appendLoopProofEntry("ralph-steering-injected", {
+      loopToken: persisted?.loopToken,
+      iteration: persisted?.iteration,
+      maxIterations: persisted?.maxIterations,
+      taskDir: taskDirLabel,
+    });
+    appendLoopProofEntry("ralph-loop-context-injected", {
+      loopToken: persisted?.loopToken,
+      iteration: persisted?.iteration,
+      maxIterations: persisted?.maxIterations,
+      taskDir: taskDirLabel,
+      summaryCount: summaries.length,
+    });
     return {
       systemPrompt:
         event.systemPrompt +
-        `\n\n## Ralph Loop Context\nIteration ${persisted?.iteration ?? 0}/${persisted?.maxIterations ?? 0}\n\nPrevious iterations:\n${history}\n\nDo not repeat completed work. Check git log for recent changes.`,
+        `\n\n## Ralph Loop Context\nIteration ${persisted?.iteration ?? 0}/${persisted?.maxIterations ?? 0}\nTask directory: ${taskDirLabel}\n\nPrevious iterations:\n${history}\n\n${lastFeedback}\nPersist findings to files in the Ralph task directory. Do not only report them in chat. If you make progress this iteration, leave durable file changes and mention the changed paths.\nDo not repeat completed work. Check git log for recent changes.`,
     };
   });
-  pi.on("tool_result", async (event: any, ctx: any) => {
-    if (!isLoopSession(ctx) || event.toolName !== "bash") return;
-    const output = event.content.map((c: { type: string; text?: string }) => (c.type === "text" ? c.text ?? "" : "")).join("");
+  pi.on("tool_result", async (event: ToolResultEvent, ctx: EventContext) => {
+    const persisted = resolveActiveLoopState(ctx);
+    if (!persisted) return;
+    if (event.toolName !== "bash") return;
+    const output = event.content.map((c) => (c.type === "text" ? c.text ?? "" : "")).join("");
     if (!shouldWarnForBashFailure(output)) return;
-    const sessionFile = ctx.sessionManager.getSessionFile();
-    if (!sessionFile) return;
+    const state = resolveActiveIterationState(ctx);
+    if (!state) return;
-    const next = (failCounts.get(sessionFile) ?? 0) + 1;
-    failCounts.set(sessionFile, next);
+    const failKey = getLoopIterationKey(state.loopToken, state.iteration);
+    const next = (failCounts.get(failKey) ?? 0) + 1;
+    failCounts.set(failKey, next);
     if (next >= 3) {
       return {
         content: [
@@ -546,7 +1370,7 @@ export default function (pi: ExtensionAPI) {
   pi.registerCommand("ralph", {
     description: "Start Ralph from a task folder or RALPH.md",
-    handler: async (args: string, ctx: any) => {
+    handler: async (args: string, ctx: CommandContext) => {
       if (loopState.active) {
         ctx.ui.notify("A ralph loop is already running. Use /ralph-stop first.", "warning");
         return;
@@ -554,33 +1378,106 @@ export default function (pi: ExtensionAPI) {
       const ralphPath = await handleDraftCommand("ralph", args ?? "", ctx);
       if (!ralphPath) return;
-      await startRalphLoop(ralphPath, ctx);
+      await startRalphLoop(ralphPath, ctx, services.runRalphLoopFn, runtimeArgsForStart);
     },
   });
   pi.registerCommand("ralph-draft", {
     description: "Draft a Ralph task without starting it",
-    handler: async (args: string, ctx: any) => {
+    handler: async (args: string, ctx: CommandContext) => {
       await handleDraftCommand("ralph-draft", args ?? "", ctx);
     },
   });
   pi.registerCommand("ralph-stop", {
     description: "Stop the ralph loop after the current iteration",
-    handler: async (_args: string, ctx: any) => {
-      const persisted = readPersistedLoopState(ctx);
-      if (!persisted?.active) {
-        if (!loopState.active) {
-          ctx.ui.notify("No active ralph loop", "warning");
+    handler: async (args: string, ctx: CommandContext) => {
+      const parsed = parseCommandArgs(args ?? "");
+      if (parsed.error) {
+        ctx.ui.notify(parsed.error, "error");
+        return;
+      }
+      if (parsed.mode === "task") {
+        ctx.ui.notify("/ralph-stop expects a task folder or RALPH.md path, not task text.", "error");
+        return;
+      }
+      const now = new Date().toISOString();
+      const activeRegistryEntries = () => listActiveLoopRegistryEntries(ctx.cwd);
+      const { target: sessionTarget, persistedSessionState } = resolveSessionStopTarget(ctx, now);
+      if (sessionTarget && !parsed.value) {
+        applyStopTarget(pi, ctx, sessionTarget, now, persistedSessionState);
+        return;
+      }
+      if (parsed.value) {
+        const inspection = inspectExistingTarget(parsed.value, ctx.cwd, true);
+        if (inspection.kind !== "run") {
+          if (inspection.kind === "invalid-markdown") {
+            ctx.ui.notify(`Only task folders or RALPH.md can be stopped directly. ${displayPath(ctx.cwd, inspection.path)} is not stoppable.`, "error");
+            return;
+          }
+          if (inspection.kind === "invalid-target") {
+            ctx.ui.notify(`Only task folders or RALPH.md can be stopped directly. ${displayPath(ctx.cwd, inspection.path)} is a file, not a task folder.`, "error");
+            return;
+          }
+          if (inspection.kind === "dir-without-ralph" || inspection.kind === "missing-path") {
+            ctx.ui.notify(`No active ralph loop found at ${displayPath(ctx.cwd, inspection.dirPath)}.`, "warning");
+            return;
+          }
+          ctx.ui.notify("/ralph-stop expects a task folder or RALPH.md path.", "error");
+          return;
+        }
+        const taskDir = dirname(inspection.ralphPath);
+        if (sessionTarget && sessionTarget.taskDir === taskDir) {
+          applyStopTarget(pi, ctx, sessionTarget, now, persistedSessionState);
+          return;
+        }
+        const registryTarget = activeRegistryEntries().find((entry) => entry.taskDir === taskDir || entry.ralphPath === inspection.ralphPath);
+        if (registryTarget) {
+          applyStopTarget(pi, ctx, materializeRegistryStopTarget(registryTarget), now);
           return;
         }
-        loopState.stopRequested = true;
-        ctx.ui.notify("Ralph loop stopping after current iteration…", "info");
+        const statusFile = readStatusFile(taskDir);
+        if (
+          statusFile &&
+          (statusFile.status === "running" || statusFile.status === "initializing") &&
+          typeof statusFile.cwd === "string" &&
+          statusFile.cwd.length > 0
+        ) {
+          const statusRegistryTarget = listActiveLoopRegistryEntries(statusFile.cwd).find(
+            (entry) => entry.taskDir === taskDir && entry.loopToken === statusFile.loopToken,
+          );
+          if (statusRegistryTarget) {
+            applyStopTarget(pi, ctx, materializeRegistryStopTarget(statusRegistryTarget), now);
+            return;
+          }
+        }
+        ctx.ui.notify(`No active ralph loop found at ${displayPath(ctx.cwd, inspection.ralphPath)}.`, "warning");
         return;
       }
-      loopState.stopRequested = true;
-      persistLoopState(pi, { ...persisted, stopRequested: true });
-      ctx.ui.notify("Ralph loop stopping after current iteration…", "info");
+      if (sessionTarget) {
+        applyStopTarget(pi, ctx, sessionTarget, now, persistedSessionState);
+        return;
+      }
+      const activeEntries = activeRegistryEntries();
+      if (activeEntries.length === 0) {
+        ctx.ui.notify("No active ralph loops found.", "warning");
+        return;
+      }
+      if (activeEntries.length > 1) {
+        ctx.ui.notify("Multiple active ralph loops found. Use /ralph-stop --path <task folder or RALPH.md> for an explicit target path.", "error");
+        return;
+      }
+      applyStopTarget(pi, ctx, materializeRegistryStopTarget(activeEntries[0]), now);
     },
   });
 }