npm - @polderlabs/bizar-plugin - Versions diffs - 0.5.4 - Mend

@polderlabs/bizar-plugin 0.5.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (60) hide show

package/LICENSE +21 -0
package/README.md +448 -0
package/bun.lock +88 -0
package/index.ts +1113 -0
package/package.json +42 -0
package/scripts/check-forbidden-imports.sh +33 -0
package/src/background-state.ts +463 -0
package/src/background.ts +964 -0
package/src/commands-impl.ts +369 -0
package/src/commands.ts +880 -0
package/src/event-stream.ts +574 -0
package/src/fingerprint.ts +120 -0
package/src/handoff.ts +79 -0
package/src/http-client.ts +467 -0
package/src/logger.ts +144 -0
package/src/loop.ts +176 -0
package/src/options.ts +421 -0
package/src/plan-fs.ts +323 -0
package/src/report.ts +178 -0
package/src/research-prompt.ts +35 -0
package/src/serve.ts +476 -0
package/src/settings.ts +349 -0
package/src/state.ts +298 -0
package/src/tools/bg-collect.ts +104 -0
package/src/tools/bg-get-comments.ts +239 -0
package/src/tools/bg-kill.ts +87 -0
package/src/tools/bg-spawn.ts +263 -0
package/src/tools/bg-status.ts +99 -0
package/src/tools/plan-action.ts +767 -0
package/src/tools/wait-for-feedback.ts +402 -0
package/tests/attach-handler-bug.test.ts +166 -0
package/tests/background-state.test.ts +277 -0
package/tests/background.test.ts +402 -0
package/tests/block.test.ts +193 -0
package/tests/canonical-key-order.test.ts +71 -0
package/tests/commands-impl.test.ts +442 -0
package/tests/commands.test.ts +548 -0
package/tests/config.test.ts +122 -0
package/tests/dispose.test.ts +336 -0
package/tests/event-stream.test.ts +409 -0
package/tests/event.test.ts +262 -0
package/tests/fingerprint.test.ts +161 -0
package/tests/http-client.test.ts +403 -0
package/tests/init-helpers.test.ts +203 -0
package/tests/integration/slash-command.test.ts +348 -0
package/tests/integration/tool-routing.test.ts +314 -0
package/tests/loop.test.ts +397 -0
package/tests/options.test.ts +274 -0
package/tests/serve.test.ts +335 -0
package/tests/settings.test.ts +351 -0
package/tests/stall-think.test.ts +749 -0
package/tests/state.test.ts +275 -0
package/tests/tools/bg-collect.test.ts +337 -0
package/tests/tools/bg-get-comments.test.ts +485 -0
package/tests/tools/bg-kill.test.ts +231 -0
package/tests/tools/bg-spawn.test.ts +311 -0
package/tests/tools/bg-status.test.ts +216 -0
package/tests/tools/plan-action.test.ts +599 -0
package/tests/tools/wait-for-feedback.test.ts +390 -0
package/tsconfig.json +29 -0

package/src/tools/wait-for-feedback.ts ADDED Viewed

@@ -0,0 +1,402 @@
+/**
+ * wait-for-feedback.ts
+ *
+ * `bizar_wait_for_feedback` tool (v0.4.0).
+ *
+ * Blocks the agent's turn until one of the following happens:
+ *   1. A new comment is added to the plan canvas (filtered by
+ *      `sinceTimestamp` if provided).
+ *   2. `meta.json.status` becomes "approved" or "rejected".
+ *   3. `timeoutMs` is reached.
+ *
+ * Implementation:
+ *   - Polls every 2 seconds via `setTimeout`. NOT a busy loop.
+ *   - Each tick reads `plan.json` and `meta.json` from disk.
+ *   - Returns immediately on success; on timeout returns
+ *     `status: "timed_out"`.
+ *
+ * The tool never throws. All errors return a structured result.
+ *
+ * Companion tools:
+ *   - `bizar_plan_action` — CRUD on the canvas (add comments, etc.)
+ *   - `bizar_get_plan_comments` — read-only access to comments
+ *
+ * v0.4.0 MVP — this is the polling version. A future v0.5.0 will
+ * switch to SSE-based push notifications from the plan server.
+ */
+import { tool } from "@opencode-ai/plugin";
+import { z } from "zod";
+import { existsSync, readFileSync } from "node:fs";
+import { join } from "node:path";
+import type { Logger } from "../logger.js";
+// --- On-disk shapes (subset) ---------------------------------------------
+/**
+ * A single comment as it appears in the `comments` array of `plan.json`.
+ * Every field is optional because the file is parsed without schema
+ * validation; the index signature tolerates extra keys.
+ */
+interface PlanComment {
+  id?: string;
+  elementId?: string | null;
+  author?: string;
+  text?: string;
+  /** Creation timestamp string; used to order and filter comments. */
+  created?: string;
+  thread?: Array<{ id?: string; author?: string; created?: string }>;
+  [key: string]: unknown;
+}
+/** Parsed `plan.json`. This tool reads only `comments` from it. */
+interface PlanCanvas {
+  schemaVersion?: number;
+  elements?: unknown[];
+  connections?: unknown[];
+  comments?: PlanComment[];
+  [key: string]: unknown;
+}
+/** Parsed `meta.json`. This tool reads only `status` from it. */
+interface PlanMeta {
+  status?: string;
+  [key: string]: unknown;
+}
+// --- Constants -----------------------------------------------------------
+/** Delay between polls, in milliseconds. Two seconds keeps the UX snappy
+ *  while limiting disk reads to about five per ten-second window. */
+const POLL_INTERVAL_MS = 2 * 1_000;
+/** Bounds and default for the caller-supplied timeout, per spec:
+ *  5 s minimum, 30 min maximum, 10 min default. */
+const TIMEOUT_MIN_MS = 5 * 1_000;
+const TIMEOUT_MAX_MS = 30 * 60 * 1_000;
+const TIMEOUT_DEFAULT_MS = 10 * 60 * 1_000;
+/** Slug rule for plan names; the tool's zod schema applies the same pattern. */
+const SLUG_REGEX = /^[a-z0-9][a-z0-9-]{0,63}$/;
+// --- Return type ---------------------------------------------------------
+/** Why a successful wait ended. */
+export type WaitOutcome =
+  | "feedback_received"
+  | "approved"
+  | "rejected"
+  | "timed_out";
+/** Plan statuses this tool recognises in `meta.json`. */
+export type PlanStatusOutcome =
+  | "draft"
+  | "approved"
+  | "rejected"
+  | "in-progress"
+  | "done";
+/** Result of a wait that ran to an outcome (including a timeout). */
+export interface WaitResult {
+  ok: true;
+  status: WaitOutcome;
+  planSlug: string;
+  /** Normalised `meta.json` status observed when the wait ended. */
+  planStatus: PlanStatusOutcome;
+  /** Comments reported with this result; empty for approved/rejected exits. */
+  newComments: PlanComment[];
+  /** Milliseconds between the start of the call and the result. */
+  waitedMs: number;
+}
+/** Result of a wait that could not run (e.g. bad slug, missing plan). */
+export interface WaitError {
+  ok: false;
+  status: "error";
+  planSlug: string;
+  /** Human-readable description of what went wrong. */
+  error: string;
+  waitedMs: number;
+}
+/** Everything `waitForFeedback` can return; discriminate on `ok`. */
+export type WaitForFeedbackResult = WaitResult | WaitError;
+// --- Pure core: waitForFeedback ------------------------------------------
+/** Caller-supplied arguments for one wait. */
+export interface WaitForFeedbackArgs {
+  /** Plan directory name under `<worktree>/plans/`. */
+  planSlug: string;
+  /** Maximum wait in milliseconds; clamped to the allowed range. */
+  timeoutMs?: number;
+  /** Only comments created after this timestamp count as feedback. */
+  sinceTimestamp?: string;
+}
+/** Environment and test seams injected into `waitForFeedback`. */
+export interface WaitForFeedbackDeps {
+  /** Root directory that contains the `plans/` folder. */
+  worktree: string;
+  logger: Logger;
+  /**
+   * Override the polling interval. Tests pass a small value (e.g. 5ms)
+   * to keep the suite fast. Defaults to POLL_INTERVAL_MS.
+   */
+  pollIntervalMs?: number;
+  /**
+   * Override the sleep function (tests use this). Defaults to a Promise
+   * wrapper around the global setTimeout.
+   */
+  sleep?: (ms: number) => Promise<void>;
+  /** Override the current-time source (tests). Defaults to Date.now. */
+  now?: () => number;
+}
+/**
+ * Resolve the caller's timeout to a whole number of milliseconds inside
+ * the allowed range. An omitted value yields the default; a non-finite
+ * or too-small value yields the minimum; a too-large value the maximum.
+ */
+function clampTimeout(raw: number | undefined): number {
+  if (raw === undefined) {
+    return TIMEOUT_DEFAULT_MS;
+  }
+  const unusable = !Number.isFinite(raw) || raw < TIMEOUT_MIN_MS;
+  if (unusable) {
+    return TIMEOUT_MIN_MS;
+  }
+  return raw > TIMEOUT_MAX_MS ? TIMEOUT_MAX_MS : Math.floor(raw);
+}
+/** Timer-based sleep: the returned promise resolves after `ms` milliseconds. */
+function defaultSleep(ms: number): Promise<void> {
+  return new Promise<void>((wake) => {
+    setTimeout(wake, ms);
+  });
+}
+/**
+ * Read a JSON file and return its content only when it is a JSON object.
+ *
+ * Returns null when the file is missing or unreadable, when the text is
+ * not valid JSON, or when the top-level value is null, an array, or a
+ * primitive. There is no separate existence check: a missing file makes
+ * `readFileSync` throw, and the catch below covers it.
+ */
+function readJsonObject<T extends object>(filePath: string): T | null {
+  try {
+    const parsed: unknown = JSON.parse(readFileSync(filePath, "utf-8"));
+    const isObject =
+      parsed !== null && typeof parsed === "object" && !Array.isArray(parsed);
+    return isObject ? (parsed as T) : null;
+  } catch {
+    // Deliberate best-effort: callers poll again, so any failure is "no data yet".
+    return null;
+  }
+}
+/**
+ * Read the plan.json from disk. Returns null on missing/corrupt.
+ */
+function readCanvas(planPath: string): PlanCanvas | null {
+  return readJsonObject<PlanCanvas>(planPath);
+}
+/**
+ * Read meta.json. Returns null on missing/corrupt.
+ */
+function readMeta(metaPath: string): PlanMeta | null {
+  return readJsonObject<PlanMeta>(metaPath);
+}
+/** Only strings that start like an ISO 8601 date-time are parsed as dates;
+ *  other inputs would hit `Date.parse`'s implementation-defined fallback. */
+const ISO_DATETIME_PREFIX = /^\d{4}-\d{2}-\d{2}T/;
+/** Convert an ISO 8601 date-time string to epoch milliseconds, or null
+ *  when the text is not an ISO date-time or does not parse. */
+function toEpochMs(text: string): number | null {
+  if (!ISO_DATETIME_PREFIX.test(text)) return null;
+  const ms = Date.parse(text);
+  return Number.isNaN(ms) ? null : ms;
+}
+/**
+ * Sort comments oldest-first by `created`, without mutating the input.
+ *
+ * Ordering has three tiers so the comparison stays a consistent total
+ * order: parseable ISO timestamps first (compared by instant, so differing
+ * precision or UTC offsets do not misorder them), then other non-empty
+ * values (compared by code unit, independent of locale), then comments
+ * with no timestamp.
+ */
+function sortByCreated(comments: PlanComment[]): PlanComment[] {
+  const keyed = comments.map((comment) => {
+    const text = String(comment.created ?? "");
+    return { comment, text, ms: toEpochMs(text) };
+  });
+  keyed.sort((a, b) => {
+    if (a.text === b.text) return 0;
+    if (a.text === "") return 1;
+    if (b.text === "") return -1;
+    if (a.ms !== null && b.ms !== null) return a.ms - b.ms;
+    if (a.ms !== null) return -1;
+    if (b.ms !== null) return 1;
+    return a.text < b.text ? -1 : 1;
+  });
+  return keyed.map((entry) => entry.comment);
+}
+/**
+ * Keep only comments created strictly after `sinceTimestamp`.
+ *
+ * If `sinceTimestamp` is undefined or empty, the input array is returned
+ * as-is. When both the cutoff and a comment's `created` are parseable ISO
+ * timestamps they are compared as instants; otherwise the comparison
+ * falls back to plain string ordering. Comments without `created` are
+ * never counted as new.
+ */
+function filterNewComments(
+  comments: PlanComment[],
+  sinceTimestamp: string | undefined,
+): PlanComment[] {
+  if (sinceTimestamp === undefined || sinceTimestamp === "") {
+    return comments;
+  }
+  const sinceMs = toEpochMs(sinceTimestamp);
+  return comments.filter((c) => {
+    const created = String(c.created ?? "");
+    if (created === "") return false;
+    const createdMs = sinceMs === null ? null : toEpochMs(created);
+    if (sinceMs !== null && createdMs !== null) {
+      return createdMs > sinceMs;
+    }
+    return created > sinceTimestamp;
+  });
+}
+/**
+ * Coerce the raw `meta.json` status into a recognised plan status.
+ * Anything other than the five known values, including a missing
+ * status, is reported as "draft".
+ */
+function normalizeStatus(raw: string | undefined): PlanStatusOutcome {
+  switch (raw) {
+    case "draft":
+    case "approved":
+    case "rejected":
+    case "in-progress":
+    case "done":
+      return raw;
+    default:
+      return "draft";
+  }
+}
+/**
+ * Poll the plan until feedback arrives, the status becomes approved or
+ * rejected, or the timeout is reached. Kept separate from the tool factory
+ * so tests can drive the same code path with a tiny `pollIntervalMs`, an
+ * injectable `sleep`, and an injectable clock.
+ *
+ * The plan is checked once immediately, again after every poll interval,
+ * and one final time once the deadline has passed. The final check means a
+ * comment or approval that lands during the last sleep is reported as its
+ * real outcome; `timed_out` is returned only when nothing changed, so a
+ * timed-out result always carries an empty `newComments`.
+ *
+ * @param deps - Worktree root, logger, and optional test overrides.
+ * @param args - Plan slug, optional timeout (clamped), optional cutoff.
+ * @returns A structured result. An invalid slug or a plan with neither
+ *   `plan.json` nor `meta.json` is returned as `ok: false`, not thrown.
+ */
+export async function waitForFeedback(
+  deps: WaitForFeedbackDeps,
+  args: WaitForFeedbackArgs,
+): Promise<WaitForFeedbackResult> {
+  const now = deps.now ?? Date.now;
+  const start = now();
+  const sleep = deps.sleep ?? defaultSleep;
+  const pollInterval = deps.pollIntervalMs ?? POLL_INTERVAL_MS;
+  if (!SLUG_REGEX.test(args.planSlug)) {
+    return {
+      ok: false,
+      status: "error",
+      planSlug: args.planSlug,
+      error: `Invalid planSlug: "${args.planSlug}". Must match ^[a-z0-9][a-z0-9-]{0,63}$.`,
+      waitedMs: 0,
+    };
+  }
+  const timeoutMs = clampTimeout(args.timeoutMs);
+  const planDir = join(deps.worktree, "plans", args.planSlug);
+  const planPath = join(planDir, "plan.json");
+  const metaPath = join(planDir, "meta.json");
+  // If the plan doesn't even exist, that's an error (the agent shouldn't
+  // wait for feedback on a nonexistent plan).
+  if (!existsSync(planPath) && !existsSync(metaPath)) {
+    return {
+      ok: false,
+      status: "error",
+      planSlug: args.planSlug,
+      error: `Plan not found: ${args.planSlug}`,
+      waitedMs: 0,
+    };
+  }
+  // Status seen by the most recent poll; reported if the wait times out.
+  let lastStatus: PlanStatusOutcome = "draft";
+  // One poll: read both files and evaluate the exit conditions.
+  // Returns the final result when a condition is met, otherwise null.
+  function poll(): WaitForFeedbackResult | null {
+    const meta = readMeta(metaPath);
+    const canvas = readCanvas(planPath);
+    const status = normalizeStatus(meta?.status);
+    lastStatus = status;
+    // Status-driven exit takes priority over comments.
+    if (status === "approved" || status === "rejected") {
+      return {
+        ok: true,
+        status,
+        planSlug: args.planSlug,
+        planStatus: status,
+        newComments: [],
+        waitedMs: now() - start,
+      };
+    }
+    // Comment-driven exit. A missing/corrupt plan.json counts as no comments.
+    const stored = canvas?.comments;
+    const all = Array.isArray(stored) ? stored : [];
+    const newOnes = sortByCreated(filterNewComments(all, args.sinceTimestamp));
+    if (newOnes.length === 0) return null;
+    return {
+      ok: true,
+      status: "feedback_received",
+      planSlug: args.planSlug,
+      planStatus: status,
+      newComments: newOnes,
+      waitedMs: now() - start,
+    };
+  }
+  // First poll — gives us immediate feedback if it's already there.
+  const first = poll();
+  if (first !== null) return first;
+  // Sleep between polls (never a busy loop). Each sleep is capped at the
+  // time remaining so the wait does not overshoot the deadline by much.
+  const deadline = start + timeoutMs;
+  while (now() < deadline) {
+    const remaining = deadline - now();
+    const waitMs = Math.max(0, Math.min(pollInterval, remaining));
+    if (waitMs === 0) break;
+    await sleep(waitMs);
+    if (now() >= deadline) break;
+    const result = poll();
+    if (result !== null) return result;
+  }
+  // Deadline reached. Poll one last time so a change that arrived during
+  // the final sleep is classified correctly rather than as a timeout.
+  const last = poll();
+  if (last !== null) return last;
+  return {
+    ok: true,
+    status: "timed_out",
+    planSlug: args.planSlug,
+    planStatus: lastStatus,
+    newComments: [],
+    waitedMs: now() - start,
+  };
+}
+// --- Zod schema + tool factory ------------------------------------------
+/**
+ * Build the `bizar_wait_for_feedback` tool. The plugin wires the result
+ * into `Hooks.tool`. The `deps` closure carries the worktree and logger.
+ *
+ * The tool validates its arguments with zod, delegates to
+ * `waitForFeedback`, and returns the result serialised as JSON in
+ * `output`. Any unexpected exception is logged as a warning and returned
+ * as an `ok: false` payload, so the tool itself does not throw.
+ */
+export function createWaitForFeedbackTool(deps: WaitForFeedbackDeps) {
+  return tool({
+    description:
+      "Block until the user provides feedback on a plan, approves it, " +
+      "rejects it, or the timeout is reached. Polls every 2 seconds. " +
+      "Use this after calling `bizar_plan_action` to add a comment or " +
+      "present the plan for approval. Returns when feedback arrives, " +
+      "when meta.json.status changes to approved/rejected, or on timeout. " +
+      "Never throws. Available to all agents (heavy poll — Odin preferred).",
+    args: {
+      // Same pattern as SLUG_REGEX, repeated here as a literal.
+      planSlug: z
+        .string()
+        .min(1)
+        .max(64)
+        .regex(/^[a-z0-9][a-z0-9-]{0,63}$/, "Must match ^[a-z0-9][a-z0-9-]{0,63}$")
+        .describe("The plan's slug (e.g. 'my-feature')."),
+      // Out-of-range values are rejected here; waitForFeedback also clamps.
+      timeoutMs: z
+        .number()
+        .int()
+        .positive()
+        .min(TIMEOUT_MIN_MS)
+        .max(TIMEOUT_MAX_MS)
+        .optional()
+        .describe(
+          `How long to wait, in milliseconds. Default ${TIMEOUT_DEFAULT_MS} (10 min). ` +
+            `Range [${TIMEOUT_MIN_MS}, ${TIMEOUT_MAX_MS}] (5 s..30 min).`,
+        ),
+      sinceTimestamp: z
+        .string()
+        .optional()
+        .describe(
+          "Optional ISO timestamp. Only comments with `created` strictly " +
+            "after this value count as feedback. If omitted, the first poll " +
+            "returns any existing non-empty comment set as feedback.",
+        ),
+    },
+    execute: async (rawArgs) => {
+      const args = rawArgs as WaitForFeedbackArgs;
+      try {
+        const result = await waitForFeedback(deps, args);
+        return { output: JSON.stringify(result) };
+      } catch (err: unknown) {
+        // Defensive: report an unexpected failure in the same shape as WaitError.
+        const msg = err instanceof Error ? err.message : String(err);
+        deps.logger.warn(`bizar: wait_for_feedback crashed: ${msg}`);
+        return {
+          output: JSON.stringify({
+            ok: false,
+            status: "error",
+            planSlug: args.planSlug,
+            error: `Internal error: ${msg}`,
+            waitedMs: 0,
+          }),
+        };
+      }
+    },
+  });
+}

package/tests/attach-handler-bug.test.ts ADDED Viewed

@@ -0,0 +1,166 @@
+/**
+ * attachEventHandler regression test (BUGFIX v0.5.1).
+ *
+ * BUG: InstanceManager.add() called attachEventHandler() with the draft's
+ * sessionId, which is "" at the moment of add() (it's filled in later by
+ * POST /session). EventStream.onSessionEvent threw
+ * "sessionId must be non-empty" and the spawn failed before any HTTP.
+ *
+ * FIX: add() no longer attaches. bg-spawn.ts calls attachEventHandler()
+ * AFTER POST /session returns the real sessionId.
+ *
+ * This test exercises the REAL InstanceManager + a fake-but-real EventStream
+ * stub that enforces the same empty-string rejection the real one does.
+ */
+import { describe, it, expect, beforeEach } from "bun:test";
+// --- Real InstanceManager (the one under test) ----------------------------
+// We import the real module. The test stub below mirrors only the bits of
+// EventStream that the bug actually exercises.
+// Use a tiny shim so we don't pull in serve.ts (which tries to spawn a child
+// process). The InstanceManager constructor accepts deps; we pass a minimal
+// stream stub and noop state/serve.
+/** Callback invoked with each event delivered for a session. */
+interface FakeStreamHandler {
+  (ev: { type: string; [k: string]: unknown }): void;
+}
+/**
+ * Minimal EventStream stand-in: a per-session handler registry that
+ * rejects an empty sessionId on subscribe, plus `applyEvent` so tests can
+ * push events to the registered handlers.
+ */
+class FakeEventStream {
+  private handlers = new Map<string, Set<FakeStreamHandler>>();
+  /**
+   * Register `handler` for `sessionId`.
+   *
+   * @returns An unsubscribe function; calling it more than once is harmless.
+   * @throws Error when `sessionId` is not a non-empty string.
+   */
+  onSessionEvent(sessionId: string, handler: FakeStreamHandler): () => void {
+    if (typeof sessionId !== "string" || sessionId.length === 0) {
+      throw new Error("EventStream.onSessionEvent: sessionId must be non-empty");
+    }
+    let set = this.handlers.get(sessionId);
+    if (!set) {
+      set = new Set();
+      this.handlers.set(sessionId, set);
+    }
+    set.add(handler);
+    return () => {
+      const s = this.handlers.get(sessionId);
+      if (!s) return;
+      s.delete(handler);
+      // Drop the empty set so the map does not accumulate dead session keys.
+      if (s.size === 0) this.handlers.delete(sessionId);
+    };
+  }
+  /** Deliver `ev` to every handler registered for `sessionId`; no-op if none. */
+  applyEvent(sessionId: string, ev: { type: string; [k: string]: unknown }): void {
+    const set = this.handlers.get(sessionId);
+    if (!set) return;
+    for (const h of set) h(ev);
+  }
+}
+/** Map-backed stand-in for the persistent state store, keyed by `instanceId`. */
+class InMemoryStateStore {
+  private records = new Map<string, unknown>();
+  /** Store `state` under its own `instanceId`, replacing any earlier entry. */
+  async save(state: unknown): Promise<void> {
+    const { instanceId } = state as { instanceId: string };
+    this.records.set(instanceId, state);
+  }
+  /** Return the stored state for `instanceId`, or null when there is none. */
+  async load(instanceId: string): Promise<unknown> {
+    const found = this.records.get(instanceId);
+    return found ?? null;
+  }
+  /** Remove the entry for `instanceId`; unknown ids are ignored. */
+  async delete(instanceId: string): Promise<void> {
+    this.records.delete(instanceId);
+  }
+  /** No-op for the in-memory store: always reports zero entries removed. */
+  async cleanup(_maxAgeDays: number, _validIds?: Set<string>): Promise<number> {
+    return 0;
+  }
+}
+// We import the real InstanceManager after the stubs are defined so the
+// test file fails fast if the real signature changes.
+import { InstanceManager } from "../src/background.ts";
+import type { BackgroundState } from "../src/background-state.ts";
+/**
+ * Build a pending background-state draft with a random `bgr_test_` id.
+ * `sessionId` defaults to the empty string, which is the state the draft
+ * is in when `add()` is called. Any field can be replaced via `overrides`.
+ */
+function makeDraft(overrides: Partial<BackgroundState> = {}): BackgroundState {
+  const randomSuffix = Math.random().toString(36).slice(2, 10);
+  const defaults: BackgroundState = {
+    instanceId: `bgr_test_${randomSuffix}`,
+    sessionId: "", // CRITICAL: add() is called with empty sessionId
+    agent: "mimir",
+    status: "pending",
+    startedAt: Date.now(),
+    model: "minimax/MiniMax-M3",
+    promptPreview: "test",
+    resultPreview: undefined,
+    resultMessageIds: [],
+    error: undefined,
+    parentAgent: "odin",
+    parentInstanceId: undefined,
+    logPath: "/tmp/test.log",
+    timeoutMs: 300_000,
+    toolCallCount: 0,
+    loopGuardTool: undefined,
+  };
+  return { ...defaults, ...overrides };
+}
+// Regression suite for the v0.5.1 fix: add() must not subscribe to the
+// event stream while the draft's sessionId is still empty.
+describe("InstanceManager.add — empty sessionId (BUGFIX v0.5.1)", () => {
+  let stream: FakeEventStream;
+  let stateStore: InMemoryStateStore;
+  let mgr: InstanceManager;
+  beforeEach(() => {
+    stream = new FakeEventStream();
+    stateStore = new InMemoryStateStore();
+    // The real InstanceManager constructor takes a complex dep object.
+    // We pass the minimum: stateStore, serve (a stub), stream, etc.
+    // Since the real ctor signature is tightly coupled, we use a cast.
+    mgr = new InstanceManager({
+      stateStore: stateStore as never,
+      maxConcurrent: 8,
+      toolCallCap: 250,
+      logger: {
+        debug: () => {},
+        info: () => {},
+        warn: () => {},
+        error: () => {},
+      } as never,
+      serve: { worktree: "/tmp" } as never,
+      http: {} as never,
+      stream: stream as never,
+      stallTimeoutMs: 180_000,
+      thinkingLoopTimeoutMs: 300_000,
+      maxInterventions: 1,
+    });
+  });
+  it("add() with empty sessionId does NOT throw (BUGFIX)", async () => {
+    // Before the fix: this threw "EventStream.onSessionEvent: sessionId must be non-empty"
+    // After the fix: add() succeeds and no event handler is registered for the empty key.
+    const draft = makeDraft();
+    const result = await mgr.add(draft);
+    expect(result).not.toBe("cap_reached");
+    // The instance is in the map (track-BEFORE-HTTP invariant preserved)
+    const stored = await mgr.get(draft.instanceId);
+    expect(stored).not.toBeNull();
+    expect(stored?.instanceId).toBe(draft.instanceId);
+  });
+  it("attachEventHandler() throws on empty sessionId (regression: same guard as upstream)", () => {
+    // This proves the upstream guard still works — bg-spawn.ts must
+    // call attachEventHandler() only AFTER sessionId is set.
+    const draft = makeDraft();
+    expect(() => mgr.attachEventHandler(draft)).toThrow(
+      /sessionId must be non-empty/,
+    );
+  });
+  it("attachEventHandler() succeeds when sessionId is non-empty, then receives events", async () => {
+    const draft = makeDraft({ sessionId: "sess_real_123" });
+    // Spy on the stream so the assertions reflect what the manager actually
+    // registered and what was actually delivered. The counter is bumped only
+    // when a handler registered through onSessionEvent is invoked.
+    let received = 0;
+    const registeredFor: string[] = [];
+    const realOnSessionEvent = stream.onSessionEvent.bind(stream);
+    stream.onSessionEvent = (sessionId, handler) => {
+      registeredFor.push(sessionId);
+      return realOnSessionEvent(sessionId, (ev) => {
+        received += 1;
+        handler(ev);
+      });
+    };
+    // Real sessionId — should NOT throw
+    mgr.attachEventHandler(draft);
+    mgr.attachEventHandler({ ...draft, instanceId: "bgr_other" });
+    expect(registeredFor).toContain("sess_real_123");
+    // And the event subscription should actually fire
+    stream.applyEvent("sess_real_123", { type: "message.part.updated" });
+    expect(received).toBeGreaterThanOrEqual(1);
+  });
+});