npm - @calltelemetry/openclaw-linear - Versions diffs - 0.8.0 → 0.8.2 - Mend

@calltelemetry/openclaw-linear 0.8.0 → 0.8.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (18) hide show

package/README.md +152 -34
package/openclaw.plugin.json +3 -2
package/package.json +1 -1
package/prompts.yaml +27 -1
package/src/agent/agent.test.ts +49 -0
package/src/agent/agent.ts +26 -1
package/src/infra/doctor.ts +2 -2
package/src/pipeline/e2e-planning.test.ts +77 -54
package/src/pipeline/intent-classify.test.ts +285 -0
package/src/pipeline/intent-classify.ts +259 -0
package/src/pipeline/planner.test.ts +159 -40
package/src/pipeline/planner.ts +98 -32
package/src/pipeline/webhook.ts +340 -376
package/src/tools/claude-tool.ts +6 -0
package/src/tools/code-tool.test.ts +3 -3
package/src/tools/code-tool.ts +2 -2
package/src/tools/planner-tools.test.ts +1 -1
package/src/tools/planner-tools.ts +10 -2

package/src/pipeline/intent-classify.ts ADDED Viewed

@@ -0,0 +1,259 @@
+/**
+ * intent-classify.ts — LLM-based intent classification for Linear comments.
+ *
+ * Replaces static regex pattern matching with a lightweight LLM classifier.
+ * Follows the tier-assess.ts pattern: runAgent() subprocess call, JSON parsing,
+ * regex fallback on any failure.
+ *
+ * Cost: one short agent turn (~300 tokens). Latency: ~2-5s.
+ */
+import { readFileSync } from "node:fs";
+import { join } from "node:path";
+import type { OpenClawPluginApi } from "openclaw/plugin-sdk";
+// ---------------------------------------------------------------------------
+// Types
+// ---------------------------------------------------------------------------
+export type Intent =
+  | "plan_start"
+  | "plan_finalize"
+  | "plan_abandon"
+  | "plan_continue"
+  | "ask_agent"
+  | "request_work"
+  | "question"
+  | "general";
+export interface IntentResult {
+  intent: Intent;
+  agentId?: string;
+  reasoning: string;
+  fromFallback: boolean;
+}
+export interface IntentContext {
+  commentBody: string;
+  issueTitle: string;
+  issueStatus?: string;
+  isPlanning: boolean;
+  /** Names of available agents (e.g. ["mal", "kaylee", "inara"]) */
+  agentNames: string[];
+  /** Whether the issue belongs to a project */
+  hasProject: boolean;
+}
+// ---------------------------------------------------------------------------
+// Valid intents (for validation)
+// ---------------------------------------------------------------------------
+const VALID_INTENTS: Set<string> = new Set([
+  "plan_start",
+  "plan_finalize",
+  "plan_abandon",
+  "plan_continue",
+  "ask_agent",
+  "request_work",
+  "question",
+  "general",
+]);
+// ---------------------------------------------------------------------------
+// Classifier prompt
+// ---------------------------------------------------------------------------
+const CLASSIFY_PROMPT = `You are an intent classifier for a developer tool. Respond ONLY with JSON.
+Intents:
+- plan_start: user wants to begin project planning
+- plan_finalize: user wants to approve/finalize the plan (e.g. "looks good", "ship it", "approve plan")
+- plan_abandon: user wants to cancel/stop planning (e.g. "nevermind", "cancel this", "stop planning")
+- plan_continue: regular message during planning (default when planning is active)
+- ask_agent: user is addressing a specific agent by name
+- request_work: user wants something built, fixed, or implemented
+- question: user asking for information or help
+- general: none of the above, automated messages, or noise
+Rules:
+- plan_start ONLY if the issue belongs to a project (hasProject=true)
+- If planning mode is active and no clear finalize/abandon intent, default to plan_continue
+- For ask_agent, set agentId to the matching name from Available agents
+- One sentence reasoning`;
+// ---------------------------------------------------------------------------
+// Classify
+// ---------------------------------------------------------------------------
+/**
+ * Classify a comment's intent using a lightweight model.
+ *
+ * Uses `classifierAgentId` from plugin config (should point to a small/fast
+ * model like Haiku for low latency and cost). Falls back to the default
+ * agent if not configured.
+ *
+ * Falls back to regex patterns if the LLM call fails or returns invalid JSON.
+ */
+export async function classifyIntent(
+  api: OpenClawPluginApi,
+  ctx: IntentContext,
+  pluginConfig?: Record<string, unknown>,
+): Promise<IntentResult> {
+  const contextBlock = [
+    `Issue: "${ctx.issueTitle}" (status: ${ctx.issueStatus ?? "unknown"})`,
+    `Planning mode: ${ctx.isPlanning}`,
+    `Has project: ${ctx.hasProject}`,
+    `Available agents: ${ctx.agentNames.join(", ") || "none"}`,
+    `Comment: "${ctx.commentBody.slice(0, 500)}"`,
+  ].join("\n");
+  const message = `${CLASSIFY_PROMPT}\n\nContext:\n${contextBlock}\n\nRespond ONLY with: {"intent":"<intent>","agentId":"<if ask_agent>","reasoning":"<one sentence>"}`;
+  try {
+    const { runAgent } = await import("../agent/agent.js");
+    const classifierAgent = resolveClassifierAgent(api, pluginConfig);
+    const result = await runAgent({
+      api,
+      agentId: classifierAgent,
+      sessionId: `intent-classify-${Date.now()}`,
+      message,
+      timeoutMs: 12_000, // 12s — fast classification
+    });
+    if (result.output) {
+      const parsed = parseIntentResponse(result.output, ctx);
+      if (parsed) {
+        api.logger.info(`Intent classified: ${parsed.intent}${parsed.agentId ? ` (agent: ${parsed.agentId})` : ""} — ${parsed.reasoning}`);
+        return parsed;
+      }
+    }
+    if (!result.success) {
+      api.logger.warn(`Intent classifier agent failed: ${result.output.slice(0, 200)}`);
+    } else {
+      api.logger.warn(`Intent classifier: could not parse response: ${result.output.slice(0, 200)}`);
+    }
+  } catch (err) {
+    api.logger.warn(`Intent classifier error: ${err}`);
+  }
+  // Fallback to regex
+  const fallback = regexFallback(ctx);
+  api.logger.info(`Intent classifier fallback: ${fallback.intent} — ${fallback.reasoning}`);
+  return fallback;
+}
+// ---------------------------------------------------------------------------
+// Response parsing
+// ---------------------------------------------------------------------------
+function parseIntentResponse(raw: string, ctx: IntentContext): IntentResult | null {
+  // Extract JSON using indexOf/lastIndexOf (more robust than regex for nested JSON)
+  const start = raw.indexOf("{");
+  const end = raw.lastIndexOf("}");
+  if (start === -1 || end === -1 || end <= start) return null;
+  try {
+    const parsed = JSON.parse(raw.slice(start, end + 1));
+    const intent = parsed.intent as string;
+    if (!VALID_INTENTS.has(intent)) return null;
+    // Validate agentId for ask_agent
+    let agentId: string | undefined;
+    if (intent === "ask_agent" && parsed.agentId) {
+      const normalized = String(parsed.agentId).toLowerCase();
+      // Only accept agent names that actually exist
+      if (ctx.agentNames.some((n) => n.toLowerCase() === normalized)) {
+        agentId = normalized;
+      }
+      // If hallucinated name, clear agentId but keep the intent
+    }
+    return {
+      intent: intent as Intent,
+      agentId,
+      reasoning: parsed.reasoning ?? "no reasoning provided",
+      fromFallback: false,
+    };
+  } catch {
+    return null;
+  }
+}
+// ---------------------------------------------------------------------------
+// Regex fallback (moved from planner.ts + webhook.ts)
+// ---------------------------------------------------------------------------
+// Planning intent patterns
+const PLAN_START_PATTERN = /\b(plan|planning)\s+(this\s+)(project|out)\b|\bplan\s+this\s+out\b/i;
+const FINALIZE_PATTERN = /\b(finalize\s+(the\s+)?plan\b|done\s+planning\b(?!\s+\w)|approve\s+(the\s+)?plan\b|plan\s+looks\s+good\b|ready\s+to\s+finalize\b|let'?s\s+finalize\b)/i;
+const ABANDON_PATTERN = /\b(abandon\s+plan(ning)?|cancel\s+plan(ning)?|stop\s+planning|exit\s+planning|quit\s+planning)\b/i;
+export function regexFallback(ctx: IntentContext): IntentResult {
+  const text = ctx.commentBody;
+  // Planning-specific patterns (only when planning is active or issue has project)
+  if (ctx.isPlanning) {
+    if (FINALIZE_PATTERN.test(text)) {
+      return { intent: "plan_finalize", reasoning: "regex: finalize pattern matched", fromFallback: true };
+    }
+    if (ABANDON_PATTERN.test(text)) {
+      return { intent: "plan_abandon", reasoning: "regex: abandon pattern matched", fromFallback: true };
+    }
+    // Default to plan_continue during planning
+    return { intent: "plan_continue", reasoning: "regex: planning mode active, default continue", fromFallback: true };
+  }
+  // Plan start (only if issue has a project)
+  if (ctx.hasProject && PLAN_START_PATTERN.test(text)) {
+    return { intent: "plan_start", reasoning: "regex: plan start pattern matched", fromFallback: true };
+  }
+  // Agent name detection
+  if (ctx.agentNames.length > 0) {
+    const lower = text.toLowerCase();
+    for (const name of ctx.agentNames) {
+      if (lower.includes(name.toLowerCase())) {
+        return { intent: "ask_agent", agentId: name.toLowerCase(), reasoning: `regex: agent name "${name}" found in comment`, fromFallback: true };
+      }
+    }
+  }
+  // Default: general (no match)
+  return { intent: "general", reasoning: "regex: no pattern matched", fromFallback: true };
+}
+// ---------------------------------------------------------------------------
+// Helpers
+// ---------------------------------------------------------------------------
+/**
+ * Resolve the agent to use for intent classification.
+ *
+ * Priority: pluginConfig.classifierAgentId → defaultAgentId → profile default.
+ * Configure classifierAgentId to point to a small/fast model (e.g. Haiku)
+ * for low-latency, low-cost classification.
+ */
+function resolveClassifierAgent(api: OpenClawPluginApi, pluginConfig?: Record<string, unknown>): string {
+  // 1. Explicit classifier agent
+  const classifierAgent = pluginConfig?.classifierAgentId ?? (api as any).pluginConfig?.classifierAgentId;
+  if (typeof classifierAgent === "string" && classifierAgent) return classifierAgent;
+  // 2. Fall back to default agent
+  return resolveDefaultAgent(api);
+}
+function resolveDefaultAgent(api: OpenClawPluginApi): string {
+  const fromConfig = (api as any).pluginConfig?.defaultAgentId;
+  if (typeof fromConfig === "string" && fromConfig) return fromConfig;
+  try {
+    const profilesPath = join(process.env.HOME ?? "/home/claw", ".openclaw", "agent-profiles.json");
+    const raw = readFileSync(profilesPath, "utf8");
+    const profiles = JSON.parse(raw).agents ?? {};
+    const defaultAgent = Object.entries(profiles).find(([, p]: [string, any]) => p.isDefault);
+    if (defaultAgent) return defaultAgent[0];
+  } catch { /* fall through */ }
+  return "default";
+}

package/src/pipeline/planner.test.ts CHANGED Viewed

@@ -16,6 +16,17 @@ vi.mock("../api/linear-api.js", () => ({}));
 vi.mock("openclaw/plugin-sdk", () => ({}));
+// Mock CLI tool runners for cross-model review
+vi.mock("../tools/claude-tool.js", () => ({
+  runClaude: vi.fn().mockResolvedValue({ success: true, output: "Claude review feedback" }),
+}));
+vi.mock("../tools/codex-tool.js", () => ({
+  runCodex: vi.fn().mockResolvedValue({ success: true, output: "Codex review feedback" }),
+}));
+vi.mock("../tools/gemini-tool.js", () => ({
+  runGemini: vi.fn().mockResolvedValue({ success: true, output: "Gemini review feedback" }),
+}));
 const mockLinearApi = {
   getProject: vi.fn().mockResolvedValue({
     id: "proj-1",
@@ -61,7 +72,13 @@ vi.mock("../tools/planner-tools.js", () => ({
 // Imports (AFTER mocks)
 // ---------------------------------------------------------------------------
-import { initiatePlanningSession, handlePlannerTurn, runPlanAudit } from "./planner.js";
+import {
+  initiatePlanningSession,
+  handlePlannerTurn,
+  runPlanAudit,
+  runCrossModelReview,
+  resolveReviewModel,
+} from "./planner.js";
 import {
   registerPlanningSession,
   updatePlanningSession,
@@ -73,6 +90,9 @@ import {
   clearActivePlannerContext,
   auditPlan,
 } from "../tools/planner-tools.js";
+import { runClaude } from "../tools/claude-tool.js";
+import { runCodex } from "../tools/codex-tool.js";
+import { runGemini } from "../tools/gemini-tool.js";
 // ---------------------------------------------------------------------------
 // Helpers
@@ -230,47 +250,31 @@ describe("handlePlannerTurn", () => {
     );
   });
-  it("detects finalize plan intent and triggers audit instead of regular turn", async () => {
-    const ctx = createCtx();
-    const session = createSession();
-    await handlePlannerTurn(ctx, session, {
-      issueId: "issue-1",
-      commentBody: "finalize plan",
-      commentorName: "Tester",
-    });
+  // Note: finalize/abandon intent detection has moved to webhook.ts via
+  // intent-classify.ts. handlePlannerTurn is now a pure "continue planning"
+  // function that always runs the agent.
+});
-    // Audit path: auditPlan is called, runAgent is NOT called
-    expect(auditPlan).toHaveBeenCalled();
-    expect(runAgentMock).not.toHaveBeenCalled();
-  });
+// ---------------------------------------------------------------------------
+// runPlanAudit
+// ---------------------------------------------------------------------------
-  it("detects abandon intent and ends session as abandoned", async () => {
+describe("runPlanAudit", () => {
+  it("transitions to plan_review on passing audit", async () => {
+    vi.mocked(auditPlan).mockReturnValue({ pass: true, problems: [], warnings: [] });
     const ctx = createCtx();
     const session = createSession();
-    await handlePlannerTurn(ctx, session, {
-      issueId: "issue-1",
-      commentBody: "abandon planning",
-      commentorName: "Tester",
-    });
+    await runPlanAudit(ctx, session);
-    expect(endPlanningSession).toHaveBeenCalledWith(
+    expect(updatePlanningSession).toHaveBeenCalledWith(
       "proj-1",
-      "abandoned",
+      { status: "plan_review" },
       undefined,
     );
-    // Should NOT run the agent
-    expect(runAgentMock).not.toHaveBeenCalled();
   });
-});
-// ---------------------------------------------------------------------------
-// runPlanAudit
-// ---------------------------------------------------------------------------
-describe("runPlanAudit", () => {
-  it("posts success comment on passing audit", async () => {
+  it("posts 'Passed Checks' comment on passing audit", async () => {
     vi.mocked(auditPlan).mockReturnValue({ pass: true, problems: [], warnings: [] });
     const ctx = createCtx();
     const session = createSession();
@@ -279,24 +283,46 @@ describe("runPlanAudit", () => {
     expect(mockLinearApi.createComment).toHaveBeenCalledWith(
       "issue-1",
-      expect.stringContaining("Approved"),
+      expect.stringContaining("Plan Passed Checks"),
     );
   });
-  it("ends session as approved on pass", async () => {
+  it("runs cross-model review automatically on passing audit", async () => {
     vi.mocked(auditPlan).mockReturnValue({ pass: true, problems: [], warnings: [] });
     const ctx = createCtx();
     const session = createSession();
     await runPlanAudit(ctx, session);
-    expect(endPlanningSession).toHaveBeenCalledWith(
-      "proj-1",
-      "approved",
-      undefined,
+    // Default review model is "gemini" (since no primary model configured)
+    expect(runGemini).toHaveBeenCalled();
+  });
+  it("runs planner agent with review prompt including cross-model feedback", async () => {
+    vi.mocked(auditPlan).mockReturnValue({ pass: true, problems: [], warnings: [] });
+    const ctx = createCtx();
+    const session = createSession();
+    await runPlanAudit(ctx, session);
+    // Agent should run with a review prompt
+    expect(runAgentMock).toHaveBeenCalledWith(
+      expect.objectContaining({
+        message: expect.stringContaining("Plan Review"),
+      }),
     );
   });
+  it("does NOT end session as approved on passing audit (waits for user approval)", async () => {
+    vi.mocked(auditPlan).mockReturnValue({ pass: true, problems: [], warnings: [] });
+    const ctx = createCtx();
+    const session = createSession();
+    await runPlanAudit(ctx, session);
+    expect(endPlanningSession).not.toHaveBeenCalled();
+  });
   it("posts problems on failing audit", async () => {
     vi.mocked(auditPlan).mockReturnValue({
       pass: false,
@@ -314,7 +340,7 @@ describe("runPlanAudit", () => {
     );
   });
-  it("does NOT end session as approved on fail", async () => {
+  it("does NOT transition to plan_review on failing audit", async () => {
     vi.mocked(auditPlan).mockReturnValue({
       pass: false,
       problems: ["No estimates"],
@@ -325,10 +351,103 @@ describe("runPlanAudit", () => {
     await runPlanAudit(ctx, session);
-    expect(endPlanningSession).not.toHaveBeenCalledWith(
+    expect(updatePlanningSession).not.toHaveBeenCalledWith(
       "proj-1",
-      "approved",
+      { status: "plan_review" },
       expect.anything(),
     );
   });
+  it("includes warnings in success comment when present", async () => {
+    vi.mocked(auditPlan).mockReturnValue({
+      pass: true,
+      problems: [],
+      warnings: ["PROJ-3 has no acceptance criteria"],
+    });
+    const ctx = createCtx();
+    const session = createSession();
+    await runPlanAudit(ctx, session);
+    expect(mockLinearApi.createComment).toHaveBeenCalledWith(
+      "issue-1",
+      expect.stringContaining("PROJ-3 has no acceptance criteria"),
+    );
+  });
+});
+// ---------------------------------------------------------------------------
+// resolveReviewModel
+// ---------------------------------------------------------------------------
+describe("resolveReviewModel", () => {
+  it("returns 'codex' when primary model is claude-based", () => {
+    expect(resolveReviewModel({
+      agents: { defaults: { model: { primary: "anthropic/claude-sonnet-4" } } },
+    } as any)).toBe("codex");
+  });
+  it("returns 'gemini' when primary model is codex-based", () => {
+    expect(resolveReviewModel({
+      agents: { defaults: { model: { primary: "openai/codex-3" } } },
+    } as any)).toBe("gemini");
+  });
+  it("returns 'codex' when primary model is gemini-based", () => {
+    expect(resolveReviewModel({
+      agents: { defaults: { model: { primary: "google/gemini-2" } } },
+    } as any)).toBe("codex");
+  });
+  it("returns 'gemini' when no primary model configured", () => {
+    expect(resolveReviewModel({})).toBe("gemini");
+  });
+  it("respects explicit plannerReviewModel config override", () => {
+    expect(resolveReviewModel({
+      plannerReviewModel: "gemini",
+      agents: { defaults: { model: { primary: "anthropic/claude-sonnet-4" } } },
+    } as any)).toBe("gemini");
+  });
+});
+// ---------------------------------------------------------------------------
+// runCrossModelReview
+// ---------------------------------------------------------------------------
+describe("runCrossModelReview", () => {
+  it("calls the correct CLI runner for the specified model", async () => {
+    const api = createApi();
+    await runCrossModelReview(api, "claude", "test snapshot");
+    expect(runClaude).toHaveBeenCalled();
+    vi.clearAllMocks();
+    await runCrossModelReview(api, "codex", "test snapshot");
+    expect(runCodex).toHaveBeenCalled();
+    vi.clearAllMocks();
+    await runCrossModelReview(api, "gemini", "test snapshot");
+    expect(runGemini).toHaveBeenCalled();
+  });
+  it("returns review output on success", async () => {
+    const api = createApi();
+    const result = await runCrossModelReview(api, "claude", "test snapshot");
+    expect(result).toBe("Claude review feedback");
+  });
+  it("returns graceful fallback on failure", async () => {
+    vi.mocked(runClaude).mockResolvedValueOnce({ success: false, error: "timeout" } as any);
+    const api = createApi();
+    const result = await runCrossModelReview(api, "claude", "test snapshot");
+    expect(result).toContain("review failed");
+  });
+  it("returns graceful fallback on exception", async () => {
+    vi.mocked(runClaude).mockRejectedValueOnce(new Error("network error"));
+    const api = createApi();
+    const result = await runCrossModelReview(api, "claude", "test snapshot");
+    expect(result).toContain("review unavailable");
+  });
 });