@gswangg/duncan-cc 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/src/query.ts ADDED
@@ -0,0 +1,626 @@
1
+ /**
2
+ * Duncan Query Dispatch
3
+ *
4
+ * Queries CC sessions using the Anthropic API with structured output
5
+ * via the duncan_response tool.
6
+ */
7
+
8
+ import Anthropic from "@anthropic-ai/sdk";
9
+ import { randomUUID } from "node:crypto";
10
+ import { readFileSync, existsSync } from "node:fs";
11
+ import { join } from "node:path";
12
+ import { homedir } from "node:os";
13
+ import { processSessionFile, processSessionWindows, type PipelineResult, type WindowPipelineResult } from "./pipeline.js";
14
+ import { resolveSessionFilesExcludingSelf, findCallingSession, listAllSessionFiles, type RoutingParams, type RoutingResult } from "./discovery.js";
15
+
16
+ // ============================================================================
17
+ // OAuth token resolution
18
+ // ============================================================================
19
+
20
+ /**
21
+ * Resolve Anthropic auth from:
22
+ * 1. Explicit apiKey/token parameter
23
+ * 2. CC's OAuth credentials (~/.claude/.credentials.json)
24
+ * 3. ANTHROPIC_API_KEY env var
25
+ */
26
+
27
+
28
+
29
// Credential bundle spread into the Anthropic SDK client constructor.
interface ResolvedAuth {
  // Explicit null disables API-key auth when a bearer token is used instead.
  apiKey?: string | null;
  // OAuth access token (bearer auth), e.g. from Claude Code's credentials.
  authToken?: string;
  // Extra headers required by the OAuth endpoint (see oauthClientConfig).
  defaultHeaders?: Record<string, string>;
}
34
+
35
+ function resolveAuth(explicit?: string): ResolvedAuth {
36
+ if (explicit) {
37
+ if (explicit.includes("sk-ant-oat")) {
38
+ return oauthClientConfig(explicit);
39
+ }
40
+ return { apiKey: explicit };
41
+ }
42
+
43
+ // CC's OAuth — primary auth for CC users
44
+ const ccCredsPath = join(homedir(), ".claude", ".credentials.json");
45
+ if (existsSync(ccCredsPath)) {
46
+ try {
47
+ const creds = JSON.parse(readFileSync(ccCredsPath, "utf-8"));
48
+ if (creds.claudeAiOauth?.accessToken) {
49
+ return oauthClientConfig(creds.claudeAiOauth.accessToken);
50
+ }
51
+ } catch {}
52
+ }
53
+
54
+ // Fallback: API key from environment
55
+ if (process.env.ANTHROPIC_API_KEY) return { apiKey: process.env.ANTHROPIC_API_KEY };
56
+
57
+ throw new Error("No Anthropic auth found. Authenticate via Claude Code or set ANTHROPIC_API_KEY.");
58
+ }
59
+
60
+ function oauthClientConfig(token: string): ResolvedAuth {
61
+ return {
62
+ apiKey: null,
63
+ authToken: token,
64
+ defaultHeaders: {
65
+ "accept": "application/json",
66
+ "anthropic-dangerous-direct-browser-access": "true",
67
+ "anthropic-beta": "claude-code-20250219,oauth-2025-04-20,fine-grained-tool-streaming-2025-05-14",
68
+ "user-agent": "duncan-cc/0.1.0",
69
+ "x-app": "cli",
70
+ },
71
+ };
72
+ }
73
+
74
+ // ============================================================================
75
+ // Duncan Response Tool
76
+ // ============================================================================
77
+
78
// Tool definition that forces the model to answer in a machine-readable shape
// ({ hasContext, answer }) instead of free text; querySingleWindow extracts
// its tool_use block and retries when the model answers in plain text.
const DUNCAN_RESPONSE_TOOL: Anthropic.Tool = {
  name: "duncan_response",
  description: "Provide your answer to the query.",
  input_schema: {
    type: "object" as const,
    properties: {
      hasContext: {
        type: "boolean",
        description: "true if the conversation contained specific information to answer the question, false if it did not",
      },
      answer: {
        type: "string",
        description: "Your answer based on the conversation context, or a brief explanation of why you lack context",
      },
    },
    // Both fields are mandatory; querySingleWindow validates their types.
    required: ["hasContext", "answer"],
  },
};
96
+
97
// Instruction prepended to the caller's question; the trailing blank line
// separates it from the question text. Sent verbatim to the API — do not edit
// the literal without considering prompt-cache invalidation.
const DUNCAN_PREFIX = `Answer solely based on the conversation above. If you don't explicitly have context from the conversation on this topic, say so. Use the duncan_response tool to provide your answer.

`;
100
+
101
+ // ============================================================================
102
+ // Types
103
+ // ============================================================================
104
+
105
/** Structured answer extracted from a duncan_response tool call. */
export interface DuncanResult {
  // true if the conversation contained information answering the question
  hasContext: boolean;
  // The answer, or a brief explanation of why context was lacking.
  answer: string;
}
109
+
110
/** One answer from one compaction window of one session. */
export interface DuncanQueryResult {
  // Batch-level UUID shared by all results of the same query.
  queryId: string;
  // Absolute path of the session's JSONL file.
  sessionFile: string;
  sessionId: string;
  // Which compaction window of the session was queried.
  windowIndex: number;
  // Model used for this window ("unknown" when not recorded).
  model: string;
  result: DuncanResult;
}
118
+
119
/** Aggregate result of a multi-window query, with pagination metadata. */
export interface DuncanBatchResult {
  queryId: string;
  // The question that was asked, echoed back for convenience.
  question: string;
  results: DuncanQueryResult[];
  // Total windows matched (may exceed results.length when paginated).
  totalWindows: number;
  // true when more windows exist beyond offset + limit.
  hasMore: boolean;
  // Pagination offset this batch started at.
  offset: number;
}
127
+
128
+ // ============================================================================
129
+ // Single Session Query
130
+ // ============================================================================
131
+
132
// Number of corrective re-prompts after a response that lacks a valid
// duncan_response tool call (so up to MAX_RETRIES + 1 API calls per window).
const MAX_RETRIES = 3;
133
+
134
+ /**
135
+ * Query a single session window with a question.
136
+ */
137
+ export async function querySingleWindow(
138
+ pipeline: PipelineResult | WindowPipelineResult,
139
+ question: string,
140
+ opts: {
141
+ apiKey?: string;
142
+ model?: string;
143
+ signal?: AbortSignal;
144
+ } = {},
145
+ ): Promise<DuncanResult> {
146
+ const auth = resolveAuth(opts.apiKey);
147
+ const isOAuth = !!auth.authToken;
148
+ const client = new Anthropic({
149
+ ...auth,
150
+ dangerouslyAllowBrowser: true,
151
+ } as any);
152
+ const model = opts.model ?? pipeline.modelInfo?.modelId ?? "claude-sonnet-4-20250514";
153
+
154
+ // Build messages: session context + question
155
+ const messages: Anthropic.MessageParam[] = [
156
+ ...pipeline.messages.map((m) => ({
157
+ role: m.role as "user" | "assistant",
158
+ content: m.content,
159
+ })),
160
+ {
161
+ role: "user" as const,
162
+ content: DUNCAN_PREFIX + question,
163
+ },
164
+ ];
165
+
166
+ // Ensure messages alternate correctly (the question might create user→user)
167
+ const fixedMessages = ensureAlternation(messages);
168
+
169
+ // Add cache_control breakpoints for prompt caching.
170
+ // Strategy: cache the session context (stable across queries), let the
171
+ // duncan query question (last user message) vary without invalidating cache.
172
+ // Place breakpoint on the last content block of the penultimate message.
173
+ addCacheBreakpoints(fixedMessages);
174
+
175
+ // Build system prompt — OAuth requires Claude Code identity prefix
176
+ // Each section gets cache_control for system prompt caching.
177
+ const systemBlocks: Anthropic.TextBlockParam[] = [];
178
+ if (isOAuth) {
179
+ systemBlocks.push({
180
+ type: "text",
181
+ text: "You are Claude Code, Anthropic's official CLI for Claude.",
182
+ cache_control: { type: "ephemeral" },
183
+ } as any);
184
+ }
185
+ if (pipeline.systemPrompt) {
186
+ systemBlocks.push({
187
+ type: "text",
188
+ text: pipeline.systemPrompt,
189
+ cache_control: { type: "ephemeral" },
190
+ } as any);
191
+ }
192
+
193
+ for (let attempt = 0; attempt <= MAX_RETRIES; attempt++) {
194
+ const response = await client.messages.create({
195
+ model,
196
+ system: systemBlocks.length > 0 ? systemBlocks : undefined,
197
+ messages: fixedMessages,
198
+ tools: [DUNCAN_RESPONSE_TOOL],
199
+ max_tokens: 16384,
200
+ });
201
+
202
+ // Look for duncan_response tool call
203
+ const toolCall = response.content.find(
204
+ (c): c is Anthropic.ToolUseBlock => c.type === "tool_use" && c.name === "duncan_response",
205
+ );
206
+
207
+ if (toolCall) {
208
+ const input = toolCall.input as { hasContext: boolean; answer: string };
209
+ if (typeof input.hasContext === "boolean" && typeof input.answer === "string") {
210
+ return { hasContext: input.hasContext, answer: input.answer };
211
+ }
212
+ }
213
+
214
+ // Retry: ask the model to use the tool
215
+ if (attempt < MAX_RETRIES) {
216
+ fixedMessages.push(
217
+ { role: "assistant", content: response.content },
218
+ {
219
+ role: "user",
220
+ content: "You must respond by calling the duncan_response tool with { hasContext: boolean, answer: string }. Do not respond with plain text.",
221
+ },
222
+ );
223
+ }
224
+ }
225
+
226
+ throw new Error(`Duncan query failed after ${MAX_RETRIES} retries: model did not produce a valid duncan_response tool call`);
227
+ }
228
+
229
+ // ============================================================================
230
+ // Batch Query
231
+ // ============================================================================
232
+
233
+ /**
234
+ * Query multiple sessions with a question.
235
+ */
236
+ export async function queryBatch(
237
+ question: string,
238
+ routing: RoutingParams & { toolUseId?: string },
239
+ opts: {
240
+ apiKey?: string;
241
+ model?: string;
242
+ signal?: AbortSignal;
243
+ batchSize?: number;
244
+ onProgress?: (completed: number, total: number) => void;
245
+ } = {},
246
+ ): Promise<DuncanBatchResult> {
247
+ const queryId = randomUUID();
248
+ const resolved = resolveSessionFilesExcludingSelf(routing);
249
+
250
+ if (resolved.sessions.length === 0) {
251
+ return {
252
+ queryId,
253
+ question,
254
+ results: [],
255
+ totalWindows: 0,
256
+ hasMore: false,
257
+ offset: routing.offset ?? 0,
258
+ };
259
+ }
260
+
261
+ // Process each session into windows
262
+ const targets: Array<{
263
+ sessionFile: string;
264
+ sessionId: string;
265
+ pipeline: WindowPipelineResult;
266
+ }> = [];
267
+
268
+ for (const session of resolved.sessions) {
269
+ try {
270
+ const windows = processSessionWindows(session.path);
271
+ for (const w of windows) {
272
+ if (w.messages.length === 0) continue;
273
+ targets.push({
274
+ sessionFile: session.path,
275
+ sessionId: session.sessionId,
276
+ pipeline: w,
277
+ });
278
+ }
279
+ } catch {
280
+ // Skip unprocessable sessions
281
+ }
282
+ }
283
+
284
+ const batchSize = opts.batchSize ?? 5;
285
+ const results: DuncanQueryResult[] = [];
286
+ let completed = 0;
287
+
288
+ for (let i = 0; i < targets.length; i += batchSize) {
289
+ if (opts.signal?.aborted) break;
290
+
291
+ const batch = targets.slice(i, i + batchSize);
292
+ const batchResults = await Promise.all(
293
+ batch.map(async (target) => {
294
+ try {
295
+ const result = await querySingleWindow(target.pipeline, question, {
296
+ apiKey: opts.apiKey,
297
+ model: opts.model ?? target.pipeline.modelInfo?.modelId,
298
+ signal: opts.signal,
299
+ });
300
+ completed++;
301
+ opts.onProgress?.(completed, targets.length);
302
+ return {
303
+ queryId,
304
+ sessionFile: target.sessionFile,
305
+ sessionId: target.sessionId,
306
+ windowIndex: target.pipeline.windowIndex,
307
+ model: target.pipeline.modelInfo?.modelId ?? "unknown",
308
+ result,
309
+ };
310
+ } catch (err: any) {
311
+ completed++;
312
+ opts.onProgress?.(completed, targets.length);
313
+ return {
314
+ queryId,
315
+ sessionFile: target.sessionFile,
316
+ sessionId: target.sessionId,
317
+ windowIndex: target.pipeline.windowIndex,
318
+ model: target.pipeline.modelInfo?.modelId ?? "unknown",
319
+ result: {
320
+ hasContext: false,
321
+ answer: `Error: ${err.message}`,
322
+ },
323
+ };
324
+ }
325
+ }),
326
+ );
327
+
328
+ results.push(...batchResults);
329
+ }
330
+
331
+ return {
332
+ queryId,
333
+ question,
334
+ results,
335
+ totalWindows: targets.length,
336
+ hasMore: resolved.hasMore,
337
+ offset: routing.offset ?? 0,
338
+ };
339
+ }
340
+
341
+ // ============================================================================
342
+ // Self Query — multiple samples from the active window
343
+ // ============================================================================
344
+
345
+ /**
346
+ * Query the calling session's own active window N times for sampling diversity.
347
+ *
348
+ * Uses a two-wave strategy to leverage prompt caching:
349
+ * 1. Wave 1: Send 1 query to prime the cache (pays full input cost)
350
+ * 2. Wave 2: Send remaining N-1 queries in batches (hit cached prefix)
351
+ *
352
+ * The active session is identified by toolUseId (from MCP _meta).
353
+ */
354
+ export async function querySelf(
355
+ question: string,
356
+ opts: {
357
+ toolUseId: string;
358
+ copies?: number;
359
+ batchSize?: number;
360
+ apiKey?: string;
361
+ model?: string;
362
+ signal?: AbortSignal;
363
+ onProgress?: (completed: number, total: number) => void;
364
+ },
365
+ ): Promise<DuncanBatchResult> {
366
+ const queryId = randomUUID();
367
+ const copies = opts.copies ?? 3;
368
+
369
+ // Find the calling session by toolUseId
370
+ const allSessions = listAllSessionFiles();
371
+ const callingSessionId = findCallingSession(opts.toolUseId, allSessions);
372
+ if (!callingSessionId) {
373
+ return {
374
+ queryId, question, results: [], totalWindows: 0, hasMore: false, offset: 0,
375
+ };
376
+ }
377
+
378
+ const session = allSessions.find(s => s.sessionId === callingSessionId);
379
+ if (!session) {
380
+ return {
381
+ queryId, question, results: [], totalWindows: 0, hasMore: false, offset: 0,
382
+ };
383
+ }
384
+
385
+ // Process the session and get the LAST (active) window
386
+ const windows = processSessionWindows(session.path);
387
+ if (windows.length === 0) {
388
+ return {
389
+ queryId, question, results: [], totalWindows: 0, hasMore: false, offset: 0,
390
+ };
391
+ }
392
+ const activeWindow = windows[windows.length - 1];
393
+ if (activeWindow.messages.length === 0) {
394
+ return {
395
+ queryId, question, results: [], totalWindows: 0, hasMore: false, offset: 0,
396
+ };
397
+ }
398
+
399
+ const total = copies;
400
+ let completed = 0;
401
+ const results: DuncanQueryResult[] = [];
402
+
403
+ const queryOnce = async (): Promise<DuncanQueryResult> => {
404
+ try {
405
+ const result = await querySingleWindow(activeWindow, question, {
406
+ apiKey: opts.apiKey,
407
+ model: opts.model ?? activeWindow.modelInfo?.modelId,
408
+ signal: opts.signal,
409
+ });
410
+ completed++;
411
+ opts.onProgress?.(completed, total);
412
+ return {
413
+ queryId,
414
+ sessionFile: session.path,
415
+ sessionId: session.sessionId,
416
+ windowIndex: activeWindow.windowIndex,
417
+ model: activeWindow.modelInfo?.modelId ?? "unknown",
418
+ result,
419
+ };
420
+ } catch (err: any) {
421
+ completed++;
422
+ opts.onProgress?.(completed, total);
423
+ return {
424
+ queryId,
425
+ sessionFile: session.path,
426
+ sessionId: session.sessionId,
427
+ windowIndex: activeWindow.windowIndex,
428
+ model: activeWindow.modelInfo?.modelId ?? "unknown",
429
+ result: { hasContext: false, answer: `Error: ${err.message}` },
430
+ };
431
+ }
432
+ };
433
+
434
+ // Wave 1: prime the cache with a single query
435
+ results.push(await queryOnce());
436
+ if (opts.signal?.aborted || copies <= 1) {
437
+ return { queryId, question, results, totalWindows: total, hasMore: false, offset: 0 };
438
+ }
439
+
440
+ // Wave 2: remaining copies in batches, hitting cached prefix
441
+ const remaining = copies - 1;
442
+ const batchSize = opts.batchSize ?? 5;
443
+ for (let i = 0; i < remaining; i += batchSize) {
444
+ if (opts.signal?.aborted) break;
445
+ const batchCount = Math.min(batchSize, remaining - i);
446
+ const batchResults = await Promise.all(
447
+ Array.from({ length: batchCount }, () => queryOnce()),
448
+ );
449
+ results.push(...batchResults);
450
+ }
451
+
452
+ return { queryId, question, results, totalWindows: total, hasMore: false, offset: 0 };
453
+ }
454
+
455
+ // ============================================================================
456
+ // Ancestors Query — prior compaction windows of the active session
457
+ // ============================================================================
458
+
459
+ /**
460
+ * Query the calling session's prior compaction windows (excluding active).
461
+ *
462
+ * In CC (no dfork), "ancestors" means the compacted windows of the current
463
+ * session — the context that was summarized away. Returns nothing if the
464
+ * session has no compaction boundaries.
465
+ */
466
+ export async function queryAncestors(
467
+ question: string,
468
+ opts: {
469
+ toolUseId: string;
470
+ limit?: number;
471
+ offset?: number;
472
+ batchSize?: number;
473
+ apiKey?: string;
474
+ model?: string;
475
+ signal?: AbortSignal;
476
+ onProgress?: (completed: number, total: number) => void;
477
+ },
478
+ ): Promise<DuncanBatchResult> {
479
+ const queryId = randomUUID();
480
+ const limit = opts.limit ?? 50;
481
+ const offset = opts.offset ?? 0;
482
+
483
+ // Find the calling session
484
+ const allSessions = listAllSessionFiles();
485
+ const callingSessionId = findCallingSession(opts.toolUseId, allSessions);
486
+ if (!callingSessionId) {
487
+ return { queryId, question, results: [], totalWindows: 0, hasMore: false, offset };
488
+ }
489
+
490
+ const session = allSessions.find(s => s.sessionId === callingSessionId);
491
+ if (!session) {
492
+ return { queryId, question, results: [], totalWindows: 0, hasMore: false, offset };
493
+ }
494
+
495
+ // Get all windows, drop the last (active) one
496
+ const allWindows = processSessionWindows(session.path);
497
+ const ancestorWindows = allWindows.slice(0, -1).filter(w => w.messages.length > 0);
498
+
499
+ if (ancestorWindows.length === 0) {
500
+ return { queryId, question, results: [], totalWindows: 0, hasMore: false, offset };
501
+ }
502
+
503
+ const totalWindows = ancestorWindows.length;
504
+ const page = ancestorWindows.slice(offset, offset + limit);
505
+
506
+ const batchSize = opts.batchSize ?? 5;
507
+ const results: DuncanQueryResult[] = [];
508
+ let completed = 0;
509
+
510
+ for (let i = 0; i < page.length; i += batchSize) {
511
+ if (opts.signal?.aborted) break;
512
+
513
+ const batch = page.slice(i, i + batchSize);
514
+ const batchResults = await Promise.all(
515
+ batch.map(async (window) => {
516
+ try {
517
+ const result = await querySingleWindow(window, question, {
518
+ apiKey: opts.apiKey,
519
+ model: opts.model ?? window.modelInfo?.modelId,
520
+ signal: opts.signal,
521
+ });
522
+ completed++;
523
+ opts.onProgress?.(completed, page.length);
524
+ return {
525
+ queryId,
526
+ sessionFile: session.path,
527
+ sessionId: session.sessionId,
528
+ windowIndex: window.windowIndex,
529
+ model: window.modelInfo?.modelId ?? "unknown",
530
+ result,
531
+ };
532
+ } catch (err: any) {
533
+ completed++;
534
+ opts.onProgress?.(completed, page.length);
535
+ return {
536
+ queryId,
537
+ sessionFile: session.path,
538
+ sessionId: session.sessionId,
539
+ windowIndex: window.windowIndex,
540
+ model: window.modelInfo?.modelId ?? "unknown",
541
+ result: { hasContext: false, answer: `Error: ${err.message}` },
542
+ };
543
+ }
544
+ }),
545
+ );
546
+ results.push(...batchResults);
547
+ }
548
+
549
+ return {
550
+ queryId,
551
+ question,
552
+ results,
553
+ totalWindows,
554
+ hasMore: offset + limit < totalWindows,
555
+ offset,
556
+ };
557
+ }
558
+
559
+ // ============================================================================
560
+ // Helpers
561
+ // ============================================================================
562
+
563
+ /**
564
+ * Add cache_control breakpoints to messages for prompt caching.
565
+ *
566
+ * Places an ephemeral cache breakpoint on the last content block of the
567
+ * penultimate message. This caches all session context while allowing
568
+ * the duncan query (last message) to vary without invalidating the cache.
569
+ *
570
+ * Matches CC's caching strategy (CC API format functions) where the last content block
571
+ * of each message gets cache_control when caching is enabled.
572
+ */
573
+ function addCacheBreakpoints(messages: Anthropic.MessageParam[]): void {
574
+ if (messages.length < 2) return;
575
+
576
+ // Find the penultimate message (last session context message before the duncan query)
577
+ const penultimate = messages[messages.length - 2];
578
+ if (!penultimate) return;
579
+
580
+ const content = penultimate.content;
581
+ if (typeof content === "string") {
582
+ // Convert to block format to add cache_control
583
+ penultimate.content = [
584
+ {
585
+ type: "text" as const,
586
+ text: content,
587
+ cache_control: { type: "ephemeral" as const },
588
+ } as any,
589
+ ];
590
+ } else if (Array.isArray(content) && content.length > 0) {
591
+ // Add cache_control to the last block
592
+ const lastBlock = content[content.length - 1] as any;
593
+ content[content.length - 1] = {
594
+ ...lastBlock,
595
+ cache_control: { type: "ephemeral" as const },
596
+ };
597
+ }
598
+ }
599
+
600
+ /** Ensure messages alternate user/assistant */
601
+ function ensureAlternation(messages: Anthropic.MessageParam[]): Anthropic.MessageParam[] {
602
+ if (messages.length === 0) return messages;
603
+
604
+ const result: Anthropic.MessageParam[] = [messages[0]];
605
+ for (let i = 1; i < messages.length; i++) {
606
+ const prev = result[result.length - 1];
607
+ if (messages[i].role === prev.role) {
608
+ // Merge same-role messages
609
+ const prevContent = Array.isArray(prev.content) ? prev.content : [{ type: "text" as const, text: prev.content }];
610
+ const curContent = Array.isArray(messages[i].content) ? messages[i].content : [{ type: "text" as const, text: messages[i].content as string }];
611
+ result[result.length - 1] = {
612
+ role: prev.role,
613
+ content: [...prevContent, ...curContent] as any,
614
+ };
615
+ } else {
616
+ result.push(messages[i]);
617
+ }
618
+ }
619
+
620
+ // Ensure first message is user
621
+ if (result[0].role !== "user") {
622
+ result.unshift({ role: "user", content: "[Session context follows]" });
623
+ }
624
+
625
+ return result;
626
+ }