npm - osborn - Versions diffs - 0.5.2 → 0.5.5 - Mend

osborn 0.5.2 → 0.5.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (37) hide show

package/.claude/settings.local.json +9 -0
package/.claude/skills/markdown-to-pdf/SKILL.md +29 -0
package/.claude/skills/pdf-to-markdown/SKILL.md +28 -0
package/.claude/skills/playwright-browser/SKILL.md +75 -0
package/.claude/skills/youtube-transcript/SKILL.md +24 -0
package/dist/claude-llm.d.ts +29 -1
package/dist/claude-llm.js +346 -79
package/dist/config.d.ts +6 -2
package/dist/config.js +6 -1
package/dist/fast-brain.d.ts +124 -12
package/dist/fast-brain.js +1361 -96
package/dist/index-3-2-26-legacy.d.ts +1 -0
package/dist/index-3-2-26-legacy.js +2233 -0
package/dist/index.js +889 -394
package/dist/jsonl-search.d.ts +66 -0
package/dist/jsonl-search.js +274 -0
package/dist/leagcyprompts2.d.ts +0 -0
package/dist/leagcyprompts2.js +573 -0
package/dist/pipeline-direct-llm.d.ts +77 -0
package/dist/pipeline-direct-llm.js +216 -0
package/dist/pipeline-fastbrain.d.ts +45 -0
package/dist/pipeline-fastbrain.js +367 -0
package/dist/prompts-2-25-26.d.ts +0 -0
package/dist/prompts-2-25-26.js +518 -0
package/dist/prompts-3-2-26.d.ts +78 -0
package/dist/prompts-3-2-26.js +1319 -0
package/dist/prompts.d.ts +83 -8
package/dist/prompts.js +1990 -374
package/dist/session-access.d.ts +60 -2
package/dist/session-access.js +172 -2
package/dist/summary-index.d.ts +87 -0
package/dist/summary-index.js +570 -0
package/dist/turn-detector-shim.d.ts +24 -0
package/dist/turn-detector-shim.js +83 -0
package/dist/voice-io.d.ts +9 -3
package/dist/voice-io.js +39 -20
package/package.json +18 -11

package/dist/pipeline-direct-llm.d.ts ADDED Viewed

@@ -0,0 +1,77 @@
+/**
+ * Pipeline Direct LLM — Wraps ClaudeLLM with parallel Gemini fast brain
+ *
+ * In pipeline mode, every user message fires two tracks simultaneously:
+ *   Track A: Claude SDK (unchanged) — speaks the answer via TTS
+ *   Track B: Gemini fast brain (new) — searches JSONL memory, sends result to UI only
+ *
+ * Phase 1 (current): Gemini is silent — results go to frontend panel for monitoring
+ * Phase 2 (future): Gemini speaks first, Claude suppressed when Gemini has HIGH confidence
+ */
+import { llm, type APIConnectOptions } from '@livekit/agents';
+import { type ClaudeLLMOptions } from './claude-llm.js';
+import { EventEmitter } from 'events';
+export interface InterruptionContext { // snapshot consumed by chat() when the user cut the agent off mid-speech
+    spokenText: string; // quoted to Claude as what the user heard before the cutoff
+    recentMessages: string; // the agent's recent messages; an empty value is rendered as "(no recent messages found)"
+}
+export interface PipelineDirectOptions extends ClaudeLLMOptions { // ClaudeLLM options plus optional hooks used by the pipeline wrapper
+    onFastBrainResult?: (result: FastBrainPanelResult) => void; // called with each fast-brain result, unless the turn was superseded by a newer one
+    getChatHistory?: () => { // supplies chat turns to the fast brain; an empty list is used when omitted
+        role: string;
+        content: string;
+    }[];
+    getResearchContext?: () => string | undefined; // forwarded to the fast brain as `researchContext`
+    /** Returns pending interruption context and clears it (consumed once). null = no pending interruption. */
+    getAndConsumeInterruptionContext?: () => InterruptionContext | null;
+}
+export interface FastBrainPanelResult { // payload passed to PipelineDirectOptions.onFastBrainResult
+    question: string; // the user text that triggered the fast-brain turn
+    answer: string; // the fast brain's `script` output
+    type: string; // result type as reported by the fast brain
+    elapsedMs: number; // milliseconds from the start of the fast-brain turn until its result was available
+    timestamp: number; // Date.now() taken when the result was emitted
+    toolsUsed: string[]; // tool names as reported by the fast brain
+}
+export declare class PipelineDirectLLM extends llm.LLM { // wraps a ClaudeLLM and fires the pipeline fast brain alongside each chat() turn
+    #private;
+    constructor(opts: PipelineDirectOptions); // opts are also used to construct the wrapped ClaudeLLM
+    /** Stop the index watcher (call on disconnect/session switch) */
+    stopIndexWatcher(): void;
+    get events(): EventEmitter; // the wrapped ClaudeLLM's event emitter
+    get sessionId(): string | null; // the wrapped ClaudeLLM's session id
+    get model(): string; // the wrapped ClaudeLLM's model
+    get isResumingSession(): boolean; // the wrapped ClaudeLLM's resume flag
+    label(): string; // always 'pipeline-direct'
+    setResumeSessionId(id: string | null): void; // delegates to ClaudeLLM
+    setContinueSession(e: boolean): void; // delegates to ClaudeLLM
+    resetForSessionSwitch(): void; // delegates to ClaudeLLM; does not stop the index watcher
+    respondToPermission(allow: boolean, msg?: string): void; // delegates to ClaudeLLM
+    hasPendingPermission(): boolean; // delegates to ClaudeLLM
+    getPendingPermission(): { // delegates to ClaudeLLM
+        toolName: string;
+        input: any;
+    };
+    getMcpServers(): Record<string, import("@anthropic-ai/claude-agent-sdk").McpServerConfig>; // delegates to ClaudeLLM
+    setMcpServers(s: any): void; // delegates to ClaudeLLM
+    interruptAgent(): Promise<boolean>; // delegates to ClaudeLLM.interruptQuery()
+    abortAgent(): void; // delegates to ClaudeLLM.abortQuery()
+    rewindAgent(checkpointId?: string): Promise<boolean>; // delegates to ClaudeLLM.rewindToCheckpoint()
+    hasActiveAgent(): boolean; // delegates to ClaudeLLM.hasActiveQuery()
+    /** Send a new prompt to Claude via direct chat() — event listeners stay attached */
+    sendPrompt(prompt: string): void;
+    enableMcpServer(k: string, c: any): void; // delegates to ClaudeLLM
+    disableMcpServer(k: string): void; // delegates to ClaudeLLM
+    getLatestCheckpoint(): string; // delegates to ClaudeLLM
+    getFirstCheckpoint(): string; // delegates to ClaudeLLM
+    getCheckpoints(): string[]; // delegates to ClaudeLLM
+    clearCheckpoints(): void; // delegates to ClaudeLLM
+    hasCheckpoints(): boolean; // delegates to ClaudeLLM
+    chat({ chatCtx, toolCtx, connOptions, abortController, }: { // returns ClaudeLLM's stream; the fast brain runs in the background
+        chatCtx: llm.ChatContext;
+        toolCtx?: llm.ToolContext;
+        connOptions?: APIConnectOptions;
+        abortController?: AbortController;
+    }): llm.LLMStream;
+}
+export declare function createPipelineDirectLLM(opts: PipelineDirectOptions): PipelineDirectLLM; // factory: returns a new PipelineDirectLLM built from opts

package/dist/pipeline-direct-llm.js ADDED Viewed

@@ -0,0 +1,216 @@
+/**
+ * Pipeline Direct LLM — Wraps ClaudeLLM with parallel Gemini fast brain
+ *
+ * In pipeline mode, every user message fires two tracks simultaneously:
+ *   Track A: Claude SDK (unchanged) — speaks the answer via TTS
+ *   Track B: Gemini fast brain (new) — searches JSONL memory, sends result to UI only
+ *
+ * Phase 1 (current): Gemini is silent — results go to frontend panel for monitoring
+ * Phase 2 (future): Gemini speaks first, Claude suppressed when Gemini has HIGH confidence
+ */
+import { llm, DEFAULT_API_CONNECT_OPTIONS } from '@livekit/agents';
+import { ClaudeLLM } from './claude-llm.js';
+import { askPipelineFastBrain } from './pipeline-fastbrain.js';
+import { buildSummaryIndex, startIndexWatcher } from './summary-index.js';
+export class PipelineDirectLLM extends llm.LLM {
+    #claudeLLM;
+    #opts;
+    #turnAbort = null;
+    #indexWatcher = null;
+    #indexBuilding = false;
+    constructor(opts) {
+        super();
+        this.#claudeLLM = new ClaudeLLM(opts);
+        this.#opts = opts;
+    }
+    /** Stop the index watcher (call on disconnect/session switch) */
+    stopIndexWatcher() {
+        if (this.#indexWatcher) {
+            this.#indexWatcher.stop();
+            this.#indexWatcher = null;
+        }
+    }
+    // Proxy all properties
+    get events() { return this.#claudeLLM.events; }
+    get sessionId() { return this.#claudeLLM.sessionId; }
+    get model() { return this.#claudeLLM.model; }
+    get isResumingSession() { return this.#claudeLLM.isResumingSession; }
+    label() { return 'pipeline-direct'; }
+    // Proxy all methods
+    setResumeSessionId(id) { this.#claudeLLM.setResumeSessionId(id); }
+    setContinueSession(e) { this.#claudeLLM.setContinueSession(e); }
+    resetForSessionSwitch() { this.#claudeLLM.resetForSessionSwitch(); }
+    respondToPermission(allow, msg) { this.#claudeLLM.respondToPermission(allow, msg); }
+    hasPendingPermission() { return this.#claudeLLM.hasPendingPermission(); }
+    getPendingPermission() { return this.#claudeLLM.getPendingPermission(); }
+    getMcpServers() { return this.#claudeLLM.getMcpServers(); }
+    setMcpServers(s) { this.#claudeLLM.setMcpServers(s); }
+    // Agent control — proxied to ClaudeLLM for fast brain access
+    async interruptAgent() { return this.#claudeLLM.interruptQuery(); }
+    abortAgent() { this.#claudeLLM.abortQuery(); }
+    async rewindAgent(checkpointId) { return this.#claudeLLM.rewindToCheckpoint(checkpointId); }
+    hasActiveAgent() { return this.#claudeLLM.hasActiveQuery(); }
+    /** Send a new prompt to Claude via direct chat() — event listeners stay attached */
+    sendPrompt(prompt) {
+        console.log(`📋 [pipeline] Sending prompt to Claude (${prompt.length} chars)`);
+        const chatCtx = new llm.ChatContext();
+        chatCtx.addMessage({ role: 'user', content: prompt });
+        this.#claudeLLM.chat({ chatCtx });
+    }
+    enableMcpServer(k, c) { this.#claudeLLM.enableMcpServer(k, c); }
+    disableMcpServer(k) { this.#claudeLLM.disableMcpServer(k); }
+    getLatestCheckpoint() { return this.#claudeLLM.getLatestCheckpoint(); }
+    getFirstCheckpoint() { return this.#claudeLLM.getFirstCheckpoint(); }
+    getCheckpoints() { return this.#claudeLLM.getCheckpoints(); }
+    clearCheckpoints() { this.#claudeLLM.clearCheckpoints(); }
+    hasCheckpoints() { return this.#claudeLLM.hasCheckpoints(); }
+    #chatCallCount = 0;
+    chat({ chatCtx, toolCtx, connOptions = DEFAULT_API_CONNECT_OPTIONS, abortController, }) {
+        const callN = ++this.#chatCallCount;
+        // Extract user text for fast brain
+        let userText = '';
+        for (let i = chatCtx.items.length - 1; i >= 0; i--) {
+            const item = chatCtx.items[i];
+            if (item.type === 'message' && item.role === 'user') {
+                if (Array.isArray(item.content)) {
+                    userText = item.content.filter((c) => typeof c === 'string').join('\n');
+                }
+                break;
+            }
+        }
+        console.log(`📥 [pipeline] chat() call #${callN}: "${userText.substring(0, 60)}"`);
+        // Check for pending interruption context — enrich user message if interrupted
+        const interruptCtx = this.#opts.getAndConsumeInterruptionContext?.();
+        if (interruptCtx && userText.trim()) {
+            console.log(`🔇 [pipeline] Enriching user message with interruption context`);
+            // Interrupt Claude's current work before sending enriched message
+            this.#claudeLLM.interruptQuery().catch(() => { });
+            // Replace user message in chatCtx with context-enriched version
+            const enrichedMessage = [
+                `[INTERRUPTED] The user interrupted your response mid-speech.`,
+                ``,
+                `What the user heard before cutoff:`,
+                `"${interruptCtx.spokenText}"`,
+                ``,
+                `Your recent messages (full untruncated — you wrote these):`,
+                interruptCtx.recentMessages || '(no recent messages found)',
+                ``,
+                `User's message: "${userText}"`,
+                ``,
+                `Handle naturally:`,
+                `- If it's a quick side question, answer it then continue where you left off (restart sub-agents if needed)`,
+                `- If they want to change direction, follow their lead`,
+                `- Don't repeat what was already spoken unless it makes sense to clarify`,
+                `- Reference unspoken content naturally if relevant`,
+            ].join('\n');
+            // Modify the last user message in chatCtx
+            for (let i = chatCtx.items.length - 1; i >= 0; i--) {
+                const item = chatCtx.items[i];
+                if (item.type === 'message' && item.role === 'user') {
+                    item.content = [enrichedMessage];
+                    break;
+                }
+            }
+        }
+        // Fire Claude
+        const claudeStream = this.#claudeLLM.chat({ chatCtx, toolCtx, connOptions, abortController });
+        // Fire pipeline fast brain in background — no await, no blocking
+        if (userText.trim()) {
+            this.#firePipelineFastBrain(userText);
+        }
+        return claudeStream;
+    }
+    async #firePipelineFastBrain(userText) {
+        // Abort stale turn
+        if (this.#turnAbort)
+            this.#turnAbort.abort();
+        this.#turnAbort = new AbortController();
+        const signal = this.#turnAbort.signal;
+        const startMs = Date.now();
+        // Wait for SDK to assign session ID — listen for event instead of polling
+        // Large sessions (22MB+) can take 10-15s for SDK to replay JSONL
+        let sessionId = this.#claudeLLM.sessionId;
+        if (!sessionId) {
+            sessionId = await new Promise((resolve) => {
+                // Listen for the session_id event from SDK
+                const onSessionId = (data) => {
+                    resolve(data.sessionId);
+                };
+                this.#claudeLLM.events.once('session_id', onSessionId);
+                // Safety timeout — don't wait forever
+                setTimeout(() => {
+                    this.#claudeLLM.events.removeListener('session_id', onSessionId);
+                    resolve(this.#claudeLLM.sessionId || 'pending');
+                }, 15000);
+            });
+        }
+        const workingDir = this.#opts.workingDirectory || process.cwd();
+        const sessionBaseDir = this.#opts.sessionBaseDir || workingDir;
+        // Build summary index on first question (async, non-blocking for subsequent questions)
+        if (!this.#indexWatcher && !this.#indexBuilding && sessionId !== 'pending') {
+            this.#indexBuilding = true;
+            try {
+                const startBuild = Date.now();
+                const state = buildSummaryIndex(sessionId, workingDir, sessionBaseDir, (msg) => console.log(`🔍 [index] ${msg}`));
+                this.#indexWatcher = startIndexWatcher(sessionId, workingDir, sessionBaseDir, state);
+                console.log(`🔍 [index] Built + watching in ${Date.now() - startBuild}ms`);
+            }
+            catch (err) {
+                console.error('🔍 [index] Build failed:', err?.message);
+            }
+            this.#indexBuilding = false;
+        }
+        try {
+            console.log(`🧠⚡ [pipeline] Fast brain: "${userText.substring(0, 60)}"`);
+            const result = await askPipelineFastBrain(workingDir, sessionId, userText, {
+                chatHistory: this.#opts.getChatHistory?.() || [],
+                researchContext: this.#opts.getResearchContext?.(),
+                sessionBaseDir,
+                agentControl: {
+                    interrupt: () => this.#claudeLLM.interruptQuery(),
+                    abort: () => this.#claudeLLM.abortQuery(),
+                    hasActiveAgent: () => this.#claudeLLM.hasActiveQuery(),
+                    getRecentUserMessages: (count) => {
+                        const history = this.#opts.getChatHistory?.() || [];
+                        return history
+                            .filter(t => t.role === 'user')
+                            .slice(-count)
+                            .map(t => t.content);
+                    },
+                    sendPrompt: (prompt) => {
+                        // Direct call to ClaudeLLM.chat() — event listeners (tts_say, tool_use, etc.) still attached
+                        // skipTTSQueue mode: tts_say events → index.ts → session.say() — works independently
+                        console.log(`🧠⚡ [control] Sending new prompt to Claude (${prompt.length} chars)`);
+                        const chatCtx = new llm.ChatContext();
+                        chatCtx.addMessage({ role: 'user', content: prompt });
+                        this.#claudeLLM.chat({ chatCtx });
+                    },
+                },
+            });
+            if (signal.aborted)
+                return;
+            const elapsedMs = Date.now() - startMs;
+            console.log(`🧠⚡ [pipeline] ${result.type} in ${elapsedMs}ms [${result.toolsUsed.join(',')}]: "${result.script.substring(0, 80)}"`);
+            this.#opts.onFastBrainResult?.({
+                question: userText,
+                answer: result.script,
+                type: result.type,
+                elapsedMs,
+                timestamp: Date.now(),
+                toolsUsed: result.toolsUsed,
+            });
+        }
+        catch (err) {
+            if (err?.name === 'AbortError')
+                return;
+            console.error('❌ [pipeline] Fast brain error:', err?.message);
+        }
+        finally {
+            if (this.#turnAbort?.signal === signal)
+                this.#turnAbort = null;
+        }
+    }
+}
+export function createPipelineDirectLLM(opts) {
+    return new PipelineDirectLLM(opts);
+}

package/dist/pipeline-fastbrain.d.ts ADDED Viewed

@@ -0,0 +1,45 @@
+/**
+ * pipeline-fastbrain.ts — Pipeline Fast Brain (Agent with AFC)
+ *
+ * Uses Gemini Flash as an AGENT with Automatic Function Calling (AFC).
+ * One generateContent() call handles everything:
+ *   - Gemini decides IF it needs to search (skips for greetings/follow-ups)
+ *   - Gemini decides WHAT to search (smart phrase selection)
+ *   - Gemini can multi-step: search → not enough → refine → search again
+ *   - AFC handles the tool loop internally (up to 3 rounds)
+ *
+ * Tools:
+ *   search_session — ripgrep the summary index + read full content via byte offsets
+ *
+ * No separate phrase extraction call. No manual tool loop. One API invocation.
+ */
+export interface PipelineFastBrainResult { // value resolved by askPipelineFastBrain()
+    script: string; // response text; PipelineDirectLLM forwards it to the UI callback as `answer`
+    type: 'answer' | 'research_needed' | 'acknowledgment' | 'error'; // result category
+    toolsUsed: string[]; // tool names; PipelineDirectLLM logs and forwards them unchanged
+}
+export interface PipelineFastBrainOptions { // optional inputs for askPipelineFastBrain(); all fields may be omitted
+    chatHistory?: { // conversation turns; PipelineDirectLLM passes getChatHistory() or an empty list
+        role: string;
+        content: string;
+    }[];
+    researchContext?: string; // PipelineDirectLLM passes the result of getResearchContext()
+    sessionBaseDir?: string; // PipelineDirectLLM passes opts.sessionBaseDir, falling back to the working directory
+    agentControl?: AgentControlCallbacks; // callbacks through which the fast brain can act on the Claude agent
+}
+/** Clear the pipeline fast brain session (call on disconnect/reconnect) */
+export declare function clearPipelineFastBrainSession(): void; // NOTE(review): takes no handle, so presumably clears module-level state — confirm in pipeline-fastbrain.js
+/** No-op — kept for backward compatibility with index.ts import */
+export declare function prewarmBM25Index(_sessionId: string, _workingDir: string): Promise<void>; // underscore-prefixed parameters: documented above as a no-op, so presumably unused
+/**
+ * Callbacks through which the fast brain can act on the running Claude agent.
+ * PipelineDirectLLM supplies them, backed by its wrapped ClaudeLLM and chat history.
+ */
+export interface AgentControlCallbacks {
+    interrupt: () => Promise<boolean>; // PipelineDirectLLM wires this to ClaudeLLM.interruptQuery()
+    abort: () => void; // wired to ClaudeLLM.abortQuery()
+    hasActiveAgent: () => boolean; // wired to ClaudeLLM.hasActiveQuery()
+    getRecentUserMessages: (count: number) => string[]; // contents of the last `count` user-role entries of the chat history
+    sendPrompt: (prompt: string) => void; // sends `prompt` to Claude as a new user message via ClaudeLLM.chat()
+}
+export declare function askPipelineFastBrain(workingDir: string, sessionId: string, question: string, opts?: PipelineFastBrainOptions): Promise<PipelineFastBrainResult>; // PipelineDirectLLM calls this once per user turn; sessionId may be the sentinel 'pending' when no id was assigned in time