npm - @teammates/cli - Versions diffs - 0.3.3 → 0.4.0 - Mend

@teammates/cli 0.3.3 → 0.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (10)

package/README.md +1 -1
package/dist/adapter.d.ts +12 -1
package/dist/adapter.js +127 -125
package/dist/adapter.test.js +74 -0
package/dist/adapters/cli-proxy.js +0 -11
package/dist/adapters/copilot.js +0 -11
package/dist/cli.js +84 -18
package/dist/types.d.ts +4 -0
package/package.json +7 -8
package/scripts/patch-copilot-sdk.cjs +30 -0

package/README.md CHANGED

@@ -129,7 +129,7 @@ The CLI uses a generic adapter interface to support any coding agent. Each adapt
 ### How Adapters Work
 1. The adapter queries the recall index for relevant memories (automatic, in-process)
-2. The orchestrator builds a full prompt (SOUL → WISDOM → recall results → daily logs → weekly summaries → session history → roster → task)
+2. The orchestrator builds a full prompt within a 32k token budget (SOUL → WISDOM → recall results → daily logs (budget-trimmed) → session state → roster → task)
 3. The prompt is written to a temp file
 4. The agent CLI is spawned with the prompt
 5. stdout/stderr are captured for result parsing

package/dist/adapter.d.ts CHANGED

@@ -70,14 +70,25 @@ export declare function syncRecallIndex(teammatesDir: string, teammate?: string)
 /**
  * Build the full prompt for a teammate session.
  * Includes identity, memory, roster, output protocol, and the task.
+ *
+ * Context budget (32k tokens):
+ * - Current daily log (today): always included, outside budget
+ * - Days 2-7: up to 24k tokens (whole entries)
+ * - Recall results: at least 8k tokens + unused daily log budget
+ *   (last entry may overflow by up to 4k tokens)
+ * - Weekly summaries: excluded (already indexed by recall)
+ *
+ * Identity, wisdom, roster, and protocol are never trimmed.
+ * The task prompt is never trimmed.
  */
 export declare function buildTeammatePrompt(teammate: TeammateConfig, taskPrompt: string, options?: {
     handoffContext?: string;
     roster?: RosterEntry[];
     services?: InstalledService[];
     sessionFile?: string;
-    sessionContent?: string;
     recallResults?: SearchResult[];
+    /** Token budget for the prompt wrapper (default 64k). Task is excluded. */
+    tokenBudget?: number;
 }): string;
 /**
  * Format a handoff envelope into a human-readable context string.

package/dist/adapter.js CHANGED

@@ -40,164 +40,166 @@ export async function syncRecallIndex(teammatesDir, teammate) {
         await indexer.syncAll();
     }
 }
+/**
+ * Default token budget for the prompt wrapper (everything except the task).
+ * ~64k tokens ≈ 256k chars at ~4 chars/token.
+ * The task prompt itself is excluded from this budget — if a user pastes
+ * a large input, that's intentional and we don't trim it.
+ */
+const DEFAULT_TOKEN_BUDGET = 64_000;
+const CHARS_PER_TOKEN = 4;
+/**
+ * Context budget allocation:
+ * - Days 2-7 get up to DAILY_LOG_BUDGET tokens (whole entries)
+ * - Recall gets at least RECALL_MIN_BUDGET, plus whatever daily logs didn't use
+ * - Last recall entry can push total up to CONTEXT_BUDGET + RECALL_OVERFLOW (36k)
+ * - Weekly summaries are excluded (already indexed by recall)
+ */
+const CONTEXT_BUDGET_TOKENS = 32_000;
+const DAILY_LOG_BUDGET_TOKENS = 24_000;
+const RECALL_MIN_BUDGET_TOKENS = 8_000;
+const RECALL_OVERFLOW_TOKENS = 4_000;
+/** Estimate tokens from character count. */
+function estimateTokens(text) {
+    return Math.ceil(text.length / CHARS_PER_TOKEN);
+}
 /**
  * Build the full prompt for a teammate session.
  * Includes identity, memory, roster, output protocol, and the task.
+ *
+ * Context budget (32k tokens):
+ * - Current daily log (today): always included, outside budget
+ * - Days 2-7: up to 24k tokens (whole entries)
+ * - Recall results: at least 8k tokens + unused daily log budget
+ *   (last entry may overflow by up to 4k tokens)
+ * - Weekly summaries: excluded (already indexed by recall)
+ *
+ * Identity, wisdom, roster, and protocol are never trimmed.
+ * The task prompt is never trimmed.
  */
 export function buildTeammatePrompt(teammate, taskPrompt, options) {
     const parts = [];
-    // ── Identity ──────────────────────────────────────────────────────
-    parts.push(`# You are ${teammate.name}\n`);
-    parts.push(teammate.soul);
-    parts.push("\n---\n");
-    // ── Wisdom ───────────────────────────────────────────────────────
+    // ── Identity (required) ─────────────────────────────────────────
+    parts.push(`# You are ${teammate.name}\n\n${teammate.soul}\n\n---\n`);
+    // ── Wisdom (required) ───────────────────────────────────────────
     if (teammate.wisdom.trim()) {
-        parts.push("## Your Wisdom\n");
-        parts.push(teammate.wisdom);
-        parts.push("\n---\n");
-    }
-    // ── Recall results (relevant episodic & semantic memories) ────────
-    if (options?.recallResults && options.recallResults.length > 0) {
-        parts.push("## Relevant Memories (from recall search)\n");
-        parts.push("These memories were retrieved based on relevance to the current task:\n");
-        for (const r of options.recallResults) {
+        parts.push(`## Your Wisdom\n\n${teammate.wisdom}\n\n---\n`);
+    }
+    // ── Budget-allocated context (daily logs → recall) ──────────────
+    // Today's log: always included, outside budget
+    // Days 2-7: up to 24k tokens (whole entries)
+    // Recall: at least 8k + unused daily budget, last entry may overflow by 4k
+    const todayLog = teammate.dailyLogs.slice(0, 1);
+    const pastLogs = teammate.dailyLogs.slice(1, 7); // days 2-7
+    let dailyBudget = DAILY_LOG_BUDGET_TOKENS;
+    // Current daily log (today) — never trimmed, always included
+    if (todayLog.length > 0) {
+        const todayLines = ["## Recent Daily Logs\n"];
+        for (const log of todayLog) {
+            todayLines.push(`### ${log.date}\n${log.content}\n`);
+        }
+        parts.push(todayLines.join("\n"));
+    }
+    // Days 2-7 — whole entries, up to 24k tokens
+    if (pastLogs.length > 0) {
+        const lines = [];
+        for (const log of pastLogs) {
+            const entry = `### ${log.date}\n${log.content}\n`;
+            const cost = estimateTokens(entry);
+            if (cost > dailyBudget)
+                break;
+            lines.push(entry);
+            dailyBudget -= cost;
+        }
+        if (lines.length > 0)
+            parts.push(lines.join("\n"));
+    }
+    // Recall results — gets at least 8k tokens, plus unused daily budget
+    // Last entry may overflow by up to 4k tokens
+    const recallBudget = Math.max(RECALL_MIN_BUDGET_TOKENS, RECALL_MIN_BUDGET_TOKENS + dailyBudget);
+    const recallResults = options?.recallResults ?? [];
+    if (recallResults.length > 0) {
+        const lines = [
+            "## Relevant Memories (from recall search)\n",
+            "These memories were retrieved based on relevance to the current task:\n",
+        ];
+        const headerCost = estimateTokens(lines.join("\n"));
+        let recallUsed = headerCost;
+        for (const r of recallResults) {
             const label = r.contentType
                 ? `[${r.contentType}] ${r.uri}`
                 : r.uri;
-            parts.push(`### ${label}\n${r.text}\n`);
+            const entry = `### ${label}\n${r.text}\n`;
+            const cost = estimateTokens(entry);
+            if (recallUsed + cost > recallBudget + RECALL_OVERFLOW_TOKENS)
+                break;
+            lines.push(entry);
+            recallUsed += cost;
+            // Stop cleanly at budget — but allow the current entry (overflow grace)
+            if (recallUsed >= recallBudget)
+                break;
         }
-        parts.push("\n---\n");
-    }
-    // ── Recent daily logs ──────────────────────────────────────────────
-    if (teammate.dailyLogs.length > 0) {
-        parts.push("## Recent Daily Logs\n");
-        for (const log of teammate.dailyLogs.slice(0, 7)) {
-            parts.push(`### ${log.date}\n${log.content}\n`);
+        if (lines.length > 2) {
+            lines.push("\n---\n");
+            parts.push(lines.join("\n"));
         }
-        parts.push("\n---\n");
     }
-    // ── Weekly summaries (recent episodic context) ─────────────────────
-    if (teammate.weeklyLogs.length > 0) {
-        parts.push("## Recent Weekly Summaries\n");
-        for (const log of teammate.weeklyLogs.slice(0, 2)) {
-            parts.push(`### ${log.week}\n${log.content}\n`);
+    // Close context section with separator if needed
+    if (todayLog.length > 0 || pastLogs.length > 0) {
+        const lastPart = parts[parts.length - 1];
+        if (!lastPart.endsWith("---\n")) {
+            parts.push("\n---\n");
         }
-        parts.push("\n---\n");
-    }
-    // ── Session history (prior tasks in this session) ─────────────────
-    if (options?.sessionContent?.trim()) {
-        parts.push("## Session History\n");
-        parts.push("These are entries from your prior tasks in this session:\n");
-        parts.push(options.sessionContent);
-        parts.push("\n---\n");
     }
-    // ── Team roster ───────────────────────────────────────────────────
+    // ── Team roster (required, small) ───────────────────────────────
     if (options?.roster && options.roster.length > 0) {
-        parts.push("## Your Team\n");
-        parts.push("These are the other teammates you can hand off work to:\n");
+        const lines = [
+            "## Your Team\n",
+            "These are the other teammates you can hand off work to:\n",
+        ];
         for (const t of options.roster) {
             if (t.name === teammate.name)
                 continue;
             const owns = t.ownership.primary.length > 0
                 ? ` — owns: ${t.ownership.primary.join(", ")}`
                 : "";
-            parts.push(`- **@${t.name}**: ${t.role}${owns}`);
+            lines.push(`- **@${t.name}**: ${t.role}${owns}`);
         }
-        parts.push("\n---\n");
+        lines.push("\n---\n");
+        parts.push(lines.join("\n"));
     }
-    // ── Installed services ──────────────────────────────────────────────
+    // ── Installed services (required, small) ────────────────────────
     if (options?.services && options.services.length > 0) {
-        parts.push("## Available Services\n");
-        parts.push("These services are installed and available for you to use:\n");
+        const lines = [
+            "## Available Services\n",
+            "These services are installed and available for you to use:\n",
+        ];
         for (const svc of options.services) {
-            parts.push(`### ${svc.name}\n`);
-            parts.push(svc.description);
-            parts.push(`\n**Usage:** \`${svc.usage}\`\n`);
+            lines.push(`### ${svc.name}\n`);
+            lines.push(svc.description);
+            lines.push(`\n**Usage:** \`${svc.usage}\`\n`);
         }
-        parts.push("\n---\n");
+        lines.push("\n---\n");
+        parts.push(lines.join("\n"));
     }
-    // ── Handoff context (if this task came from another teammate) ─────
+    // ── Handoff context (required when present) ─────────────────────
     if (options?.handoffContext) {
-        parts.push("## Handoff Context\n");
-        parts.push(options.handoffContext);
-        parts.push("\n---\n");
+        parts.push(`## Handoff Context\n\n${options.handoffContext}\n\n---\n`);
     }
-    // ── Session state ────────────────────────────────────────────────
+    // ── Session state (required) ────────────────────────────────────
     if (options?.sessionFile) {
-        parts.push("## Session State\n");
-        parts.push(`Your session file is at: \`${options.sessionFile}\`
-**Before returning your result**, append a brief entry to this file with:
-- What you did
-- Key decisions made
-- Files changed
-- Anything the next task should know
-This is how you maintain continuity across tasks. Always read it, always update it.
-`);
-        parts.push("\n---\n");
-    }
-    // ── Memory updates ─────────────────────────────────────────────────
+        parts.push(`## Session State\n\nYour session file is at: \`${options.sessionFile}\`\n\n**Before returning your result**, append a brief entry to this file with:\n- What you did\n- Key decisions made\n- Files changed\n- Anything the next task should know\n\nThis is how you maintain continuity across tasks. Always read it, always update it.\n\n---\n`);
+    }
+    // ── Memory updates (required) ───────────────────────────────────
     const today = new Date().toISOString().slice(0, 10);
-    parts.push("## Memory Updates\n");
-    parts.push(`**Before returning your result**, update your memory files:
-1. **Daily log** — Read \`.teammates/${teammate.name}/memory/${today}.md\` first (it may have entries from earlier tasks today), then write it back with your entry added. Create the file if it doesn't exist.
-   - What you did
-   - Key decisions made
-   - Files changed
-   - Anything the next task should know
-2. **Typed memories** — If you learned something durable (a decision, pattern, feedback, or reference), create a typed memory file at \`.teammates/${teammate.name}/memory/<type>_<topic>.md\` with frontmatter (\`name\`, \`description\`, \`type\`). Update existing memory files if the topic already has one.
-3. **WISDOM.md** — Do not edit directly. Wisdom entries are distilled from typed memories during compaction.
-These files are your persistent memory. Without them, your next session starts from scratch.
-`);
-    parts.push("\n---\n");
-    // ── Output protocol ───────────────────────────────────────────────
-    parts.push("## Output Protocol (CRITICAL)\n");
-    parts.push(`**Your #1 job is to produce a visible text response.** Session updates and memory writes are secondary — they support continuity but are not the deliverable. The user sees ONLY your text output. If you update files but return no text, the user sees an empty message and your work is invisible.
-Format your response as:
-\`\`\`
-TO: user
-# <Subject line>
-<Body — full markdown response>
-\`\`\`
-**Handoffs:** To hand off work to a teammate, include a fenced handoff block anywhere in your response:
-\`\`\`
-\`\`\`handoff
-@<teammate>
-<task description — what you need them to do, with full context>
-\`\`\`
-\`\`\`
-**Rules:**
-- **You MUST end your turn with visible text output.** A turn that ends with only tool calls and no text is a failed turn.
-- The \`# Subject\` line is REQUIRED — it becomes the message title.
-- Always write a substantive body. Never return just the subject.
-- Use markdown: headings, lists, code blocks, bold, etc.
-- Do as much work as you can before handing off.
-- Only hand off to teammates listed in "Your Team" above.
-- The handoff block can appear anywhere in your response — it will be detected automatically.
-`);
-    parts.push("\n---\n");
-    // ── Current date/time ────────────────────────────────────────────
+    parts.push(`## Memory Updates\n\n**Before returning your result**, update your memory files:\n\n1. **Daily log** — Read \`.teammates/${teammate.name}/memory/${today}.md\` first (it may have entries from earlier tasks today), then write it back with your entry added. Create the file if it doesn't exist.\n   - What you did\n   - Key decisions made\n   - Files changed\n   - Anything the next task should know\n\n2. **Typed memories** — If you learned something durable (a decision, pattern, feedback, or reference), create a typed memory file at \`.teammates/${teammate.name}/memory/<type>_<topic>.md\` with frontmatter (\`name\`, \`description\`, \`type\`). Update existing memory files if the topic already has one.\n\n3. **WISDOM.md** — Do not edit directly. Wisdom entries are distilled from typed memories during compaction.\n\nThese files are your persistent memory. Without them, your next session starts from scratch.\n\n---\n`);
+    // ── Output protocol (required) ──────────────────────────────────
+    parts.push(`## Output Protocol (CRITICAL)\n\n**Your #1 job is to produce a visible text response.** Session updates and memory writes are secondary — they support continuity but are not the deliverable. The user sees ONLY your text output. If you update files but return no text, the user sees an empty message and your work is invisible.\n\nFormat your response as:\n\n\`\`\`\nTO: user\n# <Subject line>\n\n<Body — full markdown response>\n\`\`\`\n\n**Handoffs:** To hand off work to a teammate, include a fenced handoff block anywhere in your response:\n\n\`\`\`\n\`\`\`handoff\n@<teammate>\n<task description — what you need them to do, with full context>\n\`\`\`\n\`\`\`\n\n**Rules:**\n- **You MUST end your turn with visible text output.** A turn that ends with only tool calls and no text is a failed turn.\n- The \`# Subject\` line is REQUIRED — it becomes the message title.\n- Always write a substantive body. Never return just the subject.\n- Use markdown: headings, lists, code blocks, bold, etc.\n- Do as much work as you can before handing off.\n- Only hand off to teammates listed in "Your Team" above.\n- The handoff block can appear anywhere in your response — it will be detected automatically.\n\n---\n`);
+    // ── Current date/time (required, small) ─────────────────────────
     const now = new Date();
-    parts.push(`**Current date:** ${now.toLocaleDateString("en-US", { weekday: "long", year: "numeric", month: "long", day: "numeric" })} (${today})`);
-    parts.push(`**Current time:** ${now.toLocaleTimeString("en-US", { hour: "2-digit", minute: "2-digit" })}\n`);
-    parts.push("---\n");
-    // ── Task ──────────────────────────────────────────────────────────
-    parts.push("## Task\n");
-    parts.push(taskPrompt);
-    parts.push("\n---\n");
-    // ── Final reminder (last thing the agent reads) ─────────────────
-    parts.push("**REMINDER: After completing the task and updating session/memory files, you MUST produce a text response starting with `TO: user`. An empty response is a bug.**");
+    parts.push(`**Current date:** ${now.toLocaleDateString("en-US", { weekday: "long", year: "numeric", month: "long", day: "numeric" })} (${today})\n**Current time:** ${now.toLocaleTimeString("en-US", { hour: "2-digit", minute: "2-digit" })}\n\n---\n`);
+    // ── Task (always included, excluded from budget) ────────────────
+    parts.push(`## Task\n\n${taskPrompt}\n\n---\n\n**REMINDER: After completing the task and updating session/memory files, you MUST produce a text response starting with \`TO: user\`. An empty response is a bug.**`);
     return parts.join("\n");
 }
 /**

package/dist/adapter.test.js CHANGED

@@ -99,6 +99,80 @@ describe("buildTeammatePrompt", () => {
         expect(prompt).toContain("## Session State");
         expect(prompt).toContain("/tmp/beacon-session.md");
     });
+    it("drops daily logs that exceed the 24k daily budget", () => {
+        // Each log is ~50k chars = ~12.5k tokens. Only 1 fits in 24k daily budget.
+        const bigContent = "D".repeat(50_000);
+        const config = makeConfig({
+            dailyLogs: [
+                { date: "2026-03-18", content: "Today's log — never trimmed" },
+                { date: "2026-03-17", content: bigContent }, // day 2 — fits in 24k
+                { date: "2026-03-16", content: bigContent }, // day 3 — exceeds 24k, dropped
+            ],
+        });
+        const prompt = buildTeammatePrompt(config, "task");
+        // Today's log is always fully present (never trimmed)
+        expect(prompt).toContain("Today's log — never trimmed");
+        // Day 2 fits within 24k
+        expect(prompt).toContain("2026-03-17");
+        // Day 3 doesn't fit (12.5k + 12.5k > 24k)
+        expect(prompt).not.toContain("2026-03-16");
+    });
+    it("recall gets at least 8k tokens even when daily logs use full 24k", () => {
+        // Daily logs fill their 24k budget. Recall still gets its guaranteed 8k minimum.
+        const dailyContent = "D".repeat(90_000); // ~22.5k tokens — fits in 24k
+        const config = makeConfig({
+            dailyLogs: [
+                { date: "2026-03-18", content: "today" },
+                { date: "2026-03-17", content: dailyContent },
+            ],
+        });
+        const recallText = "R".repeat(20_000); // ~5k tokens — fits in 8k min
+        const prompt = buildTeammatePrompt(config, "task", {
+            recallResults: [
+                { teammate: "beacon", uri: "memory/decision_foo.md", text: recallText, score: 0.9, contentType: "typed_memory" },
+            ],
+        });
+        expect(prompt).toContain("2026-03-17");
+        expect(prompt).toContain("## Relevant Memories");
+    });
+    it("recall gets unused daily log budget", () => {
+        // Small daily logs leave most of 24k unused — recall gets the surplus.
+        const config = makeConfig({
+            dailyLogs: [
+                { date: "2026-03-18", content: "today" },
+                { date: "2026-03-17", content: "short day 2" }, // ~3 tokens
+            ],
+        });
+        // Large recall result — should fit because daily logs barely used any budget
+        const recallText = "R".repeat(80_000); // ~20k tokens — fits in (8k + ~24k unused)
+        const prompt = buildTeammatePrompt(config, "task", {
+            recallResults: [
+                { teammate: "beacon", uri: "memory/big.md", text: recallText, score: 0.9, contentType: "typed_memory" },
+            ],
+        });
+        expect(prompt).toContain("## Relevant Memories");
+        expect(prompt).toContain("memory/big.md");
+    });
+    it("weekly summaries are excluded (indexed by recall)", () => {
+        const config = makeConfig({
+            dailyLogs: [{ date: "2026-03-13", content: "short log" }],
+            weeklyLogs: [{ week: "2026-W11", content: "short summary" }],
+        });
+        const prompt = buildTeammatePrompt(config, "task");
+        expect(prompt).toContain("## Recent Daily Logs");
+        expect(prompt).not.toContain("## Recent Weekly Summaries");
+    });
+    it("excludes task prompt from budget calculation", () => {
+        // Large task prompt should not trigger trimming of wrapper sections
+        const bigTask = "x".repeat(100_000);
+        const config = makeConfig({
+            dailyLogs: [{ date: "2026-03-13", content: "small log" }],
+        });
+        const prompt = buildTeammatePrompt(config, bigTask);
+        // Daily logs should still be included despite the huge task
+        expect(prompt).toContain("## Recent Daily Logs");
+        expect(prompt).toContain("small log");
+    });
 });
 describe("formatHandoffContext", () => {
     it("formats basic handoff", () => {

package/dist/adapters/cli-proxy.js CHANGED

@@ -140,16 +140,6 @@ export class CliProxyAdapter {
         // If the teammate has no soul (e.g. the raw agent), skip identity/memory
         // wrapping but include handoff instructions so it can delegate to teammates
         const sessionFile = this.sessionFiles.get(teammate.name);
-        // Read session file content for injection into the prompt
-        let sessionContent;
-        if (sessionFile) {
-            try {
-                sessionContent = await readFile(sessionFile, "utf-8");
-            }
-            catch {
-                // Session file may not exist yet — that's fine
-            }
-        }
         let fullPrompt;
         if (teammate.soul) {
             // Query recall for relevant memories before building prompt
@@ -163,7 +153,6 @@ export class CliProxyAdapter {
                 roster: this.roster,
                 services: this.services,
                 sessionFile,
-                sessionContent,
                 recallResults: recall?.results,
             });
         }

package/dist/adapters/copilot.js CHANGED

@@ -59,16 +59,6 @@ export class CopilotAdapter {
     async executeTask(_sessionId, teammate, prompt) {
         await this.ensureClient(teammate.cwd);
         const sessionFile = this.sessionFiles.get(teammate.name);
-        // Read session file content for injection into the prompt
-        let sessionContent;
-        if (sessionFile) {
-            try {
-                sessionContent = await readFile(sessionFile, "utf-8");
-            }
-            catch {
-                // Session file may not exist yet — that's fine
-            }
-        }
         // Build the full teammate prompt (identity + memory + task)
         let fullPrompt;
         if (teammate.soul) {
@@ -83,7 +73,6 @@ export class CopilotAdapter {
                 roster: this.roster,
                 services: this.services,
                 sessionFile,
-                sessionContent,
                 recallResults: recall?.results,
             });
         }

package/dist/cli.js CHANGED

@@ -10,7 +10,6 @@
 import { exec as execCb, execSync, spawn } from "node:child_process";
 import { mkdirSync, readFileSync, writeFileSync } from "node:fs";
 import { mkdir, readdir, rm, stat, unlink } from "node:fs/promises";
-import { tmpdir } from "node:os";
 import { dirname, join, resolve } from "node:path";
 import { createInterface } from "node:readline";
 import { App, ChatView, concat, esc, Interview, pen, renderMarkdown, stripAnsi, } from "@teammates/consolonia";
@@ -39,24 +38,78 @@ class TeammatesREPL {
     lastResult = null;
     lastResults = new Map();
     conversationHistory = [];
+    /** Running summary of older conversation history maintained by the coding agent. */
+    conversationSummary = "";
     storeResult(result) {
         this.lastResult = result;
         this.lastResults.set(result.teammate, result);
         this.conversationHistory.push({
             role: result.teammate,
-            text: result.rawOutput ?? result.summary,
+            text: result.summary,
         });
     }
+    /** Token budget for recent conversation history (24k tokens ≈ 96k chars). */
+    static CONV_HISTORY_CHARS = 24_000 * 4;
     buildConversationContext() {
-        if (this.conversationHistory.length === 0)
+        if (this.conversationHistory.length === 0 && !this.conversationSummary)
             return "";
-        // Keep last 10 exchanges to avoid blowing up prompt size
-        const recent = this.conversationHistory.slice(-10);
-        const lines = ["## Conversation History\n"];
-        for (const entry of recent) {
-            lines.push(`**${entry.role}:** ${entry.text}\n`);
+        const budget = TeammatesREPL.CONV_HISTORY_CHARS;
+        const parts = ["## Conversation History\n"];
+        // Include running summary of older conversation if present
+        if (this.conversationSummary) {
+            parts.push(`### Previous Conversation Summary\n\n${this.conversationSummary}\n`);
+        }
+        // Work backwards from newest — include whole entries up to 24k tokens
+        const entries = [];
+        let used = 0;
+        for (let i = this.conversationHistory.length - 1; i >= 0; i--) {
+            const line = `**${this.conversationHistory[i].role}:** ${this.conversationHistory[i].text}\n`;
+            if (used + line.length > budget && entries.length > 0)
+                break;
+            entries.unshift(line);
+            used += line.length;
         }
-        return lines.join("\n");
+        if (entries.length > 0)
+            parts.push(entries.join("\n"));
+        return parts.join("\n");
+    }
+    /**
+     * Check if conversation history exceeds the 24k token budget.
+     * If so, take the older entries that won't fit, combine with existing summary,
+     * and queue a summarization task to the coding agent.
+     */
+    maybeQueueSummarization() {
+        const budget = TeammatesREPL.CONV_HISTORY_CHARS;
+        // Calculate how many recent entries fit in the budget (newest first)
+        let recentChars = 0;
+        let splitIdx = this.conversationHistory.length;
+        for (let i = this.conversationHistory.length - 1; i >= 0; i--) {
+            const line = `**${this.conversationHistory[i].role}:** ${this.conversationHistory[i].text}\n`;
+            if (recentChars + line.length > budget)
+                break;
+            recentChars += line.length;
+            splitIdx = i;
+        }
+        if (splitIdx === 0)
+            return; // everything fits — nothing to summarize
+        // Collect entries that are being pushed out
+        const toSummarize = this.conversationHistory.slice(0, splitIdx);
+        const entriesText = toSummarize
+            .map((e) => `**${e.role}:** ${e.text}`)
+            .join("\n");
+        // Build the summarization prompt
+        const prompt = this.conversationSummary
+            ? `You are maintaining a running summary of an ongoing conversation between a user and their AI teammates. Update the existing summary to incorporate the new conversation entries below.\n\n## Current Summary\n\n${this.conversationSummary}\n\n## New Entries to Incorporate\n\n${entriesText}\n\n## Instructions\n\nReturn ONLY the updated summary — no preamble, no explanation. The summary should:\n- Be a concise bulleted list of key topics discussed, decisions made, and work completed\n- Preserve important context that future messages might reference\n- Drop trivial or redundant details\n- Stay under 2000 characters\n- Do NOT include any output protocol (no TO:, no # Subject, no handoff blocks)`
+            : `You are maintaining a running summary of an ongoing conversation between a user and their AI teammates. Summarize the conversation entries below.\n\n## Entries to Summarize\n\n${entriesText}\n\n## Instructions\n\nReturn ONLY the summary — no preamble, no explanation. The summary should:\n- Be a concise bulleted list of key topics discussed, decisions made, and work completed\n- Preserve important context that future messages might reference\n- Drop trivial or redundant details\n- Stay under 2000 characters\n- Do NOT include any output protocol (no TO:, no # Subject, no handoff blocks)`;
+        // Remove the summarized entries — they'll be captured in the summary
+        this.conversationHistory.splice(0, splitIdx);
+        // Queue the summarization task to the base coding agent
+        this.taskQueue.push({
+            type: "summarize",
+            teammate: this.adapterName,
+            task: prompt,
+        });
+        this.kickDrain();
     }
     adapterName;
     teammatesDir;
@@ -2471,6 +2524,10 @@ Do NOT modify any other teammate's files. Only edit your own SOUL.md and daily l
                 if (this.activeTasks.size === 0) {
                     this.stopStatusAnimation();
                 }
+                // Suppress display for internal summarization tasks
+                const activeEntry = this.agentActive.get(event.result.teammate);
+                if (activeEntry?.type === "summarize")
+                    break;
                 if (!this.chatView)
                     this.input.deactivateAndErase();
                 const raw = event.result.rawOutput ?? "";
@@ -2486,15 +2543,7 @@ Do NOT modify any other teammate's files. Only edit your own SOUL.md and daily l
                 const subject = event.result.summary || "Task completed";
                 this.feedLine(concat(tp.accent(`${event.result.teammate}: `), tp.text(subject)));
                 this.lastCleanedOutput = cleaned;
-                if (sizeKB > 5) {
-                    const tmpFile = join(tmpdir(), `teammates-${event.result.teammate}-${Date.now()}.md`);
-                    writeFileSync(tmpFile, cleaned, "utf-8");
-                    this.feedLine(tp.muted(`  ${"─".repeat(40)}`));
-                    this.feedLine(tp.warning(`  ⚠ Response is ${sizeKB.toFixed(1)}KB — saved to temp file:`));
-                    this.feedLine(tp.muted(`  ${tmpFile}`));
-                    this.feedLine(tp.muted(`  ${"─".repeat(40)}`));
-                }
-                else if (cleaned) {
+                if (cleaned) {
                     this.feedMarkdown(cleaned);
                 }
                 else {
@@ -2719,6 +2768,20 @@ Do NOT modify any other teammate's files. Only edit your own SOUL.md and daily l
                 if (entry.type === "compact") {
                     await this.runCompact(entry.teammate);
                 }
+                else if (entry.type === "summarize") {
+                    // Internal housekeeping — summarize older conversation history
+                    const result = await this.orchestrator.assign({
+                        teammate: entry.teammate,
+                        task: entry.task,
+                    });
+                    // Extract the summary from the agent's output (strip protocol artifacts)
+                    const raw = result.rawOutput ?? "";
+                    this.conversationSummary = raw
+                        .replace(/^TO:\s*\S+\s*\n/im, "")
+                        .replace(/^#\s+.+\n*/m, "")
+                        .replace(/```json\s*\n\s*\{[\s\S]*?\}\s*\n\s*```\s*$/g, "")
+                        .trim();
+                }
                 else {
                     // btw and debug tasks skip conversation context (not part of main thread)
                     const extraContext = entry.type === "btw" || entry.type === "debug"
@@ -2736,6 +2799,8 @@ Do NOT modify any other teammate's files. Only edit your own SOUL.md and daily l
                     // btw and debug results are not stored in conversation history
                     if (entry.type !== "btw" && entry.type !== "debug") {
                         this.storeResult(result);
+                        // Check if older history needs summarizing
+                        this.maybeQueueSummarization();
                     }
                     if (entry.type === "retro") {
                         this.handleRetroResult(result);
@@ -2920,6 +2985,7 @@ Do NOT modify any other teammate's files. Only edit your own SOUL.md and daily l
     }
     async cmdClear() {
         this.conversationHistory.length = 0;
+        this.conversationSummary = "";
         this.lastResult = null;
         this.lastResults.clear();
         this.taskQueue.length = 0;

package/dist/types.d.ts CHANGED Viewed

@@ -124,6 +124,10 @@ export type QueueEntry = {
     type: "debug";
     teammate: string;
     task: string;
+} | {
+    type: "summarize";
+    teammate: string;
+    task: string;
 };
 /** A registered slash command. */
 export interface SlashCommand {

package/package.json CHANGED Viewed

@@ -1,13 +1,14 @@
 {
   "name": "@teammates/cli",
-  "version": "0.3.3",
+  "version": "0.4.0",
   "description": "Agent-agnostic CLI for teammates. Routes tasks, manages handoffs, and plugs into any coding agent backend.",
   "type": "module",
   "main": "dist/index.js",
   "types": "dist/index.d.ts",
   "files": [
     "dist",
-    "template"
+    "template",
+    "scripts"
   ],
   "bin": {
     "teammates": "dist/cli.js"
@@ -18,7 +19,8 @@
     "test": "vitest run",
     "test:coverage": "vitest run --coverage",
     "test:watch": "vitest",
-    "typecheck": "tsc --noEmit"
+    "typecheck": "tsc --noEmit",
+    "postinstall": "node scripts/patch-copilot-sdk.cjs"
   },
   "keywords": [
     "teammates",
@@ -31,8 +33,8 @@
   "license": "MIT",
   "dependencies": {
     "@github/copilot-sdk": "^0.1.32",
-    "@teammates/consolonia": "0.3.3",
-    "@teammates/recall": "0.3.3",
+    "@teammates/consolonia": "0.4.0",
+    "@teammates/recall": "0.4.0",
     "chalk": "^5.6.2",
     "ora": "^9.3.0"
   },
@@ -42,9 +44,6 @@
     "typescript": "^5.5.0",
     "vitest": "^4.1.0"
   },
-  "overrides": {
-    "vscode-jsonrpc": "9.0.0-next.11"
-  },
   "engines": {
     "node": ">=20.0.0"
   }

package/scripts/patch-copilot-sdk.cjs ADDED Viewed

@@ -0,0 +1,30 @@
+// Patches @github/copilot-sdk to fix ESM subpath import for vscode-jsonrpc.
+// The SDK imports "vscode-jsonrpc/node" but vscode-jsonrpc@8.x has no exports
+// map, so Node's ESM resolver fails. This adds the ".js" extension.
+// Remove this patch once copilot-sdk ships a fix upstream.
+const fs = require("fs");
+const path = require("path");
+const target = path.join(
+  __dirname,
+  "..",
+  "node_modules",
+  "@github",
+  "copilot-sdk",
+  "dist",
+  "session.js"
+);
+if (!fs.existsSync(target)) {
+  // copilot-sdk not installed yet (e.g. during workspace linking) — skip
+  process.exit(0);
+}
+let src = fs.readFileSync(target, "utf8");
+if (src.includes('vscode-jsonrpc/node"') && !src.includes('vscode-jsonrpc/node.js"')) {
+  src = src.replace(/vscode-jsonrpc\/node"/g, 'vscode-jsonrpc/node.js"');
+  fs.writeFileSync(target, src, "utf8");
+  console.log("Patched @github/copilot-sdk: vscode-jsonrpc/node -> vscode-jsonrpc/node.js");
+}