npm - @tenex-chat/backend - Versions diffs - 0.9.4 → 0.9.6 - Mend

@tenex-chat/backend 0.9.4 → 0.9.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (148)

package/README.md +5 -1
package/dist/daemon-wrapper.cjs +47 -0
package/dist/index.js +59268 -0
package/dist/wrapper.js +171 -0
package/package.json +19 -27
package/src/agents/AgentRegistry.ts +9 -7
package/src/agents/AgentStorage.ts +24 -1
package/src/agents/agent-installer.ts +6 -0
package/src/agents/agent-loader.ts +7 -2
package/src/agents/constants.ts +10 -2
package/src/agents/execution/AgentExecutor.ts +35 -6
package/src/agents/execution/StreamCallbacks.ts +53 -13
package/src/agents/execution/StreamExecutionHandler.ts +110 -16
package/src/agents/execution/StreamSetup.ts +19 -9
package/src/agents/execution/ToolEventHandlers.ts +112 -0
package/src/agents/role-categories.ts +53 -0
package/src/agents/types/runtime.ts +7 -0
package/src/agents/types/storage.ts +7 -0
package/src/commands/agent/import/openclaw-distiller.ts +63 -7
package/src/commands/agent/import/openclaw-reader.ts +54 -0
package/src/commands/agent/import/openclaw.ts +120 -29
package/src/commands/agent/index.ts +83 -2
package/src/commands/setup/display.ts +123 -0
package/src/commands/setup/embed.ts +13 -13
package/src/commands/setup/global-system-prompt.ts +15 -17
package/src/commands/setup/image.ts +17 -20
package/src/commands/setup/interactive.ts +37 -20
package/src/commands/setup/llm.ts +12 -7
package/src/commands/setup/onboarding.ts +1580 -248
package/src/commands/setup/providers.ts +3 -3
package/src/conversations/ConversationStore.ts +23 -2
package/src/conversations/MessageBuilder.ts +51 -73
package/src/conversations/formatters/utils/conversation-transcript-formatter.ts +425 -0
package/src/conversations/search/embeddings/ConversationEmbeddingService.ts +40 -98
package/src/conversations/search/embeddings/ConversationIndexingJob.ts +40 -52
package/src/conversations/services/ConversationSummarizer.ts +1 -2
package/src/conversations/types.ts +11 -0
package/src/daemon/Daemon.ts +78 -57
package/src/daemon/ProjectRuntime.ts +6 -12
package/src/daemon/SubscriptionManager.ts +13 -0
package/src/daemon/index.ts +0 -1
package/src/event-handler/index.ts +1 -0
package/src/index.ts +20 -1
package/src/llm/ChunkHandler.ts +1 -1
package/src/llm/FinishHandler.ts +28 -4
package/src/llm/LLMConfigEditor.ts +218 -106
package/src/llm/index.ts +0 -4
package/src/llm/meta/MetaModelResolver.ts +3 -18
package/src/llm/middleware/message-sanitizer.ts +153 -0
package/src/llm/providers/ollama-models.ts +0 -38
package/src/llm/service.ts +50 -15
package/src/llm/types.ts +0 -12
package/src/llm/utils/ConfigurationManager.ts +88 -465
package/src/llm/utils/ConfigurationTester.ts +42 -185
package/src/llm/utils/ModelSelector.ts +156 -92
package/src/llm/utils/ProviderConfigUI.ts +10 -141
package/src/llm/utils/models-dev-cache.ts +102 -23
package/src/llm/utils/provider-select-prompt.ts +284 -0
package/src/llm/utils/provider-setup.ts +81 -34
package/src/llm/utils/variant-list-prompt.ts +361 -0
package/src/nostr/AgentEventDecoder.ts +1 -0
package/src/nostr/AgentEventEncoder.ts +37 -0
package/src/nostr/AgentProfilePublisher.ts +13 -0
package/src/nostr/AgentPublisher.ts +26 -0
package/src/nostr/kinds.ts +1 -0
package/src/nostr/ndkClient.ts +4 -1
package/src/nostr/types.ts +12 -0
package/src/prompts/fragments/25-rag-instructions.ts +22 -21
package/src/prompts/fragments/31-agents-md-guidance.ts +7 -21
package/src/prompts/fragments/index.ts +2 -0
package/src/prompts/utils/systemPromptBuilder.ts +18 -28
package/src/services/AgentDefinitionMonitor.ts +8 -0
package/src/services/ConfigService.ts +34 -0
package/src/services/PubkeyService.ts +7 -1
package/src/services/compression/CompressionService.ts +133 -74
package/src/services/compression/compression-utils.ts +110 -19
package/src/services/config/types.ts +0 -6
package/src/services/dispatch/AgentDispatchService.ts +79 -0
package/src/services/intervention/InterventionService.ts +78 -5
package/src/services/nip46/Nip46SigningService.ts +30 -1
package/src/services/projects/ProjectContext.ts +8 -6
package/src/services/rag/RAGCollectionRegistry.ts +199 -0
package/src/services/rag/RAGDatabaseService.ts +2 -7
package/src/services/rag/RAGOperations.ts +25 -45
package/src/services/rag/RAGService.ts +0 -31
package/src/services/rag/RagSubscriptionService.ts +71 -122
package/src/services/rag/rag-utils.ts +13 -0
package/src/services/ral/RALRegistry.ts +25 -184
package/src/services/reports/ReportEmbeddingService.ts +63 -113
package/src/services/search/UnifiedSearchService.ts +115 -4
package/src/services/search/index.ts +1 -0
package/src/services/search/projectFilter.ts +20 -4
package/src/services/search/providers/ConversationSearchProvider.ts +1 -0
package/src/services/search/providers/GenericCollectionSearchProvider.ts +81 -0
package/src/services/search/providers/LessonSearchProvider.ts +1 -8
package/src/services/search/providers/ReportSearchProvider.ts +1 -0
package/src/services/search/types.ts +24 -3
package/src/services/trust-pubkeys/SystemPubkeyListService.ts +148 -0
package/src/services/trust-pubkeys/TrustPubkeyService.ts +70 -9
package/src/telemetry/setup.ts +2 -13
package/src/tools/implementations/ask.ts +3 -3
package/src/tools/implementations/conversation_get.ts +28 -268
package/src/tools/implementations/fs_grep.ts +6 -6
package/src/tools/implementations/fs_read.ts +2 -0
package/src/tools/implementations/fs_write.ts +2 -0
package/src/tools/implementations/learn.ts +38 -50
package/src/tools/implementations/rag_add_documents.ts +6 -4
package/src/tools/implementations/rag_create_collection.ts +37 -4
package/src/tools/implementations/rag_delete_collection.ts +9 -0
package/src/tools/implementations/{search.ts → rag_search.ts} +31 -25
package/src/tools/registry.ts +7 -8
package/src/tools/types.ts +11 -2
package/src/tools/utils/transcript-args.ts +13 -0
package/src/utils/cli-theme.ts +13 -0
package/src/utils/logger.ts +55 -0
package/src/utils/metadataKeys.ts +17 -0
package/src/utils/sqlEscaping.ts +39 -0
package/src/wrapper.ts +7 -3
package/dist/src/index.js +0 -46778
package/dist/tenex-backend-wrapper.cjs +0 -3
package/src/agents/execution/constants.ts +0 -16
package/src/agents/execution/index.ts +0 -3
package/src/agents/index.ts +0 -4
package/src/commands/agent.ts +0 -215
package/src/conversations/formatters/DelegationXmlFormatter.ts +0 -64
package/src/conversations/formatters/index.ts +0 -9
package/src/conversations/index.ts +0 -2
package/src/conversations/utils/content-utils.ts +0 -69
package/src/daemon/UnixSocketTransport.ts +0 -318
package/src/event-handler/newConversation.ts +0 -165
package/src/events/NDKProjectStatus.ts +0 -384
package/src/events/index.ts +0 -4
package/src/lib/json-parser.ts +0 -30
package/src/llm/RecordingState.ts +0 -37
package/src/llm/StreamPublisher.ts +0 -40
package/src/llm/middleware/flight-recorder.ts +0 -188
package/src/llm/utils/claudeCodePromptCompiler.ts +0 -141
package/src/nostr/constants.ts +0 -38
package/src/prompts/core/index.ts +0 -3
package/src/prompts/index.ts +0 -21
package/src/services/image/index.ts +0 -12
package/src/services/status/index.ts +0 -11
package/src/telemetry/diagnostics.ts +0 -27
package/src/tools/implementations/rag_query.ts +0 -107
package/src/types/index.ts +0 -46
package/src/utils/agentFetcher.ts +0 -107
package/src/utils/conversation-utils.ts +0 -1
package/src/utils/process.ts +0 -49

package/src/prompts/fragments/25-rag-instructions.ts CHANGED Viewed

@@ -77,15 +77,16 @@ rag_add_documents({
 })
 \`\`\`
-### 3. rag_query
-Perform semantic search on a collection.
+### 3. rag_search
+Search across ALL project knowledge — reports, conversations, lessons, and any
+additional RAG collections — using natural language semantic search.
 \`\`\`typescript
-rag_query({
-  collection: "project_knowledge",
-  query_text: "How does authentication work?",
-  top_k: 5,  // Number of results (1-100)
-  include_metadata: true  // Include document metadata
+rag_search({
+  query: "How does authentication work?",
+  limit: 10,  // Maximum results (default: 10)
+  collections: ["reports", "lessons"],  // Optional: filter to specific collections
+  prompt: "Summarize the auth approach"  // Optional: LLM extraction
 })
 \`\`\`
@@ -143,7 +144,7 @@ All tools use standardized error responses:
 {
   "success": false,
   "error": "Descriptive error message",
-  "toolName": "rag_query"
+  "toolName": "rag_search"
 }
 \`\`\`
@@ -169,9 +170,9 @@ rag_add_documents({
 })
 // Later, retrieve relevant context
-rag_query({
-  collection: "agent_insights",
-  query_text: "What are the user's programming language preferences?"
+rag_search({
+  query: "What are the user's programming language preferences?",
+  collections: ["agent_insights"]
 })
 \`\`\`
@@ -192,9 +193,9 @@ rag_add_documents({
 })
 // Query for specific information
-rag_query({
-  collection: "project_docs",
-  query_text: "API authentication methods"
+rag_search({
+  query: "API authentication methods",
+  collections: ["project_docs"]
 })
 \`\`\`
@@ -222,9 +223,9 @@ rag_add_documents({
 })
 // Find related lessons semantically
-rag_query({
-  collection: "lessons",
-  query_text: "How to handle promise rejections"
+rag_search({
+  query: "How to handle promise rejections",
+  collections: ["lessons"]
 })
 \`\`\`
@@ -247,9 +248,9 @@ rag_add_documents({
   }]
 })
-rag_query({
-  collection: "code_patterns",
-  query_text: "authentication hook implementation"
+rag_search({
+  query: "authentication hook implementation",
+  collections: ["code_patterns"]
 })
 \`\`\`
@@ -273,7 +274,7 @@ Share collections between agents:
 \`\`\`typescript
 delegate({
   task: "Analyze the project documentation",
-  tools: ["rag_query"],
+  tools: ["rag_search"],
   context: "Use collection 'project_docs' for analysis"
 })
 \`\`\`

package/src/prompts/fragments/31-agents-md-guidance.ts CHANGED Viewed

@@ -57,27 +57,13 @@ export const agentsMdGuidanceFragment: PromptFragment<AgentsMdGuidanceArgs> = {
 - Deeper, more specific AGENTS.md files override general root instructions.
 ### Writing AGENTS.md Files
-When working in a directory that needs specific agent guidance:
-1. Create an AGENTS.md file in that directory.
-2. Focus on **executable commands** (test/build) and **strict conventions**.
-3. Do not duplicate generic info; focus on what is unique to this directory.
-### AGENTS.md Format
-\`\`\`markdown
-# Directory Context
-Specific architectural details or business logic for this directory.
-## Commands
-- Test: \`npm test path/to/dir\`
-- Lint: \`npm run lint:specific\`
-## Conventions
-- Code Style: Functional patterns preferred
-- Naming: CamelCase for files, PascalCase for classes
-## Related
-- [API Docs](./docs/api.md)
-\`\`\``);
+When creating or updating an AGENTS.md file:
+1. **Maximum 50 lines.** If it's longer, you're including too much. Cut aggressively.
+2. **No code examples.** Don't include correct/incorrect patterns, usage snippets, or testing templates. Just state the rule in plain English.
+3. **No boilerplate sections.** Don't add Anti-Patterns, Testing, Dependencies, or Related sections. Only include what's genuinely unique to this directory.
+4. **Don't repeat parent info.** Import patterns, naming conventions, layer rules — if it's in a parent directory's AGENTS.md, don't restate it.
+5. **List actual files.** Name the real files that exist, not idealized directory trees. Keep it to key files only, not every file.
+6. **State rules, not ideology.** "Tools delegate to services" is a rule. A 10-line example showing correct vs incorrect delegation is ideology.`);
         // If root AGENTS.md content is available and short, include it
         if (rootAgentsMdContent && rootAgentsMdContent.length < MAX_ROOT_CONTENT_LENGTH_FOR_SYSTEM_PROMPT) {

package/src/prompts/fragments/index.ts CHANGED Viewed

@@ -37,6 +37,7 @@ import { agentDirectedMonitoringFragment } from "./28-agent-directed-monitoring"
 import { ragCollectionsFragment } from "./29-rag-collections";
 import { worktreeContextFragment } from "./30-worktree-context";
 import { agentsMdGuidanceFragment } from "./31-agents-md-guidance";
+import { processMetricsFragment } from "./32-process-metrics";
 import { debugModeFragment } from "./debug-mode";
 import { delegationCompletionFragment } from "./delegation-completion";
@@ -85,6 +86,7 @@ export function registerAllFragments(): void {
     fragmentRegistry.register(ragCollectionsFragment);
     fragmentRegistry.register(worktreeContextFragment);
     fragmentRegistry.register(agentsMdGuidanceFragment);
+    fragmentRegistry.register(processMetricsFragment);
 }
 // Auto-register all fragments on import

package/src/prompts/utils/systemPromptBuilder.ts CHANGED Viewed

@@ -250,37 +250,24 @@ async function addCoreAgentFragments(
     // Add RAG collection attribution - shows agents their contributions to RAG collections
     // This uses the provenance tracking metadata (agent_pubkey) from document ingestion
-    //
-    // OPTIMIZATION: First check if any collections exist using lightweight check
-    // to avoid initializing embedding provider when RAG isn't used.
     try {
-        const { hasRagCollections, RAGService } = await import("@/services/rag/RAGService");
-        // Fast path: skip full initialization if no collections exist
-        // Note: hasRagCollections() returns false on errors and logs them internally
-        if (!(await hasRagCollections())) {
-            logger.debug("📊 Skipping RAG collection stats - no collections available");
-        } else {
-            // Collections exist - now we need full service for stats
-            const ragService = RAGService.getInstance();
-            const collections = await ragService.getAllCollectionStats(agent.pubkey);
-            // Only add the fragment if we have any collection data
-            if (collections.length > 0) {
-                builder.add("rag-collections", {
-                    agentPubkey: agent.pubkey,
-                    collections,
-                });
-                logger.debug("📊 Added RAG collection stats to system prompt", {
-                    agent: agent.name,
-                    collectionsWithContributions: collections.filter(c => c.agentDocCount > 0).length,
-                    totalCollections: collections.length,
-                });
-            }
+        const { RAGService } = await import("@/services/rag/RAGService");
+        const ragService = RAGService.getInstance();
+        const collections = await ragService.getAllCollectionStats(agent.pubkey);
+        if (collections.length > 0) {
+            builder.add("rag-collections", {
+                agentPubkey: agent.pubkey,
+                collections,
+            });
+            logger.debug("📊 Added RAG collection stats to system prompt", {
+                agent: agent.name,
+                collectionsWithContributions: collections.filter(c => c.agentDocCount > 0).length,
+                totalCollections: collections.length,
+            });
         }
     } catch (error) {
-        // RAG service might not be available - skip gracefully
-        logger.debug("Could not fetch RAG collection stats for prompt:", error);
+        logger.debug("Could not get RAG collection stats:", error);
     }
 }
@@ -654,6 +641,9 @@ async function buildMainSystemPrompt(options: BuildSystemPromptOptions): Promise
     // Add relay configuration context
     systemPromptBuilder.add("relay-configuration", {});
+    // Add process metrics (PID, uptime, CPU/memory usage)
+    systemPromptBuilder.add("process-metrics", {});
     // Add meta-project context (other projects this agent belongs to)
     // This gives agents cross-project awareness without overwhelming them
     systemPromptBuilder.add("meta-project-context", {

package/src/services/AgentDefinitionMonitor.ts CHANGED Viewed

@@ -1,6 +1,7 @@
 import type { StoredAgent } from "@/agents/AgentStorage";
 import { agentStorage } from "@/agents/AgentStorage";
 import { NDKAgentDefinition } from "@/events/NDKAgentDefinition";
+import { isValidCategory } from "@/agents/role-categories";
 import { logger } from "@/utils/logger";
 import type NDK from "@nostr-dev-kit/ndk";
 import type { NDKEvent, NDKFilter, NDKSubscription } from "@nostr-dev-kit/ndk";
@@ -545,6 +546,13 @@ export class AgentDefinitionMonitor {
             changedFields.push("role");
         }
+        const rawCategory = agentDef.category || undefined;
+        const newCategory = rawCategory && isValidCategory(rawCategory) ? rawCategory : undefined;
+        if (newCategory !== storedAgent.category) {
+            storedAgent.category = newCategory;
+            changedFields.push("category");
+        }
         const newDescription = agentDef.description || undefined;
         if (newDescription !== storedAgent.description) {
             storedAgent.description = newDescription;

package/src/services/ConfigService.ts CHANGED Viewed

@@ -367,6 +367,40 @@ export class ConfigService {
         return loadedConfig.llms.configurations[name];
     }
+    /**
+     * Get all resolved LLM configurations, skipping meta models.
+     * Returns the default config first, followed by the rest in declaration order.
+     */
+    getAllLLMConfigs(): LLMConfiguration[] {
+        if (!this.loadedConfig) {
+            throw new Error("Config not loaded. Call loadConfig() first.");
+        }
+        const llms = this.loadedConfig.llms;
+        const configs: LLMConfiguration[] = [];
+        const seen = new Set<string>();
+        // Default first
+        if (llms.default && llms.configurations[llms.default]) {
+            const config = llms.configurations[llms.default];
+            if (!isMetaModelConfiguration(config)) {
+                configs.push(config);
+                seen.add(`${config.provider}:${config.model}`);
+            }
+        }
+        // Then the rest, deduplicating by provider:model
+        for (const config of Object.values(llms.configurations)) {
+            if (isMetaModelConfiguration(config)) continue;
+            const key = `${config.provider}:${config.model}`;
+            if (seen.has(key)) continue;
+            seen.add(key);
+            configs.push(config);
+        }
+        return configs;
+    }
     /**
      * Check if a configuration name refers to a meta model.
      */

package/src/services/PubkeyService.ts CHANGED Viewed

@@ -85,7 +85,13 @@ export class PubkeyService {
      * Uses AgentRegistry's getAgentByPubkey for efficient O(1) lookup.
      */
     private getAgentSlug(pubkey: Hexpubkey): string | undefined {
-        const projectCtx = getProjectContext();
+        let projectCtx;
+        try {
+            projectCtx = getProjectContext();
+        } catch {
+            // Name resolution must remain available even outside a project-scoped context
+            return undefined;
+        }
         // Use direct pubkey lookup from AgentRegistry (O(1) instead of O(n))
         const agent = projectCtx.getAgentByPubkey(pubkey);

package/src/services/compression/CompressionService.ts CHANGED Viewed

@@ -2,6 +2,7 @@ import type { LLMService } from "@/llm/service";
 import { shortenConversationId } from "@/utils/conversation-id";
 import type { ConversationStore } from "@/conversations/ConversationStore";
 import type { ConversationEntry } from "@/conversations/types";
+import { renderConversationXml } from "@/conversations/formatters/utils/conversation-transcript-formatter";
 import { trace, SpanStatusCode, type Span } from "@opentelemetry/api";
 import { logger } from "@/utils/logger";
 import { config } from "@/services/ConfigService";
@@ -18,9 +19,52 @@ import {
   validateSegmentsForEntries,
   applySegmentsToEntries,
   createFallbackSegmentForEntries,
+  computeTokenAwareWindowSize,
 } from "./compression-utils.js";
 const tracer = trace.getTracer("tenex.compression");
+const CONTEXT_SEGMENT_LIMIT = 3;
+function buildContextPreamble(existingSegments: CompressionSegment[]): string {
+  if (existingSegments.length === 0) {
+    return "";
+  }
+  const recentSegments = existingSegments.slice(-CONTEXT_SEGMENT_LIMIT);
+  const contextLines = recentSegments.map(
+    (segment, index) => `[Previous context ${index + 1}]: ${segment.compressed}`
+  );
+  return `Previous conversation context (already compressed):\n${contextLines.join("\n")}\n\n`;
+}
+function buildCompressionPrompt(
+  transcriptXml: string,
+  firstShortId: string,
+  lastShortId: string,
+  existingSegments: CompressionSegment[]
+): string {
+  const contextPreamble = buildContextPreamble(existingSegments);
+  return `You are compressing conversation history represented as XML. Analyze the conversation and create 1-3 compressed segments that preserve key information while being concise.
+For each segment, provide:
+- fromEventId: starting message id from XML (the id attribute)
+- toEventId: ending message id from XML (the id attribute)
+- compressed: a concise summary (2-4 sentences) of the key points
+Rules:
+- Preserve attribution: who said or did what.
+- Preserve recipient targeting when present.
+- Preserve temporal flow using the time="+seconds" indicators and conversation t0.
+- Use IDs exactly as shown in XML id attributes (do not invent IDs).
+- The first segment must start at id "${firstShortId}" and the last segment must end at id "${lastShortId}".
+${contextPreamble}Messages to compress:
+${transcriptXml}
+Create segments that group related topics together. Preserve important decisions, errors, and outcomes.`;
+}
 /**
  * CompressionService - Orchestrates conversation history compression.
@@ -153,17 +197,57 @@ export class CompressionService {
               conversationId,
               entries,
               compressionConfig.slidingWindowSize,
-              span
+              span,
+              effectiveBudget
             );
           }
           span.setStatus({ code: SpanStatusCode.OK });
           return;
         }
+        // Compute range impact before attempting LLM call
+        const rangeEntries = entries.slice(range.startIndex, range.endIndex);
+        const rangeTokens = estimateTokensFromEntries(rangeEntries);
+        // Skip LLM when range can't meaningfully help
+        if (blocking) {
+          const tokenOverage = currentTokens - effectiveBudget;
+          if (rangeTokens < tokenOverage) {
+            // Even compressing the entire range to zero can't close the gap
+            span.addEvent("compression.skip_to_fallback", {
+              "reason": "range_too_small_for_overage",
+              "range.tokens": rangeTokens,
+              "token.overage": tokenOverage,
+            });
+            await this.useFallback(
+              conversationId,
+              entries,
+              compressionConfig.slidingWindowSize,
+              span,
+              effectiveBudget
+            );
+            span.setStatus({ code: SpanStatusCode.OK });
+            return;
+          }
+        } else {
+          // Proactive mode: skip if range is tiny (not worth an LLM call)
+          if (rangeTokens < 500) {
+            span.addEvent("compression.skip_proactive", {
+              "reason": "range_too_small",
+              "range.tokens": rangeTokens,
+            });
+            span.setStatus({ code: SpanStatusCode.OK });
+            return;
+          }
+        }
         // Attempt LLM compression
         try {
-          const rangeEntries = entries.slice(range.startIndex, range.endIndex);
-          const newSegments = await this.compressEntries(rangeEntries);
+          const newSegments = await this.compressEntries(
+            conversationId,
+            rangeEntries,
+            existingSegments
+          );
           // Emit telemetry for successful summary generation
           span.addEvent("compression.summary_generated", {
@@ -195,7 +279,8 @@ export class CompressionService {
                 conversationId,
                 entries,
                 compressionConfig.slidingWindowSize,
-                span
+                span,
+                effectiveBudget
               );
             }
             return;
@@ -239,7 +324,8 @@ export class CompressionService {
               conversationId,
               entries,
               compressionConfig.slidingWindowSize,
-              span
+              span,
+              effectiveBudget
             );
           } else {
             // Proactive mode: fail silently, don't throw
@@ -263,7 +349,9 @@ export class CompressionService {
    * Compress a range of entries using LLM.
    */
   private async compressEntries(
-    entries: ConversationEntry[]
+    conversationId: string,
+    entries: ConversationEntry[],
+    existingSegments: CompressionSegment[]
   ): Promise<CompressionSegment[]> {
     return tracer.startActiveSpan(
       "compression.llm_compress",
@@ -271,71 +359,30 @@ export class CompressionService {
         try {
           span.setAttribute("entries.count", entries.length);
-          // Format entries for LLM, including tool payloads
-          const formattedEntries = entries
-            .map((e) => {
-              let formatted = `[${e.messageType}]`;
-              // Add text content if present
-              if (e.content) {
-                formatted += ` ${e.content}`;
-              }
-              // Add tool payload summary for tool-call/tool-result entries
-              if (e.toolData && e.toolData.length > 0) {
-                const toolSummary = e.toolData
-                  .map((tool) => {
-                    if ('toolName' in tool) {
-                      // ToolCallPart
-                      return `Tool: ${tool.toolName}`;
-                    } else if ('toolCallId' in tool) {
-                      // ToolResultPart - cast to any to avoid type narrowing issues
-                      const toolResult = tool as any;
-                      const resultPreview = typeof toolResult.result === 'string'
-                        ? toolResult.result.substring(0, 100)
-                        : JSON.stringify(toolResult.result).substring(0, 100);
-                      return `Result: ${resultPreview}${resultPreview.length >= 100 ? '...' : ''}`;
-                    }
-                    return '';
-                  })
-                  .filter(Boolean)
-                  .join(', ');
-                if (toolSummary) {
-                  formatted += ` [${toolSummary}]`;
-                }
-              }
-              return formatted;
-            })
-            .join("\n\n");
-          const eventIds = entries
-            .filter((e) => e.eventId)
-            .map((e) => e.eventId!);
-          if (eventIds.length === 0) {
+          const {
+            xml: transcriptXml,
+            shortIdToEventId,
+            firstShortId,
+            lastShortId,
+          } = renderConversationXml(entries, { conversationId });
+          if (shortIdToEventId.size === 0 || !firstShortId || !lastShortId) {
             throw new Error("No eventIds found in entries to compress");
           }
+          const prompt = buildCompressionPrompt(
+            transcriptXml,
+            firstShortId,
+            lastShortId,
+            existingSegments
+          );
           // Call LLM to compress
           const result = await this.effectiveLlmService.generateObject(
             [
               {
                 role: "user",
-                content: `You are compressing conversation history. Analyze the following messages and create 1-3 compressed segments that preserve key information while being concise.
-For each segment, provide:
-- fromEventId: starting message event ID
-- toEventId: ending message event ID
-- compressed: a concise summary (2-4 sentences) of the key points
-Messages to compress:
-${formattedEntries}
-Event IDs in order: ${eventIds.join(", ")}
-Create segments that group related topics together. Preserve important decisions, errors, and outcomes.`,
+                content: prompt,
               },
             ],
             CompressionSegmentsSchema
@@ -343,13 +390,17 @@ Create segments that group related topics together. Preserve important decisions
           // Convert LLM output to CompressionSegment format
           const segments: CompressionSegment[] = result.object.map(
-            (seg: CompressionSegmentInput) => ({
-              fromEventId: seg.fromEventId,
-              toEventId: seg.toEventId,
-              compressed: seg.compressed,
-              createdAt: Date.now(),
-              model: this.effectiveLlmService.model,
-            })
+            (seg: CompressionSegmentInput) => {
+              const fromId = seg.fromEventId.trim();
+              const toId = seg.toEventId.trim();
+              return {
+                fromEventId: shortIdToEventId.get(fromId) ?? fromId,
+                toEventId: shortIdToEventId.get(toId) ?? toId,
+                compressed: seg.compressed,
+                createdAt: Date.now(),
+                model: this.effectiveLlmService.model,
+              };
+            }
           );
           span.setAttribute("segments.count", segments.length);
@@ -375,19 +426,27 @@ Create segments that group related topics together. Preserve important decisions
     conversationId: string,
     entries: ConversationEntry[],
     windowSize: number,
-    span: Span
+    span: Span,
+    tokenBudget: number
   ): Promise<void> {
+    const tokenAwareWindowSize = computeTokenAwareWindowSize(entries, tokenBudget);
+    const effectiveWindowSize = Math.min(windowSize, tokenAwareWindowSize);
     span.setAttribute("fallback.used", true);
-    span.setAttribute("fallback.window_size", windowSize);
+    span.setAttribute("fallback.configured_window", windowSize);
+    span.setAttribute("fallback.token_aware_window", tokenAwareWindowSize);
+    span.setAttribute("fallback.effective_window", effectiveWindowSize);
     logger.warn("Compression fallback triggered - using sliding window truncation", {
       conversationId,
       entriesCount: entries.length,
-      windowSize,
+      configuredWindow: windowSize,
+      tokenAwareWindow: tokenAwareWindowSize,
+      effectiveWindow: effectiveWindowSize,
     });
     // Delegate to pure utility function
-    const fallbackSegment = createFallbackSegmentForEntries(entries, windowSize);
+    const fallbackSegment = createFallbackSegmentForEntries(entries, effectiveWindowSize);
     if (!fallbackSegment) {
       // Can't create a valid segment (too few entries or insufficient event IDs)