npm - @tom2012/cc-web - Versions diffs - 1.5.111 → 1.5.113 - Mend

@tom2012/cc-web 1.5.111 → 1.5.113

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (37)

package/backend/dist/information/condenser.js (CHANGED)

@@ -1,7 +1,9 @@
 "use strict";
 // backend/src/information/condenser.ts
 //
-// Condense and reorganize conversations using Claude CLI (haiku).
+// Iterative condense and reorganize using Claude CLI (haiku).
+// Implements: half-window segmentation, cohesion tracking, context summary injection,
+// single-turn overflow handling, guard rails.
 var __createBinding = (this && this.__createBinding) || (Object.create ? (function(o, m, k, k2) {
     if (k2 === undefined) k2 = k;
     var desc = Object.getOwnPropertyDescriptor(m, k);
@@ -43,10 +45,14 @@ const path = __importStar(require("path"));
 const child_process_1 = require("child_process");
 const config_1 = require("../config");
 const conversation_sync_1 = require("./conversation-sync");
+// Haiku context: ~200K tokens. Half window for input, half for output.
+const HALF_WINDOW_TOKENS = 80000;
+// Keywords that mark uncondensable user turns
+const UNCONDENSABLE_RE = /不要|别|错了|改成|不是这样|必须|禁止|永远不要|以后请/;
 function estimateTokens(text) {
     return Math.ceil(text.length / 4);
 }
-/** Call Claude CLI in non-interactive mode with haiku. */
+// ── Claude CLI ──
 function callHaiku(prompt) {
     return new Promise((resolve, reject) => {
         (0, child_process_1.execFile)('claude', ['-p', prompt, '--model', 'haiku'], { timeout: 120000, maxBuffer: 8 * 1024 * 1024 }, (err, stdout) => {
@@ -56,15 +62,11 @@ function callHaiku(prompt) {
         });
     });
 }
-/** Extract JSON array from Haiku response (handles code fences, extra text). */
 function extractJsonArray(text) {
-    // Strip markdown code fences
     let cleaned = text.replace(/```json\s*/gi, '').replace(/```\s*/g, '');
-    // Try to find the JSON array
     const start = cleaned.indexOf('[');
     if (start === -1)
         throw new Error('No JSON array found');
-    // Find matching closing bracket
     let depth = 0;
     let end = -1;
     for (let i = start; i < cleaned.length; i++) {
@@ -79,71 +81,285 @@ function extractJsonArray(text) {
         }
     }
     if (end === -1) {
-        // Array was truncated — try to repair by closing it
-        cleaned = cleaned.slice(start) + ']';
-        // Remove any trailing incomplete object
-        cleaned = cleaned.replace(/,\s*\{[^}]*$/, ']');
+        cleaned = cleaned.slice(start);
+        cleaned = cleaned.replace(/,\s*\{[^}]*$/, '') + ']';
     }
     else {
         cleaned = cleaned.slice(start, end + 1);
     }
     return JSON.parse(cleaned);
 }
-/** Parse v0.md into turn sections. */
 function parseTurns(content) {
     const sections = content.split(/(?=^## [UA]\d+)/m).filter(Boolean);
     return sections.map(s => {
         const match = s.match(/^(## [UA]\d+.*)\n/);
         if (!match)
-            return { id: '', header: '', body: s };
-        return { id: match[1].replace(/^## /, '').split(/[\s\[]/)[0], header: match[1], body: s.slice(match[0].length).trim() };
-    }).filter(t => t.id);
+            return null;
+        const header = match[1];
+        const id = header.replace(/^## /, '').split(/[\s\[]/)[0];
+        const body = s.slice(match[0].length).trim();
+        const hasMarker = /\[c\d+/.test(header);
+        return { id, header, body, tokens: estimateTokens(body), condensed: hasMarker, cohesion: null };
+    }).filter(Boolean);
 }
-/** Build condensed content from turns with [cN,P%] markers. */
-function buildCondensedContent(originalTurns, condensedBodies, // turnId → condensed text (null = keep original)
-prevMarkers, // turnId → existing marker chain from previous version
-level) {
+function extractMarkerChain(header) {
+    const match = header.match(/\[(.+)\]\s*$/);
+    return match ? match[1] : '';
+}
+// ── Prompt building ──
+const CONDENSE_RULES = `你是一个对话缩减器。目标：大幅压缩对话，只保留对未来 LLM 行为有影响的信息。
+## 必须激进缩减为一句话的内容（这些占对话的 80%+）：
+- LLM 的工具调用和输出 → "执行了 X，结果：Y"
+- 构建/发布日志 → "构建成功" 或 "发布 vX.Y.Z"
+- 代码修改的详细描述 → "修改了 file.ts 的 funcName"
+- 文件内容展示 → "读取了 file.ts"
+- 搜索/grep 结果 → "搜索 X，找到 N 处"
+- LLM 的解释性文字（"让我检查一下""我来看看"等） → 删除
+- 重复的同类操作（多次发版、多次构建） → 只保留最后一次的结果
+## 必须保留原文的内容（condensed 设为 null）：
+- 用户纠正 LLM 的发言（"不对""错了""改成""不要"）
+- 用户表达需求或偏好（"我希望""请实现""以后请"）
+- 设计决策讨论（"为什么选 A 不选 B"）
+- 错误诊断（"报错 X，原因是 Y"）
+- 标记了 [已缩减] 的轮次
+## 不得违反：
+- 绝不改变语义方向（肯定↔否定）
+- 保留版本号、文件路径等标识符
+对每轮输出 JSON：
+[{"turn":"U1","condensed":"缩减内容或null","cohesion":0.8},...]
+cohesion: 与上一轮的话题相关性（0-1）`;
+function buildSegmentPrompt(turns, condensedUpTo, contextSummary) {
+    const parts = [CONDENSE_RULES, ''];
+    if (contextSummary) {
+        parts.push(`[前文摘要：${contextSummary}]`, '');
+    }
+    parts.push('对话：');
+    for (let i = 0; i < turns.length; i++) {
+        const t = turns[i];
+        if (i < condensedUpTo) {
+            // Already condensed in previous iteration — mark as [已缩减]
+            parts.push(`## ${t.id} [已缩减]`);
+            parts.push(t.body);
+        }
+        else {
+            parts.push(`## ${t.id}`);
+            parts.push(t.body);
+        }
+        parts.push('');
+    }
+    return parts.join('\n');
+}
+// ── Context summary generation ──
+function generateContextSummary(turns) {
+    // Take first sentence of each turn, max 5 turns
+    const summaryParts = [];
+    for (const t of turns.slice(0, 5)) {
+        const firstSentence = t.body.split(/[。！？\n]/)[0].slice(0, 40);
+        summaryParts.push(`${t.id}: ${firstSentence}`);
+    }
+    if (turns.length > 5)
+        summaryParts.push(`...共${turns.length}轮`);
+    return summaryParts.join('；');
+}
+// ── Select segment that fits in half window ──
+function selectSegment(turns, startIdx, halfWindow) {
+    let total = 0;
+    const promptOverhead = estimateTokens(CONDENSE_RULES) + 200; // rules + formatting
+    total += promptOverhead;
+    for (let i = startIdx; i < turns.length; i++) {
+        const turnCost = turns[i].tokens + 20; // header + formatting overhead
+        if (total + turnCost > halfWindow && i > startIdx) {
+            // Ensure we end on a complete U-A pair
+            let endIdx = i;
+            // If endIdx splits a U-A pair (ends on U without A), back up one
+            if (endIdx > startIdx && turns[endIdx - 1]?.id.startsWith('U')) {
+                endIdx--;
+            }
+            return { endIdx: Math.max(startIdx + 2, endIdx), totalTokens: total };
+        }
+        total += turnCost;
+    }
+    return { endIdx: turns.length, totalTokens: total };
+}
+// ── Find lowest cohesion cut point ──
+function findLowestCohesionCut(turns, startIdx, endIdx) {
+    let minCohesion = 2;
+    let cutIdx = Math.floor((startIdx + endIdx) / 2); // fallback: midpoint
+    for (let i = startIdx + 2; i < endIdx; i += 2) { // step by 2 to cut at U-A pair boundaries
+        const c = turns[i].cohesion;
+        if (c !== null && c < minCohesion) {
+            minCohesion = c;
+            cutIdx = i;
+        }
+    }
+    // If all cohesion > 0.8, use midpoint fallback
+    if (minCohesion > 0.8)
+        cutIdx = Math.floor((startIdx + endIdx) / 2);
+    return cutIdx;
+}
+// ── Pre-truncate oversized single turn ──
+function truncateTurn(turn, maxTokens) {
+    const headTokens = Math.floor(maxTokens * 0.7);
+    const tailTokens = Math.floor(maxTokens * 0.2);
+    const headChars = headTokens * 4;
+    const tailChars = tailTokens * 4;
+    const omitted = estimateTokens(turn.body) - maxTokens;
+    const truncatedBody = turn.body.slice(0, headChars) +
+        `\n\n[...省略约 ${omitted} tokens...]\n\n` +
+        turn.body.slice(-tailChars);
+    return { ...turn, body: truncatedBody, tokens: estimateTokens(truncatedBody) };
+}
+// ── Iterative condense ──
+// Strategy: slide a window through turns. Each window includes:
+//   1. Context prefix: last CONTEXT_OVERLAP condensed turns from previous window (marked [已缩减])
+//   2. New turns to condense (fills remaining window space)
+// Haiku sees the context to understand conversation flow, but only condenses new turns.
+const CONTEXT_OVERLAP = 6; // number of condensed turns to carry as context
+const BUDGET_FOR_CONTEXT = 8000; // max tokens for context prefix
+async function iterativeCondense(turns) {
+    const halfWindow = HALF_WINDOW_TOKENS;
+    const cohesionMap = {};
+    let condensedUpTo = 0;
+    // Pre-truncate any single turn larger than half window
+    for (let i = 0; i < turns.length; i++) {
+        if (turns[i].tokens > halfWindow * 0.8) {
+            turns[i] = truncateTurn(turns[i], Math.floor(halfWindow * 0.7));
+        }
+    }
+    console.log(`[condenser] starting iterative condense: ${turns.length} turns`);
+    while (condensedUpTo < turns.length) {
+        // 1. Build context prefix from last few condensed turns
+        let contextTurns = [];
+        let contextTokens = 0;
+        if (condensedUpTo > 0) {
+            const contextStart = Math.max(0, condensedUpTo - CONTEXT_OVERLAP);
+            for (let i = contextStart; i < condensedUpTo; i++) {
+                if (contextTokens + turns[i].tokens + 20 > BUDGET_FOR_CONTEXT)
+                    break;
+                contextTurns.push(turns[i]);
+                contextTokens += turns[i].tokens + 20;
+            }
+        }
+        // Also prepend a summary of everything before the context window
+        let contextSummary = '';
+        const contextStartIdx = condensedUpTo > CONTEXT_OVERLAP ? condensedUpTo - CONTEXT_OVERLAP : 0;
+        if (contextStartIdx > 0) {
+            contextSummary = generateContextSummary(turns.slice(0, contextStartIdx));
+        }
+        // 2. Fill remaining window with new turns
+        const availableForNew = halfWindow - contextTokens - estimateTokens(CONDENSE_RULES) - 500;
+        let newEnd = condensedUpTo;
+        let newTokens = 0;
+        while (newEnd < turns.length) {
+            const cost = turns[newEnd].tokens + 20;
+            if (newTokens + cost > availableForNew && newEnd > condensedUpTo)
+                break;
+            newTokens += cost;
+            newEnd++;
+        }
+        if (newEnd <= condensedUpTo)
+            break; // Stuck — no new turns fit
+        // 3. Build prompt: context (marked [已缩减]) + new turns (to condense)
+        const segmentTurns = [...contextTurns, ...turns.slice(condensedUpTo, newEnd)];
+        const prompt = buildSegmentPrompt(segmentTurns, contextTurns.length, contextSummary);
+        // 4. Call Haiku
+        const results = await callHaikuAndParse(prompt, turns, condensedUpTo, newEnd, condensedUpTo);
+        applyResults(turns, results, condensedUpTo, newEnd, cohesionMap);
+        console.log(`[condenser] iteration: turns ${condensedUpTo}-${newEnd} (context: ${contextTurns.length} turns), ${results.size} results from Haiku`);
+        condensedUpTo = newEnd;
+    }
+    console.log(`[condenser] done: ${condensedUpTo}/${turns.length} turns processed`);
+    return { condensedTurns: turns, cohesionMap };
+}
+async function callHaikuAndParse(prompt, allTurns, segStart, segEnd, condensedUpTo) {
+    let rawResult;
+    try {
+        rawResult = await callHaiku(prompt);
+    }
+    catch (err) {
+        // On failure, skip this segment (leave turns as-is)
+        console.error('[condenser] Haiku call failed:', err instanceof Error ? err.message : err);
+        return new Map();
+    }
+    let parsed;
+    try {
+        parsed = extractJsonArray(rawResult);
+    }
+    catch {
+        console.error('[condenser] JSON parse failed, skipping segment');
+        return new Map();
+    }
+    const resultMap = new Map();
+    for (const r of parsed) {
+        resultMap.set(r.turn, r);
+    }
+    return resultMap;
+}
+function applyResults(turns, results, condensedUpTo, segEnd, cohesionMap) {
+    for (let i = condensedUpTo; i < segEnd && i < turns.length; i++) {
+        const t = turns[i];
+        const r = results.get(t.id);
+        // Record cohesion
+        if (r?.cohesion !== undefined) {
+            t.cohesion = r.cohesion;
+            cohesionMap[t.id] = r.cohesion;
+        }
+        // Guard rail: protect uncondensable user turns
+        if (t.id.startsWith('U') && UNCONDENSABLE_RE.test(t.body)) {
+            t.condensed = true; // Mark as processed but keep original
+            continue;
+        }
+        // Guard rail: already condensed turns must not be re-condensed
+        if (t.condensed)
+            continue;
+        // Apply condensation
+        if (r && r.condensed !== null && r.condensed !== undefined) {
+            t.body = r.condensed;
+            t.tokens = estimateTokens(r.condensed);
+        }
+        t.condensed = true;
+    }
+}
+// ── Build final content with markers ──
+function buildFinalContent(originalTurns, // from v0.md (for token % calculation)
+condensedTurns, prevMarkers, level) {
     const lines = [];
-    for (const turn of originalTurns) {
-        const condensed = condensedBodies.get(turn.id);
-        const body = condensed ?? turn.body;
-        const origTokens = estimateTokens(turn.body);
-        const newTokens = estimateTokens(body);
+    for (let i = 0; i < condensedTurns.length; i++) {
+        const ct = condensedTurns[i];
+        const ot = originalTurns.find(t => t.id === ct.id);
+        const origTokens = ot ? ot.tokens : ct.tokens;
+        const newTokens = ct.tokens;
         let marker = '';
-        if (condensed !== null && condensed !== undefined) {
-            // This turn was condensed
-            const pct = origTokens > 0 ? Math.round(newTokens / origTokens * 100) : 100;
-            const prevChain = prevMarkers.get(turn.id) || '';
+        if (origTokens > 0 && newTokens < origTokens * 0.95) {
+            // Content was actually condensed (>5% reduction)
+            const pct = Math.round(newTokens / origTokens * 100);
+            const prevChain = prevMarkers.get(ct.id) || '';
             marker = prevChain ? ` [c${level},${pct}%;${prevChain}]` : ` [c${level},${pct}%]`;
         }
         else {
-            // Keep existing marker from previous version
-            const existing = prevMarkers.get(turn.id);
+            const existing = prevMarkers.get(ct.id);
             if (existing)
                 marker = ` [${existing}]`;
         }
-        lines.push(`## ${turn.id}${marker}`);
-        lines.push(body);
+        lines.push(`## ${ct.id}${marker}`);
+        lines.push(ct.body);
         lines.push('');
     }
     return lines.join('\n');
 }
-/** Extract existing [cN,P%] marker chain from a header. */
-function extractMarkerChain(header) {
-    const match = header.match(/\[(.+)\]\s*$/);
-    return match ? match[1] : '';
-}
-// ── Condense ──
+// ── Public: condenseConversation ──
 async function condenseConversation(convDir) {
     const meta = (0, conversation_sync_1.readMeta)(convDir);
     if (!meta)
         return null;
-    // Read the latest version as base
     const latestEntry = meta.versions[meta.latest];
     if (!latestEntry)
         return null;
     const baseContent = fs.readFileSync(path.join(convDir, latestEntry.file), 'utf-8');
-    // Read original for token comparison
     const v0Content = fs.readFileSync(path.join(convDir, 'v0.md'), 'utf-8');
     const originalTurns = parseTurns(v0Content);
     const baseTurns = parseTurns(baseContent);
@@ -154,62 +370,15 @@ async function condenseConversation(convDir) {
         if (chain)
             prevMarkers.set(t.id, chain);
     }
-    // Build prompt
-    const prompt = `你是一个对话缩减器。对以下对话的每一轮进行缩减。
-判断标准：如果未来的 LLM 只看到缩减后的版本，行为是否会与看到原文时不同？
-- 不同 → 保留原文
-- 相同 → 大幅缩减
-硬性规则：
-1. 用户纠正/否定行为的发言 → 必须保留原文
-2. 绝不改变语义方向（肯定↔否定）
-3. 保留所有数字、标识符、文件路径
-4. 构建/部署日志 → 一句话结果
-5. 确认性回复 → 保留原文
-对每轮输出 JSON 数组：
-[{"turn":"U1","condensed":"缩减后的内容或null表示保留原文"},...]
-对话（如果过长已截取最近部分）：
-${baseContent.length > 40000 ? '...[前文已省略]\n\n' + baseContent.slice(-40000) : baseContent}`;
-    let result;
-    try {
-        result = await callHaiku(prompt);
-    }
-    catch (err) {
-        throw new Error('Claude CLI 调用失败: ' + (err instanceof Error ? err.message : String(err)));
-    }
-    // Parse JSON from response (handles code fences, truncation)
-    let condensedArray;
-    try {
-        condensedArray = extractJsonArray(result);
-    }
-    catch (parseErr) {
-        throw new Error('无法解析 Haiku 返回的 JSON: ' + (parseErr instanceof Error ? parseErr.message : ''));
-    }
-    // Build condensed bodies map
-    const condensedBodies = new Map();
-    for (const item of condensedArray) {
-        condensedBodies.set(item.turn, item.condensed);
-    }
-    // Guard rail: protect uncondensable turns
-    for (const turn of originalTurns) {
-        if (turn.id.startsWith('U')) {
-            const body = turn.body.toLowerCase();
-            if (/不要|别|错了|改成|不是|必须|禁止/.test(body)) {
-                condensedBodies.set(turn.id, null); // Force keep original
-            }
-        }
-    }
-    // Determine next version number
-    const versionNumbers = Object.keys(meta.versions)
-        .map(v => parseInt(v.replace('v', '')))
-        .filter(n => !isNaN(n));
+    // Run iterative condense on base turns (deep copy bodies)
+    const workingTurns = baseTurns.map(t => ({ ...t, condensed: /\[c\d+/.test(t.header) }));
+    const { condensedTurns, cohesionMap } = await iterativeCondense(workingTurns);
+    // Determine next version
+    const versionNumbers = Object.keys(meta.versions).map(v => parseInt(v.replace('v', ''))).filter(n => !isNaN(n));
     const nextNum = Math.max(...versionNumbers) + 1;
     const nextVersion = `v${nextNum}`;
-    // Build condensed content
-    const condensedContent = buildCondensedContent(originalTurns, condensedBodies, prevMarkers, nextNum);
+    // Build final content with markers
+    const condensedContent = buildFinalContent(originalTurns, condensedTurns, prevMarkers, nextNum);
     const afterTokens = estimateTokens(condensedContent);
     const beforeTokens = latestEntry.tokens;
     // Write file
@@ -224,23 +393,24 @@ ${baseContent.length > 40000 ? '...[前文已省略]\n\n' + baseContent.slice(-4
         base: meta.latest,
     };
     meta.latest = nextVersion;
+    // Merge cohesion map
+    meta.cohesion_map = { ...meta.cohesion_map, ...cohesionMap };
     (0, conversation_sync_1.writeMeta)(convDir, meta);
     return { version: nextVersion, before_tokens: beforeTokens, after_tokens: afterTokens };
 }
-// ── Reorganize ──
+// ── Public: reorganizeConversation ──
 async function reorganizeConversation(convDir) {
     const meta = (0, conversation_sync_1.readMeta)(convDir);
     if (!meta)
         return null;
     if (meta.reorganize_count >= 2)
-        return null; // Max 2 reorganizations
-    // Classify turns by expand stats
+        return null;
     const byTurn = meta.expand_stats.by_turn;
+    const v0Content = fs.readFileSync(path.join(convDir, 'v0.md'), 'utf-8');
+    const originalTurns = parseTurns(v0Content);
     const highAttention = [];
     const lowAttention = [];
     const neverAccessed = [];
-    const v0Content = fs.readFileSync(path.join(convDir, 'v0.md'), 'utf-8');
-    const originalTurns = parseTurns(v0Content);
     for (const turn of originalTurns) {
         const count = byTurn[turn.id] || 0;
         if (count >= 3)
@@ -251,54 +421,112 @@ async function reorganizeConversation(convDir) {
             neverAccessed.push(turn.id);
     }
     if (highAttention.length === 0)
-        return null; // Nothing to reorganize
-    const prompt = `你是一个对话重整器。以下对话被缩减后，用户反复需要展开某些轮次。
-请从原始对话重新生成缩减版，调整策略：
-高关注轮次（保留更多细节）：${highAttention.join(', ')}
-低关注轮次（大幅缩减）：${lowAttention.join(', ')}
-从未访问的轮次（高度缩减为一句话）：${neverAccessed.join(', ')}
-硬性规则：
-1. 用户纠正/否定行为的发言 → 必须保留原文
-2. 绝不改变语义方向
-3. 保留所有数字、标识符、文件路径
-对每轮输出 JSON 数组：
-[{"turn":"U1","condensed":"缩减后的内容或null表示保留原文"},...]
-原始对话：
-${v0Content.length > 40000 ? '...[前文已省略]\n\n' + v0Content.slice(-40000) : v0Content}`;
-    let result;
-    try {
-        result = await callHaiku(prompt);
-    }
-    catch (err) {
-        throw new Error('Claude CLI 调用失败: ' + (err instanceof Error ? err.message : String(err)));
-    }
-    let condensedArray;
-    try {
-        condensedArray = extractJsonArray(result);
-    }
-    catch (parseErr) {
-        throw new Error('无法解析 Haiku 返回的 JSON: ' + (parseErr instanceof Error ? parseErr.message : ''));
-    }
-    const condensedBodies = new Map();
-    for (const item of condensedArray) {
-        condensedBodies.set(item.turn, item.condensed);
+        return null;
+    const workingTurns = originalTurns.map(t => ({ ...t, condensed: false }));
+    const highSet = new Set(highAttention);
+    const halfWindow = HALF_WINDOW_TOKENS;
+    let condensedUpTo = 0;
+    const cohesionMap = {};
+    // Pre-truncate oversized turns
+    for (let i = 0; i < workingTurns.length; i++) {
+        if (workingTurns[i].tokens > halfWindow * 0.8) {
+            workingTurns[i] = truncateTurn(workingTurns[i], Math.floor(halfWindow * 0.7));
+        }
     }
-    // Guard rail
-    for (const turn of originalTurns) {
-        if (turn.id.startsWith('U') && /不要|别|错了|改成|不是|必须|禁止/.test(turn.body.toLowerCase())) {
-            condensedBodies.set(turn.id, null);
+    // Iterative sliding window (same strategy as condense)
+    while (condensedUpTo < workingTurns.length) {
+        let contextTurns = [];
+        let contextTokens = 0;
+        if (condensedUpTo > 0) {
+            const ctxStart = Math.max(0, condensedUpTo - CONTEXT_OVERLAP);
+            for (let i = ctxStart; i < condensedUpTo; i++) {
+                if (contextTokens + workingTurns[i].tokens + 20 > BUDGET_FOR_CONTEXT)
+                    break;
+                contextTurns.push(workingTurns[i]);
+                contextTokens += workingTurns[i].tokens + 20;
+            }
+        }
+        let contextSummary = '';
+        const ctxStartIdx = condensedUpTo > CONTEXT_OVERLAP ? condensedUpTo - CONTEXT_OVERLAP : 0;
+        if (ctxStartIdx > 0)
+            contextSummary = generateContextSummary(workingTurns.slice(0, ctxStartIdx));
+        const reorgRulesTokens = 600; // approximate
+        const availableForNew = halfWindow - contextTokens - reorgRulesTokens - estimateTokens(CONDENSE_RULES);
+        let newEnd = condensedUpTo;
+        let newTokens = 0;
+        while (newEnd < workingTurns.length) {
+            const cost = workingTurns[newEnd].tokens + 20;
+            if (newTokens + cost > availableForNew && newEnd > condensedUpTo)
+                break;
+            newTokens += cost;
+            newEnd++;
+        }
+        if (newEnd <= condensedUpTo)
+            break;
+        // Build reorganize prompt with attention hints
+        const promptParts = [
+            `你是一个对话重整器。基于使用数据，激进缩减对话。`,
+            ``,
+            `高关注轮次（用户反复查看，保留更多细节）：${highAttention.join(', ')}`,
+            `低关注轮次（大幅缩减为一句话）：${lowAttention.join(', ')}`,
+            `从未访问的轮次（高度缩减为几个字）：${neverAccessed.join(', ')}`,
+            ``,
+            `## 必须激进缩减的内容：`,
+            `- 工具调用和输出 → "执行了 X，结果：Y"`,
+            `- 构建/发布日志 → "构建成功" 或 "发布 vX.Y.Z"`,
+            `- 代码修改描述 → "修改了 file.ts"`,
+            `- 文件内容展示 → "读取了 file.ts"`,
+            `- LLM 解释性文字（"让我检查""我来看看"） → 删除`,
+            ``,
+            `## 必须保留原文（condensed 设为 null）：`,
+            `- 高关注轮次中的用户需求和决策讨论`,
+            `- 用户纠正/否定（"不对""错了""改成"）`,
+            `- 标记了 [已缩减] 的轮次`,
+            ``,
+            `## 不得违反：绝不改变语义方向，保留版本号和文件路径`,
+            ``,
+            `对每轮输出 JSON：[{"turn":"U1","condensed":"缩减内容或null","cohesion":0.8},...]`,
+        ];
+        if (contextSummary)
+            promptParts.push(``, `[前文摘要：${contextSummary}]`);
+        promptParts.push(``, `对话：`);
+        for (const ct of contextTurns) {
+            promptParts.push(`## ${ct.id} [已缩减]`, ct.body, '');
+        }
+        for (let i = condensedUpTo; i < newEnd; i++) {
+            promptParts.push(`## ${workingTurns[i].id}`, workingTurns[i].body, '');
+        }
+        const results = await callHaikuAndParse(promptParts.join('\n'), workingTurns, condensedUpTo, newEnd, condensedUpTo);
+        for (let i = condensedUpTo; i < newEnd && i < workingTurns.length; i++) {
+            const t = workingTurns[i];
+            const r = results.get(t.id);
+            if (r?.cohesion !== undefined) {
+                t.cohesion = r.cohesion;
+                cohesionMap[t.id] = r.cohesion;
+            }
+            if (t.condensed)
+                continue;
+            if (t.id.startsWith('U') && UNCONDENSABLE_RE.test(t.body)) {
+                t.condensed = true;
+                continue;
+            }
+            if (highSet.has(t.id)) {
+                t.condensed = true;
+                continue;
+            }
+            if (r && r.condensed !== null && r.condensed !== undefined) {
+                t.body = r.condensed;
+                t.tokens = estimateTokens(r.condensed);
+            }
+            t.condensed = true;
         }
+        condensedUpTo = newEnd;
     }
-    const versionNumbers = Object.keys(meta.versions)
-        .map(v => parseInt(v.replace('v', '')))
-        .filter(n => !isNaN(n));
+    // Build final
+    const versionNumbers = Object.keys(meta.versions).map(v => parseInt(v.replace('v', ''))).filter(n => !isNaN(n));
     const nextNum = Math.max(...versionNumbers) + 1;
     const nextVersion = `v${nextNum}`;
-    const condensedContent = buildCondensedContent(originalTurns, condensedBodies, new Map(), nextNum);
+    const condensedContent = buildFinalContent(originalTurns, workingTurns, new Map(), nextNum);
     const afterTokens = estimateTokens(condensedContent);
     const latestEntry = meta.versions[meta.latest];
     const beforeTokens = latestEntry?.tokens ?? meta.original_tokens;
@@ -315,6 +543,7 @@ ${v0Content.length > 40000 ? '...[前文已省略]\n\n' + v0Content.slice(-40000
     meta.latest = nextVersion;
     meta.reorganize_count += 1;
     meta.last_reorganize_at = new Date().toISOString();
+    meta.cohesion_map = { ...meta.cohesion_map, ...cohesionMap };
     (0, conversation_sync_1.writeMeta)(convDir, meta);
     return { version: nextVersion, before_tokens: beforeTokens, after_tokens: afterTokens, high_attention_turns: highAttention };
 }