specmem-hardwicksoftware 3.7.32 → 3.7.33
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/bin/specmem-cli.cjs +18 -33
- package/bootstrap.cjs +5 -1
- package/claude-hooks/agent-loading-hook.js +31 -47
- package/claude-hooks/subagent-loading-hook.js +1 -1
- package/claude-hooks/team-comms-enforcer.cjs +112 -93
- package/dist/config/configSync.js +4 -1
- package/dist/index.js +44 -1
- package/dist/init/claudeConfigInjector.js +4 -1
- package/dist/installer/autoInstall.js +4 -1
- package/dist/mcp/compactionProxy.js +627 -72
- package/dist/mcp/compactionProxyDaemon.js +18 -4
- package/dist/mcp/specMemServer.js +8 -0
- package/dist/watcher/index.js +16 -2
- package/package.json +1 -1
- package/scripts/deploy-hooks.cjs +4 -1
- package/scripts/specmem-init.cjs +31 -35
- package/scripts/specmem-uninstall.cjs +4 -1
- package/specmem/model-config.json +3 -3
- package/specmem/supervisord.conf +1 -1
- package/svg-sections/readme-install.svg +89 -53
|
@@ -15,7 +15,7 @@
|
|
|
15
15
|
* @website https://justcalljon.pro
|
|
16
16
|
*/
|
|
17
17
|
|
|
18
|
-
import { createServer, get as httpGet } from 'http';
|
|
18
|
+
import { createServer, get as httpGet, request as httpRequest } from 'http';
|
|
19
19
|
import { request as httpsRequest } from 'https';
|
|
20
20
|
import { appendFileSync, writeFileSync, readFileSync, mkdirSync, existsSync, copyFileSync, unlinkSync } from 'fs';
|
|
21
21
|
import { createConnection } from 'net';
|
|
@@ -62,12 +62,54 @@ const OLD_STRIP_THRESHOLD = 100; // chars — only strip results bigger
|
|
|
62
62
|
const OLD_STRIP_PREVIEW_CHARS = 200; // chars — keep this much of the original
|
|
63
63
|
|
|
64
64
|
// Live neural MT compression config
|
|
65
|
-
const
|
|
65
|
+
const _TRANSLATE_SOCKET_FALLBACK = process.env.SPECMEM_TRANSLATE_SOCKET ||
|
|
66
66
|
join(process.env.SPECMEM_PROJECT_PATH || process.cwd(), 'specmem', 'run', 'translate.sock');
|
|
67
67
|
const PRESERVE_RECENT_MESSAGES = 3;
|
|
68
|
-
const MIN_TRANSLATE_LENGTH =
|
|
68
|
+
const MIN_TRANSLATE_LENGTH = 0; // No minimum — compress everything
|
|
69
69
|
const DONT_COMPRESS_FLAG = 'DONT_COMPRESS';
|
|
70
70
|
|
|
71
|
+
// ============================================================================
|
|
72
|
+
// Multi-Project Registry — tracks all registered projects for resource sharing
|
|
73
|
+
// ============================================================================
|
|
74
|
+
|
|
75
|
+
const projectRegistry = new Map(); // keyed by projectPath → { projectPath, pid, registeredAt, lastSeen }
|
|
76
|
+
|
|
77
|
+
// Auto-register the spawning project so daemon always has at least one
|
|
78
|
+
const _foundingProjectPath = process.env.SPECMEM_PROJECT_PATH || null;
|
|
79
|
+
if (_foundingProjectPath) {
|
|
80
|
+
projectRegistry.set(_foundingProjectPath, {
|
|
81
|
+
projectPath: _foundingProjectPath,
|
|
82
|
+
pid: process.ppid || 0,
|
|
83
|
+
registeredAt: Date.now(),
|
|
84
|
+
lastSeen: Date.now(),
|
|
85
|
+
});
|
|
86
|
+
}
|
|
87
|
+
|
|
88
|
+
/**
|
|
89
|
+
* Resolve translate socket dynamically across all registered projects.
|
|
90
|
+
* Iterates registry sorted by lastSeen desc, returns first socket that exists.
|
|
91
|
+
* Fallback: SPECMEM_TRANSLATE_SOCKET env var, then null.
|
|
92
|
+
*/
|
|
93
|
+
function resolveTranslateSocket() {
|
|
94
|
+
// Try registered projects, most recently seen first
|
|
95
|
+
const entries = [...projectRegistry.values()].sort((a, b) => b.lastSeen - a.lastSeen);
|
|
96
|
+
for (const entry of entries) {
|
|
97
|
+
const sockPath = join(entry.projectPath, 'specmem', 'run', 'translate.sock');
|
|
98
|
+
if (existsSync(sockPath)) return sockPath;
|
|
99
|
+
}
|
|
100
|
+
// Fallback to env var / founding project socket
|
|
101
|
+
if (existsSync(_TRANSLATE_SOCKET_FALLBACK)) return _TRANSLATE_SOCKET_FALLBACK;
|
|
102
|
+
return null;
|
|
103
|
+
}
|
|
104
|
+
|
|
105
|
+
/**
|
|
106
|
+
* Invalidate TM and synonym caches — called on registry changes.
|
|
107
|
+
*/
|
|
108
|
+
function _invalidateProjectCaches() {
|
|
109
|
+
_tmCache = null;
|
|
110
|
+
_synonyms = null;
|
|
111
|
+
}
|
|
112
|
+
|
|
71
113
|
// Preview ring buffer — stores last 5 compressed requests for TUI display
|
|
72
114
|
const PREVIEW_BUFFER_SIZE = 5;
|
|
73
115
|
const recentRequests = []; // { original, optimized, timestamp, type, savings }
|
|
@@ -160,6 +202,7 @@ let liveConfig = {
|
|
|
160
202
|
TRANSLATE_ENABLED: true, // toggle MT translation (requires translate.sock)
|
|
161
203
|
OLD_STRIP_ENABLED: true, // toggle old tool_result stripping
|
|
162
204
|
SYSTEM_PROMPT_COMPRESS: true, // toggle system prompt steno+translate compression
|
|
205
|
+
SYSTEM_REMINDER_STRIPPING: true, // toggle <system-reminder> stripping (keeps first, strips rest)
|
|
163
206
|
};
|
|
164
207
|
|
|
165
208
|
// Stats
|
|
@@ -171,6 +214,7 @@ const stats = {
|
|
|
171
214
|
tokensStripped: 0,
|
|
172
215
|
bytesStripped: 0,
|
|
173
216
|
liveCharsCompressed: 0,
|
|
217
|
+
systemRemindersStripped: 0,
|
|
174
218
|
liveBlocksCompressed: 0,
|
|
175
219
|
zhVerified: 0, // Chinese translations that passed loop-back verification
|
|
176
220
|
zhRejected: 0, // Chinese translations rejected (steno fallback)
|
|
@@ -200,18 +244,53 @@ const TM_MAX_ENTRIES = 10000;
|
|
|
200
244
|
let _tmCache = null; // { hash: { en, zh, sim, ts } }
|
|
201
245
|
let _synonyms = null; // { word: Set<synonym> } — learned from failed verifications
|
|
202
246
|
|
|
247
|
+
/**
|
|
248
|
+
* Get all TM file paths from registered projects.
|
|
249
|
+
*/
|
|
250
|
+
function _getAllTMPaths() {
|
|
251
|
+
const paths = [];
|
|
252
|
+
for (const entry of projectRegistry.values()) {
|
|
253
|
+
paths.push(join(entry.projectPath, 'specmem', 'run', 'translation-memory.json'));
|
|
254
|
+
}
|
|
255
|
+
// Always include founding project path as fallback
|
|
256
|
+
if (!paths.includes(TM_FILE)) paths.push(TM_FILE);
|
|
257
|
+
return paths;
|
|
258
|
+
}
|
|
259
|
+
|
|
260
|
+
/**
|
|
261
|
+
* Get all synonyms file paths from registered projects.
|
|
262
|
+
*/
|
|
263
|
+
function _getAllSynonymPaths() {
|
|
264
|
+
const paths = [];
|
|
265
|
+
for (const entry of projectRegistry.values()) {
|
|
266
|
+
paths.push(join(entry.projectPath, 'specmem', 'run', 'learned-synonyms.json'));
|
|
267
|
+
}
|
|
268
|
+
if (!paths.includes(SYNONYMS_FILE)) paths.push(SYNONYMS_FILE);
|
|
269
|
+
return paths;
|
|
270
|
+
}
|
|
271
|
+
|
|
203
272
|
function _tmHash(text) {
|
|
204
273
|
return createHash('md5').update(text.toLowerCase().trim()).digest('hex').slice(0, 16);
|
|
205
274
|
}
|
|
206
275
|
|
|
207
276
|
function _loadTM() {
|
|
208
277
|
if (_tmCache) return _tmCache;
|
|
209
|
-
|
|
210
|
-
|
|
211
|
-
|
|
212
|
-
|
|
213
|
-
|
|
214
|
-
|
|
278
|
+
_tmCache = {};
|
|
279
|
+
// Merge TM entries from all registered projects (later timestamp wins)
|
|
280
|
+
for (const tmPath of _getAllTMPaths()) {
|
|
281
|
+
try {
|
|
282
|
+
if (existsSync(tmPath)) {
|
|
283
|
+
const entries = JSON.parse(readFileSync(tmPath, 'utf8'));
|
|
284
|
+
if (entries && typeof entries === 'object') {
|
|
285
|
+
for (const [hash, entry] of Object.entries(entries)) {
|
|
286
|
+
if (!_tmCache[hash] || (entry.ts || 0) > (_tmCache[hash].ts || 0)) {
|
|
287
|
+
_tmCache[hash] = entry;
|
|
288
|
+
}
|
|
289
|
+
}
|
|
290
|
+
}
|
|
291
|
+
}
|
|
292
|
+
} catch { /* corrupt file, skip */ }
|
|
293
|
+
}
|
|
215
294
|
return _tmCache;
|
|
216
295
|
}
|
|
217
296
|
|
|
@@ -225,7 +304,14 @@ function _saveTM() {
|
|
|
225
304
|
const toRemove = sorted.slice(0, keys.length - TM_MAX_ENTRIES);
|
|
226
305
|
for (const k of toRemove) delete tm[k];
|
|
227
306
|
}
|
|
228
|
-
|
|
307
|
+
const data = JSON.stringify(tm);
|
|
308
|
+
// Fan-out write to ALL registered projects
|
|
309
|
+
for (const tmPath of _getAllTMPaths()) {
|
|
310
|
+
try {
|
|
311
|
+
mkdirSync(dirname(tmPath), { recursive: true });
|
|
312
|
+
writeFileSync(tmPath, data, 'utf8');
|
|
313
|
+
} catch { /* skip unreachable paths */ }
|
|
314
|
+
}
|
|
229
315
|
} catch (e) { log('warn', `TM save failed: ${e.message}`); }
|
|
230
316
|
}
|
|
231
317
|
|
|
@@ -253,29 +339,41 @@ let _tmSaveTimer = null;
|
|
|
253
339
|
// e.g., MT says "rebuild" but original had "refactor" — these are equivalent
|
|
254
340
|
function _loadSynonyms() {
|
|
255
341
|
if (_synonyms) return _synonyms;
|
|
256
|
-
|
|
257
|
-
|
|
258
|
-
|
|
342
|
+
_synonyms = {};
|
|
343
|
+
// Merge synonyms from all registered projects + package seed
|
|
344
|
+
const allPaths = [
|
|
345
|
+
..._getAllSynonymPaths(),
|
|
259
346
|
join(fileURLToPath(import.meta.url), '..', '..', '..', 'specmem', 'run', 'learned-synonyms.json'),
|
|
260
347
|
];
|
|
261
|
-
|
|
348
|
+
let loadedAny = false;
|
|
349
|
+
for (const synPath of allPaths) {
|
|
262
350
|
try {
|
|
263
351
|
if (existsSync(synPath)) {
|
|
264
352
|
const raw = JSON.parse(readFileSync(synPath, 'utf8'));
|
|
265
|
-
_synonyms = {};
|
|
266
353
|
for (const [word, syns] of Object.entries(raw)) {
|
|
267
|
-
_synonyms[word] = new Set(
|
|
268
|
-
|
|
269
|
-
|
|
270
|
-
if (synPath !== SYNONYMS_FILE && _synonyms && Object.keys(_synonyms).length > 0) {
|
|
271
|
-
try { mkdirSync(dirname(SYNONYMS_FILE), { recursive: true }); } catch {}
|
|
272
|
-
try { copyFileSync(synPath, SYNONYMS_FILE); } catch {}
|
|
354
|
+
if (!_synonyms[word]) _synonyms[word] = new Set();
|
|
355
|
+
const synList = Array.isArray(syns) ? syns : [...syns];
|
|
356
|
+
for (const s of synList) _synonyms[word].add(s);
|
|
273
357
|
}
|
|
274
|
-
|
|
358
|
+
loadedAny = true;
|
|
275
359
|
}
|
|
276
|
-
} catch { /*
|
|
360
|
+
} catch { /* skip corrupt */ }
|
|
361
|
+
}
|
|
362
|
+
// If loaded from package seed and no project files exist, seed all projects
|
|
363
|
+
if (loadedAny && Object.keys(_synonyms).length > 0) {
|
|
364
|
+
for (const synPath of _getAllSynonymPaths()) {
|
|
365
|
+
if (!existsSync(synPath)) {
|
|
366
|
+
try { mkdirSync(dirname(synPath), { recursive: true }); } catch {}
|
|
367
|
+
try {
|
|
368
|
+
const serializable = {};
|
|
369
|
+
for (const [word, set] of Object.entries(_synonyms)) {
|
|
370
|
+
serializable[word] = [...set];
|
|
371
|
+
}
|
|
372
|
+
writeFileSync(synPath, JSON.stringify(serializable), 'utf8');
|
|
373
|
+
} catch {}
|
|
374
|
+
}
|
|
375
|
+
}
|
|
277
376
|
}
|
|
278
|
-
if (!_synonyms) _synonyms = {};
|
|
279
377
|
return _synonyms;
|
|
280
378
|
}
|
|
281
379
|
|
|
@@ -286,7 +384,14 @@ function _saveSynonyms() {
|
|
|
286
384
|
for (const [word, set] of Object.entries(syns)) {
|
|
287
385
|
serializable[word] = [...set];
|
|
288
386
|
}
|
|
289
|
-
|
|
387
|
+
const data = JSON.stringify(serializable);
|
|
388
|
+
// Fan-out write to ALL registered projects
|
|
389
|
+
for (const synPath of _getAllSynonymPaths()) {
|
|
390
|
+
try {
|
|
391
|
+
mkdirSync(dirname(synPath), { recursive: true });
|
|
392
|
+
writeFileSync(synPath, data, 'utf8');
|
|
393
|
+
} catch { /* skip unreachable paths */ }
|
|
394
|
+
}
|
|
290
395
|
} catch (e) { log('warn', `Synonyms save failed: ${e.message}`); }
|
|
291
396
|
}
|
|
292
397
|
|
|
@@ -380,6 +485,23 @@ function isCompactionRequest(body) {
|
|
|
380
485
|
return false;
|
|
381
486
|
}
|
|
382
487
|
|
|
488
|
+
/**
|
|
489
|
+
* Smart-strip Edit tool_use inputs to just - / + diff lines.
|
|
490
|
+
* Returns compact string or null if not an Edit block.
|
|
491
|
+
*/
|
|
492
|
+
function smartStripEdit(input) {
|
|
493
|
+
if (!input || !input.file_path || !input.old_string) return null;
|
|
494
|
+
const lines = [`Edit(${input.file_path})`];
|
|
495
|
+
// old_string → removed lines (prefix with -)
|
|
496
|
+
for (const l of input.old_string.split('\n')) lines.push(`- ${l}`);
|
|
497
|
+
// new_string → added lines (prefix with +)
|
|
498
|
+
if (input.new_string != null) {
|
|
499
|
+
for (const l of input.new_string.split('\n')) lines.push(`+ ${l}`);
|
|
500
|
+
}
|
|
501
|
+
if (input.replace_all) lines.push('(replace_all)');
|
|
502
|
+
return lines.join('\n');
|
|
503
|
+
}
|
|
504
|
+
|
|
383
505
|
function stripMessages(messages) {
|
|
384
506
|
if (!Array.isArray(messages)) return { strippedMessages: messages, strippingStats: { toolResultsStripped: 0, toolUsesStripped: 0, charsRemoved: 0 } };
|
|
385
507
|
|
|
@@ -422,6 +544,22 @@ function stripMessages(messages) {
|
|
|
422
544
|
const input = block.input;
|
|
423
545
|
if (!input) return block;
|
|
424
546
|
|
|
547
|
+
// Smart diff stripping for Edit tool — keep only - / + lines
|
|
548
|
+
const editDiff = (block.name === 'Edit') ? smartStripEdit(input) : null;
|
|
549
|
+
if (editDiff) {
|
|
550
|
+
const inputStr = JSON.stringify(input);
|
|
551
|
+
charsRemoved += inputStr.length - editDiff.length;
|
|
552
|
+
toolUsesStripped++;
|
|
553
|
+
const stripped = {
|
|
554
|
+
type: 'tool_use',
|
|
555
|
+
id: block.id,
|
|
556
|
+
name: block.name,
|
|
557
|
+
input: { _stripped: editDiff }
|
|
558
|
+
};
|
|
559
|
+
if (block.cache_control) stripped.cache_control = block.cache_control;
|
|
560
|
+
return stripped;
|
|
561
|
+
}
|
|
562
|
+
|
|
425
563
|
const inputStr = JSON.stringify(input);
|
|
426
564
|
if (inputStr.length <= TOOL_USE_INPUT_PREVIEW_CHARS * 2) return block;
|
|
427
565
|
|
|
@@ -513,6 +651,16 @@ function stripOldToolResults(messages) {
|
|
|
513
651
|
const input = block.input;
|
|
514
652
|
if (!input) return block;
|
|
515
653
|
|
|
654
|
+
// Smart Edit stripping — keep only - / + diff lines
|
|
655
|
+
const editDiff = smartStripEdit(block);
|
|
656
|
+
if (editDiff) {
|
|
657
|
+
const origLen = JSON.stringify(input).length;
|
|
658
|
+
const newLen = JSON.stringify(editDiff.input).length;
|
|
659
|
+
charsRemoved += origLen - newLen;
|
|
660
|
+
toolResultsStripped++;
|
|
661
|
+
return editDiff;
|
|
662
|
+
}
|
|
663
|
+
|
|
516
664
|
const inputStr = JSON.stringify(input);
|
|
517
665
|
if (inputStr.length <= liveConfig.OLD_STRIP_THRESHOLD) return block;
|
|
518
666
|
|
|
@@ -548,6 +696,19 @@ function stripOldToolResults(messages) {
|
|
|
548
696
|
text: txt.slice(0, OLD_STRIP_PREVIEW_CHARS) + `...\n[HOOK-TRIMMED: ${txt.length} chars]`
|
|
549
697
|
};
|
|
550
698
|
}
|
|
699
|
+
|
|
700
|
+
// Strip old assistant text blocks — Claude's own output echoed back
|
|
701
|
+
// No point sending Claude its own words; keep first line as context anchor
|
|
702
|
+
if (msg.role === 'assistant' && txt.length > 120) {
|
|
703
|
+
const firstLine = txt.split('\n')[0].slice(0, 120);
|
|
704
|
+
const removed = txt.length - firstLine.length;
|
|
705
|
+
charsRemoved += removed;
|
|
706
|
+
toolResultsStripped++;
|
|
707
|
+
return {
|
|
708
|
+
...block,
|
|
709
|
+
text: `${firstLine}...\n[ASST-ECHO-STRIPPED: ${txt.length} chars → ${firstLine.length}]`
|
|
710
|
+
};
|
|
711
|
+
}
|
|
551
712
|
}
|
|
552
713
|
|
|
553
714
|
return block;
|
|
@@ -559,6 +720,81 @@ function stripOldToolResults(messages) {
|
|
|
559
720
|
return { messages: newMessages, strippingStats: { toolResultsStripped, charsRemoved } };
|
|
560
721
|
}
|
|
561
722
|
|
|
723
|
+
/**
|
|
724
|
+
* Strip <system-reminder> tags from messages.
|
|
725
|
+
* Keeps the FIRST system-reminder encountered (sets up style/context),
|
|
726
|
+
* strips all subsequent ones to save tokens.
|
|
727
|
+
*
|
|
728
|
+
* Returns { messages, remindersStripped, charsRemoved }.
|
|
729
|
+
*/
|
|
730
|
+
function stripSystemReminders(messages) {
|
|
731
|
+
if (!Array.isArray(messages)) return { messages, remindersStripped: 0, charsRemoved: 0 };
|
|
732
|
+
if (!liveConfig.SYSTEM_REMINDER_STRIPPING) return { messages, remindersStripped: 0, charsRemoved: 0 };
|
|
733
|
+
|
|
734
|
+
const SR_RE = /<system-reminder>[\s\S]*?<\/system-reminder>/g;
|
|
735
|
+
let firstSeen = false;
|
|
736
|
+
let remindersStripped = 0;
|
|
737
|
+
let charsRemoved = 0;
|
|
738
|
+
|
|
739
|
+
const newMessages = messages.map(msg => {
|
|
740
|
+
if (!msg) return msg;
|
|
741
|
+
|
|
742
|
+
// Handle string content
|
|
743
|
+
if (typeof msg.content === 'string') {
|
|
744
|
+
const matches = msg.content.match(SR_RE);
|
|
745
|
+
if (!matches) return msg;
|
|
746
|
+
|
|
747
|
+
let newText = msg.content;
|
|
748
|
+
for (const match of matches) {
|
|
749
|
+
if (!firstSeen) {
|
|
750
|
+
firstSeen = true; // keep the very first one
|
|
751
|
+
continue;
|
|
752
|
+
}
|
|
753
|
+
newText = newText.replace(match, '');
|
|
754
|
+
charsRemoved += match.length;
|
|
755
|
+
remindersStripped++;
|
|
756
|
+
}
|
|
757
|
+
return { ...msg, content: newText.replace(/\n{3,}/g, '\n\n').trim() };
|
|
758
|
+
}
|
|
759
|
+
|
|
760
|
+
// Handle array content blocks
|
|
761
|
+
if (!Array.isArray(msg.content)) return msg;
|
|
762
|
+
|
|
763
|
+
const newContent = msg.content.map(block => {
|
|
764
|
+
if (block.type !== 'text' || typeof block.text !== 'string') return block;
|
|
765
|
+
|
|
766
|
+
const matches = block.text.match(SR_RE);
|
|
767
|
+
if (!matches) return block;
|
|
768
|
+
|
|
769
|
+
let newText = block.text;
|
|
770
|
+
for (const match of matches) {
|
|
771
|
+
if (!firstSeen) {
|
|
772
|
+
firstSeen = true; // keep the very first one
|
|
773
|
+
continue;
|
|
774
|
+
}
|
|
775
|
+
newText = newText.replace(match, '');
|
|
776
|
+
charsRemoved += match.length;
|
|
777
|
+
remindersStripped++;
|
|
778
|
+
}
|
|
779
|
+
const cleaned = newText.replace(/\n{3,}/g, '\n\n').trim();
|
|
780
|
+
|
|
781
|
+
// If block is now empty after stripping, remove it entirely
|
|
782
|
+
if (!cleaned) return null;
|
|
783
|
+
|
|
784
|
+
return { ...block, text: cleaned };
|
|
785
|
+
}).filter(Boolean);
|
|
786
|
+
|
|
787
|
+
// If all content blocks were stripped, keep a minimal marker
|
|
788
|
+
if (newContent.length === 0) {
|
|
789
|
+
return { ...msg, content: [{ type: 'text', text: '[context]' }] };
|
|
790
|
+
}
|
|
791
|
+
|
|
792
|
+
return { ...msg, content: newContent };
|
|
793
|
+
});
|
|
794
|
+
|
|
795
|
+
return { messages: newMessages, remindersStripped, charsRemoved };
|
|
796
|
+
}
|
|
797
|
+
|
|
562
798
|
// ============================================================================
|
|
563
799
|
// Live Compression — Stenography + Neural MT with Loop-back Verification
|
|
564
800
|
// ============================================================================
|
|
@@ -849,15 +1085,60 @@ async function compressMessagesLive(messages) {
|
|
|
849
1085
|
let stenoOnlyCount = 0;
|
|
850
1086
|
let tmHits = 0;
|
|
851
1087
|
|
|
852
|
-
const
|
|
1088
|
+
const _resolvedSocket = resolveTranslateSocket();
|
|
1089
|
+
const translateAvailable = liveConfig.TRANSLATE_ENABLED && !!_resolvedSocket;
|
|
1090
|
+
|
|
1091
|
+
// ── Pre-translation filter: detect "translation-hostile" content ──
|
|
1092
|
+
// File paths, IDs, hashes, permissions, IPs, URLs, code identifiers, etc.
|
|
1093
|
+
// These will ALWAYS fail backtranslation verification, so skip MT entirely.
|
|
1094
|
+
const _PATH_RE = /(?:^|\s)[.~]?\/[\w./-]{3,}/; // /foo/bar.js, ./rel, ~/home
|
|
1095
|
+
const _UUID_RE = /[0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12}/i;
|
|
1096
|
+
const _HEX_RE = /\b[0-9a-f]{7,64}\b/i; // git hashes, hex IDs
|
|
1097
|
+
const _PERM_RE = /[dl-][r-][w-][xsStT-][r-][w-][xsStT-][r-][w-][xsStT-]/; // drwxr-xr-x
|
|
1098
|
+
const _IP_RE = /\b\d{1,3}\.\d{1,3}\.\d{1,3}\.\d{1,3}\b/; // IPv4
|
|
1099
|
+
const _URL_RE = /https?:\/\/\S{6,}/; // URLs
|
|
1100
|
+
const _PKG_RE = /[\w@][\w./-]*@\d+\.\d+/; // pkg@1.2.3
|
|
1101
|
+
const _CODE_ID = /\b[a-z][a-zA-Z0-9]{2,}\.[a-zA-Z]{1,4}\b/; // file.ext patterns
|
|
1102
|
+
const _CAMEL = /\b[a-z]+[A-Z][a-zA-Z]+\b/; // camelCase identifiers
|
|
1103
|
+
const _SNAKE = /\b[a-z]+_[a-z_]+\b/; // snake_case identifiers
|
|
1104
|
+
|
|
1105
|
+
function isTranslationHostile(text) {
|
|
1106
|
+
if (!text || text.length < 20) return true; // too short to compress meaningfully
|
|
1107
|
+
// Count how many "technical markers" appear
|
|
1108
|
+
const markers = [_PATH_RE, _UUID_RE, _HEX_RE, _PERM_RE, _IP_RE, _URL_RE, _PKG_RE, _CODE_ID];
|
|
1109
|
+
let hits = 0;
|
|
1110
|
+
for (const re of markers) if (re.test(text)) hits++;
|
|
1111
|
+
if (hits >= 3) return true; // 3+ different marker types = definitely technical
|
|
1112
|
+
|
|
1113
|
+
// Check density: what fraction of words are code/path-like?
|
|
1114
|
+
const words = text.split(/\s+/).filter(w => w.length > 1);
|
|
1115
|
+
if (words.length === 0) return true;
|
|
1116
|
+
let techWords = 0;
|
|
1117
|
+
for (const w of words) {
|
|
1118
|
+
if (_PATH_RE.test(w) || _HEX_RE.test(w) || _UUID_RE.test(w) ||
|
|
1119
|
+
_PERM_RE.test(w) || _IP_RE.test(w) || _URL_RE.test(w) ||
|
|
1120
|
+
_CAMEL.test(w) || _SNAKE.test(w) || _PKG_RE.test(w) ||
|
|
1121
|
+
/^\d+$/.test(w) || /^[A-Z_]{3,}$/.test(w)) {
|
|
1122
|
+
techWords++;
|
|
1123
|
+
}
|
|
1124
|
+
}
|
|
1125
|
+
return (techWords / words.length) > 0.40; // >40% technical tokens = skip MT
|
|
1126
|
+
}
|
|
853
1127
|
|
|
854
1128
|
// Step 1.5: Check Translation Memory cache first
|
|
855
1129
|
const needMT = []; // indices that need neural MT (only mtEligible blocks)
|
|
1130
|
+
let mtSkippedTech = 0;
|
|
856
1131
|
for (let i = 0; i < stenoTexts.length; i++) {
|
|
857
1132
|
// Only tool_result content is eligible for Chinese MT
|
|
858
1133
|
// User/assistant text stays steno-only to prevent Claude responding in Chinese
|
|
859
1134
|
if (!textLocations[i].mtEligible) continue;
|
|
860
1135
|
|
|
1136
|
+
// Skip translation-hostile content (file paths, IDs, code, etc.)
|
|
1137
|
+
if (isTranslationHostile(stenoTexts[i])) {
|
|
1138
|
+
mtSkippedTech++;
|
|
1139
|
+
continue; // stays steno-only — finalTexts[i] already has steno text
|
|
1140
|
+
}
|
|
1141
|
+
|
|
861
1142
|
const cached = tmLookup(stenoTexts[i]);
|
|
862
1143
|
if (cached && cached.length < stenoTexts[i].length) {
|
|
863
1144
|
finalTexts[i] = cached;
|
|
@@ -867,12 +1148,15 @@ async function compressMessagesLive(messages) {
|
|
|
867
1148
|
needMT.push(i);
|
|
868
1149
|
}
|
|
869
1150
|
}
|
|
1151
|
+
if (mtSkippedTech > 0) {
|
|
1152
|
+
log('info', `MT-SKIP: ${mtSkippedTech} blocks skipped (translation-hostile content)`);
|
|
1153
|
+
}
|
|
870
1154
|
|
|
871
1155
|
if (translateAvailable && needMT.length > 0) {
|
|
872
1156
|
try {
|
|
873
1157
|
// Step 2: Translate uncached steno English → Chinese (zt)
|
|
874
1158
|
const mtInputs = needMT.map(i => stenoTexts[i]);
|
|
875
|
-
const chineseTexts = await translateBatch(mtInputs,
|
|
1159
|
+
const chineseTexts = await translateBatch(mtInputs, _resolvedSocket, 'en', 'zh');
|
|
876
1160
|
|
|
877
1161
|
// Filter: only verify texts that actually changed and got shorter
|
|
878
1162
|
const needVerify = [];
|
|
@@ -888,7 +1172,7 @@ async function compressMessagesLive(messages) {
|
|
|
888
1172
|
|
|
889
1173
|
if (needVerify.length > 0) {
|
|
890
1174
|
// Step 3: Translate Chinese → English (loop-back)
|
|
891
|
-
const backTranslated = await translateBatch(needVerify,
|
|
1175
|
+
const backTranslated = await translateBatch(needVerify, _resolvedSocket, 'zh', 'en');
|
|
892
1176
|
|
|
893
1177
|
// Step 4: Verify each — compare back-translated with original
|
|
894
1178
|
for (let v = 0; v < verifyIndices.length; v++) {
|
|
@@ -1031,13 +1315,14 @@ async function compressSystemPrompt(system) {
|
|
|
1031
1315
|
: [...textBlocks];
|
|
1032
1316
|
|
|
1033
1317
|
// Step 2: Apply Chinese translation to eligible sections
|
|
1034
|
-
|
|
1318
|
+
const _sysSocket = resolveTranslateSocket();
|
|
1319
|
+
if (liveConfig.TRANSLATE_ENABLED && _sysSocket) {
|
|
1035
1320
|
try {
|
|
1036
1321
|
// Translate entire steno'd text via Hardwick Translate
|
|
1037
|
-
const translations = await translateBatch(compressed,
|
|
1322
|
+
const translations = await translateBatch(compressed, _sysSocket, 'en', 'zh');
|
|
1038
1323
|
if (translations && translations.length === compressed.length) {
|
|
1039
1324
|
// Verify each translation round-trips correctly
|
|
1040
|
-
const backTranslated = await translateBatch(translations,
|
|
1325
|
+
const backTranslated = await translateBatch(translations, _sysSocket, 'zh', 'en');
|
|
1041
1326
|
|
|
1042
1327
|
for (let i = 0; i < compressed.length; i++) {
|
|
1043
1328
|
if (!translations[i] || !backTranslated) continue;
|
|
@@ -1153,7 +1438,7 @@ async function handleRequest(req, res) {
|
|
|
1153
1438
|
const tmSize = Object.keys(tm).length;
|
|
1154
1439
|
const synSize = Object.keys(syns).length;
|
|
1155
1440
|
res.writeHead(200, { 'Content-Type': 'application/json' });
|
|
1156
|
-
res.end(JSON.stringify({ status: 'ok', paused: proxyPaused, uptime: Math.round((Date.now() - stats.startTime) / 1000), ...stats, tmEntries: tmSize, synonymPairs: synSize, envBaseUrlSet: !!process.env.ANTHROPIC_BASE_URL, envBaseUrl: process.env.ANTHROPIC_BASE_URL || '(not set)' }, null, 2));
|
|
1441
|
+
res.end(JSON.stringify({ status: 'ok', paused: proxyPaused, uptime: Math.round((Date.now() - stats.startTime) / 1000), ...stats, tmEntries: tmSize, synonymPairs: synSize, registeredProjects: projectRegistry.size, activeTranslateSocket: resolveTranslateSocket(), envBaseUrlSet: !!process.env.ANTHROPIC_BASE_URL, envBaseUrl: process.env.ANTHROPIC_BASE_URL || '(not set)' }, null, 2));
|
|
1157
1442
|
return;
|
|
1158
1443
|
}
|
|
1159
1444
|
|
|
@@ -1176,13 +1461,14 @@ async function handleRequest(req, res) {
|
|
|
1176
1461
|
try {
|
|
1177
1462
|
const body = JSON.parse((await collectBody(req)).toString('utf8'));
|
|
1178
1463
|
if (body.PRESERVE_RECENT_MESSAGES != null) liveConfig.PRESERVE_RECENT_MESSAGES = Math.max(1, Math.min(20, parseInt(body.PRESERVE_RECENT_MESSAGES) || 3));
|
|
1179
|
-
if (body.OLD_STRIP_THRESHOLD != null) liveConfig.OLD_STRIP_THRESHOLD = Math.max(
|
|
1180
|
-
if (body.MIN_TRANSLATE_LENGTH != null) liveConfig.MIN_TRANSLATE_LENGTH = Math.max(
|
|
1464
|
+
if (body.OLD_STRIP_THRESHOLD != null) liveConfig.OLD_STRIP_THRESHOLD = Math.max(0, Math.min(2000, parseInt(body.OLD_STRIP_THRESHOLD) || 0));
|
|
1465
|
+
if (body.MIN_TRANSLATE_LENGTH != null) liveConfig.MIN_TRANSLATE_LENGTH = Math.max(0, Math.min(200, parseInt(body.MIN_TRANSLATE_LENGTH) || 0));
|
|
1181
1466
|
if (body.TOOL_RESULT_PREVIEW_CHARS != null) liveConfig.TOOL_RESULT_PREVIEW_CHARS = Math.max(50, Math.min(500, parseInt(body.TOOL_RESULT_PREVIEW_CHARS) || 200));
|
|
1182
1467
|
if (body.STENO_ENABLED != null) liveConfig.STENO_ENABLED = !!body.STENO_ENABLED;
|
|
1183
1468
|
if (body.TRANSLATE_ENABLED != null) liveConfig.TRANSLATE_ENABLED = !!body.TRANSLATE_ENABLED;
|
|
1184
1469
|
if (body.OLD_STRIP_ENABLED != null) liveConfig.OLD_STRIP_ENABLED = !!body.OLD_STRIP_ENABLED;
|
|
1185
1470
|
if (body.SYSTEM_PROMPT_COMPRESS != null) liveConfig.SYSTEM_PROMPT_COMPRESS = !!body.SYSTEM_PROMPT_COMPRESS;
|
|
1471
|
+
if (body.SYSTEM_REMINDER_STRIPPING != null) liveConfig.SYSTEM_REMINDER_STRIPPING = !!body.SYSTEM_REMINDER_STRIPPING;
|
|
1186
1472
|
res.writeHead(200, { 'Content-Type': 'application/json' });
|
|
1187
1473
|
res.end(JSON.stringify({ ok: true, ...liveConfig }));
|
|
1188
1474
|
} catch (e) {
|
|
@@ -1224,11 +1510,97 @@ async function handleRequest(req, res) {
|
|
|
1224
1510
|
return;
|
|
1225
1511
|
}
|
|
1226
1512
|
|
|
1513
|
+
// Explicit pause/resume endpoints — no guessing with toggle
|
|
1514
|
+
if (req.url === '/pause' && req.method === 'POST') {
|
|
1515
|
+
proxyPaused = true;
|
|
1516
|
+
log('info', 'Proxy PAUSED via /pause');
|
|
1517
|
+
res.writeHead(200, { 'Content-Type': 'application/json' });
|
|
1518
|
+
res.end(JSON.stringify({ paused: true }));
|
|
1519
|
+
return;
|
|
1520
|
+
}
|
|
1521
|
+
if (req.url === '/resume' && req.method === 'POST') {
|
|
1522
|
+
proxyPaused = false;
|
|
1523
|
+
log('info', 'Proxy RESUMED via /resume');
|
|
1524
|
+
res.writeHead(200, { 'Content-Type': 'application/json' });
|
|
1525
|
+
res.end(JSON.stringify({ paused: false }));
|
|
1526
|
+
return;
|
|
1527
|
+
}
|
|
1528
|
+
|
|
1529
|
+
// --- Multi-Project Registry Endpoints ---
|
|
1530
|
+
|
|
1531
|
+
// POST /register — register a project with the daemon
|
|
1532
|
+
if (req.url === '/register' && req.method === 'POST') {
|
|
1533
|
+
try {
|
|
1534
|
+
const body = JSON.parse((await collectBody(req)).toString('utf8'));
|
|
1535
|
+
if (!body.projectPath) {
|
|
1536
|
+
res.writeHead(400, { 'Content-Type': 'application/json' });
|
|
1537
|
+
res.end(JSON.stringify({ error: 'projectPath required' }));
|
|
1538
|
+
return;
|
|
1539
|
+
}
|
|
1540
|
+
projectRegistry.set(body.projectPath, {
|
|
1541
|
+
projectPath: body.projectPath,
|
|
1542
|
+
pid: body.pid || 0,
|
|
1543
|
+
registeredAt: projectRegistry.get(body.projectPath)?.registeredAt || Date.now(),
|
|
1544
|
+
lastSeen: Date.now(),
|
|
1545
|
+
});
|
|
1546
|
+
_invalidateProjectCaches();
|
|
1547
|
+
log('info', `REGISTRY: registered project "${body.projectPath}" (pid=${body.pid || 0}, total=${projectRegistry.size})`);
|
|
1548
|
+
res.writeHead(200, { 'Content-Type': 'application/json' });
|
|
1549
|
+
res.end(JSON.stringify({ ok: true, registered: projectRegistry.size }));
|
|
1550
|
+
} catch (e) {
|
|
1551
|
+
res.writeHead(400, { 'Content-Type': 'application/json' });
|
|
1552
|
+
res.end(JSON.stringify({ error: e.message }));
|
|
1553
|
+
}
|
|
1554
|
+
return;
|
|
1555
|
+
}
|
|
1556
|
+
|
|
1557
|
+
// POST /deregister — remove a project from the daemon
|
|
1558
|
+
if (req.url === '/deregister' && req.method === 'POST') {
|
|
1559
|
+
try {
|
|
1560
|
+
const body = JSON.parse((await collectBody(req)).toString('utf8'));
|
|
1561
|
+
if (body.projectPath && projectRegistry.has(body.projectPath)) {
|
|
1562
|
+
projectRegistry.delete(body.projectPath);
|
|
1563
|
+
_invalidateProjectCaches();
|
|
1564
|
+
log('info', `REGISTRY: deregistered project "${body.projectPath}" (remaining=${projectRegistry.size})`);
|
|
1565
|
+
}
|
|
1566
|
+
res.writeHead(200, { 'Content-Type': 'application/json' });
|
|
1567
|
+
res.end(JSON.stringify({ ok: true, registered: projectRegistry.size }));
|
|
1568
|
+
} catch (e) {
|
|
1569
|
+
res.writeHead(400, { 'Content-Type': 'application/json' });
|
|
1570
|
+
res.end(JSON.stringify({ error: e.message }));
|
|
1571
|
+
}
|
|
1572
|
+
return;
|
|
1573
|
+
}
|
|
1574
|
+
|
|
1575
|
+
// GET /registry — diagnostic: list all registered projects
|
|
1576
|
+
if (req.url === '/registry' && req.method === 'GET') {
|
|
1577
|
+
const projects = [];
|
|
1578
|
+
for (const [path, entry] of projectRegistry.entries()) {
|
|
1579
|
+
let alive = false;
|
|
1580
|
+
if (entry.pid > 0) {
|
|
1581
|
+
try { process.kill(entry.pid, 0); alive = true; } catch {}
|
|
1582
|
+
}
|
|
1583
|
+
const sockPath = join(path, 'specmem', 'run', 'translate.sock');
|
|
1584
|
+
projects.push({
|
|
1585
|
+
projectPath: path,
|
|
1586
|
+
pid: entry.pid,
|
|
1587
|
+
alive,
|
|
1588
|
+
registeredAt: new Date(entry.registeredAt).toISOString(),
|
|
1589
|
+
lastSeen: new Date(entry.lastSeen).toISOString(),
|
|
1590
|
+
translateSocket: existsSync(sockPath) ? sockPath : null,
|
|
1591
|
+
});
|
|
1592
|
+
}
|
|
1593
|
+
res.writeHead(200, { 'Content-Type': 'application/json' });
|
|
1594
|
+
res.end(JSON.stringify({ projects, total: projects.length }, null, 2));
|
|
1595
|
+
return;
|
|
1596
|
+
}
|
|
1597
|
+
|
|
1227
1598
|
// Count only real API traffic, not management endpoint polls
|
|
1228
1599
|
stats.totalRequests++;
|
|
1229
1600
|
|
|
1601
|
+
let rawBody;
|
|
1230
1602
|
try {
|
|
1231
|
-
|
|
1603
|
+
rawBody = await collectBody(req);
|
|
1232
1604
|
|
|
1233
1605
|
// Paused — pass everything through untouched
|
|
1234
1606
|
if (proxyPaused) {
|
|
@@ -1275,7 +1647,8 @@ async function handleRequest(req, res) {
|
|
|
1275
1647
|
pushEvent('info', `POST /v1/messages model=${body.model || '?'} msgs=${messageCount} size=${(originalSize / 1024).toFixed(0)}KB`);
|
|
1276
1648
|
|
|
1277
1649
|
const isCompaction = isCompactionRequest(body);
|
|
1278
|
-
|
|
1650
|
+
// No passthrough — always process everything (system-reminder strip + steno + translate)
|
|
1651
|
+
const isPassthrough = false;
|
|
1279
1652
|
let sysPromptModified = false;
|
|
1280
1653
|
|
|
1281
1654
|
// === SYSTEM PROMPT COMPRESSION ===
|
|
@@ -1286,7 +1659,7 @@ async function handleRequest(req, res) {
|
|
|
1286
1659
|
const _sysKey = typeof body.system === 'string' ? body.system
|
|
1287
1660
|
: Array.isArray(body.system) ? body.system.map(b => typeof b === 'string' ? b : (b?.text || '')).join('')
|
|
1288
1661
|
: JSON.stringify(body.system);
|
|
1289
|
-
const _sysHash =
|
|
1662
|
+
const _sysHash = createHash('md5').update(_sysKey).digest('hex');
|
|
1290
1663
|
const _sysCached = _sysPromptCache.get(_sysHash);
|
|
1291
1664
|
|
|
1292
1665
|
if (_sysCached) {
|
|
@@ -1333,8 +1706,26 @@ async function handleRequest(req, res) {
|
|
|
1333
1706
|
log('info', `=== ${logMsg} ===`);
|
|
1334
1707
|
pushEvent('compaction', logMsg);
|
|
1335
1708
|
|
|
1336
|
-
|
|
1337
|
-
|
|
1709
|
+
// Strip redundant system-reminders first (before tool stripping)
|
|
1710
|
+
try {
|
|
1711
|
+
const srResult = stripSystemReminders(body.messages);
|
|
1712
|
+
if (srResult.remindersStripped > 0) {
|
|
1713
|
+
body.messages = srResult.messages;
|
|
1714
|
+
log('info', `[compaction] Stripped ${srResult.remindersStripped} system-reminders (${srResult.charsRemoved} chars)`);
|
|
1715
|
+
}
|
|
1716
|
+
} catch (srErr) {
|
|
1717
|
+
log('warn', `[compaction] stripSystemReminders failed: ${srErr.message}`);
|
|
1718
|
+
}
|
|
1719
|
+
|
|
1720
|
+
let strippingStats = { toolResultsStripped: 0, toolUsesStripped: 0, charsRemoved: 0 };
|
|
1721
|
+
try {
|
|
1722
|
+
const result = stripMessages(body.messages);
|
|
1723
|
+
body.messages = result.strippedMessages;
|
|
1724
|
+
strippingStats = result.strippingStats;
|
|
1725
|
+
} catch (stripErr) {
|
|
1726
|
+
log('warn', `stripMessages failed, using raw messages: ${stripErr.message}`);
|
|
1727
|
+
// Keep body.messages as-is
|
|
1728
|
+
}
|
|
1338
1729
|
|
|
1339
1730
|
// Run steno+MT compression in parallel (independent of strip)
|
|
1340
1731
|
if (!dontCompress) {
|
|
@@ -1369,24 +1760,38 @@ async function handleRequest(req, res) {
|
|
|
1369
1760
|
return;
|
|
1370
1761
|
}
|
|
1371
1762
|
|
|
1372
|
-
// ===
|
|
1373
|
-
|
|
1374
|
-
|
|
1375
|
-
|
|
1376
|
-
|
|
1377
|
-
|
|
1378
|
-
|
|
1379
|
-
|
|
1380
|
-
|
|
1381
|
-
|
|
1763
|
+
// === NO PASSTHROUGH — always process all requests ===
|
|
1764
|
+
// (passthrough mode removed — every request gets stripped + compressed)
|
|
1765
|
+
|
|
1766
|
+
// Step 0: Strip redundant <system-reminder> tags
|
|
1767
|
+
let srCharsRemoved = 0;
|
|
1768
|
+
let srRemindersStripped = 0;
|
|
1769
|
+
try {
|
|
1770
|
+
const srResult = stripSystemReminders(body.messages);
|
|
1771
|
+
if (srResult.remindersStripped > 0) {
|
|
1772
|
+
body.messages = srResult.messages;
|
|
1773
|
+
srCharsRemoved = srResult.charsRemoved;
|
|
1774
|
+
srRemindersStripped = srResult.remindersStripped;
|
|
1775
|
+
log('info', `Stripped ${srResult.remindersStripped} system-reminders (${srResult.charsRemoved} chars)`);
|
|
1776
|
+
}
|
|
1777
|
+
} catch (srErr) {
|
|
1778
|
+
log('warn', `stripSystemReminders failed, skipping: ${srErr.message}`);
|
|
1382
1779
|
}
|
|
1383
1780
|
|
|
1384
1781
|
// Step 1: Strip large tool_results from old messages (biggest savings)
|
|
1385
|
-
|
|
1386
|
-
|
|
1387
|
-
|
|
1782
|
+
let oldStrip = { toolResultsStripped: 0, charsRemoved: 0 };
|
|
1783
|
+
try {
|
|
1784
|
+
if (liveConfig.OLD_STRIP_ENABLED) {
|
|
1785
|
+
const result = stripOldToolResults(body.messages);
|
|
1786
|
+
if (result.strippingStats.charsRemoved > 0) {
|
|
1787
|
+
body.messages = result.messages;
|
|
1788
|
+
oldStrip = result.strippingStats;
|
|
1789
|
+
}
|
|
1790
|
+
}
|
|
1791
|
+
} catch (stripErr) {
|
|
1792
|
+
log('warn', `stripOldToolResults failed, skipping: ${stripErr.message}`);
|
|
1793
|
+
}
|
|
1388
1794
|
if (oldStrip.charsRemoved > 0) {
|
|
1389
|
-
body.messages = preStripped;
|
|
1390
1795
|
stats.oldStripped += oldStrip.toolResultsStripped;
|
|
1391
1796
|
stats.oldCharsRemoved += oldStrip.charsRemoved;
|
|
1392
1797
|
stats.tokensStripped += Math.floor(oldStrip.charsRemoved / 4);
|
|
@@ -1397,13 +1802,18 @@ async function handleRequest(req, res) {
|
|
|
1397
1802
|
// Step 2: Steno+MT compression on remaining text
|
|
1398
1803
|
const { messages: compressed, blocksCompressed, charsCompressed, verifiedCount = 0, stenoOnlyCount = 0, tmHits: hits = 0, samples: liveSamples = [] } = await compressMessagesLive(body.messages);
|
|
1399
1804
|
|
|
1400
|
-
|
|
1805
|
+
// srCharsRemoved already tracked from Step 0 above
|
|
1806
|
+
|
|
1807
|
+
if (blocksCompressed === 0 && oldStrip.charsRemoved === 0 && srCharsRemoved === 0) {
|
|
1401
1808
|
stats.passthrough++;
|
|
1402
1809
|
pushEvent('pass', `msgs=${messageCount} (nothing to compress)`);
|
|
1403
1810
|
forwardRequest(req, res, rawBody);
|
|
1404
1811
|
return;
|
|
1405
1812
|
}
|
|
1406
1813
|
|
|
1814
|
+
// If anything was stripped/compressed, body was mutated — must re-serialize
|
|
1815
|
+
body.messages = compressed;
|
|
1816
|
+
|
|
1407
1817
|
// Store translation samples for preview
|
|
1408
1818
|
if (liveSamples.length > 0) stats._lastSamples = liveSamples;
|
|
1409
1819
|
|
|
@@ -1417,8 +1827,8 @@ async function handleRequest(req, res) {
|
|
|
1417
1827
|
stats.stenoOnly += (blocksCompressed - verifiedCount - stenoOnlyCount);
|
|
1418
1828
|
stats.tmHits += hits;
|
|
1419
1829
|
pushEvent('compress', `LIVE: ${blocksCompressed} blocks, ${charsCompressed} chars (${verifiedCount} zh, ${stenoOnlyCount} steno, ${hits} TM)`);
|
|
1420
|
-
} else if (oldStrip.charsRemoved > 0) {
|
|
1421
|
-
// Only stripping, no compression — still send modified body
|
|
1830
|
+
} else if (oldStrip.charsRemoved > 0 || srCharsRemoved > 0) {
|
|
1831
|
+
// Only stripping (tool results or system-reminders), no compression — still send modified body
|
|
1422
1832
|
stats.liveCompressed++;
|
|
1423
1833
|
}
|
|
1424
1834
|
stats.lastLiveCompress = new Date().toISOString();
|
|
@@ -1428,7 +1838,8 @@ async function handleRequest(req, res) {
|
|
|
1428
1838
|
const savedPercent = originalSize > 0 ? ((savedBytes / originalSize) * 100).toFixed(1) : '0';
|
|
1429
1839
|
|
|
1430
1840
|
const stripInfo = oldStrip.charsRemoved > 0 ? ` [STRIP: ${oldStrip.toolResultsStripped} results, ${(oldStrip.charsRemoved / 1024).toFixed(0)}KB]` : '';
|
|
1431
|
-
|
|
1841
|
+
const srInfo = srCharsRemoved > 0 ? ` [SR: ${srRemindersStripped} reminders, ${(srCharsRemoved / 1024).toFixed(1)}KB]` : '';
|
|
1842
|
+
log('info', `LIVE: ${blocksCompressed} blocks | ${(originalSize / 1024).toFixed(0)}KB → ${(compressedBody.length / 1024).toFixed(0)}KB (-${savedPercent}%)${stripInfo}${srInfo}`);
|
|
1432
1843
|
pushEvent('saved', `${(originalSize / 1024).toFixed(0)}KB → ${(compressedBody.length / 1024).toFixed(0)}KB (-${savedPercent}%) ~${Math.round(savedBytes / 3.5)} tokens`);
|
|
1433
1844
|
|
|
1434
1845
|
pushPreview(rawBody.toString('utf8'), compressedBody.toString('utf8'), 'live', liveSamples);
|
|
@@ -1437,11 +1848,35 @@ async function handleRequest(req, res) {
|
|
|
1437
1848
|
|
|
1438
1849
|
} catch (err) {
|
|
1439
1850
|
log('error', `Handler error: ${err.message}`);
|
|
1851
|
+
log('error', `Handler stack: ${err.stack || '(no stack)'}`);
|
|
1440
1852
|
pushEvent('error', err.message);
|
|
1441
1853
|
stats.errors++;
|
|
1854
|
+
// CRITICAL: Never return 502 — fall back to forwarding raw body.
|
|
1855
|
+
// The proxy must NEVER break the API call. Compression is optional;
|
|
1856
|
+
// if it fails, just passthrough the original request.
|
|
1442
1857
|
if (!res.headersSent) {
|
|
1443
|
-
|
|
1444
|
-
|
|
1858
|
+
try {
|
|
1859
|
+
const fallbackBody = (typeof rawBody !== 'undefined' && rawBody && rawBody.length > 0) ? rawBody : null;
|
|
1860
|
+
if (fallbackBody) {
|
|
1861
|
+
log('warn', `Falling back to passthrough after handler error: ${err.message}`);
|
|
1862
|
+
stats.passthrough++;
|
|
1863
|
+
forwardRequest(req, res, fallbackBody);
|
|
1864
|
+
} else {
|
|
1865
|
+
// rawBody unavailable — re-collect from request if possible, else auto-pause and passthrough next time
|
|
1866
|
+
log('warn', `No rawBody available — auto-pausing proxy to prevent further 502s: ${err.message}`);
|
|
1867
|
+
proxyPaused = true;
|
|
1868
|
+
// Return a retriable error so Claude Code retries (and next attempt hits passthrough path)
|
|
1869
|
+
res.writeHead(503, { 'Content-Type': 'application/json', 'Retry-After': '1' });
|
|
1870
|
+
res.end(JSON.stringify({ type: 'error', error: { type: 'overloaded_error', message: 'Proxy auto-paused due to handler error, retry immediately' } }));
|
|
1871
|
+
}
|
|
1872
|
+
} catch (fallbackErr) {
|
|
1873
|
+
log('error', `Fallback also failed: ${fallbackErr.message}`);
|
|
1874
|
+
if (!res.headersSent) {
|
|
1875
|
+
proxyPaused = true;
|
|
1876
|
+
res.writeHead(503, { 'Content-Type': 'application/json', 'Retry-After': '1' });
|
|
1877
|
+
res.end(JSON.stringify({ type: 'error', error: { type: 'overloaded_error', message: 'Proxy auto-paused, retry immediately' } }));
|
|
1878
|
+
}
|
|
1879
|
+
}
|
|
1445
1880
|
}
|
|
1446
1881
|
}
|
|
1447
1882
|
}
|
|
@@ -1459,13 +1894,9 @@ let proxyServer = null;
|
|
|
1459
1894
|
* Returns { started: boolean, port: number }
|
|
1460
1895
|
*/
|
|
1461
1896
|
export async function startCompactionProxy() {
|
|
1462
|
-
//
|
|
1463
|
-
|
|
1464
|
-
|
|
1465
|
-
cleanupPortFile();
|
|
1466
|
-
cleanupPidFile();
|
|
1467
|
-
return { started: false, port: PROXY_PORT, reason: 'disabled_by_user' };
|
|
1468
|
-
}
|
|
1897
|
+
// Disabled flag = start in passthrough mode (proxy always in path for seamless toggling).
|
|
1898
|
+
// The daemon itself reads the flag and starts paused.
|
|
1899
|
+
const disabledByUser = existsSync(DISABLED_FILE);
|
|
1469
1900
|
|
|
1470
1901
|
// Check PID file — is daemon already running?
|
|
1471
1902
|
if (existsSync(PID_FILE)) {
|
|
@@ -1478,8 +1909,11 @@ export async function startCompactionProxy() {
|
|
|
1478
1909
|
// Process exists, verify it responds to health check
|
|
1479
1910
|
const healthy = await checkDaemonHealth();
|
|
1480
1911
|
if (healthy) {
|
|
1481
|
-
log('info', `Daemon already running (PID ${pid}), skipping spawn`);
|
|
1482
|
-
|
|
1912
|
+
log('info', `Daemon already running (PID ${pid})${disabledByUser ? ' (passthrough mode)' : ''}, skipping spawn`);
|
|
1913
|
+
// If disabled flag changed since daemon started, sync pause state via SIGUSR1
|
|
1914
|
+
// (daemon checks disabled file on toggle, but we can hint via stats check)
|
|
1915
|
+
registerWithDaemon(process.env.SPECMEM_PROJECT_PATH, process.pid);
|
|
1916
|
+
return { started: false, port: PROXY_PORT, paused: disabledByUser, reason: 'daemon_already_running' };
|
|
1483
1917
|
}
|
|
1484
1918
|
// Process alive but not responding — stale, kill it
|
|
1485
1919
|
log('warn', `Daemon PID ${pid} alive but not healthy, killing stale process`);
|
|
@@ -1515,14 +1949,16 @@ export async function startCompactionProxy() {
|
|
|
1515
1949
|
const deadline = Date.now() + 3000;
|
|
1516
1950
|
while (Date.now() < deadline) {
|
|
1517
1951
|
if (existsSync(PORT_FILE)) {
|
|
1518
|
-
log('info', `Daemon ready (PID ${child.pid}), port file appeared`);
|
|
1519
|
-
|
|
1952
|
+
log('info', `Daemon ready (PID ${child.pid})${disabledByUser ? ' in passthrough mode' : ''}, port file appeared`);
|
|
1953
|
+
registerWithDaemon(process.env.SPECMEM_PROJECT_PATH, process.pid);
|
|
1954
|
+
return { started: true, port: PROXY_PORT, paused: disabledByUser };
|
|
1520
1955
|
}
|
|
1521
1956
|
await new Promise(r => setTimeout(r, 100));
|
|
1522
1957
|
}
|
|
1523
1958
|
|
|
1524
1959
|
log('warn', 'Daemon spawned but port file did not appear within 3s');
|
|
1525
|
-
|
|
1960
|
+
registerWithDaemon(process.env.SPECMEM_PROJECT_PATH, process.pid);
|
|
1961
|
+
return { started: true, port: PROXY_PORT, paused: disabledByUser, reason: 'timeout_waiting_for_port' };
|
|
1526
1962
|
}
|
|
1527
1963
|
|
|
1528
1964
|
/**
|
|
@@ -1559,6 +1995,12 @@ function togglePause() {
|
|
|
1559
1995
|
return proxyPaused;
|
|
1560
1996
|
}
|
|
1561
1997
|
|
|
1998
|
+
function setPaused(state) {
|
|
1999
|
+
proxyPaused = !!state;
|
|
2000
|
+
log('info', `Proxy pause state set to ${proxyPaused ? 'PAUSED' : 'ACTIVE'}`);
|
|
2001
|
+
return proxyPaused;
|
|
2002
|
+
}
|
|
2003
|
+
|
|
1562
2004
|
/**
|
|
1563
2005
|
* Check if the daemon is responding on its health endpoint.
|
|
1564
2006
|
*/
|
|
@@ -1575,11 +2017,12 @@ function checkDaemonHealth() {
|
|
|
1575
2017
|
}
|
|
1576
2018
|
|
|
1577
2019
|
/**
|
|
1578
|
-
* Stop the proxy —
|
|
2020
|
+
* Stop the proxy — deregisters this project from the daemon.
|
|
1579
2021
|
* The daemon persists independently of the MCP process.
|
|
1580
2022
|
* Use killCompactionProxy() to explicitly terminate the daemon.
|
|
1581
2023
|
*/
|
|
1582
2024
|
export function stopCompactionProxy() {
|
|
2025
|
+
deregisterFromDaemon(process.env.SPECMEM_PROJECT_PATH);
|
|
1583
2026
|
return Promise.resolve();
|
|
1584
2027
|
}
|
|
1585
2028
|
|
|
@@ -1667,6 +2110,115 @@ export function getCompactionProxyStats() {
|
|
|
1667
2110
|
return { running, daemonPid, port: PROXY_PORT };
|
|
1668
2111
|
}
|
|
1669
2112
|
|
|
2113
|
+
// ============================================================================
|
|
2114
|
+
// Registration helpers — fire-and-forget HTTP to the daemon
|
|
2115
|
+
// ============================================================================
|
|
2116
|
+
|
|
2117
|
+
/**
|
|
2118
|
+
* Register this project with the running daemon.
|
|
2119
|
+
* Fire-and-forget — if daemon isn't running yet, fails silently.
|
|
2120
|
+
*/
|
|
2121
|
+
function registerWithDaemon(projectPath, pid) {
|
|
2122
|
+
if (!projectPath) return;
|
|
2123
|
+
const body = JSON.stringify({ projectPath, pid: pid || process.pid });
|
|
2124
|
+
try {
|
|
2125
|
+
const req = httpRequest({
|
|
2126
|
+
hostname: '127.0.0.1',
|
|
2127
|
+
port: PROXY_PORT,
|
|
2128
|
+
path: '/register',
|
|
2129
|
+
method: 'POST',
|
|
2130
|
+
headers: { 'Content-Type': 'application/json', 'Content-Length': Buffer.byteLength(body) },
|
|
2131
|
+
timeout: 2000,
|
|
2132
|
+
});
|
|
2133
|
+
req.on('error', () => {}); // fire-and-forget
|
|
2134
|
+
req.on('timeout', () => req.destroy());
|
|
2135
|
+
req.write(body);
|
|
2136
|
+
req.end();
|
|
2137
|
+
log('info', `Sent /register for "${projectPath}" (pid=${pid || process.pid})`);
|
|
2138
|
+
} catch { /* fire-and-forget */ }
|
|
2139
|
+
}
|
|
2140
|
+
|
|
2141
|
+
/**
|
|
2142
|
+
* Deregister this project from the running daemon.
|
|
2143
|
+
* Fire-and-forget — best effort cleanup on shutdown.
|
|
2144
|
+
*/
|
|
2145
|
+
function deregisterFromDaemon(projectPath) {
|
|
2146
|
+
if (!projectPath) return;
|
|
2147
|
+
const body = JSON.stringify({ projectPath });
|
|
2148
|
+
try {
|
|
2149
|
+
const req = httpRequest({
|
|
2150
|
+
hostname: '127.0.0.1',
|
|
2151
|
+
port: PROXY_PORT,
|
|
2152
|
+
path: '/deregister',
|
|
2153
|
+
method: 'POST',
|
|
2154
|
+
headers: { 'Content-Type': 'application/json', 'Content-Length': Buffer.byteLength(body) },
|
|
2155
|
+
timeout: 2000,
|
|
2156
|
+
});
|
|
2157
|
+
req.on('error', () => {}); // fire-and-forget
|
|
2158
|
+
req.on('timeout', () => req.destroy());
|
|
2159
|
+
req.write(body);
|
|
2160
|
+
req.end();
|
|
2161
|
+
log('info', `Sent /deregister for "${projectPath}"`);
|
|
2162
|
+
} catch { /* fire-and-forget */ }
|
|
2163
|
+
}
|
|
2164
|
+
|
|
2165
|
+
// ============================================================================
|
|
2166
|
+
// Stale Project Reaper — removes dead projects from the registry
|
|
2167
|
+
// ============================================================================
|
|
2168
|
+
|
|
2169
|
+
/**
|
|
2170
|
+
* Check if a PID is alive using signal 0.
|
|
2171
|
+
*/
|
|
2172
|
+
function isPidAlive(pid) {
|
|
2173
|
+
if (!pid || pid <= 0) return false;
|
|
2174
|
+
try {
|
|
2175
|
+
process.kill(pid, 0);
|
|
2176
|
+
return true;
|
|
2177
|
+
} catch {
|
|
2178
|
+
return false;
|
|
2179
|
+
}
|
|
2180
|
+
}
|
|
2181
|
+
|
|
2182
|
+
/**
|
|
2183
|
+
* Reap stale projects — remove entries with dead PIDs.
|
|
2184
|
+
*/
|
|
2185
|
+
function reapStaleProjects() {
|
|
2186
|
+
let reaped = 0;
|
|
2187
|
+
for (const [path, entry] of projectRegistry.entries()) {
|
|
2188
|
+
if (entry.pid > 0 && !isPidAlive(entry.pid)) {
|
|
2189
|
+
projectRegistry.delete(path);
|
|
2190
|
+
reaped++;
|
|
2191
|
+
log('info', `REAPER: removed stale project "${path}" (dead pid=${entry.pid})`);
|
|
2192
|
+
}
|
|
2193
|
+
}
|
|
2194
|
+
if (reaped > 0) {
|
|
2195
|
+
_invalidateProjectCaches();
|
|
2196
|
+
log('info', `REAPER: reaped ${reaped} stale projects, ${projectRegistry.size} remaining`);
|
|
2197
|
+
}
|
|
2198
|
+
}
|
|
2199
|
+
|
|
2200
|
+
let _reaperTimer = null;
|
|
2201
|
+
|
|
2202
|
+
/**
|
|
2203
|
+
* Start the stale project reaper (30s interval, unref'd).
|
|
2204
|
+
*/
|
|
2205
|
+
function startReaper() {
|
|
2206
|
+
if (_reaperTimer) return;
|
|
2207
|
+
_reaperTimer = setInterval(reapStaleProjects, 30000);
|
|
2208
|
+
_reaperTimer.unref();
|
|
2209
|
+
log('info', 'REAPER: started (30s interval)');
|
|
2210
|
+
}
|
|
2211
|
+
|
|
2212
|
+
/**
|
|
2213
|
+
* Check if any registered projects have live PIDs.
|
|
2214
|
+
*/
|
|
2215
|
+
function hasLiveProjects() {
|
|
2216
|
+
for (const entry of projectRegistry.values()) {
|
|
2217
|
+
if (entry.pid > 0 && isPidAlive(entry.pid)) return true;
|
|
2218
|
+
}
|
|
2219
|
+
return false;
|
|
2220
|
+
}
|
|
2221
|
+
|
|
1670
2222
|
// ============================================================================
|
|
1671
2223
|
// Daemon Internals — exported for compactionProxyDaemon.js
|
|
1672
2224
|
// ============================================================================
|
|
@@ -1675,6 +2227,9 @@ export {
|
|
|
1675
2227
|
handleRequest,
|
|
1676
2228
|
log,
|
|
1677
2229
|
togglePause,
|
|
2230
|
+
setPaused,
|
|
2231
|
+
startReaper,
|
|
2232
|
+
hasLiveProjects,
|
|
1678
2233
|
PROXY_PORT,
|
|
1679
2234
|
PORT_FILE,
|
|
1680
2235
|
PID_FILE,
|