@pugi/cli 0.1.0-beta.31 → 0.1.0-beta.35
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/commands/smoke.js +133 -0
- package/dist/core/auth/ensure-authenticated.js +129 -0
- package/dist/core/bash-classifier.js +108 -1
- package/dist/core/codegraph/decision-store.js +248 -0
- package/dist/core/codegraph/detect-repo.js +459 -0
- package/dist/core/codegraph/install.js +134 -0
- package/dist/core/codegraph/offer-hook.js +220 -0
- package/dist/core/diagnostics/probes/status-snapshot.js +50 -4
- package/dist/core/onboarding/ensure-initialized.js +133 -0
- package/dist/core/repl/session.js +370 -9
- package/dist/core/repl/slash-commands.js +68 -5
- package/dist/core/smoke/headless-driver.js +174 -0
- package/dist/core/smoke/orchestrator.js +194 -0
- package/dist/core/smoke/runner.js +238 -0
- package/dist/core/smoke/scenario-parser.js +316 -0
- package/dist/runtime/cli.js +453 -11
- package/dist/runtime/commands/cancel.js +231 -0
- package/dist/runtime/commands/codegraph-status.js +227 -0
- package/dist/runtime/commands/permissions.js +23 -0
- package/dist/runtime/commands/redo-blob-store.js +92 -0
- package/dist/runtime/commands/redo.js +361 -0
- package/dist/runtime/commands/status.js +11 -3
- package/dist/runtime/commands/undo.js +32 -0
- package/dist/runtime/headless-repl.js +195 -0
- package/dist/runtime/version.js +1 -1
- package/dist/tui/permissions-picker.js +78 -0
- package/dist/tui/render.js +35 -0
- package/dist/tui/status-bar.js +1 -1
- package/dist/tui/tool-stream-pane.js +45 -3
- package/package.json +7 -4
- package/test/scenarios/codegen-create-file.scenario.txt +13 -0
- package/test/scenarios/compact-force.scenario.txt +11 -0
- package/test/scenarios/identity.scenario.txt +11 -0
- package/test/scenarios/persona-handoff.scenario.txt +11 -0
- package/test/scenarios/walkback.scenario.txt +12 -0
- package/dist/core/engine/compaction-hook.js +0 -154
- package/dist/core/init/scaffold.js +0 -195
- package/dist/core/memory/dual-write.spec.js +0 -297
- package/dist/core/memory-sync/queue.spec.js +0 -105
- package/dist/core/repl/codebase-survey.js +0 -308
- package/dist/core/repl/init-interview.js +0 -457
- package/dist/core/repl/onboarding-state.js +0 -297
- package/dist/runtime/commands/memory.spec.js +0 -174
|
@@ -0,0 +1,459 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Repo detection helper — Wave 6 BIG TRACK 9 Phase 2 (codegraph
|
|
3
|
+
* context-aware auto-install, 2026-05-27).
|
|
4
|
+
*
|
|
5
|
+
* Walks up from `cwd` looking for a `.git/` directory; if found, runs a
|
|
6
|
+
* bounded scan (≤ MAX_SCAN_FILES files, depth-limited) to classify the
|
|
7
|
+
* repo size + detect primary languages. The result feeds two surfaces:
|
|
8
|
+
*
|
|
9
|
+
* 1. `pugi init` — when the repo is medium+ AND has a supported
|
|
10
|
+
* primary language, the init flow asks the operator whether to
|
|
11
|
+
* install the codegraph MCP server (Phase 1 example config →
|
|
12
|
+
* auto-merged into .pugi/mcp.json).
|
|
13
|
+
* 2. Cold-start hook — every `pugi` invocation looks up the last-asked
|
|
14
|
+
* timestamp; if the operator declined more than 30 days ago AND
|
|
15
|
+
* the repo still triggers, we surface a one-line nudge.
|
|
16
|
+
*
|
|
17
|
+
* Why a stand-alone scanner (vs. reusing core/repo-map/scanner.ts):
|
|
18
|
+
*
|
|
19
|
+
* - repo-map scans up to 5000 files with statSync per file to build a
|
|
20
|
+
* symbol cache. We need a much cheaper classification: ≤ 1000 files,
|
|
21
|
+
* no stat for size (just dirent.name), bail early on the first
|
|
22
|
+
* manifest file we recognise. The 5000-file walker would dominate
|
|
23
|
+
* cold-start latency on a monorepo.
|
|
24
|
+
* - We deliberately do NOT respect .pugiignore here — codegraph cares
|
|
25
|
+
* about the WHOLE repo (vendored libs included), not the operator's
|
|
26
|
+
* curated workspace view. The repo-map scanner does the opposite.
|
|
27
|
+
* - The output is structurally different (size category + language
|
|
28
|
+
* manifest list) so even if we reused the walker the post-processing
|
|
29
|
+
* would be different. Keeping the scans independent prevents one
|
|
30
|
+
* surface's heuristics from leaking into the other.
|
|
31
|
+
*
|
|
32
|
+
* Pure module: no logging, no network, no telemetry. Errors during
|
|
33
|
+
* readdir on a subtree (permission denied, symlink loop) are swallowed
|
|
34
|
+
* and the walker continues — repo detection is best-effort context.
|
|
35
|
+
* The function NEVER throws; a malformed cwd returns `{ isRepo: false }`.
|
|
36
|
+
*/
|
|
37
|
+
import { readdirSync, existsSync, statSync, readFileSync } from 'node:fs';
|
|
38
|
+
import { dirname, join, resolve } from 'node:path';
|
|
39
|
+
/**
|
|
40
|
+
* Maximum directories we descend into. A 1000-file repo classifies as
|
|
41
|
+
* "large" already; deeper walks add latency without changing the
|
|
42
|
+
* verdict. Hit this cap and we cap the file count at MAX_SCAN_FILES
|
|
43
|
+
* and return the verdict — the codegraph decision does not care
|
|
44
|
+
* whether the repo is 1001 or 100_001 files.
|
|
45
|
+
*/
|
|
46
|
+
export const MAX_SCAN_FILES = 1000;
|
|
47
|
+
/**
|
|
48
|
+
* Hard cap on walk depth. Counted from `gitRoot`. Anything beyond is
|
|
49
|
+
* deep tooling output (node_modules, vendored deps, generated). The
|
|
50
|
+
* scanner short-circuits at this depth and the result is reported as
|
|
51
|
+
* `wasCapped: true` so the consumer can hint the operator if needed.
|
|
52
|
+
*/
|
|
53
|
+
export const MAX_SCAN_DEPTH = 6;
|
|
54
|
+
/**
|
|
55
|
+
* Walk-up cap searching for the `.git/` parent. 12 ancestors matches
|
|
56
|
+
* the bootstrap.ts contract for project-marker detection — operators
|
|
57
|
+
* running `pugi` from `node_modules/foo/bar/baz` are an error case, not
|
|
58
|
+
* a feature.
|
|
59
|
+
*/
|
|
60
|
+
export const MAX_GIT_WALK = 12;
|
|
61
|
+
/**
|
|
62
|
+
* Directory basenames we skip outright. These are pure noise for code
|
|
63
|
+
* navigation — vendored deps, build artefacts, version-control plumbing,
|
|
64
|
+
* cached test outputs. Trimming them at the dirent level keeps the scan
|
|
65
|
+
* O(useful-source-files) rather than O(everything-on-disk).
|
|
66
|
+
*/
|
|
67
|
+
const SKIP_DIRS = new Set([
|
|
68
|
+
'.git',
|
|
69
|
+
'node_modules',
|
|
70
|
+
'dist',
|
|
71
|
+
'build',
|
|
72
|
+
'out',
|
|
73
|
+
'.next',
|
|
74
|
+
'.nuxt',
|
|
75
|
+
'.turbo',
|
|
76
|
+
'.cache',
|
|
77
|
+
'coverage',
|
|
78
|
+
'__pycache__',
|
|
79
|
+
'.venv',
|
|
80
|
+
'venv',
|
|
81
|
+
'target',
|
|
82
|
+
'.gradle',
|
|
83
|
+
'.idea',
|
|
84
|
+
'.vscode',
|
|
85
|
+
'.pugi',
|
|
86
|
+
]);
|
|
87
|
+
/**
|
|
88
|
+
* Source-file extensions that count toward the size category. Mirrors
|
|
89
|
+
* the codegraph upstream's own language list (tree-sitter grammars for
|
|
90
|
+
* 19 languages) but pruned to the set that we actually return as
|
|
91
|
+
* `supported` languages — the categorisation must agree with the
|
|
92
|
+
* language-match gate that drives the install prompt.
|
|
93
|
+
*/
|
|
94
|
+
const SOURCE_EXTENSIONS = new Set([
|
|
95
|
+
'.ts', '.tsx', '.js', '.jsx', '.mjs', '.cjs',
|
|
96
|
+
'.py',
|
|
97
|
+
'.rs',
|
|
98
|
+
'.go',
|
|
99
|
+
'.java', '.kt', '.kts',
|
|
100
|
+
'.rb',
|
|
101
|
+
'.php',
|
|
102
|
+
'.c', '.h', '.cpp', '.hpp', '.cc', '.cxx',
|
|
103
|
+
'.cs',
|
|
104
|
+
'.swift',
|
|
105
|
+
'.scala',
|
|
106
|
+
]);
|
|
107
|
+
export const CODEGRAPH_SUPPORTED_LANGUAGES = Object.freeze([
|
|
108
|
+
'typescript',
|
|
109
|
+
'javascript',
|
|
110
|
+
'python',
|
|
111
|
+
'rust',
|
|
112
|
+
'go',
|
|
113
|
+
'java',
|
|
114
|
+
]);
|
|
115
|
+
const MANIFEST_HINTS = Object.freeze([
|
|
116
|
+
{ filename: 'package.json', languages: ['javascript', 'typescript'] },
|
|
117
|
+
{ filename: 'tsconfig.json', languages: ['typescript'] },
|
|
118
|
+
{ filename: 'pyproject.toml', languages: ['python'] },
|
|
119
|
+
{ filename: 'requirements.txt', languages: ['python'] },
|
|
120
|
+
{ filename: 'setup.py', languages: ['python'] },
|
|
121
|
+
{ filename: 'Pipfile', languages: ['python'] },
|
|
122
|
+
{ filename: 'Cargo.toml', languages: ['rust'] },
|
|
123
|
+
{ filename: 'go.mod', languages: ['go'] },
|
|
124
|
+
{ filename: 'pom.xml', languages: ['java'] },
|
|
125
|
+
{ filename: 'build.gradle', languages: ['java'] },
|
|
126
|
+
{ filename: 'build.gradle.kts', languages: ['java'] },
|
|
127
|
+
]);
|
|
128
|
+
/**
|
|
129
|
+
* Walk up from `cwd` looking for `.git/`. Returns the absolute path of
|
|
130
|
+
* the git-root directory OR null if none is found within the walk cap.
|
|
131
|
+
*/
|
|
132
|
+
export function findGitRoot(cwd) {
|
|
133
|
+
let current = resolve(cwd);
|
|
134
|
+
for (let i = 0; i < MAX_GIT_WALK; i += 1) {
|
|
135
|
+
if (existsSync(join(current, '.git')))
|
|
136
|
+
return current;
|
|
137
|
+
const parent = dirname(current);
|
|
138
|
+
if (parent === current)
|
|
139
|
+
return null;
|
|
140
|
+
current = parent;
|
|
141
|
+
}
|
|
142
|
+
return null;
|
|
143
|
+
}
|
|
144
|
+
/**
|
|
145
|
+
* Read manifest files at the git root + classify their languages.
|
|
146
|
+
* Pure file-system stat — we do NOT parse the manifests (a malformed
|
|
147
|
+
* package.json should not break detection). Multiple manifests can
|
|
148
|
+
* hit; e.g. a polyglot repo with package.json + pyproject.toml lights
|
|
149
|
+
* up both `typescript`/`javascript` and `python`.
|
|
150
|
+
*
|
|
151
|
+
* `package.json` is special-cased: if a `tsconfig.json` lives next to
|
|
152
|
+
* it we drop the `javascript` hint so a pure-TS repo doesn't get
|
|
153
|
+
* counted twice. JS-only repos surface as `javascript`.
|
|
154
|
+
*/
|
|
155
|
+
function detectManifestLanguages(gitRoot) {
|
|
156
|
+
const out = new Set();
|
|
157
|
+
const hasTsconfig = existsSync(join(gitRoot, 'tsconfig.json'));
|
|
158
|
+
for (const hint of MANIFEST_HINTS) {
|
|
159
|
+
if (!existsSync(join(gitRoot, hint.filename)))
|
|
160
|
+
continue;
|
|
161
|
+
for (const lang of hint.languages) {
|
|
162
|
+
if (hint.filename === 'package.json' && hasTsconfig && lang === 'javascript') {
|
|
163
|
+
continue;
|
|
164
|
+
}
|
|
165
|
+
out.add(lang);
|
|
166
|
+
}
|
|
167
|
+
}
|
|
168
|
+
return out;
|
|
169
|
+
}
|
|
170
|
+
/**
|
|
171
|
+
* Bounded BFS-by-stack walk from `root`. Caps at MAX_SCAN_FILES +
|
|
172
|
+
* MAX_SCAN_DEPTH. Returns `{ srcCount, languages, wasCapped }`.
|
|
173
|
+
*
|
|
174
|
+
* Why a manual stack rather than `readdirSync({ recursive: true })`:
|
|
175
|
+
* the recursive readdir loads the entire tree into memory before we
|
|
176
|
+
* see the first entry; on a monorepo we would walk node_modules
|
|
177
|
+
* (forbidden) before our SKIP_DIRS filter could fire. A manual stack
|
|
178
|
+
* lets us prune at every level.
|
|
179
|
+
*/
|
|
180
|
+
function scanRepo(root) {
|
|
181
|
+
const languagesFromExt = new Set();
|
|
182
|
+
let srcCount = 0;
|
|
183
|
+
let wasCapped = false;
|
|
184
|
+
// Per-language file counts so we can apply the "at least 3 files"
|
|
185
|
+
// threshold below — a single stray .py in a TS repo should not light
|
|
186
|
+
// up python.
|
|
187
|
+
const perLang = new Map();
|
|
188
|
+
const stack = [{ abs: root, depth: 0 }];
|
|
189
|
+
while (stack.length > 0) {
|
|
190
|
+
const frame = stack.pop();
|
|
191
|
+
if (!frame)
|
|
192
|
+
break;
|
|
193
|
+
if (frame.depth > MAX_SCAN_DEPTH) {
|
|
194
|
+
wasCapped = true;
|
|
195
|
+
continue;
|
|
196
|
+
}
|
|
197
|
+
let entries;
|
|
198
|
+
try {
|
|
199
|
+
entries = readdirSync(frame.abs, { withFileTypes: true });
|
|
200
|
+
}
|
|
201
|
+
catch {
|
|
202
|
+
continue;
|
|
203
|
+
}
|
|
204
|
+
for (const entry of entries) {
|
|
205
|
+
if (srcCount >= MAX_SCAN_FILES) {
|
|
206
|
+
wasCapped = true;
|
|
207
|
+
break;
|
|
208
|
+
}
|
|
209
|
+
if (entry.isDirectory()) {
|
|
210
|
+
if (SKIP_DIRS.has(entry.name))
|
|
211
|
+
continue;
|
|
212
|
+
if (entry.name.startsWith('.') && entry.name !== '.') {
|
|
213
|
+
// Skip hidden dirs that are NOT in our whitelist (e.g. .yarn,
|
|
214
|
+
// .pnpm-store). .pugi/.git are already in SKIP_DIRS.
|
|
215
|
+
continue;
|
|
216
|
+
}
|
|
217
|
+
stack.push({ abs: join(frame.abs, entry.name), depth: frame.depth + 1 });
|
|
218
|
+
continue;
|
|
219
|
+
}
|
|
220
|
+
if (!entry.isFile())
|
|
221
|
+
continue;
|
|
222
|
+
const ext = extensionOf(entry.name);
|
|
223
|
+
if (!ext)
|
|
224
|
+
continue;
|
|
225
|
+
if (!SOURCE_EXTENSIONS.has(ext))
|
|
226
|
+
continue;
|
|
227
|
+
srcCount += 1;
|
|
228
|
+
const lang = languageForExtension(ext);
|
|
229
|
+
if (lang) {
|
|
230
|
+
perLang.set(lang, (perLang.get(lang) ?? 0) + 1);
|
|
231
|
+
}
|
|
232
|
+
}
|
|
233
|
+
if (srcCount >= MAX_SCAN_FILES) {
|
|
234
|
+
wasCapped = true;
|
|
235
|
+
break;
|
|
236
|
+
}
|
|
237
|
+
}
|
|
238
|
+
// Promote per-language counts to detected languages with a noise
|
|
239
|
+
// floor. The threshold is intentionally low (3) so a small repo
|
|
240
|
+
// with a handful of Python utility scripts in an otherwise-TS
|
|
241
|
+
// codebase still surfaces as polyglot.
|
|
242
|
+
for (const [lang, count] of perLang.entries()) {
|
|
243
|
+
if (count >= 3)
|
|
244
|
+
languagesFromExt.add(lang);
|
|
245
|
+
}
|
|
246
|
+
return { srcCount, languagesFromExt, wasCapped };
|
|
247
|
+
}
|
|
248
|
+
/**
|
|
249
|
+
* Map a file extension to a SupportedLanguage. Returns null for
|
|
250
|
+
* extensions we count toward the size category but do NOT surface as
|
|
251
|
+
* supported languages (c, cs, swift, scala, …) — codegraph supports
|
|
252
|
+
* more languages than our nudge gate.
|
|
253
|
+
*/
|
|
254
|
+
export function languageForExtension(ext) {
|
|
255
|
+
switch (ext) {
|
|
256
|
+
case '.ts':
|
|
257
|
+
case '.tsx':
|
|
258
|
+
return 'typescript';
|
|
259
|
+
case '.js':
|
|
260
|
+
case '.jsx':
|
|
261
|
+
case '.mjs':
|
|
262
|
+
case '.cjs':
|
|
263
|
+
return 'javascript';
|
|
264
|
+
case '.py':
|
|
265
|
+
return 'python';
|
|
266
|
+
case '.rs':
|
|
267
|
+
return 'rust';
|
|
268
|
+
case '.go':
|
|
269
|
+
return 'go';
|
|
270
|
+
case '.java':
|
|
271
|
+
case '.kt':
|
|
272
|
+
case '.kts':
|
|
273
|
+
return 'java';
|
|
274
|
+
default:
|
|
275
|
+
return null;
|
|
276
|
+
}
|
|
277
|
+
}
|
|
278
|
+
/**
|
|
279
|
+
* Lowercase extension including the leading dot. Returns null for
|
|
280
|
+
* dotfiles (no extension) and for paths without a dot.
|
|
281
|
+
*/
|
|
282
|
+
function extensionOf(filename) {
|
|
283
|
+
const idx = filename.lastIndexOf('.');
|
|
284
|
+
if (idx <= 0)
|
|
285
|
+
return null;
|
|
286
|
+
// `.env` style dotfiles return `'.env'` from lastIndexOf — they
|
|
287
|
+
// are filtered by the SOURCE_EXTENSIONS membership check below
|
|
288
|
+
// since `.env` is not in the source-language set.
|
|
289
|
+
return filename.slice(idx).toLowerCase();
|
|
290
|
+
}
|
|
291
|
+
/**
|
|
292
|
+
* Classify a file count into the small / medium / large bucket. Pure —
|
|
293
|
+
* exposed so spec callers can pin the exact thresholds independent of
|
|
294
|
+
* the rest of the walker. Operators reading the prompt copy MUST see
|
|
295
|
+
* the same boundaries the implementation enforces.
|
|
296
|
+
*/
|
|
297
|
+
export function categoriseSize(srcCount) {
|
|
298
|
+
if (srcCount <= 50)
|
|
299
|
+
return 'small';
|
|
300
|
+
if (srcCount <= 500)
|
|
301
|
+
return 'medium';
|
|
302
|
+
return 'large';
|
|
303
|
+
}
|
|
304
|
+
/**
|
|
305
|
+
* Single entry-point. Pure. Never throws. Returns the structured
|
|
306
|
+
* verdict so the init prompt + cold-start hook + status command can
|
|
307
|
+
* all branch off one shared computation.
|
|
308
|
+
*/
|
|
309
|
+
export function detectRepo(cwd) {
|
|
310
|
+
let absCwd;
|
|
311
|
+
try {
|
|
312
|
+
absCwd = resolve(cwd);
|
|
313
|
+
const stat = statSync(absCwd);
|
|
314
|
+
if (!stat.isDirectory()) {
|
|
315
|
+
return { isRepo: false, reason: 'unreadable-cwd' };
|
|
316
|
+
}
|
|
317
|
+
}
|
|
318
|
+
catch {
|
|
319
|
+
return { isRepo: false, reason: 'unreadable-cwd' };
|
|
320
|
+
}
|
|
321
|
+
const gitRoot = findGitRoot(absCwd);
|
|
322
|
+
if (!gitRoot) {
|
|
323
|
+
return { isRepo: false, reason: 'no-git' };
|
|
324
|
+
}
|
|
325
|
+
const manifestLangs = detectManifestLanguages(gitRoot);
|
|
326
|
+
const { srcCount, languagesFromExt, wasCapped } = scanRepo(gitRoot);
|
|
327
|
+
const allLangs = new Set();
|
|
328
|
+
for (const lang of manifestLangs)
|
|
329
|
+
allLangs.add(lang);
|
|
330
|
+
for (const lang of languagesFromExt)
|
|
331
|
+
allLangs.add(lang);
|
|
332
|
+
const sortedLangs = [...allLangs].sort();
|
|
333
|
+
const sizeCategory = categoriseSize(srcCount);
|
|
334
|
+
const offerCodegraph = sizeCategory !== 'small' && sortedLangs.length > 0;
|
|
335
|
+
return {
|
|
336
|
+
isRepo: true,
|
|
337
|
+
gitRoot,
|
|
338
|
+
sizeCategory,
|
|
339
|
+
primarySymbolCount: srcCount,
|
|
340
|
+
languages: sortedLangs,
|
|
341
|
+
offerCodegraph,
|
|
342
|
+
wasCapped,
|
|
343
|
+
};
|
|
344
|
+
}
|
|
345
|
+
/**
|
|
346
|
+
* Render the cold-start nudge copy. Pure — exposed for spec parity so
|
|
347
|
+
* the cold-start hook + the spec assert against the same line.
|
|
348
|
+
*
|
|
349
|
+
* "Detected medium TypeScript repo with ~200 src files. Install
|
|
350
|
+
* codegraph MCP for symbol-aware code navigation? (Y/n)"
|
|
351
|
+
*
|
|
352
|
+
* The "~N" formatting rounds to the nearest 10 so the operator does
|
|
353
|
+
* not see a flapping count between scans on the same repo (one stray
|
|
354
|
+
* test fixture would change a precise N by 1).
|
|
355
|
+
*/
|
|
356
|
+
export function buildOfferCopy(detection) {
|
|
357
|
+
const noun = humanLanguageLabel(detection.languages);
|
|
358
|
+
const sizeLabel = detection.sizeCategory === 'large' ? 'large' : 'medium';
|
|
359
|
+
const approx = approxFileCount(detection.primarySymbolCount, detection.wasCapped);
|
|
360
|
+
const strength = detection.sizeCategory === 'large' ? 'strongly recommended' : 'recommended';
|
|
361
|
+
return `Detected ${sizeLabel} ${noun} repo with ${approx} src files (${strength}). Install codegraph MCP for symbol-aware code navigation? (Y/n)`;
|
|
362
|
+
}
|
|
363
|
+
/**
|
|
364
|
+
* Render the "X days old, refresh?" reminder copy. Single sentence,
|
|
365
|
+
* one CTA. The session module surfaces this on the system pane when
|
|
366
|
+
* the codegraph mcp.json entry exists but `lastIndexedAt` is stale.
|
|
367
|
+
*/
|
|
368
|
+
export function buildStaleIndexCopy(daysOld) {
|
|
369
|
+
return `Codegraph index is ${daysOld} day${daysOld === 1 ? '' : 's'} old. Run /codegraph-status to refresh.`;
|
|
370
|
+
}
|
|
371
|
+
/**
|
|
372
|
+
* Render the primary language label for the prompt. We use the
|
|
373
|
+
* first detected language (alphabetic order from `detectRepo`) so
|
|
374
|
+
* the copy is deterministic. Multi-language repos get a generic
|
|
375
|
+
* `polyglot` suffix — saves us from enumerating "TypeScript +
|
|
376
|
+
* Python + Rust + …" in the headline.
|
|
377
|
+
*/
|
|
378
|
+
function humanLanguageLabel(langs) {
|
|
379
|
+
if (langs.length === 0)
|
|
380
|
+
return 'source';
|
|
381
|
+
const primary = labelFor(langs[0]);
|
|
382
|
+
if (langs.length === 1)
|
|
383
|
+
return primary;
|
|
384
|
+
return `${primary} polyglot`;
|
|
385
|
+
}
|
|
386
|
+
function labelFor(lang) {
|
|
387
|
+
switch (lang) {
|
|
388
|
+
case 'typescript': return 'TypeScript';
|
|
389
|
+
case 'javascript': return 'JavaScript';
|
|
390
|
+
case 'python': return 'Python';
|
|
391
|
+
case 'rust': return 'Rust';
|
|
392
|
+
case 'go': return 'Go';
|
|
393
|
+
case 'java': return 'Java';
|
|
394
|
+
}
|
|
395
|
+
}
|
|
396
|
+
function approxFileCount(count, wasCapped) {
|
|
397
|
+
if (wasCapped)
|
|
398
|
+
return `${MAX_SCAN_FILES}+`;
|
|
399
|
+
if (count < 10)
|
|
400
|
+
return String(count);
|
|
401
|
+
const rounded = Math.round(count / 10) * 10;
|
|
402
|
+
return `~${rounded}`;
|
|
403
|
+
}
|
|
404
|
+
/**
|
|
405
|
+
* Parse a manifest hint into its declared languages. Tiny export so
|
|
406
|
+
* spec callers can drive the same map without re-declaring it.
|
|
407
|
+
*/
|
|
408
|
+
export function manifestHintFor(filename) {
|
|
409
|
+
for (const hint of MANIFEST_HINTS) {
|
|
410
|
+
if (hint.filename === filename)
|
|
411
|
+
return hint.languages;
|
|
412
|
+
}
|
|
413
|
+
return null;
|
|
414
|
+
}
|
|
415
|
+
/**
|
|
416
|
+
* Best-effort manifest-only language detection. Useful for callers
|
|
417
|
+
* that already have a `gitRoot` and do NOT want to walk the filesystem
|
|
418
|
+
* (e.g. /codegraph-status, which trusts the existing scan cache).
|
|
419
|
+
*
|
|
420
|
+
* The file-IO is just `existsSync` per manifest — no read/parse. A
|
|
421
|
+
* package.json that mentions Python in its `engines` will NOT light up
|
|
422
|
+
* python here; that is by design. The full scan is the source of truth.
|
|
423
|
+
*/
|
|
424
|
+
export function detectManifestLanguagesPublic(gitRoot) {
|
|
425
|
+
return [...detectManifestLanguages(gitRoot)].sort();
|
|
426
|
+
}
|
|
427
|
+
/**
|
|
428
|
+
* Sniff whether a manifest is structurally JSON. Pure — exposed only
|
|
429
|
+
* so a future surface can avoid double-checking. The manifest probe
|
|
430
|
+
* itself does NOT depend on this; it uses existsSync and trusts the
|
|
431
|
+
* filename heuristic.
|
|
432
|
+
*
|
|
433
|
+
* @internal
|
|
434
|
+
*/
|
|
435
|
+
export function looksLikeJson(text) {
|
|
436
|
+
const trimmed = text.trim();
|
|
437
|
+
if (trimmed.length === 0)
|
|
438
|
+
return false;
|
|
439
|
+
return trimmed.startsWith('{') || trimmed.startsWith('[');
|
|
440
|
+
}
|
|
441
|
+
/**
|
|
442
|
+
* Read the contents of a manifest file. Truncated к 8 KiB so a
|
|
443
|
+
* misnamed multi-MB file (e.g. a vendored lockfile masquerading as
|
|
444
|
+
* package.json) cannot stall the detector. Returns null on any IO
|
|
445
|
+
* error. Reserved for future use by surfaces that want manifest
|
|
446
|
+
* content beyond presence checks.
|
|
447
|
+
*
|
|
448
|
+
* @internal
|
|
449
|
+
*/
|
|
450
|
+
export function readManifestTruncated(absPath, maxBytes = 8 * 1024) {
|
|
451
|
+
try {
|
|
452
|
+
const raw = readFileSync(absPath, 'utf8');
|
|
453
|
+
return raw.length > maxBytes ? raw.slice(0, maxBytes) : raw;
|
|
454
|
+
}
|
|
455
|
+
catch {
|
|
456
|
+
return null;
|
|
457
|
+
}
|
|
458
|
+
}
|
|
459
|
+
//# sourceMappingURL=detect-repo.js.map
|
|
@@ -0,0 +1,134 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Codegraph MCP install helper — Wave 6 BIG TRACK 9 Phase 2.
|
|
3
|
+
*
|
|
4
|
+
* Writes the codegraph MCP server config к `.pugi/mcp.json` so the
|
|
5
|
+
* registry loader picks it up on the next dispatch. Mirrors the
|
|
6
|
+
* Phase 1 example config at `apps/pugi-cli/docs/examples/codegraph.mcp.json`
|
|
7
|
+
* — same `codegraph serve --mcp` command + `pending` trust state. The
|
|
8
|
+
* operator still has to run `pugi mcp trust codegraph` before tools
|
|
9
|
+
* actually surface; the install path NEVER auto-trusts, by design.
|
|
10
|
+
*
|
|
11
|
+
* Idempotent: re-running on a workspace that already has a `codegraph`
|
|
12
|
+
* entry is a no-op + returns `{ status: 'already-installed' }`. Other
|
|
13
|
+
* MCP servers in the same file are preserved.
|
|
14
|
+
*
|
|
15
|
+
* The function is intentionally NOT bundled into core/mcp/ to keep
|
|
16
|
+
* the codegraph product (install copy, decision store, language gate)
|
|
17
|
+
* one cohesive module. The MCP registry is a generic surface; the
|
|
18
|
+
* codegraph adoption is a feature on top of it.
|
|
19
|
+
*/
|
|
20
|
+
import { existsSync, mkdirSync, readFileSync, writeFileSync } from 'node:fs';
|
|
21
|
+
import { resolve } from 'node:path';
|
|
22
|
+
/**
|
|
23
|
+
* Canonical config shape we write into `.pugi/mcp.json` under the
|
|
24
|
+
* `codegraph` key. Matches `mcpServerConfigSchema` (Zod) in
|
|
25
|
+
* core/mcp/client.ts and the published example at docs/examples/
|
|
26
|
+
* codegraph.mcp.json. Drift here MUST land alongside a registry
|
|
27
|
+
* schema change OR the next dispatch crashes with a validation error.
|
|
28
|
+
*/
|
|
29
|
+
export const CODEGRAPH_MCP_ENTRY = Object.freeze({
|
|
30
|
+
command: 'codegraph',
|
|
31
|
+
args: Object.freeze(['serve', '--mcp']),
|
|
32
|
+
env: Object.freeze({}),
|
|
33
|
+
trust: 'pending',
|
|
34
|
+
});
|
|
35
|
+
/**
|
|
36
|
+
* Documentation URL surfaced after a successful install so the operator
|
|
37
|
+
* knows how to actually run codegraph index commands. Single source of
|
|
38
|
+
* truth — both the init flow and the /codegraph-status command pull
|
|
39
|
+
* from this constant.
|
|
40
|
+
*/
|
|
41
|
+
export const CODEGRAPH_DOCS_URL = 'https://github.com/colbymchenry/codegraph';
|
|
42
|
+
/**
|
|
43
|
+
* Merge the codegraph entry into `.pugi/mcp.json`. Creates the file
|
|
44
|
+
* (with `{ schema: 1, servers: { codegraph: ... } }`) when it does not
|
|
45
|
+
* exist. Preserves every other server entry on disk.
|
|
46
|
+
*
|
|
47
|
+
* @param workspaceRoot absolute path to the project root that owns the
|
|
48
|
+
* `.pugi/` directory. The caller is responsible for
|
|
49
|
+
* ensuring `.pugi/` exists (the install helper
|
|
50
|
+
* creates it as a defensive fallback).
|
|
51
|
+
*/
|
|
52
|
+
export function installCodegraphMcpEntry(workspaceRoot) {
|
|
53
|
+
const pugiDir = resolve(workspaceRoot, '.pugi');
|
|
54
|
+
const configPath = resolve(pugiDir, 'mcp.json');
|
|
55
|
+
try {
|
|
56
|
+
if (!existsSync(pugiDir)) {
|
|
57
|
+
mkdirSync(pugiDir, { recursive: true });
|
|
58
|
+
}
|
|
59
|
+
let existing = {};
|
|
60
|
+
if (existsSync(configPath)) {
|
|
61
|
+
try {
|
|
62
|
+
const raw = readFileSync(configPath, 'utf8');
|
|
63
|
+
if (raw.trim().length > 0) {
|
|
64
|
+
const parsed = JSON.parse(raw);
|
|
65
|
+
if (parsed && typeof parsed === 'object') {
|
|
66
|
+
existing = parsed;
|
|
67
|
+
}
|
|
68
|
+
}
|
|
69
|
+
}
|
|
70
|
+
catch (error) {
|
|
71
|
+
return {
|
|
72
|
+
status: 'failed',
|
|
73
|
+
reason: `cannot parse existing .pugi/mcp.json: ${error.message}`,
|
|
74
|
+
};
|
|
75
|
+
}
|
|
76
|
+
}
|
|
77
|
+
const servers = (existing.servers && typeof existing.servers === 'object')
|
|
78
|
+
? { ...existing.servers }
|
|
79
|
+
: {};
|
|
80
|
+
if (servers['codegraph']) {
|
|
81
|
+
return { status: 'already-installed', configPath };
|
|
82
|
+
}
|
|
83
|
+
servers['codegraph'] = {
|
|
84
|
+
command: CODEGRAPH_MCP_ENTRY.command,
|
|
85
|
+
args: [...CODEGRAPH_MCP_ENTRY.args],
|
|
86
|
+
env: { ...CODEGRAPH_MCP_ENTRY.env },
|
|
87
|
+
trust: CODEGRAPH_MCP_ENTRY.trust,
|
|
88
|
+
};
|
|
89
|
+
const out = {
|
|
90
|
+
schema: typeof existing.schema === 'number' ? existing.schema : 1,
|
|
91
|
+
servers,
|
|
92
|
+
};
|
|
93
|
+
writeFileSync(configPath, `${JSON.stringify(out, null, 2)}\n`, { mode: 0o600 });
|
|
94
|
+
return { status: 'installed', configPath };
|
|
95
|
+
}
|
|
96
|
+
catch (error) {
|
|
97
|
+
return { status: 'failed', reason: error.message };
|
|
98
|
+
}
|
|
99
|
+
}
|
|
100
|
+
/**
|
|
101
|
+
* Check whether `.pugi/mcp.json` already declares the `codegraph`
|
|
102
|
+
* server. Pure best-effort — a malformed file returns false (we err
|
|
103
|
+
* on the side of "not installed" so the operator can re-trigger the
|
|
104
|
+
* install path instead of being silently locked out).
|
|
105
|
+
*
|
|
106
|
+
* Returns the parsed `trust` state when present so callers can render
|
|
107
|
+
* the right status copy ("declared, awaiting trust" vs "active").
|
|
108
|
+
*/
|
|
109
|
+
export function detectCodegraphInstalled(workspaceRoot) {
|
|
110
|
+
const configPath = resolve(workspaceRoot, '.pugi/mcp.json');
|
|
111
|
+
if (!existsSync(configPath)) {
|
|
112
|
+
return { installed: false, trust: null, configPath };
|
|
113
|
+
}
|
|
114
|
+
try {
|
|
115
|
+
const raw = readFileSync(configPath, 'utf8');
|
|
116
|
+
if (raw.trim().length === 0) {
|
|
117
|
+
return { installed: false, trust: null, configPath };
|
|
118
|
+
}
|
|
119
|
+
const parsed = JSON.parse(raw);
|
|
120
|
+
const codegraph = parsed.servers?.['codegraph'];
|
|
121
|
+
if (!codegraph) {
|
|
122
|
+
return { installed: false, trust: null, configPath };
|
|
123
|
+
}
|
|
124
|
+
return {
|
|
125
|
+
installed: true,
|
|
126
|
+
trust: codegraph.trust === 'trusted' || codegraph.trust === 'denied' ? codegraph.trust : 'pending',
|
|
127
|
+
configPath,
|
|
128
|
+
};
|
|
129
|
+
}
|
|
130
|
+
catch {
|
|
131
|
+
return { installed: false, trust: null, configPath };
|
|
132
|
+
}
|
|
133
|
+
}
|
|
134
|
+
//# sourceMappingURL=install.js.map
|