sumulige-claude 1.1.2 → 1.2.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.claude/hooks/code-formatter.cjs +7 -2
- package/.claude/hooks/multi-session.cjs +9 -3
- package/.claude/hooks/pre-commit.cjs +0 -0
- package/.claude/hooks/pre-push.cjs +0 -0
- package/.claude/hooks/project-kickoff.cjs +22 -11
- package/.claude/hooks/rag-skill-loader.cjs +7 -0
- package/.claude/hooks/thinking-silent.cjs +9 -3
- package/.claude/hooks/todo-manager.cjs +19 -13
- package/.claude/hooks/verify-work.cjs +10 -4
- package/.claude/quality-gate.json +9 -3
- package/.claude/settings.local.json +16 -1
- package/.claude/templates/hooks/README.md +302 -0
- package/.claude/templates/hooks/hook.sh.template +94 -0
- package/.claude/templates/hooks/user-prompt-submit.cjs.template +116 -0
- package/.claude/templates/hooks/user-response-submit.cjs.template +94 -0
- package/.claude/templates/hooks/validate.js +173 -0
- package/.claude/workflow/document-scanner.js +426 -0
- package/.claude/workflow/knowledge-engine.js +941 -0
- package/.claude/workflow/notebooklm/browser.js +1028 -0
- package/.claude/workflow/phases/phase1-research.js +578 -0
- package/.claude/workflow/phases/phase1-research.ts +465 -0
- package/.claude/workflow/phases/phase2-approve.js +722 -0
- package/.claude/workflow/phases/phase3-plan.js +1200 -0
- package/.claude/workflow/phases/phase4-develop.js +894 -0
- package/.claude/workflow/search-cache.js +230 -0
- package/.claude/workflow/templates/approval.md +315 -0
- package/.claude/workflow/templates/development.md +377 -0
- package/.claude/workflow/templates/planning.md +328 -0
- package/.claude/workflow/templates/research.md +250 -0
- package/.claude/workflow/types.js +37 -0
- package/.claude/workflow/web-search.js +278 -0
- package/.claude-plugin/marketplace.json +2 -2
- package/AGENTS.md +176 -0
- package/CHANGELOG.md +7 -14
- package/cli.js +20 -0
- package/config/quality-gate.json +9 -3
- package/development/cache/web-search/search_1193d605f8eb364651fc2f2041b58a31.json +36 -0
- package/development/cache/web-search/search_3798bf06960edc125f744a1abb5b72c5.json +36 -0
- package/development/cache/web-search/search_37c7d4843a53f0d83f1122a6f908a2a3.json +36 -0
- package/development/cache/web-search/search_44166fa0153709ee168485a22aa0ab40.json +36 -0
- package/development/cache/web-search/search_4deaebb1f77e86a8ca066dc5a49c59fd.json +36 -0
- package/development/cache/web-search/search_94da91789466070a7f545612e73c7372.json +36 -0
- package/development/cache/web-search/search_dd5de8491b8b803a3cb01339cd210fb0.json +36 -0
- package/development/knowledge-base/.index.clean.json +0 -0
- package/development/knowledge-base/.index.json +486 -0
- package/development/knowledge-base/test-best-practices.md +29 -0
- package/development/projects/proj_mkh1pazz_ixmt1/phase1/feasibility-report.md +160 -0
- package/development/projects/proj_mkh4jvnb_z7rwf/phase1/feasibility-report.md +160 -0
- package/development/projects/proj_mkh4jxkd_ewz5a/phase1/feasibility-report.md +160 -0
- package/development/projects/proj_mkh4k84n_ni73k/phase1/feasibility-report.md +160 -0
- package/development/projects/proj_mkh4wfyd_u9w88/phase1/feasibility-report.md +160 -0
- package/development/projects/proj_mkh4wsbo_iahvf/development/projects/proj_mkh4xbpg_4na5w/phase1/feasibility-report.md +160 -0
- package/development/projects/proj_mkh4wsbo_iahvf/phase1/feasibility-report.md +160 -0
- package/development/projects/proj_mkh4xulg_1ka8x/phase1/feasibility-report.md +160 -0
- package/development/projects/proj_mkh4xwhj_gch8j/phase1/feasibility-report.md +160 -0
- package/development/projects/proj_mkh4y2qk_9lm8z/phase1/feasibility-report.md +160 -0
- package/development/projects/proj_mkh4y2qk_9lm8z/phase2/requirements.md +226 -0
- package/development/projects/proj_mkh4y2qk_9lm8z/phase3/PRD.md +345 -0
- package/development/projects/proj_mkh4y2qk_9lm8z/phase3/TASK_PLAN.md +284 -0
- package/development/projects/proj_mkh4y2qk_9lm8z/phase3/prototype/README.md +14 -0
- package/development/projects/proj_mkh4y2qk_9lm8z/phase4/DEVELOPMENT_LOG.md +35 -0
- package/development/projects/proj_mkh4y2qk_9lm8z/phase4/TASKS.md +34 -0
- package/development/projects/proj_mkh4y2qk_9lm8z/phase4/source/.env.example +5 -0
- package/development/projects/proj_mkh4y2qk_9lm8z/phase4/source/README.md +60 -0
- package/development/projects/proj_mkh4y2qk_9lm8z/phase4/source/package.json +25 -0
- package/development/projects/proj_mkh4y2qk_9lm8z/phase4/source/src/index.js +70 -0
- package/development/projects/proj_mkh4y2qk_9lm8z/phase4/source/src/routes/index.js +48 -0
- package/development/projects/proj_mkh4y2qk_9lm8z/phase4/source/tests/health.test.js +20 -0
- package/development/projects/proj_mkh4y2qk_9lm8z/phase4/source/tests/jest.config.js +21 -0
- package/development/projects/proj_mkh7veqg_3lypc/phase1/feasibility-report.md +160 -0
- package/development/projects/proj_mkh7veqg_3lypc/phase2/requirements.md +226 -0
- package/development/projects/proj_mkh7veqg_3lypc/phase3/PRD.md +345 -0
- package/development/projects/proj_mkh7veqg_3lypc/phase3/TASK_PLAN.md +284 -0
- package/development/projects/proj_mkh7veqg_3lypc/phase3/prototype/README.md +14 -0
- package/development/projects/proj_mkh8k8fo_rmqn5/phase1/feasibility-report.md +160 -0
- package/development/projects/proj_mkh8xyhy_1vshq/phase1/feasibility-report.md +178 -0
- package/development/projects/proj_mkh8zddd_dhamf/phase1/feasibility-report.md +377 -0
- package/development/projects/proj_mkh8zddd_dhamf/phase2/requirements.md +442 -0
- package/development/projects/proj_mkh8zddd_dhamf/phase3/api-design.md +800 -0
- package/development/projects/proj_mkh8zddd_dhamf/phase3/architecture.md +625 -0
- package/development/projects/proj_mkh8zddd_dhamf/phase3/data-model.md +830 -0
- package/development/projects/proj_mkh8zddd_dhamf/phase3/risks.md +957 -0
- package/development/projects/proj_mkh8zddd_dhamf/phase3/wbs.md +381 -0
- package/development/todos/.state.json +14 -1
- package/development/todos/INDEX.md +31 -73
- package/development/todos/completed/develop/local-knowledge-index.md +85 -0
- package/development/todos/{active → completed/develop}/todo-system.md +13 -3
- package/development/todos/completed/develop/web-search-integration.md +83 -0
- package/development/todos/completed/test/phase1-e2e-test.md +103 -0
- package/lib/commands.js +388 -0
- package/package.json +3 -2
- package/tests/config-manager.test.js +677 -0
- package/tests/config-validator.test.js +436 -0
- package/tests/errors.test.js +477 -0
- package/tests/manual/phase1-e2e.sh +389 -0
- package/tests/manual/phase2-test-cases.md +311 -0
- package/tests/manual/phase3-test-cases.md +309 -0
- package/tests/manual/phase4-test-cases.md +414 -0
- package/tests/manual/test-cases.md +417 -0
- package/tests/quality-gate.test.js +679 -0
- package/tests/quality-rules.test.js +619 -0
- package/tests/version-check.test.js +75 -0
|
@@ -0,0 +1,426 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Document Scanner - Extract content and metadata from local files
|
|
3
|
+
*
|
|
4
|
+
* Supports:
|
|
5
|
+
* - Text extraction from multiple file formats
|
|
6
|
+
* - Metadata extraction (word count, headings, links)
|
|
7
|
+
* - Content checksum for change detection
|
|
8
|
+
*/
|
|
9
|
+
|
|
10
|
+
const fs = require('fs');
|
|
11
|
+
const path = require('path');
|
|
12
|
+
const crypto = require('crypto');
|
|
13
|
+
|
|
14
|
+
// ============================================================================
|
|
15
|
+
// Configuration
|
|
16
|
+
// ============================================================================
|
|
17
|
+
|
|
18
|
+
// Size limits applied by the scanner.
// Full content is only kept when it is at most this long (500 * 1024).
const MAX_CONTENT_SIZE = 500 * 1024;
// Length of the leading excerpt kept when the full content is not stored.
const MAX_SNIPPET_SIZE = 2000;

// File extensions (lower-case, with leading dot) whose text content is scanned.
const SCANNABLE_TYPES = [
  // Markdown
  '.md',
  '.markdown',
  // Plain text
  '.txt',
  // Config files
  '.json',
  '.yaml',
  '.yml',
  // JavaScript / TypeScript
  '.js',
  '.ts',
  '.jsx',
  '.tsx',
  // Other source code
  '.py',
  '.rs',
  '.go',
  '.java',
  '.c',
  '.cpp',
  '.h',
  '.hpp',
  // Shell scripts
  '.sh',
  '.bash',
  '.zsh',
  '.fish',
  // Stylesheets
  '.css',
  '.scss',
  '.less',
  // Markup
  '.html',
  '.htm',
  '.xml',
  // Query languages
  '.sql',
  '.graphql',
  '.gql'
];
|
|
33
|
+
|
|
34
|
+
// ============================================================================
|
|
35
|
+
// Document Scanner Class
|
|
36
|
+
// ============================================================================
|
|
37
|
+
|
|
38
|
+
class DocumentScanner {
  /**
   * Check whether a file's extension is one of the scannable text types.
   *
   * @param {string} filePath - Path (or bare file name) to check.
   * @returns {boolean} True when the lower-cased extension is listed in SCANNABLE_TYPES.
   */
  static isScannable(filePath) {
    const ext = path.extname(filePath).toLowerCase();
    return SCANNABLE_TYPES.includes(ext);
  }

  /**
   * Scan a single file and return its metadata.
   *
   * Every result carries the basic file metadata (path, size, lastModified,
   * contentType, extension), a `scannable` flag and the extraction fields
   * (wordCount, lineCount, headings, links, codeBlocks, frontMatter). For
   * files that are empty, have a non-scannable extension, or cannot be read,
   * `scannable` is false and the extraction fields are empty placeholders;
   * a read failure additionally sets `error` to the failure message.
   * Scannable files also get `checksum` (MD5 hex of the decoded text) and
   * either `content` (full text) or `snippet` (first MAX_SNIPPET_SIZE chars).
   *
   * @param {string} filePath - File to scan.
   * @param {Object} [options]
   * @param {boolean} [options.includeContent=true] - Store the full text when small enough.
   * @param {number} [options.maxContentSize=MAX_CONTENT_SIZE] - Upper bound, compared
   *   against the decoded string length, above which only a snippet is stored.
   * @returns {Object} Scan result as described above.
   * @throws {Error} When the file does not exist.
   */
  static scanFile(filePath, options = {}) {
    const {
      includeContent = true,
      maxContentSize = MAX_CONTENT_SIZE
    } = options;

    if (!fs.existsSync(filePath)) {
      throw new Error(`File not found: ${filePath}`);
    }

    const stats = fs.statSync(filePath);
    const ext = path.extname(filePath).toLowerCase();

    // Basic metadata shared by every kind of result
    const metadata = {
      path: filePath,
      size: stats.size,
      lastModified: stats.mtimeMs,
      contentType: this.getMimeType(ext),
      extension: ext
    };

    // Placeholder extraction fields so that non-scannable and failed results
    // have the same shape as successful ones (callers can iterate safely).
    const emptyExtraction = {
      wordCount: 0,
      lineCount: 0,
      headings: [],
      links: [],
      codeBlocks: [],
      frontMatter: null
    };

    // Empty files and unsupported extensions are reported without reading content
    if (!this.isScannable(filePath) || stats.size === 0) {
      return {
        ...metadata,
        scannable: false,
        ...emptyExtraction
      };
    }

    // Read file content; a read failure is reported in the result, not thrown
    let content;
    try {
      content = fs.readFileSync(filePath, 'utf-8');
    } catch (error) {
      return {
        ...metadata,
        scannable: false,
        ...emptyExtraction,
        error: error.message
      };
    }

    // Checksum of the decoded text, used for change detection
    const checksum = crypto
      .createHash('md5')
      .update(content)
      .digest('hex');

    const extracted = this.extractMetadata(content, ext);

    // Keep the full text only when requested and small enough; otherwise a snippet
    const shouldStoreContent = includeContent && content.length <= maxContentSize;

    return {
      ...metadata,
      scannable: true,
      checksum,
      wordCount: extracted.wordCount,
      lineCount: extracted.lineCount,
      headings: extracted.headings,
      links: extracted.links,
      codeBlocks: extracted.codeBlocks,
      frontMatter: extracted.frontMatter,
      content: shouldStoreContent ? content : null,
      snippet: shouldStoreContent ? null : content.substring(0, MAX_SNIPPET_SIZE)
    };
  }

  /**
   * Extract counts and structure from text, dispatching on the extension.
   *
   * Markdown ('.md', '.markdown') yields headings, links, code blocks and
   * front matter. '.js', '.ts', '.jsx', '.tsx', '.py', '.rs' and '.go' yield
   * functions/classes as `headings` and imports as `links`. Any other
   * extension only gets word and line counts.
   *
   * @param {string} content - Decoded file text.
   * @param {string} ext - Lower-case extension including the dot.
   * @returns {{wordCount: number, lineCount: number, headings: Array, links: Array,
   *   codeBlocks: Array, frontMatter: (Object|null)}}
   */
  static extractMetadata(content, ext) {
    const wordCount = this.countWords(content);
    const lineCount = content.split(/\r?\n/).length;

    let headings = [];
    let links = [];
    let codeBlocks = [];
    let frontMatter = null;

    if (['.md', '.markdown'].includes(ext)) {
      const mdResult = this.extractMarkdownMetadata(content);
      headings = mdResult.headings;
      links = mdResult.links;
      codeBlocks = mdResult.codeBlocks;
      frontMatter = mdResult.frontMatter;
    } else if (['.js', '.ts', '.jsx', '.tsx', '.py', '.rs', '.go'].includes(ext)) {
      const codeResult = this.extractCodeMetadata(content, ext);
      headings = codeResult.headings; // Functions/classes as headings
      links = codeResult.links; // Import/require statements
    }

    return {
      wordCount,
      lineCount,
      headings,
      links,
      codeBlocks,
      frontMatter
    };
  }

  /**
   * Extract headings, inline links, fenced code blocks and front matter
   * from Markdown text.
   *
   * - Lines are split on LF or CRLF so Windows line endings do not defeat
   *   the per-line patterns.
   * - A leading '---' line opens a front matter section that runs to the
   *   next '---' line; those lines are parsed by parseFrontMatter and are
   *   not scanned for headings or links (a YAML comment is not a heading).
   *   An empty section leaves `frontMatter` as null.
   * - Lines inside ``` fences are collected as code blocks and not scanned.
   *   A fence that is never closed produces no code block entry.
   *
   * @param {string} content - Markdown text.
   * @returns {{headings: Array<{level: number, text: string, line: number}>,
   *   links: Array<{text: string, url: string}>,
   *   codeBlocks: Array<{language: string, lineStart: number, preview: string}>,
   *   frontMatter: (Object|null)}} `line` is 1-based; `lineStart` is the
   *   1-based line number of the opening fence; `preview` is the first three
   *   lines of the block.
   */
  static extractMarkdownMetadata(content) {
    const headings = [];
    const links = [];
    const codeBlocks = [];
    let frontMatter = null;

    const lines = content.split(/\r?\n/);

    // Detect YAML front matter and remember where the document body starts
    let bodyStart = 0;
    if (lines[0] === '---') {
      const closingIdx = lines.indexOf('---', 1);
      if (closingIdx !== -1) {
        if (closingIdx > 1) {
          frontMatter = this.parseFrontMatter(lines.slice(1, closingIdx).join('\n'));
        }
        bodyStart = closingIdx + 1;
      }
    }

    let inCodeBlock = false;
    let codeBlockLang = null;
    let currentCodeBlock = [];

    for (let i = bodyStart; i < lines.length; i++) {
      const line = lines[i];

      // Fence lines toggle code-block state
      if (line.startsWith('```')) {
        if (!inCodeBlock) {
          inCodeBlock = true;
          codeBlockLang = line.substring(3).trim() || 'text';
          currentCodeBlock = [];
        } else {
          codeBlocks.push({
            language: codeBlockLang,
            // i is the 0-based index of the closing fence, so this is the
            // 1-based line number of the opening fence
            lineStart: i - currentCodeBlock.length,
            preview: currentCodeBlock.slice(0, 3).join('\n')
          });
          inCodeBlock = false;
          currentCodeBlock = [];
        }
        continue;
      }

      if (inCodeBlock) {
        currentCodeBlock.push(line);
        continue;
      }

      // ATX headings: 1-6 '#' characters followed by whitespace and text
      const headingMatch = line.match(/^(#{1,6})\s+(.+)$/);
      if (headingMatch) {
        headings.push({
          level: headingMatch[1].length,
          text: headingMatch[2].trim(),
          line: i + 1
        });
      }

      // Inline links: [text](url). A fresh regex per line keeps lastIndex local.
      const linkPattern = /\[([^\]]+)\]\(([^)]+)\)/g;
      let linkMatch = linkPattern.exec(line);
      while (linkMatch !== null) {
        links.push({ text: linkMatch[1], url: linkMatch[2] });
        linkMatch = linkPattern.exec(line);
      }
    }

    return { headings, links, codeBlocks, frontMatter };
  }

  /**
   * Extract function/class declarations and import statements from source
   * code using per-language, line-based regular expressions (a heuristic,
   * not a parser: matches inside comments or strings are also reported).
   *
   * JS/TS patterns recognise `export` / `export default` prefixes, plain
   * and side-effect `import` statements and `require('...')` calls. Python
   * patterns recognise `async def`, classes with or without base classes,
   * and dotted module names. Unknown extensions fall back to the JS patterns.
   *
   * @param {string} content - Source text.
   * @param {string} ext - Lower-case extension including the dot.
   * @returns {{headings: Array<{type: string, name: string, line: number}>,
   *   links: Array<{type: string, name: string, line: number}>}} `type` is
   *   'function' or 'class' for headings and 'import' for links; `line` is 1-based.
   */
  static extractCodeMetadata(content, ext) {
    const headings = [];
    const links = [];

    const lines = content.split(/\r?\n/);

    // JavaScript and TypeScript variants share one pattern set
    const jsPatterns = {
      func: /^\s*(?:export\s+(?:default\s+)?)?(?:async\s+)?function\s+(\w+)/,
      class: /^\s*(?:export\s+(?:default\s+)?)?(?:abstract\s+)?class\s+(\w+)/,
      import: /^\s*import\s+(?:.*from\s+)?['"]([^'"]+)['"]|\brequire\(\s*['"]([^'"]+)['"]\s*\)/
    };

    const patterns = {
      '.js': jsPatterns,
      '.ts': jsPatterns,
      '.jsx': jsPatterns,
      '.tsx': jsPatterns,
      '.py': {
        func: /^\s*(?:async\s+)?def\s+(\w+)\s*\(/,
        class: /^\s*class\s+(\w+)\s*[:(]/,
        import: /^\s*(?:import|from)\s+([\w.]+)/
      },
      '.rs': {
        func: /^\s*(?:pub\s+)?fn\s+(\w+)\s*\(/,
        class: /^\s*(?:pub\s+)?(struct|enum|trait)\s+(\w+)/,
        import: /^\s*use\s+([^;]+);/
      },
      '.go': {
        func: /^\s*func\s+(?:\(\w+\s+\*?\w+\)\s+)?(\w+)\s*\(/,
        class: /^\s*type\s+(\w+)\s+struct/,
        import: /^\s*import\s+(?:\(|")([^")]+)/
      }
    };

    // Own-property check so inherited keys (e.g. 'constructor') never select a pattern set
    const lang = Object.prototype.hasOwnProperty.call(patterns, ext)
      ? patterns[ext]
      : patterns['.js'];

    for (let i = 0; i < lines.length; i++) {
      const line = lines[i];

      const funcMatch = line.match(lang.func);
      if (funcMatch) {
        headings.push({ type: 'function', name: funcMatch[1], line: i + 1 });
      }

      const classMatch = line.match(lang.class);
      if (classMatch) {
        // The Rust pattern captures the keyword in group 1 and the name in group 2
        const name = classMatch[2] || classMatch[1];
        headings.push({ type: 'class', name, line: i + 1 });
      }

      const importMatch = line.match(lang.import);
      if (importMatch) {
        // The JS pattern captures `import` targets in group 1 and `require` targets in group 2
        const name = importMatch[1] || importMatch[2];
        links.push({ type: 'import', name, line: i + 1 });
      }
    }

    return { headings, links };
  }

  /**
   * Parse simple `key: value` lines from a YAML front matter section.
   *
   * Only flat scalar entries are recognised; keys may contain word
   * characters and hyphens. Values are kept as trimmed strings (quotes are
   * not stripped). Lines that do not match, such as nested structures, list
   * items and comments, are ignored.
   *
   * @param {string} content - Text between the '---' delimiters.
   * @returns {Object<string, string>} Parsed key/value pairs.
   */
  static parseFrontMatter(content) {
    const result = {};

    for (const line of content.split(/\r?\n/)) {
      const match = line.match(/^([\w-]+):\s*(.+)$/);
      if (match) {
        result[match[1]] = match[2].trim();
      }
    }

    return result;
  }

  /**
   * Count tokens in text as a rough word count.
   *
   * Whitespace and the punctuation characters `{}();,.<>[]` all act as
   * separators, so the same rule is applied to prose and to code.
   *
   * @param {string} content - Text to measure.
   * @returns {number} Number of non-empty tokens.
   */
  static countWords(content) {
    return content
      .split(/[\s{}();,.<>[\]]+/)
      .filter(token => token.length > 0)
      .length;
  }

  /**
   * Map a file extension to a MIME type.
   *
   * @param {string} ext - Extension including the dot; matched case-insensitively.
   * @returns {string} The mapped type, or 'text/plain' for unknown extensions.
   */
  static getMimeType(ext) {
    const mimeTypes = {
      '.md': 'text/markdown',
      '.markdown': 'text/markdown',
      '.txt': 'text/plain',
      '.json': 'application/json',
      '.yaml': 'text/yaml',
      '.yml': 'text/yaml',
      '.js': 'text/javascript',
      '.ts': 'text/typescript',
      '.jsx': 'text/jsx',
      '.tsx': 'text/tsx',
      '.py': 'text/x-python',
      '.rs': 'text/x-rust',
      '.go': 'text/x-go',
      '.java': 'text/x-java',
      '.c': 'text/x-c',
      '.cpp': 'text/x-c++',
      '.h': 'text/x-c',
      '.hpp': 'text/x-c++',
      '.sh': 'text/x-shellscript',
      '.bash': 'text/x-shellscript',
      '.zsh': 'text/x-shellscript',
      '.fish': 'text/x-shellscript',
      '.css': 'text/css',
      '.scss': 'text/x-scss',
      '.less': 'text/x-less',
      '.html': 'text/html',
      '.htm': 'text/html',
      '.xml': 'text/xml',
      '.sql': 'text/x-sql',
      '.graphql': 'text/x-graphql',
      '.gql': 'text/x-graphql'
    };

    const key = ext.toLowerCase();
    // Own-property check so inherited keys never leak out as a "MIME type"
    return Object.prototype.hasOwnProperty.call(mimeTypes, key)
      ? mimeTypes[key]
      : 'text/plain';
  }

  /**
   * Scan a directory breadth-first and return one scanFile result per file.
   *
   * Scanning is best-effort: directories that cannot be listed and files
   * whose scan throws are skipped rather than aborting the whole walk.
   * Only regular files and directories (as reported by the directory
   * entries) are visited.
   *
   * @param {string} dirPath - Root directory.
   * @param {Object} [options] - Also forwarded unchanged to scanFile.
   * @param {boolean} [options.recursive=true] - Descend into sub-directories.
   * @param {number} [options.maxDepth=10] - Deepest level scanned (root is depth 0).
   * @param {Array<string|RegExp>} [options.includePatterns=[]] - When non-empty, a
   *   file is scanned only if its full path contains one of the strings or
   *   matches one of the regular expressions.
   * @param {string[]} [options.excludePatterns] - Directory names (exact match)
   *   that are never entered.
   * @returns {Object[]} Scan results in traversal order.
   * @throws {Error} When dirPath does not exist.
   */
  static scanDirectory(dirPath, options = {}) {
    const {
      recursive = true,
      maxDepth = 10,
      includePatterns = [],
      excludePatterns = ['node_modules', '.git', 'dist', 'build', 'coverage']
    } = options;

    if (!fs.existsSync(dirPath)) {
      throw new Error(`Directory not found: ${dirPath}`);
    }

    const results = [];
    const scanQueue = [{ dir: dirPath, depth: 0 }];

    // Index cursor instead of shift(): same FIFO order without re-indexing the array
    for (let head = 0; head < scanQueue.length; head++) {
      const { dir, depth } = scanQueue[head];

      if (depth > maxDepth) continue;

      let entries;
      try {
        entries = fs.readdirSync(dir, { withFileTypes: true });
      } catch (error) {
        continue; // Skip directories we can't read
      }

      for (const entry of entries) {
        // Skip excluded directories
        if (entry.isDirectory() && excludePatterns.includes(entry.name)) {
          continue;
        }

        const fullPath = path.join(dir, entry.name);

        if (entry.isDirectory() && recursive) {
          scanQueue.push({ dir: fullPath, depth: depth + 1 });
        } else if (entry.isFile()) {
          if (includePatterns.length > 0) {
            const matches = includePatterns.some(pattern => {
              if (pattern instanceof RegExp) {
                // test() on a /g or /y regex resumes from lastIndex; reset it so
                // the result does not depend on the previously tested path
                pattern.lastIndex = 0;
                return pattern.test(fullPath);
              }
              return fullPath.includes(pattern);
            });
            if (!matches) continue;
          }

          try {
            results.push(this.scanFile(fullPath, options));
          } catch (error) {
            // Deliberate best-effort: a file that vanished or cannot be
            // stat'ed mid-walk is skipped so the remaining files are still scanned
          }
        }
      }
    }

    return results;
  }
}
|
|
416
|
+
|
|
417
|
+
// ============================================================================
|
|
418
|
+
// Exports
|
|
419
|
+
// ============================================================================
|
|
420
|
+
|
|
421
|
+
// Public API of this module (CommonJS): the scanner class plus its tuning constants.
module.exports = { DocumentScanner, SCANNABLE_TYPES, MAX_CONTENT_SIZE, MAX_SNIPPET_SIZE };
|