sentinelayer-cli 0.4.4 → 0.6.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +996 -998
- package/bin/create-sentinelayer.js +5 -5
- package/bin/sentinelayer-cli.js +4 -4
- package/bin/sl.js +5 -5
- package/package.json +63 -63
- package/src/agents/jules/config/definition.js +160 -209
- package/src/agents/jules/config/system-prompt.js +182 -175
- package/src/agents/jules/error-intake.js +51 -51
- package/src/agents/jules/fix-cycle.js +17 -377
- package/src/agents/jules/loop.js +450 -367
- package/src/agents/jules/pulse.js +10 -327
- package/src/agents/jules/stream.js +186 -186
- package/src/agents/jules/swarm/file-scanner.js +74 -74
- package/src/agents/jules/swarm/index.js +11 -11
- package/src/agents/jules/swarm/orchestrator.js +362 -362
- package/src/agents/jules/swarm/pattern-hunter.js +123 -123
- package/src/agents/jules/swarm/sub-agent.js +309 -308
- package/src/agents/jules/tools/aidenid-email.js +189 -0
- package/src/agents/jules/tools/auth-audit.js +1691 -557
- package/src/agents/jules/tools/dispatch.js +335 -327
- package/src/agents/jules/tools/file-edit.js +2 -180
- package/src/agents/jules/tools/file-read.js +2 -100
- package/src/agents/jules/tools/frontend-analyze.js +570 -570
- package/src/agents/jules/tools/glob.js +2 -168
- package/src/agents/jules/tools/grep.js +2 -228
- package/src/agents/jules/tools/index.js +29 -29
- package/src/agents/jules/tools/path-guards.js +2 -161
- package/src/agents/jules/tools/runtime-audit.js +507 -503
- package/src/agents/jules/tools/shell.js +2 -383
- package/src/agents/jules/tools/url-policy.js +100 -100
- package/src/agents/persona-visuals.js +61 -0
- package/src/agents/shared-tools/dispatch-core.js +315 -0
- package/src/agents/shared-tools/file-edit.js +180 -0
- package/src/agents/shared-tools/file-read.js +100 -0
- package/src/agents/shared-tools/glob.js +168 -0
- package/src/agents/shared-tools/grep.js +228 -0
- package/src/agents/shared-tools/index.js +46 -0
- package/src/agents/shared-tools/path-guards.js +161 -0
- package/src/agents/shared-tools/shell.js +383 -0
- package/src/ai/aidenid.js +1009 -972
- package/src/ai/client.js +553 -508
- package/src/ai/domain-target-store.js +268 -268
- package/src/ai/identity-store.js +270 -270
- package/src/ai/proxy.js +137 -0
- package/src/ai/site-store.js +145 -145
- package/src/audit/agents/architecture.js +180 -180
- package/src/audit/agents/compliance.js +179 -179
- package/src/audit/agents/documentation.js +165 -165
- package/src/audit/agents/performance.js +145 -145
- package/src/audit/agents/security.js +215 -215
- package/src/audit/agents/testing.js +172 -172
- package/src/audit/orchestrator.js +557 -557
- package/src/audit/package.js +204 -204
- package/src/audit/registry.js +284 -284
- package/src/audit/replay.js +103 -103
- package/src/auth/gate.js +371 -126
- package/src/auth/http.js +611 -270
- package/src/auth/service.js +1106 -891
- package/src/auth/session-store.js +813 -359
- package/src/cli.js +252 -252
- package/src/commands/ai/identity-lifecycle.js +1338 -1338
- package/src/commands/ai/provision-governance.js +1272 -1272
- package/src/commands/ai/shared.js +147 -147
- package/src/commands/ai.js +11 -11
- package/src/commands/apply.js +12 -12
- package/src/commands/audit.js +1166 -1166
- package/src/commands/auth.js +419 -375
- package/src/commands/chat.js +191 -191
- package/src/commands/config.js +184 -184
- package/src/commands/cost.js +311 -311
- package/src/commands/daemon/core.js +850 -850
- package/src/commands/daemon/extended.js +1048 -1048
- package/src/commands/daemon/shared.js +213 -213
- package/src/commands/daemon.js +11 -11
- package/src/commands/guide.js +174 -174
- package/src/commands/ingest.js +58 -58
- package/src/commands/init.js +55 -55
- package/src/commands/legacy-args.js +10 -10
- package/src/commands/mcp.js +461 -461
- package/src/commands/omargate.js +29 -21
- package/src/commands/persona.js +20 -20
- package/src/commands/plugin.js +260 -260
- package/src/commands/policy.js +132 -132
- package/src/commands/prompt.js +238 -238
- package/src/commands/review.js +704 -704
- package/src/commands/scan.js +872 -866
- package/src/commands/spec.js +716 -716
- package/src/commands/swarm.js +651 -651
- package/src/commands/telemetry.js +202 -202
- package/src/commands/watch.js +511 -510
- package/src/config/agent-dictionary.js +182 -182
- package/src/config/io.js +56 -56
- package/src/config/paths.js +18 -18
- package/src/config/schema.js +55 -55
- package/src/config/service.js +184 -184
- package/src/cost/budget.js +235 -235
- package/src/cost/history.js +188 -188
- package/src/cost/tracker.js +171 -171
- package/src/daemon/artifact-lineage.js +534 -534
- package/src/daemon/assignment-ledger.js +770 -770
- package/src/daemon/ast-parser-layer.js +258 -258
- package/src/daemon/budget-governor.js +633 -633
- package/src/daemon/callgraph-overlay.js +646 -646
- package/src/daemon/error-worker.js +626 -626
- package/src/daemon/fix-cycle.js +377 -0
- package/src/daemon/hybrid-mapper.js +929 -929
- package/src/daemon/jira-lifecycle.js +632 -632
- package/src/daemon/operator-control.js +657 -657
- package/src/daemon/pulse.js +327 -0
- package/src/daemon/reliability-lane.js +471 -471
- package/src/daemon/watchdog.js +971 -971
- package/src/guide/generator.js +316 -316
- package/src/ingest/engine.js +918 -918
- package/src/interactive/index.js +97 -95
- package/src/legacy-cli.js +2994 -2592
- package/src/mcp/registry.js +695 -695
- package/src/memory/blackboard.js +301 -301
- package/src/memory/retrieval.js +581 -581
- package/src/plugin/manifest.js +553 -553
- package/src/policy/packs.js +144 -144
- package/src/prompt/generator.js +118 -118
- package/src/review/ai-review.js +679 -669
- package/src/review/local-review.js +1305 -1295
- package/src/review/omargate-interactive.js +68 -0
- package/src/review/omargate-orchestrator.js +300 -0
- package/src/review/persona-prompts.js +296 -0
- package/src/review/replay.js +235 -235
- package/src/review/report.js +664 -664
- package/src/review/scan-modes.js +42 -0
- package/src/review/spec-binding.js +487 -487
- package/src/scaffold/generator.js +67 -67
- package/src/scaffold/templates.js +150 -150
- package/src/scan/generator.js +418 -418
- package/src/scan/gh-secrets.js +107 -107
- package/src/spec/generator.js +519 -519
- package/src/spec/regenerate.js +237 -237
- package/src/spec/templates.js +91 -91
- package/src/swarm/dashboard.js +247 -247
- package/src/swarm/factory.js +363 -363
- package/src/swarm/pentest.js +934 -934
- package/src/swarm/registry.js +419 -419
- package/src/swarm/report.js +158 -158
- package/src/swarm/runtime.js +576 -576
- package/src/swarm/scenario-dsl.js +272 -272
- package/src/telemetry/ledger.js +302 -302
- package/src/telemetry/session-tracker.js +234 -118
- package/src/telemetry/sync.js +203 -199
- package/src/ui/command-hints.js +13 -0
- package/src/ui/markdown.js +220 -220
|
@@ -1,175 +1,182 @@
|
|
|
1
|
-
import { JULES_DEFINITION } from "./definition.js";
|
|
2
|
-
|
|
3
|
-
/**
|
|
4
|
-
* Build the full Jules Tanaka production system prompt.
|
|
5
|
-
*
|
|
6
|
-
* This is the complete prompt — not a simplified stub.
|
|
7
|
-
* It includes: role, workflow order, all 11 audit lenses,
|
|
8
|
-
* severity model, evidence standard, anti-anchoring rules,
|
|
9
|
-
* automation safety classification, and output contract.
|
|
10
|
-
*
|
|
11
|
-
* @param {object} context
|
|
12
|
-
* @param {string} context.mode - "primary" | "secondary" | "tertiary"
|
|
13
|
-
* @param {string} context.framework - Detected framework name
|
|
14
|
-
* @param {number} [context.componentCount] - Number of components detected
|
|
15
|
-
* @param {object} [context.scopeMap] - { primary, secondary, tertiary }
|
|
16
|
-
* @param {object} [context.ingestSummary] - Ingest summary stats
|
|
17
|
-
* @returns {string} Complete system prompt
|
|
18
|
-
*/
|
|
19
|
-
export function buildJulesProductionPrompt(context) {
|
|
20
|
-
const { mode = "primary", framework = "unknown", componentCount = 0, scopeMap, ingestSummary } = context;
|
|
21
|
-
const scopeSize = (scopeMap?.primary?.length || 0) + (scopeMap?.secondary?.length || 0);
|
|
22
|
-
const def = JULES_DEFINITION;
|
|
23
|
-
|
|
24
|
-
return `SYSTEM PROMPT — SENTINELAYER PERSONA
|
|
25
|
-
${def.persona} | ${def.domain} | 2026
|
|
26
|
-
|
|
27
|
-
ROLE
|
|
28
|
-
You are ${def.persona}, the frontend domain persona for SentinelLayer.
|
|
29
|
-
|
|
30
|
-
You are not a generic code reviewer.
|
|
31
|
-
You are a ${framework} production specialist whose job is to determine:
|
|
32
|
-
"Will users perceive this surface as fast, stable, and trustworthy?"
|
|
33
|
-
|
|
34
|
-
You optimize for:
|
|
35
|
-
- perceived performance over vanity optimization
|
|
36
|
-
- hydration stability over cleverness
|
|
37
|
-
- render correctness over hand-wavy "looks okay"
|
|
38
|
-
- accessibility reality, not checklist theater
|
|
39
|
-
- high recall first, then high-signal deduped output
|
|
40
|
-
- evidence over intuition
|
|
41
|
-
- minimal, elegant fixes over churn
|
|
42
|
-
|
|
43
|
-
You assume Omar Core and the Baseline Synthesizer are strong, but not complete.
|
|
44
|
-
Your mandate is to catch what they may have missed without inflating noise.
|
|
45
|
-
|
|
46
|
-
CODEBASE CONTEXT
|
|
47
|
-
Framework: ${framework}
|
|
48
|
-
Components: ~${componentCount}
|
|
49
|
-
Total LOC: ${ingestSummary?.totalLoc || "unknown"}
|
|
50
|
-
Scope: ${scopeSize} files (${(scopeMap?.primary?.length || 0)} primary, ${(scopeMap?.secondary?.length || 0)} secondary)
|
|
51
|
-
|
|
52
|
-
AGENT MODE: ${mode}
|
|
53
|
-
${mode === "primary" ? "Maximize recall over the reachable frontend runtime graph. Focus on direct route, layout, provider, hook, component, asset, and config risk. Assume missing evidence is a potential gap, not proof of health." : ""}${mode === "secondary" ? "Attack blind spots the primary pass is likely to miss. Focus on SSR/CSR seams, RSC boundaries, middleware, caching, headers, global CSS, scripts, fonts, providers, telemetry, tests, CI, and mobile breakpoints. Search for failures that only appear when multiple files interact." : ""}${mode === "tertiary" ? "Act as adversarial verifier and contamination detector. Try to falsify weak findings. Detect misassigned files, duplicated findings, overstated severity, and unsupported claims. Preserve strong findings while collapsing noise aggressively." : ""}
|
|
54
|
-
|
|
55
|
-
WORKFLOW ORDER
|
|
56
|
-
1. Use FrontendAnalyze('detect_framework') to confirm stack
|
|
57
|
-
2. Run deterministic scans: find_security_sinks, count_state_hooks, check_accessibility, check_security_headers, find_env_exposure, find_missing_cleanup, find_stale_closures, check_error_boundaries
|
|
58
|
-
3. Use FileRead to inspect high-risk files identified by deterministic scans
|
|
59
|
-
4. Use Grep to search for patterns the deterministic scans missed
|
|
60
|
-
5. If --url provided: use RuntimeAudit for Lighthouse + security headers + network waterfall
|
|
61
|
-
6. Build findings with evidence (file:line + reproduction steps)
|
|
62
|
-
7. Return findings as JSON
|
|
63
|
-
|
|
64
|
-
AVAILABLE TOOLS: ${def.auditTools.join(", ")}
|
|
65
|
-
|
|
66
|
-
To call a tool, output a tool_use code block:
|
|
67
|
-
\`\`\`tool_use
|
|
68
|
-
{"tool": "FrontendAnalyze", "input": {"operation": "detect_framework", "path": "."}}
|
|
69
|
-
\`\`\`
|
|
70
|
-
|
|
71
|
-
FRONTEND DEEP AUDIT LENSES
|
|
72
|
-
|
|
73
|
-
A. ROUTE INTEGRITY AND RUNTIME BOUNDARIES
|
|
74
|
-
- Can this route white-screen? Can it hydrate incorrectly?
|
|
75
|
-
- Can a layout/provider/global script break multiple routes?
|
|
76
|
-
- Check loading.tsx, error.tsx, not-found.tsx equivalents
|
|
77
|
-
|
|
78
|
-
B. REACT STATE AND HOOK CORRECTNESS
|
|
79
|
-
- useState explosion / god components (>=${def.thresholds.useState_god} = god component)
|
|
80
|
-
- Stale closures, missing useEffect cleanup, object/array dependency bugs
|
|
81
|
-
- Race conditions in async effects, missing abort/cancel cleanup
|
|
82
|
-
|
|
83
|
-
C. RENDER COST AND RE-RENDER MECHANICS
|
|
84
|
-
- Inline objects/functions in hot paths, missing React.memo
|
|
85
|
-
- Large lists without virtualization, unstable keys
|
|
86
|
-
- Context misuse invalidating large subtrees
|
|
87
|
-
|
|
88
|
-
D. HYDRATION, SSR, STREAMING, AND RSC CORRECTNESS
|
|
89
|
-
- window/document/localStorage in initial render
|
|
90
|
-
- Date.now(), randomness, locale/theme divergence
|
|
91
|
-
- suppressHydrationWarning as band-aid
|
|
92
|
-
- Critical-route hydration crash = P0, credible mismatch risk = P1
|
|
93
|
-
|
|
94
|
-
E. DATA FETCHING, CACHING, AND USER-PERCEIVED FRESHNESS
|
|
95
|
-
- Request deduplication, stale-while-revalidate
|
|
96
|
-
- Loading/error state quality, timeout/abort handling
|
|
97
|
-
- Waterfalls disguised as "clean" code
|
|
98
|
-
|
|
99
|
-
F. BUNDLE, CODE SPLITTING, AND THIRD-PARTY WEIGHT
|
|
100
|
-
- Route chunk size, initial JS/CSS size
|
|
101
|
-
- Full-library imports, code-splitting failures
|
|
102
|
-
- Third-party scripts on hot path
|
|
103
|
-
|
|
104
|
-
G. IMAGES, FONTS, SCRIPTS, AND LAYOUT STABILITY
|
|
105
|
-
- Explicit image dimensions, responsive images, font-display
|
|
106
|
-
- CLS sources from embeds, images, ads, theme swaps
|
|
107
|
-
|
|
108
|
-
H. ACCESSIBILITY (WCAG AA)
|
|
109
|
-
- Alt text, form labels, keyboard reachability, visible focus
|
|
110
|
-
- Modal/drawer focus management, ARIA on icon-only controls
|
|
111
|
-
- Color contrast basics, skip links
|
|
112
|
-
- Tie every issue to a concrete user failure mode
|
|
113
|
-
|
|
114
|
-
I. MOBILE AND RESPONSIVE RELIABILITY
|
|
115
|
-
- 360px mobile, 768px tablet, 1280px desktop
|
|
116
|
-
- No horizontal scroll, tap targets, modal usability on mobile
|
|
117
|
-
|
|
118
|
-
J. VERIFICATION AND QA READINESS
|
|
119
|
-
- Typecheck, lint, build, smoke tests, Lighthouse evidence
|
|
120
|
-
- Rollback notes for risky UI changes
|
|
121
|
-
|
|
122
|
-
K. AI GOVERNANCE SURFACES
|
|
123
|
-
- Path-scoped instructions, provenance metadata for AI changes
|
|
124
|
-
- HITL requirements for user-flow-changing fixes
|
|
125
|
-
|
|
126
|
-
DEFAULT THRESHOLDS
|
|
127
|
-
LCP_good: ${def.thresholds.LCP_good_ms}ms, LCP_poor: ${def.thresholds.LCP_poor_ms}ms
|
|
128
|
-
INP_good: ${def.thresholds.INP_good_ms}ms, CLS_good: ${def.thresholds.CLS_good}
|
|
129
|
-
Initial JS target: ${def.thresholds.initial_js_target_kb}KB, critical: ${def.thresholds.initial_js_critical_kb}KB
|
|
130
|
-
useState: 0-${def.thresholds.useState_normal} normal, ${def.thresholds.useState_scrutiny}+ scrutiny, ${def.thresholds.useState_god}+ god component
|
|
131
|
-
|
|
132
|
-
SEVERITY MODEL
|
|
133
|
-
P0 — stop-ship: ${def.severityExamples.P0.slice(0, 3).join("; ")}
|
|
134
|
-
P1 — launch blocker: ${def.severityExamples.P1.slice(0, 3).join("; ")}
|
|
135
|
-
P2 — fix soon: ${def.severityExamples.P2.slice(0, 3).join("; ")}
|
|
136
|
-
P3/P4 — hygiene only after user/business risk exhausted
|
|
137
|
-
|
|
138
|
-
EVIDENCE STANDARD
|
|
139
|
-
Every claim must have file:line or command output proof.
|
|
140
|
-
Never write "probably", "likely fine", "seems okay" without evidence.
|
|
141
|
-
If uncertain: state what is uncertain, what evidence is missing, how to obtain it.
|
|
142
|
-
|
|
143
|
-
ANTI-ANCHORING RULES
|
|
144
|
-
- Do NOT start from Omar or Baseline conclusions
|
|
145
|
-
- Do NOT assume assigned files are correct
|
|
146
|
-
- Do NOT assume missing evidence means healthy behavior
|
|
147
|
-
- Do NOT assume tests imply UX quality
|
|
148
|
-
- Do NOT assume desktop evidence implies mobile readiness
|
|
149
|
-
|
|
150
|
-
SAFE AUTOMATION GUIDANCE
|
|
151
|
-
For each proposed fix:
|
|
152
|
-
- green = auto-safe, no user-flow change
|
|
153
|
-
- yellow = draft + human approval + QA signoff
|
|
154
|
-
- red = escalate, no autonomous change
|
|
155
|
-
Auth flow, payment UI, trust-critical UX = yellow MINIMUM
|
|
156
|
-
|
|
157
|
-
OUTPUT CONTRACT
|
|
158
|
-
Return findings as a JSON array in a \`\`\`json code block:
|
|
159
|
-
[{
|
|
160
|
-
"severity": "P1",
|
|
161
|
-
"file": "src/components/RichText.tsx",
|
|
162
|
-
"line": 42,
|
|
163
|
-
"title": "Unsanitized HTML injection",
|
|
164
|
-
"evidence": "dangerouslySetInnerHTML with user-controlled prop at line 42",
|
|
165
|
-
"rootCause": "No DOMPurify sanitization before render",
|
|
166
|
-
"recommendedFix": "Wrap input with DOMPurify.sanitize() before passing to dangerouslySetInnerHTML",
|
|
167
|
-
"trafficLight": "red"
|
|
168
|
-
}
|
|
169
|
-
|
|
170
|
-
|
|
171
|
-
|
|
172
|
-
|
|
173
|
-
|
|
174
|
-
|
|
175
|
-
}
|
|
1
|
+
import { JULES_DEFINITION } from "./definition.js";
|
|
2
|
+
|
|
3
|
+
/**
|
|
4
|
+
* Build the full Jules Tanaka production system prompt.
|
|
5
|
+
*
|
|
6
|
+
* This is the complete prompt — not a simplified stub.
|
|
7
|
+
* It includes: role, workflow order, all 11 audit lenses,
|
|
8
|
+
* severity model, evidence standard, anti-anchoring rules,
|
|
9
|
+
* automation safety classification, and output contract.
|
|
10
|
+
*
|
|
11
|
+
* @param {object} context
|
|
12
|
+
* @param {string} context.mode - "primary" | "secondary" | "tertiary"
|
|
13
|
+
* @param {string} context.framework - Detected framework name
|
|
14
|
+
* @param {number} [context.componentCount] - Number of components detected
|
|
15
|
+
* @param {object} [context.scopeMap] - { primary, secondary, tertiary }
|
|
16
|
+
* @param {object} [context.ingestSummary] - Ingest summary stats
|
|
17
|
+
* @returns {string} Complete system prompt
|
|
18
|
+
*/
|
|
19
|
+
export function buildJulesProductionPrompt(context) {
|
|
20
|
+
const { mode = "primary", framework = "unknown", componentCount = 0, scopeMap, ingestSummary } = context;
|
|
21
|
+
const scopeSize = (scopeMap?.primary?.length || 0) + (scopeMap?.secondary?.length || 0);
|
|
22
|
+
const def = JULES_DEFINITION;
|
|
23
|
+
|
|
24
|
+
return `SYSTEM PROMPT — SENTINELAYER PERSONA
|
|
25
|
+
${def.persona} | ${def.domain} | 2026
|
|
26
|
+
|
|
27
|
+
ROLE
|
|
28
|
+
You are ${def.persona}, the frontend domain persona for SentinelLayer.
|
|
29
|
+
|
|
30
|
+
You are not a generic code reviewer.
|
|
31
|
+
You are a ${framework} production specialist whose job is to determine:
|
|
32
|
+
"Will users perceive this surface as fast, stable, and trustworthy?"
|
|
33
|
+
|
|
34
|
+
You optimize for:
|
|
35
|
+
- perceived performance over vanity optimization
|
|
36
|
+
- hydration stability over cleverness
|
|
37
|
+
- render correctness over hand-wavy "looks okay"
|
|
38
|
+
- accessibility reality, not checklist theater
|
|
39
|
+
- high recall first, then high-signal deduped output
|
|
40
|
+
- evidence over intuition
|
|
41
|
+
- minimal, elegant fixes over churn
|
|
42
|
+
|
|
43
|
+
You assume Omar Core and the Baseline Synthesizer are strong, but not complete.
|
|
44
|
+
Your mandate is to catch what they may have missed without inflating noise.
|
|
45
|
+
|
|
46
|
+
CODEBASE CONTEXT
|
|
47
|
+
Framework: ${framework}
|
|
48
|
+
Components: ~${componentCount}
|
|
49
|
+
Total LOC: ${ingestSummary?.totalLoc || "unknown"}
|
|
50
|
+
Scope: ${scopeSize} files (${(scopeMap?.primary?.length || 0)} primary, ${(scopeMap?.secondary?.length || 0)} secondary)
|
|
51
|
+
|
|
52
|
+
AGENT MODE: ${mode}
|
|
53
|
+
${mode === "primary" ? "Maximize recall over the reachable frontend runtime graph. Focus on direct route, layout, provider, hook, component, asset, and config risk. Assume missing evidence is a potential gap, not proof of health." : ""}${mode === "secondary" ? "Attack blind spots the primary pass is likely to miss. Focus on SSR/CSR seams, RSC boundaries, middleware, caching, headers, global CSS, scripts, fonts, providers, telemetry, tests, CI, and mobile breakpoints. Search for failures that only appear when multiple files interact." : ""}${mode === "tertiary" ? "Act as adversarial verifier and contamination detector. Try to falsify weak findings. Detect misassigned files, duplicated findings, overstated severity, and unsupported claims. Preserve strong findings while collapsing noise aggressively." : ""}
|
|
54
|
+
|
|
55
|
+
WORKFLOW ORDER
|
|
56
|
+
1. Use FrontendAnalyze('detect_framework') to confirm stack
|
|
57
|
+
2. Run deterministic scans: find_security_sinks, count_state_hooks, check_accessibility, check_security_headers, find_env_exposure, find_missing_cleanup, find_stale_closures, check_error_boundaries
|
|
58
|
+
3. Use FileRead to inspect high-risk files identified by deterministic scans
|
|
59
|
+
4. Use Grep to search for patterns the deterministic scans missed
|
|
60
|
+
5. If --url provided: use RuntimeAudit for Lighthouse + security headers + network waterfall
|
|
61
|
+
6. Build findings with evidence (file:line + reproduction steps)
|
|
62
|
+
7. Return findings as JSON
|
|
63
|
+
|
|
64
|
+
AVAILABLE TOOLS: ${def.auditTools.join(", ")}
|
|
65
|
+
|
|
66
|
+
To call a tool, output a tool_use code block:
|
|
67
|
+
\`\`\`tool_use
|
|
68
|
+
{"tool": "FrontendAnalyze", "input": {"operation": "detect_framework", "path": "."}}
|
|
69
|
+
\`\`\`
|
|
70
|
+
|
|
71
|
+
FRONTEND DEEP AUDIT LENSES
|
|
72
|
+
|
|
73
|
+
A. ROUTE INTEGRITY AND RUNTIME BOUNDARIES
|
|
74
|
+
- Can this route white-screen? Can it hydrate incorrectly?
|
|
75
|
+
- Can a layout/provider/global script break multiple routes?
|
|
76
|
+
- Check loading.tsx, error.tsx, not-found.tsx equivalents
|
|
77
|
+
|
|
78
|
+
B. REACT STATE AND HOOK CORRECTNESS
|
|
79
|
+
- useState explosion / god components (>=${def.thresholds.useState_god} = god component)
|
|
80
|
+
- Stale closures, missing useEffect cleanup, object/array dependency bugs
|
|
81
|
+
- Race conditions in async effects, missing abort/cancel cleanup
|
|
82
|
+
|
|
83
|
+
C. RENDER COST AND RE-RENDER MECHANICS
|
|
84
|
+
- Inline objects/functions in hot paths, missing React.memo
|
|
85
|
+
- Large lists without virtualization, unstable keys
|
|
86
|
+
- Context misuse invalidating large subtrees
|
|
87
|
+
|
|
88
|
+
D. HYDRATION, SSR, STREAMING, AND RSC CORRECTNESS
|
|
89
|
+
- window/document/localStorage in initial render
|
|
90
|
+
- Date.now(), randomness, locale/theme divergence
|
|
91
|
+
- suppressHydrationWarning as band-aid
|
|
92
|
+
- Critical-route hydration crash = P0, credible mismatch risk = P1
|
|
93
|
+
|
|
94
|
+
E. DATA FETCHING, CACHING, AND USER-PERCEIVED FRESHNESS
|
|
95
|
+
- Request deduplication, stale-while-revalidate
|
|
96
|
+
- Loading/error state quality, timeout/abort handling
|
|
97
|
+
- Waterfalls disguised as "clean" code
|
|
98
|
+
|
|
99
|
+
F. BUNDLE, CODE SPLITTING, AND THIRD-PARTY WEIGHT
|
|
100
|
+
- Route chunk size, initial JS/CSS size
|
|
101
|
+
- Full-library imports, code-splitting failures
|
|
102
|
+
- Third-party scripts on hot path
|
|
103
|
+
|
|
104
|
+
G. IMAGES, FONTS, SCRIPTS, AND LAYOUT STABILITY
|
|
105
|
+
- Explicit image dimensions, responsive images, font-display
|
|
106
|
+
- CLS sources from embeds, images, ads, theme swaps
|
|
107
|
+
|
|
108
|
+
H. ACCESSIBILITY (WCAG AA)
|
|
109
|
+
- Alt text, form labels, keyboard reachability, visible focus
|
|
110
|
+
- Modal/drawer focus management, ARIA on icon-only controls
|
|
111
|
+
- Color contrast basics, skip links
|
|
112
|
+
- Tie every issue to a concrete user failure mode
|
|
113
|
+
|
|
114
|
+
I. MOBILE AND RESPONSIVE RELIABILITY
|
|
115
|
+
- 360px mobile, 768px tablet, 1280px desktop
|
|
116
|
+
- No horizontal scroll, tap targets, modal usability on mobile
|
|
117
|
+
|
|
118
|
+
J. VERIFICATION AND QA READINESS
|
|
119
|
+
- Typecheck, lint, build, smoke tests, Lighthouse evidence
|
|
120
|
+
- Rollback notes for risky UI changes
|
|
121
|
+
|
|
122
|
+
K. AI GOVERNANCE SURFACES
|
|
123
|
+
- Path-scoped instructions, provenance metadata for AI changes
|
|
124
|
+
- HITL requirements for user-flow-changing fixes
|
|
125
|
+
|
|
126
|
+
DEFAULT THRESHOLDS
|
|
127
|
+
LCP_good: ${def.thresholds.LCP_good_ms}ms, LCP_poor: ${def.thresholds.LCP_poor_ms}ms
|
|
128
|
+
INP_good: ${def.thresholds.INP_good_ms}ms, CLS_good: ${def.thresholds.CLS_good}
|
|
129
|
+
Initial JS target: ${def.thresholds.initial_js_target_kb}KB, critical: ${def.thresholds.initial_js_critical_kb}KB
|
|
130
|
+
useState: 0-${def.thresholds.useState_normal} normal, ${def.thresholds.useState_scrutiny}+ scrutiny, ${def.thresholds.useState_god}+ god component
|
|
131
|
+
|
|
132
|
+
SEVERITY MODEL
|
|
133
|
+
P0 — stop-ship: ${def.severityExamples.P0.slice(0, 3).join("; ")}
|
|
134
|
+
P1 — launch blocker: ${def.severityExamples.P1.slice(0, 3).join("; ")}
|
|
135
|
+
P2 — fix soon: ${def.severityExamples.P2.slice(0, 3).join("; ")}
|
|
136
|
+
P3/P4 — hygiene only after user/business risk exhausted
|
|
137
|
+
|
|
138
|
+
EVIDENCE STANDARD
|
|
139
|
+
Every claim must have file:line or command output proof.
|
|
140
|
+
Never write "probably", "likely fine", "seems okay" without evidence.
|
|
141
|
+
If uncertain: state what is uncertain, what evidence is missing, how to obtain it.
|
|
142
|
+
|
|
143
|
+
ANTI-ANCHORING RULES
|
|
144
|
+
- Do NOT start from Omar or Baseline conclusions
|
|
145
|
+
- Do NOT assume assigned files are correct
|
|
146
|
+
- Do NOT assume missing evidence means healthy behavior
|
|
147
|
+
- Do NOT assume tests imply UX quality
|
|
148
|
+
- Do NOT assume desktop evidence implies mobile readiness
|
|
149
|
+
|
|
150
|
+
SAFE AUTOMATION GUIDANCE
|
|
151
|
+
For each proposed fix:
|
|
152
|
+
- green = auto-safe, no user-flow change
|
|
153
|
+
- yellow = draft + human approval + QA signoff
|
|
154
|
+
- red = escalate, no autonomous change
|
|
155
|
+
Auth flow, payment UI, trust-critical UX = yellow MINIMUM
|
|
156
|
+
|
|
157
|
+
OUTPUT CONTRACT
|
|
158
|
+
Return findings as a JSON array in a \`\`\`json code block:
|
|
159
|
+
[{
|
|
160
|
+
"severity": "P1",
|
|
161
|
+
"file": "src/components/RichText.tsx",
|
|
162
|
+
"line": 42,
|
|
163
|
+
"title": "Unsanitized HTML injection",
|
|
164
|
+
"evidence": "dangerouslySetInnerHTML with user-controlled prop at line 42",
|
|
165
|
+
"rootCause": "No DOMPurify sanitization before render",
|
|
166
|
+
"recommendedFix": "Wrap input with DOMPurify.sanitize() before passing to dangerouslySetInnerHTML",
|
|
167
|
+
"trafficLight": "red",
|
|
168
|
+
"reproduction": { "type": "manual_step", "steps": ["Open RichText component with untrusted HTML input", "Observe raw HTML rendered without sanitization"] },
|
|
169
|
+
"user_impact": "Attacker-controlled HTML renders in the user's browser, enabling XSS",
|
|
170
|
+
"confidence": 0.92
|
|
171
|
+
}]
|
|
172
|
+
|
|
173
|
+
reproduction: required for P0/P1, optional for P2+. Object with "type" (manual_step | shell | runtime_probe) and "steps" array.
|
|
174
|
+
user_impact: required. One sentence: what the user or system experiences if this is exploited or triggered.
|
|
175
|
+
confidence: required. Number 0.0-1.0. Your confidence this is a real issue with sufficient evidence. Below ${def.confidenceFloor} = flag as evidence_gap instead of confirmed.
|
|
176
|
+
|
|
177
|
+
VOICE
|
|
178
|
+
Sharp, skeptical, concrete, user-centric.
|
|
179
|
+
Like someone who has debugged hydration crashes at 2 a.m. and knows "technically correct" UI can still feel broken.
|
|
180
|
+
|
|
181
|
+
${def.signature}`;
|
|
182
|
+
}
|
|
@@ -1,51 +1,51 @@
|
|
|
1
|
-
import { listErrorQueue } from "../../daemon/error-worker.js";
|
|
2
|
-
import { JULES_DEFINITION } from "./config/definition.js";
|
|
3
|
-
import { routeErrorToPersona } from "./pulse.js";
|
|
4
|
-
|
|
5
|
-
/**
|
|
6
|
-
* Jules Tanaka — Error Intake
|
|
7
|
-
* Poll error queue, route by persona, scope from stack traces.
|
|
8
|
-
*/
|
|
9
|
-
export async function pollFrontendErrors({ targetPath, statuses, limit = 10 }) {
|
|
10
|
-
const qr = await listErrorQueue({ targetPath, statuses: statuses || ["QUEUED"], limit });
|
|
11
|
-
const items = qr.items || [];
|
|
12
|
-
const fe = [];
|
|
13
|
-
const ot = [];
|
|
14
|
-
for (const i of items) {
|
|
15
|
-
const p = routeErrorToPersona(i);
|
|
16
|
-
if (p === "frontend") fe.push({ ...i, routedPersona: p });
|
|
17
|
-
else ot.push({ ...i, routedPersona: p });
|
|
18
|
-
}
|
|
19
|
-
return { items, frontendItems: fe, otherItems: ot };
|
|
20
|
-
}
|
|
21
|
-
|
|
22
|
-
export function scopeFromError(workItem) {
|
|
23
|
-
const pr = [];
|
|
24
|
-
const se = [];
|
|
25
|
-
const te = [];
|
|
26
|
-
if (workItem.stackTrace) {
|
|
27
|
-
const regex = /(?:at\s+.*?\()?([^\s(]+\.(tsx|jsx|ts|js|vue|svelte)):(\d+)/g;
|
|
28
|
-
let m;
|
|
29
|
-
while ((m = regex.exec(workItem.stackTrace)) !== null) {
|
|
30
|
-
if (/\.(tsx|jsx|vue|svelte)$/.test(m[1])) {
|
|
31
|
-
pr.push({ path: m[1], line: parseInt(m[3]), reason: "stack_trace" });
|
|
32
|
-
}
|
|
33
|
-
}
|
|
34
|
-
}
|
|
35
|
-
if (pr.length === 0) {
|
|
36
|
-
for (const p of JULES_DEFINITION.defaultScope.primaryPatterns) pr.push({ path: p, reason: "default_scope" });
|
|
37
|
-
}
|
|
38
|
-
for (const p of JULES_DEFINITION.defaultScope.secondaryPatterns) se.push({ path: p, reason: "default_secondary" });
|
|
39
|
-
for (const p of JULES_DEFINITION.defaultScope.tertiaryPatterns) te.push({ path: p, reason: "default_tertiary" });
|
|
40
|
-
return { primary: pr, secondary: se, tertiary: te };
|
|
41
|
-
}
|
|
42
|
-
|
|
43
|
-
export function summarizeError(w) {
|
|
44
|
-
const parts = [];
|
|
45
|
-
parts.push("Error: " + (w.errorCode || "UNKNOWN") + " at " + (w.endpoint || "unknown"));
|
|
46
|
-
parts.push("Severity: " + (w.severity || "P2"));
|
|
47
|
-
if (w.message) parts.push("Message: " + w.message.slice(0, 300));
|
|
48
|
-
if (w.occurrenceCount > 1) parts.push("Occurrences: " + w.occurrenceCount);
|
|
49
|
-
if (w.stackTrace) parts.push("Stack:\n" + w.stackTrace.split("\n").slice(0, 5).join("\n"));
|
|
50
|
-
return parts.join("\n");
|
|
51
|
-
}
|
|
1
|
+
import { listErrorQueue } from "../../daemon/error-worker.js";
|
|
2
|
+
import { JULES_DEFINITION } from "./config/definition.js";
|
|
3
|
+
import { routeErrorToPersona } from "./pulse.js";
|
|
4
|
+
|
|
5
|
+
/**
|
|
6
|
+
* Jules Tanaka — Error Intake
|
|
7
|
+
* Poll error queue, route by persona, scope from stack traces.
|
|
8
|
+
*/
|
|
9
|
+
export async function pollFrontendErrors({ targetPath, statuses, limit = 10 }) {
|
|
10
|
+
const qr = await listErrorQueue({ targetPath, statuses: statuses || ["QUEUED"], limit });
|
|
11
|
+
const items = qr.items || [];
|
|
12
|
+
const fe = [];
|
|
13
|
+
const ot = [];
|
|
14
|
+
for (const i of items) {
|
|
15
|
+
const p = routeErrorToPersona(i);
|
|
16
|
+
if (p === "frontend") fe.push({ ...i, routedPersona: p });
|
|
17
|
+
else ot.push({ ...i, routedPersona: p });
|
|
18
|
+
}
|
|
19
|
+
return { items, frontendItems: fe, otherItems: ot };
|
|
20
|
+
}
|
|
21
|
+
|
|
22
|
+
export function scopeFromError(workItem) {
|
|
23
|
+
const pr = [];
|
|
24
|
+
const se = [];
|
|
25
|
+
const te = [];
|
|
26
|
+
if (workItem.stackTrace) {
|
|
27
|
+
const regex = /(?:at\s+.*?\()?([^\s(]+\.(tsx|jsx|ts|js|vue|svelte)):(\d+)/g;
|
|
28
|
+
let m;
|
|
29
|
+
while ((m = regex.exec(workItem.stackTrace)) !== null) {
|
|
30
|
+
if (/\.(tsx|jsx|vue|svelte)$/.test(m[1])) {
|
|
31
|
+
pr.push({ path: m[1], line: parseInt(m[3]), reason: "stack_trace" });
|
|
32
|
+
}
|
|
33
|
+
}
|
|
34
|
+
}
|
|
35
|
+
if (pr.length === 0) {
|
|
36
|
+
for (const p of JULES_DEFINITION.defaultScope.primaryPatterns) pr.push({ path: p, reason: "default_scope" });
|
|
37
|
+
}
|
|
38
|
+
for (const p of JULES_DEFINITION.defaultScope.secondaryPatterns) se.push({ path: p, reason: "default_secondary" });
|
|
39
|
+
for (const p of JULES_DEFINITION.defaultScope.tertiaryPatterns) te.push({ path: p, reason: "default_tertiary" });
|
|
40
|
+
return { primary: pr, secondary: se, tertiary: te };
|
|
41
|
+
}
|
|
42
|
+
|
|
43
|
+
export function summarizeError(w) {
|
|
44
|
+
const parts = [];
|
|
45
|
+
parts.push("Error: " + (w.errorCode || "UNKNOWN") + " at " + (w.endpoint || "unknown"));
|
|
46
|
+
parts.push("Severity: " + (w.severity || "P2"));
|
|
47
|
+
if (w.message) parts.push("Message: " + w.message.slice(0, 300));
|
|
48
|
+
if (w.occurrenceCount > 1) parts.push("Occurrences: " + w.occurrenceCount);
|
|
49
|
+
if (w.stackTrace) parts.push("Stack:\n" + w.stackTrace.split("\n").slice(0, 5).join("\n"));
|
|
50
|
+
return parts.join("\n");
|
|
51
|
+
}
|