nubos-pilot 1.2.1 → 1.2.3
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +43 -1
- package/agents/np-architect.md +2 -0
- package/agents/np-executor.md +1 -1
- package/agents/np-learnings-extractor.md +54 -0
- package/agents/np-planner.md +1 -1
- package/agents/np-security-reviewer.md +9 -0
- package/bin/np-tools/_commands.cjs +5 -0
- package/bin/np-tools/derive-tier.cjs +86 -0
- package/bin/np-tools/derive-tier.test.cjs +83 -0
- package/bin/np-tools/doctor.cjs +15 -2
- package/bin/np-tools/graph-impact.cjs +111 -0
- package/bin/np-tools/graph-impact.test.cjs +119 -0
- package/bin/np-tools/learnings.cjs +105 -0
- package/bin/np-tools/learnings.test.cjs +66 -0
- package/bin/np-tools/loop-run-round.cjs +7 -1
- package/bin/np-tools/scan-codebase.cjs +21 -1
- package/bin/np-tools/skill-audit.cjs +79 -0
- package/bin/np-tools/skill-audit.test.cjs +86 -0
- package/bin/np-tools/verify-reliability.cjs +65 -0
- package/bin/np-tools/verify-reliability.test.cjs +69 -0
- package/lib/agents.test.cjs +1 -0
- package/lib/checkpoint.cjs +3 -0
- package/lib/codebase-graph.cjs +0 -0
- package/lib/codebase-graph.test.cjs +174 -0
- package/lib/codebase-manifest.cjs +3 -0
- package/lib/config-defaults.cjs +13 -0
- package/lib/config-schema.cjs +11 -0
- package/lib/eval-reliability.cjs +63 -0
- package/lib/eval-reliability.test.cjs +56 -0
- package/lib/install/claude-hooks-learnings.test.cjs +82 -0
- package/lib/install/claude-hooks.cjs +65 -4
- package/lib/install/claude-hooks.test.cjs +5 -2
- package/lib/learnings/capture-ledger.cjs +80 -0
- package/lib/learnings/capture-ledger.test.cjs +54 -0
- package/lib/learnings/extract.cjs +191 -0
- package/lib/learnings/extract.test.cjs +115 -0
- package/lib/learnings.cjs +19 -95
- package/lib/memory.cjs +38 -33
- package/lib/messaging.cjs +12 -6
- package/lib/metrics-aggregate.cjs +14 -2
- package/lib/migrate.cjs +29 -0
- package/lib/migrate.test.cjs +91 -0
- package/lib/nubosloop-audit.cjs +104 -0
- package/lib/nubosloop-skill-audit.test.cjs +98 -0
- package/lib/nubosloop.cjs +9 -0
- package/lib/schemas/data/checkpoint.v1.json +13 -0
- package/lib/schemas/data/codebase-manifest.v1.json +22 -0
- package/lib/schemas/data/learnings.v1.json +28 -0
- package/lib/schemas/data/memory-manifest.v1.json +14 -0
- package/lib/schemas/data/memory-record.v1.json +16 -0
- package/lib/schemas/data/message.v1.json +19 -0
- package/lib/schemas/data/metrics-record.v1.json +11 -0
- package/lib/tier-classify.cjs +67 -0
- package/lib/tier-classify.test.cjs +67 -0
- package/lib/validate.cjs +301 -0
- package/lib/validate.test.cjs +242 -0
- package/np-tools.cjs +5 -0
- package/package.json +3 -1
- package/skills/np-access-control/SKILL.md +42 -0
- package/skills/np-accessibility-audit/SKILL.md +41 -0
- package/skills/np-adr/SKILL.md +37 -0
- package/skills/np-api-design/SKILL.md +34 -0
- package/skills/np-caching-strategy/SKILL.md +38 -0
- package/skills/np-data-modeling/SKILL.md +37 -0
- package/skills/np-data-privacy/SKILL.md +39 -0
- package/skills/np-dependency-audit/SKILL.md +47 -0
- package/skills/np-encryption/SKILL.md +47 -0
- package/skills/np-error-handling/SKILL.md +37 -0
- package/skills/np-incident-response/SKILL.md +38 -0
- package/skills/np-llm-app-architecture/SKILL.md +50 -0
- package/skills/np-observability/SKILL.md +39 -0
- package/skills/np-performance/SKILL.md +38 -0
- package/skills/np-queue-design/SKILL.md +32 -0
- package/skills/np-rag-design/SKILL.md +43 -0
- package/skills/np-refactoring/SKILL.md +35 -0
- package/skills/np-resilience-patterns/SKILL.md +39 -0
- package/skills/np-secure-code-review/SKILL.md +46 -0
- package/skills/np-secure-design/SKILL.md +44 -0
- package/skills/np-service-boundary/SKILL.md +35 -0
- package/skills/np-system-design/SKILL.md +40 -0
- package/skills/np-test-strategy/SKILL.md +46 -0
- package/skills/np-threat-model/SKILL.md +42 -0
- package/templates/claude/payload/hooks/np-learnings-hook.cjs +55 -0
- package/workflows/architect-phase.md +21 -1
- package/workflows/execute-phase.md +66 -4
- package/workflows/verify-work.md +17 -4
|
@@ -0,0 +1,174 @@
|
|
|
1
|
+
const { test } = require('node:test');
|
|
2
|
+
const assert = require('node:assert/strict');
|
|
3
|
+
|
|
4
|
+
const g = require('./codebase-graph.cjs');
|
|
5
|
+
|
|
6
|
+
function fact(id, directory, files, extra) {
|
|
7
|
+
const source_paths = files.map((f) => f.path);
|
|
8
|
+
return Object.assign({
|
|
9
|
+
id,
|
|
10
|
+
name: directory || 'root',
|
|
11
|
+
directory: directory || '',
|
|
12
|
+
primary_language: 'javascript',
|
|
13
|
+
language_distribution: { javascript: files.length },
|
|
14
|
+
file_count: files.length,
|
|
15
|
+
source_paths,
|
|
16
|
+
symbols: [],
|
|
17
|
+
internal_deps: [],
|
|
18
|
+
external_deps: [],
|
|
19
|
+
files,
|
|
20
|
+
}, extra || {});
|
|
21
|
+
}
|
|
22
|
+
|
|
23
|
+
test('CG-1: buildModuleGraph creates a node per fact', () => {
|
|
24
|
+
const facts = [
|
|
25
|
+
fact('src-auth', 'src/auth', [{ path: 'src/auth/login.js', language: 'javascript', symbols: [], deps: [] }]),
|
|
26
|
+
fact('src-db', 'src/db', [{ path: 'src/db/index.js', language: 'javascript', symbols: [], deps: [] }]),
|
|
27
|
+
];
|
|
28
|
+
const graph = g.buildModuleGraph(facts);
|
|
29
|
+
assert.equal(graph.module_count, 2);
|
|
30
|
+
assert.deepEqual(graph.nodes.map((n) => n.id), ['src-auth', 'src-db']);
|
|
31
|
+
});
|
|
32
|
+
|
|
33
|
+
test('CG-2: relative import resolves to a cross-module edge', () => {
|
|
34
|
+
const facts = [
|
|
35
|
+
fact('src-auth', 'src/auth', [
|
|
36
|
+
{ path: 'src/auth/login.js', language: 'javascript', symbols: [], deps: ['../db', 'bcrypt'] },
|
|
37
|
+
]),
|
|
38
|
+
fact('src-db', 'src/db', [
|
|
39
|
+
{ path: 'src/db/index.js', language: 'javascript', symbols: [], deps: [] },
|
|
40
|
+
]),
|
|
41
|
+
];
|
|
42
|
+
const graph = g.buildModuleGraph(facts);
|
|
43
|
+
assert.equal(graph.edge_count, 1);
|
|
44
|
+
assert.deepEqual(graph.edges[0], { from: 'src-auth', to: 'src-db', weight: 1 });
|
|
45
|
+
});
|
|
46
|
+
|
|
47
|
+
test('CG-3: external (non-relative) deps never become edges', () => {
|
|
48
|
+
const facts = [
|
|
49
|
+
fact('src-auth', 'src/auth', [
|
|
50
|
+
{ path: 'src/auth/login.js', language: 'javascript', symbols: [], deps: ['bcrypt', 'node:fs'] },
|
|
51
|
+
]),
|
|
52
|
+
];
|
|
53
|
+
const graph = g.buildModuleGraph(facts);
|
|
54
|
+
assert.equal(graph.edge_count, 0);
|
|
55
|
+
});
|
|
56
|
+
|
|
57
|
+
test('CG-4: same-module relative import is not a self-edge', () => {
|
|
58
|
+
const facts = [
|
|
59
|
+
fact('src-auth', 'src/auth', [
|
|
60
|
+
{ path: 'src/auth/login.js', language: 'javascript', symbols: [], deps: ['./session'] },
|
|
61
|
+
{ path: 'src/auth/session.js', language: 'javascript', symbols: [], deps: [] },
|
|
62
|
+
]),
|
|
63
|
+
];
|
|
64
|
+
const graph = g.buildModuleGraph(facts);
|
|
65
|
+
assert.equal(graph.edge_count, 0);
|
|
66
|
+
});
|
|
67
|
+
|
|
68
|
+
test('CG-5: repeated imports raise edge weight', () => {
|
|
69
|
+
const facts = [
|
|
70
|
+
fact('a', 'a', [
|
|
71
|
+
{ path: 'a/one.js', language: 'javascript', symbols: [], deps: ['../b'] },
|
|
72
|
+
{ path: 'a/two.js', language: 'javascript', symbols: [], deps: ['../b/helper'] },
|
|
73
|
+
]),
|
|
74
|
+
fact('b', 'b', [
|
|
75
|
+
{ path: 'b/index.js', language: 'javascript', symbols: [], deps: [] },
|
|
76
|
+
{ path: 'b/helper.js', language: 'javascript', symbols: [], deps: [] },
|
|
77
|
+
]),
|
|
78
|
+
];
|
|
79
|
+
const graph = g.buildModuleGraph(facts);
|
|
80
|
+
assert.equal(graph.edges.length, 1);
|
|
81
|
+
assert.equal(graph.edges[0].weight, 2);
|
|
82
|
+
});
|
|
83
|
+
|
|
84
|
+
test('CG-6: unresolved internal-looking deps are counted, not edged', () => {
|
|
85
|
+
const facts = [
|
|
86
|
+
fact('a', 'a', [
|
|
87
|
+
{ path: 'a/one.js', language: 'javascript', symbols: [], deps: ['../nonexistent'] },
|
|
88
|
+
]),
|
|
89
|
+
];
|
|
90
|
+
const graph = g.buildModuleGraph(facts);
|
|
91
|
+
assert.equal(graph.edge_count, 0);
|
|
92
|
+
assert.equal(graph.metrics.unresolved_internal_deps, 1);
|
|
93
|
+
});
|
|
94
|
+
|
|
95
|
+
test('CG-7: Tarjan detects a 2-module cycle', () => {
|
|
96
|
+
const facts = [
|
|
97
|
+
fact('a', 'a', [{ path: 'a/x.js', language: 'javascript', symbols: [], deps: ['../b'] }]),
|
|
98
|
+
fact('b', 'b', [{ path: 'b/index.js', language: 'javascript', symbols: [], deps: ['../a'] }]),
|
|
99
|
+
];
|
|
100
|
+
const graph = g.buildModuleGraph(facts);
|
|
101
|
+
assert.equal(graph.cycles.length, 1);
|
|
102
|
+
assert.deepEqual(graph.cycles[0], ['a', 'b']);
|
|
103
|
+
});
|
|
104
|
+
|
|
105
|
+
test('CG-8: acyclic graph reports no cycles', () => {
|
|
106
|
+
const facts = [
|
|
107
|
+
fact('a', 'a', [{ path: 'a/x.js', language: 'javascript', symbols: [], deps: ['../b'] }]),
|
|
108
|
+
fact('b', 'b', [{ path: 'b/index.js', language: 'javascript', symbols: [], deps: ['../c'] }]),
|
|
109
|
+
fact('c', 'c', [{ path: 'c/index.js', language: 'javascript', symbols: [], deps: [] }]),
|
|
110
|
+
];
|
|
111
|
+
const graph = g.buildModuleGraph(facts);
|
|
112
|
+
assert.equal(graph.cycles.length, 0);
|
|
113
|
+
});
|
|
114
|
+
|
|
115
|
+
test('CG-9: transitive dependents (impact) walk the reverse graph', () => {
|
|
116
|
+
const facts = [
|
|
117
|
+
fact('a', 'a', [{ path: 'a/x.js', language: 'javascript', symbols: [], deps: ['../b'] }]),
|
|
118
|
+
fact('b', 'b', [{ path: 'b/index.js', language: 'javascript', symbols: [], deps: ['../c'] }]),
|
|
119
|
+
fact('c', 'c', [{ path: 'c/index.js', language: 'javascript', symbols: [], deps: [] }]),
|
|
120
|
+
];
|
|
121
|
+
const graph = g.buildModuleGraph(facts);
|
|
122
|
+
assert.deepEqual(g.transitiveDependents(graph, 'c'), ['a', 'b']);
|
|
123
|
+
assert.deepEqual(g.directDependents(graph, 'c'), ['b']);
|
|
124
|
+
assert.deepEqual(g.transitiveDependencies(graph, 'a'), ['b', 'c']);
|
|
125
|
+
assert.deepEqual(g.directDependencies(graph, 'a'), ['b']);
|
|
126
|
+
});
|
|
127
|
+
|
|
128
|
+
test('CG-10: deterministic clustering groups a connected component together', () => {
|
|
129
|
+
const facts = [
|
|
130
|
+
fact('a', 'a', [{ path: 'a/x.js', language: 'javascript', symbols: [], deps: ['../b'] }]),
|
|
131
|
+
fact('b', 'b', [{ path: 'b/index.js', language: 'javascript', symbols: [], deps: ['../a'] }]),
|
|
132
|
+
fact('lonely', 'lonely', [{ path: 'lonely/z.js', language: 'javascript', symbols: [], deps: [] }]),
|
|
133
|
+
];
|
|
134
|
+
const graph = g.buildModuleGraph(facts);
|
|
135
|
+
const first = g.buildModuleGraph(facts);
|
|
136
|
+
assert.deepEqual(graph.clusters, first.clusters);
|
|
137
|
+
const clusterAB = graph.clusters.find((c) => c.members.includes('a'));
|
|
138
|
+
assert.ok(clusterAB.members.includes('b'));
|
|
139
|
+
assert.ok(!clusterAB.members.includes('lonely'));
|
|
140
|
+
});
|
|
141
|
+
|
|
142
|
+
test('CG-11: cycleFor and clusterOf locate a module', () => {
|
|
143
|
+
const facts = [
|
|
144
|
+
fact('a', 'a', [{ path: 'a/x.js', language: 'javascript', symbols: [], deps: ['../b'] }]),
|
|
145
|
+
fact('b', 'b', [{ path: 'b/index.js', language: 'javascript', symbols: [], deps: ['../a'] }]),
|
|
146
|
+
];
|
|
147
|
+
const graph = g.buildModuleGraph(facts);
|
|
148
|
+
assert.deepEqual(g.cycleFor(graph, 'a'), ['a', 'b']);
|
|
149
|
+
assert.equal(typeof g.clusterOf(graph, 'a'), 'number');
|
|
150
|
+
assert.equal(g.cycleFor(graph, 'missing'), null);
|
|
151
|
+
assert.equal(g.clusterOf(graph, 'missing'), null);
|
|
152
|
+
});
|
|
153
|
+
|
|
154
|
+
test('CG-12: root-relative (/-prefixed) deps resolve from project root', () => {
|
|
155
|
+
const facts = [
|
|
156
|
+
fact('src-auth', 'src/auth', [
|
|
157
|
+
{ path: 'src/auth/login.js', language: 'javascript', symbols: [], deps: ['/src/db'] },
|
|
158
|
+
]),
|
|
159
|
+
fact('src-db', 'src/db', [
|
|
160
|
+
{ path: 'src/db/index.js', language: 'javascript', symbols: [], deps: [] },
|
|
161
|
+
]),
|
|
162
|
+
];
|
|
163
|
+
const graph = g.buildModuleGraph(facts);
|
|
164
|
+
assert.equal(graph.edge_count, 1);
|
|
165
|
+
assert.deepEqual(graph.edges[0], { from: 'src-auth', to: 'src-db', weight: 1 });
|
|
166
|
+
});
|
|
167
|
+
|
|
168
|
+
test('CG-13: empty facts yield an empty graph', () => {
|
|
169
|
+
const graph = g.buildModuleGraph([]);
|
|
170
|
+
assert.equal(graph.module_count, 0);
|
|
171
|
+
assert.equal(graph.edge_count, 0);
|
|
172
|
+
assert.deepEqual(graph.cycles, []);
|
|
173
|
+
assert.deepEqual(graph.clusters, []);
|
|
174
|
+
});
|
|
@@ -3,8 +3,10 @@
|
|
|
3
3
|
const fs = require('node:fs');
|
|
4
4
|
const path = require('node:path');
|
|
5
5
|
const { atomicWriteFileSync, NubosPilotError } = require('./core.cjs');
|
|
6
|
+
const { assertValid } = require('./validate.cjs');
|
|
6
7
|
|
|
7
8
|
const SCHEMA_VERSION = 1;
|
|
9
|
+
const STORE_SCHEMA = 'codebase-manifest.v1';
|
|
8
10
|
const CODEBASE_DIR_NAME = 'codebase';
|
|
9
11
|
const MANIFEST_FILENAME = '.hashes.json';
|
|
10
12
|
|
|
@@ -63,6 +65,7 @@ function readManifest(projectRoot) {
|
|
|
63
65
|
);
|
|
64
66
|
}
|
|
65
67
|
if (!parsed.files || typeof parsed.files !== 'object') parsed.files = {};
|
|
68
|
+
assertValid(parsed, STORE_SCHEMA, 'manifest-invalid-shape', { path: p });
|
|
66
69
|
return parsed;
|
|
67
70
|
}
|
|
68
71
|
|
package/lib/config-defaults.cjs
CHANGED
|
@@ -9,6 +9,7 @@ const DEFAULT_WORKFLOW = Object.freeze({
|
|
|
9
9
|
commit_docs: true,
|
|
10
10
|
commit_artifacts: true,
|
|
11
11
|
worktree_isolation: false,
|
|
12
|
+
tier_routing: false,
|
|
12
13
|
research_tools: DEFAULT_RESEARCH_TOOLS,
|
|
13
14
|
});
|
|
14
15
|
|
|
@@ -21,6 +22,7 @@ const DEFAULT_AGENTS = Object.freeze({
|
|
|
21
22
|
|
|
22
23
|
const DEFAULT_LOOP = Object.freeze({
|
|
23
24
|
maxRounds: 3,
|
|
25
|
+
verify_runs: 1,
|
|
24
26
|
});
|
|
25
27
|
|
|
26
28
|
const DEFAULT_SWARM_RESEARCH = Object.freeze({
|
|
@@ -58,6 +60,14 @@ const DEFAULT_CONFORMANCE = Object.freeze({
|
|
|
58
60
|
inject_criteria: true,
|
|
59
61
|
});
|
|
60
62
|
|
|
63
|
+
const DEFAULT_LEARNINGS = Object.freeze({
|
|
64
|
+
auto_capture: true,
|
|
65
|
+
max_captures_per_hour: 10,
|
|
66
|
+
max_in_a_row: 3,
|
|
67
|
+
timeout_ms: 120000,
|
|
68
|
+
max_files: 30,
|
|
69
|
+
});
|
|
70
|
+
|
|
61
71
|
const DEFAULT_AUTO_LOG_LEARNING = true;
|
|
62
72
|
|
|
63
73
|
const DEFAULT_SPAWN_HEADLESS = Object.freeze({
|
|
@@ -86,6 +96,7 @@ const DEFAULT_CONFIG_TREE = Object.freeze({
|
|
|
86
96
|
spawn: DEFAULT_SPAWN,
|
|
87
97
|
security: DEFAULT_SECURITY,
|
|
88
98
|
conformance: DEFAULT_CONFORMANCE,
|
|
99
|
+
learnings: DEFAULT_LEARNINGS,
|
|
89
100
|
auto_log_learning: DEFAULT_AUTO_LOG_LEARNING,
|
|
90
101
|
});
|
|
91
102
|
|
|
@@ -119,6 +130,7 @@ function buildInstallConfig(answers) {
|
|
|
119
130
|
},
|
|
120
131
|
security: { ...DEFAULT_SECURITY },
|
|
121
132
|
conformance: { ...DEFAULT_CONFORMANCE },
|
|
133
|
+
learnings: { ...DEFAULT_LEARNINGS },
|
|
122
134
|
auto_log_learning: DEFAULT_AUTO_LOG_LEARNING,
|
|
123
135
|
};
|
|
124
136
|
}
|
|
@@ -135,6 +147,7 @@ module.exports = {
|
|
|
135
147
|
DEFAULT_SPAWN_HEADLESS,
|
|
136
148
|
DEFAULT_SECURITY,
|
|
137
149
|
DEFAULT_CONFORMANCE,
|
|
150
|
+
DEFAULT_LEARNINGS,
|
|
138
151
|
DEFAULT_AUTO_LOG_LEARNING,
|
|
139
152
|
DEFAULT_MODEL_PROFILE,
|
|
140
153
|
DEFAULT_SCOPE,
|
package/lib/config-schema.cjs
CHANGED
|
@@ -21,6 +21,7 @@ const SCHEMA = Object.freeze({
|
|
|
21
21
|
worktree_isolation: { type: 'boolean', optional: true },
|
|
22
22
|
research_tools: { type: 'object', shape: 'any', optional: true },
|
|
23
23
|
text_mode: { type: 'boolean', optional: true },
|
|
24
|
+
tier_routing: { type: 'boolean', optional: true },
|
|
24
25
|
},
|
|
25
26
|
},
|
|
26
27
|
agents: {
|
|
@@ -34,6 +35,7 @@ const SCHEMA = Object.freeze({
|
|
|
34
35
|
loop: {
|
|
35
36
|
type: 'object', optional: true, shape: {
|
|
36
37
|
maxRounds: { type: 'number', optional: true },
|
|
38
|
+
verify_runs: { type: 'number', optional: true },
|
|
37
39
|
},
|
|
38
40
|
},
|
|
39
41
|
swarm: {
|
|
@@ -86,6 +88,15 @@ const SCHEMA = Object.freeze({
|
|
|
86
88
|
inject_criteria: { type: 'boolean', optional: true },
|
|
87
89
|
},
|
|
88
90
|
},
|
|
91
|
+
learnings: {
|
|
92
|
+
type: 'object', optional: true, shape: {
|
|
93
|
+
auto_capture: { type: 'boolean', optional: true },
|
|
94
|
+
max_captures_per_hour: { type: 'number', optional: true },
|
|
95
|
+
max_in_a_row: { type: 'number', optional: true },
|
|
96
|
+
timeout_ms: { type: 'number', optional: true },
|
|
97
|
+
max_files: { type: 'number', optional: true },
|
|
98
|
+
},
|
|
99
|
+
},
|
|
89
100
|
});
|
|
90
101
|
|
|
91
102
|
function _typeOf(v) {
|
|
@@ -0,0 +1,63 @@
|
|
|
1
|
+
'use strict';
|
|
2
|
+
|
|
3
|
+
// pass@k reliability: the orchestrator runs a task's <verify> command k times
|
|
4
|
+
// and feeds the collected exit codes here. A task that passes only sometimes is
|
|
5
|
+
// FLAKY — not green. summarize() folds k runs into a single aggregate exit code
|
|
6
|
+
// (0 only when every run passed — pass^k semantics) so flakiness flows through
|
|
7
|
+
// the EXISTING verify-red → build-fixer path. No new critic category is
|
|
8
|
+
// introduced (that would risk the unknown-category spurious-stuck trap).
|
|
9
|
+
|
|
10
|
+
const { NubosPilotError } = require('./core.cjs');
|
|
11
|
+
|
|
12
|
+
/**
|
|
13
|
+
* @param {number[]} exitCodes one exit code per verify run (0 = pass)
|
|
14
|
+
* @returns {{runs:number, passes:number, fails:number, pass_at_1:boolean, pass_at_k:boolean, flaky:boolean, verdict:string, aggregate_exit_code:number}}
|
|
15
|
+
*/
|
|
16
|
+
function summarize(exitCodes) {
|
|
17
|
+
if (!Array.isArray(exitCodes) || exitCodes.length === 0) {
|
|
18
|
+
throw new NubosPilotError(
|
|
19
|
+
'eval-reliability-no-runs',
|
|
20
|
+
'summarize requires a non-empty array of exit codes',
|
|
21
|
+
{ got: exitCodes },
|
|
22
|
+
);
|
|
23
|
+
}
|
|
24
|
+
const codes = exitCodes.map((c) => Number(c));
|
|
25
|
+
if (codes.some((c) => !Number.isInteger(c))) {
|
|
26
|
+
throw new NubosPilotError(
|
|
27
|
+
'eval-reliability-bad-code',
|
|
28
|
+
'every exit code must be an integer',
|
|
29
|
+
{ codes: exitCodes },
|
|
30
|
+
);
|
|
31
|
+
}
|
|
32
|
+
|
|
33
|
+
const runs = codes.length;
|
|
34
|
+
const passes = codes.filter((c) => c === 0).length;
|
|
35
|
+
const fails = runs - passes;
|
|
36
|
+
const passAt1 = codes[0] === 0;
|
|
37
|
+
const passAtK = passes === runs;
|
|
38
|
+
const flaky = passes > 0 && fails > 0;
|
|
39
|
+
|
|
40
|
+
let verdict;
|
|
41
|
+
if (passAtK) verdict = 'reliable-pass';
|
|
42
|
+
else if (passes === 0) verdict = 'reliable-fail';
|
|
43
|
+
else verdict = 'flaky';
|
|
44
|
+
|
|
45
|
+
// pass^k: green only if every run passed. Flaky and all-fail both aggregate
|
|
46
|
+
// to non-zero so the loop treats them as verify-red.
|
|
47
|
+
const aggregate_exit_code = passAtK ? 0 : 1;
|
|
48
|
+
|
|
49
|
+
return { runs, passes, fails, pass_at_1: passAt1, pass_at_k: passAtK, flaky, verdict, aggregate_exit_code };
|
|
50
|
+
}
|
|
51
|
+
|
|
52
|
+
/** One-line human summary for the verify log the build-fixer reads. */
|
|
53
|
+
function describe(s) {
|
|
54
|
+
if (s.runs === 1) {
|
|
55
|
+
return s.pass_at_k ? 'verify passed (1 run)' : 'verify failed (1 run)';
|
|
56
|
+
}
|
|
57
|
+
if (s.verdict === 'reliable-pass') return 'verify reliably passed (' + s.passes + '/' + s.runs + ' runs)';
|
|
58
|
+
if (s.verdict === 'reliable-fail') return 'verify reliably failed (0/' + s.runs + ' runs passed)';
|
|
59
|
+
return 'FLAKY: verify passed only ' + s.passes + '/' + s.runs + ' runs — non-deterministic, treated as red. '
|
|
60
|
+
+ 'Make the verified behaviour deterministic (no sleeps/real clock/network/ordering) before this task can go green.';
|
|
61
|
+
}
|
|
62
|
+
|
|
63
|
+
module.exports = { summarize, describe };
|
|
@@ -0,0 +1,56 @@
|
|
|
1
|
+
'use strict';
|
|
2
|
+
|
|
3
|
+
const { test } = require('node:test');
|
|
4
|
+
const assert = require('node:assert');
|
|
5
|
+
const { summarize, describe } = require('./eval-reliability.cjs');
|
|
6
|
+
|
|
7
|
+
test('ER-1: all pass → reliable-pass, aggregate 0', () => {
|
|
8
|
+
const s = summarize([0, 0, 0]);
|
|
9
|
+
assert.strictEqual(s.verdict, 'reliable-pass');
|
|
10
|
+
assert.strictEqual(s.pass_at_k, true);
|
|
11
|
+
assert.strictEqual(s.pass_at_1, true);
|
|
12
|
+
assert.strictEqual(s.flaky, false);
|
|
13
|
+
assert.strictEqual(s.aggregate_exit_code, 0);
|
|
14
|
+
});
|
|
15
|
+
|
|
16
|
+
test('ER-2: all fail → reliable-fail, aggregate non-zero', () => {
|
|
17
|
+
const s = summarize([1, 1, 1]);
|
|
18
|
+
assert.strictEqual(s.verdict, 'reliable-fail');
|
|
19
|
+
assert.strictEqual(s.pass_at_k, false);
|
|
20
|
+
assert.strictEqual(s.flaky, false);
|
|
21
|
+
assert.strictEqual(s.aggregate_exit_code, 1);
|
|
22
|
+
});
|
|
23
|
+
|
|
24
|
+
test('ER-3: mixed → flaky, aggregate non-zero (pass^k)', () => {
|
|
25
|
+
const s = summarize([0, 1, 0]);
|
|
26
|
+
assert.strictEqual(s.verdict, 'flaky');
|
|
27
|
+
assert.strictEqual(s.flaky, true);
|
|
28
|
+
assert.strictEqual(s.pass_at_1, true);
|
|
29
|
+
assert.strictEqual(s.pass_at_k, false);
|
|
30
|
+
assert.strictEqual(s.aggregate_exit_code, 1);
|
|
31
|
+
});
|
|
32
|
+
|
|
33
|
+
test('ER-4: first-run-fail-then-pass is still flaky and red', () => {
|
|
34
|
+
const s = summarize([1, 0, 0]);
|
|
35
|
+
assert.strictEqual(s.flaky, true);
|
|
36
|
+
assert.strictEqual(s.pass_at_1, false);
|
|
37
|
+
assert.strictEqual(s.aggregate_exit_code, 1);
|
|
38
|
+
});
|
|
39
|
+
|
|
40
|
+
test('ER-5: single run preserves classic behaviour', () => {
|
|
41
|
+
assert.strictEqual(summarize([0]).aggregate_exit_code, 0);
|
|
42
|
+
assert.strictEqual(summarize([2]).aggregate_exit_code, 1);
|
|
43
|
+
assert.strictEqual(summarize([0]).verdict, 'reliable-pass');
|
|
44
|
+
});
|
|
45
|
+
|
|
46
|
+
test('ER-6: empty/invalid input throws', () => {
|
|
47
|
+
assert.throws(() => summarize([]), (e) => e.code === 'eval-reliability-no-runs');
|
|
48
|
+
assert.throws(() => summarize('nope'), (e) => e.code === 'eval-reliability-no-runs');
|
|
49
|
+
assert.throws(() => summarize([0, 1.5]), (e) => e.code === 'eval-reliability-bad-code');
|
|
50
|
+
});
|
|
51
|
+
|
|
52
|
+
test('ER-7: describe is human-readable and flags flaky loudly', () => {
|
|
53
|
+
assert.match(describe(summarize([0])), /passed \(1 run\)/);
|
|
54
|
+
assert.match(describe(summarize([0, 0, 0])), /reliably passed/);
|
|
55
|
+
assert.match(describe(summarize([0, 1, 0])), /FLAKY/);
|
|
56
|
+
});
|
|
@@ -0,0 +1,82 @@
|
|
|
1
|
+
'use strict';
|
|
2
|
+
|
|
3
|
+
const { test } = require('node:test');
|
|
4
|
+
const assert = require('node:assert/strict');
|
|
5
|
+
const fs = require('node:fs');
|
|
6
|
+
const path = require('node:path');
|
|
7
|
+
const os = require('node:os');
|
|
8
|
+
|
|
9
|
+
const mod = require('./claude-hooks.cjs');
|
|
10
|
+
|
|
11
|
+
function _mkSandbox() {
|
|
12
|
+
const dir = fs.mkdtempSync(path.join(os.tmpdir(), 'np-learn-hooks-'));
|
|
13
|
+
const hooksDir = path.join(dir, '.claude', 'nubos-pilot', 'hooks');
|
|
14
|
+
fs.mkdirSync(hooksDir, { recursive: true });
|
|
15
|
+
fs.writeFileSync(path.join(hooksDir, 'np-statusline.cjs'), '// stub\n');
|
|
16
|
+
fs.writeFileSync(path.join(hooksDir, 'np-ctx-monitor.cjs'), '// stub\n');
|
|
17
|
+
fs.writeFileSync(path.join(hooksDir, 'np-security-hook.cjs'), '// stub\n');
|
|
18
|
+
fs.writeFileSync(path.join(hooksDir, 'np-learnings-hook.cjs'), '// stub\n');
|
|
19
|
+
return dir;
|
|
20
|
+
}
|
|
21
|
+
|
|
22
|
+
test('LH-1: which=learnings registers capture on Stop + reset on UserPromptSubmit', () => {
|
|
23
|
+
const dir = _mkSandbox();
|
|
24
|
+
try {
|
|
25
|
+
const res = mod.installClaudeHooks({ projectRoot: dir, scope: 'local', which: 'learnings' });
|
|
26
|
+
assert.equal(res.results.learnings.capture.action, 'installed');
|
|
27
|
+
assert.equal(res.results.learnings.reset.action, 'installed');
|
|
28
|
+
const settings = JSON.parse(fs.readFileSync(res.path, 'utf-8'));
|
|
29
|
+
const stop = JSON.stringify(settings.hooks.Stop);
|
|
30
|
+
const ups = JSON.stringify(settings.hooks.UserPromptSubmit);
|
|
31
|
+
assert.ok(stop.includes('np-learnings-hook.cjs'));
|
|
32
|
+
assert.ok(stop.includes(' capture'));
|
|
33
|
+
assert.ok(ups.includes('np-learnings-hook.cjs'));
|
|
34
|
+
assert.ok(ups.includes(' reset'));
|
|
35
|
+
} finally { fs.rmSync(dir, { recursive: true, force: true }); }
|
|
36
|
+
});
|
|
37
|
+
|
|
38
|
+
test('LH-2: which=all installs learnings alongside security', () => {
|
|
39
|
+
const dir = _mkSandbox();
|
|
40
|
+
try {
|
|
41
|
+
const res = mod.installClaudeHooks({ projectRoot: dir, scope: 'local', which: 'all' });
|
|
42
|
+
assert.ok(res.results.learnings);
|
|
43
|
+
assert.ok(res.results.security);
|
|
44
|
+
assert.equal(res.results.learnings.capture.action, 'installed');
|
|
45
|
+
} finally { fs.rmSync(dir, { recursive: true, force: true }); }
|
|
46
|
+
});
|
|
47
|
+
|
|
48
|
+
test('LH-3: install is idempotent — second run updates, not duplicates', () => {
|
|
49
|
+
const dir = _mkSandbox();
|
|
50
|
+
try {
|
|
51
|
+
mod.installClaudeHooks({ projectRoot: dir, scope: 'local', which: 'learnings' });
|
|
52
|
+
const res2 = mod.installClaudeHooks({ projectRoot: dir, scope: 'local', which: 'learnings' });
|
|
53
|
+
assert.equal(res2.results.learnings.capture.action, 'updated');
|
|
54
|
+
const settings = JSON.parse(fs.readFileSync(res2.path, 'utf-8'));
|
|
55
|
+
const stopLearnings = settings.hooks.Stop.filter((e) =>
|
|
56
|
+
JSON.stringify(e).includes('np-learnings-hook.cjs'));
|
|
57
|
+
assert.equal(stopLearnings.length, 1);
|
|
58
|
+
} finally { fs.rmSync(dir, { recursive: true, force: true }); }
|
|
59
|
+
});
|
|
60
|
+
|
|
61
|
+
test('LH-4: uninstall removes learnings hooks', () => {
|
|
62
|
+
const dir = _mkSandbox();
|
|
63
|
+
try {
|
|
64
|
+
mod.installClaudeHooks({ projectRoot: dir, scope: 'local', which: 'all' });
|
|
65
|
+
const res = mod.uninstallClaudeHooks({ projectRoot: dir, scope: 'local' });
|
|
66
|
+
assert.equal(res.results.learnings.action, 'removed');
|
|
67
|
+
const settings = JSON.parse(fs.readFileSync(res.path, 'utf-8'));
|
|
68
|
+
const dump = JSON.stringify(settings.hooks || {});
|
|
69
|
+
assert.ok(!dump.includes('np-learnings-hook.cjs'));
|
|
70
|
+
} finally { fs.rmSync(dir, { recursive: true, force: true }); }
|
|
71
|
+
});
|
|
72
|
+
|
|
73
|
+
test('LH-5: missing learnings hook script throws claude-hooks-script-missing', () => {
|
|
74
|
+
const dir = _mkSandbox();
|
|
75
|
+
try {
|
|
76
|
+
fs.rmSync(path.join(dir, '.claude', 'nubos-pilot', 'hooks', 'np-learnings-hook.cjs'));
|
|
77
|
+
assert.throws(
|
|
78
|
+
() => mod.installClaudeHooks({ projectRoot: dir, scope: 'local', which: 'learnings' }),
|
|
79
|
+
(e) => e.code === 'claude-hooks-script-missing',
|
|
80
|
+
);
|
|
81
|
+
} finally { fs.rmSync(dir, { recursive: true, force: true }); }
|
|
82
|
+
});
|
|
@@ -17,9 +17,11 @@ const { atomicWriteFileSync, NubosPilotError, withFileLock } = require('../core.
|
|
|
17
17
|
const STATUSLINE_REL = '.claude/nubos-pilot/hooks/np-statusline.cjs';
|
|
18
18
|
const CTX_MONITOR_REL = '.claude/nubos-pilot/hooks/np-ctx-monitor.cjs';
|
|
19
19
|
const SECURITY_HOOK_REL = '.claude/nubos-pilot/hooks/np-security-hook.cjs';
|
|
20
|
+
const LEARNINGS_HOOK_REL = '.claude/nubos-pilot/hooks/np-learnings-hook.cjs';
|
|
20
21
|
const NP_STATUSLINE_MARKER = 'np-statusline.';
|
|
21
22
|
const NP_CTX_MONITOR_MARKER = 'np-ctx-monitor.';
|
|
22
23
|
const NP_SECURITY_MARKER = 'np-security-hook.';
|
|
24
|
+
const NP_LEARNINGS_MARKER = 'np-learnings-hook.';
|
|
23
25
|
|
|
24
26
|
// ADR-0020: in-session security review layer. One DRY hook script, registered
|
|
25
27
|
// against five Claude Code lifecycle events, differentiated by a trailing verb.
|
|
@@ -32,6 +34,15 @@ const SECURITY_HOOKS = Object.freeze([
|
|
|
32
34
|
]);
|
|
33
35
|
const SECURITY_EVENTS = Object.freeze(['SessionStart', 'UserPromptSubmit', 'Stop', 'PostToolUse']);
|
|
34
36
|
|
|
37
|
+
// ADR-0010 / ECC continuous-learning: one DRY hook script. `capture` on Stop
|
|
38
|
+
// (rate-limited auto-extraction of the turn's learnings); `reset` on
|
|
39
|
+
// UserPromptSubmit (clears the consecutive-stop streak).
|
|
40
|
+
const LEARNINGS_HOOKS = Object.freeze([
|
|
41
|
+
{ verb: 'reset', event: 'UserPromptSubmit', matcher: undefined },
|
|
42
|
+
{ verb: 'capture', event: 'Stop', matcher: undefined },
|
|
43
|
+
]);
|
|
44
|
+
const LEARNINGS_EVENTS = Object.freeze(['UserPromptSubmit', 'Stop']);
|
|
45
|
+
|
|
35
46
|
function _settingsPath(scope, projectRoot) {
|
|
36
47
|
if (scope === 'global') return path.join(os.homedir(), '.claude', 'settings.json');
|
|
37
48
|
return path.join(projectRoot, '.claude', 'settings.local.json');
|
|
@@ -119,14 +130,15 @@ function _verbOf(command) {
|
|
|
119
130
|
return m ? m[1] : null;
|
|
120
131
|
}
|
|
121
132
|
|
|
122
|
-
function _installVerbHook(settings, eventName, matcher, cmd, verb) {
|
|
133
|
+
function _installVerbHook(settings, eventName, matcher, cmd, verb, marker) {
|
|
134
|
+
const mark = marker || NP_SECURITY_MARKER;
|
|
123
135
|
if (!settings.hooks || typeof settings.hooks !== 'object') settings.hooks = {};
|
|
124
136
|
if (!Array.isArray(settings.hooks[eventName])) settings.hooks[eventName] = [];
|
|
125
137
|
const list = settings.hooks[eventName];
|
|
126
138
|
for (const entry of list) {
|
|
127
139
|
const hooks = Array.isArray(entry.hooks) ? entry.hooks : [];
|
|
128
140
|
for (const h of hooks) {
|
|
129
|
-
if (h && typeof h.command === 'string' && h.command.includes(
|
|
141
|
+
if (h && typeof h.command === 'string' && h.command.includes(mark) && _verbOf(h.command) === verb) {
|
|
130
142
|
h.command = cmd;
|
|
131
143
|
h.type = 'command';
|
|
132
144
|
if (matcher !== undefined) entry.matcher = matcher;
|
|
@@ -145,11 +157,42 @@ function _installSecurity(settings, scope, projectRoot) {
|
|
|
145
157
|
const base = _hookCommand(SECURITY_HOOK_REL, scope, projectRoot);
|
|
146
158
|
const results = {};
|
|
147
159
|
for (const h of SECURITY_HOOKS) {
|
|
148
|
-
results[h.verb] = _installVerbHook(settings, h.event, h.matcher, base + ' ' + h.verb, h.verb);
|
|
160
|
+
results[h.verb] = _installVerbHook(settings, h.event, h.matcher, base + ' ' + h.verb, h.verb, NP_SECURITY_MARKER);
|
|
161
|
+
}
|
|
162
|
+
return results;
|
|
163
|
+
}
|
|
164
|
+
|
|
165
|
+
function _installLearnings(settings, scope, projectRoot) {
|
|
166
|
+
const base = _hookCommand(LEARNINGS_HOOK_REL, scope, projectRoot);
|
|
167
|
+
const results = {};
|
|
168
|
+
for (const h of LEARNINGS_HOOKS) {
|
|
169
|
+
results[h.verb] = _installVerbHook(settings, h.event, h.matcher, base + ' ' + h.verb, h.verb, NP_LEARNINGS_MARKER);
|
|
149
170
|
}
|
|
150
171
|
return results;
|
|
151
172
|
}
|
|
152
173
|
|
|
174
|
+
function _removeLearnings(settings) {
|
|
175
|
+
if (!settings.hooks || typeof settings.hooks !== 'object') return { action: 'absent' };
|
|
176
|
+
let removed = 0;
|
|
177
|
+
for (const eventName of LEARNINGS_EVENTS) {
|
|
178
|
+
if (!Array.isArray(settings.hooks[eventName])) continue;
|
|
179
|
+
const filtered = [];
|
|
180
|
+
for (const entry of settings.hooks[eventName]) {
|
|
181
|
+
const hooks = Array.isArray(entry.hooks) ? entry.hooks : [];
|
|
182
|
+
const kept = hooks.filter((h) => !(h && typeof h.command === 'string' && h.command.includes(NP_LEARNINGS_MARKER)));
|
|
183
|
+
if (kept.length > 0) {
|
|
184
|
+
filtered.push(kept.length === hooks.length ? entry : Object.assign({}, entry, { hooks: kept }));
|
|
185
|
+
} else {
|
|
186
|
+
removed++;
|
|
187
|
+
}
|
|
188
|
+
}
|
|
189
|
+
settings.hooks[eventName] = filtered;
|
|
190
|
+
if (filtered.length === 0) delete settings.hooks[eventName];
|
|
191
|
+
}
|
|
192
|
+
if (settings.hooks && Object.keys(settings.hooks).length === 0) delete settings.hooks;
|
|
193
|
+
return { action: removed > 0 ? 'removed' : 'absent' };
|
|
194
|
+
}
|
|
195
|
+
|
|
153
196
|
function _removeSecurity(settings) {
|
|
154
197
|
if (!settings.hooks || typeof settings.hooks !== 'object') return { action: 'absent' };
|
|
155
198
|
let removed = 0;
|
|
@@ -214,6 +257,7 @@ function installClaudeHooks(opts) {
|
|
|
214
257
|
const wantStatusline = which === 'statusline' || which === 'both' || which === 'all';
|
|
215
258
|
const wantCtxMonitor = which === 'ctx-monitor' || which === 'both' || which === 'all';
|
|
216
259
|
const wantSecurity = which === 'security' || which === 'all';
|
|
260
|
+
const wantLearnings = which === 'learnings' || which === 'all';
|
|
217
261
|
|
|
218
262
|
const statuslineCmd = _hookCommand(STATUSLINE_REL, scope, projectRoot);
|
|
219
263
|
const ctxMonitorCmd = _hookCommand(CTX_MONITOR_REL, scope, projectRoot);
|
|
@@ -222,6 +266,7 @@ function installClaudeHooks(opts) {
|
|
|
222
266
|
const statuslineAbs = path.join(base, STATUSLINE_REL);
|
|
223
267
|
const ctxMonitorAbs = path.join(base, CTX_MONITOR_REL);
|
|
224
268
|
const securityAbs = path.join(base, SECURITY_HOOK_REL);
|
|
269
|
+
const learningsAbs = path.join(base, LEARNINGS_HOOK_REL);
|
|
225
270
|
|
|
226
271
|
if (wantStatusline) {
|
|
227
272
|
if (!fs.existsSync(statuslineAbs)) {
|
|
@@ -250,6 +295,15 @@ function installClaudeHooks(opts) {
|
|
|
250
295
|
);
|
|
251
296
|
}
|
|
252
297
|
}
|
|
298
|
+
if (wantLearnings) {
|
|
299
|
+
if (!fs.existsSync(learningsAbs)) {
|
|
300
|
+
throw new NubosPilotError(
|
|
301
|
+
'claude-hooks-script-missing',
|
|
302
|
+
'Learnings hook script not found: ' + learningsAbs,
|
|
303
|
+
{ script: learningsAbs },
|
|
304
|
+
);
|
|
305
|
+
}
|
|
306
|
+
}
|
|
253
307
|
|
|
254
308
|
fs.mkdirSync(path.dirname(settingsPath), { recursive: true });
|
|
255
309
|
|
|
@@ -266,6 +320,9 @@ function installClaudeHooks(opts) {
|
|
|
266
320
|
if (wantSecurity) {
|
|
267
321
|
results.security = _installSecurity(settings, scope, projectRoot);
|
|
268
322
|
}
|
|
323
|
+
if (wantLearnings) {
|
|
324
|
+
results.learnings = _installLearnings(settings, scope, projectRoot);
|
|
325
|
+
}
|
|
269
326
|
|
|
270
327
|
if (o.dryRun) return { dryRun: true, path: settingsPath, results, settings };
|
|
271
328
|
|
|
@@ -279,7 +336,7 @@ function uninstallClaudeHooks(opts) {
|
|
|
279
336
|
const projectRoot = o.projectRoot || process.cwd();
|
|
280
337
|
const scope = o.scope === 'global' ? 'global' : 'local';
|
|
281
338
|
const settingsPath = _settingsPath(scope, projectRoot);
|
|
282
|
-
if (!fs.existsSync(settingsPath)) return { path: settingsPath, results: { statusline: { action: 'absent' }, ctxMonitor: { action: 'absent' }, security: { action: 'absent' } } };
|
|
339
|
+
if (!fs.existsSync(settingsPath)) return { path: settingsPath, results: { statusline: { action: 'absent' }, ctxMonitor: { action: 'absent' }, security: { action: 'absent' }, learnings: { action: 'absent' } } };
|
|
283
340
|
|
|
284
341
|
return withFileLock(settingsPath, () => {
|
|
285
342
|
const settings = _readJsonSafe(settingsPath);
|
|
@@ -287,6 +344,7 @@ function uninstallClaudeHooks(opts) {
|
|
|
287
344
|
statusline: _removeStatusLine(settings),
|
|
288
345
|
ctxMonitor: _removePostToolUse(settings),
|
|
289
346
|
security: _removeSecurity(settings),
|
|
347
|
+
learnings: _removeLearnings(settings),
|
|
290
348
|
};
|
|
291
349
|
if (o.dryRun) return { dryRun: true, path: settingsPath, results, settings };
|
|
292
350
|
atomicWriteFileSync(settingsPath, JSON.stringify(settings, null, 2) + '\n');
|
|
@@ -304,6 +362,9 @@ module.exports = {
|
|
|
304
362
|
NP_CTX_MONITOR_MARKER,
|
|
305
363
|
NP_SECURITY_MARKER,
|
|
306
364
|
SECURITY_HOOKS,
|
|
365
|
+
LEARNINGS_HOOK_REL,
|
|
366
|
+
NP_LEARNINGS_MARKER,
|
|
367
|
+
LEARNINGS_HOOKS,
|
|
307
368
|
_settingsPath,
|
|
308
369
|
_hookCommand,
|
|
309
370
|
};
|
|
@@ -230,7 +230,7 @@ function _mkSandboxAll() {
|
|
|
230
230
|
const dir = fs.mkdtempSync(path.join(os.tmpdir(), 'np-claude-hooks-all-'));
|
|
231
231
|
const hooksDir = path.join(dir, '.claude', 'nubos-pilot', 'hooks');
|
|
232
232
|
fs.mkdirSync(hooksDir, { recursive: true });
|
|
233
|
-
for (const f of ['np-statusline.cjs', 'np-ctx-monitor.cjs', 'np-security-hook.cjs']) {
|
|
233
|
+
for (const f of ['np-statusline.cjs', 'np-ctx-monitor.cjs', 'np-security-hook.cjs', 'np-learnings-hook.cjs']) {
|
|
234
234
|
fs.writeFileSync(path.join(hooksDir, f), '// stub\n');
|
|
235
235
|
}
|
|
236
236
|
return dir;
|
|
@@ -269,7 +269,10 @@ test('claude-hooks SEC: re-install is idempotent (no duplicate entries)', () =>
|
|
|
269
269
|
assert.equal(res2.results.security.scan.action, 'updated');
|
|
270
270
|
const s = JSON.parse(fs.readFileSync(res2.path, 'utf-8'));
|
|
271
271
|
assert.equal(s.hooks.SessionStart.length, 1);
|
|
272
|
-
|
|
272
|
+
// Stop now carries the security 'review' hook + the learnings 'capture' hook (which=all installs both).
|
|
273
|
+
assert.equal(s.hooks.Stop.length, 2);
|
|
274
|
+
assert.equal(s.hooks.Stop.filter((e) => e.hooks[0].command.includes('np-security-hook.')).length, 1);
|
|
275
|
+
assert.equal(s.hooks.Stop.filter((e) => e.hooks[0].command.includes('np-learnings-hook.')).length, 1);
|
|
273
276
|
assert.equal(s.hooks.PostToolUse.filter((e) => e.hooks[0].command.includes('np-security-hook.')).length, 2);
|
|
274
277
|
} finally {
|
|
275
278
|
fs.rmSync(dir, { recursive: true, force: true });
|