@lamentis/naome 1.4.0 → 1.4.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/Cargo.lock +2 -2
- package/README.md +17 -122
- package/crates/naome-cli/Cargo.toml +1 -1
- package/crates/naome-cli/src/main.rs +13 -0
- package/crates/naome-cli/src/task_commands/can_edit.rs +116 -0
- package/crates/naome-cli/src/task_commands/check_run/output.rs +34 -0
- package/crates/naome-cli/src/task_commands/check_run/receipts.rs +155 -0
- package/crates/naome-cli/src/task_commands/check_run/verification.rs +165 -0
- package/crates/naome-cli/src/task_commands/check_run.rs +192 -0
- package/crates/naome-cli/src/task_commands/common.rs +70 -0
- package/crates/naome-cli/src/task_commands/complete.rs +43 -0
- package/crates/naome-cli/src/task_commands/loop_control.rs +55 -0
- package/crates/naome-cli/src/task_commands/readiness.rs +44 -0
- package/crates/naome-cli/src/task_commands/record.rs +236 -0
- package/crates/naome-cli/src/task_commands/repair.rs +77 -0
- package/crates/naome-cli/src/task_commands/scope_request.rs +24 -0
- package/crates/naome-cli/src/task_commands/timeline.rs +71 -0
- package/crates/naome-cli/src/task_commands.rs +80 -1
- package/crates/naome-cli/tests/task_cli.rs +58 -0
- package/crates/naome-cli/tests/task_cli_agent_controls.rs +210 -0
- package/crates/naome-cli/tests/task_cli_control.rs +126 -0
- package/crates/naome-cli/tests/task_cli_loop.rs +383 -0
- package/crates/naome-cli/tests/task_cli_loop_edit.rs +144 -0
- package/crates/naome-cli/tests/task_cli_support/mod.rs +178 -0
- package/crates/naome-core/Cargo.toml +1 -1
- package/crates/naome-core/src/lib.rs +7 -2
- package/crates/naome-core/src/task_state/evidence_fingerprint.rs +47 -0
- package/crates/naome-core/src/task_state/mod.rs +12 -0
- package/crates/naome-core/src/task_state/status/agent_model.rs +76 -0
- package/crates/naome-core/src/task_state/status/control/action.rs +87 -0
- package/crates/naome-core/src/task_state/status/control/exit_code.rs +32 -0
- package/crates/naome-core/src/task_state/status/control/loop_state.rs +70 -0
- package/crates/naome-core/src/task_state/status/control/policy.rs +31 -0
- package/crates/naome-core/src/task_state/status/control/proof_recording.rs +25 -0
- package/crates/naome-core/src/task_state/status/control/recovery.rs +19 -0
- package/crates/naome-core/src/task_state/status/control/repair.rs +125 -0
- package/crates/naome-core/src/task_state/status/control/shared.rs +25 -0
- package/crates/naome-core/src/task_state/status/control.rs +16 -0
- package/crates/naome-core/src/task_state/status/git.rs +133 -0
- package/crates/naome-core/src/task_state/status/model.rs +152 -0
- package/crates/naome-core/src/task_state/status/proof.rs +217 -0
- package/crates/naome-core/src/task_state/status/proof_read.rs +164 -0
- package/crates/naome-core/src/task_state/status/report.rs +148 -0
- package/crates/naome-core/src/task_state/status/report_context.rs +148 -0
- package/crates/naome-core/src/task_state/status/report_support.rs +117 -0
- package/crates/naome-core/src/task_state/status/scope.rs +111 -0
- package/crates/naome-core/src/task_state/status/transition.rs +101 -0
- package/crates/naome-core/src/task_state/status.rs +23 -0
- package/crates/naome-core/src/task_state/status_output.rs +103 -0
- package/crates/naome-core/tests/task_state_support/mod.rs +15 -1
- package/crates/naome-core/tests/task_state_support/states.rs +4 -0
- package/crates/naome-core/tests/task_status.rs +423 -0
- package/crates/naome-core/tests/task_status_git.rs +141 -0
- package/installer/context.js +1 -1
- package/installer/harness-verification.js +2 -6
- package/installer/manifest-state.js +2 -2
- package/installer/native.js +3 -31
- package/native/darwin-arm64/naome +0 -0
- package/native/linux-x64/naome +0 -0
- package/package.json +1 -1
- package/templates/naome-root/.naome/bin/check-harness-health.js +2 -2
- package/templates/naome-root/.naome/bin/check-task-state.js +4 -39
- package/templates/naome-root/.naome/bin/naome.js +2 -30
- package/templates/naome-root/.naome/manifest.json +2 -2
|
@@ -0,0 +1,383 @@
|
|
|
1
|
+
use std::fs;
|
|
2
|
+
use std::process::Command;
|
|
3
|
+
|
|
4
|
+
use serde_json::{json, Value};
|
|
5
|
+
|
|
6
|
+
mod task_cli_support;
|
|
7
|
+
|
|
8
|
+
use task_cli_support::{
|
|
9
|
+
active_task, fixture_root, git, init_git, run_json, task_state, task_state_with_active_task,
|
|
10
|
+
write_fixture_file, write_verification_checks,
|
|
11
|
+
};
|
|
12
|
+
|
|
13
|
+
/// `task run-check` reports an unknown check id without executing anything,
/// then runs `diff-check` with `--record-proof` and persists the proof
/// (agent session, command, cwd) into `.naome/task-state.json`.
#[test]
fn run_check_rejects_unknown_and_records_successful_safe_checks() {
    let root = fixture_root(task_state());
    init_git(&root);
    write_fixture_file(&root, "README.md", "changed\n");

    // "missing" is not among the checks the fixture writes to verification.json.
    let unknown = run_json(&root, ["task", "run-check", "--check", "missing", "--json"]);
    assert_eq!(unknown["schema"].as_str(), Some("naome.task.run-check.v1"));
    assert_eq!(unknown["executed"].as_bool(), Some(false));
    assert_eq!(
        unknown["findings"][0]["id"].as_str(),
        Some("task.check.unknown")
    );

    let record_args = [
        "task",
        "run-check",
        "--check",
        "diff-check",
        "--record-proof",
        "--json",
        "--agent-session",
        "loop-a",
    ];
    let result = run_json(&root, record_args);
    assert_eq!(result["executed"].as_bool(), Some(true));
    assert_eq!(result["exitCode"].as_i64(), Some(0));
    assert_eq!(result["recordedProof"].as_bool(), Some(true));
    assert_eq!(result["agentSession"].as_str(), Some("loop-a"));

    // Re-read the state file from disk to confirm the proof was persisted.
    let persisted_text = fs::read_to_string(root.join(".naome/task-state.json")).unwrap();
    let persisted: Value = serde_json::from_str(&persisted_text).unwrap();
    let first_proof = &persisted["activeTask"]["proofBatches"][0]["proofs"][0];
    assert_eq!(first_proof["agentSession"], "loop-a");
    assert_eq!(first_proof["command"], "git diff --check");
    assert_eq!(first_proof["cwd"], ".");
}
|
|
58
|
+
|
|
59
|
+
/// `task record-proof --from-proof-plan` must not record anything when no
/// check run precedes it; the first finding is `task.proof.no_recent_success`.
#[test]
fn record_proof_requires_recent_success_evidence() {
    let root = fixture_root(task_state());
    init_git(&root);
    write_fixture_file(&root, "README.md", "changed\n");

    // No `run-check` invocation happens before this call.
    let record_args = ["task", "record-proof", "--from-proof-plan", "--json"];
    let outcome = run_json(&root, record_args);

    assert_eq!(outcome["recorded"].as_bool(), Some(false));
    let first_finding = &outcome["findings"][0];
    assert_eq!(
        first_finding["id"].as_str(),
        Some("task.proof.no_recent_success")
    );
}
|
|
76
|
+
|
|
77
|
+
/// A successful check run followed by a content change to the same path must
/// not be usable as proof: `record-proof` reports `task.proof.no_recent_success`.
#[test]
fn record_proof_rejects_receipts_from_older_same_path_content() {
    let root = fixture_root(task_state());
    init_git(&root);
    write_fixture_file(&root, "README.md", "changed\n");

    // First run succeeds against the clean edit.
    let check_args = ["task", "run-check", "--check", "diff-check", "--json"];
    let first_run = run_json(&root, check_args);
    assert_eq!(first_run["executed"].as_bool(), Some(true));
    assert_eq!(first_run["exitCode"].as_i64(), Some(0));

    // Rewrite the same file with different content after the check ran.
    write_fixture_file(&root, "README.md", "changed with trailing whitespace \n");
    let record_args = ["task", "record-proof", "--from-proof-plan", "--json"];
    let outcome = run_json(&root, record_args);

    assert_eq!(outcome["recorded"].as_bool(), Some(false));
    let first_finding = &outcome["findings"][0];
    assert_eq!(
        first_finding["id"].as_str(),
        Some("task.proof.no_recent_success")
    );
}
|
|
102
|
+
|
|
103
|
+
/// A successful run of `diff-check` must not count as proof once the check's
/// definition in `.naome/verification.json` has been replaced and committed.
#[test]
fn record_proof_rejects_receipts_from_old_check_metadata() {
    let root = fixture_root(task_state());
    init_git(&root);
    write_fixture_file(&root, "README.md", "changed\n");

    let check_args = ["task", "run-check", "--check", "diff-check", "--json"];
    let first_run = run_json(&root, check_args);
    assert_eq!(first_run["executed"].as_bool(), Some(true));
    assert_eq!(first_run["exitCode"].as_i64(), Some(0));

    // Same check id, different command: the earlier run was made under the old definition.
    let redefined_check = json!({
        "id": "diff-check",
        "command": "node .naome/bin/naome.js quality check --changed",
        "cwd": ".",
        "purpose": "Updated check command.",
        "cost": "fast",
        "source": "test",
        "evidence": ["README.md"],
        "lastVerified": null
    });
    write_verification_checks(&root, json!([redefined_check]));
    git(&root, ["add", ".naome/verification.json"]);
    git(&root, ["commit", "-m", "update verification metadata"]);

    let record_args = ["task", "record-proof", "--from-proof-plan", "--json"];
    let outcome = run_json(&root, record_args);

    assert_eq!(outcome["recorded"].as_bool(), Some(false));
    let first_finding = &outcome["findings"][0];
    assert_eq!(
        first_finding["id"].as_str(),
        Some("task.proof.no_recent_success")
    );
}
|
|
143
|
+
|
|
144
|
+
/// Stages a README with trailing whitespace and expects `diff-check` to run,
/// exit non-zero, record no proof, and mention "trailing whitespace" in its
/// stdout summary.
#[test]
fn run_check_diff_check_covers_staged_diff() {
    let root = fixture_root(task_state());
    init_git(&root);
    write_fixture_file(&root, "README.md", "staged trailing whitespace \n");
    // The offending change lives only in the index.
    git(&root, ["add", "README.md"]);

    let check_args = [
        "task",
        "run-check",
        "--check",
        "diff-check",
        "--record-proof",
        "--json",
    ];
    let result = run_json(&root, check_args);

    assert_eq!(result["executed"].as_bool(), Some(true));
    assert_ne!(result["exitCode"].as_i64(), Some(0));
    assert_eq!(result["recordedProof"].as_bool(), Some(false));
    // A missing or non-string summary counts as a failure, same as an empty one.
    let summary = result["stdoutSummary"].as_str().unwrap_or_default();
    assert!(summary.contains("trailing whitespace"));
}
|
|
170
|
+
|
|
171
|
+
/// `task repair --execute-safe` must not execute a plan that removes an
/// out-of-scope change (it requires user approval), but does execute a plan
/// that merely reruns `diff-check`.
#[test]
fn repair_execute_safe_runs_checks_but_refuses_scope_repairs() {
    let root = fixture_root(task_state());
    init_git(&root);
    write_fixture_file(&root, "README.md", "changed\n");
    // `src/lib.rs` is not listed in the default task's allowed paths.
    write_fixture_file(&root, "src/lib.rs", "outside\n");

    let scope_args = [
        "task",
        "repair",
        "--plan",
        "remove_out_of_scope_change_src_lib_rs",
        "--execute-safe",
        "--json",
    ];
    let scope = run_json(&root, scope_args);
    assert_eq!(scope["executed"].as_bool(), Some(false));
    assert_eq!(scope["requiresUserApproval"].as_bool(), Some(true));

    // Remove the out-of-scope file by hand before asking for the check rerun.
    let outside_file = root.join("src/lib.rs");
    fs::remove_file(outside_file).unwrap();

    let rerun_args = [
        "task",
        "repair",
        "--plan",
        "rerun_diff-check",
        "--execute-safe",
        "--json",
    ];
    let check = run_json(&root, rerun_args);
    assert_eq!(check["executed"].as_bool(), Some(true));
    assert_eq!(
        check["steps"][0]["schema"].as_str(),
        Some("naome.task.run-check.v1")
    );
}
|
|
207
|
+
|
|
208
|
+
/// Two refusals of `task repair`: combining `--dry-run` with `--execute-safe`
/// fails the process (stderr mentions `--dry-run`), and a rerun plan for a
/// check whose command is `sh -c ...` is not executed and needs user approval.
#[test]
fn repair_execute_safe_rejects_dry_run_combo_and_unsafe_check_plans() {
    let overrides = json!({
        "requiredCheckIds": ["unsafe-check"],
        "proofResults": []
    });
    let root = fixture_root(task_state_with_active_task(active_task(overrides)));
    let unsafe_check = json!({
        "id": "unsafe-check",
        "command": "sh -c 'echo unsafe'",
        "cwd": ".",
        "purpose": "Unsafe check for repair planning tests.",
        "cost": "fast",
        "source": "test",
        "evidence": ["README.md"],
        "lastVerified": null
    });
    write_verification_checks(&root, json!([unsafe_check]));
    init_git(&root);
    write_fixture_file(&root, "README.md", "changed\n");

    // Invoked directly because `run_json` asserts a successful exit status.
    let mut combo_command = Command::new(env!("CARGO_BIN_EXE_naome"));
    combo_command
        .args([
            "task",
            "repair",
            "--plan",
            "rerun_unsafe-check",
            "--dry-run",
            "--execute-safe",
            "--json",
        ])
        .current_dir(&root);
    let combo = combo_command.output().unwrap();
    assert!(!combo.status.success());
    let combo_stderr = String::from_utf8_lossy(&combo.stderr);
    assert!(combo_stderr.contains("--dry-run"));

    let repair_args = [
        "task",
        "repair",
        "--plan",
        "rerun_unsafe-check",
        "--execute-safe",
        "--json",
    ];
    let unsafe_repair = run_json(&root, repair_args);
    assert_eq!(unsafe_repair["executed"].as_bool(), Some(false));
    assert_eq!(unsafe_repair["requiresUserApproval"].as_bool(), Some(true));
    let steps = unsafe_repair["steps"].as_array().unwrap();
    assert!(steps.is_empty());
}
|
|
261
|
+
|
|
262
|
+
/// An `npm run` check must not be executed when `package.json`, which defines
/// the script being run, has itself been changed by the task.
///
/// The `package.json` written here is created after the baseline commit made
/// by `init_git`, so it is a change relative to that commit.
#[test]
fn run_check_rejects_changed_npm_scripts_from_safe_execution() {
    let root = fixture_root(task_state_with_active_task(active_task(json!({
        "requiredCheckIds": ["task-state-tests"],
        "allowedPaths": ["package.json"],
        "proofResults": []
    }))));
    write_verification_checks(
        &root,
        json!([{
            "id": "task-state-tests",
            "command": "npm run test:task-state",
            "cwd": ".",
            "purpose": "Task-state regression tests.",
            "cost": "medium",
            "source": "test",
            "evidence": ["package.json"],
            "lastVerified": null
        }]),
    );
    init_git(&root);
    // The script value must be a terminated JSON string. The previous literal
    // lacked the closing quote, producing an unparseable package.json, so the
    // rejection could be triggered by the malformed manifest rather than by
    // the changed script this test is about.
    write_fixture_file(
        &root,
        "package.json",
        r#"{"scripts":{"test:task-state":"node -e \"process.exit(0)\""}}"#,
    );

    let result = run_json(
        &root,
        ["task", "run-check", "--check", "task-state-tests", "--json"],
    );

    assert_eq!(result["executed"], false);
    assert_eq!(result["findings"][0]["id"], "task.check.unsafe_command");
}
|
|
297
|
+
|
|
298
|
+
/// A check whose command is `npm run pack:dry-run` is refused by
/// `task run-check`: nothing is executed and the first finding is
/// `task.check.unsafe_command`.
#[test]
fn run_check_rejects_pack_dry_run_as_not_read_only() {
    let overrides = json!({
        "requiredCheckIds": ["package-dry-run"],
        "proofResults": []
    });
    let root = fixture_root(task_state_with_active_task(active_task(overrides)));
    let pack_check = json!({
        "id": "package-dry-run",
        "command": "npm run pack:dry-run",
        "cwd": ".",
        "purpose": "Package dry run.",
        "cost": "medium",
        "source": "test",
        "evidence": ["README.md"],
        "lastVerified": null
    });
    write_verification_checks(&root, json!([pack_check]));
    init_git(&root);
    write_fixture_file(&root, "README.md", "changed\n");

    let check_args = ["task", "run-check", "--check", "package-dry-run", "--json"];
    let result = run_json(&root, check_args);

    assert_eq!(result["executed"].as_bool(), Some(false));
    let first_finding = &result["findings"][0];
    assert_eq!(
        first_finding["id"].as_str(),
        Some("task.check.unsafe_command")
    );
}
|
|
328
|
+
|
|
329
|
+
/// Walks a task through `task loop`: the plain invocation only reports the
/// missing `diff-check`, `--execute-safe` runs it and records proof, and
/// `task complete --from-can-transition` then marks the state file complete.
#[test]
fn task_loop_read_only_and_execute_safe_drive_proof_to_completion() {
    let root = fixture_root(task_state());
    init_git(&root);
    write_fixture_file(&root, "README.md", "changed\n");

    // Without `--execute-safe` the loop executes no steps.
    let read_only = run_json(&root, ["task", "loop", "--json"]);
    assert_eq!(read_only["schema"].as_str(), Some("naome.task.loop.v1"));
    assert_eq!(read_only["mode"].as_str(), Some("read_only"));
    let read_only_steps = read_only["executedSteps"].as_array().unwrap();
    assert!(read_only_steps.is_empty());
    let missing_checks = &read_only["status"]["proof"]["missingChecks"];
    assert_eq!(*missing_checks, json!(["diff-check"]));

    let executed = run_json(&root, ["task", "loop", "--execute-safe", "--json"]);
    assert_eq!(executed["mode"].as_str(), Some("execute_safe"));
    let first_step = &executed["executedSteps"][0];
    assert_eq!(first_step["schema"].as_str(), Some("naome.task.run-check.v1"));
    assert_eq!(first_step["recordedProof"].as_bool(), Some(true));

    let complete_args = ["task", "complete", "--from-can-transition", "--json"];
    let completed = run_json(&root, complete_args);
    assert_eq!(completed["schema"].as_str(), Some("naome.task.complete.v1"));
    assert_eq!(completed["completed"].as_bool(), Some(true));

    // The completion must also be visible in the state file on disk.
    let persisted_text = fs::read_to_string(root.join(".naome/task-state.json")).unwrap();
    let persisted: Value = serde_json::from_str(&persisted_text).unwrap();
    assert_eq!(persisted["status"].as_str(), Some("complete"));
}
|
|
364
|
+
|
|
365
|
+
/// `task complete --from-can-transition` must refuse to complete a task whose
/// required check has no proof; the first blocking finding is
/// `task.proof.missing_check`.
#[test]
fn complete_blocks_when_transition_is_not_allowed() {
    let overrides = json!({
        "proofResults": []
    });
    let root = fixture_root(task_state_with_active_task(active_task(overrides)));
    init_git(&root);
    write_fixture_file(&root, "README.md", "changed\n");

    // No check has been run, so the transition must be blocked.
    let complete_args = ["task", "complete", "--from-can-transition", "--json"];
    let outcome = run_json(&root, complete_args);

    assert_eq!(outcome["completed"].as_bool(), Some(false));
    let first_blocker = &outcome["blockingFindings"][0];
    assert_eq!(
        first_blocker["id"].as_str(),
        Some("task.proof.missing_check")
    );
}
|
|
@@ -0,0 +1,144 @@
|
|
|
1
|
+
use std::process::Command;
|
|
2
|
+
|
|
3
|
+
mod task_cli_support;
|
|
4
|
+
|
|
5
|
+
use serde_json::json;
|
|
6
|
+
|
|
7
|
+
use task_cli_support::{
|
|
8
|
+
active_task, fixture_root, init_git, run_json, task_state, task_state_with_active_task,
|
|
9
|
+
write_fixture_file,
|
|
10
|
+
};
|
|
11
|
+
|
|
12
|
+
/// Exercises `task can-edit` against one allowed path and each rejection
/// class: out-of-scope, unsafe (traversal, backslash traversal, absolute),
/// and control files.
#[test]
fn can_edit_allows_in_scope_and_blocks_unsafe_paths() {
    let root = fixture_root(task_state());
    init_git(&root);

    // Every probe differs only in the `--path` value.
    let can_edit = |path: &str| run_json(&root, ["task", "can-edit", "--path", path, "--json"]);

    let allowed = can_edit("README.md");
    assert_eq!(allowed["schema"], "naome.task.can-edit.v1");
    assert_eq!(allowed["path"], "README.md");
    assert_eq!(allowed["allowed"], true);

    let outside = can_edit("src/lib.rs");
    assert_eq!(outside["allowed"], false);
    assert_eq!(outside["findings"][0]["id"], "task.edit.out_of_scope");

    // Parent traversal with either separator, and absolute paths.
    for unsafe_path in ["../README.md", "..\\README.md", "/tmp/file.rs"] {
        let verdict = can_edit(unsafe_path);
        assert_eq!(verdict["allowed"], false);
        assert_eq!(verdict["findings"][0]["id"], "task.edit.unsafe_path");
    }

    // Control files are reported under their own finding id.
    for control_path in [".naome/task-state.json", ".naomeignore"] {
        let verdict = can_edit(control_path);
        assert_eq!(verdict["allowed"], false);
        assert_eq!(verdict["findings"][0]["id"], "task.edit.control_path");
    }
}
|
|
76
|
+
|
|
77
|
+
/// Three independent fixtures for `task can-edit`: a path under an ignored
/// directory is rejected even with `**` allowed, a `scripts/*.js` pattern
/// admits `scripts/check.js`, and a task in `blocked` status rejects edits
/// with `task.edit.no_active_task`.
#[test]
fn can_edit_honors_ignore_directories_wildcards_and_blocked_states() {
    // Fixture 1: everything allowed, but `dist/` is listed in .naomeignore.
    let ignore_overrides = json!({
        "allowedPaths": ["**"]
    });
    let root = fixture_root(task_state_with_active_task(active_task(ignore_overrides)));
    let ignore_file = root.join(".naomeignore");
    std::fs::write(ignore_file, ".naome/archive/\n.naome/tasks/\ndist/\n").unwrap();
    init_git(&root);
    write_fixture_file(&root, "dist/bundle.js", "generated\n");

    let ignored_args = ["task", "can-edit", "--path", "dist/bundle.js", "--json"];
    let ignored = run_json(&root, ignored_args);
    assert_eq!(ignored["allowed"].as_bool(), Some(false));
    assert_eq!(
        ignored["findings"][0]["id"].as_str(),
        Some("task.edit.ignored_path")
    );

    // Fixture 2: a single-segment wildcard in allowedPaths.
    let wildcard_overrides = json!({
        "allowedPaths": ["scripts/*.js"]
    });
    let wildcard_root =
        fixture_root(task_state_with_active_task(active_task(wildcard_overrides)));
    init_git(&wildcard_root);
    let wildcard_args = ["task", "can-edit", "--path", "scripts/check.js", "--json"];
    let wildcard = run_json(&wildcard_root, wildcard_args);
    assert_eq!(wildcard["allowed"].as_bool(), Some(true));

    // Fixture 3: flip both status fields to "blocked" before committing.
    let blocked_overrides = json!({
        "allowedPaths": ["README.md"]
    });
    let blocked_root = fixture_root(task_state_with_active_task(active_task(blocked_overrides)));
    let state_text =
        std::fs::read_to_string(blocked_root.join(".naome/task-state.json")).unwrap();
    let mut state: serde_json::Value = serde_json::from_str(&state_text).unwrap();
    state["status"] = json!("blocked");
    state["activeTask"]["status"] = json!("blocked");
    task_cli_support::write_json(&blocked_root, ".naome/task-state.json", &state);
    init_git(&blocked_root);

    let blocked_args = ["task", "can-edit", "--path", "README.md", "--json"];
    let blocked = run_json(&blocked_root, blocked_args);
    assert_eq!(blocked["allowed"].as_bool(), Some(false));
    assert_eq!(
        blocked["findings"][0]["id"].as_str(),
        Some("task.edit.no_active_task")
    );
}
|
|
125
|
+
|
|
126
|
+
/// A well-formed `--agent-session` value is echoed in the JSON output, while
/// `../bad` makes the process fail with a stderr message naming the flag.
#[test]
fn agent_session_is_validated_and_reflected_in_json() {
    let root = fixture_root(task_state());
    init_git(&root);

    let status_args = ["task", "status", "--json", "--agent-session", "agent-42"];
    let status = run_json(&root, status_args);
    assert_eq!(status["agentSession"].as_str(), Some("agent-42"));

    // Invoked directly because `run_json` asserts a successful exit status.
    let mut rejected_command = Command::new(env!("CARGO_BIN_EXE_naome"));
    rejected_command
        .args(["task", "status", "--json", "--agent-session", "../bad"])
        .current_dir(&root);
    let rejected = rejected_command.output().unwrap();
    assert!(!rejected.status.success());
    let rejected_stderr = String::from_utf8_lossy(&rejected.stderr);
    assert!(rejected_stderr.contains("agent-session"));
}
|
|
@@ -0,0 +1,178 @@
|
|
|
1
|
+
#![allow(dead_code)]
|
|
2
|
+
|
|
3
|
+
use std::fs;
|
|
4
|
+
use std::process::Command;
|
|
5
|
+
use std::sync::atomic::{AtomicU64, Ordering};
|
|
6
|
+
use std::time::{SystemTime, UNIX_EPOCH};
|
|
7
|
+
|
|
8
|
+
use serde_json::{json, Value};
|
|
9
|
+
|
|
10
|
+
static FIXTURE_COUNTER: AtomicU64 = AtomicU64::new(0);
|
|
11
|
+
|
|
12
|
+
pub fn task_state() -> Value {
|
|
13
|
+
task_state_with_active_task(active_task(json!({ "proofResults": [] })))
|
|
14
|
+
}
|
|
15
|
+
|
|
16
|
+
pub fn task_state_with_active_task(active_task: Value) -> Value {
|
|
17
|
+
let mut state: Value = serde_json::from_str(include_str!(
|
|
18
|
+
"../../../../templates/naome-root/.naome/task-state.json"
|
|
19
|
+
))
|
|
20
|
+
.unwrap();
|
|
21
|
+
state["status"] = json!("implementing");
|
|
22
|
+
state["activeTask"] = active_task;
|
|
23
|
+
state["updatedAt"] = json!("2026-05-04T12:00:00.000Z");
|
|
24
|
+
state
|
|
25
|
+
}
|
|
26
|
+
|
|
27
|
+
pub fn active_task(overrides: Value) -> Value {
|
|
28
|
+
let mut task = json!({
|
|
29
|
+
"id": "cli-task",
|
|
30
|
+
"request": "Exercise task CLI.",
|
|
31
|
+
"userPrompt": {
|
|
32
|
+
"receivedAt": "2026-05-04T12:00:00.000Z",
|
|
33
|
+
"text": "Exercise task CLI."
|
|
34
|
+
},
|
|
35
|
+
"admission": {
|
|
36
|
+
"command": "node .naome/bin/check-task-state.js --admission",
|
|
37
|
+
"cwd": ".",
|
|
38
|
+
"exitCode": 0,
|
|
39
|
+
"checkedAt": "2026-05-04T12:00:00.000Z",
|
|
40
|
+
"gitHead": "pending-test-head",
|
|
41
|
+
"changedPaths": []
|
|
42
|
+
},
|
|
43
|
+
"allowedPaths": ["README.md"],
|
|
44
|
+
"declaredChangeTypes": ["docs"],
|
|
45
|
+
"requiredCheckIds": ["diff-check"],
|
|
46
|
+
"humanReview": {
|
|
47
|
+
"required": false,
|
|
48
|
+
"approved": false,
|
|
49
|
+
"reason": null
|
|
50
|
+
}
|
|
51
|
+
});
|
|
52
|
+
for (key, value) in overrides.as_object().unwrap() {
|
|
53
|
+
task.as_object_mut()
|
|
54
|
+
.unwrap()
|
|
55
|
+
.insert(key.clone(), value.clone());
|
|
56
|
+
}
|
|
57
|
+
task
|
|
58
|
+
}
|
|
59
|
+
|
|
60
|
+
pub fn successful_proof(evidence: Value) -> Value {
|
|
61
|
+
json!({
|
|
62
|
+
"checkId": "diff-check",
|
|
63
|
+
"command": "git diff --check",
|
|
64
|
+
"cwd": ".",
|
|
65
|
+
"exitCode": 0,
|
|
66
|
+
"checkedAt": "2026-05-04T12:00:00.000Z",
|
|
67
|
+
"evidence": evidence
|
|
68
|
+
})
|
|
69
|
+
}
|
|
70
|
+
|
|
71
|
+
pub fn fixture_root(task_state: Value) -> std::path::PathBuf {
|
|
72
|
+
let nonce = SystemTime::now()
|
|
73
|
+
.duration_since(UNIX_EPOCH)
|
|
74
|
+
.unwrap()
|
|
75
|
+
.as_nanos();
|
|
76
|
+
let counter = FIXTURE_COUNTER.fetch_add(1, Ordering::Relaxed);
|
|
77
|
+
let root = std::env::temp_dir().join(format!(
|
|
78
|
+
"naome-task-cli-fixture-{}-{nonce}-{counter}",
|
|
79
|
+
std::process::id()
|
|
80
|
+
));
|
|
81
|
+
fs::create_dir_all(root.join(".naome")).unwrap();
|
|
82
|
+
fs::write(
|
|
83
|
+
root.join(".naomeignore"),
|
|
84
|
+
".naome/archive/\n.naome/tasks/\n",
|
|
85
|
+
)
|
|
86
|
+
.unwrap();
|
|
87
|
+
write_json(&root, ".naome/task-state.json", &task_state);
|
|
88
|
+
write_json(&root, ".naome/verification.json", &verification());
|
|
89
|
+
write_fixture_file(&root, "README.md", "initial\n");
|
|
90
|
+
root
|
|
91
|
+
}
|
|
92
|
+
|
|
93
|
+
pub fn init_git(root: &std::path::Path) {
|
|
94
|
+
git(root, ["init"]);
|
|
95
|
+
git(root, ["config", "user.email", "naome@example.com"]);
|
|
96
|
+
git(root, ["config", "user.name", "NAOME Test"]);
|
|
97
|
+
git(root, ["add", "."]);
|
|
98
|
+
git(root, ["commit", "-m", "baseline"]);
|
|
99
|
+
let head = git(root, ["rev-parse", "HEAD"]).trim().to_string();
|
|
100
|
+
let path = root.join(".naome/task-state.json");
|
|
101
|
+
let mut state: Value = serde_json::from_str(&fs::read_to_string(&path).unwrap()).unwrap();
|
|
102
|
+
state["activeTask"]["admission"]["gitHead"] = json!(head);
|
|
103
|
+
write_json(root, ".naome/task-state.json", &state);
|
|
104
|
+
}
|
|
105
|
+
|
|
106
|
+
/// Runs `git <args>` with `root` as the working directory and returns its
/// stdout (lossily decoded as UTF-8).
///
/// Panics if git cannot be spawned or exits unsuccessfully. The panic message
/// names the arguments and directory and includes both output streams, so a
/// failing fixture step can be identified from the test log alone.
pub fn git<const N: usize>(root: &std::path::Path, args: [&str; N]) -> String {
    let output = Command::new("git")
        .args(args)
        .current_dir(root)
        .output()
        .unwrap_or_else(|error| panic!("failed to spawn git {args:?}: {error}"));
    assert!(
        output.status.success(),
        "git {args:?} failed in {} ({})\nstdout:\n{}\nstderr:\n{}",
        root.display(),
        output.status,
        String::from_utf8_lossy(&output.stdout),
        String::from_utf8_lossy(&output.stderr)
    );
    String::from_utf8_lossy(&output.stdout).into_owned()
}
|
|
119
|
+
|
|
120
|
+
/// Writes `content` to `root/path`, creating any missing parent directories
/// and replacing an existing file.
///
/// Panics with the offending path in the message if a directory cannot be
/// created or the file cannot be written.
pub fn write_fixture_file(root: &std::path::Path, path: &str, content: &str) {
    let target = root.join(path);
    // A target without a parent component has no directory to create; the
    // write below then reports the failure with the path attached.
    if let Some(parent) = target.parent() {
        fs::create_dir_all(parent).unwrap_or_else(|error| {
            panic!("failed to create directory {}: {error}", parent.display())
        });
    }
    fs::write(&target, content)
        .unwrap_or_else(|error| panic!("failed to write {}: {error}", target.display()));
}
|
|
125
|
+
|
|
126
|
+
pub fn write_json(root: &std::path::Path, path: &str, value: &Value) {
|
|
127
|
+
write_fixture_file(
|
|
128
|
+
root,
|
|
129
|
+
path,
|
|
130
|
+
&format!("{}\n", serde_json::to_string_pretty(value).unwrap()),
|
|
131
|
+
);
|
|
132
|
+
}
|
|
133
|
+
|
|
134
|
+
pub fn write_verification_checks(root: &std::path::Path, checks: Value) {
|
|
135
|
+
write_json(
|
|
136
|
+
root,
|
|
137
|
+
".naome/verification.json",
|
|
138
|
+
&json!({
|
|
139
|
+
"schema": "naome.verification.v1",
|
|
140
|
+
"version": 1,
|
|
141
|
+
"status": "ready",
|
|
142
|
+
"checks": checks
|
|
143
|
+
}),
|
|
144
|
+
);
|
|
145
|
+
}
|
|
146
|
+
|
|
147
|
+
pub fn run_json<const N: usize>(root: &std::path::Path, args: [&str; N]) -> Value {
|
|
148
|
+
let output = Command::new(env!("CARGO_BIN_EXE_naome"))
|
|
149
|
+
.args(args)
|
|
150
|
+
.current_dir(root)
|
|
151
|
+
.output()
|
|
152
|
+
.unwrap();
|
|
153
|
+
assert!(
|
|
154
|
+
output.status.success(),
|
|
155
|
+
"{}{}",
|
|
156
|
+
String::from_utf8_lossy(&output.stdout),
|
|
157
|
+
String::from_utf8_lossy(&output.stderr)
|
|
158
|
+
);
|
|
159
|
+
serde_json::from_slice(&output.stdout).unwrap()
|
|
160
|
+
}
|
|
161
|
+
|
|
162
|
+
fn verification() -> Value {
|
|
163
|
+
json!({
|
|
164
|
+
"schema": "naome.verification.v1",
|
|
165
|
+
"version": 1,
|
|
166
|
+
"status": "ready",
|
|
167
|
+
"checks": [{
|
|
168
|
+
"id": "diff-check",
|
|
169
|
+
"command": "git diff --check",
|
|
170
|
+
"cwd": ".",
|
|
171
|
+
"purpose": "Detect whitespace and patch formatting issues.",
|
|
172
|
+
"cost": "fast",
|
|
173
|
+
"source": "git",
|
|
174
|
+
"evidence": ["README.md"],
|
|
175
|
+
"lastVerified": null
|
|
176
|
+
}]
|
|
177
|
+
})
|
|
178
|
+
}
|