agentflight 0.6.0 → 0.7.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (119)
  1. package/CHANGELOG.md +284 -2
  2. package/README.md +86 -34
  3. package/dist/adapters/agentloopkit.d.ts +2 -1
  4. package/dist/adapters/agentloopkit.d.ts.map +1 -1
  5. package/dist/adapters/agentloopkit.js +53 -58
  6. package/dist/adapters/agentloopkit.js.map +1 -1
  7. package/dist/adapters/projscan.d.ts +1 -0
  8. package/dist/adapters/projscan.d.ts.map +1 -1
  9. package/dist/adapters/projscan.js +36 -44
  10. package/dist/adapters/projscan.js.map +1 -1
  11. package/dist/adapters/tool-runner.d.ts +16 -0
  12. package/dist/adapters/tool-runner.d.ts.map +1 -0
  13. package/dist/adapters/tool-runner.js +43 -0
  14. package/dist/adapters/tool-runner.js.map +1 -0
  15. package/dist/cli.d.ts.map +1 -1
  16. package/dist/cli.js +24 -2
  17. package/dist/cli.js.map +1 -1
  18. package/dist/commands/doctor.d.ts.map +1 -1
  19. package/dist/commands/doctor.js +26 -2
  20. package/dist/commands/doctor.js.map +1 -1
  21. package/dist/commands/handoff.d.ts +17 -0
  22. package/dist/commands/handoff.d.ts.map +1 -0
  23. package/dist/commands/handoff.js +286 -0
  24. package/dist/commands/handoff.js.map +1 -0
  25. package/dist/commands/history.d.ts +11 -0
  26. package/dist/commands/history.d.ts.map +1 -0
  27. package/dist/commands/history.js +251 -0
  28. package/dist/commands/history.js.map +1 -0
  29. package/dist/commands/init.d.ts +5 -0
  30. package/dist/commands/init.d.ts.map +1 -1
  31. package/dist/commands/init.js +28 -10
  32. package/dist/commands/init.js.map +1 -1
  33. package/dist/commands/replay.d.ts.map +1 -1
  34. package/dist/commands/replay.js +23 -16
  35. package/dist/commands/replay.js.map +1 -1
  36. package/dist/commands/report.d.ts.map +1 -1
  37. package/dist/commands/report.js +22 -16
  38. package/dist/commands/report.js.map +1 -1
  39. package/dist/commands/resume.d.ts +1 -0
  40. package/dist/commands/resume.d.ts.map +1 -1
  41. package/dist/commands/resume.js +24 -14
  42. package/dist/commands/resume.js.map +1 -1
  43. package/dist/commands/start.d.ts +12 -0
  44. package/dist/commands/start.d.ts.map +1 -1
  45. package/dist/commands/start.js +53 -33
  46. package/dist/commands/start.js.map +1 -1
  47. package/dist/commands/status.d.ts.map +1 -1
  48. package/dist/commands/status.js +74 -9
  49. package/dist/commands/status.js.map +1 -1
  50. package/dist/commands/verify.d.ts.map +1 -1
  51. package/dist/commands/verify.js +22 -9
  52. package/dist/commands/verify.js.map +1 -1
  53. package/dist/core/artifacts.d.ts +11 -0
  54. package/dist/core/artifacts.d.ts.map +1 -0
  55. package/dist/core/artifacts.js +39 -0
  56. package/dist/core/artifacts.js.map +1 -0
  57. package/dist/core/config.d.ts +2 -0
  58. package/dist/core/config.d.ts.map +1 -1
  59. package/dist/core/config.js +16 -14
  60. package/dist/core/config.js.map +1 -1
  61. package/dist/core/doctor.d.ts +4 -0
  62. package/dist/core/doctor.d.ts.map +1 -1
  63. package/dist/core/doctor.js +37 -2
  64. package/dist/core/doctor.js.map +1 -1
  65. package/dist/core/fs-safe.d.ts +6 -0
  66. package/dist/core/fs-safe.d.ts.map +1 -1
  67. package/dist/core/fs-safe.js +50 -4
  68. package/dist/core/fs-safe.js.map +1 -1
  69. package/dist/core/git.d.ts.map +1 -1
  70. package/dist/core/git.js +7 -1
  71. package/dist/core/git.js.map +1 -1
  72. package/dist/core/output.d.ts +14 -0
  73. package/dist/core/output.d.ts.map +1 -1
  74. package/dist/core/output.js +72 -4
  75. package/dist/core/output.js.map +1 -1
  76. package/dist/core/paths.d.ts +1 -0
  77. package/dist/core/paths.d.ts.map +1 -1
  78. package/dist/core/paths.js +9 -1
  79. package/dist/core/paths.js.map +1 -1
  80. package/dist/core/review-intelligence.d.ts.map +1 -1
  81. package/dist/core/review-intelligence.js +182 -104
  82. package/dist/core/review-intelligence.js.map +1 -1
  83. package/dist/core/risk.d.ts.map +1 -1
  84. package/dist/core/risk.js +9 -4
  85. package/dist/core/risk.js.map +1 -1
  86. package/dist/core/session.d.ts +47 -1
  87. package/dist/core/session.d.ts.map +1 -1
  88. package/dist/core/session.js +203 -10
  89. package/dist/core/session.js.map +1 -1
  90. package/dist/core/verification-runs.d.ts +6 -0
  91. package/dist/core/verification-runs.d.ts.map +1 -0
  92. package/dist/core/verification-runs.js +104 -0
  93. package/dist/core/verification-runs.js.map +1 -0
  94. package/dist/core/verification.d.ts +4 -3
  95. package/dist/core/verification.d.ts.map +1 -1
  96. package/dist/core/verification.js +33 -66
  97. package/dist/core/verification.js.map +1 -1
  98. package/dist/renderers/html-replay.d.ts +2 -0
  99. package/dist/renderers/html-replay.d.ts.map +1 -1
  100. package/dist/renderers/html-replay.js +169 -9
  101. package/dist/renderers/html-replay.js.map +1 -1
  102. package/dist/renderers/markdown-report.d.ts +2 -0
  103. package/dist/renderers/markdown-report.d.ts.map +1 -1
  104. package/dist/renderers/markdown-report.js +20 -6
  105. package/dist/renderers/markdown-report.js.map +1 -1
  106. package/dist/renderers/resume-prompt.d.ts +2 -0
  107. package/dist/renderers/resume-prompt.d.ts.map +1 -1
  108. package/dist/renderers/resume-prompt.js +47 -10
  109. package/dist/renderers/resume-prompt.js.map +1 -1
  110. package/dist/types/index.d.ts +3 -3
  111. package/dist/types/index.d.ts.map +1 -1
  112. package/docs/assets/agentflight-cli-demo.svg +3 -3
  113. package/docs/assets/agentflight-terminal-demo.gif +0 -0
  114. package/docs/development/changed-file-filters.md +19 -7
  115. package/docs/development/dogfooding.md +1 -1
  116. package/docs/examples/basic-agentflight-session.md +21 -10
  117. package/docs/roadmap/index.md +11 -3
  118. package/docs/roadmap/v0.4.0-review-intelligence-plan.md +1 -1
  119. package/package.json +3 -3
package/CHANGELOG.md CHANGED
@@ -2,6 +2,275 @@
2
2
 
3
3
  All notable AgentFlight changes are documented here.
4
4
 
5
+ ## [0.7.1] - 2026-06-21
6
+
7
+ ### Fixed
8
+
9
+ - Refreshed the README terminal hero GIF so it shows the current
10
+ handoff-first review flow instead of the older replay-first flow.
11
+ - Updated the README hero caption and sample output to include `handoff` and
12
+ `history` accurately.
13
+
14
+ ### Changed
15
+
16
+ - Tightened README workflow copy around the local handoff packet, recent local
17
+ session history, and current failure-excerpt surfaces.
18
+
19
+ ## [0.7.0] - 2026-06-21
20
+
21
+ ### Added
22
+
23
+ - Added `agentflight handoff`, a local-only review handoff command that generates the report, replay, and resume artifacts and summarizes readiness, proof gaps, review focus, and failed verification excerpts.
24
+ - Added `agentflight history`, a read-only local command for listing recent
25
+ sessions, proof counts, the current-session marker, and existing report/replay
26
+ artifact paths without search indexing, export, sync, or session switching.
27
+ - Added local `agentflight history --task <text>` and
28
+ `agentflight history --state ready|blocked|needs_verification|unknown|current`
29
+ filters so engineers can find relevant local sessions without scanning long
30
+ histories or adding any index, sync, export, or session switching behavior.
31
+ - Added a compact Review Path section to local HTML replay artifacts so long
32
+ sessions lead reviewers through proof gaps, unresolved failed runs, review
33
+ focus, and verification evidence without adding scripts, exports, or hosted
34
+ behavior.
35
+ - Documented the `agentflight history --limit 1` latest-action workflow for
36
+ reopening local handoff/report/replay/resume artifacts.
37
+ - Added session-specific handoff artifacts under `.agentflight/reports/` so
38
+ `agentflight history` can point to stable handoff packets from prior sessions.
39
+ - Added session-specific resume artifacts under `.agentflight/reports/` so
40
+ `agentflight history` can point to stable continuation prompts from prior
41
+ sessions.
42
+ - Added post-v0.6.0 user-research findings and a v0.6.0 website update prompt focused on the local handoff workflow.
43
+ - Added a post-v0.6.0 product direction note that keeps local handoff, first-run
44
+ workspace hygiene, replay ergonomics, proof guidance, and explainable ranking
45
+ as the priority order.
46
+
47
+ ### Fixed
48
+
49
+ - Ready `agentflight status` output now points at an existing local handoff,
50
+ replay, or report artifact when one already exists, instead of repeating
51
+ handoff-generation guidance.
52
+ - Ready `agentflight resume` prompts now point at an existing local handoff,
53
+ replay, or report artifact when one already exists, instead of repeating
54
+ handoff-generation guidance.
55
+ - Review Intelligence now ignores unfinished AgentFlight readout/artifact
56
+ commands such as `agentflight replay` and `node dist/cli.js replay` when
57
+ computing incomplete proof gaps, so readiness guidance keeps pointing at
58
+ meaningful verification commands.
59
+ - Incomplete verification guidance now says a command may still be running and
60
+ suggests waiting before rerunning, avoiding false lost-evidence alarms when
61
+ status is checked during parallel verification.
62
+ - Ready `agentflight handoff` terminal guidance now tells reviewers to share
63
+ the local handoff packet first, with report/replay as supporting detail
64
+ artifacts.
65
+ - Current start-only `agentflight history` sessions now guide users to run
66
+ verification before handoff when no proof exists yet, while keeping
67
+ handoff-only guidance once verification has been recorded.
68
+ - Public positioning regression coverage now guards current public/runtime
69
+ surfaces against stale assistant-style positioning.
70
+ - Clean-worktree status now tells users to open handoff/report/replay or JSON
71
+ output for tucked verification details, matching the handoff-first ready
72
+ review path.
73
+ - Ready-session `Open first` guidance now prefers the generated handoff packet
74
+ in handoff, clean status/resume, and history surfaces, while blocked sessions
75
+ still point to the report/fix path.
76
+ - Full Markdown proof reports now show changed files, risk, verification,
77
+ review focus, proof gaps, readiness, recommendation, and next action before
78
+ the timeline, keeping long sessions faster to review.
79
+ - `agentflight history` now compacts non-current start-only sessions that have
80
+ no proof or review artifacts, keeping recent local artifacts easier to scan.
81
+ - Review Intelligence now keeps generated `.agentflight/.gitignore` helper files
82
+ below real first-run review targets while leaving them visible.
83
+ - `agentflight resume` now includes unresolved and historical failed-run context
84
+ below the verification count, matching status/report trust cues.
85
+ - Clean-worktree `agentflight resume` prompts now include the latest local
86
+ `Open first:` artifact path when current report/replay/handoff evidence
87
+ exists.
88
+ - Clean-worktree `agentflight status` now shows the latest local `Open first:`
89
+ artifact path when current report/replay/handoff evidence exists.
90
+ - `agentflight history` now shows the nearest previous local artifact when the
91
+ current latest session has none yet, while keeping the current-session
92
+ handoff next action.
93
+ - First-run AgentFlight generated-file lists and local-file guidance now use
94
+ shared output helpers, keeping `init` and `start --yes` copy consistent.
95
+ - `agentflight start --yes` now explains the AgentFlight files it generated
96
+ during safe auto-init, including project config and local runtime evidence.
97
+ - `agentflight init` and `agentflight start` now use concise ProjScan version
98
+ checks instead of extra help probing, while `agentflight doctor` keeps deeper
99
+ diagnostics.
100
+ - `agentflight doctor` now renders multiple detected proof-command suggestions
101
+ as an indented list instead of one long semicolon-separated line.
102
+ - `agentflight history` now prefers useful review-ready or blocked artifact
103
+ metadata over later clean-worktree artifact metadata, while preserving
104
+ clean-only session history.
105
+ - Clean-worktree `agentflight handoff` now preserves existing session review
106
+ artifacts instead of overwriting report/replay/resume evidence with an empty
107
+ post-commit clean-state artifact.
108
+ - Clean-worktree `agentflight handoff` now exits successfully instead of
109
+ treating an informational post-commit handoff as a command failure.
110
+ - `agentflight doctor` now suggests concrete detected `agentflight verify -- ...`
111
+ commands when config verification commands are empty.
112
+ - `agentflight verify` now suggests detected package proof commands when no
113
+ explicit command is provided and config commands are empty.
114
+ - `agentflight doctor` now warns when package proof scripts exist but
115
+ `.agentflight/config.json` has no configured verification commands.
116
+ - `agentflight history` now lists capped repo-relative malformed session paths
117
+ instead of only reporting a skipped-file count.
118
+ - Concurrent `agentflight verify` runs now reserve distinct stdout/stderr
119
+ evidence paths and merge verification updates without dropping either run.
120
+ - `agentflight history --limit` now rejects non-integer, zero, and negative
121
+ values with a clear local error instead of silently falling back or returning
122
+ an empty history.
123
+ - Review Intelligence now treats an earlier failed verification as resolved when
124
+ the same stored command later passes, so TDD red/green and format-fix loops do
125
+ not leave handoffs permanently blocked.
126
+ - Status, report, replay, and handoff now distinguish unresolved failed
127
+ verification from historical failed runs that later passed.
128
+ - Resume prompts now use the same unresolved-versus-resolved verification count
129
+ wording as the other review surfaces.
130
+ - Clean-worktree status now points users to `agentflight history --limit 1` to
131
+ reopen the latest local artifacts before starting the next session.
132
+ - History now shows unresolved-versus-resolved failed verification counts for
133
+ prior sessions.
134
+ - History now includes stable handoff artifact paths alongside report and
135
+ replay paths when those artifacts exist.
136
+ - History now includes stable resume artifact paths when those artifacts exist.
137
+ - History now suggests which existing local artifact to open first for each
138
+ session.
139
+ - History now surfaces the newest session's open-first action before the full
140
+ session list, reducing scan work in long local histories.
141
+ - History now tells users to run `agentflight handoff` when the latest local
142
+ session is current but no handoff/report/replay artifact exists yet.
143
+ - History now shows the latest session's recorded readiness in the top-level
144
+ `Latest action:` block.
145
+ - History now says `Open first: none yet` when no handoff, report, or replay
146
+ artifact exists.
147
+ - HTML replay now reserves urgent failed-run navigation for unresolved failed
148
+ verification while keeping historical failed runs visible in the ledger.
149
+ - Ready handoffs no longer inline historical failed verification excerpts once
150
+ no unresolved failed-verification proof gap remains; those excerpts stay in
151
+ report/replay evidence.
152
+ - `agentflight start` now treats AgentLoopKit's `Active task: none pinned.`
153
+ status as no active task instead of falsely reporting task reuse.
154
+ - AgentLoopKit task-link diagnostics now use generic link-check wording instead
155
+ of stale automatic task-creation copy.
156
+ - `agentflight init` now reports ProjScan and AgentLoopKit CLI availability
157
+ using the same concise tool formatter as start/report surfaces instead of
158
+ relying on repo marker files.
159
+ - `agentflight status` now reports a clean worktree explicitly instead of
160
+ calling zero changed files `Unknown` after a completed session has been
161
+ committed.
162
+ - `agentflight status` now compacts very long terminal verification run lists
163
+ while keeping full verification runs in JSON, report/replay, and local
164
+ evidence files.
165
+ - Clean-worktree `agentflight status` now tucks individual verification run
166
+ details when there are no unresolved failed runs, while keeping counts and
167
+ JSON evidence complete.
168
+ - Review Intelligence now treats incomplete verification attempts as blocking
169
+ before clean-worktree readiness, so live status cannot call a session clean
170
+ while verification is still in progress.
171
+ - `agentflight init` now lists created and skipped files by repo-relative path
172
+ instead of only showing counts.
173
+ - `agentflight doctor` now warns when `.projscan-memory/memory.json` exists
174
+ without a matching project filter and reports OK once the repo filters it
175
+ through `changedFileFilters.ignore`.
176
+ - `agentflight history` now labels stored review metadata as
177
+ `Recorded readiness:` so it is not confused with live worktree readiness.
178
+ - `agentflight doctor` no longer prints the absolute repository root in the
179
+ successful repository-root check.
180
+ - HTML replay now labels resolved failed verification rows as historical when
181
+ no unresolved failed runs remain.
182
+ - `agentflight doctor` now treats a missing current session as OK first-run
183
+ guidance instead of warning when the rest of the local setup is healthy.
184
+ - Clean-worktree status now reports `Risk: none` instead of `Risk: unknown`
185
+ while preserving `unknown` for legacy or genuinely missing metadata.
186
+ - Clean-worktree risk reasons now use current-state wording instead of saying
187
+ no changed files were detected "yet."
188
+ - Parallel report, replay, and resume commands now preserve each artifact event
189
+ in session history instead of letting the last stale session write win.
190
+ - Review Intelligence no longer lets ProjScan risk hints boost generated
191
+ `.projscan-memory/memory.json` above real first-run review targets, while the
192
+ file remains visible with the existing `changedFileFilters.ignore` guidance.
193
+ - `agentflight history` now includes the selected local artifact path directly
194
+ on the `Open first:` line, reducing lookup work in long session lists.
195
+ - `agentflight handoff` now includes the selected report or replay path directly
196
+ on the `Open first:` line while preserving the full artifact list.
197
+
198
+ ### Changed
199
+
200
+ - Clean-worktree `agentflight resume` constraints now tell agents to start a new
201
+ AgentFlight session before unrelated work instead of applying active-task
202
+ constraints to a completed clean session.
203
+ - `agentflight start` now prefers configured no-arg `agentflight verify`
204
+ guidance when `.agentflight/config.json` already has verification commands,
205
+ while keeping detected package-script fallback guidance for empty configs.
206
+ - Current product copy now uses `coding agent sessions` and agentic engineering
207
+ language instead of assistant-style positioning.
208
+ - Idempotent `agentflight init` now shows a concrete detected proof command
209
+ when existing config verification commands are empty.
210
+ - First-run `agentflight init` now points seeded configs at no-arg
211
+ `agentflight verify` in the primary workflow.
212
+ - `agentflight init` now points first-run users through the handoff golden path:
213
+ start a session, capture verification, then generate a local handoff, with
214
+ status and doctor listed as supporting checks.
215
+ - `agentflight init` now uses the first detected verification command in its
216
+ primary workflow guidance, falling back to `<proof command>` when no proof
217
+ script is detected.
218
+ - Newly generated `.agentflight/config.json` files now seed detected
219
+ verification commands from package scripts while leaving profiles empty and
220
+ preserving existing configs.
221
+ - README and verification docs now describe the handoff-first first-run workflow
222
+ and init-seeded verification commands.
223
+ - Kept ready-review report, replay, resume, examples, and demo copy aligned with
224
+ the `agentflight handoff` golden path while keeping report/replay/resume as
225
+ supporting local artifacts.
226
+ - Changed-file review surfaces now fail with an actionable git-status error
227
+ instead of treating git-status failures as an empty diff.
228
+ - Shortened the optional ProjScan baseline budget during `agentflight start` so
229
+ busy local ProjScan work cannot stall session startup for too long.
230
+ - `agentflight start` now reuses an active AgentLoopKit task instead of creating
231
+ a duplicate AgentFlight placeholder task.
232
+ - `agentflight start` now shows concise ProjScan and AgentLoopKit warning
233
+ summaries when optional tooling is available but degraded.
234
+ - `agentflight start` now inspects ProjScan availability without running the
235
+ heavier optional `projscan start` baseline on the startup path.
236
+ - `agentflight start` now uses lightweight AgentLoopKit availability inspection
237
+ on the startup path while preserving task reuse/linking.
238
+ - `agentflight start` now reuses AgentLoopKit's local active-task state file
239
+ directly instead of parsing `agentloopkit status` output.
240
+ - `agentflight start` now links existing AgentLoopKit task state without
241
+ creating new AgentLoopKit task contracts automatically.
242
+ - Start output and Markdown tooling rows now show whether AgentLoopKit has an
243
+ active task linked when that local state is known.
244
+ - `agentflight handoff` now treats missing required proof as not ready to share:
245
+ it exits non-zero, uses `Fix before sharing`, and points users to the report
246
+ first.
247
+ - Start, report, replay, and handoff terminal output now display local
248
+ `.agentflight/...` artifact paths relative to the repo instead of absolute
249
+ user-directory paths.
250
+ - Handoff verification details now distinguish zero verification runs from
251
+ passing runs that simply have no failed excerpts.
252
+ - Review Intelligence suggested proof now follows each proof gap's preferred
253
+ proof-kind order, so source gaps prefer `npm test` when available and
254
+ dependency gaps prefer build/install-style proof before typecheck.
255
+ - Review Intelligence proof-gap rules are now centralized in one ordered table
256
+ to keep future proof guidance changes easier to review.
257
+ - HTML replay verification ledgers now display long run commands compactly while
258
+ keeping the full command available in the title text.
259
+ - Status and Markdown report verification evidence rows now use compact display
260
+ labels for long run commands while preserving stored command evidence.
261
+ - `agentflight init` now writes `.agentflight/.gitignore` for runtime evidence
262
+ directories instead of seeding new runtime `.gitkeep` files, reducing
263
+ first-run Git noise while keeping `.agentflight/config.json` and the local
264
+ AgentFlight ignore file visible as project config.
265
+ - AgentFlight session JSON writes now use same-directory temp files and atomic
266
+ rename so concurrent report, replay, resume, and handoff commands do not read
267
+ partially written session state.
268
+ - Review Intelligence now describes `.projscan-memory/memory.json` as generated
269
+ tool state instead of arbitrary unknown code while keeping the file visible.
270
+ - Report and replay generation now persist a compact local readiness summary in
271
+ session events, letting `agentflight history` show the latest recorded
272
+ readiness without recalculating old sessions.
273
+
5
274
  ## AgentFlight v0.6.0 - 2026-06-19
6
275
 
7
276
  Local review ergonomics and automation surfaces for heavier real-world dogfood.
@@ -19,7 +288,20 @@ Local review ergonomics and automation surfaces for heavier real-world dogfood.
19
288
 
20
289
  ### Changed
21
290
 
22
- - AgentFlight now describes itself as a local-first review layer for AI coding sessions across package metadata, README, and product docs.
291
+ - Clarified first-run workspace hygiene docs: `.projscan-memory/**` can be added
292
+ to `changedFileFilters.ignore` when ProjScan memory is generated evidence
293
+ rather than a review target.
294
+ - Lowered generated ProjScan memory priority in Review Intelligence so
295
+ `.projscan-memory/memory.json` remains visible but no longer outranks real
296
+ first-run review targets such as `.agentflight/config.json` or docs changes.
297
+ - Classified first-party TypeScript/JavaScript source files under `src/` as
298
+ source changes so review focus gives clearer guidance and proof gaps than the
299
+ previous unknown-file fallback.
300
+ - Aligned ready-review next actions with the handoff golden path: status,
301
+ report, replay, and resume now point users toward `agentflight handoff`, while
302
+ the handoff artifact itself tells users to share the generated local packet.
303
+
304
+ - AgentFlight now describes itself as a local-first review layer for coding agent sessions across package metadata, README, and product docs.
23
305
  - Long suggested proof commands stay compact in high-density review surfaces while preserving the full suggested action where useful.
24
306
  - Local AgentLoopKit evidence paths are filtered from AgentFlight changed-file review surfaces:
25
307
  - `.agentloop/state.json`
@@ -151,7 +433,7 @@ Review Intelligence trust patch focused on v0.4.0 dogfood findings.
151
433
 
152
434
  ### Added
153
435
 
154
- - Added deterministic Review Intelligence for AI coding sessions.
436
+ - Added deterministic Review Intelligence for coding agent sessions.
155
437
  - Added review focus ranking to highlight the files developers should inspect first.
156
438
  - Added proof gap detection for missing or failed verification evidence.
157
439
  - Added clearer readiness states and next-best-action guidance.
package/README.md CHANGED
@@ -8,21 +8,22 @@
8
8
 
9
9
  See what your coding agent did, what failed, and whether the work is ready for review.
10
10
 
11
- AgentFlight is a local-first review layer for AI coding sessions from Baseframe Labs. It records what your coding agent did, captures verification evidence, shows failure excerpts, and tells you what needs review before you trust the result.
11
+ AgentFlight is a local-first review layer for coding agent sessions from Baseframe Labs. It records what your coding agent did, captures verification evidence, shows failure excerpts, and tells you what needs review before you trust the result.
12
12
 
13
13
  Website: [baseframelabs.com/apps/agentflight](https://www.baseframelabs.com/apps/agentflight)
14
14
 
15
15
  AgentFlight helps you:
16
16
 
17
- - start an AI coding session
17
+ - start a coding agent session
18
18
  - capture verification evidence
19
19
  - see changed files and risk
20
20
  - create snapshots during the session
21
- - generate a proof report
22
- - generate a local replay timeline
21
+ - generate a local review handoff
22
+ - generate a proof report and local replay timeline
23
+ - find recent local sessions and their artifacts
23
24
  - create a resume prompt for the next agent or reviewer
24
25
 
25
- ![AgentFlight CLI workflow: start, verify, status, and replay](docs/assets/agentflight-terminal-demo.gif)
26
+ ![AgentFlight CLI workflow: init, start, verify, status, handoff, and history](docs/assets/agentflight-terminal-demo.gif)
26
27
 
27
28
  ## 60-Second Workflow
28
29
 
@@ -30,38 +31,40 @@ AgentFlight helps you:
30
31
  npx agentflight@latest init
31
32
  npx agentflight@latest start --task "Add password reset flow"
32
33
 
33
- # Run Codex, Claude Code, Cursor, or your coding agent normally
34
+ # Run your coding agent normally
34
35
 
35
- npx agentflight@latest verify -- npm test
36
+ npx agentflight@latest verify
36
37
  npx agentflight@latest snapshot --note "Initial implementation verified"
37
38
  npx agentflight@latest status
38
- npx agentflight@latest report
39
- npx agentflight@latest replay
40
- npx agentflight@latest resume
39
+ npx agentflight@latest handoff
40
+ npx agentflight@latest history --limit 1
41
41
  ```
42
42
 
43
43
  What you get:
44
44
 
45
- - `init` creates local `.agentflight/` project files.
45
+ - `init` creates local `.agentflight/` project files and seeds detected verification commands into `.agentflight/config.json` when package scripts exist.
46
46
  - `start` records the task, git branch, commit, dirty state, package manager, and tool availability.
47
- - `verify -- npm test` runs the command and stores stdout, stderr, exit code, timing, and pass/fail status.
48
- - `snapshot --note "..."` records the current git, risk, and proof state as a timeline event.
47
+ - `verify` runs configured commands and stores stdout, stderr, exit code, timing, and pass/fail status. Use `verify -- <command>` for one explicit proof command.
49
48
  - `status` answers what changed, how risky it is, what proof exists, what proof is missing, and what to do next.
49
+ - `snapshot --note "..."` records the current git, risk, and proof state as a timeline event.
50
+ - `handoff` generates the local review packet: readiness, proof gaps, failed excerpts, and report/replay/resume artifact paths.
50
51
  - `report` writes a Markdown proof report for review.
51
- - `replay` writes a local HTML timeline you can open in a browser.
52
- - `resume` writes a Codex/Claude-ready prompt for the next safe step.
52
+ - `replay` writes a local HTML review path and timeline you can open in a browser.
53
+ - `resume` writes a continuation prompt for the next safe step.
54
+ - `history` shows the latest action with recorded readiness, the artifact to open first, and recent local handoff/report/replay/resume paths without uploading, syncing, or switching sessions. Use `history --task <text>` or `history --state ready|blocked|needs_verification|unknown|current` to narrow existing local records.
53
55
 
54
56
  ## Watch The Flow
55
57
 
56
- AgentFlight turns a loose AI-agent session into a local proof trail:
58
+ AgentFlight turns a loose coding agent session into a local proof trail:
57
59
 
58
60
  1. Start a session before you ask the coding agent to work.
59
61
  2. Capture real verification output with `agentflight verify`.
60
62
  3. Snapshot meaningful checkpoints.
61
63
  4. Read `status` to see changed files, risk, proof, gaps, and next action.
62
- 5. Generate `report`, `replay`, and `resume` when the work is ready to review or hand off.
64
+ 5. Run `handoff` when the work is ready to review or when you need a clear fix-before-sharing summary.
65
+ 6. Use `history --limit 1` to reopen the latest local handoff, report, replay, or resume artifact.
63
66
 
64
- The replay artifact is a self-contained local HTML file. It leads with the review verdict, then lays out risk, review focus, proof gaps, the session timeline, and verification evidence (with inline failure excerpts, so you can see what broke without opening a log file) as a readable flight record:
67
+ The replay artifact is a self-contained local HTML file. It leads with the review verdict and a compact review path, then lays out risk, review focus, proof gaps, the session timeline, and verification evidence (with inline failure excerpts, so you can see what broke without opening a log file) as a readable flight record:
65
68
 
66
69
  ![AgentFlight replay: review verdict, risk, timeline, and verification evidence](docs/assets/agentflight-replay-scroll.gif)
67
70
 
@@ -69,7 +72,7 @@ A high-resolution still is also available at [`docs/assets/agentflight-replay-ti
69
72
 
70
73
  ## Why This Exists
71
74
 
72
- AI coding agents move fast. After a few prompts, you can lose track of:
75
+ Coding agents move fast. After a few prompts, you can lose track of:
73
76
 
74
77
  - what changed
75
78
  - whether the agent drifted from the task
@@ -94,30 +97,30 @@ Changed files:
94
97
  3
95
98
 
96
99
  Risk: medium
97
- - Dependency, backend, or unknown files changed.
100
+ - Application source files changed.
98
101
 
99
102
  Verification Evidence:
100
103
  1 passed, 0 failed
101
104
 
102
105
  Review first:
103
106
  1. src/auth/reset.ts
104
- Why: identity/session path; no passing test evidence
107
+ Why: identity/session path
105
108
  Focus: Check session, permission, and identity boundaries first.
106
109
  Suggested proof: npm test
107
110
 
108
111
  Proof gaps:
109
- - blocking: Sensitive auth, payment, or security files changed without passing test evidence.
112
+ - none
110
113
 
111
114
  Latest snapshot:
112
115
  - Note: Initial implementation verified
113
116
  - Risk: medium
114
117
  - Changed files: 3
115
118
 
116
- Readiness: Needs verification
117
- Reason: Sensitive auth, payment, or security files changed without passing test evidence.
119
+ Readiness: Ready for review
120
+ Reason: Verification evidence is present and no blocking proof gaps were detected.
118
121
 
119
122
  Next action:
120
- Run agentflight verify -- npm test
123
+ Run agentflight handoff to generate the local review packet.
121
124
  ```
122
125
 
123
126
  `agentflight report`:
@@ -127,7 +130,7 @@ Run agentflight verify -- npm test
127
130
 
128
131
  ## Review First
129
132
  1. src/auth/reset.ts
130
- - Why: identity/session path; no passing test evidence
133
+ - Why: identity/session path
131
134
 
132
135
  ## Verification Evidence
133
136
  - passed: npm test
@@ -135,7 +138,25 @@ Run agentflight verify -- npm test
135
138
  - stderr: .agentflight/evidence/.../verification-1.stderr.txt
136
139
 
137
140
  ## Review Readiness
138
- Needs verification
141
+ Ready for review
142
+ ```
143
+
144
+ `agentflight handoff`:
145
+
146
+ ```text
147
+ AgentFlight handoff
148
+
149
+ Task:
150
+ Add password reset flow
151
+
152
+ Readiness: Ready for review
153
+ Open first: handoff .agentflight/reports/af-...-handoff.md
154
+
155
+ Artifacts:
156
+ - Handoff: .agentflight/reports/af-...-handoff.md
157
+ - Report: .agentflight/reports/af-...-report.md
158
+ - Replay: .agentflight/reports/af-...-replay.html
159
+ - Resume: .agentflight/reports/af-...-resume.md
139
160
  ```
140
161
 
141
162
  `agentflight replay`:
@@ -145,7 +166,22 @@ Replay saved:
145
166
  .agentflight/reports/af-...-replay.html
146
167
 
147
168
  Timeline:
148
- session_started -> verification_passed -> snapshot_created -> replay_generated
169
+ session_started -> verification_passed -> snapshot_created -> report_generated -> replay_generated
170
+ ```
171
+
172
+ `agentflight history --limit 1`:
173
+
174
+ ```text
175
+ AgentFlight history
176
+
177
+ Latest action:
178
+ Open first: handoff .agentflight/reports/af-...-handoff.md
179
+ Recorded readiness: Ready for review
180
+
181
+ Recent sessions:
182
+ 1. Add password reset flow
183
+ Proof: 1 passed, 0 failed
184
+ Handoff: .agentflight/reports/af-...-handoff.md
149
185
  ```
150
186
 
151
187
  `agentflight resume`:
@@ -181,12 +217,14 @@ The current AgentFlight release supports:
181
217
  - config-defined verification profiles for repeated local command groups
182
218
  - configurable generated/internal changed-file filters
183
219
  - verification evidence capture with `agentflight verify`
184
- - inline failure excerpts in the replay and report, so failures are visible without opening evidence files
220
+ - inline failure excerpts in terminal output, handoffs, reports, and replays, so failures are visible without opening evidence files
185
221
  - session events
186
222
  - snapshots with `agentflight snapshot --note "..."`
187
223
  - Markdown proof reports
188
- - self-contained HTML replay timelines
189
- - resume prompts for Codex, Claude Code, or a human reviewer
224
+ - self-contained HTML replays with review-path guidance and timelines
225
+ - local review handoffs that point to the report, replay, and resume artifacts
226
+ - local history filters for finding sessions by task text or recorded readiness
227
+ - resume prompts for the next agent or reviewer
190
228
  - doctor checks for local setup
191
229
  - defensive ProjScan and AgentLoopKit adapters
192
230
  - no telemetry, cloud sync, or source upload
@@ -213,10 +251,13 @@ AgentFlight creates a local `.agentflight/` directory in your repo:
213
251
  - `current/` stores the active session, handoff, and resume prompt.
214
252
  - `reports/` stores Markdown proof reports and HTML replays.
215
253
  - `evidence/` stores stdout and stderr from captured verification runs.
254
+ - `.gitignore` keeps those runtime directories out of git while leaving
255
+ `config.json` visible.
216
256
 
217
257
  Sessions store an `events` timeline with meaningful moments such as session start, verification attempts, snapshots, and generated artifacts. Reports include filenames and summaries by default, not full source diffs.
218
258
 
219
- Runtime session data is ignored by git by default in this repo:
259
+ Runtime session data is ignored by the `.agentflight/.gitignore` created by
260
+ `agentflight init`:
220
261
 
221
262
  - `.agentflight/sessions/`
222
263
  - `.agentflight/reports/`
@@ -235,11 +276,18 @@ AgentFlight always excludes its own runtime session/report/current/evidence file
235
276
  }
236
277
  ```
237
278
 
279
+ On a first run, ProjScan fallback state may create `.projscan-memory/memory.json`
280
+ and AgentFlight may surface it in status, report, replay, or handoff output. If
281
+ that memory file is generated evidence rather than something reviewers should
282
+ inspect, add `.projscan-memory/**` to `changedFileFilters.ignore`. AgentFlight
283
+ does not ignore it by default, because some teams may want generated tool state
284
+ to stay visible.
285
+
238
286
  See [docs/development/changed-file-filters.md](docs/development/changed-file-filters.md).
239
287
 
240
288
  ## Commands
241
289
 
242
- - `agentflight init` initializes `.agentflight/` with safe writes and explains which local files are project config versus runtime evidence.
290
+ - `agentflight init` initializes `.agentflight/` with safe writes, seeds detected verification commands into config when package scripts exist, and explains which local files are project config versus runtime evidence.
243
291
  - `agentflight start --task "..."` starts a session and writes the current handoff.
244
292
  - `agentflight status` summarizes changed files, risk, verification status, review focus, proof gaps, readiness, snapshots, and next action.
245
293
  - `agentflight status --format json` prints the same local status data as structured JSON for scripts.
@@ -252,6 +300,10 @@ See [docs/development/changed-file-filters.md](docs/development/changed-file-fil
252
300
  - `agentflight report --mode pr-comment` writes a local PR-comment draft without posting anywhere.
253
301
  - `agentflight replay` generates a local self-contained HTML replay with review focus and proof gaps.
254
302
  - `agentflight resume` prints and saves a continuation prompt with the next safest action.
303
+ - `agentflight handoff` generates a local review handoff, report, replay, and resume prompt without posting anywhere. It exits non-zero when verification failures or missing proof make the work not ready to share.
304
+ - `agentflight history` shows the latest action first, including recorded readiness, open-first artifact guidance, current-session marker, proof counts, and existing local handoff/report/replay/resume paths.
305
+ - `agentflight history --task <text>` narrows existing local sessions by task title before applying `--limit`.
306
+ - `agentflight history --state ready|blocked|needs_verification|unknown|current` narrows existing local sessions by recorded readiness or the current-session marker before applying `--limit`.
255
307
  - `agentflight doctor` checks local setup, scripts, tools, config, and current session state.
256
308
 
257
309
  Future placeholders exist for `upgrade`, `license`, and `login`; AgentFlight Pro/Team is not available yet.
@@ -273,7 +325,7 @@ Strategic architecture:
273
325
 
274
326
  ## Example Session
275
327
 
276
- Read [docs/examples/basic-agentflight-session.md](docs/examples/basic-agentflight-session.md) for a short password-reset walkthrough with status, report, replay, and resume artifacts.
328
+ Read [docs/examples/basic-agentflight-session.md](docs/examples/basic-agentflight-session.md) for a short password-reset walkthrough with status, handoff, report, replay, and resume artifacts.
277
329
 
278
330
  ## Roadmap
279
331
 
@@ -4,7 +4,8 @@ export interface InspectAgentLoopKitOptions {
4
4
  cwd?: string;
5
5
  run?: CommandRunner;
6
6
  command?: string;
7
+ includeDoctor?: boolean;
7
8
  }
8
9
  export declare function inspectAgentLoopKit(options?: InspectAgentLoopKitOptions): Promise<ToolAdapterResult>;
9
- export declare function createAgentLoopTask(cwd: string, title: string, run?: CommandRunner): Promise<ToolAdapterResult>;
10
+ export declare function linkAgentLoopTask(cwd: string): Promise<ToolAdapterResult>;
10
11
  //# sourceMappingURL=agentloopkit.d.ts.map
@@ -1 +1 @@
1
- {"version":3,"file":"agentloopkit.d.ts","sourceRoot":"","sources":["../../src/adapters/agentloopkit.ts"],"names":[],"mappings":"AACA,OAAO,KAAK,EAAE,aAAa,EAAE,MAAM,oBAAoB,CAAC;AAExD,OAAO,KAAK,EAAE,iBAAiB,EAAE,MAAM,mBAAmB,CAAC;AAE3D,MAAM,WAAW,0BAA0B;IACzC,GAAG,CAAC,EAAE,MAAM,CAAC;IACb,GAAG,CAAC,EAAE,aAAa,CAAC;IACpB,OAAO,CAAC,EAAE,MAAM,CAAC;CAClB;AAED,wBAAsB,mBAAmB,CACvC,OAAO,GAAE,0BAA+B,GACvC,OAAO,CAAC,iBAAiB,CAAC,CAsC5B;AAED,wBAAsB,mBAAmB,CACvC,GAAG,EAAE,MAAM,EACX,KAAK,EAAE,MAAM,EACb,GAAG,GAAE,aAA0B,GAC9B,OAAO,CAAC,iBAAiB,CAAC,CAoC5B"}
1
+ {"version":3,"file":"agentloopkit.d.ts","sourceRoot":"","sources":["../../src/adapters/agentloopkit.ts"],"names":[],"mappings":"AAEA,OAAO,KAAK,EAAE,aAAa,EAAE,MAAM,oBAAoB,CAAC;AAExD,OAAO,KAAK,EAAE,iBAAiB,EAAE,MAAM,mBAAmB,CAAC;AAG3D,MAAM,WAAW,0BAA0B;IACzC,GAAG,CAAC,EAAE,MAAM,CAAC;IACb,GAAG,CAAC,EAAE,aAAa,CAAC;IACpB,OAAO,CAAC,EAAE,MAAM,CAAC;IACjB,aAAa,CAAC,EAAE,OAAO,CAAC;CACzB;AAED,wBAAsB,mBAAmB,CACvC,OAAO,GAAE,0BAA+B,GACvC,OAAO,CAAC,iBAAiB,CAAC,CA+C5B;AAED,wBAAsB,iBAAiB,CAAC,GAAG,EAAE,MAAM,GAAG,OAAO,CAAC,iBAAiB,CAAC,CAU/E"}