agentflight 0.6.0 → 0.7.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +284 -2
- package/README.md +86 -34
- package/dist/adapters/agentloopkit.d.ts +2 -1
- package/dist/adapters/agentloopkit.d.ts.map +1 -1
- package/dist/adapters/agentloopkit.js +53 -58
- package/dist/adapters/agentloopkit.js.map +1 -1
- package/dist/adapters/projscan.d.ts +1 -0
- package/dist/adapters/projscan.d.ts.map +1 -1
- package/dist/adapters/projscan.js +36 -44
- package/dist/adapters/projscan.js.map +1 -1
- package/dist/adapters/tool-runner.d.ts +16 -0
- package/dist/adapters/tool-runner.d.ts.map +1 -0
- package/dist/adapters/tool-runner.js +43 -0
- package/dist/adapters/tool-runner.js.map +1 -0
- package/dist/cli.d.ts.map +1 -1
- package/dist/cli.js +24 -2
- package/dist/cli.js.map +1 -1
- package/dist/commands/doctor.d.ts.map +1 -1
- package/dist/commands/doctor.js +26 -2
- package/dist/commands/doctor.js.map +1 -1
- package/dist/commands/handoff.d.ts +17 -0
- package/dist/commands/handoff.d.ts.map +1 -0
- package/dist/commands/handoff.js +286 -0
- package/dist/commands/handoff.js.map +1 -0
- package/dist/commands/history.d.ts +11 -0
- package/dist/commands/history.d.ts.map +1 -0
- package/dist/commands/history.js +251 -0
- package/dist/commands/history.js.map +1 -0
- package/dist/commands/init.d.ts +5 -0
- package/dist/commands/init.d.ts.map +1 -1
- package/dist/commands/init.js +28 -10
- package/dist/commands/init.js.map +1 -1
- package/dist/commands/replay.d.ts.map +1 -1
- package/dist/commands/replay.js +23 -16
- package/dist/commands/replay.js.map +1 -1
- package/dist/commands/report.d.ts.map +1 -1
- package/dist/commands/report.js +22 -16
- package/dist/commands/report.js.map +1 -1
- package/dist/commands/resume.d.ts +1 -0
- package/dist/commands/resume.d.ts.map +1 -1
- package/dist/commands/resume.js +24 -14
- package/dist/commands/resume.js.map +1 -1
- package/dist/commands/start.d.ts +12 -0
- package/dist/commands/start.d.ts.map +1 -1
- package/dist/commands/start.js +53 -33
- package/dist/commands/start.js.map +1 -1
- package/dist/commands/status.d.ts.map +1 -1
- package/dist/commands/status.js +74 -9
- package/dist/commands/status.js.map +1 -1
- package/dist/commands/verify.d.ts.map +1 -1
- package/dist/commands/verify.js +22 -9
- package/dist/commands/verify.js.map +1 -1
- package/dist/core/artifacts.d.ts +11 -0
- package/dist/core/artifacts.d.ts.map +1 -0
- package/dist/core/artifacts.js +39 -0
- package/dist/core/artifacts.js.map +1 -0
- package/dist/core/config.d.ts +2 -0
- package/dist/core/config.d.ts.map +1 -1
- package/dist/core/config.js +16 -14
- package/dist/core/config.js.map +1 -1
- package/dist/core/doctor.d.ts +4 -0
- package/dist/core/doctor.d.ts.map +1 -1
- package/dist/core/doctor.js +37 -2
- package/dist/core/doctor.js.map +1 -1
- package/dist/core/fs-safe.d.ts +6 -0
- package/dist/core/fs-safe.d.ts.map +1 -1
- package/dist/core/fs-safe.js +50 -4
- package/dist/core/fs-safe.js.map +1 -1
- package/dist/core/git.d.ts.map +1 -1
- package/dist/core/git.js +7 -1
- package/dist/core/git.js.map +1 -1
- package/dist/core/output.d.ts +14 -0
- package/dist/core/output.d.ts.map +1 -1
- package/dist/core/output.js +72 -4
- package/dist/core/output.js.map +1 -1
- package/dist/core/paths.d.ts +1 -0
- package/dist/core/paths.d.ts.map +1 -1
- package/dist/core/paths.js +9 -1
- package/dist/core/paths.js.map +1 -1
- package/dist/core/review-intelligence.d.ts.map +1 -1
- package/dist/core/review-intelligence.js +182 -104
- package/dist/core/review-intelligence.js.map +1 -1
- package/dist/core/risk.d.ts.map +1 -1
- package/dist/core/risk.js +9 -4
- package/dist/core/risk.js.map +1 -1
- package/dist/core/session.d.ts +47 -1
- package/dist/core/session.d.ts.map +1 -1
- package/dist/core/session.js +203 -10
- package/dist/core/session.js.map +1 -1
- package/dist/core/verification-runs.d.ts +6 -0
- package/dist/core/verification-runs.d.ts.map +1 -0
- package/dist/core/verification-runs.js +104 -0
- package/dist/core/verification-runs.js.map +1 -0
- package/dist/core/verification.d.ts +4 -3
- package/dist/core/verification.d.ts.map +1 -1
- package/dist/core/verification.js +33 -66
- package/dist/core/verification.js.map +1 -1
- package/dist/renderers/html-replay.d.ts +2 -0
- package/dist/renderers/html-replay.d.ts.map +1 -1
- package/dist/renderers/html-replay.js +169 -9
- package/dist/renderers/html-replay.js.map +1 -1
- package/dist/renderers/markdown-report.d.ts +2 -0
- package/dist/renderers/markdown-report.d.ts.map +1 -1
- package/dist/renderers/markdown-report.js +20 -6
- package/dist/renderers/markdown-report.js.map +1 -1
- package/dist/renderers/resume-prompt.d.ts +2 -0
- package/dist/renderers/resume-prompt.d.ts.map +1 -1
- package/dist/renderers/resume-prompt.js +47 -10
- package/dist/renderers/resume-prompt.js.map +1 -1
- package/dist/types/index.d.ts +3 -3
- package/dist/types/index.d.ts.map +1 -1
- package/docs/assets/agentflight-cli-demo.svg +3 -3
- package/docs/assets/agentflight-terminal-demo.gif +0 -0
- package/docs/development/changed-file-filters.md +19 -7
- package/docs/development/dogfooding.md +1 -1
- package/docs/examples/basic-agentflight-session.md +21 -10
- package/docs/roadmap/index.md +11 -3
- package/docs/roadmap/v0.4.0-review-intelligence-plan.md +1 -1
- package/package.json +3 -3
package/CHANGELOG.md
CHANGED
|
@@ -2,6 +2,275 @@
|
|
|
2
2
|
|
|
3
3
|
All notable AgentFlight changes are documented here.
|
|
4
4
|
|
|
5
|
+
## [0.7.1] - 2026-06-21
|
|
6
|
+
|
|
7
|
+
### Fixed
|
|
8
|
+
|
|
9
|
+
- Refreshed the README terminal hero GIF so it shows the current
|
|
10
|
+
handoff-first review flow instead of the older replay-first flow.
|
|
11
|
+
- Updated the README hero caption and sample output to include `handoff` and
|
|
12
|
+
`history` accurately.
|
|
13
|
+
|
|
14
|
+
### Changed
|
|
15
|
+
|
|
16
|
+
- Tightened README workflow copy around the local handoff packet, recent local
|
|
17
|
+
session history, and current failure-excerpt surfaces.
|
|
18
|
+
|
|
19
|
+
## [0.7.0] - 2026-06-21
|
|
20
|
+
|
|
21
|
+
### Added
|
|
22
|
+
|
|
23
|
+
- Added `agentflight handoff`, a local-only review handoff command that generates the report, replay, and resume artifacts and summarizes readiness, proof gaps, review focus, and failed verification excerpts.
|
|
24
|
+
- Added `agentflight history`, a read-only local command for listing recent
|
|
25
|
+
sessions, proof counts, the current-session marker, and existing report/replay
|
|
26
|
+
artifact paths without search indexing, export, sync, or session switching.
|
|
27
|
+
- Added local `agentflight history --task <text>` and
|
|
28
|
+
`agentflight history --state ready|blocked|needs_verification|unknown|current`
|
|
29
|
+
filters so engineers can find relevant local sessions without scanning long
|
|
30
|
+
histories or adding any index, sync, export, or session switching behavior.
|
|
31
|
+
- Added a compact Review Path section to local HTML replay artifacts so long
|
|
32
|
+
sessions lead reviewers through proof gaps, unresolved failed runs, review
|
|
33
|
+
focus, and verification evidence without adding scripts, exports, or hosted
|
|
34
|
+
behavior.
|
|
35
|
+
- Documented the `agentflight history --limit 1` latest-action workflow for
|
|
36
|
+
reopening local handoff/report/replay/resume artifacts.
|
|
37
|
+
- Added session-specific handoff artifacts under `.agentflight/reports/` so
|
|
38
|
+
`agentflight history` can point to stable handoff packets from prior sessions.
|
|
39
|
+
- Added session-specific resume artifacts under `.agentflight/reports/` so
|
|
40
|
+
`agentflight history` can point to stable continuation prompts from prior
|
|
41
|
+
sessions.
|
|
42
|
+
- Added post-v0.6.0 user-research findings and a v0.6.0 website update prompt focused on the local handoff workflow.
|
|
43
|
+
- Added a post-v0.6.0 product direction note that keeps local handoff, first-run
|
|
44
|
+
workspace hygiene, replay ergonomics, proof guidance, and explainable ranking
|
|
45
|
+
as the priority order.
|
|
46
|
+
|
|
47
|
+
### Fixed
|
|
48
|
+
|
|
49
|
+
- Ready `agentflight status` output now points at an existing local handoff,
|
|
50
|
+
replay, or report artifact when one already exists, instead of repeating
|
|
51
|
+
handoff-generation guidance.
|
|
52
|
+
- Ready `agentflight resume` prompts now point at an existing local handoff,
|
|
53
|
+
replay, or report artifact when one already exists, instead of repeating
|
|
54
|
+
handoff-generation guidance.
|
|
55
|
+
- Review Intelligence now ignores unfinished AgentFlight readout/artifact
|
|
56
|
+
commands such as `agentflight replay` and `node dist/cli.js replay` when
|
|
57
|
+
computing incomplete proof gaps, so readiness guidance keeps pointing at
|
|
58
|
+
meaningful verification commands.
|
|
59
|
+
- Incomplete verification guidance now says a command may still be running and
|
|
60
|
+
suggests waiting before rerunning, avoiding false lost-evidence alarms when
|
|
61
|
+
status is checked during parallel verification.
|
|
62
|
+
- Ready `agentflight handoff` terminal guidance now tells reviewers to share
|
|
63
|
+
the local handoff packet first, with report/replay as supporting detail
|
|
64
|
+
artifacts.
|
|
65
|
+
- Current start-only `agentflight history` sessions now guide users to run
|
|
66
|
+
verification before handoff when no proof exists yet, while keeping
|
|
67
|
+
handoff-only guidance once verification has been recorded.
|
|
68
|
+
- Public positioning regression coverage now guards current public/runtime
|
|
69
|
+
surfaces against stale assistant-style positioning.
|
|
70
|
+
- Clean-worktree status now tells users to open handoff/report/replay or JSON
|
|
71
|
+
output for tucked verification details, matching the handoff-first ready
|
|
72
|
+
review path.
|
|
73
|
+
- Ready-session `Open first` guidance now prefers the generated handoff packet
|
|
74
|
+
in handoff, clean status/resume, and history surfaces, while blocked sessions
|
|
75
|
+
still point to the report/fix path.
|
|
76
|
+
- Full Markdown proof reports now show changed files, risk, verification,
|
|
77
|
+
review focus, proof gaps, readiness, recommendation, and next action before
|
|
78
|
+
the timeline, keeping long sessions faster to review.
|
|
79
|
+
- `agentflight history` now compacts non-current start-only sessions that have
|
|
80
|
+
no proof or review artifacts, keeping recent local artifacts easier to scan.
|
|
81
|
+
- Review Intelligence now keeps generated `.agentflight/.gitignore` helper files
|
|
82
|
+
below real first-run review targets while leaving them visible.
|
|
83
|
+
- `agentflight resume` now includes unresolved and historical failed-run context
|
|
84
|
+
below the verification count, matching status/report trust cues.
|
|
85
|
+
- Clean-worktree `agentflight resume` prompts now include the latest local
|
|
86
|
+
`Open first:` artifact path when current report/replay/handoff evidence
|
|
87
|
+
exists.
|
|
88
|
+
- Clean-worktree `agentflight status` now shows the latest local `Open first:`
|
|
89
|
+
artifact path when current report/replay/handoff evidence exists.
|
|
90
|
+
- `agentflight history` now shows the nearest previous local artifact when the
|
|
91
|
+
current latest session has none yet, while keeping the current-session
|
|
92
|
+
handoff next action.
|
|
93
|
+
- First-run AgentFlight generated-file lists and local-file guidance now use
|
|
94
|
+
shared output helpers, keeping `init` and `start --yes` copy consistent.
|
|
95
|
+
- `agentflight start --yes` now explains the AgentFlight files it generated
|
|
96
|
+
during safe auto-init, including project config and local runtime evidence.
|
|
97
|
+
- `agentflight init` and `agentflight start` now use concise ProjScan version
|
|
98
|
+
checks instead of extra help probing, while `agentflight doctor` keeps deeper
|
|
99
|
+
diagnostics.
|
|
100
|
+
- `agentflight doctor` now renders multiple detected proof-command suggestions
|
|
101
|
+
as an indented list instead of one long semicolon-separated line.
|
|
102
|
+
- `agentflight history` now prefers useful review-ready or blocked artifact
|
|
103
|
+
metadata over later clean-worktree artifact metadata, while preserving
|
|
104
|
+
clean-only session history.
|
|
105
|
+
- Clean-worktree `agentflight handoff` now preserves existing session review
|
|
106
|
+
artifacts instead of overwriting report/replay/resume evidence with an empty
|
|
107
|
+
post-commit clean-state artifact.
|
|
108
|
+
- Clean-worktree `agentflight handoff` now exits successfully instead of
|
|
109
|
+
treating an informational post-commit handoff as a command failure.
|
|
110
|
+
- `agentflight doctor` now suggests concrete detected `agentflight verify -- ...`
|
|
111
|
+
commands when config verification commands are empty.
|
|
112
|
+
- `agentflight verify` now suggests detected package proof commands when no
|
|
113
|
+
explicit command is provided and config commands are empty.
|
|
114
|
+
- `agentflight doctor` now warns when package proof scripts exist but
|
|
115
|
+
`.agentflight/config.json` has no configured verification commands.
|
|
116
|
+
- `agentflight history` now lists capped repo-relative malformed session paths
|
|
117
|
+
instead of only reporting a skipped-file count.
|
|
118
|
+
- Concurrent `agentflight verify` runs now reserve distinct stdout/stderr
|
|
119
|
+
evidence paths and merge verification updates without dropping either run.
|
|
120
|
+
- `agentflight history --limit` now rejects non-integer, zero, and negative
|
|
121
|
+
values with a clear local error instead of silently falling back or returning
|
|
122
|
+
an empty history.
|
|
123
|
+
- Review Intelligence now treats an earlier failed verification as resolved when
|
|
124
|
+
the same stored command later passes, so TDD red/green and format-fix loops do
|
|
125
|
+
not leave handoffs permanently blocked.
|
|
126
|
+
- Status, report, replay, and handoff now distinguish unresolved failed
|
|
127
|
+
verification from historical failed runs that later passed.
|
|
128
|
+
- Resume prompts now use the same unresolved-versus-resolved verification count
|
|
129
|
+
wording as the other review surfaces.
|
|
130
|
+
- Clean-worktree status now points users to `agentflight history --limit 1` to
|
|
131
|
+
reopen the latest local artifacts before starting the next session.
|
|
132
|
+
- History now shows unresolved-versus-resolved failed verification counts for
|
|
133
|
+
prior sessions.
|
|
134
|
+
- History now includes stable handoff artifact paths alongside report and
|
|
135
|
+
replay paths when those artifacts exist.
|
|
136
|
+
- History now includes stable resume artifact paths when those artifacts exist.
|
|
137
|
+
- History now suggests which existing local artifact to open first for each
|
|
138
|
+
session.
|
|
139
|
+
- History now surfaces the newest session's open-first action before the full
|
|
140
|
+
session list, reducing scan work in long local histories.
|
|
141
|
+
- History now tells users to run `agentflight handoff` when the latest local
|
|
142
|
+
session is current but no handoff/report/replay artifact exists yet.
|
|
143
|
+
- History now shows the latest session's recorded readiness in the top-level
|
|
144
|
+
`Latest action:` block.
|
|
145
|
+
- History now says `Open first: none yet` when no handoff, report, or replay
|
|
146
|
+
artifact exists.
|
|
147
|
+
- HTML replay now reserves urgent failed-run navigation for unresolved failed
|
|
148
|
+
verification while keeping historical failed runs visible in the ledger.
|
|
149
|
+
- Ready handoffs no longer inline historical failed verification excerpts once
|
|
150
|
+
no unresolved failed-verification proof gap remains; those excerpts stay in
|
|
151
|
+
report/replay evidence.
|
|
152
|
+
- `agentflight start` now treats AgentLoopKit's `Active task: none pinned.`
|
|
153
|
+
status as no active task instead of falsely reporting task reuse.
|
|
154
|
+
- AgentLoopKit task-link diagnostics now use generic link-check wording instead
|
|
155
|
+
of stale automatic task-creation copy.
|
|
156
|
+
- `agentflight init` now reports ProjScan and AgentLoopKit CLI availability
|
|
157
|
+
using the same concise tool formatter as start/report surfaces instead of
|
|
158
|
+
relying on repo marker files.
|
|
159
|
+
- `agentflight status` now reports a clean worktree explicitly instead of
|
|
160
|
+
calling zero changed files `Unknown` after a completed session has been
|
|
161
|
+
committed.
|
|
162
|
+
- `agentflight status` now compacts very long terminal verification run lists
|
|
163
|
+
while keeping full verification runs in JSON, report/replay, and local
|
|
164
|
+
evidence files.
|
|
165
|
+
- Clean-worktree `agentflight status` now tucks individual verification run
|
|
166
|
+
details when there are no unresolved failed runs, while keeping counts and
|
|
167
|
+
JSON evidence complete.
|
|
168
|
+
- Review Intelligence now treats incomplete verification attempts as blocking
|
|
169
|
+
before clean-worktree readiness, so live status cannot call a session clean
|
|
170
|
+
while verification is still in progress.
|
|
171
|
+
- `agentflight init` now lists created and skipped files by repo-relative path
|
|
172
|
+
instead of only showing counts.
|
|
173
|
+
- `agentflight doctor` now warns when `.projscan-memory/memory.json` exists
|
|
174
|
+
without a matching project filter and reports OK once the repo filters it
|
|
175
|
+
through `changedFileFilters.ignore`.
|
|
176
|
+
- `agentflight history` now labels stored review metadata as
|
|
177
|
+
`Recorded readiness:` so it is not confused with live worktree readiness.
|
|
178
|
+
- `agentflight doctor` no longer prints the absolute repository root in the
|
|
179
|
+
successful repository-root check.
|
|
180
|
+
- HTML replay now labels resolved failed verification rows as historical when
|
|
181
|
+
no unresolved failed runs remain.
|
|
182
|
+
- `agentflight doctor` now treats a missing current session as OK first-run
|
|
183
|
+
guidance instead of warning when the rest of the local setup is healthy.
|
|
184
|
+
- Clean-worktree status now reports `Risk: none` instead of `Risk: unknown`
|
|
185
|
+
while preserving `unknown` for legacy or genuinely missing metadata.
|
|
186
|
+
- Clean-worktree risk reasons now use current-state wording instead of saying
|
|
187
|
+
no changed files were detected "yet."
|
|
188
|
+
- Parallel report, replay, and resume commands now preserve each artifact event
|
|
189
|
+
in session history instead of letting the last stale session write win.
|
|
190
|
+
- Review Intelligence no longer lets ProjScan risk hints boost generated
|
|
191
|
+
`.projscan-memory/memory.json` above real first-run review targets, while the
|
|
192
|
+
file remains visible with the existing `changedFileFilters.ignore` guidance.
|
|
193
|
+
- `agentflight history` now includes the selected local artifact path directly
|
|
194
|
+
on the `Open first:` line, reducing lookup work in long session lists.
|
|
195
|
+
- `agentflight handoff` now includes the selected report or replay path directly
|
|
196
|
+
on the `Open first:` line while preserving the full artifact list.
|
|
197
|
+
|
|
198
|
+
### Changed
|
|
199
|
+
|
|
200
|
+
- Clean-worktree `agentflight resume` constraints now tell agents to start a new
|
|
201
|
+
AgentFlight session before unrelated work instead of applying active-task
|
|
202
|
+
constraints to a completed clean session.
|
|
203
|
+
- `agentflight start` now prefers configured no-arg `agentflight verify`
|
|
204
|
+
guidance when `.agentflight/config.json` already has verification commands,
|
|
205
|
+
while keeping detected package-script fallback guidance for empty configs.
|
|
206
|
+
- Current product copy now uses `coding agent sessions` and agentic engineering
|
|
207
|
+
language instead of assistant-style positioning.
|
|
208
|
+
- Idempotent `agentflight init` now shows a concrete detected proof command
|
|
209
|
+
when existing config verification commands are empty.
|
|
210
|
+
- First-run `agentflight init` now points seeded configs at no-arg
|
|
211
|
+
`agentflight verify` in the primary workflow.
|
|
212
|
+
- `agentflight init` now points first-run users through the handoff golden path:
|
|
213
|
+
start a session, capture verification, then generate a local handoff, with
|
|
214
|
+
status and doctor listed as supporting checks.
|
|
215
|
+
- `agentflight init` now uses the first detected verification command in its
|
|
216
|
+
primary workflow guidance, falling back to `<proof command>` when no proof
|
|
217
|
+
script is detected.
|
|
218
|
+
- Newly generated `.agentflight/config.json` files now seed detected
|
|
219
|
+
verification commands from package scripts while leaving profiles empty and
|
|
220
|
+
preserving existing configs.
|
|
221
|
+
- README and verification docs now describe the handoff-first first-run workflow
|
|
222
|
+
and init-seeded verification commands.
|
|
223
|
+
- Kept ready-review report, replay, resume, examples, and demo copy aligned with
|
|
224
|
+
the `agentflight handoff` golden path while keeping report/replay/resume as
|
|
225
|
+
supporting local artifacts.
|
|
226
|
+
- Changed-file review surfaces now fail with an actionable git-status error
|
|
227
|
+
instead of treating git-status failures as an empty diff.
|
|
228
|
+
- Shortened the optional ProjScan baseline budget during `agentflight start` so
|
|
229
|
+
busy local ProjScan work cannot stall session startup for too long.
|
|
230
|
+
- `agentflight start` now reuses an active AgentLoopKit task instead of creating
|
|
231
|
+
a duplicate AgentFlight placeholder task.
|
|
232
|
+
- `agentflight start` now shows concise ProjScan and AgentLoopKit warning
|
|
233
|
+
summaries when optional tooling is available but degraded.
|
|
234
|
+
- `agentflight start` now inspects ProjScan availability without running the
|
|
235
|
+
heavier optional `projscan start` baseline on the startup path.
|
|
236
|
+
- `agentflight start` now uses lightweight AgentLoopKit availability inspection
|
|
237
|
+
on the startup path while preserving task reuse/linking.
|
|
238
|
+
- `agentflight start` now reuses AgentLoopKit's local active-task state file
|
|
239
|
+
directly instead of parsing `agentloopkit status` output.
|
|
240
|
+
- `agentflight start` now links existing AgentLoopKit task state without
|
|
241
|
+
creating new AgentLoopKit task contracts automatically.
|
|
242
|
+
- Start output and Markdown tooling rows now show whether AgentLoopKit has an
|
|
243
|
+
active task linked when that local state is known.
|
|
244
|
+
- `agentflight handoff` now treats missing required proof as not ready to share:
|
|
245
|
+
it exits non-zero, uses `Fix before sharing`, and points users to the report
|
|
246
|
+
first.
|
|
247
|
+
- Start, report, replay, and handoff terminal output now display local
|
|
248
|
+
`.agentflight/...` artifact paths relative to the repo instead of absolute
|
|
249
|
+
user-directory paths.
|
|
250
|
+
- Handoff verification details now distinguish zero verification runs from
|
|
251
|
+
passing runs that simply have no failed excerpts.
|
|
252
|
+
- Review Intelligence suggested proof now follows each proof gap's preferred
|
|
253
|
+
proof-kind order, so source gaps prefer `npm test` when available and
|
|
254
|
+
dependency gaps prefer build/install-style proof before typecheck.
|
|
255
|
+
- Review Intelligence proof-gap rules are now centralized in one ordered table
|
|
256
|
+
to keep future proof guidance changes easier to review.
|
|
257
|
+
- HTML replay verification ledgers now display long run commands compactly while
|
|
258
|
+
keeping the full command available in the title text.
|
|
259
|
+
- Status and Markdown report verification evidence rows now use compact display
|
|
260
|
+
labels for long run commands while preserving stored command evidence.
|
|
261
|
+
- `agentflight init` now writes `.agentflight/.gitignore` for runtime evidence
|
|
262
|
+
directories instead of seeding new runtime `.gitkeep` files, reducing
|
|
263
|
+
first-run Git noise while keeping `.agentflight/config.json` and the local
|
|
264
|
+
AgentFlight ignore file visible as project config.
|
|
265
|
+
- AgentFlight session JSON writes now use same-directory temp files and atomic
|
|
266
|
+
rename so concurrent report, replay, resume, and handoff commands do not read
|
|
267
|
+
partially written session state.
|
|
268
|
+
- Review Intelligence now describes `.projscan-memory/memory.json` as generated
|
|
269
|
+
tool state instead of arbitrary unknown code while keeping the file visible.
|
|
270
|
+
- Report and replay generation now persist a compact local readiness summary in
|
|
271
|
+
session events, letting `agentflight history` show the latest recorded
|
|
272
|
+
readiness without recalculating old sessions.
|
|
273
|
+
|
|
5
274
|
## AgentFlight v0.6.0 - 2026-06-19
|
|
6
275
|
|
|
7
276
|
Local review ergonomics and automation surfaces for heavier real-world dogfood.
|
|
@@ -19,7 +288,20 @@ Local review ergonomics and automation surfaces for heavier real-world dogfood.
|
|
|
19
288
|
|
|
20
289
|
### Changed
|
|
21
290
|
|
|
22
|
-
-
|
|
291
|
+
- Clarified first-run workspace hygiene docs: `.projscan-memory/**` can be added
|
|
292
|
+
to `changedFileFilters.ignore` when ProjScan memory is generated evidence
|
|
293
|
+
rather than a review target.
|
|
294
|
+
- Lowered generated ProjScan memory priority in Review Intelligence so
|
|
295
|
+
`.projscan-memory/memory.json` remains visible but no longer outranks real
|
|
296
|
+
first-run review targets such as `.agentflight/config.json` or docs changes.
|
|
297
|
+
- Classified first-party TypeScript/JavaScript source files under `src/` as
|
|
298
|
+
source changes so review focus gives clearer guidance and proof gaps than the
|
|
299
|
+
previous unknown-file fallback.
|
|
300
|
+
- Aligned ready-review next actions with the handoff golden path: status,
|
|
301
|
+
report, replay, and resume now point users toward `agentflight handoff`, while
|
|
302
|
+
the handoff artifact itself tells users to share the generated local packet.
|
|
303
|
+
|
|
304
|
+
- AgentFlight now describes itself as a local-first review layer for coding agent sessions across package metadata, README, and product docs.
|
|
23
305
|
- Long suggested proof commands stay compact in high-density review surfaces while preserving the full suggested action where useful.
|
|
24
306
|
- Local AgentLoopKit evidence paths are filtered from AgentFlight changed-file review surfaces:
|
|
25
307
|
- `.agentloop/state.json`
|
|
@@ -151,7 +433,7 @@ Review Intelligence trust patch focused on v0.4.0 dogfood findings.
|
|
|
151
433
|
|
|
152
434
|
### Added
|
|
153
435
|
|
|
154
|
-
- Added deterministic Review Intelligence for
|
|
436
|
+
- Added deterministic Review Intelligence for coding agent sessions.
|
|
155
437
|
- Added review focus ranking to highlight the files developers should inspect first.
|
|
156
438
|
- Added proof gap detection for missing or failed verification evidence.
|
|
157
439
|
- Added clearer readiness states and next-best-action guidance.
|
package/README.md
CHANGED
|
@@ -8,21 +8,22 @@
|
|
|
8
8
|
|
|
9
9
|
See what your coding agent did, what failed, and whether the work is ready for review.
|
|
10
10
|
|
|
11
|
-
AgentFlight is a local-first review layer for
|
|
11
|
+
AgentFlight is a local-first review layer for coding agent sessions from Baseframe Labs. It records what your coding agent did, captures verification evidence, shows failure excerpts, and tells you what needs review before you trust the result.
|
|
12
12
|
|
|
13
13
|
Website: [baseframelabs.com/apps/agentflight](https://www.baseframelabs.com/apps/agentflight)
|
|
14
14
|
|
|
15
15
|
AgentFlight helps you:
|
|
16
16
|
|
|
17
|
-
- start
|
|
17
|
+
- start a coding agent session
|
|
18
18
|
- capture verification evidence
|
|
19
19
|
- see changed files and risk
|
|
20
20
|
- create snapshots during the session
|
|
21
|
-
- generate a
|
|
22
|
-
- generate a local replay timeline
|
|
21
|
+
- generate a local review handoff
|
|
22
|
+
- generate a proof report and local replay timeline
|
|
23
|
+
- find recent local sessions and their artifacts
|
|
23
24
|
- create a resume prompt for the next agent or reviewer
|
|
24
25
|
|
|
25
|
-

|
|
26
27
|
|
|
27
28
|
## 60-Second Workflow
|
|
28
29
|
|
|
@@ -30,38 +31,40 @@ AgentFlight helps you:
|
|
|
30
31
|
npx agentflight@latest init
|
|
31
32
|
npx agentflight@latest start --task "Add password reset flow"
|
|
32
33
|
|
|
33
|
-
# Run
|
|
34
|
+
# Run your coding agent normally
|
|
34
35
|
|
|
35
|
-
npx agentflight@latest verify
|
|
36
|
+
npx agentflight@latest verify
|
|
36
37
|
npx agentflight@latest snapshot --note "Initial implementation verified"
|
|
37
38
|
npx agentflight@latest status
|
|
38
|
-
npx agentflight@latest
|
|
39
|
-
npx agentflight@latest
|
|
40
|
-
npx agentflight@latest resume
|
|
39
|
+
npx agentflight@latest handoff
|
|
40
|
+
npx agentflight@latest history --limit 1
|
|
41
41
|
```
|
|
42
42
|
|
|
43
43
|
What you get:
|
|
44
44
|
|
|
45
|
-
- `init` creates local `.agentflight/` project files.
|
|
45
|
+
- `init` creates local `.agentflight/` project files and seeds detected verification commands into `.agentflight/config.json` when package scripts exist.
|
|
46
46
|
- `start` records the task, git branch, commit, dirty state, package manager, and tool availability.
|
|
47
|
-
- `verify
|
|
48
|
-
- `snapshot --note "..."` records the current git, risk, and proof state as a timeline event.
|
|
47
|
+
- `verify` runs configured commands and stores stdout, stderr, exit code, timing, and pass/fail status. Use `verify -- <command>` for one explicit proof command.
|
|
49
48
|
- `status` answers what changed, how risky it is, what proof exists, what proof is missing, and what to do next.
|
|
49
|
+
- `snapshot --note "..."` records the current git, risk, and proof state as a timeline event.
|
|
50
|
+
- `handoff` generates the local review packet: readiness, proof gaps, failed excerpts, and report/replay/resume artifact paths.
|
|
50
51
|
- `report` writes a Markdown proof report for review.
|
|
51
|
-
- `replay` writes a local HTML timeline you can open in a browser.
|
|
52
|
-
- `resume` writes a
|
|
52
|
+
- `replay` writes a local HTML review path and timeline you can open in a browser.
|
|
53
|
+
- `resume` writes a continuation prompt for the next safe step.
|
|
54
|
+
- `history` shows the latest action with recorded readiness, the artifact to open first, and recent local handoff/report/replay/resume paths without uploading, syncing, or switching sessions. Use `history --task <text>` or `history --state ready|blocked|needs_verification|unknown|current` to narrow existing local records.
|
|
53
55
|
|
|
54
56
|
## Watch The Flow
|
|
55
57
|
|
|
56
|
-
AgentFlight turns a loose
|
|
58
|
+
AgentFlight turns a loose coding agent session into a local proof trail:
|
|
57
59
|
|
|
58
60
|
1. Start a session before you ask the coding agent to work.
|
|
59
61
|
2. Capture real verification output with `agentflight verify`.
|
|
60
62
|
3. Snapshot meaningful checkpoints.
|
|
61
63
|
4. Read `status` to see changed files, risk, proof, gaps, and next action.
|
|
62
|
-
5.
|
|
64
|
+
5. Run `handoff` when the work is ready to review or when you need a clear fix-before-sharing summary.
|
|
65
|
+
6. Use `history --limit 1` to reopen the latest local handoff, report, replay, or resume artifact.
|
|
63
66
|
|
|
64
|
-
The replay artifact is a self-contained local HTML file. It leads with the review verdict, then lays out risk, review focus, proof gaps, the session timeline, and verification evidence (with inline failure excerpts, so you can see what broke without opening a log file) as a readable flight record:
|
|
67
|
+
The replay artifact is a self-contained local HTML file. It leads with the review verdict and a compact review path, then lays out risk, review focus, proof gaps, the session timeline, and verification evidence (with inline failure excerpts, so you can see what broke without opening a log file) as a readable flight record:
|
|
65
68
|
|
|
66
69
|

|
|
67
70
|
|
|
@@ -69,7 +72,7 @@ A high-resolution still is also available at [`docs/assets/agentflight-replay-ti
|
|
|
69
72
|
|
|
70
73
|
## Why This Exists
|
|
71
74
|
|
|
72
|
-
|
|
75
|
+
Coding agents move fast. After a few prompts, you can lose track of:
|
|
73
76
|
|
|
74
77
|
- what changed
|
|
75
78
|
- whether the agent drifted from the task
|
|
@@ -94,30 +97,30 @@ Changed files:
|
|
|
94
97
|
3
|
|
95
98
|
|
|
96
99
|
Risk: medium
|
|
97
|
-
-
|
|
100
|
+
- Application source files changed.
|
|
98
101
|
|
|
99
102
|
Verification Evidence:
|
|
100
103
|
1 passed, 0 failed
|
|
101
104
|
|
|
102
105
|
Review first:
|
|
103
106
|
1. src/auth/reset.ts
|
|
104
|
-
Why: identity/session path
|
|
107
|
+
Why: identity/session path
|
|
105
108
|
Focus: Check session, permission, and identity boundaries first.
|
|
106
109
|
Suggested proof: npm test
|
|
107
110
|
|
|
108
111
|
Proof gaps:
|
|
109
|
-
-
|
|
112
|
+
- none
|
|
110
113
|
|
|
111
114
|
Latest snapshot:
|
|
112
115
|
- Note: Initial implementation verified
|
|
113
116
|
- Risk: medium
|
|
114
117
|
- Changed files: 3
|
|
115
118
|
|
|
116
|
-
Readiness:
|
|
117
|
-
Reason:
|
|
119
|
+
Readiness: Ready for review
|
|
120
|
+
Reason: Verification evidence is present and no blocking proof gaps were detected.
|
|
118
121
|
|
|
119
122
|
Next action:
|
|
120
|
-
Run agentflight
|
|
123
|
+
Run agentflight handoff to generate the local review packet.
|
|
121
124
|
```
|
|
122
125
|
|
|
123
126
|
`agentflight report`:
|
|
@@ -127,7 +130,7 @@ Run agentflight verify -- npm test
|
|
|
127
130
|
|
|
128
131
|
## Review First
|
|
129
132
|
1. src/auth/reset.ts
|
|
130
|
-
- Why: identity/session path
|
|
133
|
+
- Why: identity/session path
|
|
131
134
|
|
|
132
135
|
## Verification Evidence
|
|
133
136
|
- passed: npm test
|
|
@@ -135,7 +138,25 @@ Run agentflight verify -- npm test
|
|
|
135
138
|
- stderr: .agentflight/evidence/.../verification-1.stderr.txt
|
|
136
139
|
|
|
137
140
|
## Review Readiness
|
|
138
|
-
|
|
141
|
+
Ready for review
|
|
142
|
+
```
|
|
143
|
+
|
|
144
|
+
`agentflight handoff`:
|
|
145
|
+
|
|
146
|
+
```text
|
|
147
|
+
AgentFlight handoff
|
|
148
|
+
|
|
149
|
+
Task:
|
|
150
|
+
Add password reset flow
|
|
151
|
+
|
|
152
|
+
Readiness: Ready for review
|
|
153
|
+
Open first: handoff .agentflight/reports/af-...-handoff.md
|
|
154
|
+
|
|
155
|
+
Artifacts:
|
|
156
|
+
- Handoff: .agentflight/reports/af-...-handoff.md
|
|
157
|
+
- Report: .agentflight/reports/af-...-report.md
|
|
158
|
+
- Replay: .agentflight/reports/af-...-replay.html
|
|
159
|
+
- Resume: .agentflight/reports/af-...-resume.md
|
|
139
160
|
```
|
|
140
161
|
|
|
141
162
|
`agentflight replay`:
|
|
@@ -145,7 +166,22 @@ Replay saved:
|
|
|
145
166
|
.agentflight/reports/af-...-replay.html
|
|
146
167
|
|
|
147
168
|
Timeline:
|
|
148
|
-
session_started -> verification_passed -> snapshot_created -> replay_generated
|
|
169
|
+
session_started -> verification_passed -> snapshot_created -> report_generated -> replay_generated
|
|
170
|
+
```
|
|
171
|
+
|
|
172
|
+
`agentflight history --limit 1`:
|
|
173
|
+
|
|
174
|
+
```text
|
|
175
|
+
AgentFlight history
|
|
176
|
+
|
|
177
|
+
Latest action:
|
|
178
|
+
Open first: handoff .agentflight/reports/af-...-handoff.md
|
|
179
|
+
Recorded readiness: Ready for review
|
|
180
|
+
|
|
181
|
+
Recent sessions:
|
|
182
|
+
1. Add password reset flow
|
|
183
|
+
Proof: 1 passed, 0 failed
|
|
184
|
+
Handoff: .agentflight/reports/af-...-handoff.md
|
|
149
185
|
```
|
|
150
186
|
|
|
151
187
|
`agentflight resume`:
|
|
@@ -181,12 +217,14 @@ The current AgentFlight release supports:
|
|
|
181
217
|
- config-defined verification profiles for repeated local command groups
|
|
182
218
|
- configurable generated/internal changed-file filters
|
|
183
219
|
- verification evidence capture with `agentflight verify`
|
|
184
|
-
- inline failure excerpts in
|
|
220
|
+
- inline failure excerpts in terminal output, handoffs, reports, and replays, so failures are visible without opening evidence files
|
|
185
221
|
- session events
|
|
186
222
|
- snapshots with `agentflight snapshot --note "..."`
|
|
187
223
|
- Markdown proof reports
|
|
188
|
-
- self-contained HTML
|
|
189
|
-
-
|
|
224
|
+
- self-contained HTML replays with review-path guidance and timelines
|
|
225
|
+
- local review handoffs that point to the report, replay, and resume artifacts
|
|
226
|
+
- local history filters for finding sessions by task text or recorded readiness
|
|
227
|
+
- resume prompts for the next agent or reviewer
|
|
190
228
|
- doctor checks for local setup
|
|
191
229
|
- defensive ProjScan and AgentLoopKit adapters
|
|
192
230
|
- no telemetry, cloud sync, or source upload
|
|
@@ -213,10 +251,13 @@ AgentFlight creates a local `.agentflight/` directory in your repo:
|
|
|
213
251
|
- `current/` stores the active session, handoff, and resume prompt.
|
|
214
252
|
- `reports/` stores Markdown proof reports and HTML replays.
|
|
215
253
|
- `evidence/` stores stdout and stderr from captured verification runs.
|
|
254
|
+
- `.gitignore` keeps those runtime directories out of git while leaving
|
|
255
|
+
`config.json` visible.
|
|
216
256
|
|
|
217
257
|
Sessions store an `events` timeline with meaningful moments such as session start, verification attempts, snapshots, and generated artifacts. Reports include filenames and summaries by default, not full source diffs.
|
|
218
258
|
|
|
219
|
-
Runtime session data is ignored by
|
|
259
|
+
Runtime session data is ignored by the `.agentflight/.gitignore` created by
|
|
260
|
+
`agentflight init`:
|
|
220
261
|
|
|
221
262
|
- `.agentflight/sessions/`
|
|
222
263
|
- `.agentflight/reports/`
|
|
@@ -235,11 +276,18 @@ AgentFlight always excludes its own runtime session/report/current/evidence file
|
|
|
235
276
|
}
|
|
236
277
|
```
|
|
237
278
|
|
|
279
|
+
On a first run, ProjScan fallback state may create `.projscan-memory/memory.json`
|
|
280
|
+
and AgentFlight may surface it in status, report, replay, or handoff output. If
|
|
281
|
+
that memory file is generated evidence rather than something reviewers should
|
|
282
|
+
inspect, add `.projscan-memory/**` to `changedFileFilters.ignore`. AgentFlight
|
|
283
|
+
does not ignore it by default, because some teams may want generated tool state
|
|
284
|
+
to stay visible.
|
|
285
|
+
|
|
238
286
|
See [docs/development/changed-file-filters.md](docs/development/changed-file-filters.md).
|
|
239
287
|
|
|
240
288
|
## Commands
|
|
241
289
|
|
|
242
|
-
- `agentflight init` initializes `.agentflight/` with safe writes and explains which local files are project config versus runtime evidence.
|
|
290
|
+
- `agentflight init` initializes `.agentflight/` with safe writes, seeds detected verification commands into config when package scripts exist, and explains which local files are project config versus runtime evidence.
|
|
243
291
|
- `agentflight start --task "..."` starts a session and writes the current handoff.
|
|
244
292
|
- `agentflight status` summarizes changed files, risk, verification status, review focus, proof gaps, readiness, snapshots, and next action.
|
|
245
293
|
- `agentflight status --format json` prints the same local status data as structured JSON for scripts.
|
|
@@ -252,6 +300,10 @@ See [docs/development/changed-file-filters.md](docs/development/changed-file-fil
|
|
|
252
300
|
- `agentflight report --mode pr-comment` writes a local PR-comment draft without posting anywhere.
|
|
253
301
|
- `agentflight replay` generates a local self-contained HTML replay with review focus and proof gaps.
|
|
254
302
|
- `agentflight resume` prints and saves a continuation prompt with the next safest action.
|
|
303
|
+
- `agentflight handoff` generates a local review handoff, report, replay, and resume prompt without posting anywhere. It exits non-zero when verification failures or missing proof make the work not ready to share.
|
|
304
|
+
- `agentflight history` shows the latest action first, including recorded readiness, open-first artifact guidance, current-session marker, proof counts, and existing local handoff/report/replay/resume paths.
|
|
305
|
+
- `agentflight history --task <text>` narrows existing local sessions by task title before applying `--limit`.
|
|
306
|
+
- `agentflight history --state ready|blocked|needs_verification|unknown|current` narrows existing local sessions by recorded readiness or the current-session marker before applying `--limit`.
|
|
255
307
|
- `agentflight doctor` checks local setup, scripts, tools, config, and current session state.
|
|
256
308
|
|
|
257
309
|
Future placeholders exist for `upgrade`, `license`, and `login`; AgentFlight Pro/Team is not available yet.
|
|
@@ -273,7 +325,7 @@ Strategic architecture:
|
|
|
273
325
|
|
|
274
326
|
## Example Session
|
|
275
327
|
|
|
276
|
-
Read [docs/examples/basic-agentflight-session.md](docs/examples/basic-agentflight-session.md) for a short password-reset walkthrough with status, report, replay, and resume artifacts.
|
|
328
|
+
Read [docs/examples/basic-agentflight-session.md](docs/examples/basic-agentflight-session.md) for a short password-reset walkthrough with status, handoff, report, replay, and resume artifacts.
|
|
277
329
|
|
|
278
330
|
## Roadmap
|
|
279
331
|
|
|
@@ -4,7 +4,8 @@ export interface InspectAgentLoopKitOptions {
|
|
|
4
4
|
cwd?: string;
|
|
5
5
|
run?: CommandRunner;
|
|
6
6
|
command?: string;
|
|
7
|
+
includeDoctor?: boolean;
|
|
7
8
|
}
|
|
8
9
|
export declare function inspectAgentLoopKit(options?: InspectAgentLoopKitOptions): Promise<ToolAdapterResult>;
|
|
9
|
-
export declare function
|
|
10
|
+
export declare function linkAgentLoopTask(cwd: string): Promise<ToolAdapterResult>;
|
|
10
11
|
//# sourceMappingURL=agentloopkit.d.ts.map
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"agentloopkit.d.ts","sourceRoot":"","sources":["../../src/adapters/agentloopkit.ts"],"names":[],"mappings":"
|
|
1
|
+
{"version":3,"file":"agentloopkit.d.ts","sourceRoot":"","sources":["../../src/adapters/agentloopkit.ts"],"names":[],"mappings":"AAEA,OAAO,KAAK,EAAE,aAAa,EAAE,MAAM,oBAAoB,CAAC;AAExD,OAAO,KAAK,EAAE,iBAAiB,EAAE,MAAM,mBAAmB,CAAC;AAG3D,MAAM,WAAW,0BAA0B;IACzC,GAAG,CAAC,EAAE,MAAM,CAAC;IACb,GAAG,CAAC,EAAE,aAAa,CAAC;IACpB,OAAO,CAAC,EAAE,MAAM,CAAC;IACjB,aAAa,CAAC,EAAE,OAAO,CAAC;CACzB;AAED,wBAAsB,mBAAmB,CACvC,OAAO,GAAE,0BAA+B,GACvC,OAAO,CAAC,iBAAiB,CAAC,CA+C5B;AAED,wBAAsB,iBAAiB,CAAC,GAAG,EAAE,MAAM,GAAG,OAAO,CAAC,iBAAiB,CAAC,CAU/E"}
|