npm - akm-cli - Versions diffs - 0.8.3 → 0.9.0-beta.1 - Mend

akm-cli 0.8.3 → 0.9.0-beta.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (316) hide show

package/CHANGELOG.md +209 -0
package/dist/assets/help/help-proposals.md +1 -2
package/dist/assets/hints/cli-hints-full.md +34 -19
package/dist/assets/hints/cli-hints-short.md +1 -1
package/dist/assets/profiles/catchup.json +13 -0
package/dist/assets/profiles/consolidate.json +13 -0
package/dist/assets/profiles/frequent.json +13 -0
package/dist/assets/tasks/core/backup.yml +4 -0
package/dist/assets/tasks/core/extract.yml +4 -0
package/dist/assets/tasks/core/improve.yml +4 -0
package/dist/assets/tasks/core/index-refresh.yml +4 -0
package/dist/assets/tasks/core/sync.yml +4 -0
package/dist/assets/tasks/core/update-stashes.yml +4 -0
package/dist/assets/tasks/core/version-check.yml +4 -0
package/dist/cli/config-migrate.js +6 -6
package/dist/cli/config-validate.js +4 -4
package/dist/cli/confirm.js +3 -3
package/dist/cli/parse-args.js +1 -1
package/dist/cli/shared.js +51 -14
package/dist/cli-node.mjs +26 -0
package/dist/cli.js +171 -3862
package/dist/commands/{agent-dispatch.js → agent/agent-dispatch.js} +6 -6
package/dist/commands/{agent-support.js → agent/agent-support.js} +2 -2
package/dist/commands/agent/contribute-cli.js +200 -0
package/dist/commands/completions.js +1 -1
package/dist/commands/config-cli.js +240 -3
package/dist/commands/config-edit.js +344 -0
package/dist/commands/db-cli.js +2 -2
package/dist/commands/env/env-cli.js +529 -0
package/dist/commands/env/env.js +410 -0
package/dist/commands/env/secret-cli.js +259 -0
package/dist/commands/{secret.js → env/secret.js} +6 -47
package/dist/commands/events.js +4 -4
package/dist/commands/feedback-cli.js +18 -34
package/dist/commands/graph/graph-cli.js +132 -0
package/dist/commands/{graph.js → graph/graph.js} +22 -16
package/dist/commands/health/checks.js +279 -0
package/dist/commands/health.js +94 -262
package/dist/commands/{consolidate.js → improve/consolidate.js} +48 -36
package/dist/commands/{distill-promotion-policy.js → improve/distill-promotion-policy.js} +3 -3
package/dist/commands/{distill.js → improve/distill.js} +39 -18
package/dist/commands/{eval-cases.js → improve/eval-cases.js} +1 -1
package/dist/commands/{extract-cli.js → improve/extract-cli.js} +4 -4
package/dist/commands/{extract-prompt.js → improve/extract-prompt.js} +2 -2
package/dist/commands/{extract.js → improve/extract.js} +185 -26
package/dist/commands/{improve-auto-accept.js → improve/improve-auto-accept.js} +4 -4
package/dist/commands/{improve-cli.js → improve/improve-cli.js} +44 -22
package/dist/commands/{improve-profiles.js → improve/improve-profiles.js} +13 -7
package/dist/commands/{improve-result-file.js → improve/improve-result-file.js} +1 -1
package/dist/commands/{improve.js → improve/improve.js} +517 -253
package/dist/{core → commands/improve/memory}/memory-belief.js +2 -2
package/dist/{core → commands/improve/memory}/memory-contradiction-detect.js +5 -5
package/dist/{core → commands/improve/memory}/memory-improve.js +4 -4
package/dist/commands/{reflect.js → improve/reflect.js} +33 -28
package/dist/commands/improve/session-asset.js +248 -0
package/dist/commands/lint/agent-linter.js +1 -1
package/dist/commands/lint/base-linter.js +55 -37
package/dist/commands/lint/command-linter.js +1 -1
package/dist/commands/lint/default-linter.js +1 -1
package/dist/commands/lint/env-key-rules.js +1 -1
package/dist/commands/lint/index.js +19 -25
package/dist/commands/lint/knowledge-linter.js +1 -1
package/dist/commands/lint/memory-linter.js +1 -1
package/dist/commands/lint/registry.js +8 -8
package/dist/commands/lint/skill-linter.js +1 -1
package/dist/commands/lint/task-linter.js +1 -1
package/dist/commands/lint/workflow-linter.js +1 -1
package/dist/commands/lint.js +1 -1
package/dist/commands/observability-cli.js +244 -0
package/dist/commands/proposal/drain-policies.js +3 -3
package/dist/commands/proposal/drain.js +15 -10
package/dist/commands/proposal/proposal-cli.js +478 -0
package/dist/commands/{proposal.js → proposal/proposal.js} +5 -5
package/dist/commands/{propose.js → proposal/propose.js} +11 -11
package/dist/{core → commands/proposal/validators}/proposal-quality-validators.js +8 -3
package/dist/{core → commands/proposal/validators}/proposal-validators.js +5 -5
package/dist/{core → commands/proposal/validators}/proposals.js +13 -7
package/dist/commands/{curate.js → read/curate.js} +7 -7
package/dist/commands/{knowledge.js → read/knowledge.js} +22 -9
package/dist/commands/{registry-search.js → read/registry-search.js} +5 -5
package/dist/commands/{remember-cli.js → read/remember-cli.js} +15 -7
package/dist/commands/read/search-cli.js +207 -0
package/dist/commands/{search.js → read/search.js} +22 -27
package/dist/commands/{show.js → read/show.js} +31 -45
package/dist/commands/registry-cli.js +8 -8
package/dist/commands/remember.js +8 -8
package/dist/commands/sources/add-cli.js +293 -0
package/dist/commands/{history.js → sources/history.js} +27 -25
package/dist/commands/{info.js → sources/info.js} +6 -6
package/dist/commands/{init.js → sources/init.js} +6 -6
package/dist/commands/{installed-stashes.js → sources/installed-stashes.js} +12 -12
package/dist/commands/{migration-help.js → sources/migration-help.js} +3 -2
package/dist/commands/{schema-repair.js → sources/schema-repair.js} +8 -8
package/dist/commands/{self-update.js → sources/self-update.js} +10 -9
package/dist/commands/{source-add.js → sources/source-add.js} +10 -10
package/dist/commands/{source-clone.js → sources/source-clone.js} +7 -7
package/dist/commands/{source-manage.js → sources/source-manage.js} +4 -4
package/dist/commands/sources/sources-cli.js +305 -0
package/dist/commands/sources/stash-cli.js +219 -0
package/dist/commands/{stash-skeleton.js → sources/stash-skeleton.js} +2 -1
package/dist/commands/tasks/default-tasks.js +173 -0
package/dist/commands/tasks/tasks-cli.js +210 -0
package/dist/commands/{tasks.js → tasks/tasks.js} +14 -14
package/dist/commands/wiki-cli.js +307 -0
package/dist/commands/workflow-cli.js +329 -0
package/dist/core/action-contributors.js +1 -1
package/dist/core/assert.js +40 -0
package/dist/core/asset/asset-create.js +54 -0
package/dist/core/{asset-ref.js → asset/asset-ref.js} +21 -4
package/dist/core/{asset-registry.js → asset/asset-registry.js} +3 -3
package/dist/core/{asset-spec.js → asset/asset-spec.js} +17 -31
package/dist/core/{markdown.js → asset/markdown.js} +1 -1
package/dist/core/{stash-meta.js → asset/stash-meta.js} +1 -1
package/dist/core/best-effort.js +64 -0
package/dist/core/common.js +32 -18
package/dist/core/{config-io.js → config/config-io.js} +29 -19
package/dist/core/{config-migration.js → config/config-migration.js} +11 -9
package/dist/core/{config-schema.js → config/config-schema.js} +45 -1
package/dist/core/config/config-types.js +16 -0
package/dist/core/{config-walker.js → config/config-walker.js} +2 -2
package/dist/core/{config.js → config/config.js} +10 -8
package/dist/core/env-secret-ref.js +90 -0
package/dist/core/errors.js +13 -3
package/dist/core/events.js +27 -4
package/dist/core/file-lock.js +1 -1
package/dist/core/improve-types.js +48 -0
package/dist/core/lesson-lint.js +2 -2
package/dist/core/paths.js +2 -2
package/dist/core/ripgrep/install.js +2 -2
package/dist/core/ripgrep/resolve.js +2 -2
package/dist/core/state-db.js +88 -46
package/dist/core/text-truncation.js +148 -0
package/dist/core/time.js +1 -1
package/dist/core/write-source.js +98 -85
package/dist/indexer/{db-backup.js → db/db-backup.js} +9 -24
package/dist/indexer/{db.js → db/db.js} +126 -116
package/dist/indexer/{graph-db.js → db/graph-db.js} +9 -4
package/dist/indexer/{llm-cache.js → db/llm-cache.js} +15 -12
package/dist/indexer/ensure-index.js +4 -4
package/dist/indexer/{graph-boost.js → graph/graph-boost.js} +1 -1
package/dist/indexer/{graph-extraction.js → graph/graph-extraction.js} +55 -13
package/dist/indexer/indexer.js +37 -30
package/dist/indexer/init.js +54 -0
package/dist/indexer/manifest.js +10 -10
package/dist/indexer/{memory-inference.js → passes/memory-inference.js} +92 -23
package/dist/indexer/{metadata-contributors.js → passes/metadata-contributors.js} +10 -8
package/dist/indexer/{metadata.js → passes/metadata.js} +15 -19
package/dist/indexer/{staleness-detect.js → passes/staleness-detect.js} +53 -12
package/dist/indexer/{db-search.js → search/db-search.js} +28 -16
package/dist/indexer/{ranking-contributors.js → search/ranking-contributors.js} +1 -1
package/dist/indexer/{ranking.js → search/ranking.js} +2 -2
package/dist/indexer/{search-hit-enrichers.js → search/search-hit-enrichers.js} +3 -3
package/dist/indexer/{search-source.js → search/search-source.js} +8 -8
package/dist/indexer/{semantic-status.js → search/semantic-status.js} +3 -3
package/dist/indexer/usage/unmigrated-vaults-guard.js +94 -0
package/dist/indexer/{usage-events.js → usage/usage-events.js} +32 -0
package/dist/indexer/{file-context.js → walk/file-context.js} +10 -15
package/dist/indexer/{matchers.js → walk/matchers.js} +13 -9
package/dist/indexer/{path-resolver.js → walk/path-resolver.js} +6 -6
package/dist/indexer/{project-context.js → walk/project-context.js} +1 -1
package/dist/indexer/{walker.js → walk/walker.js} +4 -3
package/dist/integrations/agent/builder-shared.js +39 -0
package/dist/integrations/agent/builders.js +14 -81
package/dist/integrations/agent/config.js +6 -4
package/dist/integrations/agent/detect.js +1 -1
package/dist/integrations/agent/index.js +23 -8
package/dist/integrations/agent/prompts.js +2 -3
package/dist/integrations/agent/runner.js +22 -3
package/dist/integrations/agent/spawn.js +9 -10
package/dist/integrations/harnesses/claude/agent-builder.js +48 -0
package/dist/integrations/harnesses/claude/config-import.js +70 -0
package/dist/integrations/harnesses/claude/index.js +64 -0
package/dist/integrations/{session-logs/providers/claude-code.js → harnesses/claude/session-log.js} +16 -1
package/dist/integrations/harnesses/index.js +144 -0
package/dist/integrations/harnesses/opencode/agent-builder.js +43 -0
package/dist/integrations/harnesses/opencode/config-import.js +82 -0
package/dist/integrations/harnesses/opencode/index.js +59 -0
package/dist/integrations/{session-logs/providers/opencode.js → harnesses/opencode/session-log.js} +1 -1
package/dist/integrations/harnesses/opencode-sdk/index.js +49 -0
package/dist/integrations/harnesses/opencode-sdk/sdk-runner.js +234 -0
package/dist/integrations/harnesses/types.js +43 -0
package/dist/integrations/lockfile.js +7 -16
package/dist/integrations/session-logs/index.js +82 -9
package/dist/llm/call-ai.js +4 -4
package/dist/llm/client.js +131 -6
package/dist/llm/embedder.js +6 -6
package/dist/llm/embedders/local.js +9 -22
package/dist/llm/embedders/remote.js +2 -2
package/dist/llm/embedders/types.js +1 -1
package/dist/llm/graph-extract.js +31 -12
package/dist/llm/index-passes.js +1 -1
package/dist/llm/memory-infer.js +12 -5
package/dist/llm/metadata-enhance.js +2 -2
package/dist/output/context.js +6 -44
package/dist/output/renderers.js +88 -58
package/dist/output/shapes/curate.js +7 -3
package/dist/output/shapes/distill.js +7 -3
package/dist/output/shapes/env-list.js +18 -16
package/dist/output/shapes/events.js +5 -4
package/dist/output/shapes/helpers.js +2 -4
package/dist/output/shapes/history.js +7 -3
package/dist/output/shapes/passthrough.js +8 -11
package/dist/output/shapes/{proposal-accept.js → proposal/accept.js} +7 -3
package/dist/output/shapes/{proposal-diff.js → proposal/diff.js} +7 -3
package/dist/output/shapes/{proposal-list.js → proposal/list.js} +7 -3
package/dist/output/shapes/{proposal-producer.js → proposal/producer.js} +5 -4
package/dist/output/shapes/{proposal-reject.js → proposal/reject.js} +7 -3
package/dist/output/shapes/{proposal-show.js → proposal/show.js} +7 -3
package/dist/output/shapes/registry-search.js +7 -3
package/dist/output/shapes/registry.js +12 -0
package/dist/output/shapes/search.js +7 -3
package/dist/output/shapes/secret-list.js +18 -16
package/dist/output/shapes/show.js +7 -3
package/dist/output/shapes.js +55 -30
package/dist/output/text/add.js +2 -3
package/dist/output/text/clone.js +2 -3
package/dist/output/text/config.js +2 -3
package/dist/output/text/curate.js +4 -3
package/dist/output/text/distill.js +2 -3
package/dist/output/text/enable-disable.js +5 -4
package/dist/output/text/env.js +13 -0
package/dist/output/text/events.js +5 -4
package/dist/output/text/feedback.js +4 -3
package/dist/output/text/helpers.js +54 -39
package/dist/output/text/history.js +2 -3
package/dist/output/text/import.js +2 -3
package/dist/output/text/index.js +2 -3
package/dist/output/text/info.js +2 -3
package/dist/output/text/init.js +2 -3
package/dist/output/text/list.js +2 -3
package/dist/output/text/proposal/producer.js +9 -0
package/dist/output/text/proposal/proposal.js +13 -0
package/dist/output/text/registry-commands.js +8 -7
package/dist/output/text/registry.js +12 -0
package/dist/output/text/remember.js +4 -3
package/dist/output/text/remove.js +2 -3
package/dist/output/text/save.js +2 -3
package/dist/output/text/search.js +4 -3
package/dist/output/text/show.js +4 -3
package/dist/output/text/update.js +2 -3
package/dist/output/text/upgrade.js +2 -3
package/dist/output/text/wiki.js +12 -11
package/dist/output/text/workflow.js +12 -10
package/dist/output/text.js +66 -32
package/dist/registry/build-index.js +11 -10
package/dist/registry/factory.js +1 -1
package/dist/registry/origin-resolve.js +1 -1
package/dist/registry/providers/index.js +2 -2
package/dist/registry/providers/skills-sh.js +91 -72
package/dist/registry/providers/static-index.js +75 -52
package/dist/registry/resolve.js +3 -3
package/dist/runtime.js +242 -0
package/dist/scripts/migrate-storage.js +1594 -673
package/dist/scripts/migrations/import-fs-improve-runs-to-db.js +240 -166
package/dist/setup/detect.js +311 -9
package/dist/setup/harness-config-import.js +6 -120
package/dist/setup/setup.js +454 -43
package/dist/sources/include.js +1 -1
package/dist/sources/provider-factory.js +2 -2
package/dist/sources/providers/filesystem.js +3 -3
package/dist/sources/providers/git.js +9 -9
package/dist/sources/providers/index.js +4 -4
package/dist/sources/providers/npm.js +6 -6
package/dist/sources/providers/provider-utils.js +13 -20
package/dist/sources/providers/sync-from-ref.js +5 -5
package/dist/sources/providers/tar-utils.js +2 -2
package/dist/sources/providers/website.js +2 -2
package/dist/sources/resolve.js +5 -5
package/dist/sources/website-ingest.js +5 -5
package/dist/storage/database.js +102 -0
package/dist/storage/engines/sqlite-migrations.js +42 -0
package/dist/storage/locations.js +25 -0
package/dist/storage/repositories/index-db.js +43 -0
package/dist/storage/repositories/workflow-runs-repository.js +141 -0
package/dist/tasks/backends/cron.js +4 -4
package/dist/tasks/backends/exec-utils.js +32 -0
package/dist/tasks/backends/index.js +3 -3
package/dist/tasks/backends/launchd.js +7 -14
package/dist/tasks/backends/schtasks.js +7 -16
package/dist/tasks/embedded.js +71 -0
package/dist/tasks/parser.js +2 -2
package/dist/tasks/resolveAkmBin.js +1 -1
package/dist/tasks/runner.js +28 -15
package/dist/tasks/schedule.js +1 -1
package/dist/tasks/validator.js +7 -7
package/dist/text-import-hook.mjs +51 -0
package/dist/version.js +2 -1
package/dist/wiki/wiki.js +7 -7
package/dist/workflows/{authoring.js → authoring/authoring.js} +6 -6
package/dist/workflows/{scope-key.js → authoring/scope-key.js} +1 -1
package/dist/workflows/cli.js +1 -1
package/dist/workflows/db.js +50 -32
package/dist/workflows/parser.js +4 -4
package/dist/workflows/renderer.js +5 -5
package/dist/workflows/runtime/agent-identity.js +56 -0
package/dist/workflows/runtime/checkin.js +57 -0
package/dist/workflows/{runs.js → runtime/runs.js} +197 -101
package/dist/workflows/validate-summary.js +82 -0
package/docs/README.md +1 -1
package/docs/data-and-telemetry.md +6 -6
package/package.json +16 -8
package/dist/commands/add-cli.js +0 -279
package/dist/commands/env.js +0 -213
package/dist/integrations/agent/sdk-runner.js +0 -126
package/dist/output/shapes/vault-list.js +0 -19
package/dist/output/text/proposal-producer.js +0 -8
package/dist/output/text/proposal.js +0 -12
package/dist/output/text/vault.js +0 -16
/package/dist/core/{asset-serialize.js → asset/asset-serialize.js} +0 -0
/package/dist/core/{frontmatter.js → asset/frontmatter.js} +0 -0
/package/dist/core/{config-sources.js → config/config-sources.js} +0 -0
/package/dist/indexer/{graph-dedup.js → graph/graph-dedup.js} +0 -0
/package/dist/{core/config-types.js → indexer/passes/pass-context.js} +0 -0
/package/dist/indexer/{search-fields.js → search/search-fields.js} +0 -0
/package/dist/indexer/{index-context.js → walk/index-context.js} +0 -0
/package/dist/workflows/{document-cache.js → runtime/document-cache.js} +0 -0

package/dist/commands/{consolidate.js → improve/consolidate.js} RENAMED Viewed

@@ -5,28 +5,28 @@ import { createHash } from "node:crypto";
 import fs from "node:fs";
 import path from "node:path";
 import readline from "node:readline";
-import { parse as yamlParse, stringify as yamlStringify } from "yaml";
-import { parseAssetRef } from "../core/asset-ref";
-import { assembleAssetFromString } from "../core/asset-serialize";
-import { resolveStashDir, timestampForFilename } from "../core/common";
-import { getDefaultLlmConfig, loadConfig } from "../core/config";
-import { ConfigError } from "../core/errors";
-import { appendEvent } from "../core/events";
-import { parseFrontmatter } from "../core/frontmatter";
-import { writeContradictEdge } from "../core/memory-belief";
-import { parseEmbeddedJsonResponse } from "../core/parse";
-import { hasHotCaptureMode, hasSupersededStatus, MERGE_ABSOLUTE_FLOOR_CHARS, MERGE_SHRINK_RATIO_MIN, validateProposalFrontmatter, } from "../core/proposal-quality-validators";
-import { createProposal, isProposalSkipped, listProposals } from "../core/proposals";
-import { detectTruncatedDescription } from "../core/text-truncation";
+import { parse as yamlParse } from "yaml";
+import { parseAssetRef } from "../../core/asset/asset-ref.js";
+import { assembleAssetFromString, serializeFrontmatter } from "../../core/asset/asset-serialize.js";
+import { parseFrontmatter } from "../../core/asset/frontmatter.js";
+import { resolveStashDir, timestampForFilename } from "../../core/common.js";
+import { getDefaultLlmConfig, loadConfig } from "../../core/config/config.js";
+import { ConfigError } from "../../core/errors.js";
+import { appendEvent } from "../../core/events.js";
+import { parseEmbeddedJsonResponse } from "../../core/parse.js";
+import { detectTruncatedDescription } from "../../core/text-truncation.js";
+import { hasHotCaptureMode, hasSupersededStatus, MERGE_ABSOLUTE_FLOOR_CHARS, MERGE_SHRINK_RATIO_MIN, validateProposalFrontmatter, } from "../proposal/validators/proposal-quality-validators.js";
+import { createProposal, isProposalSkipped, listProposals } from "../proposal/validators/proposals.js";
+import { writeContradictEdge } from "./memory/memory-belief.js";
 // Re-export the moved helpers so existing test imports continue to resolve.
 export { hasSupersededStatus, validateProposalFrontmatter };
-import { warn } from "../core/warn";
-import { deleteAssetFromSource, resolveWriteTarget, writeAssetToSource } from "../core/write-source";
-import { closeDatabase, findEntryIdByRef, getAllEntries, getEntryById, getNeighborsByEntryId, openExistingDatabase, } from "../indexer/db";
-import { resolveImproveProcessRunnerFromProfile } from "../integrations/agent/runner";
-import { chatCompletion } from "../llm/client";
-import { cosineSimilarity, embedBatch } from "../llm/embedder";
-import { isLlmFeatureEnabled, tryLlmFeature } from "../llm/feature-gate";
+import { warn } from "../../core/warn.js";
+import { commitWriteTargetBoundary, deleteAssetFromSource, resolveWriteTarget, writeAssetToSource, } from "../../core/write-source.js";
+import { closeDatabase, findEntryIdByRef, getAllEntries, getEntryById, getNeighborsByEntryId, openExistingDatabase, } from "../../indexer/db/db.js";
+import { resolveImproveProcessRunnerFromProfile, runnerIsLlm } from "../../integrations/agent/runner.js";
+import { chatCompletion } from "../../llm/client.js";
+import { cosineSimilarity, embedBatch } from "../../llm/embedder.js";
+import { isLlmFeatureEnabled, tryLlmFeature } from "../../llm/feature-gate.js";
 // ── Prompts ─────────────────────────────────────────────────────────────────
 const CONSOLIDATE_SYSTEM_PROMPT = `You are the akm consolidate assistant analyzing memory assets.
@@ -704,7 +704,7 @@ function archiveMemory(filePath, stashDir, ref, reason, opIndex, supersededBy, w
             ...(supersededBy ? { superseded_by: supersededBy } : {}),
             superseded_reason: reason,
         };
-        content = assembleAssetFromString(yamlStringify(newFm).trimEnd(), parsed.content);
+        content = assembleAssetFromString(serializeFrontmatter(newFm), parsed.content);
     }
     catch {
         if (warnings)
@@ -745,7 +745,7 @@ function archiveMemory(filePath, stashDir, ref, reason, opIndex, supersededBy, w
 function resolveConsolidateLlmConfig(config) {
     const consolidateProcess = config.profiles?.improve?.default?.processes?.consolidate;
     const runnerSpec = resolveImproveProcessRunnerFromProfile(consolidateProcess, config);
-    if (runnerSpec && runnerSpec.kind === "llm") {
+    if (runnerSpec && runnerIsLlm(runnerSpec)) {
         return runnerSpec.connection;
     }
     // Non-LLM runner modes (agent/sdk) don't apply to consolidate's HTTP path;
@@ -877,11 +877,12 @@ export async function akmConsolidate(opts = {}) {
     // health rollup can aggregate without regex-parsing English warning
     // strings. See `/tmp/akm-health-investigations/tuning-reasons-investigation.md` §Q2.
     const skipReasons = [];
-    // Tracks refs already emitted to skipReasons. A ref can only occupy one
-    // accounting bucket; subsequent skip ops for the same ref are recorded as
-    // warnings but must not push a second skipReasons entry (that would inflate
+    // Per-ref grouping of skipReasons entries. A ref occupies exactly one
+    // accounting bucket and therefore exactly one skipReasons array entry;
+    // subsequent skip ops for the same ref append to that entry's `skips[]`
+    // rather than pushing a second array entry (that would inflate
     // Σ(skipReasons) and break the invariant by +1 per duplicate).
-    const skipReasonEmittedRefs = new Set();
+    const skipReasonByRef = new Map();
     const pushSkipReason = (op, ref, reason) => {
         // 2026-05-27 cross-chunk double-count fix: if `ref` already contributed
         // to judgedNoAction in its own chunk (a different chunk proposed an op
@@ -891,14 +892,17 @@ export async function akmConsolidate(opts = {}) {
         // Σ(skipReasons) + failedChunkMemories.
         if (judgedNoActionRefs.delete(ref))
             judgedNoAction--;
-        if (skipReasonEmittedRefs.has(ref)) {
-            // Already counted once. Record the extra skip for observability but
-            // don't push to skipReasons — that would break the accounting invariant.
-            warnings.push(`Skip: ${ref} already in skipReasons (${reason} via ${op}); not re-counted.`);
+        const existing = skipReasonByRef.get(ref);
+        if (existing) {
+            // Already counted once for accounting. Append the extra skip to the
+            // ref's grouped entry for observability without adding a new array
+            // entry (which would break the accounting invariant).
+            existing.skips.push({ op, reason });
             return;
         }
-        skipReasonEmittedRefs.add(ref);
-        skipReasons.push({ op, ref, reason });
+        const entry = { ref, skips: [{ op, reason }] };
+        skipReasonByRef.set(ref, entry);
+        skipReasons.push(entry);
     };
     // judgedNoAction tracks memories the LLM saw inside a chunk but proposed
     // no op for. Computed per chunk as `chunk.length − unique(targetRefs in ops)`.
@@ -1560,7 +1564,7 @@ export async function akmConsolidate(opts = {}) {
                     ...(parsedMemory.data ?? {}),
                     description,
                 };
-                const serializedMergedFm = yamlStringify(mergedBodyFm).trimEnd();
+                const serializedMergedFm = serializeFrontmatter(mergedBodyFm);
                 const proposalContent = assembleAssetFromString(serializedMergedFm, parsedMemory.content);
                 // Pre-emit dedup against pending consolidate proposals from the
                 // same improve run (slug-variant match). The cross-run content-hash
@@ -1634,6 +1638,14 @@ export async function akmConsolidate(opts = {}) {
             }
         }
     }
+    // 0.9.0 (issue #507): batch-at-boundary commit. The merge/delete loop above
+    // wrote one merged primary and deleted N secondaries to the resolved target
+    // with NO per-asset commit. If the target is a writable git source and any
+    // asset was mutated, commit the whole batch ONCE here (stages .akm/ +
+    // siblings together). No-op for filesystem/primary-stash targets.
+    if (merged > 0 || deleted > 0) {
+        commitWriteTargetBoundary(target, `Consolidate: ${merged} merged, ${deleted} removed`);
+    }
     cleanupJournal(stashDir, timestamp);
     // TTL cleanup: remove archive entries older than archiveRetentionDays (default 90).
     // C-5 / #391: emit an `archive_cleanup` event before each deletion so the
@@ -1828,7 +1840,7 @@ export function sanitizeMergedContent(raw) {
     // Recovery: if the strict yaml library fails, fall back to the lenient
     // hand-rolled parseFrontmatter parser, which tolerates common LLM YAML
     // quirks (unescaped special chars, bare scalars, etc.). If it recovers
-    // at least one key, proceed — yamlStringify below will re-serialize
+    // at least one key, proceed — serializeFrontmatter below will re-serialize
     // cleanly. Only reject if both parsers fail to extract any data.
     let parsedFm;
     try {
@@ -1855,7 +1867,7 @@ export function sanitizeMergedContent(raw) {
     // Re-serialise via yaml.stringify to fix any quoting quirks.
     let serialized;
     try {
-        serialized = yamlStringify(fm).trimEnd();
+        serialized = serializeFrontmatter(fm);
     }
     catch (e) {
         return { ok: false, reason: `YAML_STRINGIFY_FAILED: ${e instanceof Error ? e.message : String(e)}` };
@@ -2205,7 +2217,7 @@ async function generateMergedContent(config, primaryRef, primaryBody, secondaryR
                         : secFm.data[key];
             }
             normalizeUpdatedField(repairedFmData);
-            const repairedYaml = yamlStringify(repairedFmData).trimEnd();
+            const repairedYaml = serializeFrontmatter(repairedFmData);
             const bodyPart = mergedFm.content ?? "";
             return { content: `---\n${repairedYaml}\n---\n${bodyPart}` };
         }

package/dist/commands/{distill-promotion-policy.js → improve/distill-promotion-policy.js} RENAMED Viewed

@@ -1,9 +1,9 @@
 // This Source Code Form is subject to the terms of the Mozilla Public
 // License, v. 2.0. If a copy of the MPL was not distributed with this
 // file, You can obtain one at https://mozilla.org/MPL/2.0/.
-import { parseAssetRef } from "../core/asset-ref";
-import { assembleAsset } from "../core/asset-serialize";
-import { parseFrontmatter } from "../core/frontmatter";
+import { parseAssetRef } from "../../core/asset/asset-ref.js";
+import { assembleAsset } from "../../core/asset/asset-serialize.js";
+import { parseFrontmatter } from "../../core/asset/frontmatter.js";
 /**
  * Reports whether `value` is an array holding at least one usable string.
  *
  * @param {unknown} value - Candidate value; anything that is not an array yields `false`.
  * @returns {boolean} `true` when some element is a string that still has
  *   characters after trimming whitespace, otherwise `false`.
  */
 function hasNonEmptyList(value) {
     if (!Array.isArray(value)) {
         return false;
     }
     for (const entry of value) {
         // Non-string entries and whitespace-only strings do not count.
         if (typeof entry === "string" && entry.trim().length > 0) {
             return true;
         }
     }
     return false;
 }

package/dist/commands/{distill.js → improve/distill.js} RENAMED Viewed

@@ -52,22 +52,22 @@
  */
 import fs from "node:fs";
 import path from "node:path";
-import { parseAssetRef } from "../core/asset-ref";
-import { assembleAssetFromString } from "../core/asset-serialize";
-import { resolveStashDir, timestampForFilename } from "../core/common";
-import { getDefaultLlmConfig, loadConfig } from "../core/config";
-import { ConfigError, UsageError } from "../core/errors";
-import { appendEvent, readEvents } from "../core/events";
-import { parseFrontmatter } from "../core/frontmatter";
-import { lintLessonContent } from "../core/lesson-lint";
-import { stripMarkdownFences } from "../core/markdown";
-import { createProposal, isProposalSkipped, listProposals, } from "../core/proposals";
-import { warnVerbose } from "../core/warn";
-import { resolveAssetPath } from "../indexer/path-resolver";
-import { chatCompletion, parseEmbeddedJsonResponse } from "../llm/client";
-import { isLlmFeatureEnabled, tryLlmFeature } from "../llm/feature-gate";
-import { assessMemoryKnowledgePromotionCandidate, deriveKnowledgeRef } from "./distill-promotion-policy";
-import { akmSearch } from "./search";
+import { parseAssetRef } from "../../core/asset/asset-ref.js";
+import { assembleAssetFromString } from "../../core/asset/asset-serialize.js";
+import { parseFrontmatter } from "../../core/asset/frontmatter.js";
+import { stripMarkdownFences } from "../../core/asset/markdown.js";
+import { resolveStashDir, timestampForFilename } from "../../core/common.js";
+import { getDefaultLlmConfig, loadConfig } from "../../core/config/config.js";
+import { ConfigError, UsageError } from "../../core/errors.js";
+import { appendEvent, readEvents } from "../../core/events.js";
+import { lintLessonContent } from "../../core/lesson-lint.js";
+import { warnVerbose } from "../../core/warn.js";
+import { resolveAssetPath } from "../../indexer/walk/path-resolver.js";
+import { chatCompletion, parseEmbeddedJsonResponse } from "../../llm/client.js";
+import { isLlmFeatureEnabled, tryLlmFeature } from "../../llm/feature-gate.js";
+import { createProposal, isProposalSkipped, listProposals, } from "../proposal/validators/proposals.js";
+import { akmSearch } from "../read/search.js";
+import { assessMemoryKnowledgePromotionCandidate, deriveKnowledgeRef } from "./distill-promotion-policy.js";
 /**
  * Asset-ref types that `akm distill` structurally refuses as inputs.
  *
@@ -112,13 +112,14 @@ export function deriveLessonRef(inputRef) {
         .replace(/^-|-$/g, "");
     return `lesson:${safe}-lesson`;
 }
+import { repairTruncatedDescription } from "../../core/text-truncation.js";
 // ── Content quality validators ──────────────────────────────────────────────
 //
 // The actual implementations now live in `core/proposal-quality-validators.ts`
 // so the same checks run inside `runProposalValidators` on `proposal accept`.
 // We re-export the public-facing helpers here so existing imports
-// (`from "../src/commands/distill"`) continue to resolve.
-import { detectDoubleFrontmatter, isValidDescription, isValidWhenToUse } from "../core/proposal-quality-validators";
+// (`from "../../src/commands/distill"`) continue to resolve.
+import { detectDoubleFrontmatter, isValidDescription, isValidWhenToUse, } from "../proposal/validators/proposal-quality-validators.js";
 export { detectDoubleFrontmatter, isValidDescription, isValidWhenToUse };
 // ── Prompt assembly ─────────────────────────────────────────────────────────
 const LESSON_SYSTEM_PROMPT = [
@@ -1121,6 +1122,26 @@ export async function akmDistill(options) {
             }
         }
     }
+    // Post-generation truncation repair (#556): if the LLM sliced the
+    // description mid-sentence, deterministically complete it from its own
+    // text or from the lesson body BEFORE the lint and quality validators run.
+    // This is a no-op (byte-identical) for already-complete descriptions, so it
+    // never alters a valid proposal. Runs on the lesson path only (knowledge
+    // has no description field gate here).
+    if (effectiveProposalKind !== "knowledge") {
+        const parsedRepair = parseFrontmatter(content);
+        const fmRepair = (parsedRepair.data ?? {});
+        const descRepairRaw = typeof fmRepair.description === "string" ? fmRepair.description : "";
+        if (descRepairRaw) {
+            const repaired = repairTruncatedDescription(descRepairRaw, parsedRepair.content);
+            if (repaired !== descRepairRaw) {
+                const repairedFmLines = Object.entries({ ...fmRepair, description: repaired })
+                    .map(([k, v]) => `${k}: ${JSON.stringify(v)}`)
+                    .join("\n");
+                content = assembleAssetFromString(repairedFmLines, parsedRepair.content);
+            }
+        }
+    }
     // Parse + lint the lesson before creating the proposal. The lint is the
     // canonical gate for required frontmatter (v1 spec §13). On failure we
     // surface a structured error and exit non-zero — but still emit

package/dist/commands/{eval-cases.js → improve/eval-cases.js} RENAMED Viewed

@@ -3,7 +3,7 @@
 // file, You can obtain one at https://mozilla.org/MPL/2.0/.
 import fs from "node:fs";
 import path from "node:path";
-import { writeFileAtomic } from "../core/common";
+import { writeFileAtomic } from "../../core/common.js";
 export function writeEvalCase(stashDir, evalCase) {
     const evalDir = path.join(stashDir, ".akm", "eval-cases");
     fs.mkdirSync(evalDir, { recursive: true });

package/dist/commands/{extract-cli.js → improve/extract-cli.js} RENAMED Viewed

@@ -15,10 +15,10 @@
  * `--auto` runs multiple harnesses).
  */
 import { defineCommand } from "citty";
-import { output, runWithJsonErrors } from "../cli/shared";
-import { UsageError } from "../core/errors";
-import { getAvailableHarnesses } from "../integrations/session-logs";
-import { akmExtract } from "./extract";
+import { output, runWithJsonErrors } from "../../cli/shared.js";
+import { UsageError } from "../../core/errors.js";
+import { getAvailableHarnesses } from "../../integrations/session-logs/index.js";
+import { akmExtract } from "./extract.js";
 export const extractCommand = defineCommand({
     meta: {
         name: "extract",

package/dist/commands/{extract-prompt.js → improve/extract-prompt.js} RENAMED Viewed

@@ -14,7 +14,7 @@
  * happy path. `additionalProperties: false` means any hallucinated keys
  * the model emits get dropped before we parse.
  */
-import promptTemplate from "../assets/prompts/extract-session.md" with { type: "text" };
+import promptTemplate from "../../assets/prompts/extract-session.md" with { type: "text" };
 /**
  * JSON Schema for the structured extract output. Passed to `chatCompletion`
  * when the configured LLM connection has `supportsJsonSchema: true`.
@@ -55,7 +55,7 @@ export const EXTRACT_JSON_SCHEMA = {
                         type: "string",
                         minLength: 20,
                         maxLength: 400,
-                        description: "One-sentence summary of the candidate.",
+                        description: "One-sentence summary of the candidate. Must be a complete sentence; do not end mid-clause.",
                     },
                     when_to_use: {
                         type: "string",

package/dist/commands/{extract.js → improve/extract.js} RENAMED Viewed

@@ -1,21 +1,47 @@
 // This Source Code Form is subject to the terms of the Mozilla Public
 // License, v. 2.0. If a copy of the MPL was not distributed with this
 // file, You can obtain one at https://mozilla.org/MPL/2.0/.
-import { stringify as yamlStringify } from "yaml";
-import { assembleAssetFromString } from "../core/asset-serialize";
-import { resolveStashDir, timestampForFilename } from "../core/common";
-import { getDefaultLlmConfig, loadConfig } from "../core/config";
-import { ConfigError, UsageError } from "../core/errors";
-import { appendEvent } from "../core/events";
-import { createProposal, isProposalSkipped } from "../core/proposals";
-import { getExtractedSessionsMap, openStateDatabase, shouldSkipAlreadyExtractedSession, upsertExtractedSession, } from "../core/state-db";
-import { warn } from "../core/warn";
-import { resolveImproveProcessRunnerFromProfile } from "../integrations/agent/runner";
-import { getAvailableHarnesses } from "../integrations/session-logs";
-import { preFilterSession } from "../integrations/session-logs/pre-filter";
-import { chatCompletion } from "../llm/client";
-import { isLlmFeatureEnabled, tryLlmFeature } from "../llm/feature-gate";
-import { buildExtractPrompt, EXTRACT_JSON_SCHEMA, parseExtractPayload } from "./extract-prompt";
+/**
+ * `akm extract` — session-insight extractor.
+ *
+ * Replaces the akm-plugin session-checkpoint hook with an on-demand extractor
+ * that reads native session files (claude-code JSONL, opencode storage tree)
+ * through the {@link SessionLogHarness} registry, pre-filters noise, and asks
+ * a bounded in-tree LLM to produce candidate memory/lesson/knowledge proposals
+ * for content the agent did NOT preserve via inline `akm remember`/`akm feedback`.
+ *
+ * Architectural notes:
+ *   - Stateless. All file/LLM access goes through injectable seams so tests
+ *     never touch a real platform.
+ *   - Bounded LLM call wrapped by {@link tryLlmFeature} under the
+ *     `session_extraction` gate (default-on; opt out via
+ *     `profiles.improve.default.processes.extract.enabled: false`).
+ *   - Proposals routed via `createProposal({ source: "extract", ... })` — the
+ *     same review queue as reflect / distill / consolidate. Never direct-write.
+ *   - Per-candidate body assembly merges description (+ when_to_use for lessons)
+ *     into the body's YAML frontmatter so the accept-time
+ *     descriptionQualityValidator passes — same pattern as the
+ *     consolidate-writer fix.
+ */
+import { assembleAsset } from "../../core/asset/asset-serialize.js";
+import { resolveStashDir, timestampForFilename } from "../../core/common.js";
+import { getDefaultLlmConfig, loadConfig } from "../../core/config/config.js";
+import { ConfigError, UsageError } from "../../core/errors.js";
+import { appendEvent } from "../../core/events.js";
+import { getExtractedSessionsMap, openStateDatabase, shouldSkipAlreadyExtractedSession, upsertExtractedSession, } from "../../core/state-db.js";
+import { repairTruncatedDescription } from "../../core/text-truncation.js";
+import { warn } from "../../core/warn.js";
+import { resolveImproveProcessRunnerFromProfile, runnerIsLlm } from "../../integrations/agent/runner.js";
+import { normalizeHarnessId } from "../../integrations/harnesses/index.js";
+import { getAvailableHarnesses } from "../../integrations/session-logs/index.js";
+import { preFilterSession } from "../../integrations/session-logs/pre-filter.js";
+import { chatCompletion } from "../../llm/client.js";
+import { isLlmFeatureEnabled, tryLlmFeature } from "../../llm/feature-gate.js";
+import { createProposal, isProposalSkipped } from "../proposal/validators/proposals.js";
+import { buildExtractPrompt, EXTRACT_JSON_SCHEMA, parseExtractPayload } from "./extract-prompt.js";
+import { buildSessionSummaryPrompt, parseSessionSummary, SESSION_SUMMARY_JSON_SCHEMA, sessionMeetsDurationGate, writeSessionAsset, } from "./session-asset.js";
+/** Default minimum session duration (minutes) for session indexing (#561). */
+const DEFAULT_MIN_SESSION_DURATION_MINUTES = 5;
 // ── Helpers ──────────────────────────────────────────────────────────────────
 /**
  * Parse a since-string into an absolute ms-epoch cutoff. Accepts:
@@ -49,7 +75,15 @@ export function parseSinceArg(value, now = Date.now()) {
  */
 function resolveHarness(type, harnesses) {
     const pool = harnesses ?? getAvailableHarnesses();
-    return pool.find((h) => h.name === type);
+    // #563 id-normalization bridge: a provider's `name` is its runtime id (e.g.
+    // the Claude provider is "claude-code"), but the canonical harness id is
+    // "claude". Normalize BOTH the requested `--type` and each provider name to
+    // canonical before comparing, so `--type claude` and `--type claude-code`
+    // both resolve to the Claude provider. Behaviour fix: previously only the
+    // exact runtime string ("claude-code") matched; the canonical "claude" used
+    // everywhere else (agent profiles, config schema) silently found nothing.
+    const wanted = normalizeHarnessId(type);
+    return pool.find((h) => normalizeHarnessId(h.name) === wanted);
 }
 /**
  * Build the ref + content for a candidate. The body must contain a
@@ -59,16 +93,19 @@ function resolveHarness(type, harnesses) {
  */
 function buildCandidateProposal(candidate, sourceRef) {
     const ref = `${candidate.type}:${candidate.name}`;
+    // Post-generation repair pass (#556): deterministically complete a
+    // description the LLM sliced mid-sentence before it reaches the
+    // auto-accept validators. No-op (byte-identical) for valid descriptions.
+    const description = repairTruncatedDescription(candidate.description, candidate.body);
     const fm = {
-        description: candidate.description,
+        description,
         sources: [`session:${sourceRef.harness}:${sourceRef.sessionId}`],
     };
     if (candidate.type === "lesson" && candidate.when_to_use) {
         fm.when_to_use = candidate.when_to_use;
     }
-    const serialized = yamlStringify(fm).trimEnd();
-    const content = assembleAssetFromString(serialized, candidate.body);
-    return { ref, content };
+    const content = assembleAsset(fm, candidate.body);
+    return { ref, content, description };
 }
 /**
  * Process one session through the full pipeline: read → pre-filter → LLM →
@@ -78,7 +115,7 @@ function buildCandidateProposal(candidate, sourceRef) {
  * proposal validation failure) the session result records a warning and
  * keeps going — one session's bad luck never aborts a multi-session run.
  */
-async function processSession(harness, sessionRef, stashDir, config, llmConfig, chat, ctx, sourceRun, dryRun, timeoutMs, maxTotalChars) {
+async function processSession(harness, sessionRef, stashDir, config, llmConfig, chat, ctx, sourceRun, dryRun, timeoutMs, maxTotalChars, sessionIndexing) {
     const warnings = [];
     let data;
     try {
@@ -100,6 +137,30 @@ async function processSession(harness, sessionRef, stashDir, config, llmConfig,
         ...(typeof maxTotalChars === "number" ? { maxTotalChars } : {}),
     });
     const prompt = buildExtractPrompt({ data, events: filtered.events, inlineRefs: data.inlineRefs });
+    // #561 — ADDITIVE session indexing. Generate + write the session asset
+    // (`sessions/<harness>/<id>.md`). FAIL-OPEN: any failure only records a
+    // warning; it NEVER changes the proposal/skip outcome of extract. Returns the
+    // frontmatter fields to merge into the per-session result for state-db
+    // correlation. When disabled this closure makes NO LLM call and writes NOTHING.
+    const maybeWriteSessionAsset = async () => {
+        if (!sessionIndexing.enabled || dryRun)
+            return {};
+        if (!sessionMeetsDurationGate(data, sessionIndexing.minDurationMinutes))
+            return {};
+        try {
+            const result = await writeSessionAsset(data, stashDir, sessionIndexing.generate);
+            if (result.written) {
+                return {
+                    ...(result.ref ? { sessionAssetRef: result.ref } : {}),
+                    ...(result.logPath ? { sessionLogPath: result.logPath } : {}),
+                };
+            }
+        }
+        catch (err) {
+            warnings.push(`session asset write failed: ${err instanceof Error ? err.message : String(err)}`);
+        }
+        return {};
+    };
     let llmRaw = "";
     const llmResult = await tryLlmFeature("session_extraction", config, async () => {
         llmRaw = await chat(llmConfig, [{ role: "user", content: prompt }], {
@@ -141,6 +202,7 @@ async function processSession(harness, sessionRef, stashDir, config, llmConfig,
                 preFilterOutput: filtered.stats.outputCount,
             },
         }, ctx);
+        const sessionAsset = await maybeWriteSessionAsset();
         return {
             sessionId: sessionRef.sessionId,
             harness: harness.name,
@@ -153,6 +215,7 @@ async function processSession(harness, sessionRef, stashDir, config, llmConfig,
                 truncatedCount: filtered.stats.truncatedCount,
             },
             warnings,
+            ...sessionAsset,
         };
     }
     for (const candidate of payload.candidates) {
@@ -161,7 +224,7 @@ async function processSession(harness, sessionRef, stashDir, config, llmConfig,
             continue;
         }
         try {
-            const { ref, content } = buildCandidateProposal(candidate, sessionRef);
+            const { ref, content, description } = buildCandidateProposal(candidate, sessionRef);
             const result = createProposal(stashDir, {
                 ref,
                 source: "extract",
@@ -169,7 +232,7 @@ async function processSession(harness, sessionRef, stashDir, config, llmConfig,
                 payload: {
                     content,
                     frontmatter: {
-                        description: candidate.description,
+                        description,
                         ...(candidate.when_to_use ? { when_to_use: candidate.when_to_use } : {}),
                         ...(typeof candidate.confidence === "number" ? { confidence: candidate.confidence } : {}),
                         sources: [`session:${sessionRef.harness}:${sessionRef.sessionId}`],
@@ -202,6 +265,7 @@ async function processSession(harness, sessionRef, stashDir, config, llmConfig,
             preFilterOutput: filtered.stats.outputCount,
         },
     }, ctx);
+    const sessionAsset = await maybeWriteSessionAsset();
     return {
         sessionId: sessionRef.sessionId,
         harness: harness.name,
@@ -213,6 +277,7 @@ async function processSession(harness, sessionRef, stashDir, config, llmConfig,
             truncatedCount: filtered.stats.truncatedCount,
         },
         warnings,
+        ...sessionAsset,
     };
 }
 // ── Public entrypoint ────────────────────────────────────────────────────────
@@ -257,7 +322,7 @@ export async function akmExtract(options) {
     let llmConfig;
     const runnerSpec = resolveImproveProcessRunnerFromProfile(extractProcess, config);
     if (runnerSpec) {
-        if (runnerSpec.kind !== "llm") {
+        if (!runnerIsLlm(runnerSpec)) {
             throw new ConfigError(`Extract only supports mode: "llm" (in-tree LLM call). Got mode: "${runnerSpec.kind}" from profiles.improve.default.processes.extract — change it to "llm" or remove the override.`, "INVALID_CONFIG_FILE");
         }
         llmConfig = runnerSpec.connection;
@@ -276,6 +341,35 @@ export async function akmExtract(options) {
     const maxTotalChars = typeof extractProcess?.maxTotalChars === "number" ? extractProcess.maxTotalChars : undefined;
     // Default discovery window — process config can override the built-in 24h.
     const effectiveSince = options.since ?? extractProcess?.defaultSince;
+    // #561 — resolve session-indexing config. Default ON: we only reach this code
+    // when `session_extraction` is enabled AND an LLM is configured (both checked
+    // above), so defaulting on costs nothing offline (the summary call fails open)
+    // while making sessions searchable in the common LLM-configured case. Set
+    // `processes.extract.indexSessions: false` for byte-identical legacy behaviour.
+    const sessionIndexingEnabled = extractProcess?.indexSessions ?? true;
+    const minSessionDuration = typeof extractProcess?.minSessionDuration === "number"
+        ? extractProcess.minSessionDuration
+        : DEFAULT_MIN_SESSION_DURATION_MINUTES;
+    // Production summary generator: a bounded in-tree LLM call wrapped in the same
+    // fail-open `tryLlmFeature` seam as the rest of extract. Returns `undefined`
+    // on disablement / timeout / error so no asset is written. Tests inject a fake.
+    const chatForSummary = options.chat ?? chatCompletion;
+    const defaultSessionSummaryGenerator = async (data) => {
+        let raw = "";
+        await tryLlmFeature("session_extraction", config, async () => {
+            raw = await chatForSummary(llmConfig, [{ role: "user", content: buildSessionSummaryPrompt(data) }], {
+                timeoutMs,
+                responseSchema: SESSION_SUMMARY_JSON_SCHEMA,
+            });
+            return raw;
+        }, "", { timeoutMs });
+        return parseSessionSummary(raw);
+    };
+    const sessionIndexing = {
+        enabled: sessionIndexingEnabled,
+        minDurationMinutes: minSessionDuration,
+        generate: options.generateSessionSummary ?? defaultSessionSummaryGenerator,
+    };
     const harness = resolveHarness(options.type, options.harnesses);
     if (!harness) {
         return {
@@ -355,7 +449,7 @@ export async function akmExtract(options) {
     let seenMap = new Map();
     if (trackingEnabled && candidates.length > 0) {
         try {
-            stateDb = options.stateDb ?? openStateDatabase();
+            stateDb = options.stateDb ?? openStateDatabase(options.stateDbPath);
             seenMap = getExtractedSessionsMap(stateDb, harness.name, candidates.map((c) => c.sessionId));
         }
         catch (err) {
@@ -389,7 +483,7 @@ export async function akmExtract(options) {
             continue;
         }
         try {
-            const result = await processSession(harness, summary, stashDir, config, llmConfig, chat, options.ctx, sourceRun, dryRun, timeoutMs, maxTotalChars);
+            const result = await processSession(harness, summary, stashDir, config, llmConfig, chat, options.ctx, sourceRun, dryRun, timeoutMs, maxTotalChars, sessionIndexing);
             sessions.push(result);
             if (result.skipped)
                 skippedCount += 1;
@@ -423,6 +517,11 @@ export async function akmExtract(options) {
                             preFilterOutputCount: result.preFilter.outputCount,
                             preFilterTruncatedCount: result.preFilter.truncatedCount,
                             ...(result.skipReason ? { skipReason: result.skipReason } : {}),
+                            // #561 — record the session's log_path for correlation across
+                            // index rebuilds (the session asset frontmatter is the primary
+                            // durable key; this is the state-db mirror of it).
+                            ...(result.sessionLogPath ? { logPath: result.sessionLogPath } : {}),
+                            ...(result.sessionAssetRef ? { sessionAssetRef: result.sessionAssetRef } : {}),
                         },
                     });
                 }
@@ -475,3 +574,63 @@ export async function akmExtract(options) {
         durationMs: Date.now() - startMs,
     };
 }
+/**
+ * Count NEW (unseen, in-window) extract candidate sessions across all available
+ * harnesses WITHOUT making any LLM calls. Mirrors the discovery + seen-filter
+ * logic in {@link akmExtract} so the `#554 minNewSessions` gate in `improve`
+ * can decide whether the extract pass is worth running before any work begins.
+ *
+ * A session is a "new candidate" when it is in the `since` window AND it would
+ * not be skipped by {@link shouldSkipAlreadyExtractedSession} (i.e. it has never
+ * been extracted, or new events have arrived since it was last extracted).
+ *
+ * Only the state-db lookup is fail-open: if opening or querying it throws, a
+ * warning is emitted and every in-window session of that harness is counted.
+ * Errors thrown by a harness's `isAvailable()` / `listSessions()` are not
+ * caught here and propagate to the caller (after the `finally` cleanup).
+ *
+ * @param config - Loaded config; only
+ *   `profiles.improve.default.processes.extract.defaultSince` is read.
+ * @param [options] - Optional overrides (defaults to `{}`).
+ * @param [options.since] - Since-string for the discovery window; takes
+ *   precedence over the process `defaultSince`. Parsed by {@link parseSinceArg}.
+ * @param [options.harnesses] - Harness pool to scan; defaults to
+ *   `getAvailableHarnesses()`. Entries whose `isAvailable()` is falsy are dropped.
+ * @param [options.stateDb] - Already-open state database. When supplied it is
+ *   used as-is and is NOT closed by this function.
+ * @param [options.stateDbPath] - Forwarded to `openStateDatabase` when no
+ *   `stateDb` is supplied.
+ * @returns The number of sessions counted as new candidates, summed over all
+ *   scanned harnesses.
+ */
+export function countNewExtractCandidates(config, options = {}) {
+    const extractProcess = config.profiles?.improve?.default?.processes?.extract;
+    const effectiveSince = options.since ?? extractProcess?.defaultSince; // explicit option wins over process config
+    const sinceMs = parseSinceArg(effectiveSince);
+    const harnesses = (options.harnesses ?? getAvailableHarnesses()).filter((h) => h.isAvailable());
+    let stateDb = options.stateDb;
+    let openedStateDb = false; // true only when this call opened the handle itself
+    let total = 0;
+    try {
+        for (const harness of harnesses) {
+            const candidates = harness.listSessions({ sinceMs });
+            if (candidates.length === 0)
+                continue; // nothing in the window for this harness; no state-db access needed
+            let seenMap = new Map();
+            try {
+                if (!stateDb) { // opened lazily, then reused for the remaining harnesses
+                    stateDb = openStateDatabase(options.stateDbPath);
+                    openedStateDb = true;
+                }
+                seenMap = getExtractedSessionsMap(stateDb, harness.name, candidates.map((c) => c.sessionId));
+            }
+            catch (err) {
+                // state.db unavailable — treat every in-window session as a new
+                // candidate (fail-open: never let a transient sqlite error wrongly
+                // trip the gate and skip a pass that should have run).
+                const msg = err instanceof Error ? err.message : String(err);
+                warn(`[extract] state.db unavailable while counting candidates, treating all as new: ${msg}`);
+                total += candidates.length;
+                continue;
+            }
+            for (const summary of candidates) {
+                const prior = seenMap.get(summary.sessionId); // undefined when the session has no state-db entry
+                if (shouldSkipAlreadyExtractedSession(prior, summary.endedAt))
+                    continue;
+                total += 1;
+            }
+        }
+    }
+    finally {
+        if (stateDb && openedStateDb) { // a caller-supplied options.stateDb is left open
+            try {
+                stateDb.close();
+            }
+            catch {
+                // best-effort close
+            }
+        }
+    }
+    return total;
+}