akm-cli 0.6.1 → 0.7.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +66 -0
- package/dist/{cli.js → src/cli.js} +712 -34
- package/dist/{commands → src/commands}/config-cli.js +47 -4
- package/dist/src/commands/distill.js +283 -0
- package/dist/src/commands/events.js +108 -0
- package/dist/src/commands/history.js +191 -0
- package/dist/{commands → src/commands}/installed-stashes.js +1 -1
- package/dist/src/commands/proposal.js +119 -0
- package/dist/src/commands/propose.js +171 -0
- package/dist/src/commands/reflect.js +193 -0
- package/dist/{commands → src/commands}/registry-search.js +71 -7
- package/dist/{commands → src/commands}/remember.js +12 -0
- package/dist/{commands → src/commands}/search.js +104 -4
- package/dist/{commands → src/commands}/self-update.js +4 -3
- package/dist/{commands → src/commands}/show.js +73 -0
- package/dist/{commands → src/commands}/source-add.js +5 -1
- package/dist/{commands → src/commands}/source-manage.js +7 -1
- package/dist/{core → src/core}/asset-ref.js +5 -5
- package/dist/{core → src/core}/asset-spec.js +12 -0
- package/dist/{core → src/core}/common.js +1 -1
- package/dist/{core → src/core}/config.js +203 -121
- package/dist/{core → src/core}/errors.js +4 -0
- package/dist/src/core/events.js +239 -0
- package/dist/src/core/lesson-lint.js +86 -0
- package/dist/src/core/proposals.js +406 -0
- package/dist/src/core/warn.js +72 -0
- package/dist/{core → src/core}/write-source.js +80 -5
- package/dist/{indexer → src/indexer}/db-search.js +114 -24
- package/dist/{indexer → src/indexer}/db.js +76 -23
- package/dist/{indexer → src/indexer}/file-context.js +0 -3
- package/dist/src/indexer/graph-boost.js +179 -0
- package/dist/src/indexer/graph-extraction.js +212 -0
- package/dist/{indexer → src/indexer}/indexer.js +88 -7
- package/dist/{indexer → src/indexer}/matchers.js +1 -1
- package/dist/src/indexer/memory-inference.js +263 -0
- package/dist/{indexer → src/indexer}/metadata.js +111 -3
- package/dist/{indexer → src/indexer}/search-source.js +4 -2
- package/dist/src/integrations/agent/config.js +292 -0
- package/dist/src/integrations/agent/detect.js +94 -0
- package/dist/src/integrations/agent/index.js +17 -0
- package/dist/src/integrations/agent/profiles.js +65 -0
- package/dist/src/integrations/agent/prompts.js +167 -0
- package/dist/src/integrations/agent/spawn.js +272 -0
- package/dist/{integrations → src/integrations}/github.js +9 -3
- package/dist/{integrations → src/integrations}/lockfile.js +0 -26
- package/dist/{llm → src/llm}/client.js +33 -2
- package/dist/{llm → src/llm}/embedders/remote.js +37 -3
- package/dist/src/llm/feature-gate.js +108 -0
- package/dist/src/llm/graph-extract.js +107 -0
- package/dist/src/llm/index-passes.js +35 -0
- package/dist/src/llm/memory-infer.js +86 -0
- package/dist/{output → src/output}/cli-hints.js +15 -2
- package/dist/{output → src/output}/renderers.js +63 -2
- package/dist/src/output/shapes.js +523 -0
- package/dist/src/output/text.js +1116 -0
- package/dist/{registry → src/registry}/build-index.js +19 -8
- package/dist/{registry → src/registry}/factory.js +0 -8
- package/dist/{registry → src/registry}/providers/static-index.js +6 -3
- package/dist/{registry → src/registry}/resolve.js +68 -2
- package/dist/{setup → src/setup}/setup.js +52 -5
- package/dist/{sources → src/sources}/providers/git.js +7 -15
- package/dist/{wiki → src/wiki}/wiki.js +54 -6
- package/dist/{workflows → src/workflows}/runs.js +37 -3
- package/dist/tests/add-website-source.test.js +119 -0
- package/dist/tests/agent/agent-config-loader.test.js +70 -0
- package/dist/tests/agent/agent-config.test.js +221 -0
- package/dist/tests/agent/agent-detect.test.js +100 -0
- package/dist/tests/agent/agent-spawn.test.js +234 -0
- package/dist/tests/agent-output.test.js +186 -0
- package/dist/tests/architecture/agent-no-llm-sdk-guard.test.js +103 -0
- package/dist/tests/architecture/agent-spawn-seam.test.js +193 -0
- package/dist/tests/architecture/llm-stateless-seam.test.js +112 -0
- package/dist/tests/asset-ref.test.js +192 -0
- package/dist/tests/asset-registry.test.js +103 -0
- package/dist/tests/asset-spec.test.js +241 -0
- package/dist/tests/bench/attribution.test.js +996 -0
- package/dist/tests/bench/cleanup-sigint.test.js +83 -0
- package/dist/tests/bench/cleanup.js +234 -0
- package/dist/tests/bench/cleanup.test.js +166 -0
- package/dist/tests/bench/cli.js +1018 -0
- package/dist/tests/bench/cli.test.js +445 -0
- package/dist/tests/bench/compare.test.js +556 -0
- package/dist/tests/bench/corpus.js +317 -0
- package/dist/tests/bench/corpus.test.js +258 -0
- package/dist/tests/bench/doctor.js +525 -0
- package/dist/tests/bench/driver.js +401 -0
- package/dist/tests/bench/driver.test.js +584 -0
- package/dist/tests/bench/environment.js +233 -0
- package/dist/tests/bench/environment.test.js +199 -0
- package/dist/tests/bench/evolve-metrics.js +179 -0
- package/dist/tests/bench/evolve-metrics.test.js +187 -0
- package/dist/tests/bench/evolve.js +647 -0
- package/dist/tests/bench/evolve.test.js +624 -0
- package/dist/tests/bench/failure-modes.test.js +349 -0
- package/dist/tests/bench/feedback-integrity.test.js +457 -0
- package/dist/tests/bench/leakage.test.js +228 -0
- package/dist/tests/bench/learning-curve.test.js +134 -0
- package/dist/tests/bench/metrics.js +2395 -0
- package/dist/tests/bench/metrics.test.js +1150 -0
- package/dist/tests/bench/no-os-tmpdir-invariant.test.js +43 -0
- package/dist/tests/bench/opencode-config.js +194 -0
- package/dist/tests/bench/opencode-config.test.js +370 -0
- package/dist/tests/bench/report.js +1885 -0
- package/dist/tests/bench/report.test.js +1038 -0
- package/dist/tests/bench/run-config.js +355 -0
- package/dist/tests/bench/run-config.test.js +298 -0
- package/dist/tests/bench/run-curate-test.js +32 -0
- package/dist/tests/bench/run-failing-tasks.js +56 -0
- package/dist/tests/bench/run-full-bench.js +51 -0
- package/dist/tests/bench/run-items36-targeted.js +69 -0
- package/dist/tests/bench/run-nano-quick.js +42 -0
- package/dist/tests/bench/run-waveg-targeted.js +62 -0
- package/dist/tests/bench/runner.js +699 -0
- package/dist/tests/bench/runner.test.js +958 -0
- package/dist/tests/bench/search-bridge.test.js +331 -0
- package/dist/tests/bench/tmp.js +131 -0
- package/dist/tests/bench/trajectory.js +116 -0
- package/dist/tests/bench/trajectory.test.js +127 -0
- package/dist/tests/bench/verifier.js +114 -0
- package/dist/tests/bench/verifier.test.js +118 -0
- package/dist/tests/bench/workflow-evaluator.js +557 -0
- package/dist/tests/bench/workflow-evaluator.test.js +421 -0
- package/dist/tests/bench/workflow-spec.js +345 -0
- package/dist/tests/bench/workflow-spec.test.js +363 -0
- package/dist/tests/bench/workflow-trace.js +472 -0
- package/dist/tests/bench/workflow-trace.test.js +254 -0
- package/dist/tests/benchmark-search-quality.js +536 -0
- package/dist/tests/benchmark-suite.js +1441 -0
- package/dist/tests/capture-cli.test.js +112 -0
- package/dist/tests/cli-errors.test.js +204 -0
- package/dist/tests/commands/events.test.js +370 -0
- package/dist/tests/commands/history.test.js +418 -0
- package/dist/tests/commands/import.test.js +103 -0
- package/dist/tests/commands/proposal-cli.test.js +209 -0
- package/dist/tests/commands/reflect-propose-cli.test.js +333 -0
- package/dist/tests/commands/remember.test.js +97 -0
- package/dist/tests/commands/scope-flags.test.js +300 -0
- package/dist/tests/commands/search.test.js +537 -0
- package/dist/tests/commands/show-indexer-parity.test.js +117 -0
- package/dist/tests/commands/show.test.js +294 -0
- package/dist/tests/common.test.js +266 -0
- package/dist/tests/completions.test.js +142 -0
- package/dist/tests/config-cli.test.js +193 -0
- package/dist/tests/config-llm-features.test.js +139 -0
- package/dist/tests/config.test.js +569 -0
- package/dist/tests/contracts/migration-baseline.test.js +43 -0
- package/dist/tests/contracts/reflect-propose-envelope.test.js +139 -0
- package/dist/tests/contracts/spec-helpers.js +46 -0
- package/dist/tests/contracts/v1-spec-section-11-proposal-queue.test.js +228 -0
- package/dist/tests/contracts/v1-spec-section-12-agent-config.test.js +56 -0
- package/dist/tests/contracts/v1-spec-section-13-lesson-type.test.js +34 -0
- package/dist/tests/contracts/v1-spec-section-14-llm-features.test.js +94 -0
- package/dist/tests/contracts/v1-spec-section-4-1-asset-types.test.js +39 -0
- package/dist/tests/contracts/v1-spec-section-4-2-quality-rules.test.js +44 -0
- package/dist/tests/contracts/v1-spec-section-5-configuration.test.js +47 -0
- package/dist/tests/contracts/v1-spec-section-6-orchestration.test.js +40 -0
- package/dist/tests/contracts/v1-spec-section-7-module-layout.test.js +58 -0
- package/dist/tests/contracts/v1-spec-section-8-extension-points.test.js +34 -0
- package/dist/tests/contracts/v1-spec-section-9-4-cli-surface.test.js +75 -0
- package/dist/tests/contracts/v1-spec-section-9-7-llm-agent-boundary.test.js +36 -0
- package/dist/tests/core/write-source.test.js +366 -0
- package/dist/tests/curate-command.test.js +87 -0
- package/dist/tests/db-scoring.test.js +201 -0
- package/dist/tests/db.test.js +654 -0
- package/dist/tests/distill-cli-flag.test.js +208 -0
- package/dist/tests/distill.test.js +515 -0
- package/dist/tests/docker-install.test.js +120 -0
- package/dist/tests/e2e.test.js +1419 -0
- package/dist/tests/embedder.test.js +340 -0
- package/dist/tests/embedding-model-config.test.js +379 -0
- package/dist/tests/feedback-command.test.js +172 -0
- package/dist/tests/file-context.test.js +552 -0
- package/dist/tests/fixtures/scripts/git/summarize-diff.js +9 -0
- package/dist/tests/fixtures/scripts/lint/eslint-check.js +7 -0
- package/dist/tests/fixtures/stashes/load.js +166 -0
- package/dist/tests/fixtures/stashes/load.test.js +97 -0
- package/dist/tests/fixtures/stashes/ranking-baseline/scripts/mem0-search.js +12 -0
- package/dist/tests/frontmatter.test.js +190 -0
- package/dist/tests/fts-field-weighting.test.js +254 -0
- package/dist/tests/fuzzy-search.test.js +230 -0
- package/dist/tests/git-provider-clone.test.js +45 -0
- package/dist/tests/github.test.js +161 -0
- package/dist/tests/graph-boost-ranking.test.js +305 -0
- package/dist/tests/graph-extraction.test.js +282 -0
- package/dist/tests/helpers/usage-events.js +8 -0
- package/dist/tests/index-pass-llm.test.js +161 -0
- package/dist/tests/indexer.test.js +570 -0
- package/dist/tests/info-command.test.js +166 -0
- package/dist/tests/init.test.js +69 -0
- package/dist/tests/install-script.test.js +246 -0
- package/dist/tests/integration/agent-real-profile.test.js +94 -0
- package/dist/tests/issue-36-repro.test.js +304 -0
- package/dist/tests/issues-191-194.test.js +160 -0
- package/dist/tests/lesson-lint.test.js +111 -0
- package/dist/tests/llm-client.test.js +115 -0
- package/dist/tests/llm-feature-gate.test.js +151 -0
- package/dist/tests/llm.test.js +139 -0
- package/dist/tests/lockfile.test.js +216 -0
- package/dist/tests/manifest.test.js +205 -0
- package/dist/tests/markdown.test.js +126 -0
- package/dist/tests/matchers-unit.test.js +189 -0
- package/dist/tests/memory-inference.test.js +299 -0
- package/dist/tests/merge-scoring.test.js +136 -0
- package/dist/tests/metadata.test.js +313 -0
- package/dist/tests/migration-help.test.js +89 -0
- package/dist/tests/origin-resolve.test.js +124 -0
- package/dist/tests/output-baseline.test.js +218 -0
- package/dist/tests/output-shapes-unit.test.js +478 -0
- package/dist/tests/parallel-search.test.js +272 -0
- package/dist/tests/parameter-metadata.test.js +365 -0
- package/dist/tests/paths.test.js +177 -0
- package/dist/tests/progressive-disclosure.test.js +280 -0
- package/dist/tests/proposals.test.js +279 -0
- package/dist/tests/proposed-quality.test.js +271 -0
- package/dist/tests/provider-registry.test.js +32 -0
- package/dist/tests/ranking-regression.test.js +548 -0
- package/dist/tests/reflect-propose.test.js +455 -0
- package/dist/tests/registry-build-index.test.js +394 -0
- package/dist/tests/registry-cli.test.js +290 -0
- package/dist/tests/registry-index-v2.test.js +430 -0
- package/dist/tests/registry-install.test.js +728 -0
- package/dist/tests/registry-providers/parity.test.js +189 -0
- package/dist/tests/registry-providers/skills-sh.test.js +309 -0
- package/dist/tests/registry-providers/static-index.test.js +238 -0
- package/dist/tests/registry-resolve.test.js +126 -0
- package/dist/tests/registry-search.test.js +923 -0
- package/dist/tests/remember-frontmatter.test.js +378 -0
- package/dist/tests/remember-unit.test.js +123 -0
- package/dist/tests/ripgrep-install.test.js +251 -0
- package/dist/tests/ripgrep-resolve.test.js +108 -0
- package/dist/tests/ripgrep.test.js +163 -0
- package/dist/tests/save-command.test.js +94 -0
- package/dist/tests/save-trust-qa-fixes.test.js +270 -0
- package/dist/tests/scoring-pipeline.test.js +648 -0
- package/dist/tests/search-include-proposed-cli.test.js +118 -0
- package/dist/tests/self-update.test.js +442 -0
- package/dist/tests/semantic-search-e2e.test.js +512 -0
- package/dist/tests/semantic-status.test.js +471 -0
- package/dist/tests/setup-run.integration.js +877 -0
- package/dist/tests/setup-wizard.test.js +198 -0
- package/dist/tests/setup.test.js +131 -0
- package/dist/tests/source-add.test.js +11 -0
- package/dist/tests/source-clone.test.js +254 -0
- package/dist/tests/source-manage.test.js +366 -0
- package/dist/tests/source-providers/filesystem.test.js +82 -0
- package/dist/tests/source-providers/git.test.js +252 -0
- package/dist/tests/source-providers/website.test.js +128 -0
- package/dist/tests/source-qa-fixes.test.js +286 -0
- package/dist/tests/source-registry.test.js +350 -0
- package/dist/tests/source-resolve.test.js +100 -0
- package/dist/tests/source-source.test.js +281 -0
- package/dist/tests/source.test.js +533 -0
- package/dist/tests/tar-utils-scan.test.js +73 -0
- package/dist/tests/toggle-components.test.js +73 -0
- package/dist/tests/usage-telemetry.test.js +265 -0
- package/dist/tests/utility-scoring.test.js +558 -0
- package/dist/tests/vault-load-error.test.js +78 -0
- package/dist/tests/vault-qa-fixes.test.js +194 -0
- package/dist/tests/vault.test.js +429 -0
- package/dist/tests/vector-search.test.js +608 -0
- package/dist/tests/walker.test.js +252 -0
- package/dist/tests/wave2-cluster-bc.test.js +228 -0
- package/dist/tests/wave2-cluster-d.test.js +180 -0
- package/dist/tests/wave2-cluster-e.test.js +179 -0
- package/dist/tests/wiki-qa-fixes.test.js +270 -0
- package/dist/tests/wiki.test.js +529 -0
- package/dist/tests/workflow-cli.test.js +271 -0
- package/dist/tests/workflow-markdown.test.js +171 -0
- package/dist/tests/workflow-path-escape.test.js +132 -0
- package/dist/tests/workflow-qa-fixes.test.js +395 -0
- package/dist/tests/workflows/indexer-rejection.test.js +213 -0
- package/docs/README.md +8 -0
- package/docs/migration/release-notes/0.7.0.md +244 -0
- package/package.json +2 -2
- package/dist/core/warn.js +0 -27
- package/dist/output/shapes.js +0 -212
- package/dist/output/text.js +0 -520
- /package/dist/{commands → src/commands}/completions.js +0 -0
- /package/dist/{commands → src/commands}/curate.js +0 -0
- /package/dist/{commands → src/commands}/info.js +0 -0
- /package/dist/{commands → src/commands}/init.js +0 -0
- /package/dist/{commands → src/commands}/install-audit.js +0 -0
- /package/dist/{commands → src/commands}/migration-help.js +0 -0
- /package/dist/{commands → src/commands}/source-clone.js +0 -0
- /package/dist/{commands → src/commands}/vault.js +0 -0
- /package/dist/{core → src/core}/asset-registry.js +0 -0
- /package/dist/{core → src/core}/frontmatter.js +0 -0
- /package/dist/{core → src/core}/markdown.js +0 -0
- /package/dist/{core → src/core}/paths.js +0 -0
- /package/dist/{indexer → src/indexer}/manifest.js +0 -0
- /package/dist/{indexer → src/indexer}/search-fields.js +0 -0
- /package/dist/{indexer → src/indexer}/semantic-status.js +0 -0
- /package/dist/{indexer → src/indexer}/usage-events.js +0 -0
- /package/dist/{indexer → src/indexer}/walker.js +0 -0
- /package/dist/{llm → src/llm}/embedder.js +0 -0
- /package/dist/{llm → src/llm}/embedders/cache.js +0 -0
- /package/dist/{llm → src/llm}/embedders/local.js +0 -0
- /package/dist/{llm → src/llm}/embedders/types.js +0 -0
- /package/dist/{llm → src/llm}/metadata-enhance.js +0 -0
- /package/dist/{output → src/output}/context.js +0 -0
- /package/dist/{registry → src/registry}/create-provider-registry.js +0 -0
- /package/dist/{registry → src/registry}/origin-resolve.js +0 -0
- /package/dist/{registry → src/registry}/providers/index.js +0 -0
- /package/dist/{registry → src/registry}/providers/skills-sh.js +0 -0
- /package/dist/{registry → src/registry}/providers/types.js +0 -0
- /package/dist/{registry → src/registry}/types.js +0 -0
- /package/dist/{setup → src/setup}/detect.js +0 -0
- /package/dist/{setup → src/setup}/ripgrep-install.js +0 -0
- /package/dist/{setup → src/setup}/ripgrep-resolve.js +0 -0
- /package/dist/{setup → src/setup}/steps.js +0 -0
- /package/dist/{sources → src/sources}/include.js +0 -0
- /package/dist/{sources → src/sources}/provider-factory.js +0 -0
- /package/dist/{sources → src/sources}/provider.js +0 -0
- /package/dist/{sources → src/sources}/providers/filesystem.js +0 -0
- /package/dist/{sources → src/sources}/providers/index.js +0 -0
- /package/dist/{sources → src/sources}/providers/install-types.js +0 -0
- /package/dist/{sources → src/sources}/providers/npm.js +0 -0
- /package/dist/{sources → src/sources}/providers/provider-utils.js +0 -0
- /package/dist/{sources → src/sources}/providers/sync-from-ref.js +0 -0
- /package/dist/{sources → src/sources}/providers/tar-utils.js +0 -0
- /package/dist/{sources → src/sources}/providers/website.js +0 -0
- /package/dist/{sources → src/sources}/resolve.js +0 -0
- /package/dist/{sources → src/sources}/types.js +0 -0
- /package/dist/{templates → src/templates}/wiki-templates.js +0 -0
- /package/dist/{version.js → src/version.js} +0 -0
- /package/dist/{workflows → src/workflows}/authoring.js +0 -0
- /package/dist/{workflows → src/workflows}/cli.js +0 -0
- /package/dist/{workflows → src/workflows}/db.js +0 -0
- /package/dist/{workflows → src/workflows}/document-cache.js +0 -0
- /package/dist/{workflows → src/workflows}/parser.js +0 -0
- /package/dist/{workflows → src/workflows}/renderer.js +0 -0
- /package/dist/{workflows → src/workflows}/schema.js +0 -0
- /package/dist/{workflows → src/workflows}/validator.js +0 -0
|
@@ -0,0 +1,254 @@
|
|
|
1
|
+
/**
 * Tests for tests/bench/workflow-trace.ts (issue #254).
 */
|
|
4
|
+
import { describe, expect, test } from "bun:test";
|
|
5
|
+
import { MAX_EVENT_BYTES, MAX_EVENT_COUNT, MAX_STDOUT_SCAN_BYTES, normalizeRunToTrace, } from "./workflow-trace";
|
|
6
|
+
/**
 * Build a run-result fixture to feed into `normalizeRunToTrace`.
 *
 * The object literal is created anew on every call, so the nested defaults
 * (`tokens`, `trajectory`, `events`, `assetsLoaded`) are never shared
 * between two fixtures.
 *
 * @param {object} [overrides] - Top-level fields to replace. They are spread
 *   last, so they win over the defaults (shallow merge only).
 * @returns {object} A passing "akm"-arm run with no events unless overridden.
 */
function makeRun(overrides = {}) {
    return {
        schemaVersion: 1,
        taskId: "deploy-docker",
        arm: "akm",
        seed: 42,
        model: "anthropic/claude-opus-4-7",
        outcome: "pass",
        tokens: { input: 0, output: 0 },
        tokenMeasurement: "parsed",
        wallclockMs: 1234,
        trajectory: { correctAssetLoaded: null, feedbackRecorded: null },
        events: [],
        verifierStdout: "",
        verifierExitCode: 0,
        assetsLoaded: [],
        ...overrides,
    };
}
|
|
25
|
+
/**
 * Build a single raw event record for a run fixture's `events` array.
 *
 * @param {string} eventType - Raw event verb, e.g. "search", "show", "feedback".
 * @param {string} ts - Timestamp string stored verbatim on the record.
 * @param {object} [extra] - Additional fields (the tests pass `ref` and
 *   `metadata`). Spread last, so it can also override the defaults.
 * @returns {object} Event record with `schemaVersion: 1` and `id: 0` defaults.
 */
function ev(eventType, ts, extra = {}) {
    return {
        schemaVersion: 1,
        id: 0,
        ts,
        eventType,
        ...extra,
    };
}
|
|
34
|
+
// Structured AKM events on the run envelope are the input under test here.
describe("normalizeRunToTrace — AKM event input", () => {
    test("maps search/show/feedback events to typed trace events with stable order", () => {
        // Input is deliberately not in timestamp order (show precedes search);
        // the expected trace below is.
        const run = makeRun({
            events: [
                ev("show", "2026-04-27T10:00:01.000Z", { ref: "skill:deploy" }),
                ev("search", "2026-04-27T10:00:00.000Z", { metadata: { query: "deploy docker" } }),
                ev("feedback", "2026-04-27T10:00:02.000Z", { ref: "skill:deploy", metadata: { vote: 1 } }),
            ],
        });
        const trace = normalizeRunToTrace(run);
        // Envelope fields are carried over from the run.
        expect(trace.schemaVersion).toBe(1);
        expect(trace.taskId).toBe("deploy-docker");
        expect(trace.arm).toBe("akm");
        expect(trace.seed).toBe(42);
        expect(trace.truncated).toBe(false);
        // `verifier_run` is auto-derived from RunResult.verifierExitCode, so we
        // expect 4 events: search, show, feedback, verifier.
        const types = trace.events.map((e) => e.type);
        expect(types).toEqual(["akm_search", "akm_show", "akm_feedback", "verifier_run"]);
        expect(trace.events[0].source).toBe("akm_events");
        expect(trace.events[0].query).toBe("deploy docker");
        expect(trace.events[1].assetRef).toBe("skill:deploy");
        expect(trace.events[2].assetRef).toBe("skill:deploy");
        expect(trace.events[3].source).toBe("verifier");
        expect(trace.events[3].exitCode).toBe(0);
        // Ids are 0..n-1, monotonic.
        for (let i = 0; i < trace.events.length; i += 1) {
            expect(trace.events[i].id).toBe(i);
        }
    });
    test("ignores unrelated AKM event types (add/remove/update)", () => {
        const run = makeRun({
            events: [
                ev("add", "2026-04-27T10:00:00.000Z", { ref: "skill:foo" }),
                ev("remove", "2026-04-27T10:00:01.000Z", { ref: "skill:bar" }),
                ev("search", "2026-04-27T10:00:02.000Z", { metadata: { query: "x" } }),
            ],
        });
        const trace = normalizeRunToTrace(run);
        const types = trace.events.map((e) => e.type);
        // Only the search survives, followed by the derived verifier event.
        expect(types).toEqual(["akm_search", "verifier_run"]);
    });
    test("records verifier_run with exitCode from the run envelope", () => {
        const run = makeRun({ verifierExitCode: 1, outcome: "fail" });
        const trace = normalizeRunToTrace(run);
        const verifier = trace.events.find((e) => e.type === "verifier_run");
        expect(verifier).toBeDefined();
        expect(verifier?.exitCode).toBe(1);
        expect(verifier?.source).toBe("verifier");
    });
});
|
|
85
|
+
// Events recovered by scanning the agent's stdout (passed as `agentStdout`).
describe("normalizeRunToTrace — stdout / tool-call input", () => {
    test("detects akm CLI invocations from agent stdout", () => {
        const stdout = [
            'tool: akm search "deploy docker"',
            "tool: akm show skill:deploy",
            "tool: akm feedback +1 skill:deploy",
        ].join("\n");
        const run = makeRun();
        const trace = normalizeRunToTrace(run, { agentStdout: stdout });
        // Filter by source so the derived verifier_run event is excluded.
        const cliEvents = trace.events.filter((e) => e.source === "agent_stdout");
        expect(cliEvents.map((e) => e.type)).toEqual(["akm_search", "akm_show", "akm_feedback"]);
        expect(cliEvents[0].query).toBe("deploy docker");
        expect(cliEvents[1].assetRef).toBe("skill:deploy");
        expect(cliEvents[2].assetRef).toBe("skill:deploy");
    });
    test("detects JSON tool-call shape", () => {
        const stdout = '{"command":"akm","args":["show","skill:foo"]}';
        const run = makeRun();
        const trace = normalizeRunToTrace(run, { agentStdout: stdout });
        const showEv = trace.events.find((e) => e.type === "akm_show");
        expect(showEv).toBeDefined();
        expect(showEv?.assetRef).toBe("skill:foo");
        expect(showEv?.source).toBe("agent_stdout");
    });
    test("AKM events sort before stdout-derived events when both have the same verb", () => {
        // One search from each source; the structured one must come first.
        const run = makeRun({
            events: [ev("search", "2026-04-27T10:00:00.000Z", { metadata: { query: "structured" } })],
        });
        const trace = normalizeRunToTrace(run, { agentStdout: 'akm search "stdout"' });
        const searches = trace.events.filter((e) => e.type === "akm_search");
        expect(searches.length).toBe(2);
        expect(searches[0].source).toBe("akm_events");
        expect(searches[1].source).toBe("agent_stdout");
    });
});
|
|
120
|
+
// Events derived from the `workspaceWrites` and `harness` options.
describe("normalizeRunToTrace — workspace-write detection", () => {
    test("first workspace path becomes first_workspace_write, rest become workspace_write", () => {
        const run = makeRun();
        const trace = normalizeRunToTrace(run, {
            workspaceWrites: ["src/a.ts", "src/b.ts", "src/c.ts"],
        });
        const writes = trace.events.filter((e) => e.type === "first_workspace_write" || e.type === "workspace_write");
        expect(writes.length).toBe(3);
        // Input order is preserved; only the first path gets the special type.
        expect(writes[0].type).toBe("first_workspace_write");
        expect(writes[0].filePath).toBe("src/a.ts");
        expect(writes[1].type).toBe("workspace_write");
        expect(writes[1].filePath).toBe("src/b.ts");
        expect(writes[2].type).toBe("workspace_write");
        expect(writes[2].filePath).toBe("src/c.ts");
        for (const w of writes) {
            expect(w.source).toBe("filesystem_diff");
        }
    });
    test("no workspace writes => no workspace events", () => {
        const run = makeRun();
        const trace = normalizeRunToTrace(run, { workspaceWrites: [] });
        const writes = trace.events.filter((e) => e.type === "first_workspace_write" || e.type === "workspace_write");
        expect(writes.length).toBe(0);
    });
    test("harness lifecycle markers emit agent_started and agent_finished", () => {
        const run = makeRun();
        const trace = normalizeRunToTrace(run, {
            harness: {
                agentStartedTs: "2026-04-27T09:59:59.000Z",
                agentFinishedTs: "2026-04-27T10:00:30.000Z",
            },
        });
        const types = trace.events.map((e) => e.type);
        // The lifecycle markers must bracket every other event in the trace.
        expect(types[0]).toBe("agent_started");
        expect(types[types.length - 1]).toBe("agent_finished");
    });
});
|
|
157
|
+
// Garbage, oversized and empty inputs: the normalizer must stay bounded and
// must not throw.
describe("normalizeRunToTrace — malformed/noisy input", () => {
    test("ignores malformed events instead of throwing", () => {
        const malformed = [
            null,
            undefined,
            42,
            "string-not-an-event",
            { eventType: 123 }, // eventType not a string
            { eventType: "search" }, // no ts — still valid, mapped
        ];
        const run = makeRun({
            // Garbage on purpose: most entries are not event objects at all.
            events: malformed,
        });
        const trace = normalizeRunToTrace(run);
        // The only valid event is the trailing { eventType: "search" } (it has no
        // ts so it sorts after the synthesised verifier_run sentinel), plus the
        // verifier_run derived from RunResult. Both sides are sorted so the
        // comparison does not depend on that ordering.
        const types = trace.events.map((e) => e.type).sort();
        expect(types).toEqual(["akm_search", "verifier_run"].sort());
        expect(trace.events.length).toBe(2);
    });
    test("clamps oversized fields to MAX_EVENT_BYTES UTF-8 bytes and flags bytesTruncated", () => {
        // A multi-byte character makes the UTF-8 byte length exceed the cap
        // even though the repeat count equals MAX_EVENT_BYTES.
        const giantQuery = "😀".repeat(MAX_EVENT_BYTES);
        const run = makeRun({
            events: [ev("search", "2026-04-27T10:00:00.000Z", { metadata: { query: giantQuery } })],
        });
        const trace = normalizeRunToTrace(run);
        const search = trace.events.find((e) => e.type === "akm_search");
        // Fail with a clear assertion rather than a TypeError if the event is missing.
        expect(search).toBeDefined();
        const queryBytes = Buffer.byteLength(search?.query ?? "", "utf8");
        expect(queryBytes).toBeLessThanOrEqual(MAX_EVENT_BYTES);
        expect(queryBytes).toBeLessThan(Buffer.byteLength(giantQuery, "utf8"));
        expect(search?.bytesTruncated).toBe(true);
    });
    test("does not flag bytesTruncated when a field already fits the byte cap exactly", () => {
        // Single-byte characters: exactly MAX_EVENT_BYTES bytes, i.e. at the boundary.
        const exactQuery = "x".repeat(MAX_EVENT_BYTES);
        const run = makeRun({
            events: [ev("search", "2026-04-27T10:00:00.000Z", { metadata: { query: exactQuery } })],
        });
        const trace = normalizeRunToTrace(run);
        const search = trace.events.find((e) => e.type === "akm_search");
        expect(search).toBeDefined();
        expect(search?.query).toBe(exactQuery);
        expect(search?.bytesTruncated).toBeUndefined();
    });
    test("caps total event count at MAX_EVENT_COUNT and surfaces a warning", () => {
        const events = [];
        for (let i = 0; i < MAX_EVENT_COUNT + 50; i += 1) {
            // Pad timestamps so they sort lexicographically.
            const hours = String(Math.floor(i / 60) % 24).padStart(2, "0");
            const minutes = String(i % 60).padStart(2, "0");
            const millis = String(i).padStart(6, "0").slice(-3);
            const ts = `2026-04-27T${hours}:${minutes}:00.${millis}Z`;
            events.push(ev("search", ts, { metadata: { query: `q-${i}` } }));
        }
        const run = makeRun({ events });
        const warnings = [];
        const trace = normalizeRunToTrace(run, { warnings });
        expect(trace.events.length).toBe(MAX_EVENT_COUNT);
        expect(trace.truncated).toBe(true);
        expect(warnings.some((w) => w.includes("workflow trace truncated"))).toBe(true);
    });
    test("clamps oversized stdout and surfaces a warning instead of OOM", () => {
        // A single pathological `akm show` line whose argument is four times
        // MAX_EVENT_BYTES: larger than the per-field cap, and intended to stay
        // below MAX_STDOUT_SCAN_BYTES so the stdout-level truncation does not
        // fire first.
        const giantLine = "akm show ".concat("y".repeat(MAX_EVENT_BYTES * 4));
        const run = makeRun();
        // NOTE(review): the title promises a warning, but nothing below asserts
        // on `warnings` — confirm whether field-level clamping should emit one.
        const warnings = [];
        const trace = normalizeRunToTrace(run, { agentStdout: giantLine, warnings });
        const showEv = trace.events.find((e) => e.type === "akm_show");
        expect(showEv).toBeDefined();
        // assetRef must be clamped — it cannot be 4 * MAX_EVENT_BYTES. Measured
        // in UTF-8 bytes, matching the other byte-cap tests in this suite.
        expect(Buffer.byteLength(showEv?.assetRef ?? "", "utf8")).toBeLessThanOrEqual(MAX_EVENT_BYTES);
        expect(showEv?.bytesTruncated).toBe(true);
    });
    test("stdout larger than MAX_STDOUT_SCAN_BYTES is truncated with a warning", () => {
        // Build a stdout > scan cap. We want this to actually exceed the cap so the
        // truncation branch fires, but we keep it minimally larger to keep the test fast.
        const overshoot = 1024;
        const huge = "z".repeat(MAX_STDOUT_SCAN_BYTES + overshoot);
        const run = makeRun();
        const warnings = [];
        normalizeRunToTrace(run, { agentStdout: huge, warnings });
        expect(warnings.some((w) => w.includes("workflow trace stdout truncated"))).toBe(true);
    });
    test("no events, no stdout, no writes => only verifier_run is produced", () => {
        const trace = normalizeRunToTrace(makeRun());
        expect(trace.events.length).toBe(1);
        expect(trace.events[0].type).toBe("verifier_run");
    });
    test("identical inputs produce identical traces (deterministic)", () => {
        const run = makeRun({
            events: [
                ev("show", "2026-04-27T10:00:01.000Z", { ref: "skill:a" }),
                ev("search", "2026-04-27T10:00:00.000Z", { metadata: { query: "q" } }),
            ],
        });
        // Same run and same stdout twice: the serialised traces must match exactly.
        const a = normalizeRunToTrace(run, { agentStdout: "akm show skill:b" });
        const b = normalizeRunToTrace(run, { agentStdout: "akm show skill:b" });
        expect(JSON.stringify(a)).toBe(JSON.stringify(b));
    });
});
|