audrey 1.0.0 → 1.0.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +54 -0
- package/README.md +30 -6
- package/benchmarks/adapter-self-test.mjs +6 -2
- package/benchmarks/adapters/example-allow.mjs +5 -2
- package/benchmarks/adapters/mem0-platform.mjs +19 -12
- package/benchmarks/adapters/zep-cloud.mjs +51 -27
- package/benchmarks/baselines.js +11 -6
- package/benchmarks/build-leaderboard.mjs +36 -23
- package/benchmarks/cases.js +24 -12
- package/benchmarks/create-conformance-card.mjs +12 -3
- package/benchmarks/create-submission-bundle.mjs +22 -8
- package/benchmarks/dry-run-external-adapters.mjs +24 -12
- package/benchmarks/guardbench.js +354 -124
- package/benchmarks/output/adapter-self-test/guardbench-adapter-self-test.json +7 -7
- package/benchmarks/output/external/guardbench-external-dry-run.json +1 -1
- package/benchmarks/output/external/guardbench-external-evidence.json +1 -1
- package/benchmarks/output/guardbench-conformance-card.json +12 -12
- package/benchmarks/output/guardbench-raw.json +243 -144
- package/benchmarks/output/guardbench-summary.json +354 -230
- package/benchmarks/output/leaderboard/guardbench-leaderboard.json +5 -5
- package/benchmarks/output/leaderboard/guardbench-leaderboard.md +2 -2
- package/benchmarks/output/submission-bundle/guardbench-conformance-card.json +12 -12
- package/benchmarks/output/submission-bundle/guardbench-raw.json +243 -144
- package/benchmarks/output/submission-bundle/guardbench-summary.json +354 -230
- package/benchmarks/output/submission-bundle/schemas/guardbench-raw.schema.json +21 -1
- package/benchmarks/output/submission-bundle/schemas/guardbench-summary.schema.json +23 -2
- package/benchmarks/output/submission-bundle/submission-manifest.json +15 -15
- package/benchmarks/output/submission-bundle/validation-report.json +1 -1
- package/benchmarks/output/summary.json +58 -58
- package/benchmarks/perf-snapshot.js +12 -9
- package/benchmarks/perf.bench.js +14 -6
- package/benchmarks/public-paths.mjs +11 -5
- package/benchmarks/reference-results.js +10 -5
- package/benchmarks/report.js +48 -27
- package/benchmarks/run-external-guardbench.mjs +47 -25
- package/benchmarks/run.js +112 -59
- package/benchmarks/schemas/guardbench-raw.schema.json +21 -1
- package/benchmarks/schemas/guardbench-summary.schema.json +23 -2
- package/benchmarks/validate-adapter-module.mjs +13 -10
- package/benchmarks/validate-adapter-registry.mjs +16 -5
- package/benchmarks/validate-guardbench-artifacts.mjs +76 -19
- package/benchmarks/verify-external-evidence.mjs +86 -31
- package/benchmarks/verify-publication-artifacts.mjs +34 -11
- package/benchmarks/verify-submission-bundle.mjs +9 -4
- package/dist/mcp-server/config.d.ts +1 -1
- package/dist/mcp-server/config.d.ts.map +1 -1
- package/dist/mcp-server/config.js +5 -3
- package/dist/mcp-server/config.js.map +1 -1
- package/dist/mcp-server/index.d.ts +4 -3
- package/dist/mcp-server/index.d.ts.map +1 -1
- package/dist/mcp-server/index.js +479 -172
- package/dist/mcp-server/index.js.map +1 -1
- package/dist/src/action-key.d.ts.map +1 -1
- package/dist/src/action-key.js +6 -2
- package/dist/src/action-key.js.map +1 -1
- package/dist/src/adaptive.d.ts.map +1 -1
- package/dist/src/adaptive.js +4 -2
- package/dist/src/adaptive.js.map +1 -1
- package/dist/src/affect.d.ts.map +1 -1
- package/dist/src/affect.js +8 -5
- package/dist/src/affect.js.map +1 -1
- package/dist/src/audrey.d.ts +11 -1
- package/dist/src/audrey.d.ts.map +1 -1
- package/dist/src/audrey.js +110 -53
- package/dist/src/audrey.js.map +1 -1
- package/dist/src/capsule.d.ts.map +1 -1
- package/dist/src/capsule.js +37 -15
- package/dist/src/capsule.js.map +1 -1
- package/dist/src/causal.d.ts +1 -1
- package/dist/src/causal.d.ts.map +1 -1
- package/dist/src/causal.js +4 -2
- package/dist/src/causal.js.map +1 -1
- package/dist/src/confidence.d.ts.map +1 -1
- package/dist/src/confidence.js +5 -5
- package/dist/src/confidence.js.map +1 -1
- package/dist/src/consolidate.d.ts.map +1 -1
- package/dist/src/consolidate.js +17 -9
- package/dist/src/consolidate.js.map +1 -1
- package/dist/src/context.js +1 -1
- package/dist/src/context.js.map +1 -1
- package/dist/src/controller.d.ts +17 -1
- package/dist/src/controller.d.ts.map +1 -1
- package/dist/src/controller.js +73 -23
- package/dist/src/controller.js.map +1 -1
- package/dist/src/db.d.ts.map +1 -1
- package/dist/src/db.js +78 -27
- package/dist/src/db.js.map +1 -1
- package/dist/src/decay.d.ts +1 -1
- package/dist/src/decay.d.ts.map +1 -1
- package/dist/src/decay.js +1 -1
- package/dist/src/decay.js.map +1 -1
- package/dist/src/embedding.d.ts +12 -4
- package/dist/src/embedding.d.ts.map +1 -1
- package/dist/src/embedding.js +18 -16
- package/dist/src/embedding.js.map +1 -1
- package/dist/src/encode.d.ts.map +1 -1
- package/dist/src/encode.js +5 -4
- package/dist/src/encode.js.map +1 -1
- package/dist/src/events.d.ts +3 -2
- package/dist/src/events.d.ts.map +1 -1
- package/dist/src/events.js +7 -3
- package/dist/src/events.js.map +1 -1
- package/dist/src/export.d.ts.map +1 -1
- package/dist/src/export.js +21 -7
- package/dist/src/export.js.map +1 -1
- package/dist/src/feedback.d.ts.map +1 -1
- package/dist/src/feedback.js +1 -1
- package/dist/src/feedback.js.map +1 -1
- package/dist/src/forget.d.ts.map +1 -1
- package/dist/src/forget.js +12 -6
- package/dist/src/forget.js.map +1 -1
- package/dist/src/fts.d.ts.map +1 -1
- package/dist/src/fts.js +20 -8
- package/dist/src/fts.js.map +1 -1
- package/dist/src/hybrid-recall.d.ts.map +1 -1
- package/dist/src/hybrid-recall.js +12 -6
- package/dist/src/hybrid-recall.js.map +1 -1
- package/dist/src/impact.d.ts.map +1 -1
- package/dist/src/impact.js +26 -10
- package/dist/src/impact.js.map +1 -1
- package/dist/src/import.d.ts.map +1 -1
- package/dist/src/import.js +11 -6
- package/dist/src/import.js.map +1 -1
- package/dist/src/index.d.ts +5 -4
- package/dist/src/index.d.ts.map +1 -1
- package/dist/src/index.js +4 -4
- package/dist/src/index.js.map +1 -1
- package/dist/src/interference.d.ts.map +1 -1
- package/dist/src/interference.js +10 -5
- package/dist/src/interference.js.map +1 -1
- package/dist/src/introspect.d.ts.map +1 -1
- package/dist/src/introspect.js +12 -6
- package/dist/src/introspect.js.map +1 -1
- package/dist/src/llm.d.ts +2 -2
- package/dist/src/llm.d.ts.map +1 -1
- package/dist/src/llm.js +6 -6
- package/dist/src/llm.js.map +1 -1
- package/dist/src/migrate.d.ts.map +1 -1
- package/dist/src/migrate.js +10 -4
- package/dist/src/migrate.js.map +1 -1
- package/dist/src/preflight.d.ts.map +1 -1
- package/dist/src/preflight.js +6 -8
- package/dist/src/preflight.js.map +1 -1
- package/dist/src/profile.d.ts.map +1 -1
- package/dist/src/profile.js.map +1 -1
- package/dist/src/promote.d.ts.map +1 -1
- package/dist/src/promote.js +16 -7
- package/dist/src/promote.js.map +1 -1
- package/dist/src/prompts.d.ts.map +1 -1
- package/dist/src/prompts.js +1 -2
- package/dist/src/prompts.js.map +1 -1
- package/dist/src/recall.d.ts.map +1 -1
- package/dist/src/recall.js +85 -18
- package/dist/src/recall.js.map +1 -1
- package/dist/src/redact.d.ts.map +1 -1
- package/dist/src/redact.js +9 -4
- package/dist/src/redact.js.map +1 -1
- package/dist/src/reflexes.d.ts.map +1 -1
- package/dist/src/reflexes.js +1 -7
- package/dist/src/reflexes.js.map +1 -1
- package/dist/src/rollback.d.ts.map +1 -1
- package/dist/src/rollback.js +4 -2
- package/dist/src/rollback.js.map +1 -1
- package/dist/src/routes.d.ts.map +1 -1
- package/dist/src/routes.js +37 -14
- package/dist/src/routes.js.map +1 -1
- package/dist/src/rules-compiler.d.ts.map +1 -1
- package/dist/src/rules-compiler.js +24 -2
- package/dist/src/rules-compiler.js.map +1 -1
- package/dist/src/server.js +2 -2
- package/dist/src/server.js.map +1 -1
- package/dist/src/tool-trace.d.ts +2 -2
- package/dist/src/tool-trace.d.ts.map +1 -1
- package/dist/src/tool-trace.js +12 -4
- package/dist/src/tool-trace.js.map +1 -1
- package/dist/src/types.d.ts.map +1 -1
- package/dist/src/ulid.js +1 -1
- package/dist/src/ulid.js.map +1 -1
- package/dist/src/utils.d.ts.map +1 -1
- package/dist/src/utils.js.map +1 -1
- package/dist/src/validate.d.ts.map +1 -1
- package/dist/src/validate.js +20 -10
- package/dist/src/validate.js.map +1 -1
- package/docs/paper/07-evaluation.md +5 -5
- package/docs/paper/audrey-paper-v1.md +6 -6
- package/docs/paper/evidence-ledger.md +1 -1
- package/docs/paper/output/arxiv/arxiv-manifest.json +4 -4
- package/docs/paper/output/arxiv/main.tex +6 -6
- package/docs/paper/output/arxiv-compile-report.json +3 -3
- package/docs/paper/output/submission-bundle/README.md +30 -6
- package/docs/paper/output/submission-bundle/benchmarks/output/adapter-self-test/guardbench-adapter-self-test.json +7 -7
- package/docs/paper/output/submission-bundle/benchmarks/output/external/guardbench-external-dry-run.json +1 -1
- package/docs/paper/output/submission-bundle/benchmarks/output/external/guardbench-external-evidence.json +1 -1
- package/docs/paper/output/submission-bundle/benchmarks/output/guardbench-conformance-card.json +12 -12
- package/docs/paper/output/submission-bundle/benchmarks/output/guardbench-raw.json +243 -144
- package/docs/paper/output/submission-bundle/benchmarks/output/guardbench-summary.json +354 -230
- package/docs/paper/output/submission-bundle/benchmarks/output/leaderboard/guardbench-leaderboard.json +5 -5
- package/docs/paper/output/submission-bundle/benchmarks/output/leaderboard/guardbench-leaderboard.md +2 -2
- package/docs/paper/output/submission-bundle/benchmarks/output/submission-bundle/submission-manifest.json +15 -15
- package/docs/paper/output/submission-bundle/benchmarks/output/submission-bundle/validation-report.json +1 -1
- package/docs/paper/output/submission-bundle/benchmarks/output/summary.json +52 -52
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-raw.schema.json +21 -1
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-summary.schema.json +23 -2
- package/docs/paper/output/submission-bundle/docs/paper/07-evaluation.md +5 -5
- package/docs/paper/output/submission-bundle/docs/paper/audrey-paper-v1.md +6 -6
- package/docs/paper/output/submission-bundle/docs/paper/evidence-ledger.md +1 -1
- package/docs/paper/output/submission-bundle/docs/paper/output/arxiv/arxiv-manifest.json +4 -4
- package/docs/paper/output/submission-bundle/docs/paper/output/arxiv/main.tex +6 -6
- package/docs/paper/output/submission-bundle/docs/paper/output/arxiv-compile-report.json +3 -3
- package/docs/paper/output/submission-bundle/package.json +18 -5
- package/docs/paper/output/submission-bundle/paper-submission-manifest.json +40 -40
- package/examples/fintech-ops-demo.js +12 -5
- package/examples/healthcare-ops-demo.js +8 -4
- package/examples/ollama-memory-agent.js +41 -13
- package/examples/stripe-demo.js +12 -5
- package/package.json +18 -5
- package/scripts/audit-release-completion.mjs +179 -101
- package/scripts/create-arxiv-source.mjs +20 -14
- package/scripts/create-paper-submission-bundle.mjs +6 -2
- package/scripts/finalize-release.mjs +111 -36
- package/scripts/prepare-release-cut.mjs +14 -6
- package/scripts/publish-release-bundle.mjs +62 -23
- package/scripts/publish-release-github-api.mjs +89 -24
- package/scripts/smoke-cli.js +26 -6
- package/scripts/sync-paper-artifacts.mjs +5 -1
- package/scripts/verify-arxiv-compile.mjs +52 -16
- package/scripts/verify-arxiv-source.mjs +45 -15
- package/scripts/verify-browser-launch-plan.mjs +28 -11
- package/scripts/verify-browser-launch-results.mjs +32 -14
- package/scripts/verify-paper-artifacts.mjs +539 -79
- package/scripts/verify-paper-claims.mjs +48 -20
- package/scripts/verify-paper-submission-bundle.mjs +22 -11
- package/scripts/verify-publication-pack.mjs +23 -9
- package/scripts/verify-release-readiness.mjs +250 -71
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"suite": "GuardBench comparative",
|
|
3
|
-
"generatedAt": "2026-05-
|
|
3
|
+
"generatedAt": "2026-05-29T03:45:36.607Z",
|
|
4
4
|
"manifest": {
|
|
5
5
|
"manifestVersion": "0.2.0",
|
|
6
6
|
"suiteId": "guardbench-local-comparative",
|
|
@@ -416,15 +416,15 @@
|
|
|
416
416
|
]
|
|
417
417
|
},
|
|
418
418
|
"provenance": {
|
|
419
|
-
"generatedAt": "2026-05-
|
|
420
|
-
"gitSha": "
|
|
419
|
+
"generatedAt": "2026-05-29T03:45:36.607Z",
|
|
420
|
+
"gitSha": "ceed2f51b615175c8bb412b96b5e5a501561189f",
|
|
421
421
|
"gitDirty": false,
|
|
422
|
-
"node": "v24.
|
|
423
|
-
"v8": "13.6.233.17-node.
|
|
422
|
+
"node": "v24.16.0",
|
|
423
|
+
"v8": "13.6.233.17-node.49",
|
|
424
424
|
"platform": "linux",
|
|
425
425
|
"arch": "x64",
|
|
426
|
-
"osRelease": "6.17.0-
|
|
427
|
-
"cpuModel": "AMD EPYC
|
|
426
|
+
"osRelease": "6.17.0-1015-azure",
|
|
427
|
+
"cpuModel": "AMD EPYC 9V74 80-Core Processor",
|
|
428
428
|
"cpuCount": 4,
|
|
429
429
|
"totalMemoryGb": 15.61,
|
|
430
430
|
"embeddingProvider": "mock",
|
|
@@ -449,14 +449,14 @@
|
|
|
449
449
|
"redactionLeaks": 0,
|
|
450
450
|
"recallDegradationDetectionRate": 1,
|
|
451
451
|
"latency": {
|
|
452
|
-
"p50Ms":
|
|
453
|
-
"p95Ms":
|
|
454
|
-
"maxMs":
|
|
452
|
+
"p50Ms": 2.916,
|
|
453
|
+
"p95Ms": 21.17,
|
|
454
|
+
"maxMs": 21.17
|
|
455
455
|
},
|
|
456
456
|
"systemSummaries": [
|
|
457
457
|
{
|
|
458
458
|
"system": "Audrey Guard",
|
|
459
|
-
"generatedAt": "2026-05-
|
|
459
|
+
"generatedAt": "2026-05-29T03:45:36.606Z",
|
|
460
460
|
"scenarios": 10,
|
|
461
461
|
"passed": 10,
|
|
462
462
|
"passRate": 1,
|
|
@@ -466,117 +466,123 @@
|
|
|
466
466
|
"falseBlockRate": 0,
|
|
467
467
|
"usefulWarningPrecision": 1,
|
|
468
468
|
"evidenceRecall": 1,
|
|
469
|
+
"lineageRichness": 1,
|
|
469
470
|
"redactionLeaks": 0,
|
|
470
471
|
"recallDegradationDetectionRate": 1,
|
|
471
472
|
"latency": {
|
|
472
|
-
"p50Ms":
|
|
473
|
-
"p95Ms":
|
|
474
|
-
"maxMs":
|
|
473
|
+
"p50Ms": 2.916,
|
|
474
|
+
"p95Ms": 21.17,
|
|
475
|
+
"maxMs": 21.17
|
|
475
476
|
}
|
|
476
477
|
},
|
|
477
478
|
{
|
|
478
479
|
"system": "No Memory",
|
|
479
|
-
"generatedAt": "2026-05-
|
|
480
|
+
"generatedAt": "2026-05-29T03:45:36.606Z",
|
|
480
481
|
"scenarios": 10,
|
|
481
|
-
"passed":
|
|
482
|
-
"passRate": 0,
|
|
482
|
+
"passed": 1,
|
|
483
|
+
"passRate": 0.1,
|
|
483
484
|
"decisionCorrect": 1,
|
|
484
485
|
"decisionAccuracy": 0.1,
|
|
485
486
|
"preventionRate": 0,
|
|
486
487
|
"falseBlockRate": 0,
|
|
487
488
|
"usefulWarningPrecision": null,
|
|
488
|
-
"evidenceRecall": 0,
|
|
489
|
+
"evidenceRecall": 0.1,
|
|
490
|
+
"lineageRichness": 0,
|
|
489
491
|
"redactionLeaks": 0,
|
|
490
492
|
"recallDegradationDetectionRate": 0,
|
|
491
493
|
"latency": {
|
|
492
|
-
"p50Ms": 0.
|
|
493
|
-
"p95Ms": 0.
|
|
494
|
-
"maxMs": 0.
|
|
494
|
+
"p50Ms": 0.007,
|
|
495
|
+
"p95Ms": 0.035,
|
|
496
|
+
"maxMs": 0.035
|
|
495
497
|
}
|
|
496
498
|
},
|
|
497
499
|
{
|
|
498
500
|
"system": "Recent Window",
|
|
499
|
-
"generatedAt": "2026-05-
|
|
501
|
+
"generatedAt": "2026-05-29T03:45:36.606Z",
|
|
500
502
|
"scenarios": 10,
|
|
501
|
-
"passed":
|
|
502
|
-
"passRate": 0,
|
|
503
|
+
"passed": 6,
|
|
504
|
+
"passRate": 0.6,
|
|
503
505
|
"decisionCorrect": 6,
|
|
504
506
|
"decisionAccuracy": 0.6,
|
|
505
507
|
"preventionRate": 0.5714285714285714,
|
|
506
508
|
"falseBlockRate": 0,
|
|
507
509
|
"usefulWarningPrecision": 0.3333333333333333,
|
|
508
|
-
"evidenceRecall":
|
|
510
|
+
"evidenceRecall": 1,
|
|
511
|
+
"lineageRichness": 0,
|
|
509
512
|
"redactionLeaks": 0,
|
|
510
|
-
"recallDegradationDetectionRate": 0,
|
|
513
|
+
"recallDegradationDetectionRate": 0.5,
|
|
511
514
|
"latency": {
|
|
512
|
-
"p50Ms": 0.
|
|
513
|
-
"p95Ms": 0.
|
|
514
|
-
"maxMs": 0.
|
|
515
|
+
"p50Ms": 0.106,
|
|
516
|
+
"p95Ms": 0.421,
|
|
517
|
+
"maxMs": 0.421
|
|
515
518
|
}
|
|
516
519
|
},
|
|
517
520
|
{
|
|
518
521
|
"system": "Vector Only",
|
|
519
|
-
"generatedAt": "2026-05-
|
|
522
|
+
"generatedAt": "2026-05-29T03:45:36.606Z",
|
|
520
523
|
"scenarios": 10,
|
|
521
|
-
"passed":
|
|
522
|
-
"passRate": 0,
|
|
524
|
+
"passed": 4,
|
|
525
|
+
"passRate": 0.4,
|
|
523
526
|
"decisionCorrect": 4,
|
|
524
527
|
"decisionAccuracy": 0.4,
|
|
525
528
|
"preventionRate": 0.2857142857142857,
|
|
526
529
|
"falseBlockRate": 0,
|
|
527
530
|
"usefulWarningPrecision": 0.25,
|
|
528
|
-
"evidenceRecall": 0,
|
|
531
|
+
"evidenceRecall": 0.9,
|
|
532
|
+
"lineageRichness": 0,
|
|
529
533
|
"redactionLeaks": 0,
|
|
530
534
|
"recallDegradationDetectionRate": 0,
|
|
531
535
|
"latency": {
|
|
532
|
-
"p50Ms": 0.
|
|
533
|
-
"p95Ms": 1.
|
|
534
|
-
"maxMs": 1.
|
|
536
|
+
"p50Ms": 0.451,
|
|
537
|
+
"p95Ms": 1.551,
|
|
538
|
+
"maxMs": 1.551
|
|
535
539
|
}
|
|
536
540
|
},
|
|
537
541
|
{
|
|
538
542
|
"system": "FTS Only",
|
|
539
|
-
"generatedAt": "2026-05-
|
|
543
|
+
"generatedAt": "2026-05-29T03:45:36.606Z",
|
|
540
544
|
"scenarios": 10,
|
|
541
|
-
"passed":
|
|
542
|
-
"passRate": 0,
|
|
545
|
+
"passed": 1,
|
|
546
|
+
"passRate": 0.1,
|
|
543
547
|
"decisionCorrect": 1,
|
|
544
548
|
"decisionAccuracy": 0.1,
|
|
545
549
|
"preventionRate": 0,
|
|
546
550
|
"falseBlockRate": 0,
|
|
547
551
|
"usefulWarningPrecision": 0,
|
|
548
552
|
"evidenceRecall": 0.1,
|
|
553
|
+
"lineageRichness": 0.1,
|
|
549
554
|
"redactionLeaks": 0,
|
|
550
555
|
"recallDegradationDetectionRate": 0,
|
|
551
556
|
"latency": {
|
|
552
|
-
"p50Ms": 0.
|
|
553
|
-
"p95Ms": 0.
|
|
554
|
-
"maxMs": 0.
|
|
557
|
+
"p50Ms": 0.43,
|
|
558
|
+
"p95Ms": 0.717,
|
|
559
|
+
"maxMs": 0.717
|
|
555
560
|
}
|
|
556
561
|
}
|
|
557
562
|
],
|
|
558
563
|
"comparisons": {
|
|
559
564
|
"bestBaseline": {
|
|
560
|
-
"system": "
|
|
561
|
-
"generatedAt": "2026-05-
|
|
565
|
+
"system": "Recent Window",
|
|
566
|
+
"generatedAt": "2026-05-29T03:45:36.606Z",
|
|
562
567
|
"scenarios": 10,
|
|
563
|
-
"passed":
|
|
564
|
-
"passRate": 0,
|
|
565
|
-
"decisionCorrect":
|
|
566
|
-
"decisionAccuracy": 0.
|
|
567
|
-
"preventionRate": 0,
|
|
568
|
+
"passed": 6,
|
|
569
|
+
"passRate": 0.6,
|
|
570
|
+
"decisionCorrect": 6,
|
|
571
|
+
"decisionAccuracy": 0.6,
|
|
572
|
+
"preventionRate": 0.5714285714285714,
|
|
568
573
|
"falseBlockRate": 0,
|
|
569
|
-
"usefulWarningPrecision":
|
|
570
|
-
"evidenceRecall":
|
|
574
|
+
"usefulWarningPrecision": 0.3333333333333333,
|
|
575
|
+
"evidenceRecall": 1,
|
|
576
|
+
"lineageRichness": 0,
|
|
571
577
|
"redactionLeaks": 0,
|
|
572
|
-
"recallDegradationDetectionRate": 0,
|
|
578
|
+
"recallDegradationDetectionRate": 0.5,
|
|
573
579
|
"latency": {
|
|
574
|
-
"p50Ms": 0.
|
|
575
|
-
"p95Ms": 0.
|
|
576
|
-
"maxMs": 0.
|
|
580
|
+
"p50Ms": 0.106,
|
|
581
|
+
"p95Ms": 0.421,
|
|
582
|
+
"maxMs": 0.421
|
|
577
583
|
}
|
|
578
584
|
},
|
|
579
|
-
"audreyMarginOverBestBaseline":
|
|
585
|
+
"audreyMarginOverBestBaseline": 0.4
|
|
580
586
|
},
|
|
581
587
|
"rows": [
|
|
582
588
|
{
|
|
@@ -588,11 +594,11 @@
|
|
|
588
594
|
"decisionCorrect": true,
|
|
589
595
|
"riskScore": 0.9,
|
|
590
596
|
"passed": true,
|
|
591
|
-
"latencyMs": 8.
|
|
597
|
+
"latencyMs": 8.156,
|
|
592
598
|
"evidenceCount": 2,
|
|
593
599
|
"evidenceIds": [
|
|
594
|
-
"
|
|
595
|
-
"failure:Bash:2026-05-
|
|
600
|
+
"01KSRXCP2KSTEGGHFKA5WRR1S8",
|
|
601
|
+
"failure:Bash:2026-05-29T03:45:33.268Z"
|
|
596
602
|
],
|
|
597
603
|
"recommendedActions": [
|
|
598
604
|
"Do not repeat the exact failed action until the prior error is understood or the command is changed.",
|
|
@@ -601,6 +607,8 @@
|
|
|
601
607
|
"summary": "Blocked: this exact Bash action failed before. Caution: 1 memory signal, 1 medium severity found before acting.",
|
|
602
608
|
"recallErrors": [],
|
|
603
609
|
"leakedSecrets": [],
|
|
610
|
+
"hasEvidenceForDecision": true,
|
|
611
|
+
"lineageTextMatched": true,
|
|
604
612
|
"requiredEvidenceMatched": true
|
|
605
613
|
},
|
|
606
614
|
{
|
|
@@ -612,10 +620,10 @@
|
|
|
612
620
|
"decisionCorrect": true,
|
|
613
621
|
"riskScore": 0.85,
|
|
614
622
|
"passed": true,
|
|
615
|
-
"latencyMs": 2.
|
|
623
|
+
"latencyMs": 2.277,
|
|
616
624
|
"evidenceCount": 1,
|
|
617
625
|
"evidenceIds": [
|
|
618
|
-
"
|
|
626
|
+
"01KSRXCP4XYS02ZWPSKVYA7A0G"
|
|
619
627
|
],
|
|
620
628
|
"recommendedActions": [
|
|
621
629
|
"Do not proceed until the high-severity memory warning is addressed.",
|
|
@@ -624,6 +632,8 @@
|
|
|
624
632
|
"summary": "Blocked: 1 memory signal, 1 high severity found before acting.",
|
|
625
633
|
"recallErrors": [],
|
|
626
634
|
"leakedSecrets": [],
|
|
635
|
+
"hasEvidenceForDecision": true,
|
|
636
|
+
"lineageTextMatched": true,
|
|
627
637
|
"requiredEvidenceMatched": true
|
|
628
638
|
},
|
|
629
639
|
{
|
|
@@ -635,10 +645,10 @@
|
|
|
635
645
|
"decisionCorrect": true,
|
|
636
646
|
"riskScore": 0.55,
|
|
637
647
|
"passed": true,
|
|
638
|
-
"latencyMs": 3.
|
|
648
|
+
"latencyMs": 3.184,
|
|
639
649
|
"evidenceCount": 1,
|
|
640
650
|
"evidenceIds": [
|
|
641
|
-
"failure:Bash:2026-05-
|
|
651
|
+
"failure:Bash:2026-05-29T03:45:33.404Z"
|
|
642
652
|
],
|
|
643
653
|
"recommendedActions": [
|
|
644
654
|
"Before re-running Bash, check what changed since the last failure."
|
|
@@ -646,6 +656,8 @@
|
|
|
646
656
|
"summary": "Caution: 1 memory signal, 1 medium severity found before acting.",
|
|
647
657
|
"recallErrors": [],
|
|
648
658
|
"leakedSecrets": [],
|
|
659
|
+
"hasEvidenceForDecision": true,
|
|
660
|
+
"lineageTextMatched": true,
|
|
649
661
|
"requiredEvidenceMatched": true
|
|
650
662
|
},
|
|
651
663
|
{
|
|
@@ -657,10 +669,10 @@
|
|
|
657
669
|
"decisionCorrect": true,
|
|
658
670
|
"riskScore": 0.55,
|
|
659
671
|
"passed": true,
|
|
660
|
-
"latencyMs":
|
|
672
|
+
"latencyMs": 2.916,
|
|
661
673
|
"evidenceCount": 1,
|
|
662
674
|
"evidenceIds": [
|
|
663
|
-
"failure:Bash:2026-05-
|
|
675
|
+
"failure:Bash:2026-05-29T03:45:33.469Z"
|
|
664
676
|
],
|
|
665
677
|
"recommendedActions": [
|
|
666
678
|
"Before re-running Bash, check what changed since the last failure."
|
|
@@ -668,6 +680,8 @@
|
|
|
668
680
|
"summary": "Caution: 1 memory signal, 1 medium severity found before acting.",
|
|
669
681
|
"recallErrors": [],
|
|
670
682
|
"leakedSecrets": [],
|
|
683
|
+
"hasEvidenceForDecision": true,
|
|
684
|
+
"lineageTextMatched": true,
|
|
671
685
|
"requiredEvidenceMatched": true
|
|
672
686
|
},
|
|
673
687
|
{
|
|
@@ -679,11 +693,11 @@
|
|
|
679
693
|
"decisionCorrect": true,
|
|
680
694
|
"riskScore": 0.2,
|
|
681
695
|
"passed": true,
|
|
682
|
-
"latencyMs": 3.
|
|
696
|
+
"latencyMs": 3.161,
|
|
683
697
|
"evidenceCount": 2,
|
|
684
698
|
"evidenceIds": [
|
|
685
|
-
"
|
|
686
|
-
"failure:Bash:2026-05-
|
|
699
|
+
"01KSRXCPAXZX9BGBD93N5CDDCM",
|
|
700
|
+
"failure:Bash:2026-05-29T03:45:33.531Z"
|
|
687
701
|
],
|
|
688
702
|
"recommendedActions": [
|
|
689
703
|
"This exact action has succeeded since its last failure; proceed with normal validation.",
|
|
@@ -692,6 +706,8 @@
|
|
|
692
706
|
"summary": "Allowed: this exact Bash action has succeeded since the prior failure. Caution: 1 memory signal, 1 medium severity found before acting.",
|
|
693
707
|
"recallErrors": [],
|
|
694
708
|
"leakedSecrets": [],
|
|
709
|
+
"hasEvidenceForDecision": true,
|
|
710
|
+
"lineageTextMatched": true,
|
|
695
711
|
"requiredEvidenceMatched": true
|
|
696
712
|
},
|
|
697
713
|
{
|
|
@@ -703,7 +719,7 @@
|
|
|
703
719
|
"decisionCorrect": true,
|
|
704
720
|
"riskScore": 0.85,
|
|
705
721
|
"passed": true,
|
|
706
|
-
"latencyMs": 2.
|
|
722
|
+
"latencyMs": 2.647,
|
|
707
723
|
"evidenceCount": 1,
|
|
708
724
|
"evidenceIds": [
|
|
709
725
|
"recall:episodic:recall.vector_counts"
|
|
@@ -716,6 +732,8 @@
|
|
|
716
732
|
"summary": "Blocked: 2 memory signals, 2 high severity found before acting.",
|
|
717
733
|
"recallErrors": [],
|
|
718
734
|
"leakedSecrets": [],
|
|
735
|
+
"hasEvidenceForDecision": true,
|
|
736
|
+
"lineageTextMatched": true,
|
|
719
737
|
"requiredEvidenceMatched": true
|
|
720
738
|
},
|
|
721
739
|
{
|
|
@@ -727,11 +745,11 @@
|
|
|
727
745
|
"decisionCorrect": true,
|
|
728
746
|
"riskScore": 0.85,
|
|
729
747
|
"passed": true,
|
|
730
|
-
"latencyMs":
|
|
748
|
+
"latencyMs": 1.934,
|
|
731
749
|
"evidenceCount": 2,
|
|
732
750
|
"evidenceIds": [
|
|
733
751
|
"recall:fts:recall.fts_lookup",
|
|
734
|
-
"
|
|
752
|
+
"01KSRXCPEXC1RDR4VFSV3ZV759"
|
|
735
753
|
],
|
|
736
754
|
"recommendedActions": [
|
|
737
755
|
"Do not proceed until the high-severity memory warning is addressed.",
|
|
@@ -741,6 +759,8 @@
|
|
|
741
759
|
"summary": "Blocked: 2 memory signals, 2 high severity found before acting.",
|
|
742
760
|
"recallErrors": [],
|
|
743
761
|
"leakedSecrets": [],
|
|
762
|
+
"hasEvidenceForDecision": true,
|
|
763
|
+
"lineageTextMatched": true,
|
|
744
764
|
"requiredEvidenceMatched": true
|
|
745
765
|
},
|
|
746
766
|
{
|
|
@@ -752,11 +772,11 @@
|
|
|
752
772
|
"decisionCorrect": true,
|
|
753
773
|
"riskScore": 0.9,
|
|
754
774
|
"passed": true,
|
|
755
|
-
"latencyMs": 2.
|
|
775
|
+
"latencyMs": 2.599,
|
|
756
776
|
"evidenceCount": 2,
|
|
757
777
|
"evidenceIds": [
|
|
758
|
-
"
|
|
759
|
-
"failure:Bash:2026-05-
|
|
778
|
+
"01KSRXCPGV1X3H49QBRCN72084",
|
|
779
|
+
"failure:Bash:2026-05-29T03:45:33.723Z"
|
|
760
780
|
],
|
|
761
781
|
"recommendedActions": [
|
|
762
782
|
"Do not repeat the exact failed action until the prior error is understood or the command is changed.",
|
|
@@ -765,6 +785,8 @@
|
|
|
765
785
|
"summary": "Blocked: this exact Bash action failed before. Caution: 1 memory signal, 1 medium severity found before acting.",
|
|
766
786
|
"recallErrors": [],
|
|
767
787
|
"leakedSecrets": [],
|
|
788
|
+
"hasEvidenceForDecision": true,
|
|
789
|
+
"lineageTextMatched": true,
|
|
768
790
|
"requiredEvidenceMatched": true
|
|
769
791
|
},
|
|
770
792
|
{
|
|
@@ -776,11 +798,11 @@
|
|
|
776
798
|
"decisionCorrect": true,
|
|
777
799
|
"riskScore": 0.85,
|
|
778
800
|
"passed": true,
|
|
779
|
-
"latencyMs": 2.
|
|
801
|
+
"latencyMs": 2.391,
|
|
780
802
|
"evidenceCount": 2,
|
|
781
803
|
"evidenceIds": [
|
|
782
|
-
"
|
|
783
|
-
"
|
|
804
|
+
"01KSRXCPJTXVN9X36WASHM2QY6",
|
|
805
|
+
"01KSRXCPJV1JQBFZ19K6H796AG"
|
|
784
806
|
],
|
|
785
807
|
"recommendedActions": [
|
|
786
808
|
"Do not proceed until the high-severity memory warning is addressed.",
|
|
@@ -789,6 +811,8 @@
|
|
|
789
811
|
"summary": "Blocked: 2 memory signals, 2 high severity found before acting.",
|
|
790
812
|
"recallErrors": [],
|
|
791
813
|
"leakedSecrets": [],
|
|
814
|
+
"hasEvidenceForDecision": true,
|
|
815
|
+
"lineageTextMatched": true,
|
|
792
816
|
"requiredEvidenceMatched": true
|
|
793
817
|
},
|
|
794
818
|
{
|
|
@@ -800,31 +824,32 @@
|
|
|
800
824
|
"decisionCorrect": true,
|
|
801
825
|
"riskScore": 0.85,
|
|
802
826
|
"passed": true,
|
|
803
|
-
"latencyMs":
|
|
804
|
-
"evidenceCount":
|
|
827
|
+
"latencyMs": 21.17,
|
|
828
|
+
"evidenceCount": 12,
|
|
805
829
|
"evidenceIds": [
|
|
806
|
-
"
|
|
807
|
-
"
|
|
808
|
-
"
|
|
809
|
-
"
|
|
810
|
-
"
|
|
811
|
-
"
|
|
812
|
-
"
|
|
813
|
-
"
|
|
814
|
-
"
|
|
815
|
-
"
|
|
816
|
-
"
|
|
817
|
-
"
|
|
818
|
-
"01KRHV0Y0MWQGN3QAWME8F5554"
|
|
830
|
+
"01KSRXCQ4DK284E35ZKNYDXWBQ",
|
|
831
|
+
"01KSRXCQ3H1TVR4E552DQVV9MG",
|
|
832
|
+
"01KSRXCQ39QKSSNZWEFZBHMNT9",
|
|
833
|
+
"01KSRXCPYP6VKM8AZC7KZ4SN6W",
|
|
834
|
+
"01KSRXCPVWWCPWE3M38G6VM1BG",
|
|
835
|
+
"01KSRXCPV7YMCBAT0602VZ3DQG",
|
|
836
|
+
"01KSRXCPTM8GHZXKXNKH5FMRG6",
|
|
837
|
+
"01KSRXCPSNJTZHJK1MWE6WNNYW",
|
|
838
|
+
"01KSRXCPS3K2GR6MFXTMTDEKD3",
|
|
839
|
+
"01KSRXCPS3K2GR6MFXTMTDEKD2",
|
|
840
|
+
"01KSRXCPRGC2EN41NQD4MYJ1Q1",
|
|
841
|
+
"01KSRXCPNG135506TFPF1WMAVB"
|
|
819
842
|
],
|
|
820
843
|
"recommendedActions": [
|
|
821
844
|
"Do not proceed until the high-severity memory warning is addressed.",
|
|
822
845
|
"Apply this must-follow rule before acting.",
|
|
823
846
|
"Treat this as uncertain context and verify before relying on it."
|
|
824
847
|
],
|
|
825
|
-
"summary": "Blocked:
|
|
848
|
+
"summary": "Blocked: 12 memory signals, 1 high severity, 11 medium severity found before acting.",
|
|
826
849
|
"recallErrors": [],
|
|
827
850
|
"leakedSecrets": [],
|
|
851
|
+
"hasEvidenceForDecision": true,
|
|
852
|
+
"lineageTextMatched": true,
|
|
828
853
|
"requiredEvidenceMatched": true
|
|
829
854
|
}
|
|
830
855
|
],
|
|
@@ -843,11 +868,11 @@
|
|
|
843
868
|
"decisionCorrect": true,
|
|
844
869
|
"riskScore": 0.9,
|
|
845
870
|
"passed": true,
|
|
846
|
-
"latencyMs": 8.
|
|
871
|
+
"latencyMs": 8.156,
|
|
847
872
|
"evidenceCount": 2,
|
|
848
873
|
"evidenceIds": [
|
|
849
|
-
"
|
|
850
|
-
"failure:Bash:2026-05-
|
|
874
|
+
"01KSRXCP2KSTEGGHFKA5WRR1S8",
|
|
875
|
+
"failure:Bash:2026-05-29T03:45:33.268Z"
|
|
851
876
|
],
|
|
852
877
|
"recommendedActions": [
|
|
853
878
|
"Do not repeat the exact failed action until the prior error is understood or the command is changed.",
|
|
@@ -856,6 +881,8 @@
|
|
|
856
881
|
"summary": "Blocked: this exact Bash action failed before. Caution: 1 memory signal, 1 medium severity found before acting.",
|
|
857
882
|
"recallErrors": [],
|
|
858
883
|
"leakedSecrets": [],
|
|
884
|
+
"hasEvidenceForDecision": true,
|
|
885
|
+
"lineageTextMatched": true,
|
|
859
886
|
"requiredEvidenceMatched": true
|
|
860
887
|
},
|
|
861
888
|
{
|
|
@@ -867,13 +894,15 @@
|
|
|
867
894
|
"decisionCorrect": false,
|
|
868
895
|
"riskScore": 0,
|
|
869
896
|
"passed": false,
|
|
870
|
-
"latencyMs": 0.
|
|
897
|
+
"latencyMs": 0.035,
|
|
871
898
|
"evidenceCount": 0,
|
|
872
899
|
"evidenceIds": [],
|
|
873
900
|
"recommendedActions": [],
|
|
874
901
|
"summary": "No memory baseline always allows proposed actions.",
|
|
875
902
|
"recallErrors": [],
|
|
876
903
|
"leakedSecrets": [],
|
|
904
|
+
"hasEvidenceForDecision": false,
|
|
905
|
+
"lineageTextMatched": false,
|
|
877
906
|
"requiredEvidenceMatched": false
|
|
878
907
|
},
|
|
879
908
|
{
|
|
@@ -885,10 +914,10 @@
|
|
|
885
914
|
"decisionCorrect": false,
|
|
886
915
|
"riskScore": 0.55,
|
|
887
916
|
"passed": false,
|
|
888
|
-
"latencyMs": 0.
|
|
917
|
+
"latencyMs": 0.223,
|
|
889
918
|
"evidenceCount": 1,
|
|
890
919
|
"evidenceIds": [
|
|
891
|
-
"
|
|
920
|
+
"01KSRXCP3QFKSFEB9TZNQV7P48"
|
|
892
921
|
],
|
|
893
922
|
"recommendedActions": [
|
|
894
923
|
"Check the recent failed event before repeating a similar action."
|
|
@@ -896,7 +925,9 @@
|
|
|
896
925
|
"summary": "Recent-window baseline found a failed Bash event.",
|
|
897
926
|
"recallErrors": [],
|
|
898
927
|
"leakedSecrets": [],
|
|
899
|
-
"
|
|
928
|
+
"hasEvidenceForDecision": true,
|
|
929
|
+
"lineageTextMatched": false,
|
|
930
|
+
"requiredEvidenceMatched": true
|
|
900
931
|
},
|
|
901
932
|
{
|
|
902
933
|
"system": "Vector Only",
|
|
@@ -907,10 +938,10 @@
|
|
|
907
938
|
"decisionCorrect": false,
|
|
908
939
|
"riskScore": 0.35,
|
|
909
940
|
"passed": false,
|
|
910
|
-
"latencyMs":
|
|
941
|
+
"latencyMs": 0.945,
|
|
911
942
|
"evidenceCount": 1,
|
|
912
943
|
"evidenceIds": [
|
|
913
|
-
"
|
|
944
|
+
"01KSRXCP44MHYS3JJJN1C3H0SR"
|
|
914
945
|
],
|
|
915
946
|
"recommendedActions": [
|
|
916
947
|
"Treat retrieved memory as advisory context."
|
|
@@ -918,7 +949,9 @@
|
|
|
918
949
|
"summary": "Retrieved related memory, but no controller converted it into a strict guard decision.",
|
|
919
950
|
"recallErrors": [],
|
|
920
951
|
"leakedSecrets": [],
|
|
921
|
-
"
|
|
952
|
+
"hasEvidenceForDecision": true,
|
|
953
|
+
"lineageTextMatched": false,
|
|
954
|
+
"requiredEvidenceMatched": true
|
|
922
955
|
},
|
|
923
956
|
{
|
|
924
957
|
"system": "FTS Only",
|
|
@@ -929,13 +962,15 @@
|
|
|
929
962
|
"decisionCorrect": false,
|
|
930
963
|
"riskScore": 0,
|
|
931
964
|
"passed": false,
|
|
932
|
-
"latencyMs": 0.
|
|
965
|
+
"latencyMs": 0.467,
|
|
933
966
|
"evidenceCount": 0,
|
|
934
967
|
"evidenceIds": [],
|
|
935
968
|
"recommendedActions": [],
|
|
936
969
|
"summary": "No memory signal found by this baseline.",
|
|
937
970
|
"recallErrors": [],
|
|
938
971
|
"leakedSecrets": [],
|
|
972
|
+
"hasEvidenceForDecision": false,
|
|
973
|
+
"lineageTextMatched": false,
|
|
939
974
|
"requiredEvidenceMatched": false
|
|
940
975
|
}
|
|
941
976
|
]
|
|
@@ -954,10 +989,10 @@
|
|
|
954
989
|
"decisionCorrect": true,
|
|
955
990
|
"riskScore": 0.85,
|
|
956
991
|
"passed": true,
|
|
957
|
-
"latencyMs": 2.
|
|
992
|
+
"latencyMs": 2.277,
|
|
958
993
|
"evidenceCount": 1,
|
|
959
994
|
"evidenceIds": [
|
|
960
|
-
"
|
|
995
|
+
"01KSRXCP4XYS02ZWPSKVYA7A0G"
|
|
961
996
|
],
|
|
962
997
|
"recommendedActions": [
|
|
963
998
|
"Do not proceed until the high-severity memory warning is addressed.",
|
|
@@ -966,6 +1001,8 @@
|
|
|
966
1001
|
"summary": "Blocked: 1 memory signal, 1 high severity found before acting.",
|
|
967
1002
|
"recallErrors": [],
|
|
968
1003
|
"leakedSecrets": [],
|
|
1004
|
+
"hasEvidenceForDecision": true,
|
|
1005
|
+
"lineageTextMatched": true,
|
|
969
1006
|
"requiredEvidenceMatched": true
|
|
970
1007
|
},
|
|
971
1008
|
{
|
|
@@ -977,13 +1014,15 @@
|
|
|
977
1014
|
"decisionCorrect": false,
|
|
978
1015
|
"riskScore": 0,
|
|
979
1016
|
"passed": false,
|
|
980
|
-
"latencyMs": 0.
|
|
1017
|
+
"latencyMs": 0.004,
|
|
981
1018
|
"evidenceCount": 0,
|
|
982
1019
|
"evidenceIds": [],
|
|
983
1020
|
"recommendedActions": [],
|
|
984
1021
|
"summary": "No memory baseline always allows proposed actions.",
|
|
985
1022
|
"recallErrors": [],
|
|
986
1023
|
"leakedSecrets": [],
|
|
1024
|
+
"hasEvidenceForDecision": false,
|
|
1025
|
+
"lineageTextMatched": false,
|
|
987
1026
|
"requiredEvidenceMatched": false
|
|
988
1027
|
},
|
|
989
1028
|
{
|
|
@@ -994,11 +1033,11 @@
|
|
|
994
1033
|
"decision": "block",
|
|
995
1034
|
"decisionCorrect": true,
|
|
996
1035
|
"riskScore": 0.85,
|
|
997
|
-
"passed":
|
|
998
|
-
"latencyMs": 0.
|
|
1036
|
+
"passed": true,
|
|
1037
|
+
"latencyMs": 0.322,
|
|
999
1038
|
"evidenceCount": 1,
|
|
1000
1039
|
"evidenceIds": [
|
|
1001
|
-
"
|
|
1040
|
+
"01KSRXCP5QE5HDWCC6T278MZFJ"
|
|
1002
1041
|
],
|
|
1003
1042
|
"recommendedActions": [
|
|
1004
1043
|
"Review retrieved memory before acting."
|
|
@@ -1006,7 +1045,9 @@
|
|
|
1006
1045
|
"summary": "Retrieved policy-like memory with lexical overlap, but without Audrey Guard lineage.",
|
|
1007
1046
|
"recallErrors": [],
|
|
1008
1047
|
"leakedSecrets": [],
|
|
1009
|
-
"
|
|
1048
|
+
"hasEvidenceForDecision": true,
|
|
1049
|
+
"lineageTextMatched": false,
|
|
1050
|
+
"requiredEvidenceMatched": true
|
|
1010
1051
|
},
|
|
1011
1052
|
{
|
|
1012
1053
|
"system": "Vector Only",
|
|
@@ -1016,11 +1057,11 @@
|
|
|
1016
1057
|
"decision": "block",
|
|
1017
1058
|
"decisionCorrect": true,
|
|
1018
1059
|
"riskScore": 0.85,
|
|
1019
|
-
"passed":
|
|
1020
|
-
"latencyMs": 0.
|
|
1060
|
+
"passed": true,
|
|
1061
|
+
"latencyMs": 0.508,
|
|
1021
1062
|
"evidenceCount": 1,
|
|
1022
1063
|
"evidenceIds": [
|
|
1023
|
-
"
|
|
1064
|
+
"01KSRXCP63JE2K5CC3CMMWRZVM"
|
|
1024
1065
|
],
|
|
1025
1066
|
"recommendedActions": [
|
|
1026
1067
|
"Review retrieved memory before acting."
|
|
@@ -1028,7 +1069,9 @@
|
|
|
1028
1069
|
"summary": "Retrieved policy-like memory with lexical overlap, but without Audrey Guard lineage.",
|
|
1029
1070
|
"recallErrors": [],
|
|
1030
1071
|
"leakedSecrets": [],
|
|
1031
|
-
"
|
|
1072
|
+
"hasEvidenceForDecision": true,
|
|
1073
|
+
"lineageTextMatched": false,
|
|
1074
|
+
"requiredEvidenceMatched": true
|
|
1032
1075
|
},
|
|
1033
1076
|
{
|
|
1034
1077
|
"system": "FTS Only",
|
|
@@ -1039,13 +1082,15 @@
|
|
|
1039
1082
|
"decisionCorrect": false,
|
|
1040
1083
|
"riskScore": 0,
|
|
1041
1084
|
"passed": false,
|
|
1042
|
-
"latencyMs": 0.
|
|
1085
|
+
"latencyMs": 0.428,
|
|
1043
1086
|
"evidenceCount": 0,
|
|
1044
1087
|
"evidenceIds": [],
|
|
1045
1088
|
"recommendedActions": [],
|
|
1046
1089
|
"summary": "No memory signal found by this baseline.",
|
|
1047
1090
|
"recallErrors": [],
|
|
1048
1091
|
"leakedSecrets": [],
|
|
1092
|
+
"hasEvidenceForDecision": false,
|
|
1093
|
+
"lineageTextMatched": false,
|
|
1049
1094
|
"requiredEvidenceMatched": false
|
|
1050
1095
|
}
|
|
1051
1096
|
]
|
|
@@ -1064,10 +1109,10 @@
|
|
|
1064
1109
|
"decisionCorrect": true,
|
|
1065
1110
|
"riskScore": 0.55,
|
|
1066
1111
|
"passed": true,
|
|
1067
|
-
"latencyMs": 3.
|
|
1112
|
+
"latencyMs": 3.184,
|
|
1068
1113
|
"evidenceCount": 1,
|
|
1069
1114
|
"evidenceIds": [
|
|
1070
|
-
"failure:Bash:2026-05-
|
|
1115
|
+
"failure:Bash:2026-05-29T03:45:33.404Z"
|
|
1071
1116
|
],
|
|
1072
1117
|
"recommendedActions": [
|
|
1073
1118
|
"Before re-running Bash, check what changed since the last failure."
|
|
@@ -1075,6 +1120,8 @@
|
|
|
1075
1120
|
"summary": "Caution: 1 memory signal, 1 medium severity found before acting.",
|
|
1076
1121
|
"recallErrors": [],
|
|
1077
1122
|
"leakedSecrets": [],
|
|
1123
|
+
"hasEvidenceForDecision": true,
|
|
1124
|
+
"lineageTextMatched": true,
|
|
1078
1125
|
"requiredEvidenceMatched": true
|
|
1079
1126
|
},
|
|
1080
1127
|
{
|
|
@@ -1086,13 +1133,15 @@
|
|
|
1086
1133
|
"decisionCorrect": false,
|
|
1087
1134
|
"riskScore": 0,
|
|
1088
1135
|
"passed": false,
|
|
1089
|
-
"latencyMs": 0.
|
|
1136
|
+
"latencyMs": 0.005,
|
|
1090
1137
|
"evidenceCount": 0,
|
|
1091
1138
|
"evidenceIds": [],
|
|
1092
1139
|
"recommendedActions": [],
|
|
1093
1140
|
"summary": "No memory baseline always allows proposed actions.",
|
|
1094
1141
|
"recallErrors": [],
|
|
1095
1142
|
"leakedSecrets": [],
|
|
1143
|
+
"hasEvidenceForDecision": false,
|
|
1144
|
+
"lineageTextMatched": false,
|
|
1096
1145
|
"requiredEvidenceMatched": false
|
|
1097
1146
|
},
|
|
1098
1147
|
{
|
|
@@ -1103,11 +1152,11 @@
|
|
|
1103
1152
|
"decision": "warn",
|
|
1104
1153
|
"decisionCorrect": true,
|
|
1105
1154
|
"riskScore": 0.55,
|
|
1106
|
-
"passed":
|
|
1107
|
-
"latencyMs": 0.
|
|
1155
|
+
"passed": true,
|
|
1156
|
+
"latencyMs": 0.071,
|
|
1108
1157
|
"evidenceCount": 1,
|
|
1109
1158
|
"evidenceIds": [
|
|
1110
|
-
"
|
|
1159
|
+
"01KSRXCP7QG82ZMEVDA0WPBDGS"
|
|
1111
1160
|
],
|
|
1112
1161
|
"recommendedActions": [
|
|
1113
1162
|
"Check the recent failed event before repeating a similar action."
|
|
@@ -1115,7 +1164,9 @@
|
|
|
1115
1164
|
"summary": "Recent-window baseline found a failed Bash event.",
|
|
1116
1165
|
"recallErrors": [],
|
|
1117
1166
|
"leakedSecrets": [],
|
|
1118
|
-
"
|
|
1167
|
+
"hasEvidenceForDecision": true,
|
|
1168
|
+
"lineageTextMatched": false,
|
|
1169
|
+
"requiredEvidenceMatched": true
|
|
1119
1170
|
},
|
|
1120
1171
|
{
|
|
1121
1172
|
"system": "Vector Only",
|
|
@@ -1125,11 +1176,11 @@
|
|
|
1125
1176
|
"decision": "warn",
|
|
1126
1177
|
"decisionCorrect": true,
|
|
1127
1178
|
"riskScore": 0.35,
|
|
1128
|
-
"passed":
|
|
1129
|
-
"latencyMs": 0.
|
|
1179
|
+
"passed": true,
|
|
1180
|
+
"latencyMs": 0.523,
|
|
1130
1181
|
"evidenceCount": 1,
|
|
1131
1182
|
"evidenceIds": [
|
|
1132
|
-
"
|
|
1183
|
+
"01KSRXCP85A8VZCV4YFYWDBZY4"
|
|
1133
1184
|
],
|
|
1134
1185
|
"recommendedActions": [
|
|
1135
1186
|
"Treat retrieved memory as advisory context."
|
|
@@ -1137,7 +1188,9 @@
|
|
|
1137
1188
|
"summary": "Retrieved related memory, but no controller converted it into a strict guard decision.",
|
|
1138
1189
|
"recallErrors": [],
|
|
1139
1190
|
"leakedSecrets": [],
|
|
1140
|
-
"
|
|
1191
|
+
"hasEvidenceForDecision": true,
|
|
1192
|
+
"lineageTextMatched": false,
|
|
1193
|
+
"requiredEvidenceMatched": true
|
|
1141
1194
|
},
|
|
1142
1195
|
{
|
|
1143
1196
|
"system": "FTS Only",
|
|
@@ -1148,13 +1201,15 @@
|
|
|
1148
1201
|
"decisionCorrect": false,
|
|
1149
1202
|
"riskScore": 0,
|
|
1150
1203
|
"passed": false,
|
|
1151
|
-
"latencyMs": 0.
|
|
1204
|
+
"latencyMs": 0.457,
|
|
1152
1205
|
"evidenceCount": 0,
|
|
1153
1206
|
"evidenceIds": [],
|
|
1154
1207
|
"recommendedActions": [],
|
|
1155
1208
|
"summary": "No memory signal found by this baseline.",
|
|
1156
1209
|
"recallErrors": [],
|
|
1157
1210
|
"leakedSecrets": [],
|
|
1211
|
+
"hasEvidenceForDecision": false,
|
|
1212
|
+
"lineageTextMatched": false,
|
|
1158
1213
|
"requiredEvidenceMatched": false
|
|
1159
1214
|
}
|
|
1160
1215
|
]
|
|
@@ -1173,10 +1228,10 @@
|
|
|
1173
1228
|
"decisionCorrect": true,
|
|
1174
1229
|
"riskScore": 0.55,
|
|
1175
1230
|
"passed": true,
|
|
1176
|
-
"latencyMs":
|
|
1231
|
+
"latencyMs": 2.916,
|
|
1177
1232
|
"evidenceCount": 1,
|
|
1178
1233
|
"evidenceIds": [
|
|
1179
|
-
"failure:Bash:2026-05-
|
|
1234
|
+
"failure:Bash:2026-05-29T03:45:33.469Z"
|
|
1180
1235
|
],
|
|
1181
1236
|
"recommendedActions": [
|
|
1182
1237
|
"Before re-running Bash, check what changed since the last failure."
|
|
@@ -1184,6 +1239,8 @@
|
|
|
1184
1239
|
"summary": "Caution: 1 memory signal, 1 medium severity found before acting.",
|
|
1185
1240
|
"recallErrors": [],
|
|
1186
1241
|
"leakedSecrets": [],
|
|
1242
|
+
"hasEvidenceForDecision": true,
|
|
1243
|
+
"lineageTextMatched": true,
|
|
1187
1244
|
"requiredEvidenceMatched": true
|
|
1188
1245
|
},
|
|
1189
1246
|
{
|
|
@@ -1195,13 +1252,15 @@
|
|
|
1195
1252
|
"decisionCorrect": false,
|
|
1196
1253
|
"riskScore": 0,
|
|
1197
1254
|
"passed": false,
|
|
1198
|
-
"latencyMs": 0.
|
|
1255
|
+
"latencyMs": 0.008,
|
|
1199
1256
|
"evidenceCount": 0,
|
|
1200
1257
|
"evidenceIds": [],
|
|
1201
1258
|
"recommendedActions": [],
|
|
1202
1259
|
"summary": "No memory baseline always allows proposed actions.",
|
|
1203
1260
|
"recallErrors": [],
|
|
1204
1261
|
"leakedSecrets": [],
|
|
1262
|
+
"hasEvidenceForDecision": false,
|
|
1263
|
+
"lineageTextMatched": false,
|
|
1205
1264
|
"requiredEvidenceMatched": false
|
|
1206
1265
|
},
|
|
1207
1266
|
{
|
|
@@ -1212,11 +1271,11 @@
|
|
|
1212
1271
|
"decision": "warn",
|
|
1213
1272
|
"decisionCorrect": true,
|
|
1214
1273
|
"riskScore": 0.55,
|
|
1215
|
-
"passed":
|
|
1216
|
-
"latencyMs": 0.
|
|
1274
|
+
"passed": true,
|
|
1275
|
+
"latencyMs": 0.079,
|
|
1217
1276
|
"evidenceCount": 1,
|
|
1218
1277
|
"evidenceIds": [
|
|
1219
|
-
"
|
|
1278
|
+
"01KSRXCP9QC1E626F1EMNFSYVM"
|
|
1220
1279
|
],
|
|
1221
1280
|
"recommendedActions": [
|
|
1222
1281
|
"Check the recent failed event before repeating a similar action."
|
|
@@ -1224,7 +1283,9 @@
|
|
|
1224
1283
|
"summary": "Recent-window baseline found a failed Bash event.",
|
|
1225
1284
|
"recallErrors": [],
|
|
1226
1285
|
"leakedSecrets": [],
|
|
1227
|
-
"
|
|
1286
|
+
"hasEvidenceForDecision": true,
|
|
1287
|
+
"lineageTextMatched": false,
|
|
1288
|
+
"requiredEvidenceMatched": true
|
|
1228
1289
|
},
|
|
1229
1290
|
{
|
|
1230
1291
|
"system": "Vector Only",
|
|
@@ -1234,11 +1295,11 @@
|
|
|
1234
1295
|
"decision": "warn",
|
|
1235
1296
|
"decisionCorrect": true,
|
|
1236
1297
|
"riskScore": 0.35,
|
|
1237
|
-
"passed":
|
|
1238
|
-
"latencyMs": 0.
|
|
1298
|
+
"passed": true,
|
|
1299
|
+
"latencyMs": 0.427,
|
|
1239
1300
|
"evidenceCount": 1,
|
|
1240
1301
|
"evidenceIds": [
|
|
1241
|
-
"
|
|
1302
|
+
"01KSRXCPA32S387Y36NHQRFNPT"
|
|
1242
1303
|
],
|
|
1243
1304
|
"recommendedActions": [
|
|
1244
1305
|
"Treat retrieved memory as advisory context."
|
|
@@ -1246,7 +1307,9 @@
|
|
|
1246
1307
|
"summary": "Retrieved related memory, but no controller converted it into a strict guard decision.",
|
|
1247
1308
|
"recallErrors": [],
|
|
1248
1309
|
"leakedSecrets": [],
|
|
1249
|
-
"
|
|
1310
|
+
"hasEvidenceForDecision": true,
|
|
1311
|
+
"lineageTextMatched": false,
|
|
1312
|
+
"requiredEvidenceMatched": true
|
|
1250
1313
|
},
|
|
1251
1314
|
{
|
|
1252
1315
|
"system": "FTS Only",
|
|
@@ -1257,13 +1320,15 @@
|
|
|
1257
1320
|
"decisionCorrect": false,
|
|
1258
1321
|
"riskScore": 0,
|
|
1259
1322
|
"passed": false,
|
|
1260
|
-
"latencyMs": 0.
|
|
1323
|
+
"latencyMs": 0.43,
|
|
1261
1324
|
"evidenceCount": 0,
|
|
1262
1325
|
"evidenceIds": [],
|
|
1263
1326
|
"recommendedActions": [],
|
|
1264
1327
|
"summary": "No memory signal found by this baseline.",
|
|
1265
1328
|
"recallErrors": [],
|
|
1266
1329
|
"leakedSecrets": [],
|
|
1330
|
+
"hasEvidenceForDecision": false,
|
|
1331
|
+
"lineageTextMatched": false,
|
|
1267
1332
|
"requiredEvidenceMatched": false
|
|
1268
1333
|
}
|
|
1269
1334
|
]
|
|
@@ -1282,11 +1347,11 @@
|
|
|
1282
1347
|
"decisionCorrect": true,
|
|
1283
1348
|
"riskScore": 0.2,
|
|
1284
1349
|
"passed": true,
|
|
1285
|
-
"latencyMs": 3.
|
|
1350
|
+
"latencyMs": 3.161,
|
|
1286
1351
|
"evidenceCount": 2,
|
|
1287
1352
|
"evidenceIds": [
|
|
1288
|
-
"
|
|
1289
|
-
"failure:Bash:2026-05-
|
|
1353
|
+
"01KSRXCPAXZX9BGBD93N5CDDCM",
|
|
1354
|
+
"failure:Bash:2026-05-29T03:45:33.531Z"
|
|
1290
1355
|
],
|
|
1291
1356
|
"recommendedActions": [
|
|
1292
1357
|
"This exact action has succeeded since its last failure; proceed with normal validation.",
|
|
@@ -1295,6 +1360,8 @@
|
|
|
1295
1360
|
"summary": "Allowed: this exact Bash action has succeeded since the prior failure. Caution: 1 memory signal, 1 medium severity found before acting.",
|
|
1296
1361
|
"recallErrors": [],
|
|
1297
1362
|
"leakedSecrets": [],
|
|
1363
|
+
"hasEvidenceForDecision": true,
|
|
1364
|
+
"lineageTextMatched": true,
|
|
1298
1365
|
"requiredEvidenceMatched": true
|
|
1299
1366
|
},
|
|
1300
1367
|
{
|
|
@@ -1305,15 +1372,17 @@
|
|
|
1305
1372
|
"decision": "allow",
|
|
1306
1373
|
"decisionCorrect": true,
|
|
1307
1374
|
"riskScore": 0,
|
|
1308
|
-
"passed":
|
|
1309
|
-
"latencyMs": 0.
|
|
1375
|
+
"passed": true,
|
|
1376
|
+
"latencyMs": 0.007,
|
|
1310
1377
|
"evidenceCount": 0,
|
|
1311
1378
|
"evidenceIds": [],
|
|
1312
1379
|
"recommendedActions": [],
|
|
1313
1380
|
"summary": "No memory baseline always allows proposed actions.",
|
|
1314
1381
|
"recallErrors": [],
|
|
1315
1382
|
"leakedSecrets": [],
|
|
1316
|
-
"
|
|
1383
|
+
"hasEvidenceForDecision": true,
|
|
1384
|
+
"lineageTextMatched": false,
|
|
1385
|
+
"requiredEvidenceMatched": true
|
|
1317
1386
|
},
|
|
1318
1387
|
{
|
|
1319
1388
|
"system": "Recent Window",
|
|
@@ -1324,10 +1393,10 @@
|
|
|
1324
1393
|
"decisionCorrect": false,
|
|
1325
1394
|
"riskScore": 0.55,
|
|
1326
1395
|
"passed": false,
|
|
1327
|
-
"latencyMs": 0.
|
|
1396
|
+
"latencyMs": 0.077,
|
|
1328
1397
|
"evidenceCount": 1,
|
|
1329
1398
|
"evidenceIds": [
|
|
1330
|
-
"
|
|
1399
|
+
"01KSRXCPBRH43HFGR41QC4C6S1"
|
|
1331
1400
|
],
|
|
1332
1401
|
"recommendedActions": [
|
|
1333
1402
|
"Check the recent failed event before repeating a similar action."
|
|
@@ -1335,7 +1404,9 @@
|
|
|
1335
1404
|
"summary": "Recent-window baseline found a failed Bash event.",
|
|
1336
1405
|
"recallErrors": [],
|
|
1337
1406
|
"leakedSecrets": [],
|
|
1338
|
-
"
|
|
1407
|
+
"hasEvidenceForDecision": true,
|
|
1408
|
+
"lineageTextMatched": false,
|
|
1409
|
+
"requiredEvidenceMatched": true
|
|
1339
1410
|
},
|
|
1340
1411
|
{
|
|
1341
1412
|
"system": "Vector Only",
|
|
@@ -1346,10 +1417,10 @@
|
|
|
1346
1417
|
"decisionCorrect": false,
|
|
1347
1418
|
"riskScore": 0.35,
|
|
1348
1419
|
"passed": false,
|
|
1349
|
-
"latencyMs": 0.
|
|
1420
|
+
"latencyMs": 0.451,
|
|
1350
1421
|
"evidenceCount": 1,
|
|
1351
1422
|
"evidenceIds": [
|
|
1352
|
-
"
|
|
1423
|
+
"01KSRXCPC5FRNJEG2MV4DA0M6B"
|
|
1353
1424
|
],
|
|
1354
1425
|
"recommendedActions": [
|
|
1355
1426
|
"Treat retrieved memory as advisory context."
|
|
@@ -1357,7 +1428,9 @@
|
|
|
1357
1428
|
"summary": "Retrieved related memory, but no controller converted it into a strict guard decision.",
|
|
1358
1429
|
"recallErrors": [],
|
|
1359
1430
|
"leakedSecrets": [],
|
|
1360
|
-
"
|
|
1431
|
+
"hasEvidenceForDecision": true,
|
|
1432
|
+
"lineageTextMatched": false,
|
|
1433
|
+
"requiredEvidenceMatched": true
|
|
1361
1434
|
},
|
|
1362
1435
|
{
|
|
1363
1436
|
"system": "FTS Only",
|
|
@@ -1367,15 +1440,17 @@
|
|
|
1367
1440
|
"decision": "allow",
|
|
1368
1441
|
"decisionCorrect": true,
|
|
1369
1442
|
"riskScore": 0,
|
|
1370
|
-
"passed":
|
|
1371
|
-
"latencyMs": 0.
|
|
1443
|
+
"passed": true,
|
|
1444
|
+
"latencyMs": 0.44,
|
|
1372
1445
|
"evidenceCount": 0,
|
|
1373
1446
|
"evidenceIds": [],
|
|
1374
1447
|
"recommendedActions": [],
|
|
1375
1448
|
"summary": "No memory signal found by this baseline.",
|
|
1376
1449
|
"recallErrors": [],
|
|
1377
1450
|
"leakedSecrets": [],
|
|
1378
|
-
"
|
|
1451
|
+
"hasEvidenceForDecision": true,
|
|
1452
|
+
"lineageTextMatched": false,
|
|
1453
|
+
"requiredEvidenceMatched": true
|
|
1379
1454
|
}
|
|
1380
1455
|
]
|
|
1381
1456
|
},
|
|
@@ -1393,7 +1468,7 @@
|
|
|
1393
1468
|
"decisionCorrect": true,
|
|
1394
1469
|
"riskScore": 0.85,
|
|
1395
1470
|
"passed": true,
|
|
1396
|
-
"latencyMs": 2.
|
|
1471
|
+
"latencyMs": 2.647,
|
|
1397
1472
|
"evidenceCount": 1,
|
|
1398
1473
|
"evidenceIds": [
|
|
1399
1474
|
"recall:episodic:recall.vector_counts"
|
|
@@ -1406,6 +1481,8 @@
|
|
|
1406
1481
|
"summary": "Blocked: 2 memory signals, 2 high severity found before acting.",
|
|
1407
1482
|
"recallErrors": [],
|
|
1408
1483
|
"leakedSecrets": [],
|
|
1484
|
+
"hasEvidenceForDecision": true,
|
|
1485
|
+
"lineageTextMatched": true,
|
|
1409
1486
|
"requiredEvidenceMatched": true
|
|
1410
1487
|
},
|
|
1411
1488
|
{
|
|
@@ -1417,13 +1494,15 @@
|
|
|
1417
1494
|
"decisionCorrect": false,
|
|
1418
1495
|
"riskScore": 0,
|
|
1419
1496
|
"passed": false,
|
|
1420
|
-
"latencyMs": 0.
|
|
1497
|
+
"latencyMs": 0.01,
|
|
1421
1498
|
"evidenceCount": 0,
|
|
1422
1499
|
"evidenceIds": [],
|
|
1423
1500
|
"recommendedActions": [],
|
|
1424
1501
|
"summary": "No memory baseline always allows proposed actions.",
|
|
1425
1502
|
"recallErrors": [],
|
|
1426
1503
|
"leakedSecrets": [],
|
|
1504
|
+
"hasEvidenceForDecision": false,
|
|
1505
|
+
"lineageTextMatched": false,
|
|
1427
1506
|
"requiredEvidenceMatched": false
|
|
1428
1507
|
},
|
|
1429
1508
|
{
|
|
@@ -1434,11 +1513,11 @@
|
|
|
1434
1513
|
"decision": "block",
|
|
1435
1514
|
"decisionCorrect": true,
|
|
1436
1515
|
"riskScore": 0.85,
|
|
1437
|
-
"passed":
|
|
1438
|
-
"latencyMs": 0.
|
|
1516
|
+
"passed": true,
|
|
1517
|
+
"latencyMs": 0.153,
|
|
1439
1518
|
"evidenceCount": 1,
|
|
1440
1519
|
"evidenceIds": [
|
|
1441
|
-
"
|
|
1520
|
+
"01KSRXCPDRK36MH6YDNH3JKEXF"
|
|
1442
1521
|
],
|
|
1443
1522
|
"recommendedActions": [
|
|
1444
1523
|
"Review retrieved memory before acting."
|
|
@@ -1446,7 +1525,9 @@
|
|
|
1446
1525
|
"summary": "Retrieved policy-like memory with lexical overlap, but without Audrey Guard lineage.",
|
|
1447
1526
|
"recallErrors": [],
|
|
1448
1527
|
"leakedSecrets": [],
|
|
1449
|
-
"
|
|
1528
|
+
"hasEvidenceForDecision": true,
|
|
1529
|
+
"lineageTextMatched": false,
|
|
1530
|
+
"requiredEvidenceMatched": true
|
|
1450
1531
|
},
|
|
1451
1532
|
{
|
|
1452
1533
|
"system": "Vector Only",
|
|
@@ -1457,7 +1538,7 @@
|
|
|
1457
1538
|
"decisionCorrect": false,
|
|
1458
1539
|
"riskScore": 0.55,
|
|
1459
1540
|
"passed": false,
|
|
1460
|
-
"latencyMs": 0.
|
|
1541
|
+
"latencyMs": 0.304,
|
|
1461
1542
|
"evidenceCount": 0,
|
|
1462
1543
|
"evidenceIds": [],
|
|
1463
1544
|
"recommendedActions": [
|
|
@@ -1472,6 +1553,8 @@
|
|
|
1472
1553
|
}
|
|
1473
1554
|
],
|
|
1474
1555
|
"leakedSecrets": [],
|
|
1556
|
+
"hasEvidenceForDecision": false,
|
|
1557
|
+
"lineageTextMatched": false,
|
|
1475
1558
|
"requiredEvidenceMatched": false
|
|
1476
1559
|
},
|
|
1477
1560
|
{
|
|
@@ -1483,13 +1566,15 @@
|
|
|
1483
1566
|
"decisionCorrect": false,
|
|
1484
1567
|
"riskScore": 0,
|
|
1485
1568
|
"passed": false,
|
|
1486
|
-
"latencyMs": 0.
|
|
1569
|
+
"latencyMs": 0.376,
|
|
1487
1570
|
"evidenceCount": 0,
|
|
1488
1571
|
"evidenceIds": [],
|
|
1489
1572
|
"recommendedActions": [],
|
|
1490
1573
|
"summary": "No memory signal found by this baseline.",
|
|
1491
1574
|
"recallErrors": [],
|
|
1492
1575
|
"leakedSecrets": [],
|
|
1576
|
+
"hasEvidenceForDecision": false,
|
|
1577
|
+
"lineageTextMatched": false,
|
|
1493
1578
|
"requiredEvidenceMatched": false
|
|
1494
1579
|
}
|
|
1495
1580
|
]
|
|
@@ -1508,11 +1593,11 @@
|
|
|
1508
1593
|
"decisionCorrect": true,
|
|
1509
1594
|
"riskScore": 0.85,
|
|
1510
1595
|
"passed": true,
|
|
1511
|
-
"latencyMs":
|
|
1596
|
+
"latencyMs": 1.934,
|
|
1512
1597
|
"evidenceCount": 2,
|
|
1513
1598
|
"evidenceIds": [
|
|
1514
1599
|
"recall:fts:recall.fts_lookup",
|
|
1515
|
-
"
|
|
1600
|
+
"01KSRXCPEXC1RDR4VFSV3ZV759"
|
|
1516
1601
|
],
|
|
1517
1602
|
"recommendedActions": [
|
|
1518
1603
|
"Do not proceed until the high-severity memory warning is addressed.",
|
|
@@ -1522,6 +1607,8 @@
|
|
|
1522
1607
|
"summary": "Blocked: 2 memory signals, 2 high severity found before acting.",
|
|
1523
1608
|
"recallErrors": [],
|
|
1524
1609
|
"leakedSecrets": [],
|
|
1610
|
+
"hasEvidenceForDecision": true,
|
|
1611
|
+
"lineageTextMatched": true,
|
|
1525
1612
|
"requiredEvidenceMatched": true
|
|
1526
1613
|
},
|
|
1527
1614
|
{
|
|
@@ -1533,13 +1620,15 @@
|
|
|
1533
1620
|
"decisionCorrect": false,
|
|
1534
1621
|
"riskScore": 0,
|
|
1535
1622
|
"passed": false,
|
|
1536
|
-
"latencyMs": 0.
|
|
1623
|
+
"latencyMs": 0.006,
|
|
1537
1624
|
"evidenceCount": 0,
|
|
1538
1625
|
"evidenceIds": [],
|
|
1539
1626
|
"recommendedActions": [],
|
|
1540
1627
|
"summary": "No memory baseline always allows proposed actions.",
|
|
1541
1628
|
"recallErrors": [],
|
|
1542
1629
|
"leakedSecrets": [],
|
|
1630
|
+
"hasEvidenceForDecision": false,
|
|
1631
|
+
"lineageTextMatched": false,
|
|
1543
1632
|
"requiredEvidenceMatched": false
|
|
1544
1633
|
},
|
|
1545
1634
|
{
|
|
@@ -1551,10 +1640,10 @@
|
|
|
1551
1640
|
"decisionCorrect": false,
|
|
1552
1641
|
"riskScore": 0.35,
|
|
1553
1642
|
"passed": false,
|
|
1554
|
-
"latencyMs": 0.
|
|
1643
|
+
"latencyMs": 0.105,
|
|
1555
1644
|
"evidenceCount": 1,
|
|
1556
1645
|
"evidenceIds": [
|
|
1557
|
-
"
|
|
1646
|
+
"01KSRXCPFQ579DG3V402TKWYPM"
|
|
1558
1647
|
],
|
|
1559
1648
|
"recommendedActions": [
|
|
1560
1649
|
"Treat retrieved memory as advisory context."
|
|
@@ -1562,7 +1651,9 @@
|
|
|
1562
1651
|
"summary": "Retrieved related memory, but no controller converted it into a strict guard decision.",
|
|
1563
1652
|
"recallErrors": [],
|
|
1564
1653
|
"leakedSecrets": [],
|
|
1565
|
-
"
|
|
1654
|
+
"hasEvidenceForDecision": true,
|
|
1655
|
+
"lineageTextMatched": false,
|
|
1656
|
+
"requiredEvidenceMatched": true
|
|
1566
1657
|
},
|
|
1567
1658
|
{
|
|
1568
1659
|
"system": "Vector Only",
|
|
@@ -1573,10 +1664,10 @@
|
|
|
1573
1664
|
"decisionCorrect": false,
|
|
1574
1665
|
"riskScore": 0.35,
|
|
1575
1666
|
"passed": false,
|
|
1576
|
-
"latencyMs": 0.
|
|
1667
|
+
"latencyMs": 0.347,
|
|
1577
1668
|
"evidenceCount": 1,
|
|
1578
1669
|
"evidenceIds": [
|
|
1579
|
-
"
|
|
1670
|
+
"01KSRXCPG3Q8K0YSYA2SAVRPMM"
|
|
1580
1671
|
],
|
|
1581
1672
|
"recommendedActions": [
|
|
1582
1673
|
"Treat retrieved memory as advisory context."
|
|
@@ -1584,7 +1675,9 @@
|
|
|
1584
1675
|
"summary": "Retrieved related memory, but no controller converted it into a strict guard decision.",
|
|
1585
1676
|
"recallErrors": [],
|
|
1586
1677
|
"leakedSecrets": [],
|
|
1587
|
-
"
|
|
1678
|
+
"hasEvidenceForDecision": true,
|
|
1679
|
+
"lineageTextMatched": false,
|
|
1680
|
+
"requiredEvidenceMatched": true
|
|
1588
1681
|
},
|
|
1589
1682
|
{
|
|
1590
1683
|
"system": "FTS Only",
|
|
@@ -1595,7 +1688,7 @@
|
|
|
1595
1688
|
"decisionCorrect": false,
|
|
1596
1689
|
"riskScore": 0.55,
|
|
1597
1690
|
"passed": false,
|
|
1598
|
-
"latencyMs": 0.
|
|
1691
|
+
"latencyMs": 0.13,
|
|
1599
1692
|
"evidenceCount": 0,
|
|
1600
1693
|
"evidenceIds": [],
|
|
1601
1694
|
"recommendedActions": [
|
|
@@ -1610,7 +1703,9 @@
|
|
|
1610
1703
|
}
|
|
1611
1704
|
],
|
|
1612
1705
|
"leakedSecrets": [],
|
|
1613
|
-
"
|
|
1706
|
+
"hasEvidenceForDecision": false,
|
|
1707
|
+
"lineageTextMatched": true,
|
|
1708
|
+
"requiredEvidenceMatched": false
|
|
1614
1709
|
}
|
|
1615
1710
|
]
|
|
1616
1711
|
},
|
|
@@ -1628,11 +1723,11 @@
|
|
|
1628
1723
|
"decisionCorrect": true,
|
|
1629
1724
|
"riskScore": 0.9,
|
|
1630
1725
|
"passed": true,
|
|
1631
|
-
"latencyMs": 2.
|
|
1726
|
+
"latencyMs": 2.599,
|
|
1632
1727
|
"evidenceCount": 2,
|
|
1633
1728
|
"evidenceIds": [
|
|
1634
|
-
"
|
|
1635
|
-
"failure:Bash:2026-05-
|
|
1729
|
+
"01KSRXCPGV1X3H49QBRCN72084",
|
|
1730
|
+
"failure:Bash:2026-05-29T03:45:33.723Z"
|
|
1636
1731
|
],
|
|
1637
1732
|
"recommendedActions": [
|
|
1638
1733
|
"Do not repeat the exact failed action until the prior error is understood or the command is changed.",
|
|
@@ -1641,6 +1736,8 @@
|
|
|
1641
1736
|
"summary": "Blocked: this exact Bash action failed before. Caution: 1 memory signal, 1 medium severity found before acting.",
|
|
1642
1737
|
"recallErrors": [],
|
|
1643
1738
|
"leakedSecrets": [],
|
|
1739
|
+
"hasEvidenceForDecision": true,
|
|
1740
|
+
"lineageTextMatched": true,
|
|
1644
1741
|
"requiredEvidenceMatched": true
|
|
1645
1742
|
},
|
|
1646
1743
|
{
|
|
@@ -1652,13 +1749,15 @@
|
|
|
1652
1749
|
"decisionCorrect": false,
|
|
1653
1750
|
"riskScore": 0,
|
|
1654
1751
|
"passed": false,
|
|
1655
|
-
"latencyMs": 0.
|
|
1752
|
+
"latencyMs": 0.005,
|
|
1656
1753
|
"evidenceCount": 0,
|
|
1657
1754
|
"evidenceIds": [],
|
|
1658
1755
|
"recommendedActions": [],
|
|
1659
1756
|
"summary": "No memory baseline always allows proposed actions.",
|
|
1660
1757
|
"recallErrors": [],
|
|
1661
1758
|
"leakedSecrets": [],
|
|
1759
|
+
"hasEvidenceForDecision": false,
|
|
1760
|
+
"lineageTextMatched": false,
|
|
1662
1761
|
"requiredEvidenceMatched": false
|
|
1663
1762
|
},
|
|
1664
1763
|
{
|
|
@@ -1670,10 +1769,10 @@
|
|
|
1670
1769
|
"decisionCorrect": false,
|
|
1671
1770
|
"riskScore": 0.55,
|
|
1672
1771
|
"passed": false,
|
|
1673
|
-
"latencyMs": 0.
|
|
1772
|
+
"latencyMs": 0.062,
|
|
1674
1773
|
"evidenceCount": 1,
|
|
1675
1774
|
"evidenceIds": [
|
|
1676
|
-
"
|
|
1775
|
+
"01KSRXCPHPYBHWZKFJ5XCHY1X6"
|
|
1677
1776
|
],
|
|
1678
1777
|
"recommendedActions": [
|
|
1679
1778
|
"Check the recent failed event before repeating a similar action."
|
|
@@ -1681,7 +1780,9 @@
|
|
|
1681
1780
|
"summary": "Recent-window baseline found a failed Bash event.",
|
|
1682
1781
|
"recallErrors": [],
|
|
1683
1782
|
"leakedSecrets": [],
|
|
1684
|
-
"
|
|
1783
|
+
"hasEvidenceForDecision": true,
|
|
1784
|
+
"lineageTextMatched": false,
|
|
1785
|
+
"requiredEvidenceMatched": true
|
|
1685
1786
|
},
|
|
1686
1787
|
{
|
|
1687
1788
|
"system": "Vector Only",
|
|
@@ -1692,10 +1793,10 @@
|
|
|
1692
1793
|
"decisionCorrect": false,
|
|
1693
1794
|
"riskScore": 0.35,
|
|
1694
1795
|
"passed": false,
|
|
1695
|
-
"latencyMs": 0.
|
|
1796
|
+
"latencyMs": 0.396,
|
|
1696
1797
|
"evidenceCount": 1,
|
|
1697
1798
|
"evidenceIds": [
|
|
1698
|
-
"
|
|
1799
|
+
"01KSRXCPJ2NXZ1VNNKPQ5RH818"
|
|
1699
1800
|
],
|
|
1700
1801
|
"recommendedActions": [
|
|
1701
1802
|
"Treat retrieved memory as advisory context."
|
|
@@ -1703,7 +1804,9 @@
|
|
|
1703
1804
|
"summary": "Retrieved related memory, but no controller converted it into a strict guard decision.",
|
|
1704
1805
|
"recallErrors": [],
|
|
1705
1806
|
"leakedSecrets": [],
|
|
1706
|
-
"
|
|
1807
|
+
"hasEvidenceForDecision": true,
|
|
1808
|
+
"lineageTextMatched": false,
|
|
1809
|
+
"requiredEvidenceMatched": true
|
|
1707
1810
|
},
|
|
1708
1811
|
{
|
|
1709
1812
|
"system": "FTS Only",
|
|
@@ -1714,13 +1817,15 @@
|
|
|
1714
1817
|
"decisionCorrect": false,
|
|
1715
1818
|
"riskScore": 0,
|
|
1716
1819
|
"passed": false,
|
|
1717
|
-
"latencyMs": 0.
|
|
1820
|
+
"latencyMs": 0.35,
|
|
1718
1821
|
"evidenceCount": 0,
|
|
1719
1822
|
"evidenceIds": [],
|
|
1720
1823
|
"recommendedActions": [],
|
|
1721
1824
|
"summary": "No memory signal found by this baseline.",
|
|
1722
1825
|
"recallErrors": [],
|
|
1723
1826
|
"leakedSecrets": [],
|
|
1827
|
+
"hasEvidenceForDecision": false,
|
|
1828
|
+
"lineageTextMatched": false,
|
|
1724
1829
|
"requiredEvidenceMatched": false
|
|
1725
1830
|
}
|
|
1726
1831
|
]
|
|
@@ -1739,11 +1844,11 @@
|
|
|
1739
1844
|
"decisionCorrect": true,
|
|
1740
1845
|
"riskScore": 0.85,
|
|
1741
1846
|
"passed": true,
|
|
1742
|
-
"latencyMs": 2.
|
|
1847
|
+
"latencyMs": 2.391,
|
|
1743
1848
|
"evidenceCount": 2,
|
|
1744
1849
|
"evidenceIds": [
|
|
1745
|
-
"
|
|
1746
|
-
"
|
|
1850
|
+
"01KSRXCPJTXVN9X36WASHM2QY6",
|
|
1851
|
+
"01KSRXCPJV1JQBFZ19K6H796AG"
|
|
1747
1852
|
],
|
|
1748
1853
|
"recommendedActions": [
|
|
1749
1854
|
"Do not proceed until the high-severity memory warning is addressed.",
|
|
@@ -1752,6 +1857,8 @@
|
|
|
1752
1857
|
"summary": "Blocked: 2 memory signals, 2 high severity found before acting.",
|
|
1753
1858
|
"recallErrors": [],
|
|
1754
1859
|
"leakedSecrets": [],
|
|
1860
|
+
"hasEvidenceForDecision": true,
|
|
1861
|
+
"lineageTextMatched": true,
|
|
1755
1862
|
"requiredEvidenceMatched": true
|
|
1756
1863
|
},
|
|
1757
1864
|
{
|
|
@@ -1763,13 +1870,15 @@
|
|
|
1763
1870
|
"decisionCorrect": false,
|
|
1764
1871
|
"riskScore": 0,
|
|
1765
1872
|
"passed": false,
|
|
1766
|
-
"latencyMs": 0.
|
|
1873
|
+
"latencyMs": 0.004,
|
|
1767
1874
|
"evidenceCount": 0,
|
|
1768
1875
|
"evidenceIds": [],
|
|
1769
1876
|
"recommendedActions": [],
|
|
1770
1877
|
"summary": "No memory baseline always allows proposed actions.",
|
|
1771
1878
|
"recallErrors": [],
|
|
1772
1879
|
"leakedSecrets": [],
|
|
1880
|
+
"hasEvidenceForDecision": false,
|
|
1881
|
+
"lineageTextMatched": false,
|
|
1773
1882
|
"requiredEvidenceMatched": false
|
|
1774
1883
|
},
|
|
1775
1884
|
{
|
|
@@ -1780,12 +1889,12 @@
|
|
|
1780
1889
|
"decision": "block",
|
|
1781
1890
|
"decisionCorrect": true,
|
|
1782
1891
|
"riskScore": 0.85,
|
|
1783
|
-
"passed":
|
|
1784
|
-
"latencyMs": 0.
|
|
1892
|
+
"passed": true,
|
|
1893
|
+
"latencyMs": 0.106,
|
|
1785
1894
|
"evidenceCount": 2,
|
|
1786
1895
|
"evidenceIds": [
|
|
1787
|
-
"
|
|
1788
|
-
"
|
|
1896
|
+
"01KSRXCPKNY5BNX2TH3M407J48",
|
|
1897
|
+
"01KSRXCPKMTBHPCWYJWJ3REV9J"
|
|
1789
1898
|
],
|
|
1790
1899
|
"recommendedActions": [
|
|
1791
1900
|
"Review retrieved memory before acting."
|
|
@@ -1793,7 +1902,9 @@
|
|
|
1793
1902
|
"summary": "Retrieved policy-like memory with lexical overlap, but without Audrey Guard lineage.",
|
|
1794
1903
|
"recallErrors": [],
|
|
1795
1904
|
"leakedSecrets": [],
|
|
1796
|
-
"
|
|
1905
|
+
"hasEvidenceForDecision": true,
|
|
1906
|
+
"lineageTextMatched": false,
|
|
1907
|
+
"requiredEvidenceMatched": true
|
|
1797
1908
|
},
|
|
1798
1909
|
{
|
|
1799
1910
|
"system": "Vector Only",
|
|
@@ -1803,12 +1914,12 @@
|
|
|
1803
1914
|
"decision": "block",
|
|
1804
1915
|
"decisionCorrect": true,
|
|
1805
1916
|
"riskScore": 0.85,
|
|
1806
|
-
"passed":
|
|
1807
|
-
"latencyMs": 0.
|
|
1917
|
+
"passed": true,
|
|
1918
|
+
"latencyMs": 0.4,
|
|
1808
1919
|
"evidenceCount": 2,
|
|
1809
1920
|
"evidenceIds": [
|
|
1810
|
-
"
|
|
1811
|
-
"
|
|
1921
|
+
"01KSRXCPM08WEJAJ579D9KS053",
|
|
1922
|
+
"01KSRXCPM1V6CVS8380AN3F39Y"
|
|
1812
1923
|
],
|
|
1813
1924
|
"recommendedActions": [
|
|
1814
1925
|
"Review retrieved memory before acting."
|
|
@@ -1816,7 +1927,9 @@
|
|
|
1816
1927
|
"summary": "Retrieved policy-like memory with lexical overlap, but without Audrey Guard lineage.",
|
|
1817
1928
|
"recallErrors": [],
|
|
1818
1929
|
"leakedSecrets": [],
|
|
1819
|
-
"
|
|
1930
|
+
"hasEvidenceForDecision": true,
|
|
1931
|
+
"lineageTextMatched": false,
|
|
1932
|
+
"requiredEvidenceMatched": true
|
|
1820
1933
|
},
|
|
1821
1934
|
{
|
|
1822
1935
|
"system": "FTS Only",
|
|
@@ -1827,13 +1940,15 @@
|
|
|
1827
1940
|
"decisionCorrect": false,
|
|
1828
1941
|
"riskScore": 0,
|
|
1829
1942
|
"passed": false,
|
|
1830
|
-
"latencyMs": 0.
|
|
1943
|
+
"latencyMs": 0.378,
|
|
1831
1944
|
"evidenceCount": 0,
|
|
1832
1945
|
"evidenceIds": [],
|
|
1833
1946
|
"recommendedActions": [],
|
|
1834
1947
|
"summary": "No memory signal found by this baseline.",
|
|
1835
1948
|
"recallErrors": [],
|
|
1836
1949
|
"leakedSecrets": [],
|
|
1950
|
+
"hasEvidenceForDecision": false,
|
|
1951
|
+
"lineageTextMatched": false,
|
|
1837
1952
|
"requiredEvidenceMatched": false
|
|
1838
1953
|
}
|
|
1839
1954
|
]
|
|
@@ -1852,31 +1967,32 @@
|
|
|
1852
1967
|
"decisionCorrect": true,
|
|
1853
1968
|
"riskScore": 0.85,
|
|
1854
1969
|
"passed": true,
|
|
1855
|
-
"latencyMs":
|
|
1856
|
-
"evidenceCount":
|
|
1970
|
+
"latencyMs": 21.17,
|
|
1971
|
+
"evidenceCount": 12,
|
|
1857
1972
|
"evidenceIds": [
|
|
1858
|
-
"
|
|
1859
|
-
"
|
|
1860
|
-
"
|
|
1861
|
-
"
|
|
1862
|
-
"
|
|
1863
|
-
"
|
|
1864
|
-
"
|
|
1865
|
-
"
|
|
1866
|
-
"
|
|
1867
|
-
"
|
|
1868
|
-
"
|
|
1869
|
-
"
|
|
1870
|
-
"01KRHV0Y0MWQGN3QAWME8F5554"
|
|
1973
|
+
"01KSRXCQ4DK284E35ZKNYDXWBQ",
|
|
1974
|
+
"01KSRXCQ3H1TVR4E552DQVV9MG",
|
|
1975
|
+
"01KSRXCQ39QKSSNZWEFZBHMNT9",
|
|
1976
|
+
"01KSRXCPYP6VKM8AZC7KZ4SN6W",
|
|
1977
|
+
"01KSRXCPVWWCPWE3M38G6VM1BG",
|
|
1978
|
+
"01KSRXCPV7YMCBAT0602VZ3DQG",
|
|
1979
|
+
"01KSRXCPTM8GHZXKXNKH5FMRG6",
|
|
1980
|
+
"01KSRXCPSNJTZHJK1MWE6WNNYW",
|
|
1981
|
+
"01KSRXCPS3K2GR6MFXTMTDEKD3",
|
|
1982
|
+
"01KSRXCPS3K2GR6MFXTMTDEKD2",
|
|
1983
|
+
"01KSRXCPRGC2EN41NQD4MYJ1Q1",
|
|
1984
|
+
"01KSRXCPNG135506TFPF1WMAVB"
|
|
1871
1985
|
],
|
|
1872
1986
|
"recommendedActions": [
|
|
1873
1987
|
"Do not proceed until the high-severity memory warning is addressed.",
|
|
1874
1988
|
"Apply this must-follow rule before acting.",
|
|
1875
1989
|
"Treat this as uncertain context and verify before relying on it."
|
|
1876
1990
|
],
|
|
1877
|
-
"summary": "Blocked:
|
|
1991
|
+
"summary": "Blocked: 12 memory signals, 1 high severity, 11 medium severity found before acting.",
|
|
1878
1992
|
"recallErrors": [],
|
|
1879
1993
|
"leakedSecrets": [],
|
|
1994
|
+
"hasEvidenceForDecision": true,
|
|
1995
|
+
"lineageTextMatched": true,
|
|
1880
1996
|
"requiredEvidenceMatched": true
|
|
1881
1997
|
},
|
|
1882
1998
|
{
|
|
@@ -1888,13 +2004,15 @@
|
|
|
1888
2004
|
"decisionCorrect": false,
|
|
1889
2005
|
"riskScore": 0,
|
|
1890
2006
|
"passed": false,
|
|
1891
|
-
"latencyMs": 0.
|
|
2007
|
+
"latencyMs": 0.011,
|
|
1892
2008
|
"evidenceCount": 0,
|
|
1893
2009
|
"evidenceIds": [],
|
|
1894
2010
|
"recommendedActions": [],
|
|
1895
2011
|
"summary": "No memory baseline always allows proposed actions.",
|
|
1896
2012
|
"recallErrors": [],
|
|
1897
2013
|
"leakedSecrets": [],
|
|
2014
|
+
"hasEvidenceForDecision": false,
|
|
2015
|
+
"lineageTextMatched": false,
|
|
1898
2016
|
"requiredEvidenceMatched": false
|
|
1899
2017
|
},
|
|
1900
2018
|
{
|
|
@@ -1905,11 +2023,11 @@
|
|
|
1905
2023
|
"decision": "block",
|
|
1906
2024
|
"decisionCorrect": true,
|
|
1907
2025
|
"riskScore": 0.85,
|
|
1908
|
-
"passed":
|
|
1909
|
-
"latencyMs": 0.
|
|
2026
|
+
"passed": true,
|
|
2027
|
+
"latencyMs": 0.421,
|
|
1910
2028
|
"evidenceCount": 1,
|
|
1911
2029
|
"evidenceIds": [
|
|
1912
|
-
"
|
|
2030
|
+
"01KSRXCR6FARVQ7ATWYWC5QAF9"
|
|
1913
2031
|
],
|
|
1914
2032
|
"recommendedActions": [
|
|
1915
2033
|
"Review retrieved memory before acting."
|
|
@@ -1917,7 +2035,9 @@
|
|
|
1917
2035
|
"summary": "Retrieved policy-like memory with lexical overlap, but without Audrey Guard lineage.",
|
|
1918
2036
|
"recallErrors": [],
|
|
1919
2037
|
"leakedSecrets": [],
|
|
1920
|
-
"
|
|
2038
|
+
"hasEvidenceForDecision": true,
|
|
2039
|
+
"lineageTextMatched": false,
|
|
2040
|
+
"requiredEvidenceMatched": true
|
|
1921
2041
|
},
|
|
1922
2042
|
{
|
|
1923
2043
|
"system": "Vector Only",
|
|
@@ -1928,14 +2048,14 @@
|
|
|
1928
2048
|
"decisionCorrect": false,
|
|
1929
2049
|
"riskScore": 0.35,
|
|
1930
2050
|
"passed": false,
|
|
1931
|
-
"latencyMs": 1.
|
|
2051
|
+
"latencyMs": 1.551,
|
|
1932
2052
|
"evidenceCount": 5,
|
|
1933
2053
|
"evidenceIds": [
|
|
1934
|
-
"
|
|
1935
|
-
"
|
|
1936
|
-
"
|
|
1937
|
-
"
|
|
1938
|
-
"
|
|
2054
|
+
"01KSRXCRC5YBFBKT1RM4SPXRZZ",
|
|
2055
|
+
"01KSRXCR9R09K2J5HM1BGN1PSW",
|
|
2056
|
+
"01KSRXCRJKF9PWQG7YRGGK1TP6",
|
|
2057
|
+
"01KSRXCRGTW1V1VGWWT869D36Q",
|
|
2058
|
+
"01KSRXCRP3KVXPGD7WMNS3KWKF"
|
|
1939
2059
|
],
|
|
1940
2060
|
"recommendedActions": [
|
|
1941
2061
|
"Treat retrieved memory as advisory context."
|
|
@@ -1943,7 +2063,9 @@
|
|
|
1943
2063
|
"summary": "Retrieved related memory, but no controller converted it into a strict guard decision.",
|
|
1944
2064
|
"recallErrors": [],
|
|
1945
2065
|
"leakedSecrets": [],
|
|
1946
|
-
"
|
|
2066
|
+
"hasEvidenceForDecision": true,
|
|
2067
|
+
"lineageTextMatched": false,
|
|
2068
|
+
"requiredEvidenceMatched": true
|
|
1947
2069
|
},
|
|
1948
2070
|
{
|
|
1949
2071
|
"system": "FTS Only",
|
|
@@ -1954,20 +2076,22 @@
|
|
|
1954
2076
|
"decisionCorrect": false,
|
|
1955
2077
|
"riskScore": 0,
|
|
1956
2078
|
"passed": false,
|
|
1957
|
-
"latencyMs": 0.
|
|
2079
|
+
"latencyMs": 0.717,
|
|
1958
2080
|
"evidenceCount": 0,
|
|
1959
2081
|
"evidenceIds": [],
|
|
1960
2082
|
"recommendedActions": [],
|
|
1961
2083
|
"summary": "No memory signal found by this baseline.",
|
|
1962
2084
|
"recallErrors": [],
|
|
1963
2085
|
"leakedSecrets": [],
|
|
2086
|
+
"hasEvidenceForDecision": false,
|
|
2087
|
+
"lineageTextMatched": false,
|
|
1964
2088
|
"requiredEvidenceMatched": false
|
|
1965
2089
|
}
|
|
1966
2090
|
]
|
|
1967
2091
|
}
|
|
1968
2092
|
],
|
|
1969
2093
|
"artifactRedactionSweep": {
|
|
1970
|
-
"checkedAt": "2026-05-
|
|
2094
|
+
"checkedAt": "2026-05-29T03:45:36.646Z",
|
|
1971
2095
|
"filesChecked": [
|
|
1972
2096
|
"benchmarks/output/guardbench-manifest.json",
|
|
1973
2097
|
"benchmarks/output/guardbench-raw.json",
|