audrey 0.21.0 → 1.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +238 -0
- package/LICENSE +21 -21
- package/README.md +281 -33
- package/SECURITY.md +30 -0
- package/benchmarks/adapter-kit.mjs +20 -0
- package/benchmarks/adapter-self-test.mjs +166 -0
- package/benchmarks/adapters/example-allow.mjs +28 -0
- package/benchmarks/adapters/mem0-platform.mjs +267 -0
- package/benchmarks/adapters/registry.json +51 -0
- package/benchmarks/adapters/zep-cloud.mjs +280 -0
- package/benchmarks/baselines.js +169 -0
- package/benchmarks/build-leaderboard.mjs +170 -0
- package/benchmarks/cases.js +537 -0
- package/benchmarks/create-conformance-card.mjs +139 -0
- package/benchmarks/create-submission-bundle.mjs +176 -0
- package/benchmarks/dry-run-external-adapters.mjs +165 -0
- package/benchmarks/guardbench.js +1035 -0
- package/benchmarks/output/adapter-self-test/guardbench-adapter-self-test.json +50 -0
- package/benchmarks/output/external/guardbench-external-dry-run.json +69 -0
- package/benchmarks/output/external/guardbench-external-evidence.json +56 -0
- package/benchmarks/output/guardbench-conformance-card.json +63 -0
- package/benchmarks/output/guardbench-manifest.json +414 -0
- package/benchmarks/output/guardbench-raw.json +1171 -0
- package/benchmarks/output/guardbench-summary.json +1981 -0
- package/benchmarks/output/leaderboard/guardbench-leaderboard.json +93 -0
- package/benchmarks/output/leaderboard/guardbench-leaderboard.md +7 -0
- package/benchmarks/output/submission-bundle/guardbench-conformance-card.json +63 -0
- package/benchmarks/output/submission-bundle/guardbench-manifest.json +414 -0
- package/benchmarks/output/submission-bundle/guardbench-raw.json +1171 -0
- package/benchmarks/output/submission-bundle/guardbench-summary.json +1981 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-adapter-registry.schema.json +69 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-adapter-self-test.schema.json +156 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-conformance-card.schema.json +184 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-external-dry-run.schema.json +74 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-external-evidence.schema.json +108 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-external-run.schema.json +160 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-leaderboard.schema.json +179 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-manifest.schema.json +213 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-publication-verification.schema.json +47 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-raw.schema.json +164 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-submission-manifest.schema.json +151 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-summary.schema.json +228 -0
- package/benchmarks/output/submission-bundle/submission-manifest.json +131 -0
- package/benchmarks/output/submission-bundle/validation-report.json +31 -0
- package/benchmarks/output/summary.json +2354 -0
- package/benchmarks/perf-snapshot.js +304 -0
- package/benchmarks/perf.bench.js +161 -0
- package/benchmarks/public-paths.mjs +78 -0
- package/benchmarks/reference-results.js +70 -0
- package/benchmarks/report.js +259 -0
- package/benchmarks/run-external-guardbench.mjs +281 -0
- package/benchmarks/run.js +682 -0
- package/benchmarks/schemas/guardbench-adapter-registry.schema.json +69 -0
- package/benchmarks/schemas/guardbench-adapter-self-test.schema.json +156 -0
- package/benchmarks/schemas/guardbench-conformance-card.schema.json +184 -0
- package/benchmarks/schemas/guardbench-external-dry-run.schema.json +74 -0
- package/benchmarks/schemas/guardbench-external-evidence.schema.json +108 -0
- package/benchmarks/schemas/guardbench-external-run.schema.json +160 -0
- package/benchmarks/schemas/guardbench-leaderboard.schema.json +179 -0
- package/benchmarks/schemas/guardbench-manifest.schema.json +213 -0
- package/benchmarks/schemas/guardbench-publication-verification.schema.json +47 -0
- package/benchmarks/schemas/guardbench-raw.schema.json +164 -0
- package/benchmarks/schemas/guardbench-submission-manifest.schema.json +151 -0
- package/benchmarks/schemas/guardbench-summary.schema.json +228 -0
- package/benchmarks/snapshots/perf-0.22.2.json +123 -0
- package/benchmarks/snapshots/perf-0.23.0.json +123 -0
- package/benchmarks/validate-adapter-module.mjs +104 -0
- package/benchmarks/validate-adapter-registry.mjs +134 -0
- package/benchmarks/validate-adapter-self-test.mjs +96 -0
- package/benchmarks/validate-guardbench-artifacts.mjs +343 -0
- package/benchmarks/verify-external-evidence.mjs +296 -0
- package/benchmarks/verify-publication-artifacts.mjs +286 -0
- package/benchmarks/verify-submission-bundle.mjs +167 -0
- package/dist/mcp-server/config.d.ts +5 -4
- package/dist/mcp-server/config.d.ts.map +1 -1
- package/dist/mcp-server/config.js +6 -8
- package/dist/mcp-server/config.js.map +1 -1
- package/dist/mcp-server/index.d.ts +281 -23
- package/dist/mcp-server/index.d.ts.map +1 -1
- package/dist/mcp-server/index.js +1186 -82
- package/dist/mcp-server/index.js.map +1 -1
- package/dist/src/action-key.d.ts +9 -0
- package/dist/src/action-key.d.ts.map +1 -0
- package/dist/src/action-key.js +49 -0
- package/dist/src/action-key.js.map +1 -0
- package/dist/src/adaptive.d.ts.map +1 -1
- package/dist/src/adaptive.js +8 -6
- package/dist/src/adaptive.js.map +1 -1
- package/dist/src/affect.d.ts +4 -1
- package/dist/src/affect.d.ts.map +1 -1
- package/dist/src/affect.js +14 -12
- package/dist/src/affect.js.map +1 -1
- package/dist/src/audrey.d.ts +57 -4
- package/dist/src/audrey.d.ts.map +1 -1
- package/dist/src/audrey.js +512 -65
- package/dist/src/audrey.js.map +1 -1
- package/dist/src/capsule.d.ts +2 -1
- package/dist/src/capsule.d.ts.map +1 -1
- package/dist/src/capsule.js +18 -8
- package/dist/src/capsule.js.map +1 -1
- package/dist/src/causal.d.ts.map +1 -1
- package/dist/src/causal.js +23 -5
- package/dist/src/causal.js.map +1 -1
- package/dist/src/confidence.d.ts.map +1 -1
- package/dist/src/confidence.js +3 -0
- package/dist/src/confidence.js.map +1 -1
- package/dist/src/consolidate.d.ts +1 -0
- package/dist/src/consolidate.d.ts.map +1 -1
- package/dist/src/consolidate.js +70 -54
- package/dist/src/consolidate.js.map +1 -1
- package/dist/src/controller.d.ts +94 -0
- package/dist/src/controller.d.ts.map +1 -0
- package/dist/src/controller.js +350 -0
- package/dist/src/controller.js.map +1 -0
- package/dist/src/db.d.ts.map +1 -1
- package/dist/src/db.js +181 -169
- package/dist/src/db.js.map +1 -1
- package/dist/src/decay.d.ts.map +1 -1
- package/dist/src/decay.js +62 -55
- package/dist/src/decay.js.map +1 -1
- package/dist/src/embedding.d.ts +2 -1
- package/dist/src/embedding.d.ts.map +1 -1
- package/dist/src/embedding.js +60 -22
- package/dist/src/embedding.js.map +1 -1
- package/dist/src/encode.d.ts +9 -2
- package/dist/src/encode.d.ts.map +1 -1
- package/dist/src/encode.js +25 -12
- package/dist/src/encode.js.map +1 -1
- package/dist/src/export.d.ts.map +1 -1
- package/dist/src/export.js +5 -3
- package/dist/src/export.js.map +1 -1
- package/dist/src/feedback.d.ts +35 -0
- package/dist/src/feedback.d.ts.map +1 -0
- package/dist/src/feedback.js +129 -0
- package/dist/src/feedback.js.map +1 -0
- package/dist/src/forget.d.ts.map +1 -1
- package/dist/src/forget.js +68 -60
- package/dist/src/forget.js.map +1 -1
- package/dist/src/fts.js +1 -1
- package/dist/src/fts.js.map +1 -1
- package/dist/src/hybrid-recall.d.ts +2 -1
- package/dist/src/hybrid-recall.d.ts.map +1 -1
- package/dist/src/hybrid-recall.js +41 -32
- package/dist/src/hybrid-recall.js.map +1 -1
- package/dist/src/impact.d.ts +47 -0
- package/dist/src/impact.d.ts.map +1 -0
- package/dist/src/impact.js +146 -0
- package/dist/src/impact.js.map +1 -0
- package/dist/src/import.d.ts +177 -1
- package/dist/src/import.d.ts.map +1 -1
- package/dist/src/import.js +235 -46
- package/dist/src/import.js.map +1 -1
- package/dist/src/index.d.ts +5 -1
- package/dist/src/index.d.ts.map +1 -1
- package/dist/src/index.js +3 -1
- package/dist/src/index.js.map +1 -1
- package/dist/src/interference.d.ts +5 -2
- package/dist/src/interference.d.ts.map +1 -1
- package/dist/src/interference.js +39 -32
- package/dist/src/interference.js.map +1 -1
- package/dist/src/introspect.js +18 -18
- package/dist/src/llm.d.ts.map +1 -1
- package/dist/src/llm.js +1 -0
- package/dist/src/llm.js.map +1 -1
- package/dist/src/migrate.d.ts.map +1 -1
- package/dist/src/migrate.js +21 -9
- package/dist/src/migrate.js.map +1 -1
- package/dist/src/preflight.d.ts +2 -1
- package/dist/src/preflight.d.ts.map +1 -1
- package/dist/src/preflight.js +66 -5
- package/dist/src/preflight.js.map +1 -1
- package/dist/src/profile.d.ts +23 -0
- package/dist/src/profile.d.ts.map +1 -0
- package/dist/src/profile.js +51 -0
- package/dist/src/profile.js.map +1 -0
- package/dist/src/promote.d.ts.map +1 -1
- package/dist/src/promote.js +8 -9
- package/dist/src/promote.js.map +1 -1
- package/dist/src/prompts.d.ts.map +1 -1
- package/dist/src/prompts.js +165 -136
- package/dist/src/prompts.js.map +1 -1
- package/dist/src/recall.d.ts +9 -6
- package/dist/src/recall.d.ts.map +1 -1
- package/dist/src/recall.js +204 -62
- package/dist/src/recall.js.map +1 -1
- package/dist/src/redact.d.ts +7 -1
- package/dist/src/redact.d.ts.map +1 -1
- package/dist/src/redact.js +94 -11
- package/dist/src/redact.js.map +1 -1
- package/dist/src/reflexes.d.ts +1 -0
- package/dist/src/reflexes.d.ts.map +1 -1
- package/dist/src/reflexes.js +3 -0
- package/dist/src/reflexes.js.map +1 -1
- package/dist/src/rollback.d.ts.map +1 -1
- package/dist/src/rollback.js +13 -8
- package/dist/src/rollback.js.map +1 -1
- package/dist/src/routes.d.ts +1 -0
- package/dist/src/routes.d.ts.map +1 -1
- package/dist/src/routes.js +251 -6
- package/dist/src/routes.js.map +1 -1
- package/dist/src/rules-compiler.d.ts.map +1 -1
- package/dist/src/rules-compiler.js +36 -6
- package/dist/src/rules-compiler.js.map +1 -1
- package/dist/src/server.d.ts +2 -1
- package/dist/src/server.d.ts.map +1 -1
- package/dist/src/server.js +42 -4
- package/dist/src/server.js.map +1 -1
- package/dist/src/tool-trace.d.ts.map +1 -1
- package/dist/src/tool-trace.js +42 -29
- package/dist/src/tool-trace.js.map +1 -1
- package/dist/src/types.d.ts +28 -1
- package/dist/src/types.d.ts.map +1 -1
- package/dist/src/ulid.d.ts.map +1 -1
- package/dist/src/ulid.js +52 -2
- package/dist/src/ulid.js.map +1 -1
- package/dist/src/utils.d.ts.map +1 -1
- package/dist/src/utils.js +8 -1
- package/dist/src/utils.js.map +1 -1
- package/dist/src/validate.d.ts +2 -0
- package/dist/src/validate.d.ts.map +1 -1
- package/dist/src/validate.js +77 -46
- package/dist/src/validate.js.map +1 -1
- package/docs/AUDREY_PAPER_OUTLINE.md +175 -0
- package/docs/MEMORY_BENCHMARKING.md +59 -0
- package/docs/PRODUCTION_BACKLOG.md +304 -0
- package/docs/paper/00-master.md +48 -0
- package/docs/paper/01-introduction.md +27 -0
- package/docs/paper/02-related-work.md +47 -0
- package/docs/paper/03-problem-definition.md +108 -0
- package/docs/paper/04-design.md +164 -0
- package/docs/paper/05-guardbench-spec.md +412 -0
- package/docs/paper/06-implementation.md +113 -0
- package/docs/paper/07-evaluation.md +168 -0
- package/docs/paper/08-discussion-limitations.md +61 -0
- package/docs/paper/09-conclusion.md +11 -0
- package/docs/paper/SUBMISSION_README.md +162 -0
- package/docs/paper/appendix-a-demo-transcript.md +114 -0
- package/docs/paper/arxiv-compile-report.schema.json +116 -0
- package/docs/paper/arxiv-source.schema.json +61 -0
- package/docs/paper/audrey-paper-v1.md +1106 -0
- package/docs/paper/browser-launch-plan.json +209 -0
- package/docs/paper/browser-launch-plan.schema.json +100 -0
- package/docs/paper/browser-launch-results.json +86 -0
- package/docs/paper/browser-launch-results.schema.json +66 -0
- package/docs/paper/claim-register.json +138 -0
- package/docs/paper/claim-register.schema.json +81 -0
- package/docs/paper/evidence-ledger.md +103 -0
- package/docs/paper/output/arxiv/README-arxiv.txt +8 -0
- package/docs/paper/output/arxiv/arxiv-manifest.json +41 -0
- package/docs/paper/output/arxiv/main.tex +949 -0
- package/docs/paper/output/arxiv/references.bib +222 -0
- package/docs/paper/output/arxiv-compile-report.json +24 -0
- package/docs/paper/output/submission-bundle/LICENSE +21 -0
- package/docs/paper/output/submission-bundle/README.md +533 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/adapter-self-test/guardbench-adapter-self-test.json +50 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/external/guardbench-external-dry-run.json +69 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/external/guardbench-external-evidence.json +56 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/guardbench-conformance-card.json +63 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/guardbench-manifest.json +414 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/guardbench-raw.json +1171 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/guardbench-summary.json +1981 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/leaderboard/guardbench-leaderboard.json +93 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/leaderboard/guardbench-leaderboard.md +7 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/submission-bundle/submission-manifest.json +131 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/submission-bundle/validation-report.json +31 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/summary.json +2354 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-adapter-registry.schema.json +69 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-adapter-self-test.schema.json +156 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-conformance-card.schema.json +184 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-external-dry-run.schema.json +74 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-external-evidence.schema.json +108 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-external-run.schema.json +160 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-leaderboard.schema.json +179 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-manifest.schema.json +213 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-publication-verification.schema.json +47 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-raw.schema.json +164 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-submission-manifest.schema.json +151 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-summary.schema.json +228 -0
- package/docs/paper/output/submission-bundle/docs/AUDREY_PAPER_OUTLINE.md +175 -0
- package/docs/paper/output/submission-bundle/docs/paper/00-master.md +48 -0
- package/docs/paper/output/submission-bundle/docs/paper/01-introduction.md +27 -0
- package/docs/paper/output/submission-bundle/docs/paper/02-related-work.md +47 -0
- package/docs/paper/output/submission-bundle/docs/paper/03-problem-definition.md +108 -0
- package/docs/paper/output/submission-bundle/docs/paper/04-design.md +164 -0
- package/docs/paper/output/submission-bundle/docs/paper/05-guardbench-spec.md +412 -0
- package/docs/paper/output/submission-bundle/docs/paper/06-implementation.md +113 -0
- package/docs/paper/output/submission-bundle/docs/paper/07-evaluation.md +168 -0
- package/docs/paper/output/submission-bundle/docs/paper/08-discussion-limitations.md +61 -0
- package/docs/paper/output/submission-bundle/docs/paper/09-conclusion.md +11 -0
- package/docs/paper/output/submission-bundle/docs/paper/SUBMISSION_README.md +162 -0
- package/docs/paper/output/submission-bundle/docs/paper/appendix-a-demo-transcript.md +114 -0
- package/docs/paper/output/submission-bundle/docs/paper/arxiv-compile-report.schema.json +116 -0
- package/docs/paper/output/submission-bundle/docs/paper/arxiv-source.schema.json +61 -0
- package/docs/paper/output/submission-bundle/docs/paper/audrey-paper-v1.md +1106 -0
- package/docs/paper/output/submission-bundle/docs/paper/browser-launch-plan.json +209 -0
- package/docs/paper/output/submission-bundle/docs/paper/browser-launch-plan.schema.json +100 -0
- package/docs/paper/output/submission-bundle/docs/paper/browser-launch-results.json +86 -0
- package/docs/paper/output/submission-bundle/docs/paper/browser-launch-results.schema.json +66 -0
- package/docs/paper/output/submission-bundle/docs/paper/claim-register.json +138 -0
- package/docs/paper/output/submission-bundle/docs/paper/claim-register.schema.json +81 -0
- package/docs/paper/output/submission-bundle/docs/paper/evidence-ledger.md +103 -0
- package/docs/paper/output/submission-bundle/docs/paper/output/arxiv/README-arxiv.txt +8 -0
- package/docs/paper/output/submission-bundle/docs/paper/output/arxiv/arxiv-manifest.json +41 -0
- package/docs/paper/output/submission-bundle/docs/paper/output/arxiv/main.tex +949 -0
- package/docs/paper/output/submission-bundle/docs/paper/output/arxiv/references.bib +222 -0
- package/docs/paper/output/submission-bundle/docs/paper/output/arxiv-compile-report.json +24 -0
- package/docs/paper/output/submission-bundle/docs/paper/paper-submission-bundle.schema.json +70 -0
- package/docs/paper/output/submission-bundle/docs/paper/publication-pack.json +81 -0
- package/docs/paper/output/submission-bundle/docs/paper/publication-pack.schema.json +60 -0
- package/docs/paper/output/submission-bundle/docs/paper/references.bib +222 -0
- package/docs/paper/output/submission-bundle/package.json +212 -0
- package/docs/paper/output/submission-bundle/paper-submission-manifest.json +379 -0
- package/docs/paper/paper-submission-bundle.schema.json +70 -0
- package/docs/paper/publication-pack.json +81 -0
- package/docs/paper/publication-pack.schema.json +60 -0
- package/docs/paper/references.bib +222 -0
- package/package.json +103 -26
- package/scripts/audit-release-completion.mjs +362 -0
- package/scripts/create-arxiv-source.mjs +362 -0
- package/scripts/create-paper-submission-bundle.mjs +210 -0
- package/scripts/finalize-release.mjs +526 -0
- package/scripts/prepare-release-cut.mjs +269 -0
- package/scripts/publish-release-bundle.mjs +209 -0
- package/scripts/publish-release-github-api.mjs +429 -0
- package/scripts/run-vitest.mjs +34 -0
- package/scripts/smoke-cli.js +72 -0
- package/scripts/sync-paper-artifacts.mjs +109 -0
- package/scripts/verify-arxiv-compile.mjs +440 -0
- package/scripts/verify-arxiv-source.mjs +194 -0
- package/scripts/verify-browser-launch-plan.mjs +237 -0
- package/scripts/verify-browser-launch-results.mjs +285 -0
- package/scripts/verify-paper-artifacts.mjs +338 -0
- package/scripts/verify-paper-claims.mjs +226 -0
- package/scripts/verify-paper-submission-bundle.mjs +207 -0
- package/scripts/verify-publication-pack.mjs +196 -0
- package/scripts/verify-python-package.py +201 -0
- package/scripts/verify-release-readiness.mjs +741 -0
- package/docs/assets/benchmarks/local-benchmark.svg +0 -45
- package/docs/assets/benchmarks/operations-benchmark.svg +0 -45
- package/docs/assets/benchmarks/published-memory-standards.svg +0 -50
- package/docs/audrey-for-dummies.md +0 -670
- package/docs/benchmarking.md +0 -151
- package/docs/future-of-llm-memory.md +0 -452
- package/docs/mcp-hosts.md +0 -206
- package/docs/ollama-local-agents.md +0 -128
- package/docs/production-readiness.md +0 -128
|
@@ -0,0 +1,379 @@
|
|
|
1
|
+
{
|
|
2
|
+
"schemaVersion": "1.0.0",
|
|
3
|
+
"suite": "Audrey paper submission bundle",
|
|
4
|
+
"generatedAt": "2026-05-13T23:33:57.713Z",
|
|
5
|
+
"sourceRoot": ".",
|
|
6
|
+
"outDir": "docs/paper/output/submission-bundle",
|
|
7
|
+
"claimVerification": {
|
|
8
|
+
"ok": true,
|
|
9
|
+
"count": 4
|
|
10
|
+
},
|
|
11
|
+
"publicationPackVerification": {
|
|
12
|
+
"ok": true,
|
|
13
|
+
"count": 9
|
|
14
|
+
},
|
|
15
|
+
"guardBenchSnapshot": {
|
|
16
|
+
"passed": 10,
|
|
17
|
+
"scenarios": 10,
|
|
18
|
+
"redactionLeaks": 0,
|
|
19
|
+
"artifactLeaks": 0,
|
|
20
|
+
"latencyP50Ms": 3.097,
|
|
21
|
+
"latencyP95Ms": 29.711
|
|
22
|
+
},
|
|
23
|
+
"files": [
|
|
24
|
+
{
|
|
25
|
+
"path": "benchmarks/output/adapter-self-test/guardbench-adapter-self-test.json",
|
|
26
|
+
"source": "benchmarks/output/adapter-self-test/guardbench-adapter-self-test.json",
|
|
27
|
+
"bytes": 1261,
|
|
28
|
+
"sha256": "b9fa6d2343c56a8231c1f2d12330676ac760c7d7157d2479e5fbd345c09baacd"
|
|
29
|
+
},
|
|
30
|
+
{
|
|
31
|
+
"path": "benchmarks/output/external/guardbench-external-dry-run.json",
|
|
32
|
+
"source": "benchmarks/output/external/guardbench-external-dry-run.json",
|
|
33
|
+
"bytes": 1831,
|
|
34
|
+
"sha256": "988dc23a7d4724bd76f7e1a01c89bf1c7708e38d24dcae0baafed5ea37e6aa20"
|
|
35
|
+
},
|
|
36
|
+
{
|
|
37
|
+
"path": "benchmarks/output/external/guardbench-external-evidence.json",
|
|
38
|
+
"source": "benchmarks/output/external/guardbench-external-evidence.json",
|
|
39
|
+
"bytes": 1638,
|
|
40
|
+
"sha256": "685572d86fb30ac6a6249f0cd1b6a6058b10d6784d88a4a25e0fc17136637379"
|
|
41
|
+
},
|
|
42
|
+
{
|
|
43
|
+
"path": "benchmarks/output/guardbench-conformance-card.json",
|
|
44
|
+
"source": "benchmarks/output/guardbench-conformance-card.json",
|
|
45
|
+
"bytes": 1735,
|
|
46
|
+
"sha256": "0709bb4d93a797764e4ed5655c575390a57554a42625398d378c8ec0f23bd2b4"
|
|
47
|
+
},
|
|
48
|
+
{
|
|
49
|
+
"path": "benchmarks/output/guardbench-manifest.json",
|
|
50
|
+
"source": "benchmarks/output/guardbench-manifest.json",
|
|
51
|
+
"bytes": 12056,
|
|
52
|
+
"sha256": "57636ce19fdaa6e50fc3fc961d9e499a9f43632f588c713a9fefe8e8a6fa724c"
|
|
53
|
+
},
|
|
54
|
+
{
|
|
55
|
+
"path": "benchmarks/output/guardbench-raw.json",
|
|
56
|
+
"source": "benchmarks/output/guardbench-raw.json",
|
|
57
|
+
"bytes": 39429,
|
|
58
|
+
"sha256": "c5b9c68cf946478fbfba617f17717e05ea3e01301089de19153d59e77e674bc6"
|
|
59
|
+
},
|
|
60
|
+
{
|
|
61
|
+
"path": "benchmarks/output/guardbench-summary.json",
|
|
62
|
+
"source": "benchmarks/output/guardbench-summary.json",
|
|
63
|
+
"bytes": 64381,
|
|
64
|
+
"sha256": "2a6d5ee83cce2502135fb0442ef8cd3f2679fdc38c84207612c22a800a7a113a"
|
|
65
|
+
},
|
|
66
|
+
{
|
|
67
|
+
"path": "benchmarks/output/leaderboard/guardbench-leaderboard.json",
|
|
68
|
+
"source": "benchmarks/output/leaderboard/guardbench-leaderboard.json",
|
|
69
|
+
"bytes": 2798,
|
|
70
|
+
"sha256": "55c6fabf3e4ccf399650aadf7d34e83d4bcdd5cfe26439e3d50a7cf9dac0ec66"
|
|
71
|
+
},
|
|
72
|
+
{
|
|
73
|
+
"path": "benchmarks/output/leaderboard/guardbench-leaderboard.md",
|
|
74
|
+
"source": "benchmarks/output/leaderboard/guardbench-leaderboard.md",
|
|
75
|
+
"bytes": 364,
|
|
76
|
+
"sha256": "d04ac3106b4b4d5563b9cdddb1f5816ff62ad0636836d29f8b91af1d80755458"
|
|
77
|
+
},
|
|
78
|
+
{
|
|
79
|
+
"path": "benchmarks/output/submission-bundle/submission-manifest.json",
|
|
80
|
+
"source": "benchmarks/output/submission-bundle/submission-manifest.json",
|
|
81
|
+
"bytes": 3986,
|
|
82
|
+
"sha256": "2c37a32eab5dba72b197971ed7a63173d7a395d0e65707a5490a7a868b332c6f"
|
|
83
|
+
},
|
|
84
|
+
{
|
|
85
|
+
"path": "benchmarks/output/submission-bundle/validation-report.json",
|
|
86
|
+
"source": "benchmarks/output/submission-bundle/validation-report.json",
|
|
87
|
+
"bytes": 739,
|
|
88
|
+
"sha256": "9734a26b31a7511fbba361f22245dd6325b65fe47d1072fa59df7eeb15d724a1"
|
|
89
|
+
},
|
|
90
|
+
{
|
|
91
|
+
"path": "benchmarks/output/summary.json",
|
|
92
|
+
"source": "benchmarks/output/summary.json",
|
|
93
|
+
"bytes": 100749,
|
|
94
|
+
"sha256": "75d778ce194cf9122b3e58bd361b2e15ecc5c1597aa62c060f567011af73963e"
|
|
95
|
+
},
|
|
96
|
+
{
|
|
97
|
+
"path": "benchmarks/schemas/guardbench-adapter-registry.schema.json",
|
|
98
|
+
"source": "benchmarks/schemas/guardbench-adapter-registry.schema.json",
|
|
99
|
+
"bytes": 2016,
|
|
100
|
+
"sha256": "0fb401e0b00270f16287a47cdb868ec6ac23e85f134958141f37519bf0c67164"
|
|
101
|
+
},
|
|
102
|
+
{
|
|
103
|
+
"path": "benchmarks/schemas/guardbench-adapter-self-test.schema.json",
|
|
104
|
+
"source": "benchmarks/schemas/guardbench-adapter-self-test.schema.json",
|
|
105
|
+
"bytes": 4572,
|
|
106
|
+
"sha256": "369402022870257c0bca52c05f21e53b40e310547bf49871ce08b2976c755127"
|
|
107
|
+
},
|
|
108
|
+
{
|
|
109
|
+
"path": "benchmarks/schemas/guardbench-conformance-card.schema.json",
|
|
110
|
+
"source": "benchmarks/schemas/guardbench-conformance-card.schema.json",
|
|
111
|
+
"bytes": 5251,
|
|
112
|
+
"sha256": "337e197617e889388ff9f71f361b6c75450b43c1c131af622d4a59bc4faca89e"
|
|
113
|
+
},
|
|
114
|
+
{
|
|
115
|
+
"path": "benchmarks/schemas/guardbench-external-dry-run.schema.json",
|
|
116
|
+
"source": "benchmarks/schemas/guardbench-external-dry-run.schema.json",
|
|
117
|
+
"bytes": 2177,
|
|
118
|
+
"sha256": "df327a2b2c1cd7bf4453457c83ebc10708e6f56aa1d3526c7ac492a1b254880c"
|
|
119
|
+
},
|
|
120
|
+
{
|
|
121
|
+
"path": "benchmarks/schemas/guardbench-external-evidence.schema.json",
|
|
122
|
+
"source": "benchmarks/schemas/guardbench-external-evidence.schema.json",
|
|
123
|
+
"bytes": 3075,
|
|
124
|
+
"sha256": "c6f7af89c53d039ff7e3b3b9f5829a7524e4a24c254dd17754dd51469c0295d1"
|
|
125
|
+
},
|
|
126
|
+
{
|
|
127
|
+
"path": "benchmarks/schemas/guardbench-external-run.schema.json",
|
|
128
|
+
"source": "benchmarks/schemas/guardbench-external-run.schema.json",
|
|
129
|
+
"bytes": 4443,
|
|
130
|
+
"sha256": "36f79172e6b9264fa7f16a90684f2c75fb3f8432c5226be4181d93622b17b40b"
|
|
131
|
+
},
|
|
132
|
+
{
|
|
133
|
+
"path": "benchmarks/schemas/guardbench-leaderboard.schema.json",
|
|
134
|
+
"source": "benchmarks/schemas/guardbench-leaderboard.schema.json",
|
|
135
|
+
"bytes": 5457,
|
|
136
|
+
"sha256": "ac3414af9f97d3c3b241ffea3fe9995295cb107dbc4fddef2f32f0d3de2d1abf"
|
|
137
|
+
},
|
|
138
|
+
{
|
|
139
|
+
"path": "benchmarks/schemas/guardbench-manifest.schema.json",
|
|
140
|
+
"source": "benchmarks/schemas/guardbench-manifest.schema.json",
|
|
141
|
+
"bytes": 6345,
|
|
142
|
+
"sha256": "a2995e946908f094dfd5db264db87615167586d57f1a335aa9bf2262b709ef4d"
|
|
143
|
+
},
|
|
144
|
+
{
|
|
145
|
+
"path": "benchmarks/schemas/guardbench-publication-verification.schema.json",
|
|
146
|
+
"source": "benchmarks/schemas/guardbench-publication-verification.schema.json",
|
|
147
|
+
"bytes": 1713,
|
|
148
|
+
"sha256": "a83442c23dee3805b6c1bd3b8524b16948b5dc78d3d65074142c2a99c733f1b9"
|
|
149
|
+
},
|
|
150
|
+
{
|
|
151
|
+
"path": "benchmarks/schemas/guardbench-raw.schema.json",
|
|
152
|
+
"source": "benchmarks/schemas/guardbench-raw.schema.json",
|
|
153
|
+
"bytes": 5057,
|
|
154
|
+
"sha256": "f419685932a5549d5efef611b1dbbe585300365de3c977fcfedf174672f6bc3a"
|
|
155
|
+
},
|
|
156
|
+
{
|
|
157
|
+
"path": "benchmarks/schemas/guardbench-submission-manifest.schema.json",
|
|
158
|
+
"source": "benchmarks/schemas/guardbench-submission-manifest.schema.json",
|
|
159
|
+
"bytes": 4469,
|
|
160
|
+
"sha256": "4d624bec3cbb7f3043064a874bd869ac8556f42231f0871a179f58cd8fbcfb23"
|
|
161
|
+
},
|
|
162
|
+
{
|
|
163
|
+
"path": "benchmarks/schemas/guardbench-summary.schema.json",
|
|
164
|
+
"source": "benchmarks/schemas/guardbench-summary.schema.json",
|
|
165
|
+
"bytes": 7331,
|
|
166
|
+
"sha256": "ac70b448c730fb8b01899615477a167a64734d16304c39d661b2b3130e8aa1da"
|
|
167
|
+
},
|
|
168
|
+
{
|
|
169
|
+
"path": "docs/AUDREY_PAPER_OUTLINE.md",
|
|
170
|
+
"source": "docs/AUDREY_PAPER_OUTLINE.md",
|
|
171
|
+
"bytes": 9329,
|
|
172
|
+
"sha256": "a728e690ccfcba6c7854bb4589123fb8714f17c9b2a7ae1109aa5ad6f7e75b81"
|
|
173
|
+
},
|
|
174
|
+
{
|
|
175
|
+
"path": "docs/paper/00-master.md",
|
|
176
|
+
"source": "docs/paper/00-master.md",
|
|
177
|
+
"bytes": 3590,
|
|
178
|
+
"sha256": "375cff75dff1621c327ff2e670c14effdbddfff9f58e90340e60588916c43f51"
|
|
179
|
+
},
|
|
180
|
+
{
|
|
181
|
+
"path": "docs/paper/01-introduction.md",
|
|
182
|
+
"source": "docs/paper/01-introduction.md",
|
|
183
|
+
"bytes": 5211,
|
|
184
|
+
"sha256": "d7af48b19e87713d951a8a62ad072846aab1d860bc314f7b76fd088fcb20b1d4"
|
|
185
|
+
},
|
|
186
|
+
{
|
|
187
|
+
"path": "docs/paper/02-related-work.md",
|
|
188
|
+
"source": "docs/paper/02-related-work.md",
|
|
189
|
+
"bytes": 9127,
|
|
190
|
+
"sha256": "994db1f186f040056e91755551a52ca7a370f11261766c721c3920e9098afaf2"
|
|
191
|
+
},
|
|
192
|
+
{
|
|
193
|
+
"path": "docs/paper/03-problem-definition.md",
|
|
194
|
+
"source": "docs/paper/03-problem-definition.md",
|
|
195
|
+
"bytes": 10643,
|
|
196
|
+
"sha256": "1d5d44c83a9527dffb27b7eb228a83b28a0113ec27d25975c4b36b855c296589"
|
|
197
|
+
},
|
|
198
|
+
{
|
|
199
|
+
"path": "docs/paper/04-design.md",
|
|
200
|
+
"source": "docs/paper/04-design.md",
|
|
201
|
+
"bytes": 15961,
|
|
202
|
+
"sha256": "ebcdd61e66f26e67dca21783d3bde885c64f54826715efdbc3e27640ea4ca2c0"
|
|
203
|
+
},
|
|
204
|
+
{
|
|
205
|
+
"path": "docs/paper/05-guardbench-spec.md",
|
|
206
|
+
"source": "docs/paper/05-guardbench-spec.md",
|
|
207
|
+
"bytes": 39027,
|
|
208
|
+
"sha256": "a9a7abd93c6bc50a4146819f4b81a418f489caff1a56a71a35bdeccd9e8a1514"
|
|
209
|
+
},
|
|
210
|
+
{
|
|
211
|
+
"path": "docs/paper/06-implementation.md",
|
|
212
|
+
"source": "docs/paper/06-implementation.md",
|
|
213
|
+
"bytes": 14471,
|
|
214
|
+
"sha256": "497fa20661f152da603ec0801f56e06ec81817487e4c2079775669368dd80ba3"
|
|
215
|
+
},
|
|
216
|
+
{
|
|
217
|
+
"path": "docs/paper/07-evaluation.md",
|
|
218
|
+
"source": "docs/paper/07-evaluation.md",
|
|
219
|
+
"bytes": 11240,
|
|
220
|
+
"sha256": "8062c2f8b2a50af7d921a0358db85f9e65bee742f4c8e2244cadb8756c4fe703"
|
|
221
|
+
},
|
|
222
|
+
{
|
|
223
|
+
"path": "docs/paper/08-discussion-limitations.md",
|
|
224
|
+
"source": "docs/paper/08-discussion-limitations.md",
|
|
225
|
+
"bytes": 9010,
|
|
226
|
+
"sha256": "71645e65e2621029b2added1302f34e89332e223a6b162ead86c278230c1f8d1"
|
|
227
|
+
},
|
|
228
|
+
{
|
|
229
|
+
"path": "docs/paper/09-conclusion.md",
|
|
230
|
+
"source": "docs/paper/09-conclusion.md",
|
|
231
|
+
"bytes": 1561,
|
|
232
|
+
"sha256": "7beb8157eef4caa5ed36852ada382e0ce8254473bb070bcac5c309671742d509"
|
|
233
|
+
},
|
|
234
|
+
{
|
|
235
|
+
"path": "docs/paper/appendix-a-demo-transcript.md",
|
|
236
|
+
"source": "docs/paper/appendix-a-demo-transcript.md",
|
|
237
|
+
"bytes": 5258,
|
|
238
|
+
"sha256": "a6d43e28aea72c85ec0f1cc33f1d70a4df38aed3dba58ec9ca96c325c0759074"
|
|
239
|
+
},
|
|
240
|
+
{
|
|
241
|
+
"path": "docs/paper/arxiv-compile-report.schema.json",
|
|
242
|
+
"source": "docs/paper/arxiv-compile-report.schema.json",
|
|
243
|
+
"bytes": 3129,
|
|
244
|
+
"sha256": "2cefebdca45b8304cd5846bf2ae15cb3cb43cc1ce3ebfbcfdd790c24a55a05e3"
|
|
245
|
+
},
|
|
246
|
+
{
|
|
247
|
+
"path": "docs/paper/arxiv-source.schema.json",
|
|
248
|
+
"source": "docs/paper/arxiv-source.schema.json",
|
|
249
|
+
"bytes": 2262,
|
|
250
|
+
"sha256": "5be714fb038985e16a83bba2c596c15b541f01f6ac6c1448fcb295bb638f4e27"
|
|
251
|
+
},
|
|
252
|
+
{
|
|
253
|
+
"path": "docs/paper/audrey-paper-v1.md",
|
|
254
|
+
"source": "docs/paper/audrey-paper-v1.md",
|
|
255
|
+
"bytes": 116195,
|
|
256
|
+
"sha256": "3f9c807f0e0e82b0f19018b83900b62efecc17ff9bcee5b493a5d4fe0528ad7a"
|
|
257
|
+
},
|
|
258
|
+
{
|
|
259
|
+
"path": "docs/paper/browser-launch-plan.json",
|
|
260
|
+
"source": "docs/paper/browser-launch-plan.json",
|
|
261
|
+
"bytes": 8613,
|
|
262
|
+
"sha256": "32869c1b77c53d2b7a1da8b13efa4eabb959443efad55a4d4d873d6ca39fced3"
|
|
263
|
+
},
|
|
264
|
+
{
|
|
265
|
+
"path": "docs/paper/browser-launch-plan.schema.json",
|
|
266
|
+
"source": "docs/paper/browser-launch-plan.schema.json",
|
|
267
|
+
"bytes": 3266,
|
|
268
|
+
"sha256": "de9252f560ae4178b8c50da1e05ae344d8e42eb294af38e8782e6a461cd4b51c"
|
|
269
|
+
},
|
|
270
|
+
{
|
|
271
|
+
"path": "docs/paper/browser-launch-results.json",
|
|
272
|
+
"source": "docs/paper/browser-launch-results.json",
|
|
273
|
+
"bytes": 9232,
|
|
274
|
+
"sha256": "4a111b6b16981d2adffc4930088f0efe1c331ad9adff6fe966f59683d7097a0a"
|
|
275
|
+
},
|
|
276
|
+
{
|
|
277
|
+
"path": "docs/paper/browser-launch-results.schema.json",
|
|
278
|
+
"source": "docs/paper/browser-launch-results.schema.json",
|
|
279
|
+
"bytes": 2135,
|
|
280
|
+
"sha256": "5832bd8e716fb167584232a8bb639f8b201a28adedea2dd3d72be3facfb33931"
|
|
281
|
+
},
|
|
282
|
+
{
|
|
283
|
+
"path": "docs/paper/claim-register.json",
|
|
284
|
+
"source": "docs/paper/claim-register.json",
|
|
285
|
+
"bytes": 4513,
|
|
286
|
+
"sha256": "c1aa78a87cd5b944e8117acc8785f84a9af179aa9cd5dc616deb9e637d7ee682"
|
|
287
|
+
},
|
|
288
|
+
{
|
|
289
|
+
"path": "docs/paper/claim-register.schema.json",
|
|
290
|
+
"source": "docs/paper/claim-register.schema.json",
|
|
291
|
+
"bytes": 2181,
|
|
292
|
+
"sha256": "4a142f7c4bf25ccfeeb4ecd7fbda2323ffd40192827e21a6c8bd5b8ff726d715"
|
|
293
|
+
},
|
|
294
|
+
{
|
|
295
|
+
"path": "docs/paper/evidence-ledger.md",
|
|
296
|
+
"source": "docs/paper/evidence-ledger.md",
|
|
297
|
+
"bytes": 61844,
|
|
298
|
+
"sha256": "2a376be83b65df3a7038ddbd684e809d538ef35cbe34d91eb309773502bb5920"
|
|
299
|
+
},
|
|
300
|
+
{
|
|
301
|
+
"path": "docs/paper/output/arxiv-compile-report.json",
|
|
302
|
+
"source": "docs/paper/output/arxiv-compile-report.json",
|
|
303
|
+
"bytes": 924,
|
|
304
|
+
"sha256": "11018bea60272ce8467675cf6491e9a7dbfeb3a774ee502dd1adc8ba5d3b1112"
|
|
305
|
+
},
|
|
306
|
+
{
|
|
307
|
+
"path": "docs/paper/output/arxiv/arxiv-manifest.json",
|
|
308
|
+
"source": "docs/paper/output/arxiv/arxiv-manifest.json",
|
|
309
|
+
"bytes": 1316,
|
|
310
|
+
"sha256": "386121a5f6234f56a370c5c54bde4ff12fc462921e7e5770d6968a4710271df8"
|
|
311
|
+
},
|
|
312
|
+
{
|
|
313
|
+
"path": "docs/paper/output/arxiv/main.tex",
|
|
314
|
+
"source": "docs/paper/output/arxiv/main.tex",
|
|
315
|
+
"bytes": 122247,
|
|
316
|
+
"sha256": "b0122e625380ad9a6aff78e2acbd5984b558c054962f8774f77fee70e6588d06"
|
|
317
|
+
},
|
|
318
|
+
{
|
|
319
|
+
"path": "docs/paper/output/arxiv/README-arxiv.txt",
|
|
320
|
+
"source": "docs/paper/output/arxiv/README-arxiv.txt",
|
|
321
|
+
"bytes": 327,
|
|
322
|
+
"sha256": "10770b31a7aff7ec87f1cd7d1b5595778dabc5ff64180c7b65332bbc1897b13d"
|
|
323
|
+
},
|
|
324
|
+
{
|
|
325
|
+
"path": "docs/paper/output/arxiv/references.bib",
|
|
326
|
+
"source": "docs/paper/output/arxiv/references.bib",
|
|
327
|
+
"bytes": 8285,
|
|
328
|
+
"sha256": "c0bfcaf7bfe37d6933c812e46352be8a95397eaa430a0f5bc94037600a53f654"
|
|
329
|
+
},
|
|
330
|
+
{
|
|
331
|
+
"path": "docs/paper/paper-submission-bundle.schema.json",
|
|
332
|
+
"source": "docs/paper/paper-submission-bundle.schema.json",
|
|
333
|
+
"bytes": 2260,
|
|
334
|
+
"sha256": "9714642edb7fd34073fc417af9ce889faa6da16e4a48a07a14a804957edaa3df"
|
|
335
|
+
},
|
|
336
|
+
{
|
|
337
|
+
"path": "docs/paper/publication-pack.json",
|
|
338
|
+
"source": "docs/paper/publication-pack.json",
|
|
339
|
+
"bytes": 6565,
|
|
340
|
+
"sha256": "a1a523d5938faea72be568b843ac3890e61cea6070b0cfa46acf22ad3d2fb974"
|
|
341
|
+
},
|
|
342
|
+
{
|
|
343
|
+
"path": "docs/paper/publication-pack.schema.json",
|
|
344
|
+
"source": "docs/paper/publication-pack.schema.json",
|
|
345
|
+
"bytes": 1606,
|
|
346
|
+
"sha256": "94577686ffe14636cedc54a9d735b2ad1dc265c532efc03b19f68b5782f550ba"
|
|
347
|
+
},
|
|
348
|
+
{
|
|
349
|
+
"path": "docs/paper/references.bib",
|
|
350
|
+
"source": "docs/paper/references.bib",
|
|
351
|
+
"bytes": 8285,
|
|
352
|
+
"sha256": "c0bfcaf7bfe37d6933c812e46352be8a95397eaa430a0f5bc94037600a53f654"
|
|
353
|
+
},
|
|
354
|
+
{
|
|
355
|
+
"path": "docs/paper/SUBMISSION_README.md",
|
|
356
|
+
"source": "docs/paper/SUBMISSION_README.md",
|
|
357
|
+
"bytes": 18992,
|
|
358
|
+
"sha256": "3c756a518a44da0fc2b80b8d28a7b3abbe5b5a758ce03c16b30aad51385ea554"
|
|
359
|
+
},
|
|
360
|
+
{
|
|
361
|
+
"path": "LICENSE",
|
|
362
|
+
"source": "LICENSE",
|
|
363
|
+
"bytes": 1066,
|
|
364
|
+
"sha256": "77e02bd8d273d655d537296bc2d9f0bb00a521911b25bf276f749497d983de9e"
|
|
365
|
+
},
|
|
366
|
+
{
|
|
367
|
+
"path": "package.json",
|
|
368
|
+
"source": "package.json",
|
|
369
|
+
"bytes": 11668,
|
|
370
|
+
"sha256": "0892c9cdc5bab8f5036a12ef3cad5eb0b509eea86813f5d49cda29f6d38653c2"
|
|
371
|
+
},
|
|
372
|
+
{
|
|
373
|
+
"path": "README.md",
|
|
374
|
+
"source": "README.md",
|
|
375
|
+
"bytes": 24693,
|
|
376
|
+
"sha256": "f7c5ac813046ad9f3def5fea67bbae8f1f817b38201d57f9a3565b04470681c6"
|
|
377
|
+
}
|
|
378
|
+
]
|
|
379
|
+
}
|
|
@@ -0,0 +1,70 @@
|
|
|
1
|
+
{
|
|
2
|
+
"$schema": "https://json-schema.org/draft/2020-12/schema",
|
|
3
|
+
"$id": "https://audrey-memory.org/schemas/audrey-paper-submission-bundle.schema.json",
|
|
4
|
+
"title": "Audrey Paper Submission Bundle",
|
|
5
|
+
"type": "object",
|
|
6
|
+
"additionalProperties": false,
|
|
7
|
+
"required": [
|
|
8
|
+
"schemaVersion",
|
|
9
|
+
"suite",
|
|
10
|
+
"generatedAt",
|
|
11
|
+
"sourceRoot",
|
|
12
|
+
"outDir",
|
|
13
|
+
"claimVerification",
|
|
14
|
+
"publicationPackVerification",
|
|
15
|
+
"guardBenchSnapshot",
|
|
16
|
+
"files"
|
|
17
|
+
],
|
|
18
|
+
"properties": {
|
|
19
|
+
"schemaVersion": { "const": "1.0.0" },
|
|
20
|
+
"suite": { "const": "Audrey paper submission bundle" },
|
|
21
|
+
"generatedAt": { "type": "string", "minLength": 1 },
|
|
22
|
+
"sourceRoot": { "type": "string", "minLength": 1 },
|
|
23
|
+
"outDir": { "type": "string", "minLength": 1 },
|
|
24
|
+
"claimVerification": { "$ref": "#/$defs/check" },
|
|
25
|
+
"publicationPackVerification": { "$ref": "#/$defs/check" },
|
|
26
|
+
"guardBenchSnapshot": {
|
|
27
|
+
"type": "object",
|
|
28
|
+
"additionalProperties": false,
|
|
29
|
+
"required": ["passed", "scenarios", "redactionLeaks", "artifactLeaks", "latencyP50Ms", "latencyP95Ms"],
|
|
30
|
+
"properties": {
|
|
31
|
+
"passed": { "type": "integer", "minimum": 0 },
|
|
32
|
+
"scenarios": { "type": "integer", "minimum": 0 },
|
|
33
|
+
"redactionLeaks": { "type": "integer", "minimum": 0 },
|
|
34
|
+
"artifactLeaks": { "type": "integer", "minimum": 0 },
|
|
35
|
+
"latencyP50Ms": { "type": "number", "minimum": 0 },
|
|
36
|
+
"latencyP95Ms": { "type": "number", "minimum": 0 }
|
|
37
|
+
}
|
|
38
|
+
},
|
|
39
|
+
"files": {
|
|
40
|
+
"type": "array",
|
|
41
|
+
"minItems": 1,
|
|
42
|
+
"items": { "$ref": "#/$defs/fileRecord" }
|
|
43
|
+
}
|
|
44
|
+
},
|
|
45
|
+
"$defs": {
|
|
46
|
+
"check": {
|
|
47
|
+
"type": "object",
|
|
48
|
+
"additionalProperties": false,
|
|
49
|
+
"required": ["ok", "count"],
|
|
50
|
+
"properties": {
|
|
51
|
+
"ok": { "type": "boolean" },
|
|
52
|
+
"count": { "type": "integer", "minimum": 0 }
|
|
53
|
+
}
|
|
54
|
+
},
|
|
55
|
+
"fileRecord": {
|
|
56
|
+
"type": "object",
|
|
57
|
+
"additionalProperties": false,
|
|
58
|
+
"required": ["path", "source", "bytes", "sha256"],
|
|
59
|
+
"properties": {
|
|
60
|
+
"path": { "type": "string", "minLength": 1 },
|
|
61
|
+
"source": { "type": "string", "minLength": 1 },
|
|
62
|
+
"bytes": { "type": "integer", "minimum": 0 },
|
|
63
|
+
"sha256": {
|
|
64
|
+
"type": "string",
|
|
65
|
+
"pattern": "^[a-f0-9]{64}$"
|
|
66
|
+
}
|
|
67
|
+
}
|
|
68
|
+
}
|
|
69
|
+
}
|
|
70
|
+
}
|
|
@@ -0,0 +1,81 @@
|
|
|
1
|
+
{
|
|
2
|
+
"schemaVersion": "1.0.0",
|
|
3
|
+
"suite": "Audrey publication pack",
|
|
4
|
+
"claimRegister": "docs/paper/claim-register.json",
|
|
5
|
+
"entries": [
|
|
6
|
+
{
|
|
7
|
+
"id": "arxiv-title",
|
|
8
|
+
"platform": "arxiv",
|
|
9
|
+
"kind": "title",
|
|
10
|
+
"claimIds": ["C01", "C03"],
|
|
11
|
+
"maxChars": 180,
|
|
12
|
+
"text": "Audrey: Local-First Pre-Action Memory Control for AI Agents"
|
|
13
|
+
},
|
|
14
|
+
{
|
|
15
|
+
"id": "arxiv-abstract",
|
|
16
|
+
"platform": "arxiv",
|
|
17
|
+
"kind": "abstract",
|
|
18
|
+
"claimIds": ["C01", "C02", "C03", "C04"],
|
|
19
|
+
"maxChars": 1920,
|
|
20
|
+
"text": "AI agents increasingly rely on long-running tool use, but most memory systems are evaluated as retrieval layers rather than as pre-action control systems. Audrey is a local-first memory runtime that records episodes, procedures, contradictions, tool traces, validation outcomes, and salience, then checks relevant memory before an agent touches tools. The paper introduces GuardBench, a Stage-A benchmark specification for memory-before-action behavior, and reports a local comparative run across Audrey Guard, no-memory, recent-window, vector-only, and FTS-only adapters. In the current repository artifacts, Audrey Guard passes 10/10 local GuardBench scenarios with zero seeded raw-secret leaks in published artifacts. The paper does not report external-system GuardBench scores; Mem0 and Zep adapters exist, but live credentialed outputs remain pending strict evidence verification. The release includes schema-bound manifests, raw outputs, conformance cards, submission bundles, leaderboard artifacts, an external evidence verifier, and a claim register that blocks unsupported public claims."
|
|
21
|
+
},
|
|
22
|
+
{
|
|
23
|
+
"id": "hacker-news-title",
|
|
24
|
+
"platform": "hacker-news",
|
|
25
|
+
"kind": "title",
|
|
26
|
+
"claimIds": ["C01", "C03"],
|
|
27
|
+
"maxChars": 80,
|
|
28
|
+
"text": "Show HN: Audrey, a local-first memory firewall for AI agents"
|
|
29
|
+
},
|
|
30
|
+
{
|
|
31
|
+
"id": "hacker-news-comment",
|
|
32
|
+
"platform": "hacker-news",
|
|
33
|
+
"kind": "body",
|
|
34
|
+
"claimIds": ["C01", "C02", "C03", "C04"],
|
|
35
|
+
"maxChars": 1800,
|
|
36
|
+
"text": "Audrey is my local-first memory runtime for agents. The core idea is memory-before-action: before an agent runs a command, edits files, or touches tools, Audrey recalls relevant failures, rules, procedures, contradictions, and validation history, then returns allow/warn/block with evidence. The research paper introduces GuardBench, a Stage-A benchmark spec for this pre-action control problem. Current local artifacts show Audrey Guard passing 10/10 local scenarios with zero seeded raw-secret leaks in published artifacts. I am deliberately not claiming external-system scores yet: Mem0 and Zep adapters are implemented, but live credentialed runs are still pending strict evidence verification. The repo includes schemas, raw outputs, conformance cards, a submission bundle, a leaderboard builder, an external evidence verifier, and a claim register that blocks public overclaims."
|
|
37
|
+
},
|
|
38
|
+
{
|
|
39
|
+
"id": "reddit-title",
|
|
40
|
+
"platform": "reddit",
|
|
41
|
+
"kind": "title",
|
|
42
|
+
"claimIds": ["C01", "C03"],
|
|
43
|
+
"maxChars": 300,
|
|
44
|
+
"text": "Audrey: a local-first memory firewall for agents, with a GuardBench paper and auditable benchmark artifacts"
|
|
45
|
+
},
|
|
46
|
+
{
|
|
47
|
+
"id": "reddit-body",
|
|
48
|
+
"platform": "reddit",
|
|
49
|
+
"kind": "body",
|
|
50
|
+
"claimIds": ["C01", "C02", "C03", "C04"],
|
|
51
|
+
"maxChars": 4000,
|
|
52
|
+
"text": "I have been building Audrey as a local-first memory layer for agents, but the framing has shifted from simple recall to pre-action control. Instead of only asking whether memory can retrieve facts, Audrey asks whether memory changes the next tool action before it happens. It records tool failures, rules, procedures, contradictions, validations, and salience, then returns allow/warn/block decisions with evidence. The paper introduces GuardBench as a reproducibility contract for this memory-before-action behavior. The current Stage-A result is intentionally narrow: local Audrey Guard passes 10/10 local GuardBench scenarios with zero seeded raw-secret leaks in published artifacts. External Mem0/Zep scores are not claimed yet; those adapters exist, but live credentialed outputs are pending strict evidence verification. The repo now includes the benchmark manifest, raw outputs, schemas, conformance card, submission bundle, leaderboard builder, external evidence verifier, and claim register so the public claims can be audited."
|
|
53
|
+
},
|
|
54
|
+
{
|
|
55
|
+
"id": "x-post-1",
|
|
56
|
+
"platform": "x",
|
|
57
|
+
"kind": "post",
|
|
58
|
+
"claimIds": ["C01", "C02"],
|
|
59
|
+
"maxChars": 280,
|
|
60
|
+
"requiresArtifactUrl": true,
|
|
61
|
+
"reservedUrlChars": 24,
|
|
62
|
+
"text": "Audrey is a local-first memory firewall for AI agents: recall failures, rules, contradictions, and validations before tools run. Stage-A GuardBench: local Audrey Guard passes 10/10. External Mem0/Zep scores remain pending."
|
|
63
|
+
},
|
|
64
|
+
{
|
|
65
|
+
"id": "x-post-2",
|
|
66
|
+
"platform": "x",
|
|
67
|
+
"kind": "post",
|
|
68
|
+
"claimIds": ["C03", "C04"],
|
|
69
|
+
"maxChars": 280,
|
|
70
|
+
"text": "The Audrey paper ships with auditable benchmark artifacts: schemas, raw outputs, conformance cards, submission bundle, leaderboard, external evidence verifier, and a claim register that blocks unsupported public claims."
|
|
71
|
+
},
|
|
72
|
+
{
|
|
73
|
+
"id": "linkedin-post",
|
|
74
|
+
"platform": "linkedin",
|
|
75
|
+
"kind": "post",
|
|
76
|
+
"claimIds": ["C01", "C02", "C03", "C04"],
|
|
77
|
+
"maxChars": 3000,
|
|
78
|
+
"text": "I am preparing Audrey as a local-first memory runtime for AI agents, centered on pre-action memory control. Most agent memory work is evaluated as retrieval: can the system find the right fact? Audrey focuses on a different operational question: can memory change the next tool action before the tool runs? Audrey records episodes, procedures, contradictions, tool traces, validation outcomes, and salience, then returns allow/warn/block decisions with evidence. The accompanying paper introduces GuardBench, a Stage-A benchmark specification for memory-before-action behavior. Current local artifacts show Audrey Guard passing 10/10 local GuardBench scenarios with zero seeded raw-secret leaks in published artifacts. I am intentionally not reporting external-system scores yet: Mem0 and Zep adapters are implemented, but live credentialed runs remain pending strict evidence verification. The release includes machine-readable schemas, raw outputs, conformance cards, submission bundles, leaderboard artifacts, an external evidence verifier, and a public claim register so the claims can be audited before publication."
|
|
79
|
+
}
|
|
80
|
+
]
|
|
81
|
+
}
|
|
@@ -0,0 +1,60 @@
|
|
|
1
|
+
{
|
|
2
|
+
"$schema": "https://json-schema.org/draft/2020-12/schema",
|
|
3
|
+
"$id": "https://audrey-memory.org/schemas/audrey-publication-pack.schema.json",
|
|
4
|
+
"title": "Audrey Publication Pack",
|
|
5
|
+
"type": "object",
|
|
6
|
+
"additionalProperties": false,
|
|
7
|
+
"required": ["schemaVersion", "suite", "claimRegister", "entries"],
|
|
8
|
+
"properties": {
|
|
9
|
+
"schemaVersion": { "const": "1.0.0" },
|
|
10
|
+
"suite": { "const": "Audrey publication pack" },
|
|
11
|
+
"claimRegister": { "type": "string", "minLength": 1 },
|
|
12
|
+
"entries": {
|
|
13
|
+
"type": "array",
|
|
14
|
+
"minItems": 1,
|
|
15
|
+
"items": { "$ref": "#/$defs/entry" }
|
|
16
|
+
}
|
|
17
|
+
},
|
|
18
|
+
"$defs": {
|
|
19
|
+
"entry": {
|
|
20
|
+
"type": "object",
|
|
21
|
+
"additionalProperties": false,
|
|
22
|
+
"required": ["id", "platform", "kind", "claimIds", "maxChars", "text"],
|
|
23
|
+
"properties": {
|
|
24
|
+
"id": {
|
|
25
|
+
"type": "string",
|
|
26
|
+
"pattern": "^[a-z0-9][a-z0-9-]*$"
|
|
27
|
+
},
|
|
28
|
+
"platform": {
|
|
29
|
+
"enum": ["arxiv", "hacker-news", "linkedin", "reddit", "x"]
|
|
30
|
+
},
|
|
31
|
+
"kind": {
|
|
32
|
+
"enum": ["abstract", "body", "post", "title"]
|
|
33
|
+
},
|
|
34
|
+
"claimIds": {
|
|
35
|
+
"type": "array",
|
|
36
|
+
"minItems": 1,
|
|
37
|
+
"items": {
|
|
38
|
+
"type": "string",
|
|
39
|
+
"pattern": "^C[0-9]{2}$"
|
|
40
|
+
}
|
|
41
|
+
},
|
|
42
|
+
"maxChars": {
|
|
43
|
+
"type": "integer",
|
|
44
|
+
"minimum": 1
|
|
45
|
+
},
|
|
46
|
+
"requiresArtifactUrl": {
|
|
47
|
+
"type": "boolean"
|
|
48
|
+
},
|
|
49
|
+
"reservedUrlChars": {
|
|
50
|
+
"type": "integer",
|
|
51
|
+
"minimum": 0
|
|
52
|
+
},
|
|
53
|
+
"text": {
|
|
54
|
+
"type": "string",
|
|
55
|
+
"minLength": 1
|
|
56
|
+
}
|
|
57
|
+
}
|
|
58
|
+
}
|
|
59
|
+
}
|
|
60
|
+
}
|