audrey 0.23.1 → 1.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +81 -19
- package/LICENSE +21 -21
- package/README.md +209 -5
- package/SECURITY.md +2 -1
- package/benchmarks/adapter-kit.mjs +20 -0
- package/benchmarks/adapter-self-test.mjs +166 -0
- package/benchmarks/adapters/example-allow.mjs +28 -0
- package/benchmarks/adapters/mem0-platform.mjs +267 -0
- package/benchmarks/adapters/registry.json +51 -0
- package/benchmarks/adapters/zep-cloud.mjs +280 -0
- package/benchmarks/baselines.js +169 -0
- package/benchmarks/build-leaderboard.mjs +170 -0
- package/benchmarks/cases.js +537 -0
- package/benchmarks/create-conformance-card.mjs +139 -0
- package/benchmarks/create-submission-bundle.mjs +176 -0
- package/benchmarks/dry-run-external-adapters.mjs +165 -0
- package/benchmarks/guardbench.js +1035 -0
- package/benchmarks/output/adapter-self-test/guardbench-adapter-self-test.json +50 -0
- package/benchmarks/output/external/guardbench-external-dry-run.json +69 -0
- package/benchmarks/output/external/guardbench-external-evidence.json +56 -0
- package/benchmarks/output/guardbench-conformance-card.json +63 -0
- package/benchmarks/output/guardbench-manifest.json +414 -0
- package/benchmarks/output/guardbench-raw.json +1171 -0
- package/benchmarks/output/guardbench-summary.json +1981 -0
- package/benchmarks/output/leaderboard/guardbench-leaderboard.json +93 -0
- package/benchmarks/output/leaderboard/guardbench-leaderboard.md +7 -0
- package/benchmarks/output/submission-bundle/guardbench-conformance-card.json +63 -0
- package/benchmarks/output/submission-bundle/guardbench-manifest.json +414 -0
- package/benchmarks/output/submission-bundle/guardbench-raw.json +1171 -0
- package/benchmarks/output/submission-bundle/guardbench-summary.json +1981 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-adapter-registry.schema.json +69 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-adapter-self-test.schema.json +156 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-conformance-card.schema.json +184 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-external-dry-run.schema.json +74 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-external-evidence.schema.json +108 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-external-run.schema.json +160 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-leaderboard.schema.json +179 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-manifest.schema.json +213 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-publication-verification.schema.json +47 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-raw.schema.json +164 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-submission-manifest.schema.json +151 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-summary.schema.json +228 -0
- package/benchmarks/output/submission-bundle/submission-manifest.json +131 -0
- package/benchmarks/output/submission-bundle/validation-report.json +31 -0
- package/benchmarks/output/summary.json +2354 -0
- package/benchmarks/perf-snapshot.js +304 -0
- package/benchmarks/perf.bench.js +161 -0
- package/benchmarks/public-paths.mjs +78 -0
- package/benchmarks/reference-results.js +70 -0
- package/benchmarks/report.js +259 -0
- package/benchmarks/run-external-guardbench.mjs +281 -0
- package/benchmarks/run.js +682 -0
- package/benchmarks/schemas/guardbench-adapter-registry.schema.json +69 -0
- package/benchmarks/schemas/guardbench-adapter-self-test.schema.json +156 -0
- package/benchmarks/schemas/guardbench-conformance-card.schema.json +184 -0
- package/benchmarks/schemas/guardbench-external-dry-run.schema.json +74 -0
- package/benchmarks/schemas/guardbench-external-evidence.schema.json +108 -0
- package/benchmarks/schemas/guardbench-external-run.schema.json +160 -0
- package/benchmarks/schemas/guardbench-leaderboard.schema.json +179 -0
- package/benchmarks/schemas/guardbench-manifest.schema.json +213 -0
- package/benchmarks/schemas/guardbench-publication-verification.schema.json +47 -0
- package/benchmarks/schemas/guardbench-raw.schema.json +164 -0
- package/benchmarks/schemas/guardbench-submission-manifest.schema.json +151 -0
- package/benchmarks/schemas/guardbench-summary.schema.json +228 -0
- package/benchmarks/snapshots/perf-0.22.2.json +123 -0
- package/benchmarks/snapshots/perf-0.23.0.json +123 -0
- package/benchmarks/validate-adapter-module.mjs +104 -0
- package/benchmarks/validate-adapter-registry.mjs +134 -0
- package/benchmarks/validate-adapter-self-test.mjs +96 -0
- package/benchmarks/validate-guardbench-artifacts.mjs +343 -0
- package/benchmarks/verify-external-evidence.mjs +296 -0
- package/benchmarks/verify-publication-artifacts.mjs +286 -0
- package/benchmarks/verify-submission-bundle.mjs +167 -0
- package/dist/mcp-server/config.d.ts +1 -1
- package/dist/mcp-server/config.d.ts.map +1 -1
- package/dist/mcp-server/config.js +1 -1
- package/dist/mcp-server/config.js.map +1 -1
- package/dist/mcp-server/index.d.ts +65 -3
- package/dist/mcp-server/index.d.ts.map +1 -1
- package/dist/mcp-server/index.js +675 -157
- package/dist/mcp-server/index.js.map +1 -1
- package/dist/src/action-key.d.ts +9 -0
- package/dist/src/action-key.d.ts.map +1 -0
- package/dist/src/action-key.js +49 -0
- package/dist/src/action-key.js.map +1 -0
- package/dist/src/adaptive.js +5 -5
- package/dist/src/affect.js +8 -8
- package/dist/src/audrey.d.ts +3 -0
- package/dist/src/audrey.d.ts.map +1 -1
- package/dist/src/audrey.js +55 -3
- package/dist/src/audrey.js.map +1 -1
- package/dist/src/capsule.js +4 -4
- package/dist/src/causal.js +3 -3
- package/dist/src/consolidate.js +48 -48
- package/dist/src/controller.d.ts +61 -5
- package/dist/src/controller.d.ts.map +1 -1
- package/dist/src/controller.js +230 -49
- package/dist/src/controller.js.map +1 -1
- package/dist/src/db.js +172 -172
- package/dist/src/decay.js +8 -8
- package/dist/src/embedding.d.ts +2 -1
- package/dist/src/embedding.d.ts.map +1 -1
- package/dist/src/embedding.js +39 -29
- package/dist/src/embedding.js.map +1 -1
- package/dist/src/encode.js +6 -6
- package/dist/src/feedback.d.ts +6 -0
- package/dist/src/feedback.d.ts.map +1 -1
- package/dist/src/feedback.js +6 -0
- package/dist/src/feedback.js.map +1 -1
- package/dist/src/forget.js +12 -12
- package/dist/src/hybrid-recall.js +9 -9
- package/dist/src/impact.js +6 -6
- package/dist/src/import.d.ts +3 -3
- package/dist/src/import.js +41 -41
- package/dist/src/index.d.ts +3 -3
- package/dist/src/index.d.ts.map +1 -1
- package/dist/src/index.js +2 -2
- package/dist/src/index.js.map +1 -1
- package/dist/src/interference.js +14 -14
- package/dist/src/introspect.js +18 -18
- package/dist/src/preflight.d.ts.map +1 -1
- package/dist/src/preflight.js +41 -0
- package/dist/src/preflight.js.map +1 -1
- package/dist/src/promote.js +7 -7
- package/dist/src/prompts.js +118 -118
- package/dist/src/recall.js +30 -30
- package/dist/src/reflexes.d.ts +1 -0
- package/dist/src/reflexes.d.ts.map +1 -1
- package/dist/src/reflexes.js +3 -0
- package/dist/src/reflexes.js.map +1 -1
- package/dist/src/rollback.js +4 -4
- package/dist/src/routes.d.ts.map +1 -1
- package/dist/src/routes.js +67 -1
- package/dist/src/routes.js.map +1 -1
- package/dist/src/validate.js +25 -25
- package/docs/AUDREY_PAPER_OUTLINE.md +175 -0
- package/docs/MEMORY_BENCHMARKING.md +59 -0
- package/docs/PRODUCTION_BACKLOG.md +304 -0
- package/docs/paper/00-master.md +48 -0
- package/docs/paper/01-introduction.md +27 -0
- package/docs/paper/02-related-work.md +47 -0
- package/docs/paper/03-problem-definition.md +108 -0
- package/docs/paper/04-design.md +164 -0
- package/docs/paper/05-guardbench-spec.md +412 -0
- package/docs/paper/06-implementation.md +113 -0
- package/docs/paper/07-evaluation.md +168 -0
- package/docs/paper/08-discussion-limitations.md +61 -0
- package/docs/paper/09-conclusion.md +11 -0
- package/docs/paper/SUBMISSION_README.md +162 -0
- package/docs/paper/appendix-a-demo-transcript.md +114 -0
- package/docs/paper/arxiv-compile-report.schema.json +116 -0
- package/docs/paper/arxiv-source.schema.json +61 -0
- package/docs/paper/audrey-paper-v1.md +1106 -0
- package/docs/paper/browser-launch-plan.json +209 -0
- package/docs/paper/browser-launch-plan.schema.json +100 -0
- package/docs/paper/browser-launch-results.json +86 -0
- package/docs/paper/browser-launch-results.schema.json +66 -0
- package/docs/paper/claim-register.json +138 -0
- package/docs/paper/claim-register.schema.json +81 -0
- package/docs/paper/evidence-ledger.md +103 -0
- package/docs/paper/output/arxiv/README-arxiv.txt +8 -0
- package/docs/paper/output/arxiv/arxiv-manifest.json +41 -0
- package/docs/paper/output/arxiv/main.tex +949 -0
- package/docs/paper/output/arxiv/references.bib +222 -0
- package/docs/paper/output/arxiv-compile-report.json +24 -0
- package/docs/paper/output/submission-bundle/LICENSE +21 -0
- package/docs/paper/output/submission-bundle/README.md +533 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/adapter-self-test/guardbench-adapter-self-test.json +50 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/external/guardbench-external-dry-run.json +69 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/external/guardbench-external-evidence.json +56 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/guardbench-conformance-card.json +63 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/guardbench-manifest.json +414 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/guardbench-raw.json +1171 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/guardbench-summary.json +1981 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/leaderboard/guardbench-leaderboard.json +93 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/leaderboard/guardbench-leaderboard.md +7 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/submission-bundle/submission-manifest.json +131 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/submission-bundle/validation-report.json +31 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/summary.json +2354 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-adapter-registry.schema.json +69 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-adapter-self-test.schema.json +156 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-conformance-card.schema.json +184 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-external-dry-run.schema.json +74 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-external-evidence.schema.json +108 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-external-run.schema.json +160 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-leaderboard.schema.json +179 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-manifest.schema.json +213 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-publication-verification.schema.json +47 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-raw.schema.json +164 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-submission-manifest.schema.json +151 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-summary.schema.json +228 -0
- package/docs/paper/output/submission-bundle/docs/AUDREY_PAPER_OUTLINE.md +175 -0
- package/docs/paper/output/submission-bundle/docs/paper/00-master.md +48 -0
- package/docs/paper/output/submission-bundle/docs/paper/01-introduction.md +27 -0
- package/docs/paper/output/submission-bundle/docs/paper/02-related-work.md +47 -0
- package/docs/paper/output/submission-bundle/docs/paper/03-problem-definition.md +108 -0
- package/docs/paper/output/submission-bundle/docs/paper/04-design.md +164 -0
- package/docs/paper/output/submission-bundle/docs/paper/05-guardbench-spec.md +412 -0
- package/docs/paper/output/submission-bundle/docs/paper/06-implementation.md +113 -0
- package/docs/paper/output/submission-bundle/docs/paper/07-evaluation.md +168 -0
- package/docs/paper/output/submission-bundle/docs/paper/08-discussion-limitations.md +61 -0
- package/docs/paper/output/submission-bundle/docs/paper/09-conclusion.md +11 -0
- package/docs/paper/output/submission-bundle/docs/paper/SUBMISSION_README.md +162 -0
- package/docs/paper/output/submission-bundle/docs/paper/appendix-a-demo-transcript.md +114 -0
- package/docs/paper/output/submission-bundle/docs/paper/arxiv-compile-report.schema.json +116 -0
- package/docs/paper/output/submission-bundle/docs/paper/arxiv-source.schema.json +61 -0
- package/docs/paper/output/submission-bundle/docs/paper/audrey-paper-v1.md +1106 -0
- package/docs/paper/output/submission-bundle/docs/paper/browser-launch-plan.json +209 -0
- package/docs/paper/output/submission-bundle/docs/paper/browser-launch-plan.schema.json +100 -0
- package/docs/paper/output/submission-bundle/docs/paper/browser-launch-results.json +86 -0
- package/docs/paper/output/submission-bundle/docs/paper/browser-launch-results.schema.json +66 -0
- package/docs/paper/output/submission-bundle/docs/paper/claim-register.json +138 -0
- package/docs/paper/output/submission-bundle/docs/paper/claim-register.schema.json +81 -0
- package/docs/paper/output/submission-bundle/docs/paper/evidence-ledger.md +103 -0
- package/docs/paper/output/submission-bundle/docs/paper/output/arxiv/README-arxiv.txt +8 -0
- package/docs/paper/output/submission-bundle/docs/paper/output/arxiv/arxiv-manifest.json +41 -0
- package/docs/paper/output/submission-bundle/docs/paper/output/arxiv/main.tex +949 -0
- package/docs/paper/output/submission-bundle/docs/paper/output/arxiv/references.bib +222 -0
- package/docs/paper/output/submission-bundle/docs/paper/output/arxiv-compile-report.json +24 -0
- package/docs/paper/output/submission-bundle/docs/paper/paper-submission-bundle.schema.json +70 -0
- package/docs/paper/output/submission-bundle/docs/paper/publication-pack.json +81 -0
- package/docs/paper/output/submission-bundle/docs/paper/publication-pack.schema.json +60 -0
- package/docs/paper/output/submission-bundle/docs/paper/references.bib +222 -0
- package/docs/paper/output/submission-bundle/package.json +212 -0
- package/docs/paper/output/submission-bundle/paper-submission-manifest.json +379 -0
- package/docs/paper/paper-submission-bundle.schema.json +70 -0
- package/docs/paper/publication-pack.json +81 -0
- package/docs/paper/publication-pack.schema.json +60 -0
- package/docs/paper/references.bib +222 -0
- package/package.json +87 -4
- package/scripts/audit-release-completion.mjs +362 -0
- package/scripts/create-arxiv-source.mjs +362 -0
- package/scripts/create-paper-submission-bundle.mjs +210 -0
- package/scripts/finalize-release.mjs +526 -0
- package/scripts/prepare-release-cut.mjs +269 -0
- package/scripts/publish-release-bundle.mjs +209 -0
- package/scripts/publish-release-github-api.mjs +429 -0
- package/scripts/run-vitest.mjs +34 -0
- package/scripts/smoke-cli.js +72 -0
- package/scripts/sync-paper-artifacts.mjs +109 -0
- package/scripts/verify-arxiv-compile.mjs +440 -0
- package/scripts/verify-arxiv-source.mjs +194 -0
- package/scripts/verify-browser-launch-plan.mjs +237 -0
- package/scripts/verify-browser-launch-results.mjs +285 -0
- package/scripts/verify-paper-artifacts.mjs +338 -0
- package/scripts/verify-paper-claims.mjs +226 -0
- package/scripts/verify-paper-submission-bundle.mjs +207 -0
- package/scripts/verify-publication-pack.mjs +196 -0
- package/scripts/verify-python-package.py +201 -0
- package/scripts/verify-release-readiness.mjs +741 -0
|
@@ -0,0 +1,93 @@
|
|
|
1
|
+
{
|
|
2
|
+
"schemaVersion": "1.0.0",
|
|
3
|
+
"suite": "GuardBench leaderboard",
|
|
4
|
+
"generatedAt": "2026-05-13T23:33:51.927Z",
|
|
5
|
+
"ranking": [
|
|
6
|
+
"verified bundle",
|
|
7
|
+
"adapter conformance",
|
|
8
|
+
"fullContractPassRate",
|
|
9
|
+
"decisionAccuracy",
|
|
10
|
+
"evidenceRecall",
|
|
11
|
+
"redactionLeaks ascending",
|
|
12
|
+
"latency.p95Ms ascending",
|
|
13
|
+
"subject.name"
|
|
14
|
+
],
|
|
15
|
+
"rows": [
|
|
16
|
+
{
|
|
17
|
+
"rank": 1,
|
|
18
|
+
"subject": {
|
|
19
|
+
"name": "Audrey Guard",
|
|
20
|
+
"requestedAdapter": null,
|
|
21
|
+
"external": false
|
|
22
|
+
},
|
|
23
|
+
"score": {
|
|
24
|
+
"scenarios": 10,
|
|
25
|
+
"fullContractPassed": 10,
|
|
26
|
+
"fullContractPassRate": 1,
|
|
27
|
+
"decisionAccuracy": 1,
|
|
28
|
+
"evidenceRecall": 1,
|
|
29
|
+
"redactionLeaks": 0,
|
|
30
|
+
"latency": {
|
|
31
|
+
"p50Ms": 3.097,
|
|
32
|
+
"p95Ms": 29.711,
|
|
33
|
+
"maxMs": 29.711
|
|
34
|
+
}
|
|
35
|
+
},
|
|
36
|
+
"conformance": {
|
|
37
|
+
"ok": true,
|
|
38
|
+
"failures": [],
|
|
39
|
+
"artifactValidationOk": true,
|
|
40
|
+
"artifactValidationFailures": []
|
|
41
|
+
},
|
|
42
|
+
"source": {
|
|
43
|
+
"dir": "benchmarks/output/submission-bundle",
|
|
44
|
+
"manifestGeneratedAt": "2026-05-13T23:33:51.597Z",
|
|
45
|
+
"fileCount": 17
|
|
46
|
+
},
|
|
47
|
+
"verification": {
|
|
48
|
+
"ok": true,
|
|
49
|
+
"dir": "benchmarks/output/submission-bundle",
|
|
50
|
+
"subject": {
|
|
51
|
+
"name": "Audrey Guard",
|
|
52
|
+
"requestedAdapter": null,
|
|
53
|
+
"external": false
|
|
54
|
+
},
|
|
55
|
+
"files": [
|
|
56
|
+
"guardbench-conformance-card.json",
|
|
57
|
+
"guardbench-manifest.json",
|
|
58
|
+
"guardbench-raw.json",
|
|
59
|
+
"guardbench-summary.json",
|
|
60
|
+
"schemas/guardbench-adapter-registry.schema.json",
|
|
61
|
+
"schemas/guardbench-adapter-self-test.schema.json",
|
|
62
|
+
"schemas/guardbench-conformance-card.schema.json",
|
|
63
|
+
"schemas/guardbench-external-dry-run.schema.json",
|
|
64
|
+
"schemas/guardbench-external-evidence.schema.json",
|
|
65
|
+
"schemas/guardbench-external-run.schema.json",
|
|
66
|
+
"schemas/guardbench-leaderboard.schema.json",
|
|
67
|
+
"schemas/guardbench-manifest.schema.json",
|
|
68
|
+
"schemas/guardbench-publication-verification.schema.json",
|
|
69
|
+
"schemas/guardbench-raw.schema.json",
|
|
70
|
+
"schemas/guardbench-submission-manifest.schema.json",
|
|
71
|
+
"schemas/guardbench-summary.schema.json",
|
|
72
|
+
"validation-report.json"
|
|
73
|
+
],
|
|
74
|
+
"artifactValidation": {
|
|
75
|
+
"ok": true,
|
|
76
|
+
"dir": "benchmarks/output/submission-bundle",
|
|
77
|
+
"schemasDir": "benchmarks/output/submission-bundle/schemas",
|
|
78
|
+
"files": [
|
|
79
|
+
"guardbench-manifest.json",
|
|
80
|
+
"guardbench-summary.json",
|
|
81
|
+
"guardbench-raw.json"
|
|
82
|
+
],
|
|
83
|
+
"optionalFiles": [
|
|
84
|
+
"guardbench-conformance-card.json"
|
|
85
|
+
],
|
|
86
|
+
"failures": []
|
|
87
|
+
},
|
|
88
|
+
"failures": []
|
|
89
|
+
}
|
|
90
|
+
}
|
|
91
|
+
],
|
|
92
|
+
"failures": []
|
|
93
|
+
}
|
package/docs/paper/output/submission-bundle/benchmarks/output/leaderboard/guardbench-leaderboard.md
ADDED
|
@@ -0,0 +1,7 @@
|
|
|
1
|
+
# GuardBench Leaderboard
|
|
2
|
+
|
|
3
|
+
Generated: 2026-05-13T23:33:51.927Z
|
|
4
|
+
|
|
5
|
+
| Rank | Subject | Verified | Conformant | Full Contract | Decision Accuracy | Evidence Recall | Redaction Leaks | p95 Latency | Bundle |
|
|
6
|
+
|---:|---|---:|---:|---:|---:|---:|---:|---:|---|
|
|
7
|
+
| 1 | Audrey Guard | yes | yes | 100.0% | 100.0% | 100.0% | 0 | 29.711ms | benchmarks/output/submission-bundle |
|
|
@@ -0,0 +1,131 @@
|
|
|
1
|
+
{
|
|
2
|
+
"schemaVersion": "1.0.0",
|
|
3
|
+
"suite": "GuardBench submission bundle",
|
|
4
|
+
"generatedAt": "2026-05-13T23:33:51.597Z",
|
|
5
|
+
"sourceDir": "benchmarks/output",
|
|
6
|
+
"subject": {
|
|
7
|
+
"name": "Audrey Guard",
|
|
8
|
+
"requestedAdapter": null,
|
|
9
|
+
"external": false
|
|
10
|
+
},
|
|
11
|
+
"score": {
|
|
12
|
+
"scenarios": 10,
|
|
13
|
+
"fullContractPassed": 10,
|
|
14
|
+
"fullContractPassRate": 1,
|
|
15
|
+
"decisionAccuracy": 1,
|
|
16
|
+
"evidenceRecall": 1,
|
|
17
|
+
"redactionLeaks": 0,
|
|
18
|
+
"latency": {
|
|
19
|
+
"p50Ms": 3.097,
|
|
20
|
+
"p95Ms": 29.711,
|
|
21
|
+
"maxMs": 29.711
|
|
22
|
+
}
|
|
23
|
+
},
|
|
24
|
+
"conformance": {
|
|
25
|
+
"ok": true,
|
|
26
|
+
"failures": [],
|
|
27
|
+
"artifactValidationOk": true,
|
|
28
|
+
"artifactValidationFailures": []
|
|
29
|
+
},
|
|
30
|
+
"validation": {
|
|
31
|
+
"ok": true,
|
|
32
|
+
"dir": "benchmarks/output/submission-bundle",
|
|
33
|
+
"schemasDir": "benchmarks/output/submission-bundle/schemas",
|
|
34
|
+
"files": [
|
|
35
|
+
"guardbench-manifest.json",
|
|
36
|
+
"guardbench-summary.json",
|
|
37
|
+
"guardbench-raw.json"
|
|
38
|
+
],
|
|
39
|
+
"optionalFiles": [
|
|
40
|
+
"guardbench-conformance-card.json"
|
|
41
|
+
],
|
|
42
|
+
"failures": []
|
|
43
|
+
},
|
|
44
|
+
"files": [
|
|
45
|
+
{
|
|
46
|
+
"path": "guardbench-conformance-card.json",
|
|
47
|
+
"bytes": 1735,
|
|
48
|
+
"sha256": "0709bb4d93a797764e4ed5655c575390a57554a42625398d378c8ec0f23bd2b4"
|
|
49
|
+
},
|
|
50
|
+
{
|
|
51
|
+
"path": "guardbench-manifest.json",
|
|
52
|
+
"bytes": 12056,
|
|
53
|
+
"sha256": "57636ce19fdaa6e50fc3fc961d9e499a9f43632f588c713a9fefe8e8a6fa724c"
|
|
54
|
+
},
|
|
55
|
+
{
|
|
56
|
+
"path": "guardbench-raw.json",
|
|
57
|
+
"bytes": 39429,
|
|
58
|
+
"sha256": "c5b9c68cf946478fbfba617f17717e05ea3e01301089de19153d59e77e674bc6"
|
|
59
|
+
},
|
|
60
|
+
{
|
|
61
|
+
"path": "guardbench-summary.json",
|
|
62
|
+
"bytes": 64381,
|
|
63
|
+
"sha256": "2a6d5ee83cce2502135fb0442ef8cd3f2679fdc38c84207612c22a800a7a113a"
|
|
64
|
+
},
|
|
65
|
+
{
|
|
66
|
+
"path": "schemas/guardbench-adapter-registry.schema.json",
|
|
67
|
+
"bytes": 2016,
|
|
68
|
+
"sha256": "0fb401e0b00270f16287a47cdb868ec6ac23e85f134958141f37519bf0c67164"
|
|
69
|
+
},
|
|
70
|
+
{
|
|
71
|
+
"path": "schemas/guardbench-adapter-self-test.schema.json",
|
|
72
|
+
"bytes": 4572,
|
|
73
|
+
"sha256": "369402022870257c0bca52c05f21e53b40e310547bf49871ce08b2976c755127"
|
|
74
|
+
},
|
|
75
|
+
{
|
|
76
|
+
"path": "schemas/guardbench-conformance-card.schema.json",
|
|
77
|
+
"bytes": 5251,
|
|
78
|
+
"sha256": "337e197617e889388ff9f71f361b6c75450b43c1c131af622d4a59bc4faca89e"
|
|
79
|
+
},
|
|
80
|
+
{
|
|
81
|
+
"path": "schemas/guardbench-external-dry-run.schema.json",
|
|
82
|
+
"bytes": 2177,
|
|
83
|
+
"sha256": "df327a2b2c1cd7bf4453457c83ebc10708e6f56aa1d3526c7ac492a1b254880c"
|
|
84
|
+
},
|
|
85
|
+
{
|
|
86
|
+
"path": "schemas/guardbench-external-evidence.schema.json",
|
|
87
|
+
"bytes": 3075,
|
|
88
|
+
"sha256": "c6f7af89c53d039ff7e3b3b9f5829a7524e4a24c254dd17754dd51469c0295d1"
|
|
89
|
+
},
|
|
90
|
+
{
|
|
91
|
+
"path": "schemas/guardbench-external-run.schema.json",
|
|
92
|
+
"bytes": 4443,
|
|
93
|
+
"sha256": "36f79172e6b9264fa7f16a90684f2c75fb3f8432c5226be4181d93622b17b40b"
|
|
94
|
+
},
|
|
95
|
+
{
|
|
96
|
+
"path": "schemas/guardbench-leaderboard.schema.json",
|
|
97
|
+
"bytes": 5457,
|
|
98
|
+
"sha256": "ac3414af9f97d3c3b241ffea3fe9995295cb107dbc4fddef2f32f0d3de2d1abf"
|
|
99
|
+
},
|
|
100
|
+
{
|
|
101
|
+
"path": "schemas/guardbench-manifest.schema.json",
|
|
102
|
+
"bytes": 6345,
|
|
103
|
+
"sha256": "a2995e946908f094dfd5db264db87615167586d57f1a335aa9bf2262b709ef4d"
|
|
104
|
+
},
|
|
105
|
+
{
|
|
106
|
+
"path": "schemas/guardbench-publication-verification.schema.json",
|
|
107
|
+
"bytes": 1713,
|
|
108
|
+
"sha256": "a83442c23dee3805b6c1bd3b8524b16948b5dc78d3d65074142c2a99c733f1b9"
|
|
109
|
+
},
|
|
110
|
+
{
|
|
111
|
+
"path": "schemas/guardbench-raw.schema.json",
|
|
112
|
+
"bytes": 5057,
|
|
113
|
+
"sha256": "f419685932a5549d5efef611b1dbbe585300365de3c977fcfedf174672f6bc3a"
|
|
114
|
+
},
|
|
115
|
+
{
|
|
116
|
+
"path": "schemas/guardbench-submission-manifest.schema.json",
|
|
117
|
+
"bytes": 4469,
|
|
118
|
+
"sha256": "4d624bec3cbb7f3043064a874bd869ac8556f42231f0871a179f58cd8fbcfb23"
|
|
119
|
+
},
|
|
120
|
+
{
|
|
121
|
+
"path": "schemas/guardbench-summary.schema.json",
|
|
122
|
+
"bytes": 7331,
|
|
123
|
+
"sha256": "ac70b448c730fb8b01899615477a167a64734d16304c39d661b2b3130e8aa1da"
|
|
124
|
+
},
|
|
125
|
+
{
|
|
126
|
+
"path": "validation-report.json",
|
|
127
|
+
"bytes": 739,
|
|
128
|
+
"sha256": "9734a26b31a7511fbba361f22245dd6325b65fe47d1072fa59df7eeb15d724a1"
|
|
129
|
+
}
|
|
130
|
+
]
|
|
131
|
+
}
|
|
@@ -0,0 +1,31 @@
|
|
|
1
|
+
{
|
|
2
|
+
"generatedAt": "2026-05-13T23:33:51.596Z",
|
|
3
|
+
"sourceValidation": {
|
|
4
|
+
"ok": true,
|
|
5
|
+
"dir": "benchmarks/output",
|
|
6
|
+
"schemasDir": "benchmarks/schemas",
|
|
7
|
+
"files": [
|
|
8
|
+
"guardbench-manifest.json",
|
|
9
|
+
"guardbench-summary.json",
|
|
10
|
+
"guardbench-raw.json"
|
|
11
|
+
],
|
|
12
|
+
"optionalFiles": [
|
|
13
|
+
"guardbench-conformance-card.json"
|
|
14
|
+
],
|
|
15
|
+
"failures": []
|
|
16
|
+
},
|
|
17
|
+
"bundleValidation": {
|
|
18
|
+
"ok": true,
|
|
19
|
+
"dir": "benchmarks/output/submission-bundle",
|
|
20
|
+
"schemasDir": "benchmarks/output/submission-bundle/schemas",
|
|
21
|
+
"files": [
|
|
22
|
+
"guardbench-manifest.json",
|
|
23
|
+
"guardbench-summary.json",
|
|
24
|
+
"guardbench-raw.json"
|
|
25
|
+
],
|
|
26
|
+
"optionalFiles": [
|
|
27
|
+
"guardbench-conformance-card.json"
|
|
28
|
+
],
|
|
29
|
+
"failures": []
|
|
30
|
+
}
|
|
31
|
+
}
|