audrey 0.23.1 → 1.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +81 -19
- package/LICENSE +21 -21
- package/README.md +209 -5
- package/SECURITY.md +2 -1
- package/benchmarks/adapter-kit.mjs +20 -0
- package/benchmarks/adapter-self-test.mjs +166 -0
- package/benchmarks/adapters/example-allow.mjs +28 -0
- package/benchmarks/adapters/mem0-platform.mjs +267 -0
- package/benchmarks/adapters/registry.json +51 -0
- package/benchmarks/adapters/zep-cloud.mjs +280 -0
- package/benchmarks/baselines.js +169 -0
- package/benchmarks/build-leaderboard.mjs +170 -0
- package/benchmarks/cases.js +537 -0
- package/benchmarks/create-conformance-card.mjs +139 -0
- package/benchmarks/create-submission-bundle.mjs +176 -0
- package/benchmarks/dry-run-external-adapters.mjs +165 -0
- package/benchmarks/guardbench.js +1035 -0
- package/benchmarks/output/adapter-self-test/guardbench-adapter-self-test.json +50 -0
- package/benchmarks/output/external/guardbench-external-dry-run.json +69 -0
- package/benchmarks/output/external/guardbench-external-evidence.json +56 -0
- package/benchmarks/output/guardbench-conformance-card.json +63 -0
- package/benchmarks/output/guardbench-manifest.json +414 -0
- package/benchmarks/output/guardbench-raw.json +1171 -0
- package/benchmarks/output/guardbench-summary.json +1981 -0
- package/benchmarks/output/leaderboard/guardbench-leaderboard.json +93 -0
- package/benchmarks/output/leaderboard/guardbench-leaderboard.md +7 -0
- package/benchmarks/output/submission-bundle/guardbench-conformance-card.json +63 -0
- package/benchmarks/output/submission-bundle/guardbench-manifest.json +414 -0
- package/benchmarks/output/submission-bundle/guardbench-raw.json +1171 -0
- package/benchmarks/output/submission-bundle/guardbench-summary.json +1981 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-adapter-registry.schema.json +69 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-adapter-self-test.schema.json +156 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-conformance-card.schema.json +184 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-external-dry-run.schema.json +74 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-external-evidence.schema.json +108 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-external-run.schema.json +160 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-leaderboard.schema.json +179 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-manifest.schema.json +213 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-publication-verification.schema.json +47 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-raw.schema.json +164 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-submission-manifest.schema.json +151 -0
- package/benchmarks/output/submission-bundle/schemas/guardbench-summary.schema.json +228 -0
- package/benchmarks/output/submission-bundle/submission-manifest.json +131 -0
- package/benchmarks/output/submission-bundle/validation-report.json +31 -0
- package/benchmarks/output/summary.json +2354 -0
- package/benchmarks/perf-snapshot.js +304 -0
- package/benchmarks/perf.bench.js +161 -0
- package/benchmarks/public-paths.mjs +78 -0
- package/benchmarks/reference-results.js +70 -0
- package/benchmarks/report.js +259 -0
- package/benchmarks/run-external-guardbench.mjs +281 -0
- package/benchmarks/run.js +682 -0
- package/benchmarks/schemas/guardbench-adapter-registry.schema.json +69 -0
- package/benchmarks/schemas/guardbench-adapter-self-test.schema.json +156 -0
- package/benchmarks/schemas/guardbench-conformance-card.schema.json +184 -0
- package/benchmarks/schemas/guardbench-external-dry-run.schema.json +74 -0
- package/benchmarks/schemas/guardbench-external-evidence.schema.json +108 -0
- package/benchmarks/schemas/guardbench-external-run.schema.json +160 -0
- package/benchmarks/schemas/guardbench-leaderboard.schema.json +179 -0
- package/benchmarks/schemas/guardbench-manifest.schema.json +213 -0
- package/benchmarks/schemas/guardbench-publication-verification.schema.json +47 -0
- package/benchmarks/schemas/guardbench-raw.schema.json +164 -0
- package/benchmarks/schemas/guardbench-submission-manifest.schema.json +151 -0
- package/benchmarks/schemas/guardbench-summary.schema.json +228 -0
- package/benchmarks/snapshots/perf-0.22.2.json +123 -0
- package/benchmarks/snapshots/perf-0.23.0.json +123 -0
- package/benchmarks/validate-adapter-module.mjs +104 -0
- package/benchmarks/validate-adapter-registry.mjs +134 -0
- package/benchmarks/validate-adapter-self-test.mjs +96 -0
- package/benchmarks/validate-guardbench-artifacts.mjs +343 -0
- package/benchmarks/verify-external-evidence.mjs +296 -0
- package/benchmarks/verify-publication-artifacts.mjs +286 -0
- package/benchmarks/verify-submission-bundle.mjs +167 -0
- package/dist/mcp-server/config.d.ts +1 -1
- package/dist/mcp-server/config.d.ts.map +1 -1
- package/dist/mcp-server/config.js +1 -1
- package/dist/mcp-server/config.js.map +1 -1
- package/dist/mcp-server/index.d.ts +65 -3
- package/dist/mcp-server/index.d.ts.map +1 -1
- package/dist/mcp-server/index.js +675 -157
- package/dist/mcp-server/index.js.map +1 -1
- package/dist/src/action-key.d.ts +9 -0
- package/dist/src/action-key.d.ts.map +1 -0
- package/dist/src/action-key.js +49 -0
- package/dist/src/action-key.js.map +1 -0
- package/dist/src/adaptive.js +5 -5
- package/dist/src/affect.js +8 -8
- package/dist/src/audrey.d.ts +3 -0
- package/dist/src/audrey.d.ts.map +1 -1
- package/dist/src/audrey.js +55 -3
- package/dist/src/audrey.js.map +1 -1
- package/dist/src/capsule.js +4 -4
- package/dist/src/causal.js +3 -3
- package/dist/src/consolidate.js +48 -48
- package/dist/src/controller.d.ts +61 -5
- package/dist/src/controller.d.ts.map +1 -1
- package/dist/src/controller.js +230 -49
- package/dist/src/controller.js.map +1 -1
- package/dist/src/db.js +172 -172
- package/dist/src/decay.js +8 -8
- package/dist/src/embedding.d.ts +2 -1
- package/dist/src/embedding.d.ts.map +1 -1
- package/dist/src/embedding.js +39 -29
- package/dist/src/embedding.js.map +1 -1
- package/dist/src/encode.js +6 -6
- package/dist/src/feedback.d.ts +6 -0
- package/dist/src/feedback.d.ts.map +1 -1
- package/dist/src/feedback.js +6 -0
- package/dist/src/feedback.js.map +1 -1
- package/dist/src/forget.js +12 -12
- package/dist/src/hybrid-recall.js +9 -9
- package/dist/src/impact.js +6 -6
- package/dist/src/import.d.ts +3 -3
- package/dist/src/import.js +41 -41
- package/dist/src/index.d.ts +3 -3
- package/dist/src/index.d.ts.map +1 -1
- package/dist/src/index.js +2 -2
- package/dist/src/index.js.map +1 -1
- package/dist/src/interference.js +14 -14
- package/dist/src/introspect.js +18 -18
- package/dist/src/preflight.d.ts.map +1 -1
- package/dist/src/preflight.js +41 -0
- package/dist/src/preflight.js.map +1 -1
- package/dist/src/promote.js +7 -7
- package/dist/src/prompts.js +118 -118
- package/dist/src/recall.js +30 -30
- package/dist/src/reflexes.d.ts +1 -0
- package/dist/src/reflexes.d.ts.map +1 -1
- package/dist/src/reflexes.js +3 -0
- package/dist/src/reflexes.js.map +1 -1
- package/dist/src/rollback.js +4 -4
- package/dist/src/routes.d.ts.map +1 -1
- package/dist/src/routes.js +67 -1
- package/dist/src/routes.js.map +1 -1
- package/dist/src/validate.js +25 -25
- package/docs/AUDREY_PAPER_OUTLINE.md +175 -0
- package/docs/MEMORY_BENCHMARKING.md +59 -0
- package/docs/PRODUCTION_BACKLOG.md +304 -0
- package/docs/paper/00-master.md +48 -0
- package/docs/paper/01-introduction.md +27 -0
- package/docs/paper/02-related-work.md +47 -0
- package/docs/paper/03-problem-definition.md +108 -0
- package/docs/paper/04-design.md +164 -0
- package/docs/paper/05-guardbench-spec.md +412 -0
- package/docs/paper/06-implementation.md +113 -0
- package/docs/paper/07-evaluation.md +168 -0
- package/docs/paper/08-discussion-limitations.md +61 -0
- package/docs/paper/09-conclusion.md +11 -0
- package/docs/paper/SUBMISSION_README.md +162 -0
- package/docs/paper/appendix-a-demo-transcript.md +114 -0
- package/docs/paper/arxiv-compile-report.schema.json +116 -0
- package/docs/paper/arxiv-source.schema.json +61 -0
- package/docs/paper/audrey-paper-v1.md +1106 -0
- package/docs/paper/browser-launch-plan.json +209 -0
- package/docs/paper/browser-launch-plan.schema.json +100 -0
- package/docs/paper/browser-launch-results.json +86 -0
- package/docs/paper/browser-launch-results.schema.json +66 -0
- package/docs/paper/claim-register.json +138 -0
- package/docs/paper/claim-register.schema.json +81 -0
- package/docs/paper/evidence-ledger.md +103 -0
- package/docs/paper/output/arxiv/README-arxiv.txt +8 -0
- package/docs/paper/output/arxiv/arxiv-manifest.json +41 -0
- package/docs/paper/output/arxiv/main.tex +949 -0
- package/docs/paper/output/arxiv/references.bib +222 -0
- package/docs/paper/output/arxiv-compile-report.json +24 -0
- package/docs/paper/output/submission-bundle/LICENSE +21 -0
- package/docs/paper/output/submission-bundle/README.md +533 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/adapter-self-test/guardbench-adapter-self-test.json +50 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/external/guardbench-external-dry-run.json +69 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/external/guardbench-external-evidence.json +56 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/guardbench-conformance-card.json +63 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/guardbench-manifest.json +414 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/guardbench-raw.json +1171 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/guardbench-summary.json +1981 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/leaderboard/guardbench-leaderboard.json +93 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/leaderboard/guardbench-leaderboard.md +7 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/submission-bundle/submission-manifest.json +131 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/submission-bundle/validation-report.json +31 -0
- package/docs/paper/output/submission-bundle/benchmarks/output/summary.json +2354 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-adapter-registry.schema.json +69 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-adapter-self-test.schema.json +156 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-conformance-card.schema.json +184 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-external-dry-run.schema.json +74 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-external-evidence.schema.json +108 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-external-run.schema.json +160 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-leaderboard.schema.json +179 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-manifest.schema.json +213 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-publication-verification.schema.json +47 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-raw.schema.json +164 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-submission-manifest.schema.json +151 -0
- package/docs/paper/output/submission-bundle/benchmarks/schemas/guardbench-summary.schema.json +228 -0
- package/docs/paper/output/submission-bundle/docs/AUDREY_PAPER_OUTLINE.md +175 -0
- package/docs/paper/output/submission-bundle/docs/paper/00-master.md +48 -0
- package/docs/paper/output/submission-bundle/docs/paper/01-introduction.md +27 -0
- package/docs/paper/output/submission-bundle/docs/paper/02-related-work.md +47 -0
- package/docs/paper/output/submission-bundle/docs/paper/03-problem-definition.md +108 -0
- package/docs/paper/output/submission-bundle/docs/paper/04-design.md +164 -0
- package/docs/paper/output/submission-bundle/docs/paper/05-guardbench-spec.md +412 -0
- package/docs/paper/output/submission-bundle/docs/paper/06-implementation.md +113 -0
- package/docs/paper/output/submission-bundle/docs/paper/07-evaluation.md +168 -0
- package/docs/paper/output/submission-bundle/docs/paper/08-discussion-limitations.md +61 -0
- package/docs/paper/output/submission-bundle/docs/paper/09-conclusion.md +11 -0
- package/docs/paper/output/submission-bundle/docs/paper/SUBMISSION_README.md +162 -0
- package/docs/paper/output/submission-bundle/docs/paper/appendix-a-demo-transcript.md +114 -0
- package/docs/paper/output/submission-bundle/docs/paper/arxiv-compile-report.schema.json +116 -0
- package/docs/paper/output/submission-bundle/docs/paper/arxiv-source.schema.json +61 -0
- package/docs/paper/output/submission-bundle/docs/paper/audrey-paper-v1.md +1106 -0
- package/docs/paper/output/submission-bundle/docs/paper/browser-launch-plan.json +209 -0
- package/docs/paper/output/submission-bundle/docs/paper/browser-launch-plan.schema.json +100 -0
- package/docs/paper/output/submission-bundle/docs/paper/browser-launch-results.json +86 -0
- package/docs/paper/output/submission-bundle/docs/paper/browser-launch-results.schema.json +66 -0
- package/docs/paper/output/submission-bundle/docs/paper/claim-register.json +138 -0
- package/docs/paper/output/submission-bundle/docs/paper/claim-register.schema.json +81 -0
- package/docs/paper/output/submission-bundle/docs/paper/evidence-ledger.md +103 -0
- package/docs/paper/output/submission-bundle/docs/paper/output/arxiv/README-arxiv.txt +8 -0
- package/docs/paper/output/submission-bundle/docs/paper/output/arxiv/arxiv-manifest.json +41 -0
- package/docs/paper/output/submission-bundle/docs/paper/output/arxiv/main.tex +949 -0
- package/docs/paper/output/submission-bundle/docs/paper/output/arxiv/references.bib +222 -0
- package/docs/paper/output/submission-bundle/docs/paper/output/arxiv-compile-report.json +24 -0
- package/docs/paper/output/submission-bundle/docs/paper/paper-submission-bundle.schema.json +70 -0
- package/docs/paper/output/submission-bundle/docs/paper/publication-pack.json +81 -0
- package/docs/paper/output/submission-bundle/docs/paper/publication-pack.schema.json +60 -0
- package/docs/paper/output/submission-bundle/docs/paper/references.bib +222 -0
- package/docs/paper/output/submission-bundle/package.json +212 -0
- package/docs/paper/output/submission-bundle/paper-submission-manifest.json +379 -0
- package/docs/paper/paper-submission-bundle.schema.json +70 -0
- package/docs/paper/publication-pack.json +81 -0
- package/docs/paper/publication-pack.schema.json +60 -0
- package/docs/paper/references.bib +222 -0
- package/package.json +87 -4
- package/scripts/audit-release-completion.mjs +362 -0
- package/scripts/create-arxiv-source.mjs +362 -0
- package/scripts/create-paper-submission-bundle.mjs +210 -0
- package/scripts/finalize-release.mjs +526 -0
- package/scripts/prepare-release-cut.mjs +269 -0
- package/scripts/publish-release-bundle.mjs +209 -0
- package/scripts/publish-release-github-api.mjs +429 -0
- package/scripts/run-vitest.mjs +34 -0
- package/scripts/smoke-cli.js +72 -0
- package/scripts/sync-paper-artifacts.mjs +109 -0
- package/scripts/verify-arxiv-compile.mjs +440 -0
- package/scripts/verify-arxiv-source.mjs +194 -0
- package/scripts/verify-browser-launch-plan.mjs +237 -0
- package/scripts/verify-browser-launch-results.mjs +285 -0
- package/scripts/verify-paper-artifacts.mjs +338 -0
- package/scripts/verify-paper-claims.mjs +226 -0
- package/scripts/verify-paper-submission-bundle.mjs +207 -0
- package/scripts/verify-publication-pack.mjs +196 -0
- package/scripts/verify-python-package.py +201 -0
- package/scripts/verify-release-readiness.mjs +741 -0
|
@@ -0,0 +1,209 @@
|
|
|
1
|
+
{
|
|
2
|
+
"schemaVersion": "1.0.0",
|
|
3
|
+
"suite": "Audrey browser launch plan",
|
|
4
|
+
"checkedAt": "2026-05-13",
|
|
5
|
+
"publicationPack": "docs/paper/publication-pack.json",
|
|
6
|
+
"sources": [
|
|
7
|
+
{
|
|
8
|
+
"id": "arxiv-submission-guidelines",
|
|
9
|
+
"url": "https://info.arxiv.org/help/submit/index.html",
|
|
10
|
+
"checkedAt": "2026-05-13",
|
|
11
|
+
"notes": "Use the registered-author user page to start a new submission; verify uploaded files and metadata before final submit."
|
|
12
|
+
},
|
|
13
|
+
{
|
|
14
|
+
"id": "arxiv-category-taxonomy",
|
|
15
|
+
"url": "https://arxiv.org/category_taxonomy",
|
|
16
|
+
"checkedAt": "2026-05-13",
|
|
17
|
+
"notes": "cs.AI covers artificial intelligence; cs.CR covers cryptography and security. Use cs.AI primary and cs.CR secondary only if the final paper framing still matches both."
|
|
18
|
+
},
|
|
19
|
+
{
|
|
20
|
+
"id": "hacker-news-guidelines",
|
|
21
|
+
"url": "https://news.ycombinator.com/newsguidelines.html",
|
|
22
|
+
"checkedAt": "2026-05-13",
|
|
23
|
+
"notes": "Use a neutral title, submit the original source, avoid promotion-first behavior, do not solicit votes or comments, and keep comments human-written."
|
|
24
|
+
},
|
|
25
|
+
{
|
|
26
|
+
"id": "hacker-news-submit",
|
|
27
|
+
"url": "https://news.ycombinator.com/submit",
|
|
28
|
+
"checkedAt": "2026-05-13",
|
|
29
|
+
"notes": "Submission form for title, URL, and optional text/comment after login."
|
|
30
|
+
},
|
|
31
|
+
{
|
|
32
|
+
"id": "reddit-submit-api",
|
|
33
|
+
"url": "https://www.reddit.com/dev/api/",
|
|
34
|
+
"checkedAt": "2026-05-13",
|
|
35
|
+
"notes": "Reddit submit supports link or self posts, titles up to 300 characters, subreddit selection, and captcha fields."
|
|
36
|
+
},
|
|
37
|
+
{
|
|
38
|
+
"id": "reddit-spam-policy",
|
|
39
|
+
"url": "https://support.reddithelp.com/hc/en-us/articles/360043504051-What-constitutes-spam",
|
|
40
|
+
"checkedAt": "2026-05-13",
|
|
41
|
+
"notes": "Avoid repeated, unsolicited, mass, or automation-assisted posting. Check subreddit rules before any self-promotional post."
|
|
42
|
+
},
|
|
43
|
+
{
|
|
44
|
+
"id": "x-web-intent",
|
|
45
|
+
"url": "https://developer.x.com/en/docs/twitter-for-websites/tweet-button/guides/web-intent",
|
|
46
|
+
"checkedAt": "2026-05-13",
|
|
47
|
+
"notes": "Tweet intent supports prefilled text and enforces the 280-character limit across text, URL, hashtags, and via fields."
|
|
48
|
+
},
|
|
49
|
+
{
|
|
50
|
+
"id": "x-counting-characters",
|
|
51
|
+
"url": "https://docs.x.com/fundamentals/counting-characters",
|
|
52
|
+
"checkedAt": "2026-05-13",
|
|
53
|
+
"notes": "X wraps valid URLs with t.co and counts each detected URL as 23 characters, so the publication pack uses reservedUrlChars: 24 including a separator."
|
|
54
|
+
},
|
|
55
|
+
{
|
|
56
|
+
"id": "linkedin-share-help",
|
|
57
|
+
"url": "https://www.linkedin.com/help/linkedin/answer/a525301/sharing-articles-or-links",
|
|
58
|
+
"checkedAt": "2026-05-13",
|
|
59
|
+
"notes": "Use the LinkedIn home feed share box; posts can include text up to 3000 characters plus a URL preview."
|
|
60
|
+
}
|
|
61
|
+
],
|
|
62
|
+
"preflightCommands": [
|
|
63
|
+
"npm run release:gate:paper",
|
|
64
|
+
"npm run paper:publication-pack",
|
|
65
|
+
"npm run paper:bundle:verify",
|
|
66
|
+
"npm run paper:launch-plan"
|
|
67
|
+
],
|
|
68
|
+
"targets": [
|
|
69
|
+
{
|
|
70
|
+
"id": "arxiv-preprint",
|
|
71
|
+
"platform": "arxiv",
|
|
72
|
+
"label": "arXiv preprint submission",
|
|
73
|
+
"order": 1,
|
|
74
|
+
"url": "https://arxiv.org/user/",
|
|
75
|
+
"status": "blocked-until-login",
|
|
76
|
+
"authRequired": true,
|
|
77
|
+
"humanRequired": true,
|
|
78
|
+
"captchaPossible": false,
|
|
79
|
+
"manualRuleCheckRequired": true,
|
|
80
|
+
"contentEntryIds": ["arxiv-title", "arxiv-abstract"],
|
|
81
|
+
"artifactRefs": [
|
|
82
|
+
"docs/paper/output/arxiv/",
|
|
83
|
+
"docs/paper/audrey-paper-v1.md",
|
|
84
|
+
"docs/paper/references.bib",
|
|
85
|
+
"docs/paper/output/submission-bundle/"
|
|
86
|
+
],
|
|
87
|
+
"sourceRefs": ["arxiv-submission-guidelines", "arxiv-category-taxonomy"],
|
|
88
|
+
"operatorChecks": [
|
|
89
|
+
"Confirm the logged-in account is a registered arXiv author and has endorsement if arXiv requests it.",
|
|
90
|
+
"Convert the Markdown paper to the chosen arXiv upload format before final submit.",
|
|
91
|
+
"Use cs.AI as the primary category and cs.CR as secondary only after reviewing the final arXiv category screen.",
|
|
92
|
+
"Preview the compiled PDF and metadata before pressing the final submit button."
|
|
93
|
+
],
|
|
94
|
+
"postSubmitChecks": [
|
|
95
|
+
"Record the arXiv identifier or pending submission ID.",
|
|
96
|
+
"Update launch links in the publication copy before posting to social channels."
|
|
97
|
+
]
|
|
98
|
+
},
|
|
99
|
+
{
|
|
100
|
+
"id": "hacker-news-show",
|
|
101
|
+
"platform": "hacker-news",
|
|
102
|
+
"label": "Hacker News Show HN submission",
|
|
103
|
+
"order": 2,
|
|
104
|
+
"url": "https://news.ycombinator.com/submit",
|
|
105
|
+
"status": "blocked-until-artifact-url",
|
|
106
|
+
"authRequired": true,
|
|
107
|
+
"humanRequired": true,
|
|
108
|
+
"captchaPossible": false,
|
|
109
|
+
"manualRuleCheckRequired": true,
|
|
110
|
+
"contentEntryIds": ["hacker-news-title", "hacker-news-comment"],
|
|
111
|
+
"artifactRefs": [
|
|
112
|
+
"docs/paper/publication-pack.json",
|
|
113
|
+
"README.md",
|
|
114
|
+
"docs/paper/output/submission-bundle/"
|
|
115
|
+
],
|
|
116
|
+
"sourceRefs": ["hacker-news-guidelines", "hacker-news-submit"],
|
|
117
|
+
"operatorChecks": [
|
|
118
|
+
"Use the original public URL after the paper or repo release is live.",
|
|
119
|
+
"Keep the title neutral and at or below the Hacker News 80-character title target.",
|
|
120
|
+
"Do not solicit votes, comments, or submissions from anyone.",
|
|
121
|
+
"Write any follow-up comments manually; do not paste generated replies."
|
|
122
|
+
],
|
|
123
|
+
"postSubmitChecks": [
|
|
124
|
+
"Record the HN item URL.",
|
|
125
|
+
"Stay available to answer questions in the thread without marketing language."
|
|
126
|
+
]
|
|
127
|
+
},
|
|
128
|
+
{
|
|
129
|
+
"id": "reddit-discussion",
|
|
130
|
+
"platform": "reddit",
|
|
131
|
+
"label": "Reddit discussion post",
|
|
132
|
+
"order": 3,
|
|
133
|
+
"url": "https://www.reddit.com/submit",
|
|
134
|
+
"status": "blocked-until-login",
|
|
135
|
+
"authRequired": true,
|
|
136
|
+
"humanRequired": true,
|
|
137
|
+
"captchaPossible": true,
|
|
138
|
+
"manualRuleCheckRequired": true,
|
|
139
|
+
"contentEntryIds": ["reddit-title", "reddit-body"],
|
|
140
|
+
"artifactRefs": [
|
|
141
|
+
"docs/paper/publication-pack.json",
|
|
142
|
+
"docs/paper/output/submission-bundle/"
|
|
143
|
+
],
|
|
144
|
+
"sourceRefs": ["reddit-submit-api", "reddit-spam-policy"],
|
|
145
|
+
"operatorChecks": [
|
|
146
|
+
"Choose exactly one subreddit after reading that community's current rules and self-promotion policy in the browser.",
|
|
147
|
+
"Do not cross-post the same launch copy to multiple subreddits.",
|
|
148
|
+
"Disclose author affiliation plainly if the chosen subreddit allows the post.",
|
|
149
|
+
"Handle any captcha or subreddit flair requirement manually."
|
|
150
|
+
],
|
|
151
|
+
"postSubmitChecks": [
|
|
152
|
+
"Record the Reddit post URL and selected subreddit.",
|
|
153
|
+
"If removed, do not repost without moderator guidance or materially different context."
|
|
154
|
+
]
|
|
155
|
+
},
|
|
156
|
+
{
|
|
157
|
+
"id": "x-launch-thread",
|
|
158
|
+
"platform": "x",
|
|
159
|
+
"label": "X launch thread",
|
|
160
|
+
"order": 4,
|
|
161
|
+
"url": "https://twitter.com/intent/tweet",
|
|
162
|
+
"status": "blocked-until-artifact-url",
|
|
163
|
+
"authRequired": true,
|
|
164
|
+
"humanRequired": true,
|
|
165
|
+
"captchaPossible": true,
|
|
166
|
+
"manualRuleCheckRequired": false,
|
|
167
|
+
"contentEntryIds": ["x-post-1", "x-post-2"],
|
|
168
|
+
"artifactRefs": [
|
|
169
|
+
"docs/paper/publication-pack.json"
|
|
170
|
+
],
|
|
171
|
+
"sourceRefs": ["x-web-intent", "x-counting-characters"],
|
|
172
|
+
"operatorChecks": [
|
|
173
|
+
"Use the publication-pack URL reserve before appending the public paper or repo URL.",
|
|
174
|
+
"Post the second entry as a human-authored reply, not as an automated batch.",
|
|
175
|
+
"Do not claim external Mem0/Zep scores unless strict evidence has passed."
|
|
176
|
+
],
|
|
177
|
+
"postSubmitChecks": [
|
|
178
|
+
"Record the first post URL.",
|
|
179
|
+
"Check that the thread links to the final public artifact, not a local path."
|
|
180
|
+
]
|
|
181
|
+
},
|
|
182
|
+
{
|
|
183
|
+
"id": "linkedin-launch-post",
|
|
184
|
+
"platform": "linkedin",
|
|
185
|
+
"label": "LinkedIn launch post",
|
|
186
|
+
"order": 5,
|
|
187
|
+
"url": "https://www.linkedin.com/feed/",
|
|
188
|
+
"status": "blocked-until-artifact-url",
|
|
189
|
+
"authRequired": true,
|
|
190
|
+
"humanRequired": true,
|
|
191
|
+
"captchaPossible": true,
|
|
192
|
+
"manualRuleCheckRequired": false,
|
|
193
|
+
"contentEntryIds": ["linkedin-post"],
|
|
194
|
+
"artifactRefs": [
|
|
195
|
+
"docs/paper/publication-pack.json"
|
|
196
|
+
],
|
|
197
|
+
"sourceRefs": ["linkedin-share-help"],
|
|
198
|
+
"operatorChecks": [
|
|
199
|
+
"Paste the final public URL into the share box and wait for the link preview.",
|
|
200
|
+
"Keep the post within LinkedIn's 3000-character text limit.",
|
|
201
|
+
"Do not claim external Mem0/Zep scores unless strict evidence has passed."
|
|
202
|
+
],
|
|
203
|
+
"postSubmitChecks": [
|
|
204
|
+
"Record the LinkedIn post URL.",
|
|
205
|
+
"Verify the preview points at the public paper or repo URL."
|
|
206
|
+
]
|
|
207
|
+
}
|
|
208
|
+
]
|
|
209
|
+
}
|
|
@@ -0,0 +1,100 @@
|
|
|
1
|
+
{
|
|
2
|
+
"$schema": "https://json-schema.org/draft/2020-12/schema",
|
|
3
|
+
"$id": "https://audrey-memory.org/schemas/audrey-browser-launch-plan.schema.json",
|
|
4
|
+
"title": "Audrey Browser Launch Plan",
|
|
5
|
+
"type": "object",
|
|
6
|
+
"additionalProperties": false,
|
|
7
|
+
"required": ["schemaVersion", "suite", "checkedAt", "publicationPack", "sources", "preflightCommands", "targets"],
|
|
8
|
+
"properties": {
|
|
9
|
+
"schemaVersion": { "const": "1.0.0" },
|
|
10
|
+
"suite": { "const": "Audrey browser launch plan" },
|
|
11
|
+
"checkedAt": { "type": "string", "minLength": 1 },
|
|
12
|
+
"publicationPack": { "type": "string", "minLength": 1 },
|
|
13
|
+
"sources": {
|
|
14
|
+
"type": "array",
|
|
15
|
+
"minItems": 1,
|
|
16
|
+
"items": { "$ref": "#/$defs/source" }
|
|
17
|
+
},
|
|
18
|
+
"preflightCommands": {
|
|
19
|
+
"type": "array",
|
|
20
|
+
"minItems": 1,
|
|
21
|
+
"items": { "type": "string", "minLength": 1 }
|
|
22
|
+
},
|
|
23
|
+
"targets": {
|
|
24
|
+
"type": "array",
|
|
25
|
+
"minItems": 1,
|
|
26
|
+
"items": { "$ref": "#/$defs/target" }
|
|
27
|
+
}
|
|
28
|
+
},
|
|
29
|
+
"$defs": {
|
|
30
|
+
"source": {
|
|
31
|
+
"type": "object",
|
|
32
|
+
"additionalProperties": false,
|
|
33
|
+
"required": ["id", "url", "checkedAt", "notes"],
|
|
34
|
+
"properties": {
|
|
35
|
+
"id": { "type": "string", "pattern": "^[a-z0-9][a-z0-9-]*$" },
|
|
36
|
+
"url": { "type": "string", "pattern": "^https://.+" },
|
|
37
|
+
"checkedAt": { "type": "string", "minLength": 1 },
|
|
38
|
+
"notes": { "type": "string", "minLength": 1 }
|
|
39
|
+
}
|
|
40
|
+
},
|
|
41
|
+
"target": {
|
|
42
|
+
"type": "object",
|
|
43
|
+
"additionalProperties": false,
|
|
44
|
+
"required": [
|
|
45
|
+
"id",
|
|
46
|
+
"platform",
|
|
47
|
+
"label",
|
|
48
|
+
"order",
|
|
49
|
+
"url",
|
|
50
|
+
"status",
|
|
51
|
+
"authRequired",
|
|
52
|
+
"humanRequired",
|
|
53
|
+
"captchaPossible",
|
|
54
|
+
"manualRuleCheckRequired",
|
|
55
|
+
"contentEntryIds",
|
|
56
|
+
"artifactRefs",
|
|
57
|
+
"sourceRefs",
|
|
58
|
+
"operatorChecks",
|
|
59
|
+
"postSubmitChecks"
|
|
60
|
+
],
|
|
61
|
+
"properties": {
|
|
62
|
+
"id": { "type": "string", "pattern": "^[a-z0-9][a-z0-9-]*$" },
|
|
63
|
+
"platform": { "enum": ["arxiv", "hacker-news", "linkedin", "reddit", "x"] },
|
|
64
|
+
"label": { "type": "string", "minLength": 1 },
|
|
65
|
+
"order": { "type": "integer", "minimum": 1 },
|
|
66
|
+
"url": { "type": "string", "pattern": "^https://.+" },
|
|
67
|
+
"status": { "enum": ["ready-manual", "blocked-until-artifact-url", "blocked-until-login"] },
|
|
68
|
+
"authRequired": { "type": "boolean" },
|
|
69
|
+
"humanRequired": { "type": "boolean" },
|
|
70
|
+
"captchaPossible": { "type": "boolean" },
|
|
71
|
+
"manualRuleCheckRequired": { "type": "boolean" },
|
|
72
|
+
"contentEntryIds": {
|
|
73
|
+
"type": "array",
|
|
74
|
+
"minItems": 1,
|
|
75
|
+
"items": { "type": "string", "pattern": "^[a-z0-9][a-z0-9-]*$" }
|
|
76
|
+
},
|
|
77
|
+
"artifactRefs": {
|
|
78
|
+
"type": "array",
|
|
79
|
+
"minItems": 1,
|
|
80
|
+
"items": { "type": "string", "minLength": 1 }
|
|
81
|
+
},
|
|
82
|
+
"sourceRefs": {
|
|
83
|
+
"type": "array",
|
|
84
|
+
"minItems": 1,
|
|
85
|
+
"items": { "type": "string", "pattern": "^[a-z0-9][a-z0-9-]*$" }
|
|
86
|
+
},
|
|
87
|
+
"operatorChecks": {
|
|
88
|
+
"type": "array",
|
|
89
|
+
"minItems": 1,
|
|
90
|
+
"items": { "type": "string", "minLength": 1 }
|
|
91
|
+
},
|
|
92
|
+
"postSubmitChecks": {
|
|
93
|
+
"type": "array",
|
|
94
|
+
"minItems": 1,
|
|
95
|
+
"items": { "type": "string", "minLength": 1 }
|
|
96
|
+
}
|
|
97
|
+
}
|
|
98
|
+
}
|
|
99
|
+
}
|
|
100
|
+
}
|
|
@@ -0,0 +1,86 @@
|
|
|
1
|
+
{
|
|
2
|
+
"schemaVersion": "1.0.0",
|
|
3
|
+
"suite": "Audrey browser launch results",
|
|
4
|
+
"capturedAt": "2026-05-13",
|
|
5
|
+
"plan": "docs/paper/browser-launch-plan.json",
|
|
6
|
+
"targets": [
|
|
7
|
+
{
|
|
8
|
+
"id": "arxiv-preprint",
|
|
9
|
+
"platform": "arxiv",
|
|
10
|
+
"status": "pending",
|
|
11
|
+
"publicUrl": null,
|
|
12
|
+
"artifactUrl": "https://paper-site-r3jdakujn-evilanders-projects.vercel.app",
|
|
13
|
+
"submittedAt": null,
|
|
14
|
+
"operatorVerified": false,
|
|
15
|
+
"manualRuleCheckCompleted": true,
|
|
16
|
+
"postSubmitChecksCompleted": [],
|
|
17
|
+
"blocker": "arXiv accepted the paper as submit/7591154, but the account page currently shows status on hold, so no public arXiv identifier or public abstract URL has been assigned yet.",
|
|
18
|
+
"notes": "arXiv support confirmed the active username is Evilands and suspended the duplicate account. The active account was recovered, START NEW SUBMISSION appeared, the verified source package was uploaded, arXiv TeX Live 2025 compiled main.tex to a 34-page PDF successfully, the PDF and HTML previews were opened, metadata was saved with primary category cs.AI and cross-list cs.CR, and the article was submitted on 2026-05-13. A later account refresh still showed submit/7591154 under the active Evilands account with status on hold, so a support follow-up was sent on 2026-05-13 asking whether any author-side action remains or whether it is waiting on arXiv review/moderation. Record the final public arXiv URL after moderation and announcement."
|
|
19
|
+
},
|
|
20
|
+
{
|
|
21
|
+
"id": "hacker-news-show",
|
|
22
|
+
"platform": "hacker-news",
|
|
23
|
+
"status": "submitted",
|
|
24
|
+
"publicUrl": "https://news.ycombinator.com/item?id=48123428",
|
|
25
|
+
"artifactUrl": "https://paper-site-r3jdakujn-evilanders-projects.vercel.app",
|
|
26
|
+
"submittedAt": "2026-05-13T10:44:16-05:00",
|
|
27
|
+
"operatorVerified": true,
|
|
28
|
+
"manualRuleCheckCompleted": true,
|
|
29
|
+
"postSubmitChecksCompleted": [
|
|
30
|
+
"Record the HN item URL.",
|
|
31
|
+
"Stay available to answer questions in the thread without marketing language.",
|
|
32
|
+
"Record the follow-up HN source/repo item URL."
|
|
33
|
+
],
|
|
34
|
+
"blocker": null,
|
|
35
|
+
"notes": "The logged-in Show HN route returned https://news.ycombinator.com/showlim and stated that Show HN submissions are temporarily restricted for this account. A neutral normal HN link submission was made instead through https://news.ycombinator.com/submit with title Audrey: Local-first pre-action memory control for AI agents and URL https://paper-site-r3jdakujn-evilanders-projects.vercel.app/. HN newest showed item 48123428 as 1 point by evilanders with edit/delete controls, confirming account ownership of the submission. The original item exposed no comment box and the HN edit screen only allowed title editing, so a follow-up source submission was posted with title Audrey: local-first memory guard for AI agents (source) and URL https://github.com/Evilander/Audrey at https://news.ycombinator.com/item?id=48123903."
|
|
36
|
+
},
|
|
37
|
+
{
|
|
38
|
+
"id": "reddit-discussion",
|
|
39
|
+
"platform": "reddit",
|
|
40
|
+
"status": "submitted",
|
|
41
|
+
"publicUrl": "https://www.reddit.com/r/ClaudeCode/comments/1tc3dhb/audrey_localfirst_memory_guard_for_claude_code/",
|
|
42
|
+
"artifactUrl": "https://paper-site-r3jdakujn-evilanders-projects.vercel.app",
|
|
43
|
+
"submittedAt": "2026-05-13T10:40:46-05:00",
|
|
44
|
+
"operatorVerified": true,
|
|
45
|
+
"manualRuleCheckCompleted": true,
|
|
46
|
+
"postSubmitChecksCompleted": [
|
|
47
|
+
"Record the Reddit post URL and selected subreddit.",
|
|
48
|
+
"If removed, do not repost without moderator guidance or materially different context.",
|
|
49
|
+
"Verify the original Reddit post body includes the GitHub repo URL.",
|
|
50
|
+
"Verify every Audrey-specific Reddit marketing post, comment, and reply contains the GitHub repo URL."
|
|
51
|
+
],
|
|
52
|
+
"blocker": null,
|
|
53
|
+
"notes": "Submitted to r/ClaudeCode with Showcase flair after reading its current rules. The post discloses builder affiliation and cost, links the public paper/artifact preview plus the GitHub repo URL https://github.com/Evilander/Audrey, and avoids unsupported external Mem0/Zep score claims. A question about Audrey versus PreToolUse plus permissions.deny was answered with the explicit split between static deny rules and learned/contextual memory guards; that parent reply was edited to include the GitHub repo URL (https://old.reddit.com/r/ClaudeCode/comments/1tc3dhb/audrey_localfirst_memory_guard_for_claude_code/olla7zf/). A follow-up question about hook-rule conversion, semantic false positives, and blocked-action UX was answered with local GuardBench scope boundaries and the GitHub repo URL (https://old.reddit.com/r/ClaudeCode/comments/1tc3dhb/audrey_localfirst_memory_guard_for_claude_code/olln5u3/). Moriarty/Dangerous-Jelly2309's GuardBench expansion comment was answered with the repo URL and a priority order for retry-amplification, wrong-environment mutation, author-contradiction, undo-prior-fix, and schema-evolution-blindness (https://old.reddit.com/r/ClaudeCode/comments/1tc3dhb/audrey_localfirst_memory_guard_for_claude_code/olloc0z/). A later Moriarty follow-up about MILP timing, asymmetric false-block/false-allow costs, and structural recurrence under disguise was answered with the GitHub repo URL and GuardBench v2 framing (https://old.reddit.com/r/ClaudeCode/comments/1tc3dhb/audrey_localfirst_memory_guard_for_claude_code/olmj11t/). Earlier r/LocalLLaMA submission was removed by AutoModerator for insufficient subreddit karma (https://www.reddit.com/r/LocalLLaMA/comments/1tc0i6a/audrey_a_localfirst_memory_firewall_for_agents/), so no duplicate LocalLLaMA repost was attempted. Follow-up participation was posted without Audrey links or promo in r/LocalLLaMA (https://old.reddit.com/r/LocalLLaMA/comments/1tc1d3c/is_it_worth_getting_a_5090_for_my_needs/olkulwp/), r/ClaudeAI (https://old.reddit.com/r/ClaudeAI/comments/1tc1o81/i_built_skills_curator_a_contextaware_claude/olkuwsi/), r/ChatGPT (https://old.reddit.com/r/ChatGPT/comments/1tbfzs6/ive_been_customizing_codex_to_do_automated/olkv6fd/), r/codex (https://old.reddit.com/r/codex/comments/1tbyd5c/most_vibecoders_have_poor_project_management/olkvjy3/), r/VibeCodingSaaS (https://old.reddit.com/r/VibeCodingSaaS/comments/1tbf0x7/every_session_ends_with_a_10layer_audit_heres/olkvu31/), r/ClaudeCode memory/guard threads (https://old.reddit.com/r/ClaudeCode/comments/1tc1h7w/are_you_guys_actually_using_memory/olkz22s/ and https://old.reddit.com/r/ClaudeCode/comments/1tc2k1z/one_thumbsdown_stopped_my_claude_code_agent_from/oll34lg/), and an r/artificial agent-security thread (https://old.reddit.com/r/artificial/comments/1tc1570/built_a_tool_that_stops_ai_agents_from_being/oll6eke/). A later r/VibeCodingSaaS memory-freshness discussion explicitly mentioning Audrey was answered with the GitHub repo URL and the same pre-action/staleness framing (https://old.reddit.com/r/VibeCodingSaaS/comments/1tbf0x7/every_session_ends_with_a_10layer_audit_heres/olmj3zt/). An additional VibeCodingSaaS Chrono/time-confidence reply was answered with the GitHub repo URL (https://old.reddit.com/r/VibeCodingSaaS/comments/1tbf0x7/every_session_ends_with_a_10layer_audit_heres/olnft5b/). A later ClaudeCode Moriarty follow-up was answered with the GitHub repo URL (https://old.reddit.com/r/ClaudeCode/comments/1tc3dhb/audrey_localfirst_memory_guard_for_claude_code/olnfzzl/)."
|
|
54
|
+
},
|
|
55
|
+
{
|
|
56
|
+
"id": "x-launch-thread",
|
|
57
|
+
"platform": "x",
|
|
58
|
+
"status": "pending",
|
|
59
|
+
"publicUrl": null,
|
|
60
|
+
"artifactUrl": "https://paper-site-r3jdakujn-evilanders-projects.vercel.app",
|
|
61
|
+
"submittedAt": null,
|
|
62
|
+
"operatorVerified": false,
|
|
63
|
+
"manualRuleCheckCompleted": false,
|
|
64
|
+
"postSubmitChecksCompleted": [],
|
|
65
|
+
"blocker": "Awaiting logged-in X posting; this browser session was confirmed for arXiv, HN, Reddit, and LinkedIn, but an attempt to open X compose redirected to the X login flow instead of a logged-in composer.",
|
|
66
|
+
"notes": "Public artifact URL is available; shorten the first post before posting because the current publication-pack X first post is 282/280 characters after URL reserve. Browser verification on 2026-05-13 reached https://x.com/i/flow/login?redirect_after_login=%2Fcompose%2Fpost, so no X launch thread was submitted."
|
|
67
|
+
},
|
|
68
|
+
{
|
|
69
|
+
"id": "linkedin-launch-post",
|
|
70
|
+
"platform": "linkedin",
|
|
71
|
+
"status": "submitted",
|
|
72
|
+
"publicUrl": "https://www.linkedin.com/feed/update/urn:li:share:7460326224108638208/",
|
|
73
|
+
"artifactUrl": "https://paper-site-r3jdakujn-evilanders-projects.vercel.app",
|
|
74
|
+
"submittedAt": "2026-05-13T08:53:01-05:00",
|
|
75
|
+
"operatorVerified": true,
|
|
76
|
+
"manualRuleCheckCompleted": false,
|
|
77
|
+
"postSubmitChecksCompleted": [
|
|
78
|
+
"Record the LinkedIn post URL.",
|
|
79
|
+
"Verify the preview points at the public paper or repo URL.",
|
|
80
|
+
"Verify the LinkedIn thread includes the GitHub repo URL."
|
|
81
|
+
],
|
|
82
|
+
"blocker": null,
|
|
83
|
+
"notes": "LinkedIn reported Post successful and exposes the post at the recorded update URL; the published post contains the Audrey launch text and LinkedIn's shortened outbound link for the public paper URL. A follow-up comment was posted on the same LinkedIn update with the GitHub repo URL https://github.com/Evilander/Audrey."
|
|
84
|
+
}
|
|
85
|
+
]
|
|
86
|
+
}
|
|
@@ -0,0 +1,66 @@
|
|
|
1
|
+
{
|
|
2
|
+
"$schema": "https://json-schema.org/draft/2020-12/schema",
|
|
3
|
+
"$id": "https://audrey-memory.org/schemas/audrey-browser-launch-results.schema.json",
|
|
4
|
+
"title": "Audrey Browser Launch Results",
|
|
5
|
+
"type": "object",
|
|
6
|
+
"additionalProperties": false,
|
|
7
|
+
"required": ["schemaVersion", "suite", "capturedAt", "plan", "targets"],
|
|
8
|
+
"properties": {
|
|
9
|
+
"schemaVersion": { "const": "1.0.0" },
|
|
10
|
+
"suite": { "const": "Audrey browser launch results" },
|
|
11
|
+
"capturedAt": { "type": "string", "minLength": 1 },
|
|
12
|
+
"plan": { "type": "string", "minLength": 1 },
|
|
13
|
+
"targets": {
|
|
14
|
+
"type": "array",
|
|
15
|
+
"minItems": 1,
|
|
16
|
+
"items": { "$ref": "#/$defs/targetResult" }
|
|
17
|
+
}
|
|
18
|
+
},
|
|
19
|
+
"$defs": {
|
|
20
|
+
"nullableHttpsUrl": {
|
|
21
|
+
"anyOf": [
|
|
22
|
+
{ "type": "null" },
|
|
23
|
+
{ "type": "string", "pattern": "^https://.+" }
|
|
24
|
+
]
|
|
25
|
+
},
|
|
26
|
+
"nullableString": {
|
|
27
|
+
"anyOf": [
|
|
28
|
+
{ "type": "null" },
|
|
29
|
+
{ "type": "string", "minLength": 1 }
|
|
30
|
+
]
|
|
31
|
+
},
|
|
32
|
+
"targetResult": {
|
|
33
|
+
"type": "object",
|
|
34
|
+
"additionalProperties": false,
|
|
35
|
+
"required": [
|
|
36
|
+
"id",
|
|
37
|
+
"platform",
|
|
38
|
+
"status",
|
|
39
|
+
"publicUrl",
|
|
40
|
+
"artifactUrl",
|
|
41
|
+
"submittedAt",
|
|
42
|
+
"operatorVerified",
|
|
43
|
+
"manualRuleCheckCompleted",
|
|
44
|
+
"postSubmitChecksCompleted",
|
|
45
|
+
"blocker",
|
|
46
|
+
"notes"
|
|
47
|
+
],
|
|
48
|
+
"properties": {
|
|
49
|
+
"id": { "type": "string", "pattern": "^[a-z0-9][a-z0-9-]*$" },
|
|
50
|
+
"platform": { "enum": ["arxiv", "hacker-news", "linkedin", "reddit", "x"] },
|
|
51
|
+
"status": { "enum": ["pending", "submitted", "skipped", "failed"] },
|
|
52
|
+
"publicUrl": { "$ref": "#/$defs/nullableHttpsUrl" },
|
|
53
|
+
"artifactUrl": { "$ref": "#/$defs/nullableHttpsUrl" },
|
|
54
|
+
"submittedAt": { "$ref": "#/$defs/nullableString" },
|
|
55
|
+
"operatorVerified": { "type": "boolean" },
|
|
56
|
+
"manualRuleCheckCompleted": { "type": "boolean" },
|
|
57
|
+
"postSubmitChecksCompleted": {
|
|
58
|
+
"type": "array",
|
|
59
|
+
"items": { "type": "string", "minLength": 1 }
|
|
60
|
+
},
|
|
61
|
+
"blocker": { "$ref": "#/$defs/nullableString" },
|
|
62
|
+
"notes": { "type": "string", "minLength": 1 }
|
|
63
|
+
}
|
|
64
|
+
}
|
|
65
|
+
}
|
|
66
|
+
}
|
|
@@ -0,0 +1,138 @@
|
|
|
1
|
+
{
|
|
2
|
+
"schemaVersion": "1.0.0",
|
|
3
|
+
"suite": "Audrey paper claim register",
|
|
4
|
+
"claims": [
|
|
5
|
+
{
|
|
6
|
+
"id": "C01",
|
|
7
|
+
"status": "supported",
|
|
8
|
+
"claim": "Audrey Guard passes the local Stage-A GuardBench comparative suite without leaking seeded secrets in published artifacts.",
|
|
9
|
+
"evidence": [
|
|
10
|
+
"benchmarks/output/guardbench-summary.json",
|
|
11
|
+
"benchmarks/output/guardbench-raw.json",
|
|
12
|
+
"docs/paper/evidence-ledger.md#E46",
|
|
13
|
+
"docs/paper/evidence-ledger.md#E65"
|
|
14
|
+
],
|
|
15
|
+
"artifactChecks": [
|
|
16
|
+
"guardbench-local-passed",
|
|
17
|
+
"no-published-secret-leaks"
|
|
18
|
+
],
|
|
19
|
+
"requiredText": [
|
|
20
|
+
{
|
|
21
|
+
"path": "README.md",
|
|
22
|
+
"text": "Latest local result in this checkout: 10/10 scenarios passed"
|
|
23
|
+
},
|
|
24
|
+
{
|
|
25
|
+
"path": "docs/paper/audrey-paper-v1.md",
|
|
26
|
+
"text": "Local comparative GuardBench reports decision accuracy and full-contract pass rate across all ten scenarios"
|
|
27
|
+
}
|
|
28
|
+
],
|
|
29
|
+
"forbiddenText": []
|
|
30
|
+
},
|
|
31
|
+
{
|
|
32
|
+
"id": "C02",
|
|
33
|
+
"status": "pending",
|
|
34
|
+
"claim": "External Mem0 and Zep GuardBench scores are not reported until credentialed live bundles pass strict evidence verification.",
|
|
35
|
+
"evidence": [
|
|
36
|
+
"benchmarks/output/external/guardbench-external-evidence.json",
|
|
37
|
+
"benchmarks/adapters/registry.json",
|
|
38
|
+
"docs/paper/evidence-ledger.md#E77",
|
|
39
|
+
"docs/paper/evidence-ledger.md#E81"
|
|
40
|
+
],
|
|
41
|
+
"artifactChecks": [
|
|
42
|
+
"adapter-registry-has-mem0-zep",
|
|
43
|
+
"external-evidence-pending",
|
|
44
|
+
"paper-stage-boundary-excludes-external-scores"
|
|
45
|
+
],
|
|
46
|
+
"requiredText": [
|
|
47
|
+
{
|
|
48
|
+
"path": "docs/paper/audrey-paper-v1.md",
|
|
49
|
+
"text": "this paper does not report external-system GuardBench scores"
|
|
50
|
+
},
|
|
51
|
+
{
|
|
52
|
+
"path": "docs/paper/SUBMISSION_README.md",
|
|
53
|
+
"text": "live Mem0 run is still pending"
|
|
54
|
+
},
|
|
55
|
+
{
|
|
56
|
+
"path": "docs/paper/SUBMISSION_README.md",
|
|
57
|
+
"text": "live Zep run is still pending"
|
|
58
|
+
}
|
|
59
|
+
],
|
|
60
|
+
"forbiddenText": [
|
|
61
|
+
{
|
|
62
|
+
"path": "docs/paper/audrey-paper-v1.md",
|
|
63
|
+
"text": "Mem0 Platform passes 10/10"
|
|
64
|
+
},
|
|
65
|
+
{
|
|
66
|
+
"path": "docs/paper/audrey-paper-v1.md",
|
|
67
|
+
"text": "Zep Cloud passes 10/10"
|
|
68
|
+
},
|
|
69
|
+
{
|
|
70
|
+
"path": "README.md",
|
|
71
|
+
"text": "external-system scores are reported"
|
|
72
|
+
}
|
|
73
|
+
]
|
|
74
|
+
},
|
|
75
|
+
{
|
|
76
|
+
"id": "C03",
|
|
77
|
+
"status": "supported",
|
|
78
|
+
"claim": "The public GuardBench artifact set has a one-command verifier that covers registry, modules, self-test, artifacts, bundle, external readiness, external evidence, and leaderboard.",
|
|
79
|
+
"evidence": [
|
|
80
|
+
"benchmarks/verify-publication-artifacts.mjs",
|
|
81
|
+
"benchmarks/schemas/guardbench-publication-verification.schema.json",
|
|
82
|
+
"docs/paper/evidence-ledger.md#E75",
|
|
83
|
+
"docs/paper/evidence-ledger.md#E80",
|
|
84
|
+
"docs/paper/evidence-ledger.md#E81"
|
|
85
|
+
],
|
|
86
|
+
"artifactChecks": [
|
|
87
|
+
"publication-verifier-ok"
|
|
88
|
+
],
|
|
89
|
+
"requiredText": [
|
|
90
|
+
{
|
|
91
|
+
"path": "README.md",
|
|
92
|
+
"text": "bench:guard:publication:verify"
|
|
93
|
+
},
|
|
94
|
+
{
|
|
95
|
+
"path": "docs/paper/audrey-paper-v1.md",
|
|
96
|
+
"text": "external evidence verification report"
|
|
97
|
+
}
|
|
98
|
+
],
|
|
99
|
+
"forbiddenText": []
|
|
100
|
+
},
|
|
101
|
+
{
|
|
102
|
+
"id": "C04",
|
|
103
|
+
"status": "supported",
|
|
104
|
+
"claim": "Published benchmark artifacts and external evidence reports do not contain seeded raw secrets or runtime credential values.",
|
|
105
|
+
"evidence": [
|
|
106
|
+
"benchmarks/output/guardbench-summary.json",
|
|
107
|
+
"benchmarks/output/guardbench-raw.json",
|
|
108
|
+
"benchmarks/output/external/guardbench-external-evidence.json",
|
|
109
|
+
"docs/paper/evidence-ledger.md#E65",
|
|
110
|
+
"docs/paper/evidence-ledger.md#E81"
|
|
111
|
+
],
|
|
112
|
+
"artifactChecks": [
|
|
113
|
+
"no-published-secret-leaks",
|
|
114
|
+
"external-evidence-no-secrets"
|
|
115
|
+
],
|
|
116
|
+
"requiredText": [
|
|
117
|
+
{
|
|
118
|
+
"path": "README.md",
|
|
119
|
+
"text": "0 published artifact leaks"
|
|
120
|
+
},
|
|
121
|
+
{
|
|
122
|
+
"path": "docs/paper/SUBMISSION_README.md",
|
|
123
|
+
"text": "runtime credential leaks"
|
|
124
|
+
}
|
|
125
|
+
],
|
|
126
|
+
"forbiddenText": [
|
|
127
|
+
{
|
|
128
|
+
"path": "benchmarks/output/guardbench-summary.json",
|
|
129
|
+
"text": "sk-guardbench-secret-0000000000000000000000000000"
|
|
130
|
+
},
|
|
131
|
+
{
|
|
132
|
+
"path": "benchmarks/output/external/guardbench-external-evidence.json",
|
|
133
|
+
"text": "runtime-key"
|
|
134
|
+
}
|
|
135
|
+
]
|
|
136
|
+
}
|
|
137
|
+
]
|
|
138
|
+
}
|