@beyondwork/docx-react-component 1.0.0 → 1.0.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (560)
  1. package/README.md +44 -104
  2. package/package.json +66 -15
  3. package/src/api/public-types.ts +1 -1
  4. package/src/compare/diff-engine.ts +530 -0
  5. package/src/compare/export-redlines.ts +162 -0
  6. package/src/compare/snapshot.ts +37 -0
  7. package/src/core/commands/index.ts +1 -1
  8. package/src/core/state/editor-state.ts +2 -2
  9. package/src/index.ts +45 -0
  10. package/src/legal/bookmarks.ts +196 -0
  11. package/src/legal/cross-references.ts +356 -0
  12. package/src/legal/defined-terms.ts +203 -0
  13. package/src/runtime/document-runtime.ts +3 -5
  14. package/src/runtime/table-commands.ts +4 -1
  15. package/src/runtime/table-schema.ts +17 -2
  16. package/src/runtime/virtualized-rendering.ts +258 -0
  17. package/src/ui/WordReviewEditor.tsx +256 -35
  18. package/src/ui-tailwind/editor-surface/tw-editor-surface.tsx +2 -2
  19. package/src/ui-tailwind/editor-surface/tw-table-node-view.tsx +16 -2
  20. package/.codex/config.toml +0 -5
  21. package/.corepack/v1/pnpm/10.30.3/.corepack +0 -1
  22. package/.corepack/v1/pnpm/10.30.3/LICENSE +0 -22
  23. package/.corepack/v1/pnpm/10.30.3/README.md +0 -240
  24. package/.corepack/v1/pnpm/10.30.3/dist/node-gyp-bin/node-gyp +0 -6
  25. package/.corepack/v1/pnpm/10.30.3/dist/node-gyp-bin/node-gyp.cmd +0 -5
  26. package/.corepack/v1/pnpm/10.30.3/dist/pnpm.cjs +0 -195400
  27. package/.corepack/v1/pnpm/10.30.3/dist/pnpmrc +0 -2
  28. package/.corepack/v1/pnpm/10.30.3/dist/reflink.darwin-arm64-2HJ4WGO6.node +0 -0
  29. package/.corepack/v1/pnpm/10.30.3/dist/reflink.darwin-x64-3G3H6IW4.node +0 -0
  30. package/.corepack/v1/pnpm/10.30.3/dist/reflink.win32-arm64-msvc-Q6BARPPB.node +0 -0
  31. package/.corepack/v1/pnpm/10.30.3/dist/reflink.win32-x64-msvc-J2TZHRQI.node +0 -0
  32. package/.corepack/v1/pnpm/10.30.3/dist/templates/completion.bash +0 -31
  33. package/.corepack/v1/pnpm/10.30.3/dist/templates/completion.fish +0 -22
  34. package/.corepack/v1/pnpm/10.30.3/dist/templates/completion.ps1 +0 -193
  35. package/.corepack/v1/pnpm/10.30.3/dist/templates/completion.zsh +0 -27
  36. package/.corepack/v1/pnpm/10.30.3/dist/vendor/fastlist-0.3.0-x64.exe +0 -0
  37. package/.corepack/v1/pnpm/10.30.3/dist/vendor/fastlist-0.3.0-x86.exe +0 -0
  38. package/.corepack/v1/pnpm/10.30.3/dist/worker.js +0 -10119
  39. package/.corepack/v1/pnpm/10.30.3/package.json +0 -192
  40. package/.cursor/mcp.json +0 -7
  41. package/.github/workflows/ci.yml +0 -35
  42. package/.mcp.json +0 -7
  43. package/.openclaw/workspace-state.json +0 -4
  44. package/.pnpmrc.json +0 -1
  45. package/.wave-launch.sh +0 -7
  46. package/.workspace-marker +0 -1
  47. package/AGENTS.md +0 -78
  48. package/CHANGELOG.md +0 -177
  49. package/DESIGN.md +0 -929
  50. package/HEARTBEAT.md +0 -7
  51. package/IDENTITY.md +0 -23
  52. package/SOUL.md +0 -36
  53. package/TOOLS.md +0 -40
  54. package/USER.md +0 -17
  55. package/docs/README.md +0 -107
  56. package/docs/agents/wave-cont-eval-role.md +0 -36
  57. package/docs/agents/wave-cont-qa-role.md +0 -52
  58. package/docs/agents/wave-deploy-verifier-role.md +0 -34
  59. package/docs/agents/wave-design-role.md +0 -47
  60. package/docs/agents/wave-documentation-role.md +0 -34
  61. package/docs/agents/wave-infra-role.md +0 -34
  62. package/docs/agents/wave-integration-role.md +0 -37
  63. package/docs/agents/wave-launcher-role.md +0 -41
  64. package/docs/agents/wave-orchestrator-role.md +0 -52
  65. package/docs/agents/wave-planner-role.md +0 -39
  66. package/docs/agents/wave-security-role.md +0 -40
  67. package/docs/architecture/docx/README.md +0 -10
  68. package/docs/architecture/future/README.md +0 -8
  69. package/docs/architecture/ooxml-upgrade-analysis.md +0 -134
  70. package/docs/architecture/platform/shared-openxml-editor-platform.md +0 -153
  71. package/docs/architecture/xlsx/canonical-workbook-model-and-commands.md +0 -187
  72. package/docs/architecture/xlsx/spreadsheet-editor-frontend-architecture.md +0 -150
  73. package/docs/comment-redline-overview.md +0 -350
  74. package/docs/concepts/context7-vs-skills.md +0 -118
  75. package/docs/concepts/operating-modes.md +0 -91
  76. package/docs/concepts/runtime-agnostic-orchestration.md +0 -111
  77. package/docs/concepts/what-is-a-wave.md +0 -217
  78. package/docs/context7/bundles.json +0 -222
  79. package/docs/context7/planner-agent/README.md +0 -28
  80. package/docs/context7/planner-agent/manifest.json +0 -83
  81. package/docs/context7/planner-agent/papers/cooperbench-why-coding-agents-cannot-be-your-teammates-yet.md +0 -3283
  82. package/docs/context7/planner-agent/papers/dova-deliberation-first-multi-agent-orchestration-for-autonomous-research-automation.md +0 -1699
  83. package/docs/context7/planner-agent/papers/dpbench-large-language-models-struggle-with-simultaneous-coordination.md +0 -2251
  84. package/docs/context7/planner-agent/papers/incremental-planning-to-control-a-blackboard-based-problem-solver.md +0 -1729
  85. package/docs/context7/planner-agent/papers/silo-bench-a-scalable-environment-for-evaluating-distributed-coordination-in-multi-agent-llm-systems.md +0 -3747
  86. package/docs/context7/planner-agent/papers/todoevolve-learning-to-architect-agent-planning-systems.md +0 -1675
  87. package/docs/context7/planner-agent/papers/verified-multi-agent-orchestration-a-plan-execute-verify-replan-framework-for-complex-query-resolution.md +0 -1173
  88. package/docs/context7/planner-agent/papers/why-do-multi-agent-llm-systems-fail.md +0 -5211
  89. package/docs/context7/planner-agent/topics/planning-and-orchestration.md +0 -24
  90. package/docs/evals/arm-templates/README.md +0 -13
  91. package/docs/evals/arm-templates/full-wave.json +0 -15
  92. package/docs/evals/arm-templates/single-agent.json +0 -15
  93. package/docs/evals/benchmark-catalog.json +0 -670
  94. package/docs/evals/cases/README.md +0 -47
  95. package/docs/evals/cases/wave-blackboard-inbox-targeting.json +0 -73
  96. package/docs/evals/cases/wave-contradiction-conflict.json +0 -104
  97. package/docs/evals/cases/wave-expert-routing-preservation.json +0 -69
  98. package/docs/evals/cases/wave-hidden-profile-private-evidence.json +0 -81
  99. package/docs/evals/cases/wave-premature-closure-guard.json +0 -71
  100. package/docs/evals/cases/wave-silo-cross-agent-state.json +0 -77
  101. package/docs/evals/cases/wave-simultaneous-lockstep.json +0 -92
  102. package/docs/evals/external-benchmarks.json +0 -85
  103. package/docs/evals/external-command-config.sample.json +0 -9
  104. package/docs/evals/external-command-config.swe-bench-pro.json +0 -8
  105. package/docs/evals/pilots/README.md +0 -47
  106. package/docs/evals/pilots/swe-bench-pro-public-full-wave-review-10.json +0 -64
  107. package/docs/evals/pilots/swe-bench-pro-public-pilot.json +0 -111
  108. package/docs/evals/wave-benchmark-program.md +0 -302
  109. package/docs/guides/planner.md +0 -220
  110. package/docs/guides/recommendations-0.8.9.md +0 -133
  111. package/docs/guides/signal-wrappers.md +0 -165
  112. package/docs/guides/terminal-surfaces.md +0 -96
  113. package/docs/image copy.png +0 -0
  114. package/docs/image.png +0 -0
  115. package/docs/images/image.png +0 -0
  116. package/docs/legal-feedback-architecture.md +0 -498
  117. package/docs/plans/component-cutover-matrix.json +0 -1072
  118. package/docs/plans/component-cutover-matrix.md +0 -307
  119. package/docs/plans/context7-wave-orchestrator.md +0 -155
  120. package/docs/plans/current-state.md +0 -198
  121. package/docs/plans/docx/README.md +0 -9
  122. package/docs/plans/examples/wave-benchmark-improvement.md +0 -108
  123. package/docs/plans/examples/wave-example-live-proof.md +0 -435
  124. package/docs/plans/master-plan.md +0 -224
  125. package/docs/plans/migration.md +0 -538
  126. package/docs/plans/operations/README.md +0 -7
  127. package/docs/plans/operations/wave-10-word-certification.md +0 -87
  128. package/docs/plans/operations/wave-8-railway-staging.md +0 -153
  129. package/docs/plans/operations/wave-9-manual-certification.md +0 -73
  130. package/docs/plans/platform/README.md +0 -9
  131. package/docs/plans/reference/legal-checklist-coverage.md +0 -258
  132. package/docs/plans/wave-orchestrator.md +0 -423
  133. package/docs/plans/waves/README.md +0 -75
  134. package/docs/plans/waves/completed/wave-0.md +0 -195
  135. package/docs/plans/waves/completed/wave-1.md +0 -379
  136. package/docs/plans/waves/completed/wave-10.md +0 -670
  137. package/docs/plans/waves/completed/wave-11.md +0 -335
  138. package/docs/plans/waves/completed/wave-12.md +0 -417
  139. package/docs/plans/waves/completed/wave-13.md +0 -316
  140. package/docs/plans/waves/completed/wave-14.md +0 -319
  141. package/docs/plans/waves/completed/wave-15.md +0 -321
  142. package/docs/plans/waves/completed/wave-16.md +0 -316
  143. package/docs/plans/waves/completed/wave-17.md +0 -331
  144. package/docs/plans/waves/completed/wave-18.md +0 -328
  145. package/docs/plans/waves/completed/wave-2.md +0 -438
  146. package/docs/plans/waves/completed/wave-3.md +0 -435
  147. package/docs/plans/waves/completed/wave-4.md +0 -430
  148. package/docs/plans/waves/completed/wave-5.md +0 -430
  149. package/docs/plans/waves/completed/wave-6.md +0 -430
  150. package/docs/plans/waves/completed/wave-7.md +0 -526
  151. package/docs/plans/waves/completed/wave-8.md +0 -596
  152. package/docs/plans/waves/completed/wave-9.md +0 -552
  153. package/docs/plans/waves/deferred/README.md +0 -14
  154. package/docs/plans/waves/deferred/encrypted-intake-contracts.md +0 -282
  155. package/docs/plans/waves/deferred/legal-feedback-wave-expansion.md +0 -308
  156. package/docs/plans/waves/deferred/wave-encrypted-intake.md +0 -451
  157. package/docs/plans/waves/design/README.md +0 -5
  158. package/docs/plans/waves/design/wave-1-a1.md +0 -309
  159. package/docs/plans/waves/reviews/README.md +0 -5
  160. package/docs/plans/waves/reviews/wave-0-cont-qa.md +0 -151
  161. package/docs/plans/waves/reviews/wave-1-cont-qa.md +0 -46
  162. package/docs/plans/waves/reviews/wave-10-accessibility-and-design.md +0 -51
  163. package/docs/plans/waves/reviews/wave-10-cont-qa.md +0 -24
  164. package/docs/plans/waves/reviews/wave-10-dashboard-proof.md +0 -46
  165. package/docs/plans/waves/reviews/wave-10-performance-signoff.md +0 -55
  166. package/docs/plans/waves/reviews/wave-10-regression-proof.md +0 -23
  167. package/docs/plans/waves/reviews/wave-10-release-audit.md +0 -31
  168. package/docs/plans/waves/reviews/wave-10-service-proof.md +0 -83
  169. package/docs/plans/waves/reviews/wave-10-word-certification.md +0 -31
  170. package/docs/plans/waves/reviews/wave-18-ai-contract-closure.md +0 -277
  171. package/docs/plans/waves/reviews/wave-18-cont-qa.md +0 -255
  172. package/docs/plans/waves/reviews/wave-18-parity-proof.md +0 -271
  173. package/docs/plans/waves/reviews/wave-19-cont-qa.md +0 -59
  174. package/docs/plans/waves/reviews/wave-2-cont-qa.md +0 -72
  175. package/docs/plans/waves/reviews/wave-20-cont-qa.md +0 -60
  176. package/docs/plans/waves/reviews/wave-25-cont-qa.md +0 -48
  177. package/docs/plans/waves/reviews/wave-28-cont-qa.md +0 -46
  178. package/docs/plans/waves/reviews/wave-29-cont-qa.md +0 -53
  179. package/docs/plans/waves/reviews/wave-3-cont-qa.md +0 -53
  180. package/docs/plans/waves/reviews/wave-3-core-proof.md +0 -77
  181. package/docs/plans/waves/reviews/wave-3-validator-proof.md +0 -73
  182. package/docs/plans/waves/reviews/wave-32-cont-qa.md +0 -43
  183. package/docs/plans/waves/reviews/wave-33-cont-qa.md +0 -526
  184. package/docs/plans/waves/reviews/wave-34-cont-qa.md +0 -100
  185. package/docs/plans/waves/reviews/wave-35-cont-qa.md +0 -145
  186. package/docs/plans/waves/reviews/wave-4-cont-qa.md +0 -47
  187. package/docs/plans/waves/reviews/wave-4-structure-proof.md +0 -69
  188. package/docs/plans/waves/reviews/wave-5-comment-proof.md +0 -158
  189. package/docs/plans/waves/reviews/wave-5-cont-qa.md +0 -68
  190. package/docs/plans/waves/reviews/wave-6-cont-qa.md +0 -416
  191. package/docs/plans/waves/reviews/wave-6-redline-proof.md +0 -130
  192. package/docs/plans/waves/reviews/wave-7-cont-qa.md +0 -82
  193. package/docs/plans/waves/reviews/wave-7-ooxml-compliance.md +0 -85
  194. package/docs/plans/waves/reviews/wave-7-preservation-proof.md +0 -119
  195. package/docs/plans/waves/reviews/wave-7-trust-ux.md +0 -87
  196. package/docs/plans/waves/reviews/wave-8-accessibility-and-design.md +0 -128
  197. package/docs/plans/waves/reviews/wave-8-cont-qa.md +0 -92
  198. package/docs/plans/waves/reviews/wave-8-live-proof.md +0 -140
  199. package/docs/plans/waves/reviews/wave-8-security.md +0 -47
  200. package/docs/plans/waves/reviews/wave-9-editor-embedding.md +0 -39
  201. package/docs/plans/waves/reviews/wave-9-fixture-runner.md +0 -56
  202. package/docs/plans/waves/reviews/wave-9-live-proof.md +0 -105
  203. package/docs/plans/waves/reviews/wave-9-usability-and-performance.md +0 -152
  204. package/docs/plans/waves/specs/README.md +0 -5
  205. package/docs/plans/waves/specs/wave-1-component-boundaries.md +0 -322
  206. package/docs/plans/waves/specs/wave-1-ooxml-contracts.md +0 -323
  207. package/docs/plans/waves/specs/wave-1-review-and-ui-contracts.md +0 -339
  208. package/docs/plans/waves/specs/wave-1-runtime-contracts.md +0 -509
  209. package/docs/plans/waves/wave-19.md +0 -341
  210. package/docs/plans/waves/wave-20.md +0 -308
  211. package/docs/plans/waves/wave-21.md +0 -289
  212. package/docs/plans/waves/wave-22.md +0 -221
  213. package/docs/plans/waves/wave-23.md +0 -295
  214. package/docs/plans/waves/wave-24.md +0 -286
  215. package/docs/plans/waves/wave-25.md +0 -313
  216. package/docs/plans/waves/wave-26.md +0 -300
  217. package/docs/plans/waves/wave-27.md +0 -299
  218. package/docs/plans/waves/wave-28.md +0 -368
  219. package/docs/plans/waves/wave-29.md +0 -303
  220. package/docs/plans/waves/wave-30.md +0 -307
  221. package/docs/plans/waves/wave-31.md +0 -231
  222. package/docs/plans/waves/wave-32.md +0 -152
  223. package/docs/plans/waves/wave-33.md +0 -147
  224. package/docs/plans/waves/wave-34.md +0 -148
  225. package/docs/plans/waves/wave-35.md +0 -141
  226. package/docs/plans/waves/wave-36.md +0 -146
  227. package/docs/plans/xlsx/README.md +0 -14
  228. package/docs/plans/xlsx/xlsx-fixture-corpus-and-certification-plan.md +0 -126
  229. package/docs/reference/cli-reference.md +0 -600
  230. package/docs/reference/coordination-and-closure.md +0 -487
  231. package/docs/reference/deep-research-report (15).md +0 -25
  232. package/docs/reference/docx/README.md +0 -10
  233. package/docs/reference/legal-checklist.md +0 -445
  234. package/docs/reference/live-proof-waves.md +0 -199
  235. package/docs/reference/ooxml-compliance.md +0 -129
  236. package/docs/reference/ooxml-feature-parity-matrix.md +0 -172
  237. package/docs/reference/platform/shared-ooxml-platform-guidance.md +0 -77
  238. package/docs/reference/prototype-agent-prompt-legal-fidelity.md +0 -155
  239. package/docs/reference/public-api.md +0 -456
  240. package/docs/reference/repository-guidance.md +0 -58
  241. package/docs/reference/runtime-config/README.md +0 -182
  242. package/docs/reference/runtime-config/claude.md +0 -110
  243. package/docs/reference/runtime-config/codex.md +0 -82
  244. package/docs/reference/runtime-config/opencode.md +0 -93
  245. package/docs/reference/sample-waves.md +0 -105
  246. package/docs/reference/skills.md +0 -237
  247. package/docs/reference/templates/AGENTS.md +0 -78
  248. package/docs/reference/templates/HEARTBEAT.md +0 -7
  249. package/docs/reference/templates/IDENTITY.md +0 -23
  250. package/docs/reference/templates/SOUL.md +0 -36
  251. package/docs/reference/templates/TOOLS.md +0 -40
  252. package/docs/reference/templates/USER.md +0 -17
  253. package/docs/reference/wave-control.md +0 -184
  254. package/docs/reference/wave-planning-lessons.md +0 -167
  255. package/docs/reference/word-review-editor-frontend-architecture.md +0 -479
  256. package/docs/reference/word-review-editor-ux-guide.md +0 -253
  257. package/docs/reference/xlsx/xlsx-ooxml-compliance.md +0 -137
  258. package/docs/research/agent-context-sources.md +0 -178
  259. package/docs/research/coordination-failure-review.md +0 -290
  260. package/docs/research/docx-react-component/Canonical Document Schema Specification for a React-based Word-compatible Editor.md +0 -2317
  261. package/docs/research/docx-react-component/Feature Compatibility Matrix for a React Word Compatible Legal Editor v1.md +0 -219
  262. package/docs/research/docx-react-component/React Component Architecture and Front-End Structure Specification for a Word-Compatible Legal Review Editor.md +0 -1112
  263. package/docs/research/docx-react-component/document_compatibility_and_testing_spec.md +0 -751
  264. package/docs/research/xlsx/raw/README.md +0 -13
  265. package/docs/roadmap.md +0 -174
  266. package/docs/superpowers/plans/2026-03-28-harness-control-bar.md +0 -677
  267. package/docs/superpowers/specs/2026-03-28-harness-control-bar-design.md +0 -274
  268. package/docs/xlsx-react/README.md +0 -38
  269. package/docs/xlsx-react/agent-llm-interaction-layer-docx-xlsx.md +0 -621
  270. package/docs/xlsx-react/canonical-workbook-model-and-commands.md +0 -948
  271. package/docs/xlsx-react/shared-openxml-editor-platform-docx-xlsx.md +0 -228
  272. package/docs/xlsx-react/spreadsheet-editor-component-architecture.md +0 -809
  273. package/docs/xlsx-react/spreadsheet-editor-frontend-architecture.md +0 -537
  274. package/docs/xlsx-react/spreadsheet-editor-ux-guide.md +0 -520
  275. package/docs/xlsx-react/xlsx-editor-research-pack.md +0 -871
  276. package/docs/xlsx-react/xlsx-fixture-corpus-and-certification-plan.md +0 -436
  277. package/docs/xlsx-react/xlsx-ooxml-compliance.md +0 -320
  278. package/examples/README.md +0 -16
  279. package/memory/MEMORY.md +0 -24
  280. package/pnpm-workspace.yaml +0 -4
  281. package/scripts/check-no-authored-js.sh +0 -13
  282. package/scripts/context7-api-check.sh +0 -65
  283. package/scripts/context7-export-env.sh +0 -42
  284. package/scripts/run-context7-mcp.sh +0 -8
  285. package/scripts/run-workspace-tests.sh +0 -15
  286. package/scripts/start-wave-10-local.sh +0 -189
  287. package/scripts/wave-agent-attach.sh +0 -47
  288. package/scripts/wave-auto-answer.sh +0 -118
  289. package/scripts/wave-dashboard-attach.sh +0 -13
  290. package/scripts/wave-launch.sh +0 -273
  291. package/scripts/wave-overnight-supervisor.sh +0 -145
  292. package/scripts/wave-status.sh +0 -379
  293. package/scripts/wave-watch.sh +0 -231
  294. package/services/README.md +0 -17
  295. package/services/openxml-validator/Dockerfile +0 -29
  296. package/services/openxml-validator/OpenXmlValidator.Api.csproj +0 -12
  297. package/services/openxml-validator/Program.cs +0 -436
  298. package/services/openxml-validator/README.md +0 -152
  299. package/services/openxml-validator/railway.json +0 -16
  300. package/services/react-word-editor/.tmp-a4/src/api/public-types.ts +0 -318
  301. package/services/react-word-editor/.tmp-a4/src/ui/WordReviewEditor.tsx +0 -1302
  302. package/services/react-word-editor/.tmp-a4/src/ui/editor-surface/editor-surface.tsx +0 -546
  303. package/services/react-word-editor/.tmp-a4/test/ui/word-review-editor.test.tsx +0 -146
  304. package/services/react-word-editor/.tmp-a4-build/src/api/public-types.js +0 -2
  305. package/services/react-word-editor/.tmp-a4-build/src/ui/WordReviewEditor.js +0 -818
  306. package/services/react-word-editor/.tmp-a4-build/src/ui/editor-surface/editor-surface.js +0 -229
  307. package/services/react-word-editor/.tmp-a4-build/test/ui/word-review-editor.test.js +0 -121
  308. package/services/react-word-editor/.tmp-wave-4-a3-tsconfig.json +0 -21
  309. package/services/react-word-editor/.tmp-wave-4-a3-tsconfig.tsbuildinfo +0 -1
  310. package/services/react-word-editor/Dockerfile +0 -26
  311. package/services/react-word-editor/README.md +0 -254
  312. package/services/react-word-editor/app/api/certification/route.ts +0 -79
  313. package/services/react-word-editor/app/api/demo-sessions/route.ts +0 -109
  314. package/services/react-word-editor/app/api/deploy-health/route.ts +0 -23
  315. package/services/react-word-editor/app/api/exports/[exportId]/route.ts +0 -34
  316. package/services/react-word-editor/app/api/exports/route.ts +0 -81
  317. package/services/react-word-editor/app/api/fixtures/[fixtureId]/run/route.ts +0 -100
  318. package/services/react-word-editor/app/api/health/route.ts +0 -70
  319. package/services/react-word-editor/app/api/runs/[runId]/route.ts +0 -36
  320. package/services/react-word-editor/app/api/scenarios/[scenarioId]/run/route.ts +0 -85
  321. package/services/react-word-editor/app/api/sessions/[sessionId]/route.ts +0 -199
  322. package/services/react-word-editor/app/api/sessions/[sessionId]/source/route.ts +0 -45
  323. package/services/react-word-editor/app/api/uploads/route.ts +0 -70
  324. package/services/react-word-editor/app/api/validate/route.ts +0 -310
  325. package/services/react-word-editor/app/certification/[runId]/page.tsx +0 -14
  326. package/services/react-word-editor/app/certification/page.tsx +0 -32
  327. package/services/react-word-editor/app/dashboard/page.tsx +0 -7
  328. package/services/react-word-editor/app/demo/page.tsx +0 -30
  329. package/services/react-word-editor/app/demo/prototype-client.tsx +0 -1080
  330. package/services/react-word-editor/app/editor/[sessionId]/page.tsx +0 -33
  331. package/services/react-word-editor/app/fixtures/page.tsx +0 -7
  332. package/services/react-word-editor/app/globals.css +0 -121
  333. package/services/react-word-editor/app/layout.tsx +0 -32
  334. package/services/react-word-editor/app/page.tsx +0 -30
  335. package/services/react-word-editor/app/runs/[runId]/page.tsx +0 -34
  336. package/services/react-word-editor/app/wave-10-word-review/page.tsx +0 -7
  337. package/services/react-word-editor/components/harness-control-bar.tsx +0 -289
  338. package/services/react-word-editor/components/harness-editor-session-client.tsx +0 -1214
  339. package/services/react-word-editor/components/harness-workspace-page.tsx +0 -715
  340. package/services/react-word-editor/components/reduced-motion-toggle.tsx +0 -79
  341. package/services/react-word-editor/components/workspace-certification-panel.tsx +0 -307
  342. package/services/react-word-editor/lib/certification-bundle.ts +0 -796
  343. package/services/react-word-editor/lib/certification-store.ts +0 -661
  344. package/services/react-word-editor/lib/demo-fixtures.test.mjs +0 -195
  345. package/services/react-word-editor/lib/demo-fixtures.ts +0 -1519
  346. package/services/react-word-editor/lib/editor-session-summary.test.mjs +0 -68
  347. package/services/react-word-editor/lib/editor-session-summary.ts +0 -14
  348. package/services/react-word-editor/lib/editor-session.ts +0 -228
  349. package/services/react-word-editor/lib/exports-route.test.mjs +0 -32
  350. package/services/react-word-editor/lib/harness-client.ts +0 -347
  351. package/services/react-word-editor/lib/harness-config.json +0 -30
  352. package/services/react-word-editor/lib/harness-config.test.mjs +0 -31
  353. package/services/react-word-editor/lib/harness-config.ts +0 -21
  354. package/services/react-word-editor/lib/harness-editor-datastore.test.mjs +0 -220
  355. package/services/react-word-editor/lib/harness-editor-datastore.ts +0 -161
  356. package/services/react-word-editor/lib/private-mode.test.mjs +0 -42
  357. package/services/react-word-editor/lib/private-mode.ts +0 -61
  358. package/services/react-word-editor/lib/regression-report.test.mjs +0 -352
  359. package/services/react-word-editor/lib/regression-report.ts +0 -896
  360. package/services/react-word-editor/lib/run-artifacts.ts +0 -934
  361. package/services/react-word-editor/lib/run-history.ts +0 -755
  362. package/services/react-word-editor/lib/scenario-artifacts.test.mjs +0 -41
  363. package/services/react-word-editor/lib/scenario-artifacts.ts +0 -44
  364. package/services/react-word-editor/lib/storage.ts +0 -953
  365. package/services/react-word-editor/lib/validator-client.test.mjs +0 -54
  366. package/services/react-word-editor/lib/validator-client.ts +0 -95
  367. package/services/react-word-editor/lib/workspace-navigation.ts +0 -79
  368. package/services/react-word-editor/middleware.ts +0 -35
  369. package/services/react-word-editor/next-env.d.ts +0 -6
  370. package/services/react-word-editor/next.config.mjs +0 -15
  371. package/services/react-word-editor/package.json +0 -38
  372. package/services/react-word-editor/postcss.config.mjs +0 -8
  373. package/services/react-word-editor/railway.json +0 -21
  374. package/services/react-word-editor/scripts/wave-10-certification.mjs +0 -101
  375. package/services/react-word-editor/scripts/wave-9-live-usability-pilot.mjs +0 -911
  376. package/services/react-word-editor/tsconfig.json +0 -39
  377. package/services/react-word-editor/tsconfig.tsbuildinfo +0 -1
  378. package/skills/README.md +0 -48
  379. package/skills/domain-docx-compatibility/SKILL.md +0 -44
  380. package/skills/domain-docx-compatibility/skill.json +0 -19
  381. package/skills/domain-editor-architecture/SKILL.md +0 -49
  382. package/skills/domain-editor-architecture/skill.json +0 -19
  383. package/skills/domain-legal-review/SKILL.md +0 -39
  384. package/skills/domain-legal-review/skill.json +0 -19
  385. package/skills/provider-aws/SKILL.md +0 -117
  386. package/skills/provider-aws/adapters/claude.md +0 -1
  387. package/skills/provider-aws/adapters/codex.md +0 -1
  388. package/skills/provider-aws/references/service-verification.md +0 -39
  389. package/skills/provider-aws/skill.json +0 -54
  390. package/skills/provider-custom-deploy/SKILL.md +0 -64
  391. package/skills/provider-custom-deploy/skill.json +0 -50
  392. package/skills/provider-docker-compose/SKILL.md +0 -96
  393. package/skills/provider-docker-compose/adapters/local.md +0 -1
  394. package/skills/provider-docker-compose/skill.json +0 -53
  395. package/skills/provider-github-release/SKILL.md +0 -121
  396. package/skills/provider-github-release/adapters/claude.md +0 -1
  397. package/skills/provider-github-release/adapters/codex.md +0 -1
  398. package/skills/provider-github-release/skill.json +0 -55
  399. package/skills/provider-kubernetes/SKILL.md +0 -143
  400. package/skills/provider-kubernetes/adapters/claude.md +0 -1
  401. package/skills/provider-kubernetes/adapters/codex.md +0 -1
  402. package/skills/provider-kubernetes/references/kubectl-patterns.md +0 -58
  403. package/skills/provider-kubernetes/skill.json +0 -52
  404. package/skills/provider-railway/SKILL.md +0 -123
  405. package/skills/provider-railway/adapters/claude.md +0 -1
  406. package/skills/provider-railway/adapters/codex.md +0 -1
  407. package/skills/provider-railway/adapters/local.md +0 -1
  408. package/skills/provider-railway/adapters/opencode.md +0 -1
  409. package/skills/provider-railway/references/verification-commands.md +0 -39
  410. package/skills/provider-railway/skill.json +0 -71
  411. package/skills/provider-ssh-manual/SKILL.md +0 -97
  412. package/skills/provider-ssh-manual/skill.json +0 -54
  413. package/skills/repo-coding-rules/SKILL.md +0 -55
  414. package/skills/repo-coding-rules/skill.json +0 -34
  415. package/skills/role-cont-eval/SKILL.md +0 -91
  416. package/skills/role-cont-eval/adapters/codex.md +0 -1
  417. package/skills/role-cont-eval/skill.json +0 -36
  418. package/skills/role-cont-qa/SKILL.md +0 -100
  419. package/skills/role-cont-qa/adapters/claude.md +0 -1
  420. package/skills/role-cont-qa/skill.json +0 -36
  421. package/skills/role-deploy/SKILL.md +0 -97
  422. package/skills/role-deploy/skill.json +0 -36
  423. package/skills/role-design/SKILL.md +0 -50
  424. package/skills/role-design/skill.json +0 -36
  425. package/skills/role-documentation/SKILL.md +0 -76
  426. package/skills/role-documentation/skill.json +0 -36
  427. package/skills/role-implementation/SKILL.md +0 -45
  428. package/skills/role-implementation/skill.json +0 -36
  429. package/skills/role-infra/SKILL.md +0 -81
  430. package/skills/role-infra/skill.json +0 -36
  431. package/skills/role-integration/SKILL.md +0 -91
  432. package/skills/role-integration/skill.json +0 -36
  433. package/skills/role-planner/SKILL.md +0 -39
  434. package/skills/role-planner/skill.json +0 -21
  435. package/skills/role-research/SKILL.md +0 -65
  436. package/skills/role-research/skill.json +0 -36
  437. package/skills/role-security/SKILL.md +0 -60
  438. package/skills/role-security/skill.json +0 -36
  439. package/skills/runtime-claude/SKILL.md +0 -66
  440. package/skills/runtime-claude/skill.json +0 -36
  441. package/skills/runtime-codex/SKILL.md +0 -58
  442. package/skills/runtime-codex/skill.json +0 -36
  443. package/skills/runtime-local/SKILL.md +0 -46
  444. package/skills/runtime-local/skill.json +0 -36
  445. package/skills/runtime-opencode/SKILL.md +0 -58
  446. package/skills/runtime-opencode/skill.json +0 -36
  447. package/skills/signal-hygiene/SKILL.md +0 -51
  448. package/skills/signal-hygiene/skill.json +0 -20
  449. package/skills/tui-design/SKILL.md +0 -77
  450. package/skills/tui-design/references/tui-design.md +0 -259
  451. package/skills/tui-design/skill.json +0 -36
  452. package/skills/wave-core/SKILL.md +0 -141
  453. package/skills/wave-core/references/marker-syntax.md +0 -70
  454. package/skills/wave-core/skill.json +0 -35
  455. package/test/README.md +0 -16
  456. package/test/core/formatting-commands.test.ts +0 -285
  457. package/test/core/image-commands.test.ts +0 -298
  458. package/test/core/mapping.test.ts +0 -186
  459. package/test/core/text-commands.test.ts +0 -176
  460. package/test/fixtures/docx/F01-basic-contract.docx +0 -0
  461. package/test/fixtures/docx/F01-basic-contract.md +0 -33
  462. package/test/fixtures/docx/F02-headings-styles.docx +0 -0
  463. package/test/fixtures/docx/F02-headings-styles.md +0 -33
  464. package/test/fixtures/docx/F03-legal-outline-numbering.docx +0 -0
  465. package/test/fixtures/docx/F03-legal-outline-numbering.md +0 -34
  466. package/test/fixtures/docx/F04-restart-numbering-schedules.docx +0 -0
  467. package/test/fixtures/docx/F04-restart-numbering-schedules.md +0 -33
  468. package/test/fixtures/docx/F05-table-heavy-agreement.docx +0 -0
  469. package/test/fixtures/docx/F05-table-heavy-agreement.md +0 -34
  470. package/test/fixtures/docx/F06-merged-cells-signature-table.docx +0 -0
  471. package/test/fixtures/docx/F06-merged-cells-signature-table.md +0 -34
  472. package/test/fixtures/docx/F07-inline-images-exhibit.docx +0 -0
  473. package/test/fixtures/docx/F07-inline-images-exhibit.md +0 -34
  474. package/test/fixtures/docx/F08-hyperlinks.docx +0 -0
  475. package/test/fixtures/docx/F08-hyperlinks.md +0 -33
  476. package/test/fixtures/docx/F09-comments-single-paragraph.docx +0 -0
  477. package/test/fixtures/docx/F09-comments-single-paragraph.md +0 -33
  478. package/test/fixtures/docx/F10-threaded-comments-resolve.docx +0 -0
  479. package/test/fixtures/docx/F10-threaded-comments-resolve.md +0 -33
  480. package/test/fixtures/docx/F11-redlines-basic.docx +0 -0
  481. package/test/fixtures/docx/F11-redlines-basic.md +0 -33
  482. package/test/fixtures/docx/F12-redlines-paragraph-joins-splits.docx +0 -0
  483. package/test/fixtures/docx/F12-redlines-paragraph-joins-splits.md +0 -33
  484. package/test/fixtures/docx/F13-comments-on-deleted-text.docx +0 -0
  485. package/test/fixtures/docx/F13-comments-on-deleted-text.md +0 -33
  486. package/test/fixtures/docx/F14-revisions-in-tables-and-lists.docx +0 -0
  487. package/test/fixtures/docx/F14-revisions-in-tables-and-lists.md +0 -33
  488. package/test/fixtures/docx/F15-sections-headers-footers.docx +0 -0
  489. package/test/fixtures/docx/F15-sections-headers-footers.md +0 -33
  490. package/test/fixtures/docx/F16-footnotes-endnotes.docx +0 -0
  491. package/test/fixtures/docx/F16-footnotes-endnotes.md +0 -33
  492. package/test/fixtures/docx/F17-fields-and-toc.docx +0 -0
  493. package/test/fixtures/docx/F17-fields-and-toc.md +0 -33
  494. package/test/fixtures/docx/F18-content-controls-template.docx +0 -0
  495. package/test/fixtures/docx/F18-content-controls-template.md +0 -33
  496. package/test/fixtures/docx/F19-custom-xml-doc-assembly.docx +0 -0
  497. package/test/fixtures/docx/F19-custom-xml-doc-assembly.md +0 -35
  498. package/test/fixtures/docx/F20-unknown-ooxml-and-alternatecontent.docx +0 -0
  499. package/test/fixtures/docx/F20-unknown-ooxml-and-alternatecontent.md +0 -33
  500. package/test/fixtures/docx/F21-malformed-broken-docx.docx +0 -0
  501. package/test/fixtures/docx/F21-malformed-broken-docx.md +0 -33
  502. package/test/fixtures/docx/README.md +0 -74
  503. package/test/fixtures/docx/certification-manifest.json +0 -104
  504. package/test/fixtures/docx/fixtures.manifest.json +0 -196
  505. package/test/fixtures/encrypted-docx/README.md +0 -27
  506. package/test/fixtures/encrypted-docx/certification-manifest.json +0 -9
  507. package/test/fixtures/encrypted-docx/fixtures.manifest.json +0 -47
  508. package/test/fixtures/scenarios/docx/README.md +0 -25
  509. package/test/fixtures/scenarios/docx/S01-sow-template.docx +0 -0
  510. package/test/fixtures/scenarios/docx/S01-sow-template.md +0 -30
  511. package/test/fixtures/scenarios/docx/S02-bw-partner-user-licence-agreement-redlines.docx +0 -0
  512. package/test/fixtures/scenarios/docx/S02-bw-partner-user-licence-agreement-redlines.md +0 -32
  513. package/test/fixtures/scenarios/docx/scenario-manifest.json +0 -53
  514. package/test/formats/xlsx/io/xlsx-import.test.ts +0 -766
  515. package/test/formats/xlsx/model/workbook.test.ts +0 -669
  516. package/test/helpers/dom-setup.ts +0 -124
  517. package/test/io/comment-roundtrip.test.ts +0 -272
  518. package/test/io/complex-content-roundtrip.test.ts +0 -632
  519. package/test/io/docx-compatibility-regression.test.ts +0 -199
  520. package/test/io/docx-session.test.ts +0 -1495
  521. package/test/io/footnotes-roundtrip.test.ts +0 -318
  522. package/test/io/headers-footers-roundtrip.test.ts +0 -547
  523. package/test/io/numbering-roundtrip.test.ts +0 -234
  524. package/test/io/package-reader.test.ts +0 -199
  525. package/test/io/paragraph-properties-roundtrip.test.ts +0 -129
  526. package/test/io/preserved-package-roundtrip.test.ts +0 -365
  527. package/test/io/property-completeness.test.ts +0 -292
  528. package/test/io/revision-roundtrip.test.ts +0 -347
  529. package/test/io/structural-blocks.test.ts +0 -202
  530. package/test/io/table-media-roundtrip.test.ts +0 -448
  531. package/test/io/table-properties-roundtrip.test.ts +0 -569
  532. package/test/io/table-roundtrip.test.ts +0 -302
  533. package/test/io/text-roundtrip.test.ts +0 -344
  534. package/test/model/canonical-document.test.ts +0 -285
  535. package/test/preservation/opaque-fragment-store.test.ts +0 -121
  536. package/test/preservation/package-preservation.test.ts +0 -395
  537. package/test/preservation/store.test.ts +0 -84
  538. package/test/review/comment-remapping.test.ts +0 -220
  539. package/test/review/comment-store.test.ts +0 -180
  540. package/test/review/move-revisions.test.ts +0 -143
  541. package/test/review/property-change-revisions.test.ts +0 -225
  542. package/test/review/revision-actions.test.ts +0 -330
  543. package/test/review/revision-store.test.ts +0 -193
  544. package/test/runtime/session-capabilities.test.ts +0 -260
  545. package/test/runtime/table-commands.test.ts +0 -356
  546. package/test/runtime/table-schema.test.ts +0 -221
  547. package/test/runtime/tracked-changes-toggle.test.ts +0 -107
  548. package/test/ui/comment-review-surface.test.tsx +0 -114
  549. package/test/ui/reduced-motion-toggle.test.tsx +0 -137
  550. package/test/ui/word-review-editor.imported-scenarios.test.tsx +0 -169
  551. package/test/ui/word-review-editor.interaction.test.tsx +0 -1198
  552. package/test/ui/word-review-editor.test.js +0 -188
  553. package/test/ui/word-review-editor.test.tsx +0 -280
  554. package/test/ui-tailwind/search-plugin.test.ts +0 -286
  555. package/test/validation/compatibility-engine.test.ts +0 -336
  556. package/test/validation/compatibility-report.test.ts +0 -189
  557. package/test/validation/low-priority-word-surfaces.test.ts +0 -282
  558. package/test/validation/malformed-doc.test.ts +0 -113
  559. package/test-results/.last-run.json +0 -4
  560. package/wave.config.json +0 -406
@@ -1,670 +0,0 @@
1
- {
2
- "version": 2,
3
- "families": {
4
- "service-output": {
5
- "title": "Service Output Quality",
6
- "summary": "Benchmarks for reviewing runtime output quality, behavior, and correctness.",
7
- "benchmarks": {
8
- "golden-response-smoke": {
9
- "title": "Golden Response Smoke",
10
- "summary": "Compare representative outputs to known-good expectations."
11
- },
12
- "manual-session-review": {
13
- "title": "Manual Session Review",
14
- "summary": "Run the service manually and document output gaps from representative user flows."
15
- }
16
- }
17
- },
18
- "latency": {
19
- "title": "Latency",
20
- "summary": "Benchmarks for startup and request latency.",
21
- "benchmarks": {
22
- "http-latency-smoke": {
23
- "title": "HTTP Latency Smoke",
24
- "summary": "Quick latency pass over the service's core request path."
25
- },
26
- "cold-start-smoke": {
27
- "title": "Cold Start Smoke",
28
- "summary": "Track cold start behavior for the primary runtime surface."
29
- }
30
- }
31
- },
32
- "quality-regression": {
33
- "title": "Quality Regression",
34
- "summary": "Benchmarks for guarding against regressions during output tuning.",
35
- "benchmarks": {
36
- "baseline-diff-review": {
37
- "title": "Baseline Diff Review",
38
- "summary": "Compare current outputs to a previous accepted baseline."
39
- },
40
- "operator-checklist-review": {
41
- "title": "Operator Checklist Review",
42
- "summary": "Run a documented checklist over the tuned output surface."
43
- }
44
- }
45
- },
46
- "hidden-profile-pooling": {
47
- "title": "Hidden Profile Pooling",
48
- "summary": "Benchmarks for whether distributed private evidence is surfaced, pooled, and integrated before the team converges.",
49
- "category": "coordination",
50
- "coordinationModel": "blackboard-distributed-information",
51
- "primaryMetric": {
52
- "id": "distributed-info-accuracy",
53
- "title": "Distributed Information Accuracy",
54
- "unit": "percent",
55
- "direction": "higher-is-better",
56
- "summary": "Accuracy when key evidence begins distributed across agents."
57
- },
58
- "secondaryMetrics": [
59
- {
60
- "id": "latent-asymmetry-surfacing-rate",
61
- "title": "Latent Asymmetry Surfacing Rate",
62
- "unit": "percent",
63
- "direction": "higher-is-better"
64
- },
65
- {
66
- "id": "premature-convergence-rate",
67
- "title": "Premature Convergence Rate",
68
- "unit": "percent",
69
- "direction": "lower-is-better"
70
- }
71
- ],
72
- "paperReferences": [
73
- {
74
- "id": "hiddenbench-2025",
75
- "title": "Systematic Failures in Collective Reasoning under Distributed Information in Multi-Agent LLMs",
76
- "year": 2025,
77
- "url": "https://arxiv.org/abs/2505.11556",
78
- "summary": "HiddenBench benchmark for collective reasoning under distributed information."
79
- }
80
- ],
81
- "sotaBaseline": {
82
- "source": "paper-static",
83
- "paper": "HiddenBench",
84
- "year": 2025,
85
- "metric": "distributed-info-accuracy",
86
- "value": 30.1,
87
- "notes": "Reported multi-agent accuracy under distributed information in the paper abstract.",
88
- "url": "https://arxiv.org/abs/2505.11556"
89
- },
90
- "benchmarks": {
91
- "latent-asymmetry-surfacing": {
92
- "title": "Latent Asymmetry Surfacing",
93
- "summary": "Checks whether agents explicitly seek or expose facts they suspect other agents may hold.",
94
- "goal": "Measure whether the framework notices unshared evidence before converging.",
95
- "failureModes": [
96
- "latent-information-asymmetry",
97
- "premature-consensus",
98
- "shared-evidence-overweighting"
99
- ],
100
- "signals": [
101
- "requests-for-missing-evidence",
102
- "inbox-to-summary-fact-escalation",
103
- "late-discovered-decision-changing-fact"
104
- ],
105
- "scoring": {
106
- "primaryMetric": "latent-asymmetry-surfacing-rate",
107
- "successCriterion": "Critical unshared evidence is surfaced before final recommendation.",
108
- "rubric": "Score higher when agents explicitly search for missing facts instead of relying on already-shared evidence."
109
- },
110
- "paperReferences": [
111
- {
112
- "id": "hiddenbench-2025",
113
- "title": "Systematic Failures in Collective Reasoning under Distributed Information in Multi-Agent LLMs",
114
- "year": 2025,
115
- "url": "https://arxiv.org/abs/2505.11556"
116
- }
117
- ],
118
- "tuningNotes": "Use when adjusting inbox compilation, clarification prompting, or board-to-summary compression."
119
- },
120
- "private-evidence-integration": {
121
- "title": "Private Evidence Integration",
122
- "summary": "Checks whether separately observed facts are integrated into the final answer rather than merely repeated in conversation.",
123
- "localCases": ["wave-hidden-profile-private-evidence"],
124
- "goal": "Measure end-to-end integration of distributed evidence into a coherent outcome.",
125
- "failureModes": [
126
- "communication-without-integration",
127
- "evidence-drop",
128
- "incorrect-global-reconstruction"
129
- ],
130
- "signals": [
131
- "final-answer-uses-private-facts",
132
- "integration-summary-cites-distributed-evidence",
133
- "correct-global-state-reconstruction"
134
- ],
135
- "scoring": {
136
- "primaryMetric": "distributed-info-accuracy",
137
- "successCriterion": "The final answer requires and reflects the distributed facts.",
138
- "rubric": "Score higher only when the final recommendation depends on the pooled evidence."
139
- },
140
- "sotaBaseline": {
141
- "source": "paper-static",
142
- "paper": "HiddenBench",
143
- "year": 2025,
144
- "metric": "distributed-info-accuracy",
145
- "value": 30.1,
146
- "notes": "Paper baseline for multi-agent distributed-information accuracy.",
147
- "url": "https://arxiv.org/abs/2505.11556"
148
- }
149
- },
150
- "premature-consensus-guard": {
151
- "title": "Premature Consensus Guard",
152
- "summary": "Checks whether the system delays closure when important evidence is still siloed.",
153
- "localCases": ["wave-premature-closure-guard"],
154
- "goal": "Measure resistance to converging early on shared but incomplete evidence.",
155
- "failureModes": [
156
- "premature-consensus",
157
- "closure-before-evidence-pooling"
158
- ],
159
- "signals": [
160
- "clarification-raised-before-close",
161
- "integration-barrier-trips",
162
- "documentation-or-cont-qa-blocks"
163
- ],
164
- "scoring": {
165
- "primaryMetric": "premature-convergence-rate",
166
- "successCriterion": "Final closure is blocked when a decision-relevant fact remains siloed."
167
- }
168
- }
169
- }
170
- },
171
- "silo-escape": {
172
- "title": "Silo Escape",
173
- "summary": "Benchmarks for whether agents can move from locally sufficient views to globally correct coordinated state.",
174
- "category": "coordination",
175
- "coordinationModel": "shared-workspace-integration",
176
- "primaryMetric": {
177
- "id": "global-state-reconstruction-rate",
178
- "title": "Global State Reconstruction Rate",
179
- "unit": "percent",
180
- "direction": "higher-is-better",
181
- "summary": "Rate at which the team reconstructs the correct distributed state."
182
- },
183
- "secondaryMetrics": [
184
- {
185
- "id": "communication-reasoning-gap",
186
- "title": "Communication-Reasoning Gap",
187
- "unit": "rubric",
188
- "direction": "lower-is-better"
189
- },
190
- {
191
- "id": "summary-fact-retention-rate",
192
- "title": "Summary Fact Retention Rate",
193
- "unit": "percent",
194
- "direction": "higher-is-better"
195
- }
196
- ],
197
- "paperReferences": [
198
- {
199
- "id": "silo-bench-2026",
200
- "title": "Silo-Bench: A Scalable Environment for Evaluating Distributed Coordination in Multi-Agent LLM Systems",
201
- "year": 2026,
202
- "url": "https://arxiv.org/abs/2603.01045",
203
- "summary": "Shows agents often exchange information but fail to integrate it."
204
- }
205
- ],
206
- "benchmarks": {
207
- "cross-agent-state-reconstruction": {
208
- "title": "Cross-Agent State Reconstruction",
209
- "summary": "Checks whether the final shared state reflects facts that no single agent started with alone.",
210
- "localCases": ["wave-silo-cross-agent-state"],
211
- "goal": "Measure whether the blackboard can reconstruct a correct global state from distributed local views.",
212
- "failureModes": [
213
- "information-silo",
214
- "global-state-loss",
215
- "integration-failure"
216
- ],
217
- "signals": [
218
- "integration-summary-mentions-cross-agent-facts",
219
- "ledger-reflects-distributed-blockers",
220
- "final-answer-requires-pooled-state"
221
- ],
222
- "scoring": {
223
- "primaryMetric": "global-state-reconstruction-rate",
224
- "successCriterion": "The correct global state is reconstructed and used in the decision."
225
- },
226
- "tuningNotes": "Use when adjusting shared summary size, inbox targeting, or integration evidence aggregation."
227
- },
228
- "shared-summary-fact-retention": {
229
- "title": "Shared Summary Fact Retention",
230
- "summary": "Checks whether compiled summaries preserve critical facts from the raw coordination log.",
231
- "goal": "Measure information loss introduced by summary compression.",
232
- "failureModes": [
233
- "summary-compression-loss",
234
- "critical-fact-drop"
235
- ],
236
- "signals": [
237
- "raw-log-fact-present-in-summary",
238
- "summary-fact-present-in-inbox",
239
- "decision-uses-retained-facts"
240
- ],
241
- "scoring": {
242
- "primaryMetric": "summary-fact-retention-rate",
243
- "successCriterion": "Decision-changing facts survive from raw log into the shared summary and targeted inboxes."
244
- }
245
- },
246
- "communication-reasoning-gap-review": {
247
- "title": "Communication-Reasoning Gap Review",
248
- "summary": "Checks whether active communication actually improves the final integrated answer.",
249
- "goal": "Measure the gap between information exchange and correct synthesis.",
250
- "failureModes": [
251
- "communication-without-synthesis",
252
- "false-confidence-after-sharing"
253
- ],
254
- "signals": [
255
- "messages-exchanged",
256
- "facts-shared",
257
- "incorrect-integrated-answer"
258
- ],
259
- "scoring": {
260
- "primaryMetric": "communication-reasoning-gap",
261
- "successCriterion": "Additional communication materially improves the final integrated answer."
262
- },
263
- "sotaBaseline": {
264
- "source": "paper-static",
265
- "paper": "Silo-Bench",
266
- "year": 2026,
267
- "metric": "communication-reasoning-gap",
268
- "value": "present",
269
- "notes": "Silo-Bench reports a persistent communication-reasoning gap rather than a single abstracted scalar baseline.",
270
- "url": "https://arxiv.org/abs/2603.01045"
271
- }
272
- }
273
- }
274
- },
275
- "simultaneous-coordination": {
276
- "title": "Simultaneous Coordination",
277
- "summary": "Benchmarks for contention, deadlock, and convergent-reasoning failures when decisions must be made concurrently.",
278
- "category": "coordination",
279
- "coordinationModel": "simultaneous-resource-contention",
280
- "primaryMetric": {
281
- "id": "deadlock-rate",
282
- "title": "Deadlock Rate",
283
- "unit": "percent",
284
- "direction": "lower-is-better",
285
- "summary": "Frequency of deadlock or coordination collapse under simultaneous decisions."
286
- },
287
- "secondaryMetrics": [
288
- {
289
- "id": "contention-resolution-rate",
290
- "title": "Contention Resolution Rate",
291
- "unit": "percent",
292
- "direction": "higher-is-better"
293
- },
294
- {
295
- "id": "symmetry-breaking-rate",
296
- "title": "Symmetry Breaking Rate",
297
- "unit": "percent",
298
- "direction": "higher-is-better"
299
- }
300
- ],
301
- "paperReferences": [
302
- {
303
- "id": "dpbench-2026",
304
- "title": "DPBench: Large Language Models Struggle with Simultaneous Coordination",
305
- "year": 2026,
306
- "url": "https://arxiv.org/abs/2602.13255",
307
- "summary": "Shows severe failures under simultaneous coordination and convergent reasoning."
308
- }
309
- ],
310
- "sotaBaseline": {
311
- "source": "paper-static",
312
- "paper": "DPBench",
313
- "year": 2026,
314
- "metric": "deadlock-rate",
315
- "value": 95,
316
- "notes": "Paper abstract reports deadlock rates exceeding 95 percent under some simultaneous settings.",
317
- "url": "https://arxiv.org/abs/2602.13255"
318
- },
319
- "benchmarks": {
320
- "contention-deadlock-avoidance": {
321
- "title": "Contention Deadlock Avoidance",
322
- "summary": "Checks whether the framework avoids deadlock under simultaneous resource contention.",
323
- "goal": "Measure whether external coordination surfaces reduce deadlock-like failure.",
324
- "failureModes": [
325
- "deadlock",
326
- "convergent-reasoning",
327
- "resource-contention-collapse"
328
- ],
329
- "signals": [
330
- "deadlock-observed",
331
- "dependency-barrier-resolution",
332
- "assignment-reroute-success"
333
- ],
334
- "scoring": {
335
- "primaryMetric": "deadlock-rate",
336
- "successCriterion": "The team avoids deadlock and reaches a valid allocation or resolution."
337
- },
338
- "sotaBaseline": {
339
- "source": "paper-static",
340
- "paper": "DPBench",
341
- "year": 2026,
342
- "metric": "deadlock-rate",
343
- "value": 95,
344
- "notes": "Reference point from the abstract's reported worst-case deadlock rate.",
345
- "url": "https://arxiv.org/abs/2602.13255"
346
- }
347
- },
348
- "symmetric-action-divergence": {
349
- "title": "Symmetric Action Divergence",
350
- "summary": "Checks whether agents can avoid choosing the same locally sensible but globally conflicting action.",
351
- "goal": "Measure symmetry breaking under pressure.",
352
- "failureModes": [
353
- "same-plan-collapse",
354
- "convergent-reasoning"
355
- ],
356
- "signals": [
357
- "distinct-action-selection",
358
- "lock-or-ticket-usage",
359
- "retry-breaks-symmetry"
360
- ],
361
- "scoring": {
362
- "primaryMetric": "symmetry-breaking-rate",
363
- "successCriterion": "At least one agent changes strategy in time to avoid global conflict."
364
- }
365
- },
366
- "lockstep-resolution": {
367
- "title": "Lockstep Resolution",
368
- "summary": "Checks whether the framework resolves many-way concurrent dependencies without circular waiting.",
369
- "localCases": ["wave-simultaneous-lockstep"],
370
- "goal": "Measure coordination quality when several blocking tickets must resolve together.",
371
- "failureModes": [
372
- "circular-wait",
373
- "helper-assignment-stall",
374
- "dependency-stall"
375
- ],
376
- "signals": [
377
- "required-dependencies-close",
378
- "clarification-chain-completes",
379
- "no-indefinite-retry-loop"
380
- ],
381
- "scoring": {
382
- "primaryMetric": "contention-resolution-rate",
383
- "successCriterion": "Concurrent blockers close without repeated deadlock-like relaunch cycles."
384
- }
385
- }
386
- }
387
- },
388
- "expertise-leverage": {
389
- "title": "Expertise Leverage",
390
- "summary": "Benchmarks for whether the framework routes work toward experts and preserves expert signals instead of averaging them away.",
391
- "category": "coordination",
392
- "coordinationModel": "role-and-capability-routing",
393
- "primaryMetric": {
394
- "id": "expert-preservation-rate",
395
- "title": "Expert Preservation Rate",
396
- "unit": "percent",
397
- "direction": "higher-is-better",
398
- "summary": "Rate at which expert-advantaged decisions survive to the final recommendation."
399
- },
400
- "secondaryMetrics": [
401
- {
402
- "id": "expert-performance-gap",
403
- "title": "Expert Performance Gap",
404
- "unit": "percent",
405
- "direction": "lower-is-better"
406
- },
407
- {
408
- "id": "capability-routing-precision",
409
- "title": "Capability Routing Precision",
410
- "unit": "percent",
411
- "direction": "higher-is-better"
412
- }
413
- ],
414
- "paperReferences": [
415
- {
416
- "id": "experts-back-2026",
417
- "title": "Multi-Agent Teams Hold Experts Back",
418
- "year": 2026,
419
- "url": "https://arxiv.org/abs/2602.01011",
420
- "summary": "Shows unconstrained teams often underuse their best expert."
421
- }
422
- ],
423
- "sotaBaseline": {
424
- "source": "paper-static",
425
- "paper": "Multi-Agent Teams Hold Experts Back",
426
- "year": 2026,
427
- "metric": "expert-performance-gap",
428
- "value": 37.6,
429
- "notes": "Paper abstract reports performance losses of up to 37.6 percent relative to the best expert agent.",
430
- "url": "https://arxiv.org/abs/2602.01011"
431
- },
432
- "benchmarks": {
433
- "expert-routing-preservation": {
434
- "title": "Expert Routing Preservation",
435
- "summary": "Checks whether capability-targeted work is routed to the best available owner and stays there through closure.",
436
- "localCases": ["wave-expert-routing-preservation"],
437
- "goal": "Measure whether the harness protects expert ownership instead of diluting it.",
438
- "failureModes": [
439
- "expert-underuse",
440
- "misrouting",
441
- "owner-dilution"
442
- ],
443
- "signals": [
444
- "preferred-agent-selected",
445
- "assigned-owner-resolves-task",
446
- "few-non-expert-overrides"
447
- ],
448
- "scoring": {
449
- "primaryMetric": "capability-routing-precision",
450
- "successCriterion": "Capability-targeted requests land on the intended owner or a justified fallback."
451
- }
452
- },
453
- "expert-signal-weighting": {
454
- "title": "Expert Signal Weighting",
455
- "summary": "Checks whether the final recommendation preserves a stronger expert signal when expert and non-expert views conflict.",
456
- "goal": "Measure resistance to integrative compromise.",
457
- "failureModes": [
458
- "integrative-compromise",
459
- "expert-signal-dilution"
460
- ],
461
- "signals": [
462
- "expert-evidence-cited-integration",
463
- "cont-qa-honors-expert-proof",
464
- "non-expert-opinion-does-not-override-proof"
465
- ],
466
- "scoring": {
467
- "primaryMetric": "expert-preservation-rate",
468
- "successCriterion": "The final result tracks the best-supported expert view rather than the average view."
469
- }
470
- },
471
- "anti-compromise-decision-review": {
472
- "title": "Anti-Compromise Decision Review",
473
- "summary": "Checks whether the framework avoids averaging incompatible recommendations into a low-quality compromise.",
474
- "goal": "Measure whether closure authority and proof gates prevent compromise collapse.",
475
- "failureModes": [
476
- "consensus-over-correctness",
477
- "expert-performance-gap"
478
- ],
479
- "signals": [
480
- "integration-flags-conflict",
481
- "clarification-raised",
482
- "final-recommendation-follows-evidence"
483
- ],
484
- "scoring": {
485
- "primaryMetric": "expert-performance-gap",
486
- "successCriterion": "The team does not regress materially below its strongest expert signal."
487
- },
488
- "sotaBaseline": {
489
- "source": "paper-static",
490
- "paper": "Multi-Agent Teams Hold Experts Back",
491
- "year": 2026,
492
- "metric": "expert-performance-gap",
493
- "value": 37.6,
494
- "notes": "Reference point from the abstract's reported expert-underuse loss.",
495
- "url": "https://arxiv.org/abs/2602.01011"
496
- }
497
- }
498
- }
499
- },
500
- "blackboard-fidelity": {
501
- "title": "Blackboard Fidelity",
502
- "summary": "Benchmarks for whether raw coordination, summaries, inboxes, ledgers, and integration state stay semantically aligned.",
503
- "category": "coordination",
504
- "coordinationModel": "blackboard-projection-integrity",
505
- "primaryMetric": {
506
- "id": "projection-consistency-rate",
507
- "title": "Projection Consistency Rate",
508
- "unit": "percent",
509
- "direction": "higher-is-better",
510
- "summary": "Rate at which derived blackboard artifacts preserve the underlying coordination facts."
511
- },
512
- "secondaryMetrics": [
513
- {
514
- "id": "targeted-inbox-recall",
515
- "title": "Targeted Inbox Recall",
516
- "unit": "percent",
517
- "direction": "higher-is-better"
518
- },
519
- {
520
- "id": "integration-coherence-rate",
521
- "title": "Integration Coherence Rate",
522
- "unit": "percent",
523
- "direction": "higher-is-better"
524
- }
525
- ],
526
- "benchmarks": {
527
- "log-to-summary-consistency": {
528
- "title": "Log To Summary Consistency",
529
- "summary": "Checks whether the shared summary preserves critical blockers, clarifications, dependencies, and conflicts from the raw log.",
530
- "goal": "Measure whether summary generation remains trustworthy as the wave grows.",
531
- "failureModes": [
532
- "summary-drift",
533
- "projection-loss"
534
- ],
535
- "signals": [
536
- "blocker-preserved",
537
- "clarification-preserved",
538
- "dependency-preserved",
539
- "conflict-preserved"
540
- ],
541
- "scoring": {
542
- "primaryMetric": "projection-consistency-rate",
543
- "successCriterion": "Critical coordination facts remain visible after projection."
544
- }
545
- },
546
- "inbox-targeting-fidelity": {
547
- "title": "Inbox Targeting Fidelity",
548
- "summary": "Checks whether relevant facts reach the agents that own the impacted paths, components, or requests.",
549
- "localCases": ["wave-blackboard-inbox-targeting"],
550
- "goal": "Measure whether inbox targeting reduces silos instead of creating them.",
551
- "failureModes": [
552
- "mis-targeted-context",
553
- "owner-context-loss"
554
- ],
555
- "signals": [
556
- "artifact-relevant-fact-routed",
557
- "owned-component-fact-routed",
558
- "targeted-request-routed"
559
- ],
560
- "scoring": {
561
- "primaryMetric": "targeted-inbox-recall",
562
- "successCriterion": "Agents receive the facts relevant to their owned paths, components, or follow-up work."
563
- }
564
- },
565
- "integration-summary-coherence": {
566
- "title": "Integration Summary Coherence",
567
- "summary": "Checks whether integration output is faithful to blockers, claims, proof gaps, docs gaps, and deploy risks seen elsewhere.",
568
- "goal": "Measure whether the integration steward output is a reliable synthesis layer.",
569
- "failureModes": [
570
- "integration-hallucination",
571
- "integration-omission"
572
- ],
573
- "signals": [
574
- "conflicts-match-log",
575
- "proof-gaps-match-agent-state",
576
- "doc-gaps-match-doc-queue"
577
- ],
578
- "scoring": {
579
- "primaryMetric": "integration-coherence-rate",
580
- "successCriterion": "Integration summaries match the evidence visible in coordination, validation, and runtime signals."
581
- }
582
- }
583
- }
584
- },
585
- "contradiction-recovery": {
586
- "title": "Contradiction Recovery",
587
- "summary": "Benchmarks for whether the framework notices conflicting claims and converts them into explicit repair work instead of silent inconsistency.",
588
- "category": "coordination",
589
- "coordinationModel": "conflict-detection-and-repair",
590
- "primaryMetric": {
591
- "id": "contradiction-detection-rate",
592
- "title": "Contradiction Detection Rate",
593
- "unit": "percent",
594
- "direction": "higher-is-better",
595
- "summary": "Rate at which material conflicting claims are surfaced before closeout."
596
- },
597
- "secondaryMetrics": [
598
- {
599
- "id": "repair-closure-rate",
600
- "title": "Repair Closure Rate",
601
- "unit": "percent",
602
- "direction": "higher-is-better"
603
- },
604
- {
605
- "id": "false-consensus-rate",
606
- "title": "False Consensus Rate",
607
- "unit": "percent",
608
- "direction": "lower-is-better"
609
- }
610
- ],
611
- "benchmarks": {
612
- "claim-conflict-detection": {
613
- "title": "Claim Conflict Detection",
614
- "summary": "Checks whether incompatible claims are surfaced in coordination or integration instead of passing through silently.",
615
- "localCases": ["wave-contradiction-conflict"],
616
- "goal": "Measure whether the framework sees contradictory evidence before final closure.",
617
- "failureModes": [
618
- "false-consensus",
619
- "silent-contradiction"
620
- ],
621
- "signals": [
622
- "integration-conflict-raised",
623
- "cont-qa-blocks",
624
- "follow-up-request-created"
625
- ],
626
- "scoring": {
627
- "primaryMetric": "contradiction-detection-rate",
628
- "successCriterion": "Conflicting claims are surfaced as explicit blockers or conflicts before closeout."
629
- }
630
- },
631
- "evidence-based-repair": {
632
- "title": "Evidence Based Repair",
633
- "summary": "Checks whether contradictions produce concrete owner-bound follow-up work and eventually close.",
634
- "goal": "Measure whether conflict handling ends in repair rather than logging alone.",
635
- "failureModes": [
636
- "conflict-without-repair",
637
- "dangling-follow-up"
638
- ],
639
- "signals": [
640
- "helper-assignment-created",
641
- "clarification-linked-request-closes",
642
- "integration-recommendation-improves"
643
- ],
644
- "scoring": {
645
- "primaryMetric": "repair-closure-rate",
646
- "successCriterion": "Contradictions produce follow-up work that resolves before final pass."
647
- }
648
- },
649
- "clarification-chain-closure": {
650
- "title": "Clarification Chain Closure",
651
- "summary": "Checks whether clarification requests remain linked and blocking until their follow-up chain really closes.",
652
- "goal": "Measure resistance to fake resolution through status drift.",
653
- "failureModes": [
654
- "premature-clarification-close",
655
- "broken-linkage"
656
- ],
657
- "signals": [
658
- "closure-condition-present",
659
- "linked-request-open-while-parent-open",
660
- "human-escalation-when-needed"
661
- ],
662
- "scoring": {
663
- "primaryMetric": "false-consensus-rate",
664
- "successCriterion": "Clarifications do not silently disappear without an actual linked resolution."
665
- }
666
- }
667
- }
668
- }
669
- }
670
- }