switchroom 0.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (718) hide show
  1. package/LICENSE +21 -0
  2. package/README.md +447 -0
  3. package/bin/autoaccept.exp +81 -0
  4. package/bin/boot-self-test.sh +149 -0
  5. package/bin/bridge-watchdog.sh +967 -0
  6. package/bin/handoff-briefing.sh +206 -0
  7. package/bin/run-hook.sh +228 -0
  8. package/bin/switchroom.ts +4 -0
  9. package/bin/timezone-hook.sh +67 -0
  10. package/bin/user-profile-refresh-hook.sh +38 -0
  11. package/bin/workspace-dynamic-hook.sh +142 -0
  12. package/bin/workspace-stable-hook.sh +57 -0
  13. package/dist/cli/autoaccept-poll.js +118 -0
  14. package/dist/cli/switchroom.js +48557 -0
  15. package/package.json +95 -0
  16. package/profiles/_base/settings.json.hbs +15 -0
  17. package/profiles/_base/start.sh.hbs +383 -0
  18. package/profiles/_shared/telegram-style.md.hbs +140 -0
  19. package/profiles/coding/CLAUDE.md.hbs +57 -0
  20. package/profiles/coding/skills/architecture/SKILL.md +70 -0
  21. package/profiles/coding/skills/code-review/SKILL.md +58 -0
  22. package/profiles/coding/workspace/SOUL.md.hbs +25 -0
  23. package/profiles/default/CLAUDE.md +238 -0
  24. package/profiles/default/CLAUDE.md.hbs +113 -0
  25. package/profiles/default/workspace/CLAUDE.md.hbs +126 -0
  26. package/profiles/default/workspace/HEARTBEAT.md.hbs +40 -0
  27. package/profiles/default/workspace/IDENTITY.md.hbs +32 -0
  28. package/profiles/default/workspace/MEMORY.md.hbs +29 -0
  29. package/profiles/default/workspace/SOUL.md.hbs +61 -0
  30. package/profiles/default/workspace/TOOLS.md.hbs +29 -0
  31. package/profiles/default/workspace/USER.md.hbs +52 -0
  32. package/profiles/default/workspace/memory/.gitkeep +0 -0
  33. package/profiles/executive-assistant/CLAUDE.md.hbs +51 -0
  34. package/profiles/executive-assistant/skills/daily-briefing/SKILL.md +55 -0
  35. package/profiles/executive-assistant/skills/meeting-prep/SKILL.md +58 -0
  36. package/profiles/executive-assistant/workspace/SOUL.md.hbs +25 -0
  37. package/profiles/health-coach/CLAUDE.md.hbs +45 -0
  38. package/profiles/health-coach/skills/check-in/SKILL.md +41 -0
  39. package/profiles/health-coach/skills/weekly-review/SKILL.md +53 -0
  40. package/profiles/health-coach/workspace/SOUL.md.hbs +25 -0
  41. package/skills/buildkite-agent-infrastructure/SKILL.md +302 -0
  42. package/skills/buildkite-agent-infrastructure/agents/openai.yaml +6 -0
  43. package/skills/buildkite-agent-infrastructure/assets/buildkite-icon-large.png +0 -0
  44. package/skills/buildkite-agent-infrastructure/assets/buildkite-icon-small.png +0 -0
  45. package/skills/buildkite-agent-infrastructure/references/audit-logging.md +87 -0
  46. package/skills/buildkite-agent-infrastructure/references/graphql-mutations.md +690 -0
  47. package/skills/buildkite-agent-infrastructure/references/instance-shapes.md +38 -0
  48. package/skills/buildkite-agent-infrastructure/references/pipeline-templates.md +73 -0
  49. package/skills/buildkite-agent-infrastructure/references/self-hosted-agents.md +137 -0
  50. package/skills/buildkite-agent-infrastructure/references/sso-saml.md +92 -0
  51. package/skills/buildkite-agent-runtime/SKILL.md +476 -0
  52. package/skills/buildkite-agent-runtime/agents/openai.yaml +6 -0
  53. package/skills/buildkite-agent-runtime/assets/buildkite-icon-large.png +0 -0
  54. package/skills/buildkite-agent-runtime/assets/buildkite-icon-small.png +0 -0
  55. package/skills/buildkite-agent-runtime/references/flag-reference.md +417 -0
  56. package/skills/buildkite-agent-runtime/references/patterns-and-recipes.md +555 -0
  57. package/skills/buildkite-api/SKILL.md +285 -0
  58. package/skills/buildkite-api/agents/openai.yaml +6 -0
  59. package/skills/buildkite-api/assets/buildkite-icon-large.png +0 -0
  60. package/skills/buildkite-api/assets/buildkite-icon-small.png +0 -0
  61. package/skills/buildkite-api/references/graphql-reference.md +195 -0
  62. package/skills/buildkite-api/references/patterns.md +44 -0
  63. package/skills/buildkite-api/references/webhooks.md +161 -0
  64. package/skills/buildkite-cli/SKILL.md +379 -0
  65. package/skills/buildkite-cli/agents/openai.yaml +6 -0
  66. package/skills/buildkite-cli/assets/buildkite-icon-large.png +0 -0
  67. package/skills/buildkite-cli/assets/buildkite-icon-small.png +0 -0
  68. package/skills/buildkite-cli/references/command-reference.md +181 -0
  69. package/skills/buildkite-migration/SKILL.md +182 -0
  70. package/skills/buildkite-pipelines/SKILL.md +464 -0
  71. package/skills/buildkite-pipelines/agents/openai.yaml +6 -0
  72. package/skills/buildkite-pipelines/assets/buildkite-icon-large.png +0 -0
  73. package/skills/buildkite-pipelines/assets/buildkite-icon-small.png +0 -0
  74. package/skills/buildkite-pipelines/examples/basic-pipeline.yml +24 -0
  75. package/skills/buildkite-pipelines/examples/optimized-pipeline.yml +100 -0
  76. package/skills/buildkite-pipelines/references/advanced-patterns.md +286 -0
  77. package/skills/buildkite-pipelines/references/retry-and-error-codes.md +131 -0
  78. package/skills/buildkite-pipelines/references/step-types-reference.md +225 -0
  79. package/skills/buildkite-secure-delivery/SKILL.md +168 -0
  80. package/skills/buildkite-secure-delivery/agents/openai.yaml +6 -0
  81. package/skills/buildkite-secure-delivery/assets/buildkite-icon-large.png +0 -0
  82. package/skills/buildkite-secure-delivery/assets/buildkite-icon-small.png +0 -0
  83. package/skills/buildkite-secure-delivery/references/oidc-cloud-providers.md +83 -0
  84. package/skills/buildkite-secure-delivery/references/package-publishing.md +100 -0
  85. package/skills/buildkite-test-engine/SKILL.md +239 -0
  86. package/skills/buildkite-test-engine/agents/openai.yaml +6 -0
  87. package/skills/buildkite-test-engine/assets/buildkite-icon-large.png +0 -0
  88. package/skills/buildkite-test-engine/assets/buildkite-icon-small.png +0 -0
  89. package/skills/buildkite-test-engine/examples/bktec-splitting.yml +16 -0
  90. package/skills/buildkite-test-engine/examples/collector-pipeline.yml +11 -0
  91. package/skills/buildkite-test-engine/references/collectors.md +198 -0
  92. package/skills/buildkite-test-engine/references/splitting-examples.md +93 -0
  93. package/skills/docx/LICENSE.txt +30 -0
  94. package/skills/docx/SKILL.md +590 -0
  95. package/skills/docx/VENDORED.md +32 -0
  96. package/skills/docx/scripts/__init__.py +1 -0
  97. package/skills/docx/scripts/accept_changes.py +135 -0
  98. package/skills/docx/scripts/comment.py +318 -0
  99. package/skills/docx/scripts/office/helpers/__init__.py +0 -0
  100. package/skills/docx/scripts/office/helpers/merge_runs.py +199 -0
  101. package/skills/docx/scripts/office/helpers/simplify_redlines.py +197 -0
  102. package/skills/docx/scripts/office/pack.py +159 -0
  103. package/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chart.xsd +1499 -0
  104. package/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chartDrawing.xsd +146 -0
  105. package/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-diagram.xsd +1085 -0
  106. package/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-lockedCanvas.xsd +11 -0
  107. package/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-main.xsd +3081 -0
  108. package/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-picture.xsd +23 -0
  109. package/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-spreadsheetDrawing.xsd +185 -0
  110. package/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-wordprocessingDrawing.xsd +287 -0
  111. package/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/pml.xsd +1676 -0
  112. package/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-additionalCharacteristics.xsd +28 -0
  113. package/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-bibliography.xsd +144 -0
  114. package/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-commonSimpleTypes.xsd +174 -0
  115. package/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlDataProperties.xsd +25 -0
  116. package/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlSchemaProperties.xsd +18 -0
  117. package/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesCustom.xsd +59 -0
  118. package/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesExtended.xsd +56 -0
  119. package/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesVariantTypes.xsd +195 -0
  120. package/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-math.xsd +582 -0
  121. package/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-relationshipReference.xsd +25 -0
  122. package/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/sml.xsd +4439 -0
  123. package/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-main.xsd +570 -0
  124. package/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-officeDrawing.xsd +509 -0
  125. package/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-presentationDrawing.xsd +12 -0
  126. package/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-spreadsheetDrawing.xsd +108 -0
  127. package/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-wordprocessingDrawing.xsd +96 -0
  128. package/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/wml.xsd +3646 -0
  129. package/skills/docx/scripts/office/schemas/ISO-IEC29500-4_2016/xml.xsd +116 -0
  130. package/skills/docx/scripts/office/schemas/ecma/fouth-edition/opc-contentTypes.xsd +42 -0
  131. package/skills/docx/scripts/office/schemas/ecma/fouth-edition/opc-coreProperties.xsd +50 -0
  132. package/skills/docx/scripts/office/schemas/ecma/fouth-edition/opc-digSig.xsd +49 -0
  133. package/skills/docx/scripts/office/schemas/ecma/fouth-edition/opc-relationships.xsd +33 -0
  134. package/skills/docx/scripts/office/schemas/mce/mc.xsd +75 -0
  135. package/skills/docx/scripts/office/schemas/microsoft/wml-2010.xsd +560 -0
  136. package/skills/docx/scripts/office/schemas/microsoft/wml-2012.xsd +67 -0
  137. package/skills/docx/scripts/office/schemas/microsoft/wml-2018.xsd +14 -0
  138. package/skills/docx/scripts/office/schemas/microsoft/wml-cex-2018.xsd +20 -0
  139. package/skills/docx/scripts/office/schemas/microsoft/wml-cid-2016.xsd +13 -0
  140. package/skills/docx/scripts/office/schemas/microsoft/wml-sdtdatahash-2020.xsd +4 -0
  141. package/skills/docx/scripts/office/schemas/microsoft/wml-symex-2015.xsd +8 -0
  142. package/skills/docx/scripts/office/soffice.py +183 -0
  143. package/skills/docx/scripts/office/unpack.py +132 -0
  144. package/skills/docx/scripts/office/validate.py +111 -0
  145. package/skills/docx/scripts/office/validators/__init__.py +15 -0
  146. package/skills/docx/scripts/office/validators/__pycache__/__init__.cpython-313.pyc +0 -0
  147. package/skills/docx/scripts/office/validators/__pycache__/base.cpython-313.pyc +0 -0
  148. package/skills/docx/scripts/office/validators/base.py +847 -0
  149. package/skills/docx/scripts/office/validators/docx.py +446 -0
  150. package/skills/docx/scripts/office/validators/pptx.py +275 -0
  151. package/skills/docx/scripts/office/validators/redlining.py +247 -0
  152. package/skills/docx/scripts/templates/comments.xml +3 -0
  153. package/skills/docx/scripts/templates/commentsExtended.xml +3 -0
  154. package/skills/docx/scripts/templates/commentsExtensible.xml +3 -0
  155. package/skills/docx/scripts/templates/commentsIds.xml +3 -0
  156. package/skills/docx/scripts/templates/people.xml +3 -0
  157. package/skills/file-bug/SKILL.md +129 -0
  158. package/skills/humanizer/LICENSE +21 -0
  159. package/skills/humanizer/SKILL.md +559 -0
  160. package/skills/humanizer/VENDORED.md +38 -0
  161. package/skills/humanizer-calibrate/SKILL.md +144 -0
  162. package/skills/mcp-builder/LICENSE.txt +202 -0
  163. package/skills/mcp-builder/SKILL.md +236 -0
  164. package/skills/mcp-builder/VENDORED.md +32 -0
  165. package/skills/mcp-builder/reference/evaluation.md +602 -0
  166. package/skills/mcp-builder/reference/mcp_best_practices.md +249 -0
  167. package/skills/mcp-builder/reference/node_mcp_server.md +970 -0
  168. package/skills/mcp-builder/reference/python_mcp_server.md +719 -0
  169. package/skills/mcp-builder/scripts/connections.py +151 -0
  170. package/skills/mcp-builder/scripts/evaluation.py +373 -0
  171. package/skills/mcp-builder/scripts/example_evaluation.xml +22 -0
  172. package/skills/mcp-builder/scripts/requirements.txt +2 -0
  173. package/skills/pdf/LICENSE.txt +30 -0
  174. package/skills/pdf/SKILL.md +314 -0
  175. package/skills/pdf/VENDORED.md +32 -0
  176. package/skills/pdf/forms.md +294 -0
  177. package/skills/pdf/reference.md +612 -0
  178. package/skills/pdf/scripts/check_bounding_boxes.py +65 -0
  179. package/skills/pdf/scripts/check_fillable_fields.py +11 -0
  180. package/skills/pdf/scripts/convert_pdf_to_images.py +33 -0
  181. package/skills/pdf/scripts/create_validation_image.py +37 -0
  182. package/skills/pdf/scripts/extract_form_field_info.py +122 -0
  183. package/skills/pdf/scripts/extract_form_structure.py +115 -0
  184. package/skills/pdf/scripts/fill_fillable_fields.py +98 -0
  185. package/skills/pdf/scripts/fill_pdf_form_with_annotations.py +107 -0
  186. package/skills/pptx/LICENSE.txt +30 -0
  187. package/skills/pptx/SKILL.md +232 -0
  188. package/skills/pptx/VENDORED.md +32 -0
  189. package/skills/pptx/editing.md +205 -0
  190. package/skills/pptx/pptxgenjs.md +420 -0
  191. package/skills/pptx/scripts/__init__.py +0 -0
  192. package/skills/pptx/scripts/add_slide.py +195 -0
  193. package/skills/pptx/scripts/clean.py +286 -0
  194. package/skills/pptx/scripts/office/helpers/__init__.py +0 -0
  195. package/skills/pptx/scripts/office/helpers/merge_runs.py +199 -0
  196. package/skills/pptx/scripts/office/helpers/simplify_redlines.py +197 -0
  197. package/skills/pptx/scripts/office/pack.py +159 -0
  198. package/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chart.xsd +1499 -0
  199. package/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chartDrawing.xsd +146 -0
  200. package/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-diagram.xsd +1085 -0
  201. package/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-lockedCanvas.xsd +11 -0
  202. package/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-main.xsd +3081 -0
  203. package/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-picture.xsd +23 -0
  204. package/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-spreadsheetDrawing.xsd +185 -0
  205. package/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-wordprocessingDrawing.xsd +287 -0
  206. package/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/pml.xsd +1676 -0
  207. package/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-additionalCharacteristics.xsd +28 -0
  208. package/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-bibliography.xsd +144 -0
  209. package/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-commonSimpleTypes.xsd +174 -0
  210. package/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlDataProperties.xsd +25 -0
  211. package/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlSchemaProperties.xsd +18 -0
  212. package/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesCustom.xsd +59 -0
  213. package/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesExtended.xsd +56 -0
  214. package/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesVariantTypes.xsd +195 -0
  215. package/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-math.xsd +582 -0
  216. package/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-relationshipReference.xsd +25 -0
  217. package/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/sml.xsd +4439 -0
  218. package/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-main.xsd +570 -0
  219. package/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-officeDrawing.xsd +509 -0
  220. package/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-presentationDrawing.xsd +12 -0
  221. package/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-spreadsheetDrawing.xsd +108 -0
  222. package/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-wordprocessingDrawing.xsd +96 -0
  223. package/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/wml.xsd +3646 -0
  224. package/skills/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/xml.xsd +116 -0
  225. package/skills/pptx/scripts/office/schemas/ecma/fouth-edition/opc-contentTypes.xsd +42 -0
  226. package/skills/pptx/scripts/office/schemas/ecma/fouth-edition/opc-coreProperties.xsd +50 -0
  227. package/skills/pptx/scripts/office/schemas/ecma/fouth-edition/opc-digSig.xsd +49 -0
  228. package/skills/pptx/scripts/office/schemas/ecma/fouth-edition/opc-relationships.xsd +33 -0
  229. package/skills/pptx/scripts/office/schemas/mce/mc.xsd +75 -0
  230. package/skills/pptx/scripts/office/schemas/microsoft/wml-2010.xsd +560 -0
  231. package/skills/pptx/scripts/office/schemas/microsoft/wml-2012.xsd +67 -0
  232. package/skills/pptx/scripts/office/schemas/microsoft/wml-2018.xsd +14 -0
  233. package/skills/pptx/scripts/office/schemas/microsoft/wml-cex-2018.xsd +20 -0
  234. package/skills/pptx/scripts/office/schemas/microsoft/wml-cid-2016.xsd +13 -0
  235. package/skills/pptx/scripts/office/schemas/microsoft/wml-sdtdatahash-2020.xsd +4 -0
  236. package/skills/pptx/scripts/office/schemas/microsoft/wml-symex-2015.xsd +8 -0
  237. package/skills/pptx/scripts/office/soffice.py +183 -0
  238. package/skills/pptx/scripts/office/unpack.py +132 -0
  239. package/skills/pptx/scripts/office/validate.py +111 -0
  240. package/skills/pptx/scripts/office/validators/__init__.py +15 -0
  241. package/skills/pptx/scripts/office/validators/base.py +847 -0
  242. package/skills/pptx/scripts/office/validators/docx.py +446 -0
  243. package/skills/pptx/scripts/office/validators/pptx.py +275 -0
  244. package/skills/pptx/scripts/office/validators/redlining.py +247 -0
  245. package/skills/pptx/scripts/thumbnail.py +289 -0
  246. package/skills/skill-creator/LICENSE.txt +202 -0
  247. package/skills/skill-creator/SKILL.md +485 -0
  248. package/skills/skill-creator/VENDORED.md +32 -0
  249. package/skills/skill-creator/agents/analyzer.md +274 -0
  250. package/skills/skill-creator/agents/comparator.md +202 -0
  251. package/skills/skill-creator/agents/grader.md +223 -0
  252. package/skills/skill-creator/assets/eval_review.html +146 -0
  253. package/skills/skill-creator/eval-viewer/generate_review.py +471 -0
  254. package/skills/skill-creator/eval-viewer/viewer.html +1325 -0
  255. package/skills/skill-creator/references/schemas.md +430 -0
  256. package/skills/skill-creator/scripts/__init__.py +0 -0
  257. package/skills/skill-creator/scripts/aggregate_benchmark.py +401 -0
  258. package/skills/skill-creator/scripts/generate_report.py +326 -0
  259. package/skills/skill-creator/scripts/improve_description.py +247 -0
  260. package/skills/skill-creator/scripts/package_skill.py +136 -0
  261. package/skills/skill-creator/scripts/quick_validate.py +103 -0
  262. package/skills/skill-creator/scripts/run_eval.py +310 -0
  263. package/skills/skill-creator/scripts/run_loop.py +328 -0
  264. package/skills/skill-creator/scripts/utils.py +47 -0
  265. package/skills/switchroom-architecture/SKILL.md +60 -0
  266. package/skills/switchroom-architecture/cascade.md +112 -0
  267. package/skills/switchroom-architecture/sub-agents.md +87 -0
  268. package/skills/switchroom-architecture/telegram.md +94 -0
  269. package/skills/switchroom-cli/SKILL.md +274 -0
  270. package/skills/switchroom-health/SKILL.md +101 -0
  271. package/skills/switchroom-install/SKILL.md +116 -0
  272. package/skills/switchroom-manage/SKILL.md +90 -0
  273. package/skills/switchroom-status/SKILL.md +69 -0
  274. package/skills/switchroom-status/scripts/status.sh +69 -0
  275. package/skills/telegram-test-harness/SKILL.md +191 -0
  276. package/skills/token-helpers/SKILL.md +73 -0
  277. package/skills/token-helpers/scripts/google-cal-token.sh +62 -0
  278. package/skills/token-helpers/scripts/ms-graph-token.sh +70 -0
  279. package/skills/webapp-testing/LICENSE.txt +202 -0
  280. package/skills/webapp-testing/SKILL.md +96 -0
  281. package/skills/webapp-testing/VENDORED.md +32 -0
  282. package/skills/webapp-testing/examples/console_logging.py +35 -0
  283. package/skills/webapp-testing/examples/element_discovery.py +40 -0
  284. package/skills/webapp-testing/examples/static_html_automation.py +33 -0
  285. package/skills/webapp-testing/scripts/with_server.py +106 -0
  286. package/skills/xlsx/LICENSE.txt +30 -0
  287. package/skills/xlsx/SKILL.md +292 -0
  288. package/skills/xlsx/VENDORED.md +32 -0
  289. package/skills/xlsx/scripts/office/helpers/__init__.py +0 -0
  290. package/skills/xlsx/scripts/office/helpers/merge_runs.py +199 -0
  291. package/skills/xlsx/scripts/office/helpers/simplify_redlines.py +197 -0
  292. package/skills/xlsx/scripts/office/pack.py +159 -0
  293. package/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chart.xsd +1499 -0
  294. package/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chartDrawing.xsd +146 -0
  295. package/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-diagram.xsd +1085 -0
  296. package/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-lockedCanvas.xsd +11 -0
  297. package/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-main.xsd +3081 -0
  298. package/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-picture.xsd +23 -0
  299. package/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-spreadsheetDrawing.xsd +185 -0
  300. package/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-wordprocessingDrawing.xsd +287 -0
  301. package/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/pml.xsd +1676 -0
  302. package/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-additionalCharacteristics.xsd +28 -0
  303. package/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-bibliography.xsd +144 -0
  304. package/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-commonSimpleTypes.xsd +174 -0
  305. package/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlDataProperties.xsd +25 -0
  306. package/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlSchemaProperties.xsd +18 -0
  307. package/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesCustom.xsd +59 -0
  308. package/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesExtended.xsd +56 -0
  309. package/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesVariantTypes.xsd +195 -0
  310. package/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-math.xsd +582 -0
  311. package/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-relationshipReference.xsd +25 -0
  312. package/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/sml.xsd +4439 -0
  313. package/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-main.xsd +570 -0
  314. package/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-officeDrawing.xsd +509 -0
  315. package/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-presentationDrawing.xsd +12 -0
  316. package/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-spreadsheetDrawing.xsd +108 -0
  317. package/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-wordprocessingDrawing.xsd +96 -0
  318. package/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/wml.xsd +3646 -0
  319. package/skills/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/xml.xsd +116 -0
  320. package/skills/xlsx/scripts/office/schemas/ecma/fouth-edition/opc-contentTypes.xsd +42 -0
  321. package/skills/xlsx/scripts/office/schemas/ecma/fouth-edition/opc-coreProperties.xsd +50 -0
  322. package/skills/xlsx/scripts/office/schemas/ecma/fouth-edition/opc-digSig.xsd +49 -0
  323. package/skills/xlsx/scripts/office/schemas/ecma/fouth-edition/opc-relationships.xsd +33 -0
  324. package/skills/xlsx/scripts/office/schemas/mce/mc.xsd +75 -0
  325. package/skills/xlsx/scripts/office/schemas/microsoft/wml-2010.xsd +560 -0
  326. package/skills/xlsx/scripts/office/schemas/microsoft/wml-2012.xsd +67 -0
  327. package/skills/xlsx/scripts/office/schemas/microsoft/wml-2018.xsd +14 -0
  328. package/skills/xlsx/scripts/office/schemas/microsoft/wml-cex-2018.xsd +20 -0
  329. package/skills/xlsx/scripts/office/schemas/microsoft/wml-cid-2016.xsd +13 -0
  330. package/skills/xlsx/scripts/office/schemas/microsoft/wml-sdtdatahash-2020.xsd +4 -0
  331. package/skills/xlsx/scripts/office/schemas/microsoft/wml-symex-2015.xsd +8 -0
  332. package/skills/xlsx/scripts/office/soffice.py +183 -0
  333. package/skills/xlsx/scripts/office/unpack.py +132 -0
  334. package/skills/xlsx/scripts/office/validate.py +111 -0
  335. package/skills/xlsx/scripts/office/validators/__init__.py +15 -0
  336. package/skills/xlsx/scripts/office/validators/base.py +847 -0
  337. package/skills/xlsx/scripts/office/validators/docx.py +446 -0
  338. package/skills/xlsx/scripts/office/validators/pptx.py +275 -0
  339. package/skills/xlsx/scripts/office/validators/redlining.py +247 -0
  340. package/skills/xlsx/scripts/recalc.py +184 -0
  341. package/telegram-plugin/.claude-plugin/plugin.json +20 -0
  342. package/telegram-plugin/.mcp.json +14 -0
  343. package/telegram-plugin/LICENSE +21 -0
  344. package/telegram-plugin/README.md +352 -0
  345. package/telegram-plugin/active-pins-sweep.ts +204 -0
  346. package/telegram-plugin/active-pins.ts +146 -0
  347. package/telegram-plugin/active-reactions-sweep.ts +79 -0
  348. package/telegram-plugin/active-reactions.ts +134 -0
  349. package/telegram-plugin/admin-commands/dispatch.test.ts +149 -0
  350. package/telegram-plugin/admin-commands/index.ts +106 -0
  351. package/telegram-plugin/answer-stream.ts +565 -0
  352. package/telegram-plugin/ask-user.ts +179 -0
  353. package/telegram-plugin/attachment-path.ts +80 -0
  354. package/telegram-plugin/auth-code-redact.ts +83 -0
  355. package/telegram-plugin/auth-dashboard.ts +1104 -0
  356. package/telegram-plugin/auth-slot-parser.ts +497 -0
  357. package/telegram-plugin/auto-fallback-dispatcher.ts +68 -0
  358. package/telegram-plugin/auto-fallback.ts +348 -0
  359. package/telegram-plugin/bridge/bridge.ts +687 -0
  360. package/telegram-plugin/bridge/ipc-client.ts +326 -0
  361. package/telegram-plugin/bun.lock +218 -0
  362. package/telegram-plugin/card-format.ts +62 -0
  363. package/telegram-plugin/channel-envelope-safety.test.ts +56 -0
  364. package/telegram-plugin/channel-envelope-safety.ts +56 -0
  365. package/telegram-plugin/chat-lock.ts +65 -0
  366. package/telegram-plugin/context-exhaustion.ts +38 -0
  367. package/telegram-plugin/credits-watch.ts +220 -0
  368. package/telegram-plugin/dist/bridge/bridge.js +24758 -0
  369. package/telegram-plugin/dist/foreman/foreman.js +30723 -0
  370. package/telegram-plugin/dist/gateway/gateway.js +46497 -0
  371. package/telegram-plugin/dist/server.js +24551 -0
  372. package/telegram-plugin/dm-command-gate.ts +56 -0
  373. package/telegram-plugin/docs/gateway-server-split.md +133 -0
  374. package/telegram-plugin/docs/multi-agent-card-design.md +847 -0
  375. package/telegram-plugin/docs/pinned-progress-card-reliability.md +144 -0
  376. package/telegram-plugin/docs/stream-json-daemon-mode.md +477 -0
  377. package/telegram-plugin/docs/waiting-ux-spec.md +233 -0
  378. package/telegram-plugin/draft-stream.ts +442 -0
  379. package/telegram-plugin/draft-transport.ts +72 -0
  380. package/telegram-plugin/first-paint.ts +246 -0
  381. package/telegram-plugin/fleet-state.ts +246 -0
  382. package/telegram-plugin/foreman/foreman-create-flow.ts +202 -0
  383. package/telegram-plugin/foreman/foreman-handlers.ts +493 -0
  384. package/telegram-plugin/foreman/foreman.ts +1130 -0
  385. package/telegram-plugin/foreman/setup-flow.ts +345 -0
  386. package/telegram-plugin/foreman/setup-state.ts +239 -0
  387. package/telegram-plugin/foreman/state.ts +203 -0
  388. package/telegram-plugin/format.ts +685 -0
  389. package/telegram-plugin/gateway/access-validator.test.ts +95 -0
  390. package/telegram-plugin/gateway/access-validator.ts +37 -0
  391. package/telegram-plugin/gateway/boot-card.ts +582 -0
  392. package/telegram-plugin/gateway/boot-probes.ts +863 -0
  393. package/telegram-plugin/gateway/boot-reason.ts +51 -0
  394. package/telegram-plugin/gateway/boot-sweep-filter.test.ts +54 -0
  395. package/telegram-plugin/gateway/boot-sweep-filter.ts +32 -0
  396. package/telegram-plugin/gateway/clean-shutdown-marker.ts +183 -0
  397. package/telegram-plugin/gateway/disconnect-flush.ts +109 -0
  398. package/telegram-plugin/gateway/gateway.ts +10202 -0
  399. package/telegram-plugin/gateway/inbound-coalesce.ts +147 -0
  400. package/telegram-plugin/gateway/inject-handler.test.ts +221 -0
  401. package/telegram-plugin/gateway/inject-handler.ts +190 -0
  402. package/telegram-plugin/gateway/ipc-protocol.ts +151 -0
  403. package/telegram-plugin/gateway/ipc-server.ts +494 -0
  404. package/telegram-plugin/gateway/pid-file.ts +103 -0
  405. package/telegram-plugin/gateway/poll-health.ts +156 -0
  406. package/telegram-plugin/gateway/preamble-suppressor.ts +154 -0
  407. package/telegram-plugin/gateway/quota-cache.ts +125 -0
  408. package/telegram-plugin/gateway/resolve-calling-subagent.ts +78 -0
  409. package/telegram-plugin/gateway/restart-watchdog.ts +200 -0
  410. package/telegram-plugin/gateway/session-marker.ts +83 -0
  411. package/telegram-plugin/gateway/shutdown-drain.ts +162 -0
  412. package/telegram-plugin/gateway/startup-mutex.ts +285 -0
  413. package/telegram-plugin/gateway/startup-network-retry.ts +142 -0
  414. package/telegram-plugin/gateway/turn-active-marker.ts +176 -0
  415. package/telegram-plugin/gateway/unhandled-rejection-policy.ts +78 -0
  416. package/telegram-plugin/handoff-continuity.ts +200 -0
  417. package/telegram-plugin/history.ts +468 -0
  418. package/telegram-plugin/hooks/hooks.json +58 -0
  419. package/telegram-plugin/hooks/secret-guard-pretool.mjs +208 -0
  420. package/telegram-plugin/hooks/secret-scrub-stop.mjs +98 -0
  421. package/telegram-plugin/hooks/silent-end-interrupt-stop.mjs +111 -0
  422. package/telegram-plugin/hooks/subagent-tracker-posttool.mjs +296 -0
  423. package/telegram-plugin/hooks/subagent-tracker-pretool.mjs +261 -0
  424. package/telegram-plugin/html-sanitize.ts +244 -0
  425. package/telegram-plugin/idle-footer.ts +65 -0
  426. package/telegram-plugin/inline-keyboard-callbacks.ts +166 -0
  427. package/telegram-plugin/interrupt-marker.ts +66 -0
  428. package/telegram-plugin/issues-card.ts +371 -0
  429. package/telegram-plugin/issues-watcher.ts +125 -0
  430. package/telegram-plugin/model-unavailable.ts +325 -0
  431. package/telegram-plugin/node_modules/.vite/vitest/da39a3ee5e6b4b0d3255bfef95601890afd80709/results.json +1 -0
  432. package/telegram-plugin/operator-events-history.ts +94 -0
  433. package/telegram-plugin/operator-events.fixtures.json +161 -0
  434. package/telegram-plugin/operator-events.ts +421 -0
  435. package/telegram-plugin/package.json +55 -0
  436. package/telegram-plugin/permission-rule.ts +133 -0
  437. package/telegram-plugin/permission-title.ts +117 -0
  438. package/telegram-plugin/pin-event-log.ts +76 -0
  439. package/telegram-plugin/plugin-logger.ts +136 -0
  440. package/telegram-plugin/progress-card-driver.ts +2697 -0
  441. package/telegram-plugin/progress-card-pin-manager.ts +589 -0
  442. package/telegram-plugin/progress-card-pin-watchdog.ts +98 -0
  443. package/telegram-plugin/progress-card.ts +1409 -0
  444. package/telegram-plugin/pty-partial-handler.ts +247 -0
  445. package/telegram-plugin/pty-tail.ts +730 -0
  446. package/telegram-plugin/quota-check.ts +474 -0
  447. package/telegram-plugin/recent-outbound-dedup.ts +169 -0
  448. package/telegram-plugin/registry/api-registry.test.ts +201 -0
  449. package/telegram-plugin/registry/subagents-bugs.test.ts +454 -0
  450. package/telegram-plugin/registry/subagents-schema.ts +509 -0
  451. package/telegram-plugin/registry/subagents.test.ts +476 -0
  452. package/telegram-plugin/registry/turns-schema.test.ts +101 -0
  453. package/telegram-plugin/registry/turns-schema.ts +417 -0
  454. package/telegram-plugin/retry-api-call.ts +172 -0
  455. package/telegram-plugin/scripts/build.mjs +78 -0
  456. package/telegram-plugin/secret-detect/audit.ts +66 -0
  457. package/telegram-plugin/secret-detect/chunker.ts +37 -0
  458. package/telegram-plugin/secret-detect/entropy.ts +20 -0
  459. package/telegram-plugin/secret-detect/gitleaks-loader.ts +74 -0
  460. package/telegram-plugin/secret-detect/gitleaks.toml +27 -0
  461. package/telegram-plugin/secret-detect/index.ts +218 -0
  462. package/telegram-plugin/secret-detect/kv-scanner.ts +60 -0
  463. package/telegram-plugin/secret-detect/mask.ts +13 -0
  464. package/telegram-plugin/secret-detect/patterns.ts +115 -0
  465. package/telegram-plugin/secret-detect/pipeline.ts +144 -0
  466. package/telegram-plugin/secret-detect/rewrite.ts +26 -0
  467. package/telegram-plugin/secret-detect/secretlint-source.ts +95 -0
  468. package/telegram-plugin/secret-detect/slug.ts +44 -0
  469. package/telegram-plugin/secret-detect/staging.ts +85 -0
  470. package/telegram-plugin/secret-detect/suppressor.ts +34 -0
  471. package/telegram-plugin/secret-detect/url-redact.ts +60 -0
  472. package/telegram-plugin/secret-detect/vault-write.ts +56 -0
  473. package/telegram-plugin/server.js +41795 -0
  474. package/telegram-plugin/server.ts +171 -0
  475. package/telegram-plugin/session-tail.ts +884 -0
  476. package/telegram-plugin/shared/bot-runtime.ts +324 -0
  477. package/telegram-plugin/silent-reply.ts +58 -0
  478. package/telegram-plugin/slot-banner-driver.ts +147 -0
  479. package/telegram-plugin/slot-banner.ts +86 -0
  480. package/telegram-plugin/start.js +26 -0
  481. package/telegram-plugin/startup-reset.ts +45 -0
  482. package/telegram-plugin/status-reactions.ts +332 -0
  483. package/telegram-plugin/steering.ts +155 -0
  484. package/telegram-plugin/sticker-aliases.ts +249 -0
  485. package/telegram-plugin/stream-controller.ts +311 -0
  486. package/telegram-plugin/stream-reply-handler.ts +664 -0
  487. package/telegram-plugin/streaming-metrics.ts +134 -0
  488. package/telegram-plugin/streaming-report.ts +204 -0
  489. package/telegram-plugin/subagent-watcher.ts +880 -0
  490. package/telegram-plugin/telegram-button-constraints.ts +191 -0
  491. package/telegram-plugin/telegraph.ts +381 -0
  492. package/telegram-plugin/tests/HARNESS.md +340 -0
  493. package/telegram-plugin/tests/_progress-card-harness.ts +105 -0
  494. package/telegram-plugin/tests/active-pins-boot-reaper.test.ts +211 -0
  495. package/telegram-plugin/tests/active-pins-sweep.test.ts +309 -0
  496. package/telegram-plugin/tests/active-pins.test.ts +187 -0
  497. package/telegram-plugin/tests/active-reactions-sweep.test.ts +116 -0
  498. package/telegram-plugin/tests/active-reactions.test.ts +198 -0
  499. package/telegram-plugin/tests/answer-stream-dedup.test.ts +352 -0
  500. package/telegram-plugin/tests/answer-stream-silent-markers.test.ts +236 -0
  501. package/telegram-plugin/tests/answer-stream.test.ts +878 -0
  502. package/telegram-plugin/tests/ask-user.test.ts +203 -0
  503. package/telegram-plugin/tests/attachment-path.test.ts +199 -0
  504. package/telegram-plugin/tests/auth-account-identity-surface.test.ts +118 -0
  505. package/telegram-plugin/tests/auth-code-auto-capture.test.ts +144 -0
  506. package/telegram-plugin/tests/auth-code-redact.test.ts +248 -0
  507. package/telegram-plugin/tests/auth-dashboard-edge-cases.test.ts +260 -0
  508. package/telegram-plugin/tests/auth-dashboard-restart-flow.test.ts +140 -0
  509. package/telegram-plugin/tests/auth-dashboard-v3b.test.ts +559 -0
  510. package/telegram-plugin/tests/auth-dashboard.test.ts +1045 -0
  511. package/telegram-plugin/tests/auth-login-url-button.test.ts +122 -0
  512. package/telegram-plugin/tests/auth-slot-commands.test.ts +640 -0
  513. package/telegram-plugin/tests/auto-fallback-dispatcher.e2e.test.ts +183 -0
  514. package/telegram-plugin/tests/auto-fallback.test.ts +381 -0
  515. package/telegram-plugin/tests/boot-card-account-quota.test.ts +137 -0
  516. package/telegram-plugin/tests/boot-card-dedupe.test.ts +154 -0
  517. package/telegram-plugin/tests/boot-card-probe-target.test.ts +194 -0
  518. package/telegram-plugin/tests/boot-card-reason.test.ts +103 -0
  519. package/telegram-plugin/tests/boot-card-render.test.ts +219 -0
  520. package/telegram-plugin/tests/boot-probes.test.ts +451 -0
  521. package/telegram-plugin/tests/bot-api.harness.ts +116 -0
  522. package/telegram-plugin/tests/bot-runtime.test.ts +190 -0
  523. package/telegram-plugin/tests/bridge-anonymous-refuse.test.ts +60 -0
  524. package/telegram-plugin/tests/context-exhaustion.test.ts +114 -0
  525. package/telegram-plugin/tests/credits-watch.test.ts +221 -0
  526. package/telegram-plugin/tests/dm-command-gate.test.ts +176 -0
  527. package/telegram-plugin/tests/draft-stream.test.ts +752 -0
  528. package/telegram-plugin/tests/draft-transport.test.ts +141 -0
  529. package/telegram-plugin/tests/e2e.test.ts +436 -0
  530. package/telegram-plugin/tests/fake-bot-api.test.ts +213 -0
  531. package/telegram-plugin/tests/fake-bot-api.ts +617 -0
  532. package/telegram-plugin/tests/false-restart-banner.test.ts +253 -0
  533. package/telegram-plugin/tests/first-paint.test.ts +257 -0
  534. package/telegram-plugin/tests/fixtures/pty-tail-tmux-fragment.bin +6 -0
  535. package/telegram-plugin/tests/fixtures/service-log-current-claude-code.bin +3624 -0
  536. package/telegram-plugin/tests/fleet-state-watcher.test.ts +101 -0
  537. package/telegram-plugin/tests/fleet-state.test.ts +185 -0
  538. package/telegram-plugin/tests/foreman-create-flow.test.ts +359 -0
  539. package/telegram-plugin/tests/foreman-handlers.test.ts +347 -0
  540. package/telegram-plugin/tests/foreman-state.test.ts +164 -0
  541. package/telegram-plugin/tests/foreman-write-ops.test.ts +214 -0
  542. package/telegram-plugin/tests/gateway-409-retry-banner.test.ts +173 -0
  543. package/telegram-plugin/tests/gateway-boot-marker-clear.test.ts +72 -0
  544. package/telegram-plugin/tests/gateway-bridge.test.ts +811 -0
  545. package/telegram-plugin/tests/gateway-clean-shutdown-marker.test.ts +414 -0
  546. package/telegram-plugin/tests/gateway-disconnect-flush.test.ts +144 -0
  547. package/telegram-plugin/tests/gateway-message-validator.test.ts +133 -0
  548. package/telegram-plugin/tests/gateway-no-reply-single-emit.test.ts +103 -0
  549. package/telegram-plugin/tests/gateway-secret-detect.test.ts +127 -0
  550. package/telegram-plugin/tests/gateway-startup-mutex.test.ts +284 -0
  551. package/telegram-plugin/tests/gateway-startup-network-retry.test.ts +185 -0
  552. package/telegram-plugin/tests/gateway-startup-reset.test.ts +72 -0
  553. package/telegram-plugin/tests/gateway-update-placeholder-dispatch.test.ts +125 -0
  554. package/telegram-plugin/tests/handoff-continuity.test.ts +249 -0
  555. package/telegram-plugin/tests/harness-ordering-invariants.test.ts +243 -0
  556. package/telegram-plugin/tests/harness-parse-mode-validation.test.ts +114 -0
  557. package/telegram-plugin/tests/history.test.ts +364 -0
  558. package/telegram-plugin/tests/html-balanced.ts +63 -0
  559. package/telegram-plugin/tests/html-sanitize.test.ts +146 -0
  560. package/telegram-plugin/tests/idle-footer-wiring.test.ts +88 -0
  561. package/telegram-plugin/tests/idle-footer.test.ts +66 -0
  562. package/telegram-plugin/tests/inbound-coalesce.test.ts +127 -0
  563. package/telegram-plugin/tests/inline-keyboard-callbacks.test.ts +150 -0
  564. package/telegram-plugin/tests/interrupt-marker.test.ts +126 -0
  565. package/telegram-plugin/tests/ipc-protocol.test.ts +218 -0
  566. package/telegram-plugin/tests/ipc-server-anonymous-refuse.test.ts +82 -0
  567. package/telegram-plugin/tests/ipc-server-client.test.ts +323 -0
  568. package/telegram-plugin/tests/ipc-server-race.test.ts +183 -0
  569. package/telegram-plugin/tests/ipc-server-validate-operator.test.ts +91 -0
  570. package/telegram-plugin/tests/ipc-server-validate-pty-partial.test.ts +64 -0
  571. package/telegram-plugin/tests/ipc-server-validate-update-placeholder.test.ts +77 -0
  572. package/telegram-plugin/tests/ipc-validator.test.ts +274 -0
  573. package/telegram-plugin/tests/issues-card.test.ts +495 -0
  574. package/telegram-plugin/tests/issues-watcher.test.ts +165 -0
  575. package/telegram-plugin/tests/model-unavailable.test.ts +303 -0
  576. package/telegram-plugin/tests/multi-turn-continuity.test.ts +159 -0
  577. package/telegram-plugin/tests/operator-events-history.test.ts +125 -0
  578. package/telegram-plugin/tests/operator-events-session-tail.test.ts +192 -0
  579. package/telegram-plugin/tests/operator-events.test.ts +331 -0
  580. package/telegram-plugin/tests/outbound-ordering.test.ts +293 -0
  581. package/telegram-plugin/tests/parse-mode-rotation.test.ts +164 -0
  582. package/telegram-plugin/tests/permission-rule.test.ts +121 -0
  583. package/telegram-plugin/tests/permission-title.test.ts +106 -0
  584. package/telegram-plugin/tests/pin-event-log.test.ts +124 -0
  585. package/telegram-plugin/tests/plugin-logger.test.ts +97 -0
  586. package/telegram-plugin/tests/poll-health.test.ts +86 -0
  587. package/telegram-plugin/tests/preamble-suppressor.test.ts +285 -0
  588. package/telegram-plugin/tests/progress-card-api-failure-during-deferred.test.ts +73 -0
  589. package/telegram-plugin/tests/progress-card-close-paths-converge.test.ts +272 -0
  590. package/telegram-plugin/tests/progress-card-cross-turn.test.ts +258 -0
  591. package/telegram-plugin/tests/progress-card-dispose-preservepending.test.ts +81 -0
  592. package/telegram-plugin/tests/progress-card-draft-flag.test.ts +80 -0
  593. package/telegram-plugin/tests/progress-card-driver-eviction.test.ts +215 -0
  594. package/telegram-plugin/tests/progress-card-driver-fleet-shadow.test.ts +123 -0
  595. package/telegram-plugin/tests/progress-card-driver-force-complete-parent-done.test.ts +76 -0
  596. package/telegram-plugin/tests/progress-card-edit-timestamps-budget.test.ts +62 -0
  597. package/telegram-plugin/tests/progress-card-memory-bounds.test.ts +84 -0
  598. package/telegram-plugin/tests/progress-card-pin-failure-paths.test.ts +139 -0
  599. package/telegram-plugin/tests/progress-card-pin-manager.test.ts +773 -0
  600. package/telegram-plugin/tests/progress-card-pin-race-fast-turn.test.ts +66 -0
  601. package/telegram-plugin/tests/progress-card-pin-sidecar-partial-write.test.ts +64 -0
  602. package/telegram-plugin/tests/progress-card-pin-watchdog.test.ts +190 -0
  603. package/telegram-plugin/tests/progress-card-sigterm-pin-flush.test.ts +146 -0
  604. package/telegram-plugin/tests/progress-update.test.ts +236 -0
  605. package/telegram-plugin/tests/protocol-fixtures.test.ts +59 -0
  606. package/telegram-plugin/tests/protocol-fixtures.ts +198 -0
  607. package/telegram-plugin/tests/pty-partial-handler.test.ts +326 -0
  608. package/telegram-plugin/tests/pty-tail-real-fixture.test.ts +114 -0
  609. package/telegram-plugin/tests/pty-tail-tmux-fragment.test.ts +71 -0
  610. package/telegram-plugin/tests/pty-tail.test.ts +525 -0
  611. package/telegram-plugin/tests/quota-cache.test.ts +187 -0
  612. package/telegram-plugin/tests/quota-check.test.ts +622 -0
  613. package/telegram-plugin/tests/races.test.ts +842 -0
  614. package/telegram-plugin/tests/real-gateway-f1-ladder-integrity.test.ts +123 -0
  615. package/telegram-plugin/tests/real-gateway-f2-instant-draft.test.ts +82 -0
  616. package/telegram-plugin/tests/real-gateway-f3-late-card.test.ts +114 -0
  617. package/telegram-plugin/tests/real-gateway-harness.ts +699 -0
  618. package/telegram-plugin/tests/real-gateway-i6-turn-flush-replay-dedup.test.ts +313 -0
  619. package/telegram-plugin/tests/real-gateway-ipc-lifecycle.test.ts +299 -0
  620. package/telegram-plugin/tests/real-gateway-spec.test.ts +487 -0
  621. package/telegram-plugin/tests/real-gateway.smoke.test.ts +101 -0
  622. package/telegram-plugin/tests/recent-outbound-dedup.test.ts +192 -0
  623. package/telegram-plugin/tests/registry-turns.test.ts +432 -0
  624. package/telegram-plugin/tests/reply-terminal-reaction.test.ts +149 -0
  625. package/telegram-plugin/tests/resolve-calling-subagent.test.ts +269 -0
  626. package/telegram-plugin/tests/restart-watchdog.test.ts +224 -0
  627. package/telegram-plugin/tests/retry-api-call.test.ts +287 -0
  628. package/telegram-plugin/tests/secret-detect-audit.test.ts +58 -0
  629. package/telegram-plugin/tests/secret-detect-fail-closed.test.ts +83 -0
  630. package/telegram-plugin/tests/secret-detect-gitleaks.test.ts +32 -0
  631. package/telegram-plugin/tests/secret-detect-oauth-code.test.ts +308 -0
  632. package/telegram-plugin/tests/secret-detect-pipeline.test.ts +123 -0
  633. package/telegram-plugin/tests/secret-detect-secretlint.test.ts +101 -0
  634. package/telegram-plugin/tests/secret-detect-staging.test.ts +45 -0
  635. package/telegram-plugin/tests/secret-detect-suppressor-no-silent-allow.test.ts +67 -0
  636. package/telegram-plugin/tests/secret-detect.test.ts +223 -0
  637. package/telegram-plugin/tests/secret-guard-pretool.test.ts +194 -0
  638. package/telegram-plugin/tests/send-typing-action-validation.test.ts +61 -0
  639. package/telegram-plugin/tests/session-tail-capped.test.ts +285 -0
  640. package/telegram-plugin/tests/session-tail.test.ts +524 -0
  641. package/telegram-plugin/tests/setup-flow.test.ts +510 -0
  642. package/telegram-plugin/tests/setup-state.test.ts +146 -0
  643. package/telegram-plugin/tests/silent-reply-guard.test.ts +122 -0
  644. package/telegram-plugin/tests/slot-banner-driver.e2e.test.ts +350 -0
  645. package/telegram-plugin/tests/slot-banner.test.ts +74 -0
  646. package/telegram-plugin/tests/snapshot-serializer.ts +79 -0
  647. package/telegram-plugin/tests/spawn-detached-cgroup-escape.test.ts +51 -0
  648. package/telegram-plugin/tests/status-accent.test.ts +186 -0
  649. package/telegram-plugin/tests/status-reactions-allowed-filter.test.ts +132 -0
  650. package/telegram-plugin/tests/status-reactions.test.ts +314 -0
  651. package/telegram-plugin/tests/steering.test.ts +282 -0
  652. package/telegram-plugin/tests/sticker-aliases.test.ts +232 -0
  653. package/telegram-plugin/tests/stream-controller-html-fallback.test.ts +127 -0
  654. package/telegram-plugin/tests/stream-controller.test.ts +262 -0
  655. package/telegram-plugin/tests/stream-reply-error-paths.test.ts +208 -0
  656. package/telegram-plugin/tests/stream-reply-handler.test.ts +1292 -0
  657. package/telegram-plugin/tests/streaming-e2e.test.ts +389 -0
  658. package/telegram-plugin/tests/streaming-metrics.test.ts +201 -0
  659. package/telegram-plugin/tests/streaming-orchestration.test.ts +756 -0
  660. package/telegram-plugin/tests/subagent-registry-bugs.test.ts +725 -0
  661. package/telegram-plugin/tests/subagent-tracker-hooks.test.ts +213 -0
  662. package/telegram-plugin/tests/subagent-watcher-parent-marker.test.ts +274 -0
  663. package/telegram-plugin/tests/subagent-watcher-stall-notification.test.ts +243 -0
  664. package/telegram-plugin/tests/subagent-watcher.test.ts +877 -0
  665. package/telegram-plugin/tests/subagents-schema-init-order.test.ts +109 -0
  666. package/telegram-plugin/tests/sync-chat-running-subagents.test.ts +116 -0
  667. package/telegram-plugin/tests/telegram-button-constraints.test.ts +194 -0
  668. package/telegram-plugin/tests/telegram-format.test.ts +1093 -0
  669. package/telegram-plugin/tests/telegraph.test.ts +246 -0
  670. package/telegram-plugin/tests/tool-labels.test.ts +383 -0
  671. package/telegram-plugin/tests/turn-active-marker.test.ts +195 -0
  672. package/telegram-plugin/tests/turn-end-regressions.test.ts +489 -0
  673. package/telegram-plugin/tests/turn-flush-card-takeover.test.ts +218 -0
  674. package/telegram-plugin/tests/turn-flush-dedup-controller.test.ts +144 -0
  675. package/telegram-plugin/tests/turn-flush-prose-recovery.test.ts +78 -0
  676. package/telegram-plugin/tests/turn-flush-safety.test.ts +189 -0
  677. package/telegram-plugin/tests/turn-signal-tracker.test.ts +107 -0
  678. package/telegram-plugin/tests/turns-writer.test.ts +323 -0
  679. package/telegram-plugin/tests/two-zone-bg-carry-full-lifecycle.test.ts +131 -0
  680. package/telegram-plugin/tests/two-zone-bg-detection.test.ts +120 -0
  681. package/telegram-plugin/tests/two-zone-bg-done-when-all-terminal.test.ts +114 -0
  682. package/telegram-plugin/tests/two-zone-bg-early-turn-end.test.ts +87 -0
  683. package/telegram-plugin/tests/two-zone-bg-survives-next-turn.test.ts +211 -0
  684. package/telegram-plugin/tests/two-zone-card-cap.test.ts +62 -0
  685. package/telegram-plugin/tests/two-zone-card-fleet-row.test.ts +101 -0
  686. package/telegram-plugin/tests/two-zone-card-header-phases.test.ts +68 -0
  687. package/telegram-plugin/tests/two-zone-card-html-balance.test.ts +110 -0
  688. package/telegram-plugin/tests/two-zone-card-lifecycle.test.ts +128 -0
  689. package/telegram-plugin/tests/two-zone-card-sanitise.test.ts +58 -0
  690. package/telegram-plugin/tests/two-zone-card-snapshot.test.ts +133 -0
  691. package/telegram-plugin/tests/two-zone-concurrent-turns-isolation.test.ts +155 -0
  692. package/telegram-plugin/tests/two-zone-phasefor-precedence.test.ts +117 -0
  693. package/telegram-plugin/tests/two-zone-snapshot-extras.test.ts +143 -0
  694. package/telegram-plugin/tests/two-zone-stuck-edit-throttle.test.ts +149 -0
  695. package/telegram-plugin/tests/two-zone-stuck-header-escalation.test.ts +101 -0
  696. package/telegram-plugin/tests/two-zone-stuck-per-member.test.ts +114 -0
  697. package/telegram-plugin/tests/two-zone-stuck-recovery.test.ts +105 -0
  698. package/telegram-plugin/tests/typing-wrap.test.ts +141 -0
  699. package/telegram-plugin/tests/unhandled-rejection-policy.test.ts +147 -0
  700. package/telegram-plugin/tests/update-factory-edited-and-reactions.test.ts +108 -0
  701. package/telegram-plugin/tests/update-factory.ts +305 -0
  702. package/telegram-plugin/tests/vault-grant-wizard.test.ts +84 -0
  703. package/telegram-plugin/tests/vault-grants-revoke.test.ts +265 -0
  704. package/telegram-plugin/tests/vault-subcommands.test.ts +234 -0
  705. package/telegram-plugin/tests/voice-transcribe.test.ts +196 -0
  706. package/telegram-plugin/tests/waiting-ux-harness.ts +381 -0
  707. package/telegram-plugin/tests/waiting-ux.e2e.test.ts +233 -0
  708. package/telegram-plugin/tests/welcome-text.test.ts +407 -0
  709. package/telegram-plugin/tool-error-filter.ts +89 -0
  710. package/telegram-plugin/tool-labels.ts +330 -0
  711. package/telegram-plugin/tool-names.ts +53 -0
  712. package/telegram-plugin/turn-flush-prose-recovery.ts +40 -0
  713. package/telegram-plugin/turn-flush-safety.ts +109 -0
  714. package/telegram-plugin/turn-signal-tracker.ts +79 -0
  715. package/telegram-plugin/two-zone-card.ts +249 -0
  716. package/telegram-plugin/typing-wrap.ts +92 -0
  717. package/telegram-plugin/voice-transcribe.ts +166 -0
  718. package/telegram-plugin/welcome-text.ts +359 -0
@@ -0,0 +1,1325 @@
1
+ <!DOCTYPE html>
2
+ <html lang="en">
3
+ <head>
4
+ <meta charset="UTF-8">
5
+ <meta name="viewport" content="width=device-width, initial-scale=1.0">
6
+ <title>Eval Review</title>
7
+ <link rel="preconnect" href="https://fonts.googleapis.com">
8
+ <link rel="preconnect" href="https://fonts.gstatic.com" crossorigin>
9
+ <link href="https://fonts.googleapis.com/css2?family=Poppins:wght@500;600&family=Lora:wght@400;500&display=swap" rel="stylesheet">
10
+ <script src="https://cdn.sheetjs.com/xlsx-0.20.3/package/dist/xlsx.full.min.js" integrity="sha384-EnyY0/GSHQGSxSgMwaIPzSESbqoOLSexfnSMN2AP+39Ckmn92stwABZynq1JyzdT" crossorigin="anonymous"></script>
11
+ <style>
12
+ :root {
13
+ --bg: #faf9f5;
14
+ --surface: #ffffff;
15
+ --border: #e8e6dc;
16
+ --text: #141413;
17
+ --text-muted: #b0aea5;
18
+ --accent: #d97757;
19
+ --accent-hover: #c4613f;
20
+ --green: #788c5d;
21
+ --green-bg: #eef2e8;
22
+ --red: #c44;
23
+ --red-bg: #fceaea;
24
+ --header-bg: #141413;
25
+ --header-text: #faf9f5;
26
+ --radius: 6px;
27
+ }
28
+
29
+ * { box-sizing: border-box; margin: 0; padding: 0; }
30
+
31
+ body {
32
+ font-family: 'Lora', Georgia, serif;
33
+ background: var(--bg);
34
+ color: var(--text);
35
+ height: 100vh;
36
+ display: flex;
37
+ flex-direction: column;
38
+ }
39
+
40
+ /* ---- Header ---- */
41
+ .header {
42
+ background: var(--header-bg);
43
+ color: var(--header-text);
44
+ padding: 1rem 2rem;
45
+ display: flex;
46
+ justify-content: space-between;
47
+ align-items: center;
48
+ flex-shrink: 0;
49
+ }
50
+ .header h1 {
51
+ font-family: 'Poppins', sans-serif;
52
+ font-size: 1.25rem;
53
+ font-weight: 600;
54
+ }
55
+ .header .instructions {
56
+ font-size: 0.8rem;
57
+ opacity: 0.7;
58
+ margin-top: 0.25rem;
59
+ }
60
+ .header .progress {
61
+ font-size: 0.875rem;
62
+ opacity: 0.8;
63
+ text-align: right;
64
+ }
65
+
66
+ /* ---- Main content ---- */
67
+ .main {
68
+ flex: 1;
69
+ overflow-y: auto;
70
+ padding: 1.5rem 2rem;
71
+ display: flex;
72
+ flex-direction: column;
73
+ gap: 1.25rem;
74
+ }
75
+
76
+ /* ---- Sections ---- */
77
+ .section {
78
+ background: var(--surface);
79
+ border: 1px solid var(--border);
80
+ border-radius: var(--radius);
81
+ flex-shrink: 0;
82
+ }
83
+ .section-header {
84
+ font-family: 'Poppins', sans-serif;
85
+ padding: 0.75rem 1rem;
86
+ font-size: 0.75rem;
87
+ font-weight: 500;
88
+ text-transform: uppercase;
89
+ letter-spacing: 0.05em;
90
+ color: var(--text-muted);
91
+ border-bottom: 1px solid var(--border);
92
+ background: var(--bg);
93
+ }
94
+ .section-body {
95
+ padding: 1rem;
96
+ }
97
+
98
+ /* ---- Config badge ---- */
99
+ .config-badge {
100
+ display: inline-block;
101
+ padding: 0.2rem 0.625rem;
102
+ border-radius: 9999px;
103
+ font-family: 'Poppins', sans-serif;
104
+ font-size: 0.6875rem;
105
+ font-weight: 600;
106
+ text-transform: uppercase;
107
+ letter-spacing: 0.03em;
108
+ margin-left: 0.75rem;
109
+ vertical-align: middle;
110
+ }
111
+ .config-badge.config-primary {
112
+ background: rgba(33, 150, 243, 0.12);
113
+ color: #1976d2;
114
+ }
115
+ .config-badge.config-baseline {
116
+ background: rgba(255, 193, 7, 0.15);
117
+ color: #f57f17;
118
+ }
119
+
120
+ /* ---- Prompt ---- */
121
+ .prompt-text {
122
+ white-space: pre-wrap;
123
+ font-size: 0.9375rem;
124
+ line-height: 1.6;
125
+ }
126
+
127
+ /* ---- Outputs ---- */
128
+ .output-file {
129
+ border: 1px solid var(--border);
130
+ border-radius: var(--radius);
131
+ overflow: hidden;
132
+ }
133
+ .output-file + .output-file {
134
+ margin-top: 1rem;
135
+ }
136
+ .output-file-header {
137
+ padding: 0.5rem 0.75rem;
138
+ font-size: 0.8rem;
139
+ font-weight: 600;
140
+ color: var(--text-muted);
141
+ background: var(--bg);
142
+ border-bottom: 1px solid var(--border);
143
+ font-family: 'SF Mono', SFMono-Regular, Consolas, 'Liberation Mono', Menlo, monospace;
144
+ display: flex;
145
+ justify-content: space-between;
146
+ align-items: center;
147
+ }
148
+ .output-file-header .dl-btn {
149
+ font-size: 0.7rem;
150
+ color: var(--accent);
151
+ text-decoration: none;
152
+ cursor: pointer;
153
+ font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', sans-serif;
154
+ font-weight: 500;
155
+ opacity: 0.8;
156
+ }
157
+ .output-file-header .dl-btn:hover {
158
+ opacity: 1;
159
+ text-decoration: underline;
160
+ }
161
+ .output-file-content {
162
+ padding: 0.75rem;
163
+ overflow-x: auto;
164
+ }
165
+ .output-file-content pre {
166
+ font-size: 0.8125rem;
167
+ line-height: 1.5;
168
+ white-space: pre-wrap;
169
+ word-break: break-word;
170
+ font-family: 'SF Mono', SFMono-Regular, Consolas, 'Liberation Mono', Menlo, monospace;
171
+ }
172
+ .output-file-content img {
173
+ max-width: 100%;
174
+ height: auto;
175
+ border-radius: 4px;
176
+ }
177
+ .output-file-content iframe {
178
+ width: 100%;
179
+ height: 600px;
180
+ border: none;
181
+ }
182
+ .output-file-content table {
183
+ border-collapse: collapse;
184
+ font-size: 0.8125rem;
185
+ width: 100%;
186
+ }
187
+ .output-file-content table td,
188
+ .output-file-content table th {
189
+ border: 1px solid var(--border);
190
+ padding: 0.375rem 0.5rem;
191
+ text-align: left;
192
+ }
193
+ .output-file-content table th {
194
+ background: var(--bg);
195
+ font-weight: 600;
196
+ }
197
+ .output-file-content .download-link {
198
+ display: inline-flex;
199
+ align-items: center;
200
+ gap: 0.5rem;
201
+ padding: 0.5rem 1rem;
202
+ background: var(--bg);
203
+ border: 1px solid var(--border);
204
+ border-radius: 4px;
205
+ color: var(--accent);
206
+ text-decoration: none;
207
+ font-size: 0.875rem;
208
+ cursor: pointer;
209
+ }
210
+ .output-file-content .download-link:hover {
211
+ background: var(--border);
212
+ }
213
+ .empty-state {
214
+ color: var(--text-muted);
215
+ font-style: italic;
216
+ padding: 2rem;
217
+ text-align: center;
218
+ }
219
+
220
+ /* ---- Feedback ---- */
221
+ .prev-feedback {
222
+ background: var(--bg);
223
+ border: 1px solid var(--border);
224
+ border-radius: 4px;
225
+ padding: 0.625rem 0.75rem;
226
+ margin-top: 0.75rem;
227
+ font-size: 0.8125rem;
228
+ color: var(--text-muted);
229
+ line-height: 1.5;
230
+ }
231
+ .prev-feedback-label {
232
+ font-size: 0.7rem;
233
+ font-weight: 600;
234
+ text-transform: uppercase;
235
+ letter-spacing: 0.04em;
236
+ margin-bottom: 0.25rem;
237
+ color: var(--text-muted);
238
+ }
239
+ .feedback-textarea {
240
+ width: 100%;
241
+ min-height: 100px;
242
+ padding: 0.75rem;
243
+ border: 1px solid var(--border);
244
+ border-radius: 4px;
245
+ font-family: inherit;
246
+ font-size: 0.9375rem;
247
+ line-height: 1.5;
248
+ resize: vertical;
249
+ color: var(--text);
250
+ }
251
+ .feedback-textarea:focus {
252
+ outline: none;
253
+ border-color: var(--accent);
254
+ box-shadow: 0 0 0 3px rgba(37, 99, 235, 0.1);
255
+ }
256
+ .feedback-status {
257
+ font-size: 0.75rem;
258
+ color: var(--text-muted);
259
+ margin-top: 0.5rem;
260
+ min-height: 1.1em;
261
+ }
262
+
263
+ /* ---- Grades (collapsible) ---- */
264
+ .grades-toggle {
265
+ display: flex;
266
+ align-items: center;
267
+ cursor: pointer;
268
+ user-select: none;
269
+ }
270
+ .grades-toggle:hover {
271
+ color: var(--accent);
272
+ }
273
+ .grades-toggle .arrow {
274
+ margin-right: 0.5rem;
275
+ transition: transform 0.15s;
276
+ font-size: 0.75rem;
277
+ }
278
+ .grades-toggle .arrow.open {
279
+ transform: rotate(90deg);
280
+ }
281
+ .grades-content {
282
+ display: none;
283
+ margin-top: 0.75rem;
284
+ }
285
+ .grades-content.open {
286
+ display: block;
287
+ }
288
+ .grades-summary {
289
+ font-size: 0.875rem;
290
+ margin-bottom: 0.75rem;
291
+ display: flex;
292
+ align-items: center;
293
+ gap: 0.5rem;
294
+ }
295
+ .grade-badge {
296
+ display: inline-block;
297
+ padding: 0.125rem 0.5rem;
298
+ border-radius: 9999px;
299
+ font-size: 0.75rem;
300
+ font-weight: 600;
301
+ }
302
+ .grade-pass { background: var(--green-bg); color: var(--green); }
303
+ .grade-fail { background: var(--red-bg); color: var(--red); }
304
+ .assertion-list {
305
+ list-style: none;
306
+ }
307
+ .assertion-item {
308
+ padding: 0.625rem 0;
309
+ border-bottom: 1px solid var(--border);
310
+ font-size: 0.8125rem;
311
+ }
312
+ .assertion-item:last-child { border-bottom: none; }
313
+ .assertion-status {
314
+ font-weight: 600;
315
+ margin-right: 0.5rem;
316
+ }
317
+ .assertion-status.pass { color: var(--green); }
318
+ .assertion-status.fail { color: var(--red); }
319
+ .assertion-evidence {
320
+ color: var(--text-muted);
321
+ font-size: 0.75rem;
322
+ margin-top: 0.25rem;
323
+ padding-left: 1.5rem;
324
+ }
325
+
326
+ /* ---- View tabs ---- */
327
+ .view-tabs {
328
+ display: flex;
329
+ gap: 0;
330
+ padding: 0 2rem;
331
+ background: var(--bg);
332
+ border-bottom: 1px solid var(--border);
333
+ flex-shrink: 0;
334
+ }
335
+ .view-tab {
336
+ font-family: 'Poppins', sans-serif;
337
+ padding: 0.625rem 1.25rem;
338
+ font-size: 0.8125rem;
339
+ font-weight: 500;
340
+ cursor: pointer;
341
+ border: none;
342
+ background: none;
343
+ color: var(--text-muted);
344
+ border-bottom: 2px solid transparent;
345
+ transition: all 0.15s;
346
+ }
347
+ .view-tab:hover { color: var(--text); }
348
+ .view-tab.active {
349
+ color: var(--accent);
350
+ border-bottom-color: var(--accent);
351
+ }
352
+ .view-panel { display: none; }
353
+ .view-panel.active { display: flex; flex-direction: column; flex: 1; overflow: hidden; }
354
+
355
+ /* ---- Benchmark view ---- */
356
+ .benchmark-view {
357
+ padding: 1.5rem 2rem;
358
+ overflow-y: auto;
359
+ flex: 1;
360
+ }
361
+ .benchmark-table {
362
+ border-collapse: collapse;
363
+ background: var(--surface);
364
+ border: 1px solid var(--border);
365
+ border-radius: var(--radius);
366
+ font-size: 0.8125rem;
367
+ width: 100%;
368
+ margin-bottom: 1.5rem;
369
+ }
370
+ .benchmark-table th, .benchmark-table td {
371
+ padding: 0.625rem 0.75rem;
372
+ text-align: left;
373
+ border: 1px solid var(--border);
374
+ }
375
+ .benchmark-table th {
376
+ font-family: 'Poppins', sans-serif;
377
+ background: var(--header-bg);
378
+ color: var(--header-text);
379
+ font-weight: 500;
380
+ font-size: 0.75rem;
381
+ text-transform: uppercase;
382
+ letter-spacing: 0.04em;
383
+ }
384
+ .benchmark-table tr:hover { background: var(--bg); }
385
+ .benchmark-table tr.benchmark-row-with { background: rgba(33, 150, 243, 0.06); }
386
+ .benchmark-table tr.benchmark-row-without { background: rgba(255, 193, 7, 0.06); }
387
+ .benchmark-table tr.benchmark-row-with:hover { background: rgba(33, 150, 243, 0.12); }
388
+ .benchmark-table tr.benchmark-row-without:hover { background: rgba(255, 193, 7, 0.12); }
389
+ .benchmark-table tr.benchmark-row-avg { font-weight: 600; border-top: 2px solid var(--border); }
390
+ .benchmark-table tr.benchmark-row-avg.benchmark-row-with { background: rgba(33, 150, 243, 0.12); }
391
+ .benchmark-table tr.benchmark-row-avg.benchmark-row-without { background: rgba(255, 193, 7, 0.12); }
392
+ .benchmark-delta-positive { color: var(--green); font-weight: 600; }
393
+ .benchmark-delta-negative { color: var(--red); font-weight: 600; }
394
+ .benchmark-notes {
395
+ background: var(--surface);
396
+ border: 1px solid var(--border);
397
+ border-radius: var(--radius);
398
+ padding: 1rem;
399
+ }
400
+ .benchmark-notes h3 {
401
+ font-family: 'Poppins', sans-serif;
402
+ font-size: 0.875rem;
403
+ margin-bottom: 0.75rem;
404
+ }
405
+ .benchmark-notes ul {
406
+ list-style: disc;
407
+ padding-left: 1.25rem;
408
+ }
409
+ .benchmark-notes li {
410
+ font-size: 0.8125rem;
411
+ line-height: 1.6;
412
+ margin-bottom: 0.375rem;
413
+ }
414
+ .benchmark-empty {
415
+ color: var(--text-muted);
416
+ font-style: italic;
417
+ text-align: center;
418
+ padding: 3rem;
419
+ }
420
+
421
+ /* ---- Navigation ---- */
422
+ .nav {
423
+ display: flex;
424
+ justify-content: space-between;
425
+ align-items: center;
426
+ padding: 1rem 2rem;
427
+ border-top: 1px solid var(--border);
428
+ background: var(--surface);
429
+ flex-shrink: 0;
430
+ }
431
+ .nav-btn {
432
+ font-family: 'Poppins', sans-serif;
433
+ padding: 0.5rem 1.25rem;
434
+ border: 1px solid var(--border);
435
+ border-radius: var(--radius);
436
+ background: var(--surface);
437
+ cursor: pointer;
438
+ font-size: 0.875rem;
439
+ font-weight: 500;
440
+ color: var(--text);
441
+ transition: all 0.15s;
442
+ }
443
+ .nav-btn:hover:not(:disabled) {
444
+ background: var(--bg);
445
+ border-color: var(--text-muted);
446
+ }
447
+ .nav-btn:disabled {
448
+ opacity: 0.4;
449
+ cursor: not-allowed;
450
+ }
451
+ .done-btn {
452
+ font-family: 'Poppins', sans-serif;
453
+ padding: 0.5rem 1.5rem;
454
+ border: 1px solid var(--border);
455
+ border-radius: var(--radius);
456
+ background: var(--surface);
457
+ color: var(--text);
458
+ cursor: pointer;
459
+ font-size: 0.875rem;
460
+ font-weight: 500;
461
+ transition: all 0.15s;
462
+ }
463
+ .done-btn:hover {
464
+ background: var(--bg);
465
+ border-color: var(--text-muted);
466
+ }
467
+ .done-btn.ready {
468
+ border: none;
469
+ background: var(--accent);
470
+ color: white;
471
+ font-weight: 600;
472
+ }
473
+ .done-btn.ready:hover {
474
+ background: var(--accent-hover);
475
+ }
476
+ /* ---- Done overlay ---- */
477
+ .done-overlay {
478
+ display: none;
479
+ position: fixed;
480
+ inset: 0;
481
+ background: rgba(0, 0, 0, 0.5);
482
+ z-index: 100;
483
+ justify-content: center;
484
+ align-items: center;
485
+ }
486
+ .done-overlay.visible {
487
+ display: flex;
488
+ }
489
+ .done-card {
490
+ background: var(--surface);
491
+ border-radius: 12px;
492
+ padding: 2rem 3rem;
493
+ text-align: center;
494
+ box-shadow: 0 20px 60px rgba(0, 0, 0, 0.3);
495
+ max-width: 500px;
496
+ }
497
+ .done-card h2 {
498
+ font-size: 1.5rem;
499
+ margin-bottom: 0.5rem;
500
+ }
501
+ .done-card p {
502
+ color: var(--text-muted);
503
+ margin-bottom: 1.5rem;
504
+ line-height: 1.5;
505
+ }
506
+ .done-card .btn-row {
507
+ display: flex;
508
+ gap: 0.5rem;
509
+ justify-content: center;
510
+ }
511
+ .done-card button {
512
+ padding: 0.5rem 1.25rem;
513
+ border: 1px solid var(--border);
514
+ border-radius: var(--radius);
515
+ background: var(--surface);
516
+ cursor: pointer;
517
+ font-size: 0.875rem;
518
+ }
519
+ .done-card button:hover {
520
+ background: var(--bg);
521
+ }
522
+ /* ---- Toast ---- */
523
+ .toast {
524
+ position: fixed;
525
+ bottom: 5rem;
526
+ left: 50%;
527
+ transform: translateX(-50%);
528
+ background: var(--header-bg);
529
+ color: var(--header-text);
530
+ padding: 0.625rem 1.25rem;
531
+ border-radius: var(--radius);
532
+ font-size: 0.875rem;
533
+ opacity: 0;
534
+ transition: opacity 0.3s;
535
+ pointer-events: none;
536
+ z-index: 200;
537
+ }
538
+ .toast.visible {
539
+ opacity: 1;
540
+ }
541
+ </style>
542
+ </head>
543
+ <body>
544
+ <div id="app" style="height:100vh; display:flex; flex-direction:column;">
545
+ <div class="header">
546
+ <div>
547
+ <h1>Eval Review: <span id="skill-name"></span></h1>
548
+ <div class="instructions">Review each output and leave feedback below. Navigate with arrow keys or buttons. When done, copy feedback and paste into Claude Code.</div>
549
+ </div>
550
+ <div class="progress" id="progress"></div>
551
+ </div>
552
+
553
+ <!-- View tabs (only shown when benchmark data exists) -->
554
+ <div class="view-tabs" id="view-tabs" style="display:none;">
555
+ <button class="view-tab active" onclick="switchView('outputs')">Outputs</button>
556
+ <button class="view-tab" onclick="switchView('benchmark')">Benchmark</button>
557
+ </div>
558
+
559
+ <!-- Outputs panel (qualitative review) -->
560
+ <div class="view-panel active" id="panel-outputs">
561
+ <div class="main">
562
+ <!-- Prompt -->
563
+ <div class="section">
564
+ <div class="section-header">Prompt <span class="config-badge" id="config-badge" style="display:none;"></span></div>
565
+ <div class="section-body">
566
+ <div class="prompt-text" id="prompt-text"></div>
567
+ </div>
568
+ </div>
569
+
570
+ <!-- Outputs -->
571
+ <div class="section">
572
+ <div class="section-header">Output</div>
573
+ <div class="section-body" id="outputs-body">
574
+ <div class="empty-state">No output files found</div>
575
+ </div>
576
+ </div>
577
+
578
+ <!-- Previous Output (collapsible) -->
579
+ <div class="section" id="prev-outputs-section" style="display:none;">
580
+ <div class="section-header">
581
+ <div class="grades-toggle" onclick="togglePrevOutputs()">
582
+ <span class="arrow" id="prev-outputs-arrow">&#9654;</span>
583
+ Previous Output
584
+ </div>
585
+ </div>
586
+ <div class="grades-content" id="prev-outputs-content"></div>
587
+ </div>
588
+
589
+ <!-- Grades (collapsible) -->
590
+ <div class="section" id="grades-section" style="display:none;">
591
+ <div class="section-header">
592
+ <div class="grades-toggle" onclick="toggleGrades()">
593
+ <span class="arrow" id="grades-arrow">&#9654;</span>
594
+ Formal Grades
595
+ </div>
596
+ </div>
597
+ <div class="grades-content" id="grades-content"></div>
598
+ </div>
599
+
600
+ <!-- Feedback -->
601
+ <div class="section">
602
+ <div class="section-header">Your Feedback</div>
603
+ <div class="section-body">
604
+ <textarea
605
+ class="feedback-textarea"
606
+ id="feedback"
607
+ placeholder="What do you think of this output? Any issues, suggestions, or things that look great?"
608
+ ></textarea>
609
+ <div class="feedback-status" id="feedback-status"></div>
610
+ <div class="prev-feedback" id="prev-feedback" style="display:none;">
611
+ <div class="prev-feedback-label">Previous feedback</div>
612
+ <div id="prev-feedback-text"></div>
613
+ </div>
614
+ </div>
615
+ </div>
616
+ </div>
617
+
618
+ <div class="nav" id="outputs-nav">
619
+ <button class="nav-btn" id="prev-btn" onclick="navigate(-1)">&#8592; Previous</button>
620
+ <button class="done-btn" id="done-btn" onclick="showDoneDialog()">Submit All Reviews</button>
621
+ <button class="nav-btn" id="next-btn" onclick="navigate(1)">Next &#8594;</button>
622
+ </div>
623
+ </div><!-- end panel-outputs -->
624
+
625
+ <!-- Benchmark panel (quantitative stats) -->
626
+ <div class="view-panel" id="panel-benchmark">
627
+ <div class="benchmark-view" id="benchmark-content">
628
+ <div class="benchmark-empty">No benchmark data available. Run a benchmark to see quantitative results here.</div>
629
+ </div>
630
+ </div>
631
+ </div>
632
+
633
+ <!-- Done overlay -->
634
+ <div class="done-overlay" id="done-overlay">
635
+ <div class="done-card">
636
+ <h2>Review Complete</h2>
637
+ <p>Your feedback has been saved. Go back to your Claude Code session and tell Claude you're done reviewing.</p>
638
+ <div class="btn-row">
639
+ <button onclick="closeDoneDialog()">OK</button>
640
+ </div>
641
+ </div>
642
+ </div>
643
+
644
+ <!-- Toast -->
645
+ <div class="toast" id="toast"></div>
646
+
647
+ <script>
648
+ // ---- Embedded data (injected by generate_review.py) ----
649
+ /*__EMBEDDED_DATA__*/
650
+
651
+ // ---- State ----
652
+ let feedbackMap = {}; // run_id -> feedback text
653
+ let currentIndex = 0;
654
+ let visitedRuns = new Set();
655
+
656
+ // ---- Init ----
657
+ async function init() {
658
+ // Load saved feedback from server — but only if this isn't a fresh
659
+ // iteration (indicated by previous_feedback being present). When
660
+ // previous feedback exists, the feedback.json on disk is stale from
661
+ // the prior iteration and should not pre-fill the textareas.
662
+ const hasPrevious = Object.keys(EMBEDDED_DATA.previous_feedback || {}).length > 0
663
+ || Object.keys(EMBEDDED_DATA.previous_outputs || {}).length > 0;
664
+ if (!hasPrevious) {
665
+ try {
666
+ const resp = await fetch("/api/feedback");
667
+ const data = await resp.json();
668
+ if (data.reviews) {
669
+ for (const r of data.reviews) feedbackMap[r.run_id] = r.feedback;
670
+ }
671
+ } catch { /* first run, no feedback yet */ }
672
+ }
673
+
674
+ document.getElementById("skill-name").textContent = EMBEDDED_DATA.skill_name;
675
+ showRun(0);
676
+
677
+ // Wire up feedback auto-save
678
+ const textarea = document.getElementById("feedback");
679
+ let saveTimeout = null;
680
+ textarea.addEventListener("input", () => {
681
+ clearTimeout(saveTimeout);
682
+ document.getElementById("feedback-status").textContent = "";
683
+ saveTimeout = setTimeout(() => saveCurrentFeedback(), 800);
684
+ });
685
+ }
686
+
687
+ // ---- Navigation ----
688
+ function navigate(delta) {
689
+ const newIndex = currentIndex + delta;
690
+ if (newIndex >= 0 && newIndex < EMBEDDED_DATA.runs.length) {
691
+ saveCurrentFeedback();
692
+ showRun(newIndex);
693
+ }
694
+ }
695
+
696
+ function updateNavButtons() {
697
+ document.getElementById("prev-btn").disabled = currentIndex === 0;
698
+ document.getElementById("next-btn").disabled =
699
+ currentIndex === EMBEDDED_DATA.runs.length - 1;
700
+ }
701
+
702
+ // ---- Show a run ----
703
+ function showRun(index) {
704
+ currentIndex = index;
705
+ const run = EMBEDDED_DATA.runs[index];
706
+
707
+ // Progress
708
+ document.getElementById("progress").textContent =
709
+ `${index + 1} of ${EMBEDDED_DATA.runs.length}`;
710
+
711
+ // Prompt
712
+ document.getElementById("prompt-text").textContent = run.prompt;
713
+
714
+ // Config badge
715
+ const badge = document.getElementById("config-badge");
716
+ const configMatch = run.id.match(/(with_skill|without_skill|new_skill|old_skill)/);
717
+ if (configMatch) {
718
+ const config = configMatch[1];
719
+ const isBaseline = config === "without_skill" || config === "old_skill";
720
+ badge.textContent = config.replace(/_/g, " ");
721
+ badge.className = "config-badge " + (isBaseline ? "config-baseline" : "config-primary");
722
+ badge.style.display = "inline-block";
723
+ } else {
724
+ badge.style.display = "none";
725
+ }
726
+
727
+ // Outputs
728
+ renderOutputs(run);
729
+
730
+ // Previous outputs
731
+ renderPrevOutputs(run);
732
+
733
+ // Grades
734
+ renderGrades(run);
735
+
736
+ // Previous feedback
737
+ const prevFb = (EMBEDDED_DATA.previous_feedback || {})[run.id];
738
+ const prevEl = document.getElementById("prev-feedback");
739
+ if (prevFb) {
740
+ document.getElementById("prev-feedback-text").textContent = prevFb;
741
+ prevEl.style.display = "block";
742
+ } else {
743
+ prevEl.style.display = "none";
744
+ }
745
+
746
+ // Feedback
747
+ document.getElementById("feedback").value = feedbackMap[run.id] || "";
748
+ document.getElementById("feedback-status").textContent = "";
749
+
750
+ updateNavButtons();
751
+
752
+ // Track visited runs and promote done button when all visited
753
+ visitedRuns.add(index);
754
+ const doneBtn = document.getElementById("done-btn");
755
+ if (visitedRuns.size >= EMBEDDED_DATA.runs.length) {
756
+ doneBtn.classList.add("ready");
757
+ }
758
+
759
+ // Scroll main content to top
760
+ document.querySelector(".main").scrollTop = 0;
761
+ }
762
+
763
+ // ---- Render outputs ----
764
+ function renderOutputs(run) {
765
+ const container = document.getElementById("outputs-body");
766
+ container.innerHTML = "";
767
+
768
+ const outputs = run.outputs || [];
769
+ if (outputs.length === 0) {
770
+ container.innerHTML = '<div class="empty-state">No output files</div>';
771
+ return;
772
+ }
773
+
774
+ for (const file of outputs) {
775
+ const fileDiv = document.createElement("div");
776
+ fileDiv.className = "output-file";
777
+
778
+ // Always show file header with download link
779
+ const header = document.createElement("div");
780
+ header.className = "output-file-header";
781
+ const nameSpan = document.createElement("span");
782
+ nameSpan.textContent = file.name;
783
+ header.appendChild(nameSpan);
784
+ const dlBtn = document.createElement("a");
785
+ dlBtn.className = "dl-btn";
786
+ dlBtn.textContent = "Download";
787
+ dlBtn.download = file.name;
788
+ dlBtn.href = getDownloadUri(file);
789
+ header.appendChild(dlBtn);
790
+ fileDiv.appendChild(header);
791
+
792
+ const content = document.createElement("div");
793
+ content.className = "output-file-content";
794
+
795
+ if (file.type === "text") {
796
+ const pre = document.createElement("pre");
797
+ pre.textContent = file.content;
798
+ content.appendChild(pre);
799
+ } else if (file.type === "image") {
800
+ const img = document.createElement("img");
801
+ img.src = file.data_uri;
802
+ img.alt = file.name;
803
+ content.appendChild(img);
804
+ } else if (file.type === "pdf") {
805
+ const iframe = document.createElement("iframe");
806
+ iframe.src = file.data_uri;
807
+ content.appendChild(iframe);
808
+ } else if (file.type === "xlsx") {
809
+ renderXlsx(content, file.data_b64);
810
+ } else if (file.type === "binary") {
811
+ const a = document.createElement("a");
812
+ a.className = "download-link";
813
+ a.href = file.data_uri;
814
+ a.download = file.name;
815
+ a.textContent = "Download " + file.name;
816
+ content.appendChild(a);
817
+ } else if (file.type === "error") {
818
+ const pre = document.createElement("pre");
819
+ pre.textContent = file.content;
820
+ pre.style.color = "var(--red)";
821
+ content.appendChild(pre);
822
+ }
823
+
824
+ fileDiv.appendChild(content);
825
+ container.appendChild(fileDiv);
826
+ }
827
+ }
828
+
829
+ // ---- XLSX rendering via SheetJS ----
830
+ function renderXlsx(container, b64Data) {
831
+ try {
832
+ const raw = Uint8Array.from(atob(b64Data), c => c.charCodeAt(0));
833
+ const wb = XLSX.read(raw, { type: "array" });
834
+
835
+ for (let i = 0; i < wb.SheetNames.length; i++) {
836
+ const sheetName = wb.SheetNames[i];
837
+ const ws = wb.Sheets[sheetName];
838
+
839
+ if (wb.SheetNames.length > 1) {
840
+ const sheetLabel = document.createElement("div");
841
+ sheetLabel.style.cssText =
842
+ "font-weight:600; font-size:0.8rem; color:#b0aea5; margin-top:0.5rem; margin-bottom:0.25rem;";
843
+ sheetLabel.textContent = "Sheet: " + sheetName;
844
+ container.appendChild(sheetLabel);
845
+ }
846
+
847
+ const htmlStr = XLSX.utils.sheet_to_html(ws, { editable: false });
848
+ const wrapper = document.createElement("div");
849
+ wrapper.innerHTML = htmlStr;
850
+ container.appendChild(wrapper);
851
+ }
852
+ } catch (err) {
853
+ container.textContent = "Error rendering spreadsheet: " + err.message;
854
+ }
855
+ }
856
+
857
+ // ---- Grades ----
858
+ function renderGrades(run) {
859
+ const section = document.getElementById("grades-section");
860
+ const content = document.getElementById("grades-content");
861
+
862
+ if (!run.grading) {
863
+ section.style.display = "none";
864
+ return;
865
+ }
866
+
867
+ const grading = run.grading;
868
+ section.style.display = "block";
869
+ // Reset to collapsed
870
+ content.classList.remove("open");
871
+ document.getElementById("grades-arrow").classList.remove("open");
872
+
873
+ const summary = grading.summary || {};
874
+ const expectations = grading.expectations || [];
875
+
876
+ let html = '<div style="padding: 1rem;">';
877
+
878
+ // Summary line
879
+ const passRate = summary.pass_rate != null
880
+ ? Math.round(summary.pass_rate * 100) + "%"
881
+ : "?";
882
+ const badgeClass = summary.pass_rate >= 0.8 ? "grade-pass" : summary.pass_rate >= 0.5 ? "" : "grade-fail";
883
+ html += '<div class="grades-summary">';
884
+ html += '<span class="grade-badge ' + badgeClass + '">' + passRate + '</span>';
885
+ html += '<span>' + (summary.passed || 0) + ' passed, ' + (summary.failed || 0) + ' failed of ' + (summary.total || 0) + '</span>';
886
+ html += '</div>';
887
+
888
+ // Assertions list
889
+ html += '<ul class="assertion-list">';
890
+ for (const exp of expectations) {
891
+ const statusClass = exp.passed ? "pass" : "fail";
892
+ const statusIcon = exp.passed ? "\u2713" : "\u2717";
893
+ html += '<li class="assertion-item">';
894
+ html += '<span class="assertion-status ' + statusClass + '">' + statusIcon + '</span>';
895
+ html += '<span>' + escapeHtml(exp.text) + '</span>';
896
+ if (exp.evidence) {
897
+ html += '<div class="assertion-evidence">' + escapeHtml(exp.evidence) + '</div>';
898
+ }
899
+ html += '</li>';
900
+ }
901
+ html += '</ul>';
902
+
903
+ html += '</div>';
904
+ content.innerHTML = html;
905
+ }
906
+
907
+ function toggleGrades() {
908
+ const content = document.getElementById("grades-content");
909
+ const arrow = document.getElementById("grades-arrow");
910
+ content.classList.toggle("open");
911
+ arrow.classList.toggle("open");
912
+ }
913
+
914
+ // ---- Previous outputs (collapsible) ----
915
+ function renderPrevOutputs(run) {
916
+ const section = document.getElementById("prev-outputs-section");
917
+ const content = document.getElementById("prev-outputs-content");
918
+ const prevOutputs = (EMBEDDED_DATA.previous_outputs || {})[run.id];
919
+
920
+ if (!prevOutputs || prevOutputs.length === 0) {
921
+ section.style.display = "none";
922
+ return;
923
+ }
924
+
925
+ section.style.display = "block";
926
+ // Reset to collapsed
927
+ content.classList.remove("open");
928
+ document.getElementById("prev-outputs-arrow").classList.remove("open");
929
+
930
+ // Render the files into the content area
931
+ content.innerHTML = "";
932
+ const wrapper = document.createElement("div");
933
+ wrapper.style.padding = "1rem";
934
+
935
+ for (const file of prevOutputs) {
936
+ const fileDiv = document.createElement("div");
937
+ fileDiv.className = "output-file";
938
+
939
+ const header = document.createElement("div");
940
+ header.className = "output-file-header";
941
+ const nameSpan = document.createElement("span");
942
+ nameSpan.textContent = file.name;
943
+ header.appendChild(nameSpan);
944
+ const dlBtn = document.createElement("a");
945
+ dlBtn.className = "dl-btn";
946
+ dlBtn.textContent = "Download";
947
+ dlBtn.download = file.name;
948
+ dlBtn.href = getDownloadUri(file);
949
+ header.appendChild(dlBtn);
950
+ fileDiv.appendChild(header);
951
+
952
+ const fc = document.createElement("div");
953
+ fc.className = "output-file-content";
954
+
955
+ if (file.type === "text") {
956
+ const pre = document.createElement("pre");
957
+ pre.textContent = file.content;
958
+ fc.appendChild(pre);
959
+ } else if (file.type === "image") {
960
+ const img = document.createElement("img");
961
+ img.src = file.data_uri;
962
+ img.alt = file.name;
963
+ fc.appendChild(img);
964
+ } else if (file.type === "pdf") {
965
+ const iframe = document.createElement("iframe");
966
+ iframe.src = file.data_uri;
967
+ fc.appendChild(iframe);
968
+ } else if (file.type === "xlsx") {
969
+ renderXlsx(fc, file.data_b64);
970
+ } else if (file.type === "binary") {
971
+ const a = document.createElement("a");
972
+ a.className = "download-link";
973
+ a.href = file.data_uri;
974
+ a.download = file.name;
975
+ a.textContent = "Download " + file.name;
976
+ fc.appendChild(a);
977
+ }
978
+
979
+ fileDiv.appendChild(fc);
980
+ wrapper.appendChild(fileDiv);
981
+ }
982
+
983
+ content.appendChild(wrapper);
984
+ }
985
+
986
+ function togglePrevOutputs() {
987
+ const content = document.getElementById("prev-outputs-content");
988
+ const arrow = document.getElementById("prev-outputs-arrow");
989
+ content.classList.toggle("open");
990
+ arrow.classList.toggle("open");
991
+ }
992
+
993
+ // ---- Feedback (saved to server -> feedback.json) ----
994
+ function saveCurrentFeedback() {
995
+ const run = EMBEDDED_DATA.runs[currentIndex];
996
+ const text = document.getElementById("feedback").value;
997
+
998
+ if (text.trim() === "") {
999
+ delete feedbackMap[run.id];
1000
+ } else {
1001
+ feedbackMap[run.id] = text;
1002
+ }
1003
+
1004
+ // Build reviews array from map
1005
+ const reviews = [];
1006
+ for (const [run_id, feedback] of Object.entries(feedbackMap)) {
1007
+ if (feedback.trim()) {
1008
+ reviews.push({ run_id, feedback, timestamp: new Date().toISOString() });
1009
+ }
1010
+ }
1011
+
1012
+ fetch("/api/feedback", {
1013
+ method: "POST",
1014
+ headers: { "Content-Type": "application/json" },
1015
+ body: JSON.stringify({ reviews, status: "in_progress" }),
1016
+ }).then(() => {
1017
+ document.getElementById("feedback-status").textContent = "Saved";
1018
+ }).catch(() => {
1019
+ // Static mode or server unavailable — no-op on auto-save,
1020
+ // feedback will be downloaded on final submit
1021
+ document.getElementById("feedback-status").textContent = "Will download on submit";
1022
+ });
1023
+ }
1024
+
1025
+ // ---- Done ----
1026
+ function showDoneDialog() {
1027
+ // Save current textarea to feedbackMap (but don't POST yet)
1028
+ const run = EMBEDDED_DATA.runs[currentIndex];
1029
+ const text = document.getElementById("feedback").value;
1030
+ if (text.trim() === "") {
1031
+ delete feedbackMap[run.id];
1032
+ } else {
1033
+ feedbackMap[run.id] = text;
1034
+ }
1035
+
1036
+ // POST once with status: complete — include ALL runs so the model
1037
+ // can distinguish "no feedback" (looks good) from "not reviewed"
1038
+ const reviews = [];
1039
+ const ts = new Date().toISOString();
1040
+ for (const r of EMBEDDED_DATA.runs) {
1041
+ reviews.push({ run_id: r.id, feedback: feedbackMap[r.id] || "", timestamp: ts });
1042
+ }
1043
+ const payload = JSON.stringify({ reviews, status: "complete" }, null, 2);
1044
+ fetch("/api/feedback", {
1045
+ method: "POST",
1046
+ headers: { "Content-Type": "application/json" },
1047
+ body: payload,
1048
+ }).then(() => {
1049
+ document.getElementById("done-overlay").classList.add("visible");
1050
+ }).catch(() => {
1051
+ // Server not available (static mode) — download as file
1052
+ const blob = new Blob([payload], { type: "application/json" });
1053
+ const url = URL.createObjectURL(blob);
1054
+ const a = document.createElement("a");
1055
+ a.href = url;
1056
+ a.download = "feedback.json";
1057
+ a.click();
1058
+ URL.revokeObjectURL(url);
1059
+ document.getElementById("done-overlay").classList.add("visible");
1060
+ });
1061
+ }
1062
+
1063
+ function closeDoneDialog() {
1064
+ // Reset status back to in_progress
1065
+ saveCurrentFeedback();
1066
+ document.getElementById("done-overlay").classList.remove("visible");
1067
+ }
1068
+
1069
+ // ---- Toast ----
1070
+ function showToast(message) {
1071
+ const toast = document.getElementById("toast");
1072
+ toast.textContent = message;
1073
+ toast.classList.add("visible");
1074
+ setTimeout(() => toast.classList.remove("visible"), 2000);
1075
+ }
1076
+
1077
+ // ---- Keyboard nav ----
1078
+ document.addEventListener("keydown", (e) => {
1079
+ // Don't capture when typing in textarea
1080
+ if (e.target.tagName === "TEXTAREA") return;
1081
+
1082
+ if (e.key === "ArrowLeft" || e.key === "ArrowUp") {
1083
+ e.preventDefault();
1084
+ navigate(-1);
1085
+ } else if (e.key === "ArrowRight" || e.key === "ArrowDown") {
1086
+ e.preventDefault();
1087
+ navigate(1);
1088
+ }
1089
+ });
1090
+
1091
+ // ---- Util ----
1092
+ function getDownloadUri(file) {
1093
+ if (file.data_uri) return file.data_uri;
1094
+ if (file.data_b64) return "data:application/octet-stream;base64," + file.data_b64;
1095
+ if (file.type === "text") return "data:text/plain;charset=utf-8," + encodeURIComponent(file.content);
1096
+ return "#";
1097
+ }
1098
+
1099
+ function escapeHtml(text) {
1100
+ const div = document.createElement("div");
1101
+ div.textContent = text;
1102
+ return div.innerHTML;
1103
+ }
1104
+
1105
+ // ---- View switching ----
1106
+ function switchView(view) {
1107
+ document.querySelectorAll(".view-tab").forEach(t => t.classList.remove("active"));
1108
+ document.querySelectorAll(".view-panel").forEach(p => p.classList.remove("active"));
1109
+ document.querySelector(`[onclick="switchView('${view}')"]`).classList.add("active");
1110
+ document.getElementById("panel-" + view).classList.add("active");
1111
+ }
1112
+
1113
+ // ---- Benchmark rendering ----
1114
+ function renderBenchmark() {
1115
+ const data = EMBEDDED_DATA.benchmark;
1116
+ if (!data) return;
1117
+
1118
+ // Show the tabs
1119
+ document.getElementById("view-tabs").style.display = "flex";
1120
+
1121
+ const container = document.getElementById("benchmark-content");
1122
+ const summary = data.run_summary || {};
1123
+ const metadata = data.metadata || {};
1124
+ const notes = data.notes || [];
1125
+
1126
+ let html = "";
1127
+
1128
+ // Header
1129
+ html += "<h2 style='font-family: Poppins, sans-serif; margin-bottom: 0.5rem;'>Benchmark Results</h2>";
1130
+ html += "<p style='color: var(--text-muted); font-size: 0.875rem; margin-bottom: 1.25rem;'>";
1131
+ if (metadata.skill_name) html += "<strong>" + escapeHtml(metadata.skill_name) + "</strong> &mdash; ";
1132
+ if (metadata.timestamp) html += metadata.timestamp + " &mdash; ";
1133
+ if (metadata.evals_run) html += "Evals: " + metadata.evals_run.join(", ") + " &mdash; ";
1134
+ html += (metadata.runs_per_configuration || "?") + " runs per configuration";
1135
+ html += "</p>";
1136
+
1137
+ // Summary table
1138
+ html += '<table class="benchmark-table">';
1139
+
1140
+ function fmtStat(stat, pct) {
1141
+ if (!stat) return "—";
1142
+ const suffix = pct ? "%" : "";
1143
+ const m = pct ? (stat.mean * 100).toFixed(0) : stat.mean.toFixed(1);
1144
+ const s = pct ? (stat.stddev * 100).toFixed(0) : stat.stddev.toFixed(1);
1145
+ return m + suffix + " ± " + s + suffix;
1146
+ }
1147
+
1148
+ function deltaClass(val) {
1149
+ if (!val) return "";
1150
+ const n = parseFloat(val);
1151
+ if (n > 0) return "benchmark-delta-positive";
1152
+ if (n < 0) return "benchmark-delta-negative";
1153
+ return "";
1154
+ }
1155
+
1156
+ // Discover config names dynamically (everything except "delta")
1157
+ const configs = Object.keys(summary).filter(k => k !== "delta");
1158
+ const configA = configs[0] || "config_a";
1159
+ const configB = configs[1] || "config_b";
1160
+ const labelA = configA.replace(/_/g, " ").replace(/\b\w/g, c => c.toUpperCase());
1161
+ const labelB = configB.replace(/_/g, " ").replace(/\b\w/g, c => c.toUpperCase());
1162
+ const a = summary[configA] || {};
1163
+ const b = summary[configB] || {};
1164
+ const delta = summary.delta || {};
1165
+
1166
+ html += "<thead><tr><th>Metric</th><th>" + escapeHtml(labelA) + "</th><th>" + escapeHtml(labelB) + "</th><th>Delta</th></tr></thead>";
1167
+ html += "<tbody>";
1168
+
1169
+ html += "<tr><td><strong>Pass Rate</strong></td>";
1170
+ html += "<td>" + fmtStat(a.pass_rate, true) + "</td>";
1171
+ html += "<td>" + fmtStat(b.pass_rate, true) + "</td>";
1172
+ html += '<td class="' + deltaClass(delta.pass_rate) + '">' + (delta.pass_rate || "—") + "</td></tr>";
1173
+
1174
+ // Time (only show row if data exists)
1175
+ if (a.time_seconds || b.time_seconds) {
1176
+ html += "<tr><td><strong>Time (s)</strong></td>";
1177
+ html += "<td>" + fmtStat(a.time_seconds, false) + "</td>";
1178
+ html += "<td>" + fmtStat(b.time_seconds, false) + "</td>";
1179
+ html += '<td class="' + deltaClass(delta.time_seconds) + '">' + (delta.time_seconds ? delta.time_seconds + "s" : "—") + "</td></tr>";
1180
+ }
1181
+
1182
+ // Tokens (only show row if data exists)
1183
+ if (a.tokens || b.tokens) {
1184
+ html += "<tr><td><strong>Tokens</strong></td>";
1185
+ html += "<td>" + fmtStat(a.tokens, false) + "</td>";
1186
+ html += "<td>" + fmtStat(b.tokens, false) + "</td>";
1187
+ html += '<td class="' + deltaClass(delta.tokens) + '">' + (delta.tokens || "—") + "</td></tr>";
1188
+ }
1189
+
1190
+ html += "</tbody></table>";
1191
+
1192
+ // Per-eval breakdown (if runs data available)
1193
+ const runs = data.runs || [];
1194
+ if (runs.length > 0) {
1195
+ const evalIds = [...new Set(runs.map(r => r.eval_id))].sort((a, b) => a - b);
1196
+
1197
+ html += "<h3 style='font-family: Poppins, sans-serif; margin-bottom: 0.75rem;'>Per-Eval Breakdown</h3>";
1198
+
1199
+ const hasTime = runs.some(r => r.result && r.result.time_seconds != null);
1200
+ const hasErrors = runs.some(r => r.result && r.result.errors > 0);
1201
+
1202
+ for (const evalId of evalIds) {
1203
+ const evalRuns = runs.filter(r => r.eval_id === evalId);
1204
+ const evalName = evalRuns[0] && evalRuns[0].eval_name ? evalRuns[0].eval_name : "Eval " + evalId;
1205
+
1206
+ html += "<h4 style='font-family: Poppins, sans-serif; margin: 1rem 0 0.5rem; color: var(--text);'>" + escapeHtml(evalName) + "</h4>";
1207
+ html += '<table class="benchmark-table">';
1208
+ html += "<thead><tr><th>Config</th><th>Run</th><th>Pass Rate</th>";
1209
+ if (hasTime) html += "<th>Time (s)</th>";
1210
+ if (hasErrors) html += "<th>Crashes During Execution</th>";
1211
+ html += "</tr></thead>";
1212
+ html += "<tbody>";
1213
+
1214
+ // Group by config and render with average rows
1215
+ const configGroups = [...new Set(evalRuns.map(r => r.configuration))];
1216
+ for (let ci = 0; ci < configGroups.length; ci++) {
1217
+ const config = configGroups[ci];
1218
+ const configRuns = evalRuns.filter(r => r.configuration === config);
1219
+ if (configRuns.length === 0) continue;
1220
+
1221
+ const rowClass = ci === 0 ? "benchmark-row-with" : "benchmark-row-without";
1222
+ const configLabel = config.replace(/_/g, " ").replace(/\b\w/g, c => c.toUpperCase());
1223
+
1224
+ for (const run of configRuns) {
1225
+ const r = run.result || {};
1226
+ const prClass = r.pass_rate >= 0.8 ? "benchmark-delta-positive" : r.pass_rate < 0.5 ? "benchmark-delta-negative" : "";
1227
+ html += '<tr class="' + rowClass + '">';
1228
+ html += "<td>" + configLabel + "</td>";
1229
+ html += "<td>" + run.run_number + "</td>";
1230
+ html += '<td class="' + prClass + '">' + ((r.pass_rate || 0) * 100).toFixed(0) + "% (" + (r.passed || 0) + "/" + (r.total || 0) + ")</td>";
1231
+ if (hasTime) html += "<td>" + (r.time_seconds != null ? r.time_seconds.toFixed(1) : "—") + "</td>";
1232
+ if (hasErrors) html += "<td>" + (r.errors || 0) + "</td>";
1233
+ html += "</tr>";
1234
+ }
1235
+
1236
+ // Average row
1237
+ const rates = configRuns.map(r => (r.result || {}).pass_rate || 0);
1238
+ const avgRate = rates.reduce((a, b) => a + b, 0) / rates.length;
1239
+ const avgPrClass = avgRate >= 0.8 ? "benchmark-delta-positive" : avgRate < 0.5 ? "benchmark-delta-negative" : "";
1240
+ html += '<tr class="benchmark-row-avg ' + rowClass + '">';
1241
+ html += "<td>" + configLabel + "</td>";
1242
+ html += "<td>Avg</td>";
1243
+ html += '<td class="' + avgPrClass + '">' + (avgRate * 100).toFixed(0) + "%</td>";
1244
+ if (hasTime) {
1245
+ const times = configRuns.map(r => (r.result || {}).time_seconds).filter(t => t != null);
1246
+ html += "<td>" + (times.length ? (times.reduce((a, b) => a + b, 0) / times.length).toFixed(1) : "—") + "</td>";
1247
+ }
1248
+ if (hasErrors) html += "<td></td>";
1249
+ html += "</tr>";
1250
+ }
1251
+ html += "</tbody></table>";
1252
+
1253
+ // Per-assertion detail for this eval
1254
+ const runsWithExpectations = {};
1255
+ for (const config of configGroups) {
1256
+ runsWithExpectations[config] = evalRuns.filter(r => r.configuration === config && r.expectations && r.expectations.length > 0);
1257
+ }
1258
+ const hasAnyExpectations = Object.values(runsWithExpectations).some(runs => runs.length > 0);
1259
+ if (hasAnyExpectations) {
1260
+ // Collect all unique assertion texts across all configs
1261
+ const allAssertions = [];
1262
+ const seen = new Set();
1263
+ for (const config of configGroups) {
1264
+ for (const run of runsWithExpectations[config]) {
1265
+ for (const exp of (run.expectations || [])) {
1266
+ if (!seen.has(exp.text)) {
1267
+ seen.add(exp.text);
1268
+ allAssertions.push(exp.text);
1269
+ }
1270
+ }
1271
+ }
1272
+ }
1273
+
1274
+ html += '<table class="benchmark-table" style="margin-top: 0.5rem;">';
1275
+ html += "<thead><tr><th>Assertion</th>";
1276
+ for (const config of configGroups) {
1277
+ const label = config.replace(/_/g, " ").replace(/\b\w/g, c => c.toUpperCase());
1278
+ html += "<th>" + escapeHtml(label) + "</th>";
1279
+ }
1280
+ html += "</tr></thead><tbody>";
1281
+
1282
+ for (const assertionText of allAssertions) {
1283
+ html += "<tr><td>" + escapeHtml(assertionText) + "</td>";
1284
+
1285
+ for (const config of configGroups) {
1286
+ html += "<td>";
1287
+ for (const run of runsWithExpectations[config]) {
1288
+ const exp = (run.expectations || []).find(e => e.text === assertionText);
1289
+ if (exp) {
1290
+ const cls = exp.passed ? "benchmark-delta-positive" : "benchmark-delta-negative";
1291
+ const icon = exp.passed ? "\u2713" : "\u2717";
1292
+ html += '<span class="' + cls + '" title="Run ' + run.run_number + ': ' + escapeHtml(exp.evidence || "") + '">' + icon + "</span> ";
1293
+ } else {
1294
+ html += "— ";
1295
+ }
1296
+ }
1297
+ html += "</td>";
1298
+ }
1299
+ html += "</tr>";
1300
+ }
1301
+ html += "</tbody></table>";
1302
+ }
1303
+ }
1304
+ }
1305
+
1306
+ // Notes
1307
+ if (notes.length > 0) {
1308
+ html += '<div class="benchmark-notes">';
1309
+ html += "<h3>Analysis Notes</h3>";
1310
+ html += "<ul>";
1311
+ for (const note of notes) {
1312
+ html += "<li>" + escapeHtml(note) + "</li>";
1313
+ }
1314
+ html += "</ul></div>";
1315
+ }
1316
+
1317
+ container.innerHTML = html;
1318
+ }
1319
+
1320
+ // ---- Start ----
1321
+ init();
1322
+ renderBenchmark();
1323
+ </script>
1324
+ </body>
1325
+ </html>