inspect-ai 0.3.62__py3-none-any.whl → 0.3.63__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (415) hide show
  1. inspect_ai/_cli/main.py +1 -1
  2. inspect_ai/_cli/trace.py +8 -0
  3. inspect_ai/_display/core/active.py +2 -3
  4. inspect_ai/_eval/eval.py +4 -4
  5. inspect_ai/_eval/evalset.py +6 -6
  6. inspect_ai/_eval/task/run.py +3 -0
  7. inspect_ai/_util/hash.py +1 -1
  8. inspect_ai/_view/www/.vscode/extensions.json +3 -0
  9. inspect_ai/_view/www/.vscode/settings.json +8 -0
  10. inspect_ai/_view/www/App.css +92 -29
  11. inspect_ai/_view/www/dist/assets/index.css +16637 -14676
  12. inspect_ai/_view/www/dist/assets/index.js +58897 -51440
  13. inspect_ai/_view/www/dist/index.html +1 -1
  14. inspect_ai/_view/www/index.html +2 -2
  15. inspect_ai/_view/www/log-schema.json +1 -0
  16. inspect_ai/_view/www/package.json +22 -4
  17. inspect_ai/_view/www/postcss.config.cjs +8 -9
  18. inspect_ai/_view/www/src/{App.mjs → App.tsx} +355 -365
  19. inspect_ai/_view/www/src/AppErrorBoundary.tsx +47 -0
  20. inspect_ai/_view/www/src/api/api-browser.ts +2 -2
  21. inspect_ai/_view/www/src/api/api-http.ts +3 -5
  22. inspect_ai/_view/www/src/api/api-vscode.ts +6 -6
  23. inspect_ai/_view/www/src/api/client-api.ts +4 -4
  24. inspect_ai/_view/www/src/api/index.ts +4 -4
  25. inspect_ai/_view/www/src/api/{Types.ts → types.ts} +25 -9
  26. inspect_ai/_view/www/src/appearance/colors.ts +9 -0
  27. inspect_ai/_view/www/src/appearance/fonts.ts +39 -0
  28. inspect_ai/_view/www/src/appearance/icons.ts +100 -0
  29. inspect_ai/_view/www/src/appearance/{Styles.mjs → styles.ts} +2 -32
  30. inspect_ai/_view/www/src/components/AnsiDisplay.tsx +198 -0
  31. inspect_ai/_view/www/src/components/AsciinemaPlayer.tsx +86 -0
  32. inspect_ai/_view/www/src/components/Card.css +60 -0
  33. inspect_ai/_view/www/src/components/Card.tsx +109 -0
  34. inspect_ai/_view/www/src/components/CopyButton.module.css +11 -0
  35. inspect_ai/_view/www/src/components/CopyButton.tsx +58 -0
  36. inspect_ai/_view/www/src/components/DownloadButton.css +4 -0
  37. inspect_ai/_view/www/src/components/DownloadButton.tsx +25 -0
  38. inspect_ai/_view/www/src/components/DownloadPanel.css +10 -0
  39. inspect_ai/_view/www/src/components/DownloadPanel.tsx +30 -0
  40. inspect_ai/_view/www/src/components/EmptyPanel.css +12 -0
  41. inspect_ai/_view/www/src/components/EmptyPanel.tsx +15 -0
  42. inspect_ai/_view/www/src/components/ErrorPanel.css +37 -0
  43. inspect_ai/_view/www/src/components/ErrorPanel.tsx +39 -0
  44. inspect_ai/_view/www/src/components/ExpandablePanel.css +40 -0
  45. inspect_ai/_view/www/src/components/ExpandablePanel.tsx +115 -0
  46. inspect_ai/_view/www/src/components/FindBand.css +49 -0
  47. inspect_ai/_view/www/src/components/FindBand.tsx +130 -0
  48. inspect_ai/_view/www/src/components/HumanBaselineView.css +41 -0
  49. inspect_ai/_view/www/src/components/HumanBaselineView.tsx +162 -0
  50. inspect_ai/_view/www/src/components/JsonPanel.css +20 -0
  51. inspect_ai/_view/www/src/components/JsonPanel.tsx +82 -0
  52. inspect_ai/_view/www/src/components/LabeledValue.css +20 -0
  53. inspect_ai/_view/www/src/components/LabeledValue.tsx +41 -0
  54. inspect_ai/_view/www/src/components/LargeModal.module.css +54 -0
  55. inspect_ai/_view/www/src/components/LargeModal.tsx +199 -0
  56. inspect_ai/_view/www/src/components/LightboxCarousel.css +95 -0
  57. inspect_ai/_view/www/src/components/LightboxCarousel.tsx +132 -0
  58. inspect_ai/_view/www/src/components/MarkdownDiv.css +3 -0
  59. inspect_ai/_view/www/src/components/MarkdownDiv.tsx +133 -0
  60. inspect_ai/_view/www/src/components/MessageBand.css +43 -0
  61. inspect_ai/_view/www/src/components/MessageBand.tsx +39 -0
  62. inspect_ai/_view/www/src/components/MorePopOver.tsx +67 -0
  63. inspect_ai/_view/www/src/components/NavPills.module.css +18 -0
  64. inspect_ai/_view/www/src/components/NavPills.tsx +99 -0
  65. inspect_ai/_view/www/src/components/ProgressBar.module.css +37 -0
  66. inspect_ai/_view/www/src/components/ProgressBar.tsx +22 -0
  67. inspect_ai/_view/www/src/components/TabSet.module.css +40 -0
  68. inspect_ai/_view/www/src/components/TabSet.tsx +200 -0
  69. inspect_ai/_view/www/src/components/ToolButton.css +3 -0
  70. inspect_ai/_view/www/src/components/ToolButton.tsx +27 -0
  71. inspect_ai/_view/www/src/components/VirtualList.module.css +19 -0
  72. inspect_ai/_view/www/src/components/VirtualList.tsx +292 -0
  73. inspect_ai/_view/www/src/{index.js → index.tsx} +45 -19
  74. inspect_ai/_view/www/src/{log → logfile}/remoteLogFile.ts +3 -7
  75. inspect_ai/_view/www/src/{utils/remoteZipFile.mjs → logfile/remoteZipFile.ts} +86 -80
  76. inspect_ai/_view/www/src/metadata/MetaDataGrid.tsx +83 -0
  77. inspect_ai/_view/www/src/metadata/MetaDataView.module.css +35 -0
  78. inspect_ai/_view/www/src/metadata/MetaDataView.tsx +95 -0
  79. inspect_ai/_view/www/src/metadata/MetadataGrid.module.css +15 -0
  80. inspect_ai/_view/www/src/metadata/RenderedContent.module.css +12 -0
  81. inspect_ai/_view/www/src/{components/RenderedContent/RenderedContent.mjs → metadata/RenderedContent.tsx} +92 -73
  82. inspect_ai/_view/www/src/metadata/types.ts +18 -0
  83. inspect_ai/_view/www/src/plan/DatasetDetailView.module.css +3 -0
  84. inspect_ai/_view/www/src/plan/DatasetDetailView.tsx +37 -0
  85. inspect_ai/_view/www/src/plan/DetailStep.module.css +9 -0
  86. inspect_ai/_view/www/src/plan/DetailStep.tsx +31 -0
  87. inspect_ai/_view/www/src/plan/PlanCard.tsx +28 -0
  88. inspect_ai/_view/www/src/plan/PlanDetailView.module.css +48 -0
  89. inspect_ai/_view/www/src/plan/PlanDetailView.tsx +309 -0
  90. inspect_ai/_view/www/src/plan/ScorerDetailView.module.css +3 -0
  91. inspect_ai/_view/www/src/plan/ScorerDetailView.tsx +30 -0
  92. inspect_ai/_view/www/src/plan/SolverDetailView.module.css +15 -0
  93. inspect_ai/_view/www/src/plan/SolverDetailView.tsx +32 -0
  94. inspect_ai/_view/www/src/samples/InlineSampleDisplay.module.css +8 -0
  95. inspect_ai/_view/www/src/samples/InlineSampleDisplay.tsx +53 -0
  96. inspect_ai/_view/www/src/samples/SampleDialog.tsx +122 -0
  97. inspect_ai/_view/www/src/samples/SampleDisplay.module.css +29 -0
  98. inspect_ai/_view/www/src/samples/SampleDisplay.tsx +326 -0
  99. inspect_ai/_view/www/src/samples/SampleSummaryView.module.css +24 -0
  100. inspect_ai/_view/www/src/samples/SampleSummaryView.tsx +175 -0
  101. inspect_ai/_view/www/src/samples/SamplesTools.tsx +60 -0
  102. inspect_ai/_view/www/src/samples/chat/ChatMessage.module.css +29 -0
  103. inspect_ai/_view/www/src/samples/chat/ChatMessage.tsx +76 -0
  104. inspect_ai/_view/www/src/samples/chat/ChatMessageRenderer.tsx +60 -0
  105. inspect_ai/_view/www/src/samples/chat/ChatMessageRow.module.css +9 -0
  106. inspect_ai/_view/www/src/samples/chat/ChatMessageRow.tsx +57 -0
  107. inspect_ai/_view/www/src/samples/chat/ChatView.tsx +46 -0
  108. inspect_ai/_view/www/src/samples/chat/ChatViewVirtualList.module.css +4 -0
  109. inspect_ai/_view/www/src/samples/chat/ChatViewVirtualList.tsx +58 -0
  110. inspect_ai/_view/www/src/samples/chat/MessageContent.module.css +4 -0
  111. inspect_ai/_view/www/src/samples/chat/MessageContent.tsx +143 -0
  112. inspect_ai/_view/www/src/samples/chat/MessageContents.module.css +3 -0
  113. inspect_ai/_view/www/src/samples/chat/MessageContents.tsx +131 -0
  114. inspect_ai/_view/www/src/samples/chat/messages.ts +112 -0
  115. inspect_ai/_view/www/src/samples/chat/tools/ToolCallView.tsx +145 -0
  116. inspect_ai/_view/www/src/samples/chat/tools/ToolInput.module.css +14 -0
  117. inspect_ai/_view/www/src/samples/chat/tools/ToolInput.tsx +86 -0
  118. inspect_ai/_view/www/src/samples/chat/tools/ToolOutput.module.css +19 -0
  119. inspect_ai/_view/www/src/samples/chat/tools/ToolOutput.tsx +53 -0
  120. inspect_ai/_view/www/src/samples/chat/tools/ToolTitle.module.css +4 -0
  121. inspect_ai/_view/www/src/samples/chat/tools/ToolTitle.tsx +18 -0
  122. inspect_ai/_view/www/src/samples/chat/tools/tool.ts +107 -0
  123. inspect_ai/_view/www/src/samples/descriptor/samplesDescriptor.tsx +363 -0
  124. inspect_ai/_view/www/src/samples/descriptor/score/BooleanScoreDescriptor.module.css +22 -0
  125. inspect_ai/_view/www/src/samples/descriptor/score/BooleanScoreDescriptor.tsx +26 -0
  126. inspect_ai/_view/www/src/samples/descriptor/score/CategoricalScoreDescriptor.tsx +18 -0
  127. inspect_ai/_view/www/src/samples/descriptor/score/NumericScoreDescriptor.tsx +27 -0
  128. inspect_ai/_view/www/src/samples/descriptor/score/ObjectScoreDescriptor.module.css +18 -0
  129. inspect_ai/_view/www/src/samples/descriptor/score/ObjectScoreDescriptor.tsx +71 -0
  130. inspect_ai/_view/www/src/samples/descriptor/score/OtherScoreDescriptor.tsx +20 -0
  131. inspect_ai/_view/www/src/samples/descriptor/score/PassFailScoreDescriptor.module.css +28 -0
  132. inspect_ai/_view/www/src/samples/descriptor/score/PassFailScoreDescriptor.tsx +81 -0
  133. inspect_ai/_view/www/src/samples/descriptor/score/ScoreDescriptor.tsx +99 -0
  134. inspect_ai/_view/www/src/samples/descriptor/types.ts +55 -0
  135. inspect_ai/_view/www/src/samples/error/FlatSampleErrorView.module.css +19 -0
  136. inspect_ai/_view/www/src/samples/error/FlatSampleErrorView.tsx +22 -0
  137. inspect_ai/_view/www/src/samples/error/SampleErrorView.module.css +17 -0
  138. inspect_ai/_view/www/src/samples/error/SampleErrorView.tsx +31 -0
  139. inspect_ai/_view/www/src/samples/error/error.ts +15 -0
  140. inspect_ai/_view/www/src/samples/list/SampleFooter.module.css +9 -0
  141. inspect_ai/_view/www/src/samples/list/SampleFooter.tsx +14 -0
  142. inspect_ai/_view/www/src/samples/list/SampleHeader.module.css +13 -0
  143. inspect_ai/_view/www/src/samples/list/SampleHeader.tsx +36 -0
  144. inspect_ai/_view/www/src/samples/list/SampleList.module.css +11 -0
  145. inspect_ai/_view/www/src/samples/list/SampleList.tsx +247 -0
  146. inspect_ai/_view/www/src/samples/list/SampleRow.module.css +33 -0
  147. inspect_ai/_view/www/src/samples/list/SampleRow.tsx +98 -0
  148. inspect_ai/_view/www/src/samples/list/SampleSeparator.module.css +6 -0
  149. inspect_ai/_view/www/src/samples/list/SampleSeparator.tsx +24 -0
  150. inspect_ai/_view/www/src/samples/sample-tools/EpochFilter.module.css +9 -0
  151. inspect_ai/_view/www/src/samples/sample-tools/EpochFilter.tsx +51 -0
  152. inspect_ai/_view/www/src/samples/sample-tools/SelectScorer.module.css +16 -0
  153. inspect_ai/_view/www/src/samples/sample-tools/SelectScorer.tsx +173 -0
  154. inspect_ai/_view/www/src/samples/sample-tools/SortFilter.module.css +9 -0
  155. inspect_ai/_view/www/src/samples/sample-tools/SortFilter.tsx +182 -0
  156. inspect_ai/_view/www/src/samples/{tools/filters.mjs → sample-tools/filters.ts} +86 -81
  157. inspect_ai/_view/www/src/samples/sample-tools/sample-filter/SampleFilter.module.css +16 -0
  158. inspect_ai/_view/www/src/samples/sample-tools/sample-filter/SampleFilter.tsx +288 -0
  159. inspect_ai/_view/www/src/samples/sample-tools/sample-filter/completions.ts +346 -0
  160. inspect_ai/_view/www/src/samples/sample-tools/sample-filter/language.ts +19 -0
  161. inspect_ai/_view/www/src/samples/sample-tools/sample-filter/tokenize.ts +97 -0
  162. inspect_ai/_view/www/src/samples/{SampleLimit.mjs → sampleLimit.ts} +3 -6
  163. inspect_ai/_view/www/src/samples/scores/SampleScoreView.module.css +53 -0
  164. inspect_ai/_view/www/src/samples/scores/SampleScoreView.tsx +168 -0
  165. inspect_ai/_view/www/src/samples/scores/SampleScores.module.css +5 -0
  166. inspect_ai/_view/www/src/samples/scores/SampleScores.tsx +37 -0
  167. inspect_ai/_view/www/src/samples/transcript/ApprovalEventView.tsx +66 -0
  168. inspect_ai/_view/www/src/samples/transcript/ErrorEventView.tsx +51 -0
  169. inspect_ai/_view/www/src/samples/transcript/InfoEventView.module.css +3 -0
  170. inspect_ai/_view/www/src/samples/transcript/InfoEventView.tsx +54 -0
  171. inspect_ai/_view/www/src/samples/transcript/InputEventView.tsx +48 -0
  172. inspect_ai/_view/www/src/samples/transcript/LoggerEventView.module.css +6 -0
  173. inspect_ai/_view/www/src/samples/transcript/LoggerEventView.tsx +36 -0
  174. inspect_ai/_view/www/src/samples/transcript/ModelEventView.module.css +43 -0
  175. inspect_ai/_view/www/src/samples/transcript/ModelEventView.tsx +223 -0
  176. inspect_ai/_view/www/src/samples/transcript/SampleInitEventView.module.css +23 -0
  177. inspect_ai/_view/www/src/samples/transcript/SampleInitEventView.tsx +108 -0
  178. inspect_ai/_view/www/src/samples/transcript/SampleLimitEventView.tsx +75 -0
  179. inspect_ai/_view/www/src/samples/transcript/SampleTranscript.tsx +22 -0
  180. inspect_ai/_view/www/src/samples/transcript/ScoreEventView.module.css +15 -0
  181. inspect_ai/_view/www/src/samples/transcript/ScoreEventView.tsx +100 -0
  182. inspect_ai/_view/www/src/samples/transcript/StepEventView.tsx +171 -0
  183. inspect_ai/_view/www/src/samples/transcript/SubtaskEventView.module.css +19 -0
  184. inspect_ai/_view/www/src/samples/transcript/SubtaskEventView.tsx +133 -0
  185. inspect_ai/_view/www/src/samples/transcript/ToolEventView.module.css +10 -0
  186. inspect_ai/_view/www/src/samples/transcript/ToolEventView.tsx +91 -0
  187. inspect_ai/_view/www/src/samples/transcript/TranscriptView.module.css +49 -0
  188. inspect_ai/_view/www/src/samples/transcript/TranscriptView.tsx +449 -0
  189. inspect_ai/_view/www/src/samples/transcript/event/EventNav.module.css +5 -0
  190. inspect_ai/_view/www/src/samples/transcript/event/EventNav.tsx +43 -0
  191. inspect_ai/_view/www/src/samples/transcript/event/EventNavs.module.css +3 -0
  192. inspect_ai/_view/www/src/samples/transcript/event/EventNavs.tsx +38 -0
  193. inspect_ai/_view/www/src/samples/transcript/event/EventPanel.module.css +25 -0
  194. inspect_ai/_view/www/src/samples/transcript/event/EventPanel.tsx +190 -0
  195. inspect_ai/_view/www/src/samples/transcript/event/EventRow.module.css +13 -0
  196. inspect_ai/_view/www/src/samples/transcript/event/EventRow.tsx +32 -0
  197. inspect_ai/_view/www/src/samples/transcript/event/EventSection.module.css +8 -0
  198. inspect_ai/_view/www/src/samples/transcript/event/EventSection.tsx +29 -0
  199. inspect_ai/_view/www/src/samples/transcript/state/StateDiffView.tsx +67 -0
  200. inspect_ai/_view/www/src/samples/transcript/state/StateEventRenderers.tsx +274 -0
  201. inspect_ai/_view/www/src/samples/transcript/state/StateEventRenders.module.css +10 -0
  202. inspect_ai/_view/www/src/samples/transcript/state/StateEventView.module.css +9 -0
  203. inspect_ai/_view/www/src/samples/transcript/state/{StateEventView.mjs → StateEventView.tsx} +148 -110
  204. inspect_ai/_view/www/src/samples/transcript/types.ts +58 -0
  205. inspect_ai/_view/www/src/types/log.d.ts +1 -0
  206. inspect_ai/_view/www/src/types/prism.d.ts +11 -0
  207. inspect_ai/_view/www/src/types.ts +71 -0
  208. inspect_ai/_view/www/src/usage/ModelTokenTable.tsx +22 -0
  209. inspect_ai/_view/www/src/usage/ModelUsagePanel.module.css +24 -0
  210. inspect_ai/_view/www/src/usage/ModelUsagePanel.tsx +95 -0
  211. inspect_ai/_view/www/src/usage/TokenTable.module.css +17 -0
  212. inspect_ai/_view/www/src/usage/TokenTable.tsx +91 -0
  213. inspect_ai/_view/www/src/usage/UsageCard.module.css +15 -0
  214. inspect_ai/_view/www/src/usage/UsageCard.tsx +67 -0
  215. inspect_ai/_view/www/src/utils/attachments.ts +42 -0
  216. inspect_ai/_view/www/src/utils/{Base64.mjs → base64.ts} +1 -6
  217. inspect_ai/_view/www/src/{components/Browser.mjs → utils/browser.ts} +0 -1
  218. inspect_ai/_view/www/src/utils/debugging.ts +28 -0
  219. inspect_ai/_view/www/src/utils/dom.ts +30 -0
  220. inspect_ai/_view/www/src/utils/format.ts +194 -0
  221. inspect_ai/_view/www/src/utils/git.ts +7 -0
  222. inspect_ai/_view/www/src/utils/html.ts +6 -0
  223. inspect_ai/_view/www/src/utils/http.ts +14 -0
  224. inspect_ai/_view/www/src/utils/{Path.mjs → path.ts} +2 -9
  225. inspect_ai/_view/www/src/utils/{Print.mjs → print.ts} +34 -26
  226. inspect_ai/_view/www/src/utils/queue.ts +51 -0
  227. inspect_ai/_view/www/src/utils/sync.ts +114 -0
  228. inspect_ai/_view/www/src/utils/{Type.mjs → type.ts} +3 -6
  229. inspect_ai/_view/www/src/utils/vscode.ts +13 -0
  230. inspect_ai/_view/www/src/workspace/WorkSpace.tsx +324 -0
  231. inspect_ai/_view/www/src/workspace/WorkSpaceView.module.css +33 -0
  232. inspect_ai/_view/www/src/workspace/WorkSpaceView.tsx +160 -0
  233. inspect_ai/_view/www/src/workspace/error/TaskErrorPanel.module.css +3 -0
  234. inspect_ai/_view/www/src/workspace/error/TaskErrorPanel.tsx +28 -0
  235. inspect_ai/_view/www/src/workspace/navbar/Navbar.module.css +54 -0
  236. inspect_ai/_view/www/src/workspace/navbar/Navbar.tsx +68 -0
  237. inspect_ai/_view/www/src/workspace/navbar/PrimaryBar.module.css +52 -0
  238. inspect_ai/_view/www/src/workspace/navbar/PrimaryBar.tsx +113 -0
  239. inspect_ai/_view/www/src/workspace/navbar/ResultsPanel.module.css +67 -0
  240. inspect_ai/_view/www/src/workspace/navbar/ResultsPanel.tsx +156 -0
  241. inspect_ai/_view/www/src/workspace/navbar/SecondaryBar.module.css +28 -0
  242. inspect_ai/_view/www/src/workspace/navbar/SecondaryBar.tsx +222 -0
  243. inspect_ai/_view/www/src/workspace/navbar/StatusPanel.module.css +14 -0
  244. inspect_ai/_view/www/src/workspace/navbar/StatusPanel.tsx +61 -0
  245. inspect_ai/_view/www/src/workspace/sidebar/EvalStatus.module.css +15 -0
  246. inspect_ai/_view/www/src/workspace/sidebar/EvalStatus.tsx +71 -0
  247. inspect_ai/_view/www/src/workspace/sidebar/LogDirectoryTitleView.module.css +5 -0
  248. inspect_ai/_view/www/src/workspace/sidebar/LogDirectoryTitleView.tsx +56 -0
  249. inspect_ai/_view/www/src/workspace/sidebar/Sidebar.module.css +68 -0
  250. inspect_ai/_view/www/src/workspace/sidebar/Sidebar.tsx +85 -0
  251. inspect_ai/_view/www/src/workspace/sidebar/SidebarLogEntry.module.css +29 -0
  252. inspect_ai/_view/www/src/workspace/sidebar/SidebarLogEntry.tsx +95 -0
  253. inspect_ai/_view/www/src/workspace/sidebar/SidebarScoreView.module.css +23 -0
  254. inspect_ai/_view/www/src/workspace/sidebar/SidebarScoreView.tsx +41 -0
  255. inspect_ai/_view/www/src/workspace/sidebar/SidebarScoresView.module.css +35 -0
  256. inspect_ai/_view/www/src/workspace/sidebar/SidebarScoresView.tsx +61 -0
  257. inspect_ai/_view/www/src/workspace/tabs/InfoTab.tsx +80 -0
  258. inspect_ai/_view/www/src/workspace/tabs/JsonTab.module.css +5 -0
  259. inspect_ai/_view/www/src/workspace/tabs/JsonTab.tsx +46 -0
  260. inspect_ai/_view/www/src/workspace/tabs/SamplesTab.tsx +204 -0
  261. inspect_ai/_view/www/src/workspace/tabs/grouping.ts +195 -0
  262. inspect_ai/_view/www/src/workspace/tabs/types.ts +19 -0
  263. inspect_ai/_view/www/src/workspace/types.ts +10 -0
  264. inspect_ai/_view/www/tsconfig.json +23 -9
  265. inspect_ai/_view/www/vite.config.js +8 -17
  266. inspect_ai/_view/www/yarn.lock +627 -556
  267. inspect_ai/dataset/_dataset.py +36 -0
  268. inspect_ai/dataset/_sources/csv.py +8 -0
  269. inspect_ai/dataset/_sources/file.py +4 -0
  270. inspect_ai/dataset/_sources/hf.py +11 -1
  271. inspect_ai/dataset/_sources/json.py +8 -0
  272. inspect_ai/log/_log.py +3 -6
  273. inspect_ai/log/_message.py +1 -1
  274. inspect_ai/log/_recorders/json.py +5 -7
  275. inspect_ai/model/_call_tools.py +2 -1
  276. inspect_ai/model/_providers/anthropic.py +3 -3
  277. inspect_ai/model/_providers/openai_o1.py +3 -5
  278. inspect_ai/model/_providers/openrouter.py +86 -0
  279. inspect_ai/model/_providers/providers.py +11 -0
  280. inspect_ai/scorer/_answer.py +7 -7
  281. inspect_ai/scorer/_classification.py +34 -18
  282. inspect_ai/scorer/_common.py +2 -8
  283. inspect_ai/solver/_multiple_choice.py +24 -9
  284. inspect_ai/tool/__init__.py +2 -0
  285. inspect_ai/tool/{beta → _tools}/_computer/_computer.py +2 -5
  286. inspect_ai/tool/_tools/_computer/_resources/tool/__init__.py +0 -0
  287. inspect_ai/tool/{beta → _tools}/_computer/_resources/tool/_x11_client.py +1 -1
  288. inspect_ai/tool/_tools/_computer/_resources/tool/requirements.txt +0 -0
  289. inspect_ai/tool/_tools/_execute.py +8 -2
  290. inspect_ai/tool/beta.py +3 -0
  291. inspect_ai/util/_sandbox/docker/docker.py +32 -85
  292. inspect_ai/util/_sandbox/self_check.py +124 -16
  293. {inspect_ai-0.3.62.dist-info → inspect_ai-0.3.63.dist-info}/METADATA +2 -1
  294. inspect_ai-0.3.63.dist-info/RECORD +618 -0
  295. inspect_ai/_view/www/src/Register.mjs +0 -3
  296. inspect_ai/_view/www/src/Types.mjs +0 -38
  297. inspect_ai/_view/www/src/appearance/Colors.mjs +0 -27
  298. inspect_ai/_view/www/src/appearance/Fonts.mjs +0 -66
  299. inspect_ai/_view/www/src/appearance/Icons.mjs +0 -240
  300. inspect_ai/_view/www/src/components/AnsiDisplay.mjs +0 -184
  301. inspect_ai/_view/www/src/components/AppErrorBoundary.mjs +0 -34
  302. inspect_ai/_view/www/src/components/AsciiCinemaPlayer.mjs +0 -74
  303. inspect_ai/_view/www/src/components/Card.mjs +0 -126
  304. inspect_ai/_view/www/src/components/ChatView.mjs +0 -441
  305. inspect_ai/_view/www/src/components/CopyButton.mjs +0 -48
  306. inspect_ai/_view/www/src/components/Dialog.mjs +0 -61
  307. inspect_ai/_view/www/src/components/DownloadButton.mjs +0 -15
  308. inspect_ai/_view/www/src/components/DownloadPanel.mjs +0 -29
  309. inspect_ai/_view/www/src/components/EmptyPanel.mjs +0 -23
  310. inspect_ai/_view/www/src/components/ErrorPanel.mjs +0 -66
  311. inspect_ai/_view/www/src/components/ExpandablePanel.mjs +0 -136
  312. inspect_ai/_view/www/src/components/FindBand.mjs +0 -157
  313. inspect_ai/_view/www/src/components/HumanBaselineView.mjs +0 -168
  314. inspect_ai/_view/www/src/components/JsonPanel.mjs +0 -61
  315. inspect_ai/_view/www/src/components/LabeledValue.mjs +0 -32
  316. inspect_ai/_view/www/src/components/LargeModal.mjs +0 -190
  317. inspect_ai/_view/www/src/components/LightboxCarousel.mjs +0 -217
  318. inspect_ai/_view/www/src/components/MarkdownDiv.mjs +0 -118
  319. inspect_ai/_view/www/src/components/MessageBand.mjs +0 -48
  320. inspect_ai/_view/www/src/components/MessageContent.mjs +0 -111
  321. inspect_ai/_view/www/src/components/MetaDataGrid.mjs +0 -92
  322. inspect_ai/_view/www/src/components/MetaDataView.mjs +0 -109
  323. inspect_ai/_view/www/src/components/MorePopOver.mjs +0 -50
  324. inspect_ai/_view/www/src/components/NavPills.mjs +0 -63
  325. inspect_ai/_view/www/src/components/ProgressBar.mjs +0 -51
  326. inspect_ai/_view/www/src/components/RenderedContent/ChatMessageRenderer.mjs +0 -54
  327. inspect_ai/_view/www/src/components/RenderedContent/Types.mjs +0 -19
  328. inspect_ai/_view/www/src/components/TabSet.mjs +0 -184
  329. inspect_ai/_view/www/src/components/ToolButton.mjs +0 -16
  330. inspect_ai/_view/www/src/components/Tools.mjs +0 -376
  331. inspect_ai/_view/www/src/components/VirtualList.mjs +0 -280
  332. inspect_ai/_view/www/src/components/ansi-output.js +0 -932
  333. inspect_ai/_view/www/src/json/JsonTab.mjs +0 -48
  334. inspect_ai/_view/www/src/log-reader/Log-Reader.mjs +0 -25
  335. inspect_ai/_view/www/src/log-reader/Native-Log-Reader.mjs +0 -13
  336. inspect_ai/_view/www/src/log-reader/Open-AI-Log-Reader.mjs +0 -263
  337. inspect_ai/_view/www/src/navbar/Navbar.mjs +0 -418
  338. inspect_ai/_view/www/src/navbar/SecondaryBar.mjs +0 -175
  339. inspect_ai/_view/www/src/plan/PlanCard.mjs +0 -418
  340. inspect_ai/_view/www/src/samples/SampleDialog.mjs +0 -123
  341. inspect_ai/_view/www/src/samples/SampleDisplay.mjs +0 -516
  342. inspect_ai/_view/www/src/samples/SampleError.mjs +0 -99
  343. inspect_ai/_view/www/src/samples/SampleList.mjs +0 -427
  344. inspect_ai/_view/www/src/samples/SampleScoreView.mjs +0 -172
  345. inspect_ai/_view/www/src/samples/SampleScores.mjs +0 -34
  346. inspect_ai/_view/www/src/samples/SampleTranscript.mjs +0 -20
  347. inspect_ai/_view/www/src/samples/SamplesDescriptor.mjs +0 -771
  348. inspect_ai/_view/www/src/samples/SamplesTab.mjs +0 -399
  349. inspect_ai/_view/www/src/samples/SamplesTools.mjs +0 -64
  350. inspect_ai/_view/www/src/samples/tools/EpochFilter.mjs +0 -38
  351. inspect_ai/_view/www/src/samples/tools/SampleFilter.mjs +0 -756
  352. inspect_ai/_view/www/src/samples/tools/SelectScorer.mjs +0 -141
  353. inspect_ai/_view/www/src/samples/tools/SortFilter.mjs +0 -151
  354. inspect_ai/_view/www/src/samples/transcript/ApprovalEventView.mjs +0 -71
  355. inspect_ai/_view/www/src/samples/transcript/ErrorEventView.mjs +0 -44
  356. inspect_ai/_view/www/src/samples/transcript/EventPanel.mjs +0 -271
  357. inspect_ai/_view/www/src/samples/transcript/EventRow.mjs +0 -46
  358. inspect_ai/_view/www/src/samples/transcript/EventSection.mjs +0 -33
  359. inspect_ai/_view/www/src/samples/transcript/InfoEventView.mjs +0 -59
  360. inspect_ai/_view/www/src/samples/transcript/InputEventView.mjs +0 -44
  361. inspect_ai/_view/www/src/samples/transcript/LoggerEventView.mjs +0 -32
  362. inspect_ai/_view/www/src/samples/transcript/ModelEventView.mjs +0 -216
  363. inspect_ai/_view/www/src/samples/transcript/SampleInitEventView.mjs +0 -107
  364. inspect_ai/_view/www/src/samples/transcript/SampleLimitEventView.mjs +0 -74
  365. inspect_ai/_view/www/src/samples/transcript/ScoreEventView.mjs +0 -100
  366. inspect_ai/_view/www/src/samples/transcript/StepEventView.mjs +0 -187
  367. inspect_ai/_view/www/src/samples/transcript/SubtaskEventView.mjs +0 -133
  368. inspect_ai/_view/www/src/samples/transcript/ToolEventView.mjs +0 -88
  369. inspect_ai/_view/www/src/samples/transcript/TranscriptView.mjs +0 -459
  370. inspect_ai/_view/www/src/samples/transcript/Types.mjs +0 -44
  371. inspect_ai/_view/www/src/samples/transcript/state/StateDiffView.mjs +0 -53
  372. inspect_ai/_view/www/src/samples/transcript/state/StateEventRenderers.mjs +0 -254
  373. inspect_ai/_view/www/src/sidebar/Sidebar.mjs +0 -418
  374. inspect_ai/_view/www/src/usage/ModelTokenTable.mjs +0 -72
  375. inspect_ai/_view/www/src/usage/UsageCard.mjs +0 -159
  376. inspect_ai/_view/www/src/utils/Format.mjs +0 -260
  377. inspect_ai/_view/www/src/utils/Git.mjs +0 -12
  378. inspect_ai/_view/www/src/utils/Html.mjs +0 -21
  379. inspect_ai/_view/www/src/utils/attachments.mjs +0 -31
  380. inspect_ai/_view/www/src/utils/debugging.mjs +0 -23
  381. inspect_ai/_view/www/src/utils/http.mjs +0 -18
  382. inspect_ai/_view/www/src/utils/queue.mjs +0 -67
  383. inspect_ai/_view/www/src/utils/sync.mjs +0 -101
  384. inspect_ai/_view/www/src/workspace/TaskErrorPanel.mjs +0 -17
  385. inspect_ai/_view/www/src/workspace/WorkSpace.mjs +0 -516
  386. inspect_ai/tool/beta/__init__.py +0 -5
  387. inspect_ai-0.3.62.dist-info/RECORD +0 -481
  388. /inspect_ai/{tool/beta/_computer/_resources/tool/__init__.py → _view/www/src/components/MorePopOver.css} +0 -0
  389. /inspect_ai/_view/www/src/{constants.mjs → constants.ts} +0 -0
  390. /inspect_ai/{tool/beta/_computer/_resources/tool/requirements.txt → _view/www/src/workspace/tabs/InfoTab.module.css} +0 -0
  391. /inspect_ai/tool/{beta → _tools}/_computer/__init__.py +0 -0
  392. /inspect_ai/tool/{beta → _tools}/_computer/_common.py +0 -0
  393. /inspect_ai/tool/{beta → _tools}/_computer/_computer_split.py +0 -0
  394. /inspect_ai/tool/{beta → _tools}/_computer/_resources/Dockerfile +0 -0
  395. /inspect_ai/tool/{beta → _tools}/_computer/_resources/README.md +0 -0
  396. /inspect_ai/tool/{beta → _tools}/_computer/_resources/entrypoint/entrypoint.sh +0 -0
  397. /inspect_ai/tool/{beta → _tools}/_computer/_resources/entrypoint/novnc_startup.sh +0 -0
  398. /inspect_ai/tool/{beta → _tools}/_computer/_resources/entrypoint/x11vnc_startup.sh +0 -0
  399. /inspect_ai/tool/{beta → _tools}/_computer/_resources/entrypoint/xfce_startup.sh +0 -0
  400. /inspect_ai/tool/{beta → _tools}/_computer/_resources/entrypoint/xvfb_startup.sh +0 -0
  401. /inspect_ai/tool/{beta → _tools}/_computer/_resources/image_home_dir/.config/Code/User/globalStorage/state.vscdb +0 -0
  402. /inspect_ai/tool/{beta → _tools}/_computer/_resources/image_home_dir/.config/Code/User/settings.json +0 -0
  403. /inspect_ai/tool/{beta → _tools}/_computer/_resources/image_home_dir/.config/xfce4/xfconf/xfce-perchannel-xml/xfce4-panel.xml +0 -0
  404. /inspect_ai/tool/{beta → _tools}/_computer/_resources/image_home_dir/.config/xfce4/xfconf/xfce-perchannel-xml/xfce4-screensaver.xml +0 -0
  405. /inspect_ai/tool/{beta → _tools}/_computer/_resources/image_home_dir/Desktop/Firefox Web Browser.desktop +0 -0
  406. /inspect_ai/tool/{beta → _tools}/_computer/_resources/image_home_dir/Desktop/Terminal.desktop +0 -0
  407. /inspect_ai/tool/{beta → _tools}/_computer/_resources/image_home_dir/Desktop/Visual Studio Code.desktop +0 -0
  408. /inspect_ai/tool/{beta → _tools}/_computer/_resources/tool/_logger.py +0 -0
  409. /inspect_ai/tool/{beta → _tools}/_computer/_resources/tool/_run.py +0 -0
  410. /inspect_ai/tool/{beta → _tools}/_computer/_resources/tool/_tool_result.py +0 -0
  411. /inspect_ai/tool/{beta → _tools}/_computer/_resources/tool/computer_tool.py +0 -0
  412. {inspect_ai-0.3.62.dist-info → inspect_ai-0.3.63.dist-info}/LICENSE +0 -0
  413. {inspect_ai-0.3.62.dist-info → inspect_ai-0.3.63.dist-info}/WHEEL +0 -0
  414. {inspect_ai-0.3.62.dist-info → inspect_ai-0.3.63.dist-info}/entry_points.txt +0 -0
  415. {inspect_ai-0.3.62.dist-info → inspect_ai-0.3.63.dist-info}/top_level.txt +0 -0
@@ -0,0 +1,190 @@
1
+ import clsx from "clsx";
2
+ import { ReactNode } from "react";
3
+ import { ApplicationIcons } from "../../../appearance/icons";
4
+ import { EventNavs } from "./EventNavs";
5
+
6
+ import React from "react";
7
+ import styles from "./EventPanel.module.css";
8
+
9
/**
 * Props accepted by the EventPanel component.
 */
interface EventPanelProps {
  /** DOM id of the card; also used as the prefix of the generated tab-pane ids. */
  id: string;
  className?: string | string[];
  /** Label rendered in the header row. */
  title?: string;
  /** Used as the tooltip (`title` attribute) of the header row. */
  subTitle?: string;
  /** Summary text shown in the header while the panel is collapsed. */
  text?: string;
  /** Icon class name rendered before the title. */
  icon?: string;
  /** When defined the panel is collapsible; also the fallback collapsed state. */
  collapse?: boolean;
  /** Current collapsed state; `collapse` is used when this is undefined. */
  collapsed?: boolean;
  setCollapsed: (collapse: boolean) => void;
  /** Id of the selected tab pane; the first pane is used when empty. */
  selectedNav: string;
  setSelectedNav: (nav: string) => void;
  children?: ReactNode | ReactNode[];
}

/**
 * Props read from child elements to label their tab.
 */
interface ChildProps {
  "data-name"?: string;
}

/**
 * Renders the EventPanel component: a card with an optional header (collapse
 * chevron, icon, title, summary text and tab navigation) followed by one tab
 * pane per truthy child.
 */
export const EventPanel: React.FC<EventPanelProps> = ({
  id,
  className,
  title,
  subTitle,
  text,
  icon,
  collapse,
  collapsed,
  setCollapsed,
  children,
  setSelectedNav,
  selectedNav,
}) => {
  const hasCollapse = collapse !== undefined;
  const isCollapsed = collapsed === undefined ? collapse : collapsed;

  const pillId = (index: number) => {
    return `${id}-nav-pill-${index}`;
  };
  const defaultPillId = pillId(0);

  // Falsy children (null, undefined, false, "") do not get a tab.
  const filteredArrChildren = (
    Array.isArray(children) ? children : [children]
  ).filter((child) => !!child);
  const hasTabs = filteredArrChildren.length > 1;

  const toggleCollapsed = () => {
    setCollapsed(!isCollapsed);
  };

  // Column template for the header grid.
  const gridColumns: string[] = [];
  if (hasCollapse) {
    gridColumns.push("minmax(0, max-content)");
  }
  if (icon) {
    gridColumns.push("max-content");
  }
  gridColumns.push("minmax(0, max-content)");
  if (subTitle) {
    gridColumns.push("minmax(0, max-content)");
  }
  gridColumns.push("auto");
  gridColumns.push("minmax(0, max-content)");
  gridColumns.push("minmax(0, max-content)");

  const titleEl =
    title || icon || hasTabs ? (
      <div
        title={subTitle}
        className={clsx("text-size-small")}
        style={{
          display: "grid",
          gridTemplateColumns: gridColumns.join(" "),
          columnGap: "0.3em",
          cursor: hasCollapse ? "pointer" : undefined,
        }}
      >
        {hasCollapse ? (
          <i
            onClick={toggleCollapsed}
            className={
              isCollapsed
                ? ApplicationIcons.chevron.right
                : ApplicationIcons.chevron.down
            }
          />
        ) : null}
        {icon ? (
          <i
            className={clsx(icon, "text-style-secondary")}
            onClick={toggleCollapsed}
          />
        ) : null}
        <div
          className={clsx("text-style-secondary", "text-style-label")}
          onClick={toggleCollapsed}
        >
          {title}
        </div>
        <div onClick={toggleCollapsed}></div>
        <div
          className={clsx("text-style-secondary", styles.label)}
          onClick={toggleCollapsed}
        >
          {/* Use the derived state so the summary also shows when only `collapse` is set. */}
          {isCollapsed ? text : ""}
        </div>
        <div className={styles.navs}>
          {(!hasCollapse || !isCollapsed) && hasTabs ? (
            <EventNavs
              navs={filteredArrChildren.map((child, index) => {
                const defaultTitle = `Tab ${index}`;
                const navTitle =
                  child && React.isValidElement<ChildProps>(child)
                    ? (child.props as ChildProps)["data-name"] || defaultTitle
                    : defaultTitle;
                return {
                  id: `eventpanel-${id}-${index}`,
                  title: navTitle,
                  target: pillId(index),
                };
              })}
              selectedNav={selectedNav || defaultPillId}
              setSelectedNav={setSelectedNav}
            />
          ) : null}
        </div>
      </div>
    ) : null;

  return (
    <div id={id} className={clsx(className, styles.card)}>
      {titleEl}
      <div
        className={clsx(
          "tab-content",
          styles.cardContent,
          hasCollapse && isCollapsed ? styles.hidden : undefined,
        )}
      >
        {filteredArrChildren.map((child, index) => {
          const paneId = pillId(index);
          const isSelected = paneId === (selectedNav || defaultPillId);

          return (
            <div
              key={paneId}
              id={paneId}
              className={clsx("tab-pane", "show", isSelected ? "active" : "")}
            >
              {child}
            </div>
          );
        })}
      </div>
    </div>
  );
};
@@ -0,0 +1,13 @@
1
/* Three-column grid; the last column takes the remaining width. */
.title {
  display: grid;
  grid-template-columns: max-content max-content minmax(0, 1fr);
  column-gap: 0.5em;
  margin-left: 0.5em;
}

/* Bordered, padded wrapper. */
.contents {
  margin-bottom: 0;
  padding: 0.4em;
  border: solid 1px var(--bs-light-border-subtle);
  border-radius: var(--bs-border-radius);
}
@@ -0,0 +1,32 @@
1
+ import clsx from "clsx";
2
+ import { ApplicationIcons } from "../../../appearance/icons";
3
+ import styles from "./EventRow.module.css";
4
+
5
/**
 * Props accepted by the EventRow component.
 */
interface EventRowProps {
  /** Label of the row; when empty the card is rendered without content. */
  title: string;
  /** Icon class name; a default metadata icon is used when empty. */
  icon: string;
  className?: string | string[];
  children?: React.ReactNode | React.ReactNode[];
}

/**
 * Renders a single-line event card: icon, label and inline children.
 */
export const EventRow: React.FC<EventRowProps> = ({
  title,
  icon,
  className,
  children,
}) => {
  const iconClass = icon || ApplicationIcons.metadata;
  const rowClass = clsx("text-size-small", styles.title, className);

  return (
    <div className={clsx("card", styles.contents)}>
      {title ? (
        <div className={rowClass}>
          <i className={iconClass} />
          <div className={clsx("text-style-label")}>{title}</div>
          <div>{children}</div>
        </div>
      ) : (
        ""
      )}
    </div>
  );
};
@@ -0,0 +1,8 @@
1
/* Top margin only. */
.container {
  margin: 1em 0 0 0;
}

/* Semi-bold text with a small gap below. */
.title {
  padding-bottom: 0.3em;
  font-weight: 600;
}
@@ -0,0 +1,29 @@
1
+ import clsx from "clsx";
2
+ import { ReactNode } from "react";
3
+ import styles from "./EventSection.module.css";
4
+
5
/**
 * Props accepted by the EventSection component.
 */
interface EventSectionProps {
  /** Heading shown above the section content. */
  title: string;
  children: ReactNode;
  className?: string | string[];
}

/**
 * Renders a titled section: a small label heading followed by its children.
 */
export const EventSection: React.FC<EventSectionProps> = ({
  title,
  children,
  className,
}) => {
  const headingClass = clsx(
    "text-size-small",
    "text-style-label",
    styles.title,
  );

  return (
    <div className={clsx(styles.container, className)}>
      <div className={headingClass}>{title}</div>
      {children}
    </div>
  );
};
@@ -0,0 +1,67 @@
1
+ import clsx from "clsx";
2
+ import { diff } from "jsondiffpatch";
3
+ import { format } from "jsondiffpatch/formatters/html";
4
+
5
/**
 * Props accepted by the StateDiffView component.
 */
interface StateDiffViewProps {
  /** State before the change. */
  before: Object;
  /** State after the change. */
  after: Object;
  className?: string | string[];
}

/**
 * Renders the difference between two state objects as HTML produced by
 * jsondiffpatch.
 */
export const StateDiffView: React.FC<StateDiffViewProps> = ({
  before,
  after,
  className,
}) => {
  // Keys are sanitized before diffing because the generated markup is
  // injected as raw HTML below.
  const delta = diff(sanitizeKeys(before), sanitizeKeys(after));
  const markup = format(delta) || "Unable to render differences";

  return (
    <div
      dangerouslySetInnerHTML={{ __html: unescapeNewlines(markup) }}
      className={clsx(className)}
    ></div>
  );
};
30
+
31
/**
 * Replaces every literal backslash-n sequence with a real newline.
 *
 * Strings are converted directly; arrays and plain objects are walked
 * recursively (object keys are left untouched); any other value is returned
 * unchanged.
 */
function unescapeNewlines<T>(obj: T): T {
  if (typeof obj === "string") {
    return obj.split("\\n").join("\n") as T;
  }

  if (Array.isArray(obj)) {
    return obj.map((entry) => unescapeNewlines(entry)) as T;
  }

  if (obj !== null && typeof obj === "object") {
    const converted = Object.entries(obj as Record<string, unknown>).map(
      ([name, inner]) => [name, unescapeNewlines(inner)],
    );
    return Object.fromEntries(converted) as T;
  }

  return obj;
}
51
+
52
/**
 * Returns a deep copy of `obj` in which every object key is HTML-escaped.
 *
 * The result of diffing these objects is injected into the page as raw HTML,
 * so keys must be safe both as element text and inside a quoted attribute
 * value. All five significant characters are therefore escaped: `&`
 * (first, so the entities produced below are not escaped again), `<`, `>`,
 * `"` and `'`.
 *
 * Arrays are walked element by element; values that are not objects or
 * arrays (including strings) are returned unchanged.
 */
function sanitizeKeys<T>(obj: T): T {
  if (typeof obj !== "object" || obj === null) {
    return obj;
  }

  if (Array.isArray(obj)) {
    return obj.map((item) => sanitizeKeys(item)) as T;
  }

  return Object.fromEntries(
    Object.entries(obj as Record<string, unknown>).map(([key, value]) => [
      key
        .replace(/&/g, "&amp;")
        .replace(/</g, "&lt;")
        .replace(/>/g, "&gt;")
        .replace(/"/g, "&quot;")
        .replace(/'/g, "&#39;"),
      sanitizeKeys(value),
    ]),
  ) as T;
}
@@ -0,0 +1,274 @@
1
+ import clsx from "clsx";
2
+ import { Fragment, ReactNode } from "react";
3
+ import {
4
+ HumanBaselineView,
5
+ SessionLog,
6
+ } from "../../../components/HumanBaselineView";
7
+ import { JsonChange, Messages } from "../../../types/log";
8
+ import { ChatView } from "../../chat/ChatView";
9
+
10
+ import styles from "./StateEventRenders.module.css";
11
+
12
/**
 * JSON paths, grouped by operation, that identify a kind of state change.
 */
interface Signature {
  /** Paths expected under the `remove` operation. */
  remove: string[];
  /** Paths expected under the `replace` operation. */
  replace: string[];
  /** Paths expected under the `add` operation. */
  add: string[];
}

/**
 * A recognizable kind of state change together with its custom renderer.
 */
interface ChangeType {
  /** Name of the change kind. */
  type: string;
  /** Paths that characterize this change kind. */
  signature: Signature;
  /** Produces the view for the given changes and state. */
  render: (changes: JsonChange[], state: Record<string, unknown>) => ReactNode;
}
23
+
24
/**
 * Change type for a system message being inserted at the front of the
 * message list; renders the first message of the state as a chat preview.
 */
const system_msg_added_sig: ChangeType = {
  type: "system_message",
  signature: {
    remove: ["/messages/0/source"],
    replace: ["/messages/0/role", "/messages/0/content"],
    add: ["/messages/1"],
  },
  render: (_changes, resolvedState) => {
    const allMessages = resolvedState["messages"] as Array<unknown>;
    const preview = [allMessages[0]] as Messages;
    return <ChatView id="system_msg_event_preview" messages={preview} />;
  },
};
42
+
43
// Pattern matching a change path that points at an entry of the tools list;
// the capture group is the tool's index.
const kToolPattern = "/tools/(\\d+)";

/**
 * Change type for tools being set together with the tool choice.
 *
 * `renderTools` is declared further down in this module, so it is called
 * through a closure rather than referenced directly here.
 */
const use_tools: ChangeType = {
  type: "use_tools",
  signature: {
    add: ["/tools/0"],
    replace: ["/tool_choice"],
    remove: [],
  },
  render: (changes, resolvedState) => renderTools(changes, resolvedState),
};

/**
 * Change type for one or more tools being added to the tools list.
 */
const add_tools: ChangeType = {
  type: "add_tools",
  signature: {
    add: [kToolPattern],
    replace: [],
    remove: [],
  },
  render: (changes, resolvedState) => renderTools(changes, resolvedState),
};
68
+
69
/** Builds the state key under which a human-agent value named `key` is read. */
const humanAgentKey = (key: string) => "HumanAgentState:" + key;
72
/**
 * Change type for human baseline session logs being added to the state;
 * renders the session summary together with its recorded logs.
 */
const human_baseline_session: ChangeType = {
  type: "human_baseline_session",
  signature: {
    add: ["HumanAgentState:logs"],
    replace: [],
    remove: [],
  },
  render: (_changes, state: Record<string, unknown>) => {
    // Pull the session values out of the state
    const startedSeconds = state[humanAgentKey("started_running")] as number;
    const runtime = state[humanAgentKey("accumulated_time")] as number;
    const answer = state[humanAgentKey("answer")] as string;
    const running = state[humanAgentKey("running_state")] as boolean;
    const rawSessions = state[humanAgentKey("logs")] as Record<string, unknown>;

    // The start time is multiplied by 1000 before being handed to Date
    const startedDate = startedSeconds
      ? new Date(startedSeconds * 1000)
      : undefined;

    // Group the raw log entries into one session log per timestamp.
    // Each entry name has the form <user>_<timestamp>.<type>
    const sessions: Record<string, SessionLog> = {};
    for (const [entryName, entryValue] of Object.entries(rawSessions || {})) {
      const parts = entryName.match(/(.*)_(\d+_\d+)\.(.*)/);
      if (!parts) {
        continue;
      }
      const [, user, timestamp, kind] = parts;
      const content = entryValue as string;

      const session: SessionLog = sessions[timestamp] || {};
      sessions[timestamp] = session;

      if (kind === "input") {
        session.input = content;
      } else if (kind === "output") {
        session.output = content;
      } else if (kind === "timing") {
        session.timing = content;
      } else if (kind === "name") {
        session.name = content;
      }
      session.user = user;
    }

    return (
      <HumanBaselineView
        started={startedDate}
        running={running}
        completed={!!answer}
        answer={answer}
        runtime={runtime}
        sessionLogs={Object.values(sessions)}
      />
    );
  },
};
136
+
137
/**
 * Renders a two-column summary of a tools-related state change.
 *
 * Shows the tool choice when one of the changes touches `/tool_choice`, and
 * the tools from the state: only those whose index appears in a change path,
 * or all of them when no change path names a specific tool.
 *
 * @param changes the changes that make up this state change
 * @param resolvedState the state read for `tool_choice` and `tools`
 */
const renderTools = (
  changes: JsonChange[],
  resolvedState: Record<string, unknown>,
) => {
  // Collect the indexes of the tools named by the change paths
  const toolIndexes = new Set<string>();
  for (const change of changes) {
    const match = change.path.match(kToolPattern);
    if (match) {
      toolIndexes.add(match[1]);
    }
  }

  // A tool choice is either an object carrying a name or a plain value
  const toolName = (toolChoice: unknown): string => {
    if (
      typeof toolChoice === "object" &&
      toolChoice &&
      !Array.isArray(toolChoice)
    ) {
      return (toolChoice as Record<string, string>)["name"];
    } else {
      return String(toolChoice);
    }
  };

  const toolsInfo: Record<string, ReactNode> = {};

  // Show tool choice if it was changed
  const hasToolChoice = changes.some((change) =>
    change.path.startsWith("/tool_choice"),
  );
  if (resolvedState.tool_choice && hasToolChoice) {
    toolsInfo["Tool Choice"] = toolName(resolvedState.tool_choice);
  }

  // Show either all tools or just the specific tools. A state without a
  // tools list is treated as having no tools instead of throwing.
  const tools = Array.isArray(resolvedState.tools)
    ? (resolvedState.tools as ToolDefinition[])
    : [];
  if (tools.length > 0) {
    const visibleTools =
      toolIndexes.size === 0
        ? tools
        : tools.filter((_, index) => toolIndexes.has(index.toString()));
    toolsInfo["Tools"] = <Tools toolDefinitions={visibleTools} />;
  }

  return (
    <div className={clsx(styles.tools)}>
      {Object.entries(toolsInfo).map(([label, value]) => {
        return (
          <Fragment key={label}>
            <div
              className={clsx(
                "text-size-smaller",
                "text-style-label",
                "text-style-secondary",
              )}
            >
              {label}
            </div>
            <div className={clsx("text-size-base")}>{value}</div>
          </Fragment>
        );
      })}
    </div>
  );
};
208
+
209
/** Change types that have a custom renderer. */
export const RenderableChangeTypes: ChangeType[] = [
  system_msg_added_sig,
  use_tools,
  add_tools,
];

/** Custom-rendered change types kept in a separate, store-specific list. */
export const StoreSpecificRenderableTypes: ChangeType[] = [
  human_baseline_session,
];
218
+
219
/**
 * Parameter schema of a tool.
 */
interface ToolParameters {
  type: string;
  /**
   * Parameter descriptions keyed by parameter name. Any parameter name is
   * allowed, not only `code`; the keys are what gets listed as the tool's
   * arguments.
   */
  properties: Record<string, ToolProperty>;
  required: string[];
}

/**
 * Description of a single tool parameter.
 */
interface ToolProperty {
  type: string;
  description: string;
}

/**
 * Definition of a tool as found in the state's tools list.
 */
interface ToolDefinition {
  name: string;
  description: string;
  parameters?: ToolParameters;
}

/**
 * Props accepted by the Tools component.
 */
interface ToolsProps {
  toolDefinitions: ToolDefinition[];
}
241
/**
 * Renders a list of tool components based on the provided tool definitions.
 *
 * Each tool is shown with its name and the names of its parameters. Elements
 * are keyed by position and name so that React can track them across renders.
 */
export const Tools: React.FC<ToolsProps> = ({ toolDefinitions }) => {
  return toolDefinitions.map((toolDefinition, index) => {
    const toolName = toolDefinition.name;
    const toolArgs = toolDefinition.parameters?.properties
      ? Object.keys(toolDefinition.parameters.properties)
      : [];
    return (
      <Tool
        key={`${index}-${toolName}`}
        toolName={toolName}
        toolArgs={toolArgs}
      />
    );
  });
};
253
+
254
/**
 * Props accepted by the Tool component.
 */
interface ToolProps {
  /** Name of the tool. */
  toolName: string;
  /** Names of the tool's arguments, shown in call syntax when present. */
  toolArgs?: string[];
  /** Accepted but not read by the component. */
  toolDesc?: string;
}

/**
 * Renders one tool as inline code: `name(arg1, arg2)` when it has arguments,
 * otherwise just its name.
 */
export const Tool: React.FC<ToolProps> = ({ toolName, toolArgs }) => {
  let functionCall = toolName;
  if (toolArgs && toolArgs.length > 0) {
    functionCall = `${toolName}(${toolArgs.join(", ")})`;
  }

  return (
    <div>
      <code className={clsx("text-size-small", styles.tool)}>
        {functionCall}
      </code>
    </div>
  );
};
@@ -0,0 +1,10 @@
1
/* Two-column grid sized to its content. */
.tools {
  margin: 0;
  display: grid;
  grid-template-columns: max-content max-content;
  column-gap: 1rem;
}

/* No padding. */
.tool {
  padding: 0;
}
@@ -0,0 +1,9 @@
1
/* Full-width block with vertical spacing. */
.diff {
  width: 100%;
  margin: 1em 0em;
}

/* Full-width block with vertical spacing. */
.summary {
  width: 100%;
  margin: 1em 0em;
}