inspect-ai 0.3.62__py3-none-any.whl → 0.3.64__py3-none-any.whl

This diff compares the contents of two publicly available package versions as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.
Files changed (518)
  1. inspect_ai/_cli/cache.py +8 -7
  2. inspect_ai/_cli/common.py +0 -12
  3. inspect_ai/_cli/eval.py +32 -4
  4. inspect_ai/_cli/info.py +1 -0
  5. inspect_ai/_cli/list.py +1 -1
  6. inspect_ai/_cli/log.py +2 -0
  7. inspect_ai/_cli/main.py +1 -1
  8. inspect_ai/_cli/sandbox.py +4 -1
  9. inspect_ai/_cli/score.py +181 -32
  10. inspect_ai/_cli/trace.py +10 -0
  11. inspect_ai/_cli/view.py +4 -2
  12. inspect_ai/_display/core/active.py +2 -3
  13. inspect_ai/_display/core/config.py +7 -1
  14. inspect_ai/_display/textual/widgets/samples.py +4 -3
  15. inspect_ai/_display/textual/widgets/sandbox.py +6 -0
  16. inspect_ai/_eval/eval.py +104 -101
  17. inspect_ai/_eval/evalset.py +75 -75
  18. inspect_ai/_eval/loader.py +122 -12
  19. inspect_ai/_eval/registry.py +1 -1
  20. inspect_ai/_eval/run.py +14 -0
  21. inspect_ai/_eval/score.py +125 -36
  22. inspect_ai/_eval/task/log.py +105 -4
  23. inspect_ai/_eval/task/results.py +92 -38
  24. inspect_ai/_eval/task/run.py +9 -2
  25. inspect_ai/_eval/task/sandbox.py +35 -2
  26. inspect_ai/_eval/task/task.py +49 -46
  27. inspect_ai/_util/constants.py +1 -1
  28. inspect_ai/_util/content.py +8 -0
  29. inspect_ai/_util/error.py +2 -0
  30. inspect_ai/_util/file.py +15 -1
  31. inspect_ai/_util/hash.py +1 -1
  32. inspect_ai/_util/logger.py +4 -2
  33. inspect_ai/_util/registry.py +7 -1
  34. inspect_ai/_view/view.py +1 -2
  35. inspect_ai/_view/www/.vscode/extensions.json +3 -0
  36. inspect_ai/_view/www/.vscode/settings.json +8 -0
  37. inspect_ai/_view/www/App.css +97 -29
  38. inspect_ai/_view/www/README.md +1 -1
  39. inspect_ai/_view/www/dist/assets/index.css +16663 -14674
  40. inspect_ai/_view/www/dist/assets/index.js +58808 -51348
  41. inspect_ai/_view/www/dist/index.html +1 -1
  42. inspect_ai/_view/www/index.html +2 -2
  43. inspect_ai/_view/www/log-schema.json +87 -73
  44. inspect_ai/_view/www/package.json +22 -4
  45. inspect_ai/_view/www/postcss.config.cjs +8 -9
  46. inspect_ai/_view/www/src/{App.mjs → App.tsx} +356 -365
  47. inspect_ai/_view/www/src/AppErrorBoundary.tsx +47 -0
  48. inspect_ai/_view/www/src/api/api-browser.ts +2 -2
  49. inspect_ai/_view/www/src/api/api-http.ts +3 -5
  50. inspect_ai/_view/www/src/api/api-vscode.ts +6 -6
  51. inspect_ai/_view/www/src/api/client-api.ts +4 -4
  52. inspect_ai/_view/www/src/api/index.ts +4 -4
  53. inspect_ai/_view/www/src/api/{Types.ts → types.ts} +25 -9
  54. inspect_ai/_view/www/src/appearance/colors.ts +9 -0
  55. inspect_ai/_view/www/src/appearance/fonts.ts +39 -0
  56. inspect_ai/_view/www/src/appearance/icons.ts +100 -0
  57. inspect_ai/_view/www/src/appearance/{Styles.mjs → styles.ts} +2 -32
  58. inspect_ai/_view/www/src/components/AnsiDisplay.tsx +198 -0
  59. inspect_ai/_view/www/src/components/AsciinemaPlayer.tsx +86 -0
  60. inspect_ai/_view/www/src/components/Card.css +60 -0
  61. inspect_ai/_view/www/src/components/Card.tsx +109 -0
  62. inspect_ai/_view/www/src/components/CopyButton.module.css +11 -0
  63. inspect_ai/_view/www/src/components/CopyButton.tsx +58 -0
  64. inspect_ai/_view/www/src/components/DownloadButton.css +4 -0
  65. inspect_ai/_view/www/src/components/DownloadButton.tsx +25 -0
  66. inspect_ai/_view/www/src/components/DownloadPanel.css +10 -0
  67. inspect_ai/_view/www/src/components/DownloadPanel.tsx +30 -0
  68. inspect_ai/_view/www/src/components/EmptyPanel.css +12 -0
  69. inspect_ai/_view/www/src/components/EmptyPanel.tsx +15 -0
  70. inspect_ai/_view/www/src/components/ErrorPanel.css +37 -0
  71. inspect_ai/_view/www/src/components/ErrorPanel.tsx +39 -0
  72. inspect_ai/_view/www/src/components/ExpandablePanel.css +40 -0
  73. inspect_ai/_view/www/src/components/ExpandablePanel.tsx +115 -0
  74. inspect_ai/_view/www/src/components/FindBand.css +49 -0
  75. inspect_ai/_view/www/src/components/FindBand.tsx +130 -0
  76. inspect_ai/_view/www/src/components/HumanBaselineView.css +41 -0
  77. inspect_ai/_view/www/src/components/HumanBaselineView.tsx +162 -0
  78. inspect_ai/_view/www/src/components/JsonPanel.css +20 -0
  79. inspect_ai/_view/www/src/components/JsonPanel.tsx +82 -0
  80. inspect_ai/_view/www/src/components/LabeledValue.css +20 -0
  81. inspect_ai/_view/www/src/components/LabeledValue.tsx +41 -0
  82. inspect_ai/_view/www/src/components/LargeModal.module.css +54 -0
  83. inspect_ai/_view/www/src/components/LargeModal.tsx +189 -0
  84. inspect_ai/_view/www/src/components/LightboxCarousel.css +95 -0
  85. inspect_ai/_view/www/src/components/LightboxCarousel.tsx +132 -0
  86. inspect_ai/_view/www/src/components/MarkdownDiv.css +3 -0
  87. inspect_ai/_view/www/src/components/MarkdownDiv.tsx +133 -0
  88. inspect_ai/_view/www/src/components/MessageBand.css +43 -0
  89. inspect_ai/_view/www/src/components/MessageBand.tsx +39 -0
  90. inspect_ai/_view/www/src/components/MorePopOver.css +0 -0
  91. inspect_ai/_view/www/src/components/MorePopOver.tsx +67 -0
  92. inspect_ai/_view/www/src/components/NavPills.module.css +18 -0
  93. inspect_ai/_view/www/src/components/NavPills.tsx +101 -0
  94. inspect_ai/_view/www/src/components/ProgressBar.module.css +37 -0
  95. inspect_ai/_view/www/src/components/ProgressBar.tsx +22 -0
  96. inspect_ai/_view/www/src/components/TabSet.module.css +40 -0
  97. inspect_ai/_view/www/src/components/TabSet.tsx +215 -0
  98. inspect_ai/_view/www/src/components/ToolButton.css +3 -0
  99. inspect_ai/_view/www/src/components/ToolButton.tsx +27 -0
  100. inspect_ai/_view/www/src/components/VirtualList.module.css +19 -0
  101. inspect_ai/_view/www/src/components/VirtualList.tsx +292 -0
  102. inspect_ai/_view/www/src/{index.js → index.tsx} +45 -19
  103. inspect_ai/_view/www/src/{log → logfile}/remoteLogFile.ts +3 -8
  104. inspect_ai/_view/www/src/{utils/remoteZipFile.mjs → logfile/remoteZipFile.ts} +86 -80
  105. inspect_ai/_view/www/src/metadata/MetaDataGrid.tsx +83 -0
  106. inspect_ai/_view/www/src/metadata/MetaDataView.module.css +35 -0
  107. inspect_ai/_view/www/src/metadata/MetaDataView.tsx +95 -0
  108. inspect_ai/_view/www/src/metadata/MetadataGrid.module.css +15 -0
  109. inspect_ai/_view/www/src/metadata/RenderedContent.module.css +12 -0
  110. inspect_ai/_view/www/src/{components/RenderedContent/RenderedContent.mjs → metadata/RenderedContent.tsx} +92 -73
  111. inspect_ai/_view/www/src/metadata/types.ts +18 -0
  112. inspect_ai/_view/www/src/plan/DatasetDetailView.module.css +3 -0
  113. inspect_ai/_view/www/src/plan/DatasetDetailView.tsx +37 -0
  114. inspect_ai/_view/www/src/plan/DetailStep.module.css +9 -0
  115. inspect_ai/_view/www/src/plan/DetailStep.tsx +31 -0
  116. inspect_ai/_view/www/src/plan/PlanCard.tsx +28 -0
  117. inspect_ai/_view/www/src/plan/PlanDetailView.module.css +48 -0
  118. inspect_ai/_view/www/src/plan/PlanDetailView.tsx +324 -0
  119. inspect_ai/_view/www/src/plan/ScorerDetailView.module.css +3 -0
  120. inspect_ai/_view/www/src/plan/ScorerDetailView.tsx +30 -0
  121. inspect_ai/_view/www/src/plan/SolverDetailView.module.css +15 -0
  122. inspect_ai/_view/www/src/plan/SolverDetailView.tsx +32 -0
  123. inspect_ai/_view/www/src/samples/InlineSampleDisplay.module.css +8 -0
  124. inspect_ai/_view/www/src/samples/InlineSampleDisplay.tsx +53 -0
  125. inspect_ai/_view/www/src/samples/SampleDialog.tsx +122 -0
  126. inspect_ai/_view/www/src/samples/SampleDisplay.module.css +29 -0
  127. inspect_ai/_view/www/src/samples/SampleDisplay.tsx +331 -0
  128. inspect_ai/_view/www/src/samples/SampleSummaryView.module.css +24 -0
  129. inspect_ai/_view/www/src/samples/SampleSummaryView.tsx +177 -0
  130. inspect_ai/_view/www/src/samples/SamplesTools.tsx +52 -0
  131. inspect_ai/_view/www/src/samples/chat/ChatMessage.module.css +29 -0
  132. inspect_ai/_view/www/src/samples/chat/ChatMessage.tsx +76 -0
  133. inspect_ai/_view/www/src/samples/chat/ChatMessageRenderer.tsx +60 -0
  134. inspect_ai/_view/www/src/samples/chat/ChatMessageRow.module.css +9 -0
  135. inspect_ai/_view/www/src/samples/chat/ChatMessageRow.tsx +57 -0
  136. inspect_ai/_view/www/src/samples/chat/ChatView.tsx +47 -0
  137. inspect_ai/_view/www/src/samples/chat/ChatViewVirtualList.module.css +4 -0
  138. inspect_ai/_view/www/src/samples/chat/ChatViewVirtualList.tsx +58 -0
  139. inspect_ai/_view/www/src/samples/chat/MessageContent.module.css +4 -0
  140. inspect_ai/_view/www/src/samples/chat/MessageContent.tsx +157 -0
  141. inspect_ai/_view/www/src/samples/chat/MessageContents.module.css +3 -0
  142. inspect_ai/_view/www/src/samples/chat/MessageContents.tsx +133 -0
  143. inspect_ai/_view/www/src/samples/chat/messages.ts +112 -0
  144. inspect_ai/_view/www/src/samples/chat/tools/ToolCallView.tsx +147 -0
  145. inspect_ai/_view/www/src/samples/chat/tools/ToolInput.module.css +14 -0
  146. inspect_ai/_view/www/src/samples/chat/tools/ToolInput.tsx +76 -0
  147. inspect_ai/_view/www/src/samples/chat/tools/ToolOutput.module.css +19 -0
  148. inspect_ai/_view/www/src/samples/chat/tools/ToolOutput.tsx +60 -0
  149. inspect_ai/_view/www/src/samples/chat/tools/ToolTitle.module.css +4 -0
  150. inspect_ai/_view/www/src/samples/chat/tools/ToolTitle.tsx +18 -0
  151. inspect_ai/_view/www/src/samples/chat/tools/tool.ts +92 -0
  152. inspect_ai/_view/www/src/samples/descriptor/samplesDescriptor.tsx +365 -0
  153. inspect_ai/_view/www/src/samples/descriptor/score/BooleanScoreDescriptor.module.css +22 -0
  154. inspect_ai/_view/www/src/samples/descriptor/score/BooleanScoreDescriptor.tsx +26 -0
  155. inspect_ai/_view/www/src/samples/descriptor/score/CategoricalScoreDescriptor.tsx +18 -0
  156. inspect_ai/_view/www/src/samples/descriptor/score/NumericScoreDescriptor.tsx +27 -0
  157. inspect_ai/_view/www/src/samples/descriptor/score/ObjectScoreDescriptor.module.css +18 -0
  158. inspect_ai/_view/www/src/samples/descriptor/score/ObjectScoreDescriptor.tsx +71 -0
  159. inspect_ai/_view/www/src/samples/descriptor/score/OtherScoreDescriptor.tsx +20 -0
  160. inspect_ai/_view/www/src/samples/descriptor/score/PassFailScoreDescriptor.module.css +28 -0
  161. inspect_ai/_view/www/src/samples/descriptor/score/PassFailScoreDescriptor.tsx +81 -0
  162. inspect_ai/_view/www/src/samples/descriptor/score/ScoreDescriptor.tsx +99 -0
  163. inspect_ai/_view/www/src/samples/descriptor/types.ts +55 -0
  164. inspect_ai/_view/www/src/samples/error/FlatSampleErrorView.module.css +19 -0
  165. inspect_ai/_view/www/src/samples/error/FlatSampleErrorView.tsx +22 -0
  166. inspect_ai/_view/www/src/samples/error/SampleErrorView.module.css +17 -0
  167. inspect_ai/_view/www/src/samples/error/SampleErrorView.tsx +31 -0
  168. inspect_ai/_view/www/src/samples/error/error.ts +15 -0
  169. inspect_ai/_view/www/src/samples/list/SampleFooter.module.css +9 -0
  170. inspect_ai/_view/www/src/samples/list/SampleFooter.tsx +14 -0
  171. inspect_ai/_view/www/src/samples/list/SampleHeader.module.css +13 -0
  172. inspect_ai/_view/www/src/samples/list/SampleHeader.tsx +36 -0
  173. inspect_ai/_view/www/src/samples/list/SampleList.module.css +11 -0
  174. inspect_ai/_view/www/src/samples/list/SampleList.tsx +247 -0
  175. inspect_ai/_view/www/src/samples/list/SampleRow.module.css +33 -0
  176. inspect_ai/_view/www/src/samples/list/SampleRow.tsx +98 -0
  177. inspect_ai/_view/www/src/samples/list/SampleSeparator.module.css +6 -0
  178. inspect_ai/_view/www/src/samples/list/SampleSeparator.tsx +24 -0
  179. inspect_ai/_view/www/src/samples/sample-tools/EpochFilter.module.css +9 -0
  180. inspect_ai/_view/www/src/samples/sample-tools/EpochFilter.tsx +51 -0
  181. inspect_ai/_view/www/src/samples/sample-tools/SelectScorer.module.css +16 -0
  182. inspect_ai/_view/www/src/samples/sample-tools/SelectScorer.tsx +175 -0
  183. inspect_ai/_view/www/src/samples/sample-tools/SortFilter.module.css +9 -0
  184. inspect_ai/_view/www/src/samples/sample-tools/SortFilter.tsx +186 -0
  185. inspect_ai/_view/www/src/samples/{tools/filters.mjs → sample-tools/filters.ts} +86 -81
  186. inspect_ai/_view/www/src/samples/sample-tools/sample-filter/SampleFilter.module.css +16 -0
  187. inspect_ai/_view/www/src/samples/sample-tools/sample-filter/SampleFilter.tsx +288 -0
  188. inspect_ai/_view/www/src/samples/sample-tools/sample-filter/completions.ts +346 -0
  189. inspect_ai/_view/www/src/samples/sample-tools/sample-filter/language.ts +19 -0
  190. inspect_ai/_view/www/src/samples/sample-tools/sample-filter/tokenize.ts +97 -0
  191. inspect_ai/_view/www/src/samples/{SampleLimit.mjs → sampleLimit.ts} +3 -6
  192. inspect_ai/_view/www/src/samples/scores/SampleScoreView.module.css +53 -0
  193. inspect_ai/_view/www/src/samples/scores/SampleScoreView.tsx +168 -0
  194. inspect_ai/_view/www/src/samples/scores/SampleScores.module.css +5 -0
  195. inspect_ai/_view/www/src/samples/scores/SampleScores.tsx +37 -0
  196. inspect_ai/_view/www/src/samples/transcript/ApprovalEventView.tsx +66 -0
  197. inspect_ai/_view/www/src/samples/transcript/ErrorEventView.tsx +51 -0
  198. inspect_ai/_view/www/src/samples/transcript/InfoEventView.module.css +3 -0
  199. inspect_ai/_view/www/src/samples/transcript/InfoEventView.tsx +54 -0
  200. inspect_ai/_view/www/src/samples/transcript/InputEventView.tsx +48 -0
  201. inspect_ai/_view/www/src/samples/transcript/LoggerEventView.module.css +6 -0
  202. inspect_ai/_view/www/src/samples/transcript/LoggerEventView.tsx +36 -0
  203. inspect_ai/_view/www/src/samples/transcript/ModelEventView.module.css +43 -0
  204. inspect_ai/_view/www/src/samples/transcript/ModelEventView.tsx +223 -0
  205. inspect_ai/_view/www/src/samples/transcript/SampleInitEventView.module.css +23 -0
  206. inspect_ai/_view/www/src/samples/transcript/SampleInitEventView.tsx +112 -0
  207. inspect_ai/_view/www/src/samples/transcript/SampleLimitEventView.tsx +75 -0
  208. inspect_ai/_view/www/src/samples/transcript/SampleTranscript.tsx +22 -0
  209. inspect_ai/_view/www/src/samples/transcript/ScoreEventView.module.css +15 -0
  210. inspect_ai/_view/www/src/samples/transcript/ScoreEventView.tsx +100 -0
  211. inspect_ai/_view/www/src/samples/transcript/StepEventView.tsx +171 -0
  212. inspect_ai/_view/www/src/samples/transcript/SubtaskEventView.module.css +19 -0
  213. inspect_ai/_view/www/src/samples/transcript/SubtaskEventView.tsx +133 -0
  214. inspect_ai/_view/www/src/samples/transcript/ToolEventView.module.css +10 -0
  215. inspect_ai/_view/www/src/samples/transcript/ToolEventView.tsx +92 -0
  216. inspect_ai/_view/www/src/samples/transcript/TranscriptView.module.css +49 -0
  217. inspect_ai/_view/www/src/samples/transcript/TranscriptView.tsx +449 -0
  218. inspect_ai/_view/www/src/samples/transcript/event/EventNav.module.css +5 -0
  219. inspect_ai/_view/www/src/samples/transcript/event/EventNav.tsx +43 -0
  220. inspect_ai/_view/www/src/samples/transcript/event/EventNavs.module.css +3 -0
  221. inspect_ai/_view/www/src/samples/transcript/event/EventNavs.tsx +39 -0
  222. inspect_ai/_view/www/src/samples/transcript/event/EventPanel.module.css +25 -0
  223. inspect_ai/_view/www/src/samples/transcript/event/EventPanel.tsx +191 -0
  224. inspect_ai/_view/www/src/samples/transcript/event/EventRow.module.css +13 -0
  225. inspect_ai/_view/www/src/samples/transcript/event/EventRow.tsx +32 -0
  226. inspect_ai/_view/www/src/samples/transcript/event/EventSection.module.css +8 -0
  227. inspect_ai/_view/www/src/samples/transcript/event/EventSection.tsx +29 -0
  228. inspect_ai/_view/www/src/samples/transcript/state/StateDiffView.tsx +67 -0
  229. inspect_ai/_view/www/src/samples/transcript/state/StateEventRenderers.tsx +285 -0
  230. inspect_ai/_view/www/src/samples/transcript/state/StateEventRenders.module.css +10 -0
  231. inspect_ai/_view/www/src/samples/transcript/state/StateEventView.module.css +9 -0
  232. inspect_ai/_view/www/src/samples/transcript/state/StateEventView.tsx +346 -0
  233. inspect_ai/_view/www/src/samples/transcript/types.ts +58 -0
  234. inspect_ai/_view/www/src/types/log.d.ts +108 -19
  235. inspect_ai/_view/www/src/types/prism.d.ts +11 -0
  236. inspect_ai/_view/www/src/types.ts +71 -0
  237. inspect_ai/_view/www/src/usage/ModelTokenTable.tsx +28 -0
  238. inspect_ai/_view/www/src/usage/ModelUsagePanel.module.css +24 -0
  239. inspect_ai/_view/www/src/usage/ModelUsagePanel.tsx +97 -0
  240. inspect_ai/_view/www/src/usage/TokenTable.module.css +17 -0
  241. inspect_ai/_view/www/src/usage/TokenTable.tsx +91 -0
  242. inspect_ai/_view/www/src/usage/UsageCard.module.css +15 -0
  243. inspect_ai/_view/www/src/usage/UsageCard.tsx +67 -0
  244. inspect_ai/_view/www/src/utils/attachments.ts +42 -0
  245. inspect_ai/_view/www/src/utils/{Base64.mjs → base64.ts} +1 -6
  246. inspect_ai/_view/www/src/{components/Browser.mjs → utils/browser.ts} +0 -1
  247. inspect_ai/_view/www/src/utils/debugging.ts +28 -0
  248. inspect_ai/_view/www/src/utils/dom.ts +30 -0
  249. inspect_ai/_view/www/src/utils/format.ts +194 -0
  250. inspect_ai/_view/www/src/utils/git.ts +7 -0
  251. inspect_ai/_view/www/src/utils/html.ts +6 -0
  252. inspect_ai/_view/www/src/utils/http.ts +14 -0
  253. inspect_ai/_view/www/src/utils/{Path.mjs → path.ts} +2 -9
  254. inspect_ai/_view/www/src/utils/{Print.mjs → print.ts} +34 -26
  255. inspect_ai/_view/www/src/utils/queue.ts +51 -0
  256. inspect_ai/_view/www/src/utils/sync.ts +114 -0
  257. inspect_ai/_view/www/src/utils/{Type.mjs → type.ts} +3 -6
  258. inspect_ai/_view/www/src/utils/vscode.ts +13 -0
  259. inspect_ai/_view/www/src/workspace/WorkSpace.tsx +324 -0
  260. inspect_ai/_view/www/src/workspace/WorkSpaceView.module.css +33 -0
  261. inspect_ai/_view/www/src/workspace/WorkSpaceView.tsx +158 -0
  262. inspect_ai/_view/www/src/workspace/error/TaskErrorPanel.module.css +3 -0
  263. inspect_ai/_view/www/src/workspace/error/TaskErrorPanel.tsx +28 -0
  264. inspect_ai/_view/www/src/workspace/navbar/Navbar.module.css +54 -0
  265. inspect_ai/_view/www/src/workspace/navbar/Navbar.tsx +68 -0
  266. inspect_ai/_view/www/src/workspace/navbar/PrimaryBar.module.css +52 -0
  267. inspect_ai/_view/www/src/workspace/navbar/PrimaryBar.tsx +114 -0
  268. inspect_ai/_view/www/src/workspace/navbar/ResultsPanel.module.css +90 -0
  269. inspect_ai/_view/www/src/workspace/navbar/ResultsPanel.tsx +180 -0
  270. inspect_ai/_view/www/src/workspace/navbar/SecondaryBar.module.css +28 -0
  271. inspect_ai/_view/www/src/workspace/navbar/SecondaryBar.tsx +226 -0
  272. inspect_ai/_view/www/src/workspace/navbar/StatusPanel.module.css +14 -0
  273. inspect_ai/_view/www/src/workspace/navbar/StatusPanel.tsx +61 -0
  274. inspect_ai/_view/www/src/workspace/sidebar/EvalStatus.module.css +15 -0
  275. inspect_ai/_view/www/src/workspace/sidebar/EvalStatus.tsx +71 -0
  276. inspect_ai/_view/www/src/workspace/sidebar/LogDirectoryTitleView.module.css +5 -0
  277. inspect_ai/_view/www/src/workspace/sidebar/LogDirectoryTitleView.tsx +56 -0
  278. inspect_ai/_view/www/src/workspace/sidebar/Sidebar.module.css +68 -0
  279. inspect_ai/_view/www/src/workspace/sidebar/Sidebar.tsx +85 -0
  280. inspect_ai/_view/www/src/workspace/sidebar/SidebarLogEntry.module.css +29 -0
  281. inspect_ai/_view/www/src/workspace/sidebar/SidebarLogEntry.tsx +95 -0
  282. inspect_ai/_view/www/src/workspace/sidebar/SidebarScoreView.module.css +23 -0
  283. inspect_ai/_view/www/src/workspace/sidebar/SidebarScoreView.tsx +43 -0
  284. inspect_ai/_view/www/src/workspace/sidebar/SidebarScoresView.module.css +35 -0
  285. inspect_ai/_view/www/src/workspace/sidebar/SidebarScoresView.tsx +63 -0
  286. inspect_ai/_view/www/src/workspace/tabs/InfoTab.module.css +0 -0
  287. inspect_ai/_view/www/src/workspace/tabs/InfoTab.tsx +70 -0
  288. inspect_ai/_view/www/src/workspace/tabs/JsonTab.module.css +5 -0
  289. inspect_ai/_view/www/src/workspace/tabs/JsonTab.tsx +46 -0
  290. inspect_ai/_view/www/src/workspace/tabs/SamplesTab.tsx +204 -0
  291. inspect_ai/_view/www/src/workspace/tabs/grouping.ts +195 -0
  292. inspect_ai/_view/www/src/workspace/tabs/types.ts +19 -0
  293. inspect_ai/_view/www/src/workspace/types.ts +10 -0
  294. inspect_ai/_view/www/src/workspace/utils.ts +34 -0
  295. inspect_ai/_view/www/tsconfig.json +23 -9
  296. inspect_ai/_view/www/vite.config.js +8 -17
  297. inspect_ai/_view/www/yarn.lock +627 -556
  298. inspect_ai/approval/_approval.py +2 -0
  299. inspect_ai/approval/_approver.py +4 -4
  300. inspect_ai/approval/_auto.py +1 -1
  301. inspect_ai/approval/_human/approver.py +3 -0
  302. inspect_ai/approval/_policy.py +5 -0
  303. inspect_ai/approval/_registry.py +2 -2
  304. inspect_ai/dataset/_dataset.py +64 -37
  305. inspect_ai/dataset/_sources/__init__.py +0 -0
  306. inspect_ai/dataset/_sources/csv.py +20 -12
  307. inspect_ai/dataset/_sources/file.py +4 -0
  308. inspect_ai/dataset/_sources/hf.py +39 -29
  309. inspect_ai/dataset/_sources/json.py +17 -9
  310. inspect_ai/log/__init__.py +2 -0
  311. inspect_ai/log/_convert.py +3 -3
  312. inspect_ai/log/_file.py +24 -9
  313. inspect_ai/log/_log.py +101 -13
  314. inspect_ai/log/_message.py +4 -2
  315. inspect_ai/log/_recorders/file.py +4 -0
  316. inspect_ai/log/_recorders/json.py +5 -7
  317. inspect_ai/log/_recorders/recorder.py +3 -0
  318. inspect_ai/log/_transcript.py +19 -8
  319. inspect_ai/model/__init__.py +2 -0
  320. inspect_ai/model/_cache.py +39 -21
  321. inspect_ai/model/_call_tools.py +4 -3
  322. inspect_ai/model/_chat_message.py +14 -4
  323. inspect_ai/model/_generate_config.py +1 -1
  324. inspect_ai/model/_model.py +31 -24
  325. inspect_ai/model/_model_output.py +14 -1
  326. inspect_ai/model/_openai.py +10 -18
  327. inspect_ai/model/_providers/anthropic.py +3 -3
  328. inspect_ai/model/_providers/google.py +9 -5
  329. inspect_ai/model/_providers/openai.py +5 -9
  330. inspect_ai/model/_providers/openai_o1.py +3 -5
  331. inspect_ai/model/_providers/openrouter.py +86 -0
  332. inspect_ai/model/_providers/providers.py +11 -0
  333. inspect_ai/scorer/__init__.py +6 -1
  334. inspect_ai/scorer/_answer.py +7 -7
  335. inspect_ai/scorer/_classification.py +38 -18
  336. inspect_ai/scorer/_common.py +2 -8
  337. inspect_ai/scorer/_match.py +4 -5
  338. inspect_ai/scorer/_metric.py +87 -28
  339. inspect_ai/scorer/_metrics/__init__.py +3 -3
  340. inspect_ai/scorer/_metrics/accuracy.py +8 -10
  341. inspect_ai/scorer/_metrics/mean.py +3 -17
  342. inspect_ai/scorer/_metrics/std.py +111 -30
  343. inspect_ai/scorer/_model.py +12 -12
  344. inspect_ai/scorer/_pattern.py +3 -3
  345. inspect_ai/scorer/_reducer/reducer.py +36 -21
  346. inspect_ai/scorer/_reducer/registry.py +2 -2
  347. inspect_ai/scorer/_reducer/types.py +7 -1
  348. inspect_ai/scorer/_score.py +11 -1
  349. inspect_ai/scorer/_scorer.py +110 -16
  350. inspect_ai/solver/__init__.py +1 -1
  351. inspect_ai/solver/_basic_agent.py +19 -22
  352. inspect_ai/solver/_bridge/__init__.py +0 -3
  353. inspect_ai/solver/_bridge/bridge.py +3 -3
  354. inspect_ai/solver/_chain.py +1 -2
  355. inspect_ai/solver/_critique.py +3 -3
  356. inspect_ai/solver/_fork.py +2 -2
  357. inspect_ai/solver/_human_agent/__init__.py +0 -0
  358. inspect_ai/solver/_human_agent/agent.py +5 -8
  359. inspect_ai/solver/_human_agent/commands/clock.py +14 -10
  360. inspect_ai/solver/_human_agent/commands/note.py +1 -1
  361. inspect_ai/solver/_human_agent/commands/score.py +0 -11
  362. inspect_ai/solver/_multiple_choice.py +38 -26
  363. inspect_ai/solver/_prompt.py +7 -7
  364. inspect_ai/solver/_solver.py +53 -52
  365. inspect_ai/solver/_task_state.py +80 -69
  366. inspect_ai/solver/_use_tools.py +9 -9
  367. inspect_ai/tool/__init__.py +4 -1
  368. inspect_ai/tool/_tool.py +43 -14
  369. inspect_ai/tool/_tool_call.py +6 -2
  370. inspect_ai/tool/_tool_choice.py +3 -1
  371. inspect_ai/tool/_tool_def.py +10 -8
  372. inspect_ai/tool/_tool_params.py +24 -0
  373. inspect_ai/tool/_tool_with.py +7 -7
  374. inspect_ai/tool/_tools/__init__.py +0 -0
  375. inspect_ai/tool/{beta → _tools}/_computer/_common.py +2 -2
  376. inspect_ai/tool/{beta → _tools}/_computer/_computer.py +13 -5
  377. inspect_ai/tool/_tools/_computer/_resources/tool/__init__.py +0 -0
  378. inspect_ai/tool/{beta → _tools}/_computer/_resources/tool/_x11_client.py +1 -1
  379. inspect_ai/tool/_tools/_computer/_resources/tool/requirements.txt +0 -0
  380. inspect_ai/tool/_tools/_execute.py +23 -11
  381. inspect_ai/tool/_tools/_web_browser/_resources/README.md +2 -2
  382. inspect_ai/tool/_tools/_web_browser/_web_browser.py +5 -3
  383. inspect_ai/tool/_tools/_web_search.py +7 -5
  384. inspect_ai/tool/beta.py +3 -0
  385. inspect_ai/util/_concurrency.py +3 -3
  386. inspect_ai/util/_panel.py +2 -0
  387. inspect_ai/util/_resource.py +12 -12
  388. inspect_ai/util/_sandbox/docker/compose.py +23 -20
  389. inspect_ai/util/_sandbox/docker/config.py +2 -1
  390. inspect_ai/util/_sandbox/docker/docker.py +42 -86
  391. inspect_ai/util/_sandbox/docker/service.py +100 -0
  392. inspect_ai/util/_sandbox/environment.py +99 -96
  393. inspect_ai/util/_sandbox/self_check.py +124 -16
  394. inspect_ai/util/_subprocess.py +5 -3
  395. inspect_ai/util/_subtask.py +15 -16
  396. {inspect_ai-0.3.62.dist-info → inspect_ai-0.3.64.dist-info}/LICENSE +1 -1
  397. {inspect_ai-0.3.62.dist-info → inspect_ai-0.3.64.dist-info}/METADATA +11 -6
  398. inspect_ai-0.3.64.dist-info/RECORD +625 -0
  399. inspect_ai/_view/www/src/Register.mjs +0 -3
  400. inspect_ai/_view/www/src/Types.mjs +0 -38
  401. inspect_ai/_view/www/src/appearance/Colors.mjs +0 -27
  402. inspect_ai/_view/www/src/appearance/Fonts.mjs +0 -66
  403. inspect_ai/_view/www/src/appearance/Icons.mjs +0 -240
  404. inspect_ai/_view/www/src/components/AnsiDisplay.mjs +0 -184
  405. inspect_ai/_view/www/src/components/AppErrorBoundary.mjs +0 -34
  406. inspect_ai/_view/www/src/components/AsciiCinemaPlayer.mjs +0 -74
  407. inspect_ai/_view/www/src/components/Card.mjs +0 -126
  408. inspect_ai/_view/www/src/components/ChatView.mjs +0 -441
  409. inspect_ai/_view/www/src/components/CopyButton.mjs +0 -48
  410. inspect_ai/_view/www/src/components/Dialog.mjs +0 -61
  411. inspect_ai/_view/www/src/components/DownloadButton.mjs +0 -15
  412. inspect_ai/_view/www/src/components/DownloadPanel.mjs +0 -29
  413. inspect_ai/_view/www/src/components/EmptyPanel.mjs +0 -23
  414. inspect_ai/_view/www/src/components/ErrorPanel.mjs +0 -66
  415. inspect_ai/_view/www/src/components/ExpandablePanel.mjs +0 -136
  416. inspect_ai/_view/www/src/components/FindBand.mjs +0 -157
  417. inspect_ai/_view/www/src/components/HumanBaselineView.mjs +0 -168
  418. inspect_ai/_view/www/src/components/JsonPanel.mjs +0 -61
  419. inspect_ai/_view/www/src/components/LabeledValue.mjs +0 -32
  420. inspect_ai/_view/www/src/components/LargeModal.mjs +0 -190
  421. inspect_ai/_view/www/src/components/LightboxCarousel.mjs +0 -217
  422. inspect_ai/_view/www/src/components/MarkdownDiv.mjs +0 -118
  423. inspect_ai/_view/www/src/components/MessageBand.mjs +0 -48
  424. inspect_ai/_view/www/src/components/MessageContent.mjs +0 -111
  425. inspect_ai/_view/www/src/components/MetaDataGrid.mjs +0 -92
  426. inspect_ai/_view/www/src/components/MetaDataView.mjs +0 -109
  427. inspect_ai/_view/www/src/components/MorePopOver.mjs +0 -50
  428. inspect_ai/_view/www/src/components/NavPills.mjs +0 -63
  429. inspect_ai/_view/www/src/components/ProgressBar.mjs +0 -51
  430. inspect_ai/_view/www/src/components/RenderedContent/ChatMessageRenderer.mjs +0 -54
  431. inspect_ai/_view/www/src/components/RenderedContent/Types.mjs +0 -19
  432. inspect_ai/_view/www/src/components/TabSet.mjs +0 -184
  433. inspect_ai/_view/www/src/components/ToolButton.mjs +0 -16
  434. inspect_ai/_view/www/src/components/Tools.mjs +0 -376
  435. inspect_ai/_view/www/src/components/VirtualList.mjs +0 -280
  436. inspect_ai/_view/www/src/components/ansi-output.js +0 -932
  437. inspect_ai/_view/www/src/json/JsonTab.mjs +0 -48
  438. inspect_ai/_view/www/src/log-reader/Log-Reader.mjs +0 -25
  439. inspect_ai/_view/www/src/log-reader/Native-Log-Reader.mjs +0 -13
  440. inspect_ai/_view/www/src/log-reader/Open-AI-Log-Reader.mjs +0 -263
  441. inspect_ai/_view/www/src/navbar/Navbar.mjs +0 -418
  442. inspect_ai/_view/www/src/navbar/SecondaryBar.mjs +0 -175
  443. inspect_ai/_view/www/src/plan/PlanCard.mjs +0 -418
  444. inspect_ai/_view/www/src/samples/SampleDialog.mjs +0 -123
  445. inspect_ai/_view/www/src/samples/SampleDisplay.mjs +0 -516
  446. inspect_ai/_view/www/src/samples/SampleError.mjs +0 -99
  447. inspect_ai/_view/www/src/samples/SampleList.mjs +0 -427
  448. inspect_ai/_view/www/src/samples/SampleScoreView.mjs +0 -172
  449. inspect_ai/_view/www/src/samples/SampleScores.mjs +0 -34
  450. inspect_ai/_view/www/src/samples/SampleTranscript.mjs +0 -20
  451. inspect_ai/_view/www/src/samples/SamplesDescriptor.mjs +0 -771
  452. inspect_ai/_view/www/src/samples/SamplesTab.mjs +0 -399
  453. inspect_ai/_view/www/src/samples/SamplesTools.mjs +0 -64
  454. inspect_ai/_view/www/src/samples/tools/EpochFilter.mjs +0 -38
  455. inspect_ai/_view/www/src/samples/tools/SampleFilter.mjs +0 -756
  456. inspect_ai/_view/www/src/samples/tools/SelectScorer.mjs +0 -141
  457. inspect_ai/_view/www/src/samples/tools/SortFilter.mjs +0 -151
  458. inspect_ai/_view/www/src/samples/transcript/ApprovalEventView.mjs +0 -71
  459. inspect_ai/_view/www/src/samples/transcript/ErrorEventView.mjs +0 -44
  460. inspect_ai/_view/www/src/samples/transcript/EventPanel.mjs +0 -271
  461. inspect_ai/_view/www/src/samples/transcript/EventRow.mjs +0 -46
  462. inspect_ai/_view/www/src/samples/transcript/EventSection.mjs +0 -33
  463. inspect_ai/_view/www/src/samples/transcript/InfoEventView.mjs +0 -59
  464. inspect_ai/_view/www/src/samples/transcript/InputEventView.mjs +0 -44
  465. inspect_ai/_view/www/src/samples/transcript/LoggerEventView.mjs +0 -32
  466. inspect_ai/_view/www/src/samples/transcript/ModelEventView.mjs +0 -216
  467. inspect_ai/_view/www/src/samples/transcript/SampleInitEventView.mjs +0 -107
  468. inspect_ai/_view/www/src/samples/transcript/SampleLimitEventView.mjs +0 -74
  469. inspect_ai/_view/www/src/samples/transcript/ScoreEventView.mjs +0 -100
  470. inspect_ai/_view/www/src/samples/transcript/StepEventView.mjs +0 -187
  471. inspect_ai/_view/www/src/samples/transcript/SubtaskEventView.mjs +0 -133
  472. inspect_ai/_view/www/src/samples/transcript/ToolEventView.mjs +0 -88
  473. inspect_ai/_view/www/src/samples/transcript/TranscriptView.mjs +0 -459
  474. inspect_ai/_view/www/src/samples/transcript/Types.mjs +0 -44
  475. inspect_ai/_view/www/src/samples/transcript/state/StateDiffView.mjs +0 -53
  476. inspect_ai/_view/www/src/samples/transcript/state/StateEventRenderers.mjs +0 -254
  477. inspect_ai/_view/www/src/samples/transcript/state/StateEventView.mjs +0 -313
  478. inspect_ai/_view/www/src/sidebar/Sidebar.mjs +0 -418
  479. inspect_ai/_view/www/src/usage/ModelTokenTable.mjs +0 -72
  480. inspect_ai/_view/www/src/usage/UsageCard.mjs +0 -159
  481. inspect_ai/_view/www/src/utils/Format.mjs +0 -260
  482. inspect_ai/_view/www/src/utils/Git.mjs +0 -12
  483. inspect_ai/_view/www/src/utils/Html.mjs +0 -21
  484. inspect_ai/_view/www/src/utils/attachments.mjs +0 -31
  485. inspect_ai/_view/www/src/utils/debugging.mjs +0 -23
  486. inspect_ai/_view/www/src/utils/http.mjs +0 -18
  487. inspect_ai/_view/www/src/utils/queue.mjs +0 -67
  488. inspect_ai/_view/www/src/utils/sync.mjs +0 -101
  489. inspect_ai/_view/www/src/workspace/TaskErrorPanel.mjs +0 -17
  490. inspect_ai/_view/www/src/workspace/WorkSpace.mjs +0 -516
  491. inspect_ai/tool/beta/__init__.py +0 -5
  492. inspect_ai-0.3.62.dist-info/RECORD +0 -481
  493. /inspect_ai/{tool/beta/_computer/_resources/tool → _eval}/__init__.py +0 -0
  494. /inspect_ai/{tool/beta/_computer/_resources/tool/requirements.txt → _util/__init__.py} +0 -0
  495. /inspect_ai/_view/www/src/{constants.mjs → constants.ts} +0 -0
  496. /inspect_ai/tool/{beta → _tools}/_computer/__init__.py +0 -0
  497. /inspect_ai/tool/{beta → _tools}/_computer/_computer_split.py +0 -0
  498. /inspect_ai/tool/{beta → _tools}/_computer/_resources/Dockerfile +0 -0
  499. /inspect_ai/tool/{beta → _tools}/_computer/_resources/README.md +0 -0
  500. /inspect_ai/tool/{beta → _tools}/_computer/_resources/entrypoint/entrypoint.sh +0 -0
  501. /inspect_ai/tool/{beta → _tools}/_computer/_resources/entrypoint/novnc_startup.sh +0 -0
  502. /inspect_ai/tool/{beta → _tools}/_computer/_resources/entrypoint/x11vnc_startup.sh +0 -0
  503. /inspect_ai/tool/{beta → _tools}/_computer/_resources/entrypoint/xfce_startup.sh +0 -0
  504. /inspect_ai/tool/{beta → _tools}/_computer/_resources/entrypoint/xvfb_startup.sh +0 -0
  505. /inspect_ai/tool/{beta → _tools}/_computer/_resources/image_home_dir/.config/Code/User/globalStorage/state.vscdb +0 -0
  506. /inspect_ai/tool/{beta → _tools}/_computer/_resources/image_home_dir/.config/Code/User/settings.json +0 -0
  507. /inspect_ai/tool/{beta → _tools}/_computer/_resources/image_home_dir/.config/xfce4/xfconf/xfce-perchannel-xml/xfce4-panel.xml +0 -0
  508. /inspect_ai/tool/{beta → _tools}/_computer/_resources/image_home_dir/.config/xfce4/xfconf/xfce-perchannel-xml/xfce4-screensaver.xml +0 -0
  509. /inspect_ai/tool/{beta → _tools}/_computer/_resources/image_home_dir/Desktop/Firefox Web Browser.desktop +0 -0
  510. /inspect_ai/tool/{beta → _tools}/_computer/_resources/image_home_dir/Desktop/Terminal.desktop +0 -0
  511. /inspect_ai/tool/{beta → _tools}/_computer/_resources/image_home_dir/Desktop/Visual Studio Code.desktop +0 -0
  512. /inspect_ai/tool/{beta → _tools}/_computer/_resources/tool/_logger.py +0 -0
  513. /inspect_ai/tool/{beta → _tools}/_computer/_resources/tool/_run.py +0 -0
  514. /inspect_ai/tool/{beta → _tools}/_computer/_resources/tool/_tool_result.py +0 -0
  515. /inspect_ai/tool/{beta → _tools}/_computer/_resources/tool/computer_tool.py +0 -0
  516. {inspect_ai-0.3.62.dist-info → inspect_ai-0.3.64.dist-info}/WHEEL +0 -0
  517. {inspect_ai-0.3.62.dist-info → inspect_ai-0.3.64.dist-info}/entry_points.txt +0 -0
  518. {inspect_ai-0.3.62.dist-info → inspect_ai-0.3.64.dist-info}/top_level.txt +0 -0
@@ -0,0 +1,47 @@
1
+ import { Component, ErrorInfo, ReactNode } from "react";
2
+ import { ErrorPanel } from "./components/ErrorPanel";
3
+
4
+ interface Props {
5
+ children: ReactNode;
6
+ }
7
+
8
+ interface State {
9
+ hasError: boolean;
10
+ error?: Error;
11
+ }
12
+
13
+ export class AppErrorBoundary extends Component<Props, State> {
14
+ constructor(props: Props) {
15
+ super(props);
16
+ this.state = { hasError: false };
17
+ }
18
+
19
+ static getDerivedStateFromError(error: Error): State {
20
+ // Update state so the next render will show the fallback UI.
21
+ return { hasError: true, error: error };
22
+ }
23
+
24
+ componentDidCatch(error: Error, errorInfo: ErrorInfo): void {
25
+ // You can also log the error to an error reporting service
26
+ console.log({ error, errorInfo });
27
+ }
28
+
29
+ render(): ReactNode {
30
+ if (this.state.hasError) {
31
+ console.error({ e: this.state.error });
32
+ if (this.state.error) {
33
+ return (
34
+ <ErrorPanel
35
+ title="An unexpected error occurred."
36
+ error={this.state.error}
37
+ />
38
+ );
39
+ } else {
40
+ return (
41
+ <div>An unknown error with no additional information occured.</div>
42
+ );
43
+ }
44
+ }
45
+ return this.props.children;
46
+ }
47
+ }
@@ -1,7 +1,7 @@
1
- import { Capabilities } from "../Types.mjs";
1
+ import { Capabilities } from "../types";
2
2
  import { asyncJsonParse } from "../utils/json-worker";
3
3
  import { download_file } from "./api-shared";
4
- import { LogContents, LogViewAPI } from "./Types";
4
+ import { LogContents, LogViewAPI } from "./types";
5
5
 
6
6
  const loaded_time = Date.now();
7
7
  let last_eval_time = 0;
@@ -1,15 +1,14 @@
1
- //@ts-check
1
+ import { fetchRange, fetchSize } from "../logfile/remoteZipFile";
2
+ import { EvalLog } from "../types/log";
2
3
  import { asyncJsonParse } from "../utils/json-worker";
3
4
  import { download_file, encodePathParts } from "./api-shared";
4
- import { fetchRange, fetchSize } from "../utils/remoteZipFile.mjs";
5
5
  import {
6
6
  Capabilities,
7
7
  LogContents,
8
8
  LogFiles,
9
9
  LogFilesFetchResponse,
10
10
  LogViewAPI,
11
- } from "./Types";
12
- import { EvalLog } from "../types/log";
11
+ } from "./types";
13
12
 
14
13
  interface LogInfo {
15
14
  log_dir?: string;
@@ -38,7 +37,6 @@ export default function simpleHttpApi(
38
37
  * Fetches a file from the specified URL and parses its content.
39
38
  */
40
39
  function simpleHttpAPI(logInfo: LogInfo): LogViewAPI {
41
- const log_file = logInfo.log_file;
42
40
  const log_dir = logInfo.log_dir;
43
41
 
44
42
  async function open_log_file() {
@@ -1,16 +1,16 @@
1
- import { asyncJsonParse } from "../utils/json-worker";
2
1
  import JSON5 from "json5";
2
+ import { asyncJsonParse } from "../utils/json-worker";
3
3
 
4
+ import { getVscodeApi } from "../utils/vscode";
4
5
  import {
5
- webViewJsonRpcClient,
6
6
  kMethodEvalLog,
7
- kMethodEvalLogs,
8
- kMethodEvalLogSize,
9
7
  kMethodEvalLogBytes,
10
8
  kMethodEvalLogHeaders,
9
+ kMethodEvalLogs,
10
+ kMethodEvalLogSize,
11
+ webViewJsonRpcClient,
11
12
  } from "./jsonrpc";
12
- import { getVscodeApi } from "../utils/vscode";
13
- import { Capabilities, LogContents, LogViewAPI } from "./Types";
13
+ import { Capabilities, LogContents, LogViewAPI } from "./types";
14
14
 
15
15
  const vscodeClient = webViewJsonRpcClient(getVscodeApi());
16
16
 
@@ -1,14 +1,14 @@
1
- import { openRemoteLogFile, RemoteLogFile } from "../log/remoteLogFile";
1
+ import { openRemoteLogFile, RemoteLogFile } from "../logfile/remoteLogFile";
2
+ import { FileSizeLimitError } from "../logfile/remoteZipFile";
2
3
  import { EvalLog, EvalSample } from "../types/log";
3
- import { FileSizeLimitError } from "../utils/remoteZipFile.mjs";
4
4
  import { encodePathParts } from "./api-shared";
5
5
  import {
6
6
  ClientAPI,
7
7
  EvalSummary,
8
8
  LogContents,
9
- LogViewAPI,
10
9
  LogFiles,
11
- } from "./Types";
10
+ LogViewAPI,
11
+ } from "./types";
12
12
 
13
13
  const isEvalFile = (file: string) => {
14
14
  return file.endsWith(".eval");
@@ -1,10 +1,10 @@
1
+ import { dirname } from "../utils/path";
2
+ import { getVscodeApi } from "../utils/vscode";
1
3
  import browserApi from "./api-browser";
2
- import vscodeApi from "./api-vscode";
3
4
  import simpleHttpApi from "./api-http";
4
- import { dirname } from "../utils/Path.mjs";
5
- import { getVscodeApi } from "../utils/vscode";
5
+ import vscodeApi from "./api-vscode";
6
6
  import { clientApi } from "./client-api";
7
- import { ClientAPI } from "./Types";
7
+ import { ClientAPI } from "./types";
8
8
 
9
9
  //
10
10
  /**
@@ -1,17 +1,17 @@
1
1
  import {
2
- Version,
3
- Status,
4
- EvalSpec,
2
+ EvalError,
3
+ EvalLog,
5
4
  EvalPlan,
6
5
  EvalResults,
6
+ EvalSample,
7
+ EvalSpec,
7
8
  EvalStats,
8
- EvalError,
9
9
  Input,
10
- Target,
11
10
  Scores1,
11
+ Status,
12
+ Target,
12
13
  Type11,
13
- EvalLog,
14
- EvalSample,
14
+ Version,
15
15
  } from "../types/log";
16
16
 
17
17
  export interface EvalSummary {
@@ -118,8 +118,8 @@ export interface LogFiles {
118
118
 
119
119
  export interface LogFile {
120
120
  name: string;
121
- task: string;
122
- task_id: string;
121
+ task?: string;
122
+ task_id?: string;
123
123
  }
124
124
 
125
125
  export interface LogContents {
@@ -131,3 +131,19 @@ export interface LogFilesFetchResponse {
131
131
  raw: string;
132
132
  parsed: Record<string, EvalHeader>;
133
133
  }
134
+
135
+ export interface UpdateStateMessage {
136
+ data: {
137
+ type: "updateState";
138
+ url: string;
139
+ };
140
+ }
141
+
142
+ export interface BackgroundUpdateMessage {
143
+ data: {
144
+ type: "backgroundUpdate";
145
+ url: string;
146
+ log_dir: string;
147
+ };
148
+ }
149
+ export type HostMessage = UpdateStateMessage | BackgroundUpdateMessage;
@@ -0,0 +1,9 @@
1
+ export const ApplicationColors = {
2
+ logging: {
3
+ debug: "var(--bs-secondary)",
4
+ info: "var(--bs-blue)",
5
+ warning: "var(--bs-warning)",
6
+ error: "var(--bs-danger)",
7
+ critical: "var(--bs-danger)",
8
+ },
9
+ };
@@ -0,0 +1,39 @@
1
+ /**
2
+ * The base font size in rem units.
3
+ */
4
+ const kBaseFontSize: number = 0.9;
5
+
6
+ /**
7
+ * Scales the base font size by the provided scale factor.
8
+ */
9
+ const ScaleBaseFont = (scale: number): string => {
10
+ return `${kBaseFontSize + scale}rem`;
11
+ };
12
+
13
+ /**
14
+ * An object representing font sizes for different text elements.
15
+ */
16
+ export const FontSize = {
17
+ title: ScaleBaseFont(0.6),
18
+ "title-secondary": ScaleBaseFont(0.4),
19
+ larger: ScaleBaseFont(0.2),
20
+ large: ScaleBaseFont(0.1),
21
+ base: ScaleBaseFont(0),
22
+ small: ScaleBaseFont(-0.1),
23
+ smaller: ScaleBaseFont(-0.1),
24
+ };
25
+
26
+ /**
27
+ * An object representing text styles for different elements.
28
+ */
29
+ export const TextStyle = {
30
+ label: {
31
+ textTransform: "uppercase",
32
+ },
33
+ secondary: {
34
+ color: "var(--bs-secondary)",
35
+ },
36
+ tertiary: {
37
+ color: "var(--bs-tertiary-color)",
38
+ },
39
+ };
@@ -0,0 +1,100 @@
1
+ const loggingIcons: Record<string, string> = {
2
+ notset: "bi bi-card-text",
3
+ debug: "bi bi-bug",
4
+ http: "bi bi-download",
5
+ info: "bi bi-info-square",
6
+ warning: "bi bi-exclamation-triangle",
7
+ error: "bi bi-x-circle",
8
+ critical: "bi bi-fire",
9
+ };
10
+
11
+ export const ApplicationIcons = {
12
+ approve: "bi bi-shield",
13
+ approvals: {
14
+ approve: "bi bi-shield-check",
15
+ reject: "bi bi-shield-x",
16
+ terminate: "bi bi-shield-exclamation",
17
+ escalate: "bi bi-box-arrow-up",
18
+ modify: "bi bi-pencil-square",
19
+ },
20
+ arrows: {
21
+ right: "bi bi-arrow-right",
22
+ down: "bi bi-arrow-down",
23
+ up: "bi bi-arrow-up",
24
+ },
25
+ caret: {
26
+ right: "bi bi-caret-right",
27
+ down: "bi bi-caret-down",
28
+ },
29
+ changes: {
30
+ add: "bi bi-plus",
31
+ remove: "bi bi-dash",
32
+ replace: "bi bi-plus-slash-minus",
33
+ },
34
+ chevron: {
35
+ right: "bi bi-chevron-right",
36
+ down: "bi bi-chevron-down",
37
+ },
38
+ collapse: {
39
+ all: "bi bi-arrows-collapse",
40
+ up: "bi bi-chevron-up",
41
+ },
42
+ close: "bi bi-x",
43
+ config: "bi bi-gear",
44
+ confirm: "bi bi-check",
45
+ copy: "bi bi-copy",
46
+ epoch: (epoch: string) => {
47
+ return `bi bi-${epoch}-circle`;
48
+ },
49
+ error: "bi bi-exclamation-circle",
50
+ "expand-all": "bi bi-arrows-expand",
51
+ "expand-down": "bi bi-chevron-down",
52
+ fork: "bi bi-signpost-split",
53
+ info: "bi bi-info-circle",
54
+ input: "bi bi-terminal",
55
+ inspect: "bi bi-gear",
56
+ json: "bi bi-filetype-json",
57
+ limits: {
58
+ messages: "bi bi-chat-right-text",
59
+ custom: "bi bi-person-workspace",
60
+ operator: "bi bi-person-workspace",
61
+ tokens: "bi bi-list",
62
+ time: "bi bi-stopwatch",
63
+ },
64
+ logging: loggingIcons,
65
+ menu: "bi bi-list",
66
+ messages: "bi bi-chat-right-text",
67
+ metadata: "bi bi-table",
68
+ model: "bi bi-grid-3x3-gap",
69
+ "toggle-right": "bi bi-chevron-right",
70
+ more: "bi bi-zoom-in",
71
+ "multiple-choice": "bi bi-card-list",
72
+ next: "bi bi-chevron-right",
73
+ play: "bi bi-play-fill",
74
+ previous: "bi bi-chevron-left",
75
+ refresh: "bi bi-arrow-clockwise",
76
+ role: {
77
+ user: "bi bi-person",
78
+ system: "bi bi-cpu",
79
+ assistant: "bi bi-robot",
80
+ tool: "bi bi-tools",
81
+ unknown: "bi bi-patch-question",
82
+ },
83
+ running: "bi bi-stars",
84
+ sample: "bi bi-database",
85
+ samples: "bi bi-file-spreadsheet",
86
+ scorer: "bi bi-calculator",
87
+ search: "bi bi-search",
88
+ solvers: {
89
+ default: "bi bi-arrow-return-right",
90
+ generate: "bi bi-share",
91
+ chain_of_thought: "bi bi-link",
92
+ self_critique: "bi bi-arrow-left-right",
93
+ system_message: "bi bi-cpu",
94
+ use_tools: "bi bi-tools",
95
+ },
96
+ step: "bi bi-fast-forward-btn",
97
+ subtask: "bi bi-subtract",
98
+ transcript: "bi bi-list-columns-reverse",
99
+ usage: "bi bi-stopwatch",
100
+ };
@@ -1,35 +1,5 @@
1
- // @ts-check
2
- /**
3
- * @typedef {Record<string, string>} Style
4
- */
1
+ import { FontSize, TextStyle } from "./fonts";
5
2
 
6
- import { FontSize, TextStyle } from "./Fonts.mjs";
7
-
8
- /**
9
- * Generates line clamp style.
10
- * @param {number} len - The number of lines to clamp.
11
- * @returns {Style} The style object for line clamping.
12
- */
13
-
14
- /**
15
- * Provides centralized repository of score fill styles.
16
- * @typedef {Object} ScoreFills
17
- * @property {Style} green
18
- * @property {Style} red
19
- * @property {Style} orange
20
- */
21
-
22
- /**
23
- * Provides centralized repository of shared styles.
24
- * @typedef {Object} SharedStyles
25
- * @property {Style} moreButton
26
- * @property {Style} threeLineClamp
27
- * @property {(len: number) => Style} lineClamp
28
- * @property {() => Object} wrapText
29
- * @property {ScoreFills} scoreFills
30
- */
31
-
32
- /** @type {SharedStyles} */
33
3
  export const ApplicationStyles = {
34
4
  moreButton: {
35
5
  maxHeight: "1.8em",
@@ -43,7 +13,7 @@ export const ApplicationStyles = {
43
13
  "-webkit-box-orient": "vertical",
44
14
  overflow: "hidden",
45
15
  },
46
- lineClamp: (len) => {
16
+ lineClamp: (len: number) => {
47
17
  return {
48
18
  display: "-webkit-box",
49
19
  "-webkit-line-clamp": `${len}`,
@@ -0,0 +1,198 @@
1
+ import { ANSIColor, ANSIOutput, ANSIOutputRun, ANSIStyle } from "ansi-output";
2
+ import clsx from "clsx";
3
+ import "./AnsiDisplay.css";
4
+
5
+ interface ANSIDisplayProps {
6
+ output: string;
7
+ style?: React.CSSProperties;
8
+ className?: string[] | string;
9
+ }
10
+
11
+ export const ANSIDisplay: React.FC<ANSIDisplayProps> = ({
12
+ output,
13
+ style,
14
+ className,
15
+ }) => {
16
+ const ansiOutput = new ANSIOutput();
17
+ ansiOutput.processOutput(output);
18
+
19
+ let firstOutput = false;
20
+ return (
21
+ <div className={clsx("ansi-display", className)} style={{ ...style }}>
22
+ {ansiOutput.outputLines.map((line) => {
23
+ firstOutput = firstOutput || !!line.outputRuns.length;
24
+ return (
25
+ <div className={"ansi-display-line"}>
26
+ {!line.outputRuns.length ? (
27
+ firstOutput ? (
28
+ <br />
29
+ ) : null
30
+ ) : (
31
+ line.outputRuns.map((outputRun) => (
32
+ <OutputRun key={outputRun.id} run={outputRun} />
33
+ ))
34
+ )}
35
+ </div>
36
+ );
37
+ })}
38
+ </div>
39
+ );
40
+ };
41
+
42
+ const kForeground = 0;
43
+ const kBackground = 1;
44
+
45
+ interface OutputRunProps {
46
+ run: ANSIOutputRun;
47
+ }
48
+
49
+ const OutputRun: React.FC<OutputRunProps> = ({ run }) => {
50
+ // Render.
51
+ return <span style={computeCSSProperties(run)}>{run.text}</span>;
52
+ };
53
+
54
+ const computeCSSProperties = (outputRun: ANSIOutputRun) => {
55
+ return !outputRun.format
56
+ ? {}
57
+ : {
58
+ ...computeStyles(outputRun.format.styles || []),
59
+ ...computeForegroundBackgroundColor(
60
+ kForeground,
61
+ outputRun.format.foregroundColor,
62
+ ),
63
+ ...computeForegroundBackgroundColor(
64
+ kBackground,
65
+ outputRun.format.backgroundColor,
66
+ ),
67
+ };
68
+ };
69
+
70
+ const computeStyles = (styles: ANSIStyle[]) => {
71
+ let cssProperties = {};
72
+ if (styles) {
73
+ styles.forEach((style) => {
74
+ switch (style) {
75
+ // Bold.
76
+ case ANSIStyle.Bold:
77
+ cssProperties = { ...cssProperties, ...{ fontWeight: "bold" } };
78
+ break;
79
+
80
+ // Dim.
81
+ case ANSIStyle.Dim:
82
+ cssProperties = { ...cssProperties, ...{ fontWeight: "lighter" } };
83
+ break;
84
+
85
+ // Italic.
86
+ case ANSIStyle.Italic:
87
+ cssProperties = { ...cssProperties, ...{ fontStyle: "italic" } };
88
+ break;
89
+
90
+ // Underlined.
91
+ case ANSIStyle.Underlined:
92
+ cssProperties = {
93
+ ...cssProperties,
94
+ ...{
95
+ textDecorationLine: "underline",
96
+ textDecorationStyle: "solid",
97
+ },
98
+ };
99
+ break;
100
+
101
+ // Slow blink.
102
+ case ANSIStyle.SlowBlink:
103
+ cssProperties = {
104
+ ...cssProperties,
105
+ ...{ animation: "ansi-display-run-blink 1s linear infinite" },
106
+ };
107
+ break;
108
+
109
+ // Rapid blink.
110
+ case ANSIStyle.RapidBlink:
111
+ cssProperties = {
112
+ ...cssProperties,
113
+ ...{ animation: "ansi-display-run-blink 0.5s linear infinite" },
114
+ };
115
+ break;
116
+
117
+ // Hidden.
118
+ case ANSIStyle.Hidden:
119
+ cssProperties = { ...cssProperties, ...{ visibility: "hidden" } };
120
+ break;
121
+
122
+ // CrossedOut.
123
+ case ANSIStyle.CrossedOut:
124
+ cssProperties = {
125
+ ...cssProperties,
126
+ ...{
127
+ textDecorationLine: "line-through",
128
+ textDecorationStyle: "solid",
129
+ },
130
+ };
131
+ break;
132
+
133
+ // TODO Fraktur
134
+
135
+ // DoubleUnderlined.
136
+ case ANSIStyle.DoubleUnderlined:
137
+ cssProperties = {
138
+ ...cssProperties,
139
+ ...{
140
+ textDecorationLine: "underline",
141
+ textDecorationStyle: "double",
142
+ },
143
+ };
144
+ break;
145
+
146
+ // TODO Framed
147
+ // TODO Encircled
148
+ // TODO Overlined
149
+ // TODO Superscript
150
+ // TODO Subscript
151
+ }
152
+ });
153
+ }
154
+
155
+ return cssProperties;
156
+ };
157
+
158
+ const computeForegroundBackgroundColor = (
159
+ colorType: number,
160
+ color?: string,
161
+ ) => {
162
+ switch (color) {
163
+ // Undefined.
164
+ case undefined:
165
+ return {};
166
+
167
+ // One of the standard colors.
168
+ case ANSIColor.Black:
169
+ case ANSIColor.Red:
170
+ case ANSIColor.Green:
171
+ case ANSIColor.Yellow:
172
+ case ANSIColor.Blue:
173
+ case ANSIColor.Magenta:
174
+ case ANSIColor.Cyan:
175
+ case ANSIColor.White:
176
+ case ANSIColor.BrightBlack:
177
+ case ANSIColor.BrightRed:
178
+ case ANSIColor.BrightGreen:
179
+ case ANSIColor.BrightYellow:
180
+ case ANSIColor.BrightBlue:
181
+ case ANSIColor.BrightMagenta:
182
+ case ANSIColor.BrightCyan:
183
+ case ANSIColor.BrightWhite:
184
+ if (colorType === kForeground) {
185
+ return { color: `var(--${color})` };
186
+ } else {
187
+ return { background: `var(--${color})` };
188
+ }
189
+
190
+ // TODO@softwarenerd - This isn't hooked up.
191
+ default:
192
+ if (colorType === kForeground) {
193
+ return { color: color };
194
+ } else {
195
+ return { background: color };
196
+ }
197
+ }
198
+ };
@@ -0,0 +1,86 @@
1
+ import * as AsciicinemaPlayerJS from "asciinema-player";
2
+ import "asciinema-player/dist/bundle/asciinema-player.css";
3
+ import React, { useEffect, useRef } from "react";
4
+
5
+ interface AsciinemaPlayerProps {
6
+ id?: string;
7
+ inputUrl: string;
8
+ outputUrl: string;
9
+ timingUrl: string;
10
+ rows?: number;
11
+ cols?: number;
12
+ fit?: string;
13
+ style?: React.CSSProperties;
14
+ speed?: number;
15
+ autoPlay?: boolean;
16
+ loop?: boolean;
17
+ theme?: string;
18
+ idleTimeLimit?: number;
19
+ className?: string;
20
+ }
21
+
22
+ export const AsciinemaPlayer: React.FC<AsciinemaPlayerProps> = ({
23
+ id,
24
+ rows,
25
+ cols,
26
+ inputUrl,
27
+ outputUrl,
28
+ timingUrl,
29
+ fit,
30
+ speed,
31
+ autoPlay,
32
+ loop,
33
+ theme,
34
+ idleTimeLimit = 2,
35
+ style,
36
+ }) => {
37
+ const playerContainerRef = useRef<HTMLDivElement>(null);
38
+
39
+ useEffect(() => {
40
+ if (!playerContainerRef.current) return;
41
+
42
+ const player = AsciicinemaPlayerJS.create(
43
+ {
44
+ url: [timingUrl, outputUrl, inputUrl],
45
+ parser: "typescript",
46
+ },
47
+ playerContainerRef.current,
48
+ {
49
+ rows,
50
+ cols,
51
+ autoPlay,
52
+ loop,
53
+ theme,
54
+ speed,
55
+ idleTimeLimit,
56
+ fit,
57
+ },
58
+ );
59
+
60
+ player.play();
61
+
62
+ return () => {
63
+ player.dispose();
64
+ };
65
+ }, [
66
+ timingUrl,
67
+ outputUrl,
68
+ inputUrl,
69
+ rows,
70
+ cols,
71
+ autoPlay,
72
+ loop,
73
+ theme,
74
+ speed,
75
+ idleTimeLimit,
76
+ fit,
77
+ ]);
78
+
79
+ return (
80
+ <div
81
+ id={`asciinema-player-${id || "default"}`}
82
+ ref={playerContainerRef}
83
+ style={{ ...style }}
84
+ />
85
+ );
86
+ };