inspect-ai 0.3.89__py3-none-any.whl → 0.3.90__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -642,18 +642,6 @@ async def task_run_sample(
642
642
  )
643
643
  )
644
644
 
645
- # sample init event (remove file bodies as they have content or absolute paths)
646
- event_sample = sample.model_copy(
647
- update=dict(files={k: "" for k in sample.files.keys()})
648
- if sample.files
649
- else None
650
- )
651
- transcript()._event(
652
- SampleInitEvent(
653
- sample=event_sample, state=state_jsonable(state)
654
- )
655
- )
656
-
657
645
  # set progress for plan then run it
658
646
  state = await plan(state, generate)
659
647
 
@@ -15909,18 +15909,18 @@ ul.jsondiffpatch-textdiff {
15909
15909
  ._output_s17ok_1 {
15910
15910
  padding-top: 1em;
15911
15911
  }
15912
- ._outputPre_1h1fn_1 {
15912
+ ._outputPre_1t1y9_1 {
15913
15913
  padding: 0.5em;
15914
15914
  margin-top: 0.25em;
15915
15915
  margin-bottom: 1rem;
15916
15916
  }
15917
15917
 
15918
- ._outputCode_1h1fn_7 {
15919
- overflow-wrap: anywhere;
15920
- white-space: pre-wrap;
15918
+ ._outputCode_1t1y9_7 {
15919
+ overflow-wrap: anywhere !important;
15920
+ white-space: pre-wrap !important;
15921
15921
  }
15922
15922
 
15923
- ._bottomPadding_1h1fn_12 {
15923
+ ._bottomPadding_1t1y9_12 {
15924
15924
  padding-bottom: 1em;
15925
15925
  }
15926
15926
  ._image_10saa_1 {
@@ -19336,53 +19336,51 @@ span.ap-marker-container:hover span.ap-marker {
19336
19336
  ._progress_1qsnv_12 {
19337
19337
  margin-left: 0.5em;
19338
19338
  }
19339
- ._darkenedBg_c8m1t_1 {
19339
+ ._darkenedBg_eq9th_1 {
19340
19340
  background-color: var(--bs-light-bg-subtle);
19341
19341
  }
19342
19342
 
19343
- ._normalBg_c8m1t_5 {
19343
+ ._normalBg_eq9th_5 {
19344
19344
  background-color: var(--bs-body-bg);
19345
19345
  }
19346
19346
 
19347
- ._node_c8m1t_9._first_c8m1t_9 {
19347
+ ._node_eq9th_9._first_eq9th_9 {
19348
19348
  padding-top: 0.5em;
19349
19349
  }
19350
19350
 
19351
- ._node_c8m1t_9 {
19351
+ ._node_eq9th_9 {
19352
19352
  padding-top: 0;
19353
19353
  padding-bottom: 0.5em;
19354
19354
  }
19355
19355
 
19356
- ._nodes_c8m1t_18 {
19356
+ ._nodes_eq9th_18 {
19357
19357
  width: 100%;
19358
19358
  margin-top: 1em;
19359
19359
  }
19360
19360
 
19361
- ._transcriptComponent_c8m1t_23 {
19361
+ ._transcriptComponent_eq9th_23 {
19362
19362
  display: grid;
19363
19363
  margin: 0.5em 0 0 0;
19364
19364
  width: 100%;
19365
19365
  }
19366
19366
 
19367
- ._eventNode_c8m1t_29 {
19367
+ ._eventNode_eq9th_29 {
19368
19368
  background-color: var(--bs-body-bg);
19369
- margin-bottom: 1.5em;
19370
- padding-bottom: 0.5em;
19371
19369
  }
19372
19370
 
19373
- ._eventNode_c8m1t_29._darkenBg_c8m1t_35 {
19371
+ ._eventNode_eq9th_29._darkenBg_eq9th_33 {
19374
19372
  background-color: var(--bs-light-bg-subtle);
19375
19373
  }
19376
19374
 
19377
- ._eventNode_c8m1t_29._lastNode_c8m1t_39 {
19375
+ ._eventNode_eq9th_29._lastNode_eq9th_37 {
19378
19376
  margin-bottom: 0;
19379
19377
  }
19380
19378
 
19381
- ._eventNodeContainer_c8m1t_43 {
19379
+ ._eventNodeContainer_eq9th_41 {
19382
19380
  padding-bottom: 0.5em;
19383
19381
  }
19384
19382
 
19385
- ._eventNodeContainer_c8m1t_43._noBottom_c8m1t_47 {
19383
+ ._eventNodeContainer_eq9th_41._noBottom_eq9th_45 {
19386
19384
  padding-bottom: 0;
19387
19385
  }
19388
19386
  ._darkenedBg_1ye6u_1 {
@@ -34090,9 +34090,9 @@ self.onmessage = function (e) {
34090
34090
  const styles$16 = {
34091
34091
  output: output$1
34092
34092
  };
34093
- const outputPre = "_outputPre_1h1fn_1";
34094
- const outputCode = "_outputCode_1h1fn_7";
34095
- const bottomPadding = "_bottomPadding_1h1fn_12";
34093
+ const outputPre = "_outputPre_1t1y9_1";
34094
+ const outputCode = "_outputCode_1t1y9_7";
34095
+ const bottomPadding = "_bottomPadding_1t1y9_12";
34096
34096
  const styles$15 = {
34097
34097
  outputPre,
34098
34098
  outputCode,
@@ -34410,7 +34410,7 @@ self.onmessage = function (e) {
34410
34410
  indented: indented2,
34411
34411
  toolCallStyle
34412
34412
  }) => {
34413
- const collapse = message2.role === "system";
34413
+ const collapse = message2.role === "system" || message2.role === "user";
34414
34414
  return /* @__PURE__ */ jsxRuntimeExports.jsxs(
34415
34415
  "div",
34416
34416
  {
@@ -34432,7 +34432,7 @@ self.onmessage = function (e) {
34432
34432
  styles$1a.messageContents,
34433
34433
  indented2 ? styles$1a.indented : void 0
34434
34434
  ),
34435
- children: /* @__PURE__ */ jsxRuntimeExports.jsx(ExpandablePanel, { id: `${id}-message`, collapse, lines: 30, children: /* @__PURE__ */ jsxRuntimeExports.jsx(
34435
+ children: /* @__PURE__ */ jsxRuntimeExports.jsx(ExpandablePanel, { id: `${id}-message`, collapse, lines: 15, children: /* @__PURE__ */ jsxRuntimeExports.jsx(
34436
34436
  MessageContents,
34437
34437
  {
34438
34438
  id: `${id}-contents`,
@@ -71520,6 +71520,18 @@ ${events}
71520
71520
  return {
71521
71521
  ...rootStepDescriptor
71522
71522
  };
71523
+ } else if (event.event === "step") {
71524
+ if (event.name === "init") {
71525
+ return {
71526
+ ...rootStepDescriptor,
71527
+ name: "Init",
71528
+ collapse: true
71529
+ };
71530
+ } else {
71531
+ return {
71532
+ ...rootStepDescriptor
71533
+ };
71534
+ }
71523
71535
  } else {
71524
71536
  switch (event.name) {
71525
71537
  case "sample_init":
@@ -71528,12 +71540,6 @@ ${events}
71528
71540
  name: "Sample Init",
71529
71541
  collapse: true
71530
71542
  };
71531
- case "init":
71532
- return {
71533
- ...rootStepDescriptor,
71534
- name: "Init",
71535
- collapse: true
71536
- };
71537
71543
  default:
71538
71544
  return {
71539
71545
  endSpace: false
@@ -71738,12 +71744,12 @@ ${events}
71738
71744
  this.depth = depth;
71739
71745
  }
71740
71746
  }
71741
- const transcriptComponent = "_transcriptComponent_c8m1t_23";
71742
- const eventNode = "_eventNode_c8m1t_29";
71743
- const darkenBg = "_darkenBg_c8m1t_35";
71744
- const lastNode = "_lastNode_c8m1t_39";
71745
- const eventNodeContainer = "_eventNodeContainer_c8m1t_43";
71746
- const noBottom = "_noBottom_c8m1t_47";
71747
+ const transcriptComponent = "_transcriptComponent_eq9th_23";
71748
+ const eventNode = "_eventNode_eq9th_29";
71749
+ const darkenBg = "_darkenBg_eq9th_33";
71750
+ const lastNode = "_lastNode_eq9th_37";
71751
+ const eventNodeContainer = "_eventNodeContainer_eq9th_41";
71752
+ const noBottom = "_noBottom_eq9th_45";
71747
71753
  const styles$t = {
71748
71754
  transcriptComponent,
71749
71755
  eventNode,
@@ -26,7 +26,7 @@ export const ChatMessage: FC<ChatMessageProps> = ({
26
26
  indented,
27
27
  toolCallStyle,
28
28
  }) => {
29
- const collapse = message.role === "system";
29
+ const collapse = message.role === "system" || message.role === "user";
30
30
  return (
31
31
  <div
32
32
  className={clsx(
@@ -46,7 +46,7 @@ export const ChatMessage: FC<ChatMessageProps> = ({
46
46
  indented ? styles.indented : undefined,
47
47
  )}
48
48
  >
49
- <ExpandablePanel id={`${id}-message`} collapse={collapse} lines={30}>
49
+ <ExpandablePanel id={`${id}-message`} collapse={collapse} lines={15}>
50
50
  <MessageContents
51
51
  id={`${id}-contents`}
52
52
  key={`${id}-contents`}
@@ -5,8 +5,8 @@
5
5
  }
6
6
 
7
7
  .outputCode {
8
- overflow-wrap: anywhere;
9
- white-space: pre-wrap;
8
+ overflow-wrap: anywhere !important;
9
+ white-space: pre-wrap !important;
10
10
  }
11
11
 
12
12
  .bottomPadding {
@@ -132,6 +132,18 @@ const stepDescriptor = (
132
132
  return {
133
133
  ...rootStepDescriptor,
134
134
  };
135
+ } else if (event.event === "step") {
136
+ if (event.name === "init") {
137
+ return {
138
+ ...rootStepDescriptor,
139
+ name: "Init",
140
+ collapse: true,
141
+ };
142
+ } else {
143
+ return {
144
+ ...rootStepDescriptor,
145
+ };
146
+ }
135
147
  } else {
136
148
  switch (event.name) {
137
149
  case "sample_init":
@@ -140,12 +152,6 @@ const stepDescriptor = (
140
152
  name: "Sample Init",
141
153
  collapse: true,
142
154
  };
143
- case "init":
144
- return {
145
- ...rootStepDescriptor,
146
- name: "Init",
147
- collapse: true,
148
- };
149
155
  default:
150
156
  return {
151
157
  endSpace: false,
@@ -28,8 +28,6 @@
28
28
 
29
29
  .eventNode {
30
30
  background-color: var(--bs-body-bg);
31
- margin-bottom: 1.5em;
32
- padding-bottom: 0.5em;
33
31
  }
34
32
 
35
33
  .eventNode.darkenBg {
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: inspect_ai
3
- Version: 0.3.89
3
+ Version: 0.3.90
4
4
  Summary: Framework for large language model evaluations
5
5
  Author: UK AI Security Institute
6
6
  License: MIT License
@@ -62,7 +62,7 @@ inspect_ai/_eval/task/images.py,sha256=nTzHizlyuPYumPH7gAOBSrNkTwTbAmZ7tKdzN7d_R
62
62
  inspect_ai/_eval/task/log.py,sha256=cAnnsICthsIIexTypNcFAy9uNHU5Sa0F7RmzdnZoSpk,11629
63
63
  inspect_ai/_eval/task/resolved.py,sha256=LBVHEeq9N1fkRObmA2pnDE_l_EuH6n2Dg8-c8yCGT5U,1007
64
64
  inspect_ai/_eval/task/results.py,sha256=x4weYRK2XGowfBG3f2msOeZQ_pxh230HTlw6kps33jw,17925
65
- inspect_ai/_eval/task/run.py,sha256=c9IRP2Rrqo9rlufweTWyPeX_nCcwQW9k5tuy5EXi7A0,37591
65
+ inspect_ai/_eval/task/run.py,sha256=uoU1GwjB5bHBde__brfUff4ssxRqiea0lzjiCJ7LEpk,37009
66
66
  inspect_ai/_eval/task/sandbox.py,sha256=A4OirmhKtXzg_Bu-g2yo-vC_vnXocpBevns5M07k-qE,7095
67
67
  inspect_ai/_eval/task/task.py,sha256=GyyzKkljhIHgM0Lh7wcBFHOgjqTqhOSkThHSQD4fIvk,16308
68
68
  inspect_ai/_eval/task/tasks.py,sha256=8fy5k070KgjYwaZQ_Nk6_r-38VTU6HB-qh7ixc4JzKI,727
@@ -143,8 +143,8 @@ inspect_ai/_view/www/.vscode/extensions.json,sha256=E73RWLzcoyeluE_ijGxaNSOK9xC0
143
143
  inspect_ai/_view/www/.vscode/settings.json,sha256=g5hrVnMaYxM06JpiJD2EuE2xjcbF6xNAtL2fuKgG1-8,200
144
144
  inspect_ai/_view/www/dist/index.html,sha256=gpdu6SR-SOH9EWx15cCWHzujMZujnZR5tRlEfROJg2A,997
145
145
  inspect_ai/_view/www/dist/assets/favicon.svg,sha256=b9AHYZaO2zBzeKH6G4PwXZMGGW_UxY0omKHam-c9MAs,1508
146
- inspect_ai/_view/www/dist/assets/index.css,sha256=c9D67a2-Erjgh3_yr-HeGnROu6TWx5iiRj90WXXT8rs,2360874
147
- inspect_ai/_view/www/dist/assets/index.js,sha256=8hgHDrBGBuN3hLOIotyZGYV0WHZ_0OMs12F72p7BkOE,3097948
146
+ inspect_ai/_view/www/dist/assets/index.css,sha256=_K7N7DK5k7VLO6DQxaP4zhuqQsYKlUS9VEJM2sPJZWk,2360847
147
+ inspect_ai/_view/www/dist/assets/index.js,sha256=nvJOVc6JXD9lfkFLkCiiOA2JFJTZVC3-R-mQkSX25eU,3098116
148
148
  inspect_ai/_view/www/src/App.tsx,sha256=M21uqy08olnk9s3JJxOJ5dYSBP7LBQ1MIUXDWpO8878,9931
149
149
  inspect_ai/_view/www/src/AppErrorBoundary.tsx,sha256=RyhZWbIMZj1QeUOUUXh9hUFvq6LoDEoHuTY0giswmL0,1169
150
150
  inspect_ai/_view/www/src/constants.ts,sha256=aLncMT1XjKzyphLF_jkXPZicsCJXMsBXcDomAC4EaIY,1228
@@ -248,7 +248,7 @@ inspect_ai/_view/www/src/samples/SamplesTools.tsx,sha256=wj1Iwlpkc-cF7KHtHwpj_zv
248
248
  inspect_ai/_view/www/src/samples/sampleDataAdapter.ts,sha256=LinV7zL4id1T_IRJe6LRni4I2TyOsVhwHnUCS-IUPBE,919
249
249
  inspect_ai/_view/www/src/samples/sampleLimit.ts,sha256=0OGoyQmuytXxPskO4hAJJ9i_5HiLobMfiYkp-yadngs,604
250
250
  inspect_ai/_view/www/src/samples/chat/ChatMessage.module.css,sha256=w5CIir3cw1WNvLuo43KNPWAF9jjzOZy87BijICcCafk,435
251
- inspect_ai/_view/www/src/samples/chat/ChatMessage.tsx,sha256=DY5d6QNb9UTxQoQF0Qnqrrgwx3iQadQlNlFyRDtGpkA,1605
251
+ inspect_ai/_view/www/src/samples/chat/ChatMessage.tsx,sha256=-URkbyxT_k5z9pLLd3uc7CWSQUS_RuwpTPlFkkpaDIY,1632
252
252
  inspect_ai/_view/www/src/samples/chat/ChatMessageRenderer.tsx,sha256=UAl6VkQ5tnaiBkArRLOo3aEGQtoPA-_6z50jNHVpwwg,1499
253
253
  inspect_ai/_view/www/src/samples/chat/ChatMessageRow.module.css,sha256=akFmz9wQ6r0CGp6BpiE5nfHS3TBfQ83LQmS3dV9sAYU,125
254
254
  inspect_ai/_view/www/src/samples/chat/ChatMessageRow.tsx,sha256=W6SCL-0ezf2a5npMbodEwzsnmaApiIMyKM3zHBlN6iM,1347
@@ -262,7 +262,7 @@ inspect_ai/_view/www/src/samples/chat/MessageContents.tsx,sha256=fW5j6P1quG-85AA
262
262
  inspect_ai/_view/www/src/samples/chat/messages.ts,sha256=eJaXPmf8v5j2Hr-IpkqQLxIlQn9nkN3-58lseN_ZJwc,4027
263
263
  inspect_ai/_view/www/src/samples/chat/tools/ToolCallView.module.css,sha256=A2SVUV7FpnyipyGkmQ4drO2kzKx5KyDbKPDURLHNz4Q,32
264
264
  inspect_ai/_view/www/src/samples/chat/tools/ToolCallView.tsx,sha256=5uu7KrZ3MDJ2Kg3e4sVuRr1NTomtr-_jl5VHHUKCVg8,3879
265
- inspect_ai/_view/www/src/samples/chat/tools/ToolInput.module.css,sha256=apEfqHAe683GyFx803xDO6Wid3m3xn_3ftGSLa4uxVI,190
265
+ inspect_ai/_view/www/src/samples/chat/tools/ToolInput.module.css,sha256=ujqWdG8IaWm-m8YQCvo_TMuTTVZDkSYiwuc_bVQByRY,212
266
266
  inspect_ai/_view/www/src/samples/chat/tools/ToolInput.tsx,sha256=PldJ9eHpoSqOSwAdtSRJXyrTbvHzQzs7OtB7CBxXmC8,1362
267
267
  inspect_ai/_view/www/src/samples/chat/tools/ToolOutput.module.css,sha256=p8jLonoAawbhuaqNzFPzToD-KRa3tBwX9w4yVOf3xqo,266
268
268
  inspect_ai/_view/www/src/samples/chat/tools/ToolOutput.tsx,sha256=kOHkL97fnw1xwfgP_ys0JGl-9gd7rZDO_FVQzX8oQ9s,1616
@@ -330,12 +330,12 @@ inspect_ai/_view/www/src/samples/transcript/SandboxEventView.module.css,sha256=G
330
330
  inspect_ai/_view/www/src/samples/transcript/SandboxEventView.tsx,sha256=0gQEjTMnfMgcPj28V-ATzwL-gWWSZBjZxeYN8G2cMzQ,3799
331
331
  inspect_ai/_view/www/src/samples/transcript/ScoreEventView.module.css,sha256=YWHWPM_-2UognvNIjB5-UejG17xy0yRW3jyfN4UeD1E,246
332
332
  inspect_ai/_view/www/src/samples/transcript/ScoreEventView.tsx,sha256=ycEHCwllialOK-3NtsiybcIjg8QEW1lYr59wp3xEzZM,2621
333
- inspect_ai/_view/www/src/samples/transcript/StepEventView.tsx,sha256=40xL9vSRQiIx8AXEFp2UOyf9tOHvLmO18oqZbvupcFM,3598
333
+ inspect_ai/_view/www/src/samples/transcript/StepEventView.tsx,sha256=qEP7Kn1p9Aq3nhcEcH50t36s6CQYSbyBOSnEtsTETNw,3715
334
334
  inspect_ai/_view/www/src/samples/transcript/SubtaskEventView.module.css,sha256=L6u8qUl3_V9cYf36zT1NOvXEJ5dqoO5JlAgoioMguR8,274
335
335
  inspect_ai/_view/www/src/samples/transcript/SubtaskEventView.tsx,sha256=AzZDQhLMn-fbAcIOK3uJ0lolkA0UsmbZTh4cZzon25A,3742
336
336
  inspect_ai/_view/www/src/samples/transcript/ToolEventView.module.css,sha256=nGootHKSBsnOv2UGw9cVfIAGzw-a3x6IOgHu8SAU9lE,149
337
337
  inspect_ai/_view/www/src/samples/transcript/ToolEventView.tsx,sha256=Cg5__N0YMFCAgdegYHpy8XfVL7NuBeHJggXXsHchF7c,3229
338
- inspect_ai/_view/www/src/samples/transcript/TranscriptView.module.css,sha256=zExatTZIn6UEC98D1uNGifN2EJhLF9RyvA0XQxNbwXA,663
338
+ inspect_ai/_view/www/src/samples/transcript/TranscriptView.module.css,sha256=C0wFxmQtkmy89qr9Sl6YblQ0XObH3nVDg4vLpqFNgcI,614
339
339
  inspect_ai/_view/www/src/samples/transcript/TranscriptView.tsx,sha256=lzYKIdd3-oJ0jNGffsHVMueWjZWzcV3R2Ki5RxqIbkY,8880
340
340
  inspect_ai/_view/www/src/samples/transcript/TranscriptVirtualListComponent.module.css,sha256=f-4Mic4ORce1qIUFH262x2zoQngYMPm1_KZraZtOgiw,210
341
341
  inspect_ai/_view/www/src/samples/transcript/TranscriptVirtualListComponent.tsx,sha256=DiC5la5vH5YS8JvyzSxBGtsmw3ulkY8wVqWkqyJeYF8,1275
@@ -697,9 +697,9 @@ inspect_ai/util/_sandbox/docker/internal.py,sha256=c8X8TLrBPOvsfnq5TkMlb_bzTALyc
697
697
  inspect_ai/util/_sandbox/docker/prereqs.py,sha256=0j6_OauBBnVlpBleADcZavIAAQZy4WewVjbRn9c0stg,3355
698
698
  inspect_ai/util/_sandbox/docker/service.py,sha256=hhHIWH1VDFLwehdGd19aUBD_VKfDO3GCPxpw1HSwVQk,2437
699
699
  inspect_ai/util/_sandbox/docker/util.py,sha256=EeInihCNXgUWxaqZ4dNOJd719kXL2_jr63QCoXn68vA,3154
700
- inspect_ai-0.3.89.dist-info/licenses/LICENSE,sha256=xZPCr8gTiFIerrA_DRpLAbw-UUftnLFsHxKeW-NTtq8,1081
701
- inspect_ai-0.3.89.dist-info/METADATA,sha256=GAxu-5LVKaqRpjOgkkWTogcjsj5qeW8_GFKLoSKq0-0,4965
702
- inspect_ai-0.3.89.dist-info/WHEEL,sha256=CmyFI0kx5cdEMTLiONQRbGQwjIoR1aIYB7eCAQ4KPJ0,91
703
- inspect_ai-0.3.89.dist-info/entry_points.txt,sha256=WGGLmzTzDWLzYfiyovSY6oEKuf-gqzSDNOb5V-hk3fM,54
704
- inspect_ai-0.3.89.dist-info/top_level.txt,sha256=Tp3za30CHXJEKLk8xLe9qGsW4pBzJpEIOMHOHNCXiVo,11
705
- inspect_ai-0.3.89.dist-info/RECORD,,
700
+ inspect_ai-0.3.90.dist-info/licenses/LICENSE,sha256=xZPCr8gTiFIerrA_DRpLAbw-UUftnLFsHxKeW-NTtq8,1081
701
+ inspect_ai-0.3.90.dist-info/METADATA,sha256=2BRKWXKir4JerjMcQEGoZ5csLeaffrkAOI3SVNVAfME,4965
702
+ inspect_ai-0.3.90.dist-info/WHEEL,sha256=pxyMxgL8-pra_rKaQ4drOZAegBVuX-G_4nRHjjgWbmo,91
703
+ inspect_ai-0.3.90.dist-info/entry_points.txt,sha256=WGGLmzTzDWLzYfiyovSY6oEKuf-gqzSDNOb5V-hk3fM,54
704
+ inspect_ai-0.3.90.dist-info/top_level.txt,sha256=Tp3za30CHXJEKLk8xLe9qGsW4pBzJpEIOMHOHNCXiVo,11
705
+ inspect_ai-0.3.90.dist-info/RECORD,,
@@ -1,5 +1,5 @@
1
1
  Wheel-Version: 1.0
2
- Generator: setuptools (78.1.0)
2
+ Generator: setuptools (79.0.0)
3
3
  Root-Is-Purelib: true
4
4
  Tag: py3-none-any
5
5