inspect-ai 0.3.91__py3-none-any.whl → 0.3.92__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
inspect_ai/_cli/eval.py CHANGED
@@ -1164,6 +1164,10 @@ def eval_retry_command(
1164
1164
  elif fail_on_error == 0.0:
1165
1165
  fail_on_error = True
1166
1166
 
1167
+ # resolve retry on error
1168
+ if retry_on_error == 0:
1169
+ retry_on_error = None
1170
+
1167
1171
  # resolve log file
1168
1172
  retry_log_files = [
1169
1173
  log_file_info(filesystem(log_file).info(log_file)) for log_file in log_files
@@ -1,3 +1,4 @@
1
+ import json
1
2
  from itertools import chain
2
3
  from typing import TypedDict, cast
3
4
 
@@ -306,6 +307,14 @@ def _openai_input_items_from_chat_message_assistant(
306
307
  """
307
308
  (output_message_id, tool_message_ids) = _ids_from_assistant_internal(message)
308
309
 
310
+ # we want to prevent yielding output messages in the case where we have an
311
+ # 'internal' field (so the message came from the model API as opposed to
312
+ # being user synthesized) AND there is no output_message_id (indicating that
313
+ # when reading the message from the server we didn't find output). this could
314
+ # happen e.g. when a react() agent sets the output.completion in response
315
+ # to a submit() tool call
316
+ suppress_output_message = message.internal is not None and output_message_id is None
317
+
309
318
  # if we are not storing messages on the server then blank these out
310
319
  if not store:
311
320
  output_message_id = None
@@ -341,6 +350,9 @@ def _openai_input_items_from_chat_message_assistant(
341
350
  )
342
351
  )
343
352
  case ContentText(text=text, refusal=refusal):
353
+ if suppress_output_message:
354
+ continue
355
+
344
356
  new_content = (
345
357
  ResponseOutputRefusalParam(type="refusal", refusal=text)
346
358
  if refusal
@@ -415,7 +427,7 @@ def _tool_call_items_from_assistant_message(
415
427
  type="function_call",
416
428
  call_id=call.id,
417
429
  name=_responses_tool_alias(call.function),
418
- arguments=call.function,
430
+ arguments=json.dumps(call.arguments),
419
431
  )
420
432
 
421
433
  # add id if available
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: inspect_ai
3
- Version: 0.3.91
3
+ Version: 0.3.92
4
4
  Summary: Framework for large language model evaluations
5
5
  Author: UK AI Security Institute
6
6
  License: MIT License
@@ -3,7 +3,7 @@ inspect_ai/__main__.py,sha256=oWX4YwDZDg3GS3-IG0yPGoSEOfSzWihELg7QmrUlxjM,67
3
3
  inspect_ai/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
4
4
  inspect_ai/_cli/cache.py,sha256=RVGuBYwwk3c45JfyfcSFJ419etSsv3-Z7AyfQE-Hul0,3912
5
5
  inspect_ai/_cli/common.py,sha256=WbAgGbLcxABcWoEWiGCWSbkkxYr2jmL9i0cyseWHmRA,4165
6
- inspect_ai/_cli/eval.py,sha256=A__oE6kYtcZC3aevIDkEoAoaqK0OFccR_Gl8NVMrVrw,38442
6
+ inspect_ai/_cli/eval.py,sha256=g1hNhMG79mtGYq1YAC-FKgdSwpTQK6jOj7yYu2IkOlY,38530
7
7
  inspect_ai/_cli/info.py,sha256=QMxaTG9TmzW95EiLrOgkzubvavoR-VHxo3eV7ppmrzI,1789
8
8
  inspect_ai/_cli/list.py,sha256=M8mazI8Zuq8Hp99YWKnxQd9UWx1Qi87zfXRzZYAAakk,2459
9
9
  inspect_ai/_cli/log.py,sha256=O-w7GqsE7tLojPnEtpWXPSh0Vu2Hbrbxjneyc1BFfpk,5817
@@ -559,7 +559,7 @@ inspect_ai/model/_model_call.py,sha256=VJ8wnl9Y81JaiClBYM8eyt1jVb3n-yc6Dd88ofRiJ
559
559
  inspect_ai/model/_model_output.py,sha256=UNodmzkeFE1JXfVtnu0i8q6rwgTj2BClJqcftLSGXdA,7829
560
560
  inspect_ai/model/_openai.py,sha256=WlsWWMzP55_pxP_6yp_5eCKo4Ie418OgcgEDKmqjq34,24364
561
561
  inspect_ai/model/_openai_computer_use.py,sha256=vbKkYLhqNuX16zuWfg5MaGp9H8URrPcLhKQ1pDsZtPo,5943
562
- inspect_ai/model/_openai_responses.py,sha256=-mCLQmcR7JVZbTzaHdMBBsGHOyYGAwKQqUbEQ_jnLmI,21912
562
+ inspect_ai/model/_openai_responses.py,sha256=PW17R217NBy0exq4LLfM-eI0GTcG4gm6cxjVG9Uy3d8,22528
563
563
  inspect_ai/model/_reasoning.py,sha256=qmR8WT6t_cb7NIsJOQHPyFZh2eLV0HmYxKo2vtvteQ4,929
564
564
  inspect_ai/model/_registry.py,sha256=Cr2y32EqLnOqLbSWoXHVK4ivTTzCUhJuACxoTyPt8kY,2032
565
565
  inspect_ai/model/_render.py,sha256=rWypNUjgrH4NGp0r-ESAze9gZz7lYNjheEP438vRYZE,922
@@ -724,9 +724,9 @@ inspect_ai/util/_sandbox/docker/internal.py,sha256=c8X8TLrBPOvsfnq5TkMlb_bzTALyc
724
724
  inspect_ai/util/_sandbox/docker/prereqs.py,sha256=0j6_OauBBnVlpBleADcZavIAAQZy4WewVjbRn9c0stg,3355
725
725
  inspect_ai/util/_sandbox/docker/service.py,sha256=hhHIWH1VDFLwehdGd19aUBD_VKfDO3GCPxpw1HSwVQk,2437
726
726
  inspect_ai/util/_sandbox/docker/util.py,sha256=EeInihCNXgUWxaqZ4dNOJd719kXL2_jr63QCoXn68vA,3154
727
- inspect_ai-0.3.91.dist-info/licenses/LICENSE,sha256=xZPCr8gTiFIerrA_DRpLAbw-UUftnLFsHxKeW-NTtq8,1081
728
- inspect_ai-0.3.91.dist-info/METADATA,sha256=h1x-Ak_MDOKNR8pUHwQ7l_3CnHwo6wVceyiKUrFpIbI,5143
729
- inspect_ai-0.3.91.dist-info/WHEEL,sha256=SmOxYU7pzNKBqASvQJ7DjX3XGUF92lrGhMb3R6_iiqI,91
730
- inspect_ai-0.3.91.dist-info/entry_points.txt,sha256=WGGLmzTzDWLzYfiyovSY6oEKuf-gqzSDNOb5V-hk3fM,54
731
- inspect_ai-0.3.91.dist-info/top_level.txt,sha256=Tp3za30CHXJEKLk8xLe9qGsW4pBzJpEIOMHOHNCXiVo,11
732
- inspect_ai-0.3.91.dist-info/RECORD,,
727
+ inspect_ai-0.3.92.dist-info/licenses/LICENSE,sha256=xZPCr8gTiFIerrA_DRpLAbw-UUftnLFsHxKeW-NTtq8,1081
728
+ inspect_ai-0.3.92.dist-info/METADATA,sha256=BtQ8ClHkDw2ChlQl_rV7AS4wtisP49cxajyuKIhCmkI,5143
729
+ inspect_ai-0.3.92.dist-info/WHEEL,sha256=SmOxYU7pzNKBqASvQJ7DjX3XGUF92lrGhMb3R6_iiqI,91
730
+ inspect_ai-0.3.92.dist-info/entry_points.txt,sha256=WGGLmzTzDWLzYfiyovSY6oEKuf-gqzSDNOb5V-hk3fM,54
731
+ inspect_ai-0.3.92.dist-info/top_level.txt,sha256=Tp3za30CHXJEKLk8xLe9qGsW4pBzJpEIOMHOHNCXiVo,11
732
+ inspect_ai-0.3.92.dist-info/RECORD,,