inspect-ai 0.3.91__py3-none-any.whl → 0.3.92__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- inspect_ai/_cli/eval.py +4 -0
- inspect_ai/model/_openai_responses.py +13 -1
- {inspect_ai-0.3.91.dist-info → inspect_ai-0.3.92.dist-info}/METADATA +1 -1
- {inspect_ai-0.3.91.dist-info → inspect_ai-0.3.92.dist-info}/RECORD +8 -8
- {inspect_ai-0.3.91.dist-info → inspect_ai-0.3.92.dist-info}/WHEEL +0 -0
- {inspect_ai-0.3.91.dist-info → inspect_ai-0.3.92.dist-info}/entry_points.txt +0 -0
- {inspect_ai-0.3.91.dist-info → inspect_ai-0.3.92.dist-info}/licenses/LICENSE +0 -0
- {inspect_ai-0.3.91.dist-info → inspect_ai-0.3.92.dist-info}/top_level.txt +0 -0
inspect_ai/_cli/eval.py
CHANGED
@@ -1164,6 +1164,10 @@ def eval_retry_command(
|
|
1164
1164
|
elif fail_on_error == 0.0:
|
1165
1165
|
fail_on_error = True
|
1166
1166
|
|
1167
|
+
# resolve retry on error
|
1168
|
+
if retry_on_error == 0:
|
1169
|
+
retry_on_error = None
|
1170
|
+
|
1167
1171
|
# resolve log file
|
1168
1172
|
retry_log_files = [
|
1169
1173
|
log_file_info(filesystem(log_file).info(log_file)) for log_file in log_files
|
@@ -1,3 +1,4 @@
|
|
1
|
+
import json
|
1
2
|
from itertools import chain
|
2
3
|
from typing import TypedDict, cast
|
3
4
|
|
@@ -306,6 +307,14 @@ def _openai_input_items_from_chat_message_assistant(
|
|
306
307
|
"""
|
307
308
|
(output_message_id, tool_message_ids) = _ids_from_assistant_internal(message)
|
308
309
|
|
310
|
+
# we want to prevent yielding output messages in the case where we have an
|
311
|
+
# 'internal' field (so the message came from the model API as opposed to
|
312
|
+
# being user synthesized) AND there is no output_message_id (indicating that
|
313
|
+
# when reading the message from the server we didn't find output). this could
|
314
|
+
# happen e.g. when a react() agent sets the output.completion in response
|
315
|
+
# to a submit() tool call
|
316
|
+
suppress_output_message = message.internal is not None and output_message_id is None
|
317
|
+
|
309
318
|
# if we are not storing messages on the server then blank these out
|
310
319
|
if not store:
|
311
320
|
output_message_id = None
|
@@ -341,6 +350,9 @@ def _openai_input_items_from_chat_message_assistant(
|
|
341
350
|
)
|
342
351
|
)
|
343
352
|
case ContentText(text=text, refusal=refusal):
|
353
|
+
if suppress_output_message:
|
354
|
+
continue
|
355
|
+
|
344
356
|
new_content = (
|
345
357
|
ResponseOutputRefusalParam(type="refusal", refusal=text)
|
346
358
|
if refusal
|
@@ -415,7 +427,7 @@ def _tool_call_items_from_assistant_message(
|
|
415
427
|
type="function_call",
|
416
428
|
call_id=call.id,
|
417
429
|
name=_responses_tool_alias(call.function),
|
418
|
-
arguments=call.
|
430
|
+
arguments=json.dumps(call.arguments),
|
419
431
|
)
|
420
432
|
|
421
433
|
# add id if available
|
@@ -3,7 +3,7 @@ inspect_ai/__main__.py,sha256=oWX4YwDZDg3GS3-IG0yPGoSEOfSzWihELg7QmrUlxjM,67
|
|
3
3
|
inspect_ai/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
4
4
|
inspect_ai/_cli/cache.py,sha256=RVGuBYwwk3c45JfyfcSFJ419etSsv3-Z7AyfQE-Hul0,3912
|
5
5
|
inspect_ai/_cli/common.py,sha256=WbAgGbLcxABcWoEWiGCWSbkkxYr2jmL9i0cyseWHmRA,4165
|
6
|
-
inspect_ai/_cli/eval.py,sha256=
|
6
|
+
inspect_ai/_cli/eval.py,sha256=g1hNhMG79mtGYq1YAC-FKgdSwpTQK6jOj7yYu2IkOlY,38530
|
7
7
|
inspect_ai/_cli/info.py,sha256=QMxaTG9TmzW95EiLrOgkzubvavoR-VHxo3eV7ppmrzI,1789
|
8
8
|
inspect_ai/_cli/list.py,sha256=M8mazI8Zuq8Hp99YWKnxQd9UWx1Qi87zfXRzZYAAakk,2459
|
9
9
|
inspect_ai/_cli/log.py,sha256=O-w7GqsE7tLojPnEtpWXPSh0Vu2Hbrbxjneyc1BFfpk,5817
|
@@ -559,7 +559,7 @@ inspect_ai/model/_model_call.py,sha256=VJ8wnl9Y81JaiClBYM8eyt1jVb3n-yc6Dd88ofRiJ
|
|
559
559
|
inspect_ai/model/_model_output.py,sha256=UNodmzkeFE1JXfVtnu0i8q6rwgTj2BClJqcftLSGXdA,7829
|
560
560
|
inspect_ai/model/_openai.py,sha256=WlsWWMzP55_pxP_6yp_5eCKo4Ie418OgcgEDKmqjq34,24364
|
561
561
|
inspect_ai/model/_openai_computer_use.py,sha256=vbKkYLhqNuX16zuWfg5MaGp9H8URrPcLhKQ1pDsZtPo,5943
|
562
|
-
inspect_ai/model/_openai_responses.py,sha256
|
562
|
+
inspect_ai/model/_openai_responses.py,sha256=PW17R217NBy0exq4LLfM-eI0GTcG4gm6cxjVG9Uy3d8,22528
|
563
563
|
inspect_ai/model/_reasoning.py,sha256=qmR8WT6t_cb7NIsJOQHPyFZh2eLV0HmYxKo2vtvteQ4,929
|
564
564
|
inspect_ai/model/_registry.py,sha256=Cr2y32EqLnOqLbSWoXHVK4ivTTzCUhJuACxoTyPt8kY,2032
|
565
565
|
inspect_ai/model/_render.py,sha256=rWypNUjgrH4NGp0r-ESAze9gZz7lYNjheEP438vRYZE,922
|
@@ -724,9 +724,9 @@ inspect_ai/util/_sandbox/docker/internal.py,sha256=c8X8TLrBPOvsfnq5TkMlb_bzTALyc
|
|
724
724
|
inspect_ai/util/_sandbox/docker/prereqs.py,sha256=0j6_OauBBnVlpBleADcZavIAAQZy4WewVjbRn9c0stg,3355
|
725
725
|
inspect_ai/util/_sandbox/docker/service.py,sha256=hhHIWH1VDFLwehdGd19aUBD_VKfDO3GCPxpw1HSwVQk,2437
|
726
726
|
inspect_ai/util/_sandbox/docker/util.py,sha256=EeInihCNXgUWxaqZ4dNOJd719kXL2_jr63QCoXn68vA,3154
|
727
|
-
inspect_ai-0.3.
|
728
|
-
inspect_ai-0.3.
|
729
|
-
inspect_ai-0.3.
|
730
|
-
inspect_ai-0.3.
|
731
|
-
inspect_ai-0.3.
|
732
|
-
inspect_ai-0.3.
|
727
|
+
inspect_ai-0.3.92.dist-info/licenses/LICENSE,sha256=xZPCr8gTiFIerrA_DRpLAbw-UUftnLFsHxKeW-NTtq8,1081
|
728
|
+
inspect_ai-0.3.92.dist-info/METADATA,sha256=BtQ8ClHkDw2ChlQl_rV7AS4wtisP49cxajyuKIhCmkI,5143
|
729
|
+
inspect_ai-0.3.92.dist-info/WHEEL,sha256=SmOxYU7pzNKBqASvQJ7DjX3XGUF92lrGhMb3R6_iiqI,91
|
730
|
+
inspect_ai-0.3.92.dist-info/entry_points.txt,sha256=WGGLmzTzDWLzYfiyovSY6oEKuf-gqzSDNOb5V-hk3fM,54
|
731
|
+
inspect_ai-0.3.92.dist-info/top_level.txt,sha256=Tp3za30CHXJEKLk8xLe9qGsW4pBzJpEIOMHOHNCXiVo,11
|
732
|
+
inspect_ai-0.3.92.dist-info/RECORD,,
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|