inspect-ai 0.3.58__py3-none-any.whl → 0.3.60__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- inspect_ai/_cli/common.py +3 -1
- inspect_ai/_cli/eval.py +15 -9
- inspect_ai/_display/core/active.py +4 -1
- inspect_ai/_display/core/config.py +3 -3
- inspect_ai/_display/core/panel.py +7 -3
- inspect_ai/_display/plain/__init__.py +0 -0
- inspect_ai/_display/plain/display.py +203 -0
- inspect_ai/_display/rich/display.py +0 -5
- inspect_ai/_display/textual/widgets/port_mappings.py +110 -0
- inspect_ai/_display/textual/widgets/samples.py +79 -12
- inspect_ai/_display/textual/widgets/sandbox.py +37 -0
- inspect_ai/_eval/eval.py +10 -1
- inspect_ai/_eval/loader.py +79 -19
- inspect_ai/_eval/registry.py +6 -0
- inspect_ai/_eval/score.py +3 -1
- inspect_ai/_eval/task/results.py +51 -22
- inspect_ai/_eval/task/run.py +47 -13
- inspect_ai/_eval/task/sandbox.py +10 -5
- inspect_ai/_util/constants.py +1 -0
- inspect_ai/_util/port_names.py +61 -0
- inspect_ai/_util/text.py +23 -0
- inspect_ai/_view/www/App.css +31 -1
- inspect_ai/_view/www/dist/assets/index.css +31 -1
- inspect_ai/_view/www/dist/assets/index.js +25498 -2044
- inspect_ai/_view/www/log-schema.json +32 -2
- inspect_ai/_view/www/package.json +2 -0
- inspect_ai/_view/www/src/App.mjs +14 -16
- inspect_ai/_view/www/src/Types.mjs +1 -2
- inspect_ai/_view/www/src/api/Types.ts +133 -0
- inspect_ai/_view/www/src/api/{api-browser.mjs → api-browser.ts} +25 -13
- inspect_ai/_view/www/src/api/api-http.ts +219 -0
- inspect_ai/_view/www/src/api/api-shared.ts +47 -0
- inspect_ai/_view/www/src/api/{api-vscode.mjs → api-vscode.ts} +22 -19
- inspect_ai/_view/www/src/api/{client-api.mjs → client-api.ts} +93 -53
- inspect_ai/_view/www/src/api/index.ts +51 -0
- inspect_ai/_view/www/src/api/jsonrpc.ts +225 -0
- inspect_ai/_view/www/src/components/ChatView.mjs +133 -43
- inspect_ai/_view/www/src/components/DownloadButton.mjs +1 -1
- inspect_ai/_view/www/src/components/ExpandablePanel.mjs +0 -4
- inspect_ai/_view/www/src/components/LargeModal.mjs +19 -20
- inspect_ai/_view/www/src/components/TabSet.mjs +3 -1
- inspect_ai/_view/www/src/components/VirtualList.mjs +266 -84
- inspect_ai/_view/www/src/index.js +77 -4
- inspect_ai/_view/www/src/log/{remoteLogFile.mjs → remoteLogFile.ts} +62 -46
- inspect_ai/_view/www/src/navbar/Navbar.mjs +4 -1
- inspect_ai/_view/www/src/navbar/SecondaryBar.mjs +19 -10
- inspect_ai/_view/www/src/samples/SampleDialog.mjs +5 -1
- inspect_ai/_view/www/src/samples/SampleDisplay.mjs +23 -15
- inspect_ai/_view/www/src/samples/SampleList.mjs +19 -49
- inspect_ai/_view/www/src/samples/SampleScores.mjs +1 -1
- inspect_ai/_view/www/src/samples/SampleTranscript.mjs +8 -3
- inspect_ai/_view/www/src/samples/SamplesDescriptor.mjs +38 -26
- inspect_ai/_view/www/src/samples/SamplesTab.mjs +14 -11
- inspect_ai/_view/www/src/samples/SamplesTools.mjs +8 -8
- inspect_ai/_view/www/src/samples/tools/SampleFilter.mjs +712 -89
- inspect_ai/_view/www/src/samples/tools/SortFilter.mjs +2 -2
- inspect_ai/_view/www/src/samples/tools/filters.mjs +260 -87
- inspect_ai/_view/www/src/samples/transcript/ErrorEventView.mjs +24 -2
- inspect_ai/_view/www/src/samples/transcript/EventPanel.mjs +29 -24
- inspect_ai/_view/www/src/samples/transcript/EventRow.mjs +1 -1
- inspect_ai/_view/www/src/samples/transcript/InfoEventView.mjs +24 -2
- inspect_ai/_view/www/src/samples/transcript/InputEventView.mjs +24 -2
- inspect_ai/_view/www/src/samples/transcript/ModelEventView.mjs +31 -10
- inspect_ai/_view/www/src/samples/transcript/SampleInitEventView.mjs +24 -2
- inspect_ai/_view/www/src/samples/transcript/SampleLimitEventView.mjs +23 -2
- inspect_ai/_view/www/src/samples/transcript/ScoreEventView.mjs +24 -2
- inspect_ai/_view/www/src/samples/transcript/StepEventView.mjs +33 -3
- inspect_ai/_view/www/src/samples/transcript/SubtaskEventView.mjs +25 -2
- inspect_ai/_view/www/src/samples/transcript/ToolEventView.mjs +25 -2
- inspect_ai/_view/www/src/samples/transcript/TranscriptView.mjs +193 -11
- inspect_ai/_view/www/src/samples/transcript/Types.mjs +10 -0
- inspect_ai/_view/www/src/samples/transcript/state/StateEventView.mjs +26 -2
- inspect_ai/_view/www/src/types/log.d.ts +13 -2
- inspect_ai/_view/www/src/utils/Format.mjs +10 -3
- inspect_ai/_view/www/src/utils/{Json.mjs → json-worker.ts} +13 -9
- inspect_ai/_view/www/src/utils/vscode.ts +36 -0
- inspect_ai/_view/www/src/workspace/WorkSpace.mjs +11 -5
- inspect_ai/_view/www/vite.config.js +7 -0
- inspect_ai/_view/www/yarn.lock +116 -0
- inspect_ai/approval/_human/__init__.py +0 -0
- inspect_ai/approval/_human/manager.py +1 -1
- inspect_ai/approval/_policy.py +12 -6
- inspect_ai/log/_log.py +1 -1
- inspect_ai/log/_samples.py +16 -0
- inspect_ai/log/_transcript.py +4 -1
- inspect_ai/model/_call_tools.py +59 -0
- inspect_ai/model/_conversation.py +16 -7
- inspect_ai/model/_generate_config.py +12 -12
- inspect_ai/model/_model.py +117 -18
- inspect_ai/model/_model_output.py +22 -2
- inspect_ai/model/_openai.py +383 -0
- inspect_ai/model/_providers/anthropic.py +152 -55
- inspect_ai/model/_providers/azureai.py +21 -21
- inspect_ai/model/_providers/bedrock.py +37 -40
- inspect_ai/model/_providers/goodfire.py +248 -0
- inspect_ai/model/_providers/google.py +46 -54
- inspect_ai/model/_providers/groq.py +7 -3
- inspect_ai/model/_providers/hf.py +6 -0
- inspect_ai/model/_providers/mistral.py +13 -12
- inspect_ai/model/_providers/openai.py +51 -218
- inspect_ai/model/_providers/openai_o1.py +11 -12
- inspect_ai/model/_providers/providers.py +23 -1
- inspect_ai/model/_providers/together.py +12 -12
- inspect_ai/model/_providers/util/__init__.py +2 -3
- inspect_ai/model/_providers/util/hf_handler.py +1 -1
- inspect_ai/model/_providers/util/llama31.py +1 -1
- inspect_ai/model/_providers/util/util.py +0 -76
- inspect_ai/model/_providers/vertex.py +1 -4
- inspect_ai/scorer/_metric.py +3 -0
- inspect_ai/scorer/_reducer/reducer.py +1 -1
- inspect_ai/scorer/_scorer.py +4 -3
- inspect_ai/solver/__init__.py +4 -5
- inspect_ai/solver/_basic_agent.py +1 -1
- inspect_ai/solver/_bridge/__init__.py +3 -0
- inspect_ai/solver/_bridge/bridge.py +100 -0
- inspect_ai/solver/_bridge/patch.py +170 -0
- inspect_ai/solver/_prompt.py +35 -5
- inspect_ai/solver/_solver.py +6 -0
- inspect_ai/solver/_task_state.py +80 -38
- inspect_ai/tool/__init__.py +2 -0
- inspect_ai/tool/_tool.py +12 -1
- inspect_ai/tool/_tool_call.py +10 -0
- inspect_ai/tool/_tool_def.py +16 -5
- inspect_ai/tool/_tool_with.py +21 -4
- inspect_ai/tool/beta/__init__.py +5 -0
- inspect_ai/tool/beta/_computer/__init__.py +3 -0
- inspect_ai/tool/beta/_computer/_common.py +133 -0
- inspect_ai/tool/beta/_computer/_computer.py +155 -0
- inspect_ai/tool/beta/_computer/_computer_split.py +198 -0
- inspect_ai/tool/beta/_computer/_resources/Dockerfile +100 -0
- inspect_ai/tool/beta/_computer/_resources/README.md +30 -0
- inspect_ai/tool/beta/_computer/_resources/entrypoint/entrypoint.sh +18 -0
- inspect_ai/tool/beta/_computer/_resources/entrypoint/novnc_startup.sh +20 -0
- inspect_ai/tool/beta/_computer/_resources/entrypoint/x11vnc_startup.sh +48 -0
- inspect_ai/tool/beta/_computer/_resources/entrypoint/xfce_startup.sh +13 -0
- inspect_ai/tool/beta/_computer/_resources/entrypoint/xvfb_startup.sh +48 -0
- inspect_ai/tool/beta/_computer/_resources/image_home_dir/Desktop/Firefox Web Browser.desktop +10 -0
- inspect_ai/tool/beta/_computer/_resources/image_home_dir/Desktop/Visual Studio Code.desktop +10 -0
- inspect_ai/tool/beta/_computer/_resources/image_home_dir/Desktop/XPaint.desktop +10 -0
- inspect_ai/tool/beta/_computer/_resources/tool/__init__.py +0 -0
- inspect_ai/tool/beta/_computer/_resources/tool/_logger.py +22 -0
- inspect_ai/tool/beta/_computer/_resources/tool/_run.py +42 -0
- inspect_ai/tool/beta/_computer/_resources/tool/_tool_result.py +33 -0
- inspect_ai/tool/beta/_computer/_resources/tool/_x11_client.py +262 -0
- inspect_ai/tool/beta/_computer/_resources/tool/computer_tool.py +85 -0
- inspect_ai/tool/beta/_computer/_resources/tool/requirements.txt +0 -0
- inspect_ai/util/__init__.py +2 -0
- inspect_ai/util/_display.py +5 -0
- inspect_ai/util/_limit.py +26 -0
- inspect_ai/util/_sandbox/docker/docker.py +64 -1
- inspect_ai/util/_sandbox/docker/internal.py +3 -1
- inspect_ai/util/_sandbox/docker/prereqs.py +1 -1
- inspect_ai/util/_sandbox/environment.py +14 -0
- {inspect_ai-0.3.58.dist-info → inspect_ai-0.3.60.dist-info}/METADATA +3 -2
- {inspect_ai-0.3.58.dist-info → inspect_ai-0.3.60.dist-info}/RECORD +159 -126
- inspect_ai/_view/www/src/api/Types.mjs +0 -117
- inspect_ai/_view/www/src/api/api-http.mjs +0 -300
- inspect_ai/_view/www/src/api/api-shared.mjs +0 -10
- inspect_ai/_view/www/src/api/index.mjs +0 -49
- inspect_ai/_view/www/src/api/jsonrpc.mjs +0 -208
- inspect_ai/_view/www/src/samples/transcript/TranscriptState.mjs +0 -70
- inspect_ai/_view/www/src/utils/vscode.mjs +0 -16
- {inspect_ai-0.3.58.dist-info → inspect_ai-0.3.60.dist-info}/LICENSE +0 -0
- {inspect_ai-0.3.58.dist-info → inspect_ai-0.3.60.dist-info}/WHEEL +0 -0
- {inspect_ai-0.3.58.dist-info → inspect_ai-0.3.60.dist-info}/entry_points.txt +0 -0
- {inspect_ai-0.3.58.dist-info → inspect_ai-0.3.60.dist-info}/top_level.txt +0 -0
inspect_ai/_util/text.py
CHANGED
@@ -108,3 +108,26 @@ def str_to_float(s: str) -> float:
|
|
108
108
|
exponent = 1 # Default exponent is 1 if no superscript is present
|
109
109
|
|
110
110
|
return base**exponent
|
111
|
+
|
112
|
+
|
113
|
+
def truncate(text: str, length: int, overflow: str = "...", pad: bool = True) -> str:
|
114
|
+
"""
|
115
|
+
Truncate text to specified length with optional padding and overflow indicator.
|
116
|
+
|
117
|
+
Args:
|
118
|
+
text (str): Text to truncate
|
119
|
+
length (int): Maximum length including overflow indicator
|
120
|
+
overflow (str): String to indicate truncation (defaults to '...')
|
121
|
+
pad (bool): Whether to pad the result to full length (defaults to padding)
|
122
|
+
|
123
|
+
Returns:
|
124
|
+
Truncated string, padded if requested
|
125
|
+
|
126
|
+
"""
|
127
|
+
if len(text) <= length:
|
128
|
+
return text + (" " * (length - len(text))) if pad else text
|
129
|
+
|
130
|
+
overflow_length = len(overflow)
|
131
|
+
truncated = text[: length - overflow_length] + overflow
|
132
|
+
|
133
|
+
return truncated
|
inspect_ai/_view/www/App.css
CHANGED
@@ -9,6 +9,12 @@
|
|
9
9
|
--inspect-input-border: var(--bs-light-border-subtle);
|
10
10
|
--inspect-diff-add-color: #dafbe1;
|
11
11
|
--inspect-diff-remove-color: #ffebe9;
|
12
|
+
--inspect-inactive-selection-background: var(--vscode-editor-inactiveSelectionBackground, #d9d9d9);
|
13
|
+
--inspect-active-selection-background: var(--vscode-editor-selectionBackground, #d7d4f0);
|
14
|
+
--inspect-focus-border-color: #86b7fe;
|
15
|
+
--inspect-focus-border-shadow: 0 0 0 0.25rem rgba(var(--bs-primary-rgb), 0.25);
|
16
|
+
--inspect-focus-border-gray-color: #808080;
|
17
|
+
--inspect-focus-border-gray-shadow: 0 0 0 0.25rem rgba(48, 48, 48, 0.25);
|
12
18
|
}
|
13
19
|
|
14
20
|
body:not([class^="vscode-"]) button {
|
@@ -650,6 +656,30 @@ table.table.table-sm td {
|
|
650
656
|
height: auto !important;
|
651
657
|
}
|
652
658
|
|
659
|
+
[data-tooltip] {
|
660
|
+
position: relative;
|
661
|
+
}
|
662
|
+
[data-tooltip]:hover::after {
|
663
|
+
content: attr(data-tooltip);
|
664
|
+
position: absolute;
|
665
|
+
line-height: 1.25;
|
666
|
+
background: var(--bs-light);
|
667
|
+
color: var(--bs-body-color);
|
668
|
+
opacity: 1;
|
669
|
+
padding: 4px 8px;
|
670
|
+
border-radius: 4px;
|
671
|
+
border: 1px solid var(--bs-border-color);
|
672
|
+
box-shadow: 0 2px 10px 0 rgba(0, 0, 0, 0.25);
|
673
|
+
white-space: pre-wrap;
|
674
|
+
width: max-content;
|
675
|
+
max-width: 400px;
|
676
|
+
z-index: 1000;
|
677
|
+
}
|
678
|
+
[data-tooltip][data-tooltip-position="bottom-left"]:hover::after {
|
679
|
+
right: 0%;
|
680
|
+
top: 100%;
|
681
|
+
}
|
682
|
+
|
653
683
|
/* ANSI Coloring */
|
654
684
|
.ansi-display {
|
655
685
|
font-family: monospace;
|
@@ -725,7 +755,7 @@ pre[class*="language-"].tool-output {
|
|
725
755
|
background: none !important;
|
726
756
|
border: none !important;
|
727
757
|
box-shadow: none !important;
|
728
|
-
border-radius: var(--bs-border-radius) !important;
|
758
|
+
border-radius: var(--bs-border-radius) !important;
|
729
759
|
}
|
730
760
|
|
731
761
|
/* lightbox styles */
|
@@ -14282,6 +14282,12 @@ pre[class*="language-"] {
|
|
14282
14282
|
--inspect-input-border: var(--bs-light-border-subtle);
|
14283
14283
|
--inspect-diff-add-color: #dafbe1;
|
14284
14284
|
--inspect-diff-remove-color: #ffebe9;
|
14285
|
+
--inspect-inactive-selection-background: var(--vscode-editor-inactiveSelectionBackground, #d9d9d9);
|
14286
|
+
--inspect-active-selection-background: var(--vscode-editor-selectionBackground, #d7d4f0);
|
14287
|
+
--inspect-focus-border-color: #86b7fe;
|
14288
|
+
--inspect-focus-border-shadow: 0 0 0 0.25rem rgba(var(--bs-primary-rgb), 0.25);
|
14289
|
+
--inspect-focus-border-gray-color: #808080;
|
14290
|
+
--inspect-focus-border-gray-shadow: 0 0 0 0.25rem rgba(48, 48, 48, 0.25);
|
14285
14291
|
}
|
14286
14292
|
|
14287
14293
|
body:not([class^="vscode-"]) button {
|
@@ -14923,6 +14929,30 @@ table.table.table-sm td {
|
|
14923
14929
|
height: auto !important;
|
14924
14930
|
}
|
14925
14931
|
|
14932
|
+
[data-tooltip] {
|
14933
|
+
position: relative;
|
14934
|
+
}
|
14935
|
+
[data-tooltip]:hover::after {
|
14936
|
+
content: attr(data-tooltip);
|
14937
|
+
position: absolute;
|
14938
|
+
line-height: 1.25;
|
14939
|
+
background: var(--bs-light);
|
14940
|
+
color: var(--bs-body-color);
|
14941
|
+
opacity: 1;
|
14942
|
+
padding: 4px 8px;
|
14943
|
+
border-radius: 4px;
|
14944
|
+
border: 1px solid var(--bs-border-color);
|
14945
|
+
box-shadow: 0 2px 10px 0 rgba(0, 0, 0, 0.25);
|
14946
|
+
white-space: pre-wrap;
|
14947
|
+
width: max-content;
|
14948
|
+
max-width: 400px;
|
14949
|
+
z-index: 1000;
|
14950
|
+
}
|
14951
|
+
[data-tooltip][data-tooltip-position="bottom-left"]:hover::after {
|
14952
|
+
right: 0%;
|
14953
|
+
top: 100%;
|
14954
|
+
}
|
14955
|
+
|
14926
14956
|
/* ANSI Coloring */
|
14927
14957
|
.ansi-display {
|
14928
14958
|
font-family: monospace;
|
@@ -14998,7 +15028,7 @@ pre[class*="language-"].tool-output {
|
|
14998
15028
|
background: none !important;
|
14999
15029
|
border: none !important;
|
15000
15030
|
box-shadow: none !important;
|
15001
|
-
border-radius: var(--bs-border-radius) !important;
|
15031
|
+
border-radius: var(--bs-border-radius) !important;
|
15002
15032
|
}
|
15003
15033
|
|
15004
15034
|
/* lightbox styles */
|