inspect-ai 0.3.52__tar.gz → 0.3.54__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/CHANGELOG.md +60 -33
- {inspect_ai-0.3.52/src/inspect_ai.egg-info → inspect_ai-0.3.54}/PKG-INFO +6 -8
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/README.md +5 -5
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/_quarto.yml +0 -3
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/_sandboxenv-interface.md +1 -1
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/eval-logs.qmd +1 -1
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/extensions.qmd +6 -1
- inspect_ai-0.3.54/docs/images/task-max-sandboxes.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/parallelism.qmd +6 -4
- inspect_ai-0.3.54/docs/scripts/post-render.sh +23 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/tools.qmd +6 -6
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/tutorial.qmd +2 -2
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/pyproject.toml +0 -1
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/requirements.txt +0 -1
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_cli/eval.py +55 -1
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_cli/main.py +2 -0
- inspect_ai-0.3.54/src/inspect_ai/_cli/trace.py +244 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_display/core/progress.py +9 -3
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_display/core/results.py +8 -4
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_display/textual/app.py +5 -1
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_display/textual/widgets/task_detail.py +3 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_display/textual/widgets/tasks.py +97 -6
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_eval/eval.py +33 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_eval/evalset.py +4 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_eval/registry.py +2 -2
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_eval/task/images.py +4 -14
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_eval/task/results.py +22 -4
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_eval/task/run.py +40 -20
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_eval/task/sandbox.py +72 -43
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_eval/task/task.py +4 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_eval/task/util.py +2 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/constants.py +3 -3
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/display.py +1 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/logger.py +34 -8
- inspect_ai-0.3.54/src/inspect_ai/_util/trace.py +275 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/App.css +13 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/dist/assets/index.css +13 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/dist/assets/index.js +80 -43
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/App.mjs +31 -6
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/Types.mjs +6 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/JsonPanel.mjs +11 -17
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/MessageContent.mjs +9 -2
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/Tools.mjs +46 -18
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/navbar/Navbar.mjs +12 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/SampleList.mjs +2 -2
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/ToolEventView.mjs +2 -2
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/log/_log.py +6 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/log/_message.py +2 -2
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/log/_recorders/eval.py +8 -18
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/log/_recorders/json.py +19 -17
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_cache.py +22 -16
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_call_tools.py +9 -1
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_generate_config.py +8 -2
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_model.py +11 -12
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/azureai.py +1 -1
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/bedrock.py +18 -2
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/hf.py +1 -1
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/openai.py +32 -8
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/providers.py +1 -1
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/vllm.py +1 -1
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_web_browser.py +1 -1
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/context.py +7 -3
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/docker/compose.py +58 -19
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/docker/config.py +8 -10
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/docker/docker.py +20 -16
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/docker/util.py +3 -9
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/environment.py +7 -2
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/limits.py +1 -1
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/local.py +8 -9
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/service.py +17 -7
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/util/_subprocess.py +6 -1
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/util/_subtask.py +8 -2
- {inspect_ai-0.3.52 → inspect_ai-0.3.54/src/inspect_ai.egg-info}/PKG-INFO +6 -8
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai.egg-info/SOURCES.txt +4 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai.egg-info/requires.txt +0 -2
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/scorer/test_metric.py +80 -0
- inspect_ai-0.3.54/tests/solver/test_setup.py +21 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/tools/test_tool_types.py +39 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/CHANGELOG.md +9 -1
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/package.json +1 -1
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/extension.ts +1 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/logview/logview-panel.ts +1 -1
- inspect_ai-0.3.52/docs/scripts/post-render.sh +0 -13
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/.github/dependabot.yml +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/.github/pull_request_template.md +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/.github/workflows/build.yml +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/.github/workflows/docs.yml +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/.github/workflows/log_viewer.yml +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/.github/workflows/pypi.yml +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/.github/workflows/vscode.yml +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/.gitignore +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/.pre-commit-config.yaml +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/.vscode/extensions.json +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/.vscode/settings.json +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/CITATION.cff +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/LICENSE +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/Makefile +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/.gitignore +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/CNAME +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/_errors_and_retries.md +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/_sample-preservation.md +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/_tools-annotations-required.md +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/_tools-scaffold.md +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/_trace.md +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/_variables.yml +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/agents-api.qmd +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/agents.qmd +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/approval.qmd +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/caching.qmd +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/datasets.qmd +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/errors-and-limits.qmd +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/eval-sets.qmd +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/examples/examples.bib +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/examples/examples.css +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/examples/examples.ejs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/examples/examples.yml +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/examples/index.qmd +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/aisi-logo.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/eval-log.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/inspect-activity-bar.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/inspect-multiple-models.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/inspect-view-answers.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/inspect-view-filter.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/inspect-view-history.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/inspect-view-home.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/inspect-view-info.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/inspect-view-logging-console.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/inspect-view-logging.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/inspect-view-main.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/inspect-view-messages.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/inspect-view-metadata.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/inspect-view-scoring.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/inspect-view-sort.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/inspect-view-splash.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/inspect-vscode-config.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/inspect-vscode-install.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/inspect-vscode-logview.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/inspect-vscode-output-channel.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/inspect-vscode-run-task.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/inspect.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/logs-drop-down.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/logs-open-button.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/logs.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/popularity.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/python-tool-view.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/rate-limit.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/running-theory.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/toolenv-no-cleanup.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/images/web-browser-tool-view.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/index.qmd +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/interactivity.qmd +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/llms.txt +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/log-viewer.qmd +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/models.qmd +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/scorers.qmd +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/solvers.qmd +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/theme.scss +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/vscode.qmd +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/docs/workflow.qmd +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/approval/README.md +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/approval/approval.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/approval/approval.yaml +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/biology_qa.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/browser/browser.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/browser/compose.yaml +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/cache.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/evalset.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/hello_world.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/images/ballons.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/images/bike.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/images/images.jsonl +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/images/images.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/intervention/Dockerfile +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/intervention/README.md +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/intervention/compose.yaml +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/intervention/intervention.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/langchain/.env.example +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/langchain/.gitignore +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/langchain/README.md +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/langchain/inspect_langchain.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/langchain/requirements.txt +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/langchain/wikipedia.jsonl +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/langchain/wikipedia.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/popularity.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/security_guide.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/theory_of_mind.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/examples/tool_use.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/setup.cfg +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/__init__.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/__main__.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_cli/cache.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_cli/common.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_cli/info.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_cli/list.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_cli/log.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_cli/sandbox.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_cli/score.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_cli/util.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_cli/view.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_display/__init__.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_display/core/active.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_display/core/config.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_display/core/display.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_display/core/footer.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_display/core/group.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_display/core/panel.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_display/core/rich.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_display/core/textual.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_display/rich/__init__.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_display/rich/display.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_display/textual/app.tcss +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_display/textual/display.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_display/textual/theme.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_display/textual/widgets/clock.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_display/textual/widgets/console.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_display/textual/widgets/footer.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_display/textual/widgets/samples.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_display/textual/widgets/titlebar.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_display/textual/widgets/toggle.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_display/textual/widgets/transcript.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_eval/context.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_eval/list.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_eval/loader.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_eval/run.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_eval/score.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_eval/task/__init__.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_eval/task/constants.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_eval/task/epochs.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_eval/task/error.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_eval/task/generate.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_eval/task/log.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_eval/task/rundir.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/_async.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/appdirs.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/config.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/content.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/datetime.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/decorator.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/deprecation.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/dev.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/dict.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/dotenv.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/entrypoints.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/environ.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/error.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/file.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/format.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/git.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/hash.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/hooks.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/html.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/http.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/images.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/json.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/list.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/notebook.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/package.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/path.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/pattern.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/platform.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/registry.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/retry.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/rich.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/samples.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/terminal.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/text.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/throttle.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/timeouts.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/transcript.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/url.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_util/version.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/notify.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/schema.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/server.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/view.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/.gitignore +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/.prettierignore +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/.tool-versions +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/README.md +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/dist/assets/favicon.svg +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/dist/index.html +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/eslint.config.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/favicon.svg +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/index.html +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/jsconfig.json +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/log-schema.json +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/package.json +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/postcss.config.cjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/Register.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/api/Types.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/api/api-browser.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/api/api-http.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/api/api-shared.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/api/api-vscode.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/api/client-api.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/api/index.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/api/jsonrpc.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/appearance/Colors.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/appearance/Fonts.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/appearance/Icons.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/appearance/Styles.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/AnsiDisplay.css +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/AnsiDisplay.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/AppErrorBoundary.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/Browser.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/Card.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/ChatView.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/CopyButton.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/Dialog.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/DownloadButton.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/DownloadPanel.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/EmptyPanel.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/ErrorPanel.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/ExpandablePanel.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/FindBand.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/LabeledValue.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/LargeModal.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/MarkdownDiv.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/MessageBand.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/MetaDataGrid.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/MetaDataView.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/MorePopOver.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/NavPills.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/ProgressBar.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/RenderedContent/ChatMessageRenderer.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/RenderedContent/RenderedContent.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/RenderedContent/Types.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/TabSet.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/ToolButton.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/VirtualList.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/ansi-output.js +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/constants.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/index.js +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/json/JsonTab.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/log/remoteLogFile.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/log-reader/Log-Reader.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/log-reader/Native-Log-Reader.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/log-reader/Open-AI-Log-Reader.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/navbar/SecondaryBar.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/plan/PlanCard.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/SampleDialog.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/SampleDisplay.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/SampleError.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/SampleLimit.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/SampleScoreView.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/SampleScores.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/SampleTranscript.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/SamplesDescriptor.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/SamplesTab.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/SamplesTools.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/tools/EpochFilter.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/tools/SampleFilter.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/tools/SelectScorer.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/tools/SortFilter.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/tools/filters.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/ApprovalEventView.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/ErrorEventView.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/EventPanel.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/EventRow.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/EventSection.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/InfoEventView.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/InputEventView.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/LoggerEventView.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/ModelEventView.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/SampleInitEventView.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/SampleLimitEventView.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/ScoreEventView.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/StepEventView.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/SubtaskEventView.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/TranscriptState.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/TranscriptView.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/Types.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/state/StateDiffView.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/state/StateEventRenderers.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/state/StateEventView.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/sidebar/Sidebar.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/types/jsondiffpatch.d.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/types/log.d.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/types/prism.d.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/usage/ModelTokenTable.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/usage/UsageCard.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/Base64.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/Format.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/Git.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/Html.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/Json.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/Path.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/Print.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/Type.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/attachments.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/debugging.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/http.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/queue.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/remoteZipFile.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/sync.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/vscode.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/workspace/TaskErrorPanel.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/workspace/WorkSpace.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/tsconfig.json +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/vite.config.js +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/yarn.lock +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/approval/__init__.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/approval/_apply.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/approval/_approval.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/approval/_approver.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/approval/_auto.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/approval/_call.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/approval/_human/approver.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/approval/_human/console.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/approval/_human/manager.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/approval/_human/panel.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/approval/_human/util.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/approval/_policy.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/approval/_registry.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/dataset/__init__.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/dataset/_dataset.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/dataset/_examples/bias_detection.jsonl +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/dataset/_examples/biology_qa.jsonl +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/dataset/_examples/popularity.jsonl +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/dataset/_examples/security_guide.jsonl +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/dataset/_examples/theory_of_mind.jsonl +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/dataset/_sources/csv.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/dataset/_sources/example.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/dataset/_sources/file.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/dataset/_sources/hf.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/dataset/_sources/json.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/dataset/_sources/util.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/dataset/_util.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/log/__init__.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/log/_bundle.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/log/_condense.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/log/_convert.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/log/_file.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/log/_recorders/__init__.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/log/_recorders/create.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/log/_recorders/file.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/log/_recorders/recorder.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/log/_retry.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/log/_samples.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/log/_transcript.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/__init__.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_chat_message.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_image.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_model_call.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_model_output.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/anthropic.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/cloudflare.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/google.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/grok.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/groq.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/llama_cpp_python.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/mistral.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/mockllm.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/ollama.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/openai_o1.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/together.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/util/__init__.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/util/chatapi.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/util/hf_handler.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/util/llama31.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/util/util.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/vertex.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_registry.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_render.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/model/_trace.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/py.typed +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/scorer/__init__.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_answer.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_choice.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_classification.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_common.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_match.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_metric.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_metrics/__init__.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_metrics/accuracy.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_metrics/mean.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_metrics/std.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_model.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_multi.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_pattern.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_reducer/__init__.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_reducer/reducer.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_reducer/registry.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_reducer/types.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_score.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_scorer.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_target.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/solver/__init__.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/solver/_basic_agent.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/solver/_chain.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/solver/_critique.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/solver/_fork.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/solver/_multiple_choice.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/solver/_plan.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/solver/_prompt.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/solver/_solver.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/solver/_task_state.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/solver/_transcript.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/solver/_use_tools.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/solver/_util.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/__init__.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tool.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tool_call.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tool_choice.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tool_def.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tool_description.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tool_info.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tool_params.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tool_transcript.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tool_with.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_execute.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/__init__.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/Dockerfile +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/README.md +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/accessibility_node.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/dm_env_servicer.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/images/usage_diagram.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/mock_environment.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/playwright_crawler.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/test_accessibility_node.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/test_dm_env_servicer.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/test_playwright_crawler.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/test_web_environment.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/web_client.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/web_client_new_session.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/web_environment.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/web_server.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_search.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/util/__init__.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/util/_concurrency.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/util/_console.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/util/_panel.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/util/_resource.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/__init__.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/docker/cleanup.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/docker/internal.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/docker/prereqs.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/registry.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/self_check.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/util/_store.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai/util/_trace.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai.egg-info/dependency_links.txt +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai.egg-info/entry_points.txt +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/src/inspect_ai.egg-info/top_level.txt +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/approval/approve.yaml +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/approval/escalate.yaml +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/approval/modify.yaml +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/approval/reject.yaml +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/approval/terminate.yaml +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/approval/test_approval.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/conftest.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/dataset/test_dataset/dataset.jsonl +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/dataset/test_dataset/images/ballons.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/dataset/test_dataset/images.jsonl +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/dataset/test_dataset/samples-md.csv +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/dataset/test_dataset/samples-md.json +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/dataset/test_dataset/samples-md.jsonl +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/dataset/test_dataset/samples.csv +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/dataset/test_dataset/samples.json +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/dataset/test_dataset/samples.jsonl +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/dataset/test_dataset.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/log/test_eval_log/log_formats.json +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/log/test_eval_log/log_images.json +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/log/test_eval_log/log_images_tc.json +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/log/test_eval_log/log_invalid.txt +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/log/test_eval_log/log_length_stop_reason.txt +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/log/test_eval_log/log_streaming.eval +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/log/test_eval_log/log_valid.txt +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/log/test_eval_log/log_version_3.txt +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/log/test_eval_log/log_with_nan.txt +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/log/test_eval_log.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/log/test_list_logs/2024-11-05T13-31-45-05-00_input-task_8zXjbRzCWrL9GXiXo2vus9.json +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/log/test_list_logs/2024-11-05T13-32-37-05-00_input-task_hxs4q9azL3ySGkjJirypKZ.eval +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/log/test_list_logs/custom.eval +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/log/test_list_logs/ignore.json +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/log/test_list_logs.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/log/test_log_attachments.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/log/test_log_formats.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/log/test_log_level.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/log/test_log_streaming.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/log/test_log_tags.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/model/providers/test_anthropic.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/model/providers/test_azureai.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/model/providers/test_cloudflare.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/model/providers/test_google.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/model/providers/test_grok.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/model/providers/test_groq.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/model/providers/test_hf.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/model/providers/test_llama_cpp_python.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/model/providers/test_openai.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/model/providers/test_openai_o1.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/model/providers/test_vertex.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/model/providers/test_vllm.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/model/test_api_key.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/model/test_collapse_assistant_message.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/model/test_collapse_user_message.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/model/test_disable.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/model/test_logprobs.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/model/test_mock_model_llm.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/model/test_num_choices.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/model/test_parse_tool_call.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/model/test_stop_reason.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/scorer/test_answer.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/scorer/test_choice.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/scorer/test_classification.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/scorer/test_match.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/scorer/test_model_graded.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/scorer/test_multiscorer.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/scorer/test_pattern.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/scorer/test_reducers.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/scorer/test_scorer.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/scorer/test_value_to_float.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/solver/test_basic_agent.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/solver/test_chain.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/solver/test_fork.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/solver/test_multiple_choice.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/solver/test_prompt.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/solver/test_solver.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/solver/test_solver_decorator.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/solver/test_solver_spec.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/solver/test_store.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/solver/test_subtask.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/solver/test_transcript.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_eval.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_eval_config/model.yaml +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_eval_config/solver.yaml +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_eval_config/task.yaml +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_eval_config.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_eval_set/2024-08-29T15-11-17+00-00_popularity_5EAmX6wjMFqea6WY7XHzZp.json +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_eval_set/2024-08-29T15-11-18+00-00_popularity_5EAmX6wjMFqea6WY7XHzZp.json +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_eval_set.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_examples.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_extensions.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_fail_on_error.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_helpers/__init__.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_helpers/tasks.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_helpers/tool_call_utils.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_helpers/tools.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_helpers/utils.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_list_task.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_log_dir/example_task/example_task.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_log_dir/test_log_dir.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_package/.gitignore +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_package/inspect_package/__init__.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_package/inspect_package/_registry.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_package/inspect_package/approvers/renamer.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_package/inspect_package/modelapi/custom.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_package/inspect_package/py.typed +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_package/inspect_package/sandboxenv/podman.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_package/inspect_package/score/scorer.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_package/inspect_package/solvers/cot.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_package/pyproject.toml +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_retry.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_run_dir/task1/task1.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_run_dir/task2/task2.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_run_dir.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_sample_id.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_sample_limits.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_task_attr.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_task_list/__init__.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_task_list/attribs.ipynb +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_task_list/multiple.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_task_list/multiple_dir/_decoy/testit.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_task_list/multiple_dir/_decoy2.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_task_list/multiple_dir/bar.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_task_list/multiple_dir/foo.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_task_list/recurse/.folder3/epsilon.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_task_list/recurse/folder1/_decoy.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_task_list/recurse/folder1/theta.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_task_list/recurse/folder2/.folder3/epsilon.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_task_list/recurse/folder2/another.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/test_task_list/recurse/folder2/first.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/tools/docker-compose-context/Dockerfile +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/tools/docker-compose-context-alpine/Dockerfile +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/tools/test_bash_tool.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/tools/test_max_exec_output.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/tools/test_max_tool_output.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/tools/test_python_tool.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/tools/test_sandbox_compose.yaml +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/tools/test_sandbox_compose_alpine.yaml +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/tools/test_sandbox_docker_and_local.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/tools/test_sandbox_dockerfile.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/tools/test_sandbox_tool_eval.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/tools/test_tool_def.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/tools/test_tool_parse.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/tools/test_tool_view.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/tools/test_tool_with.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/tools/test_tools.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/tools/test_use_tools.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/tools/test_web_browser.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/tools/test_web_browser_compose.yaml +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/util/sandbox/docker_compose_multiple_services/docker-compose.yaml +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/util/sandbox/sandbox_setup.sh +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/util/sandbox/test_docker_compose_multiple_services.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/util/sandbox/test_sandbox_service.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/util/sandbox/test_sandbox_setup.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/util/test_file.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/util/test_images/images.jsonl +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/util/test_images.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/util/test_package.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/util/test_registry.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/util/test_str_to_float.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/util/test_subprocess.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tests/view/test_bundle.py +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/.eslintrc.json +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/.gitignore +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/.vscode/extensions.json +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/.vscode/launch.json +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/.vscode/settings.json +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/.vscode/tasks.json +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/.vscode-test.mjs +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/.vscodeignore +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/.yarnrc +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/LICENSE +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/README.md +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/assets/icon/eval-treeview.svg +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/assets/icon/eval.svg +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/assets/logo/inspect.png +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/assets/logo/inspect.svg +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/assets/templates/task.py.template +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/assets/www/codicon/codicon.css +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/assets/www/codicon/codicon.ttf +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/assets/www/view/view-overrides.css +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/@types/hooks.d.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/@types/log.d.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/components/document.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/components/error.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/components/focus.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/components/notebook.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/components/symbol.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/components/task.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/components/templates.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/components/webview.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/core/appdirs.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/core/command.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/core/dispose.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/core/env.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/core/file.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/core/git.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/core/jsonrpc.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/core/log.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/core/nonce.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/core/path.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/core/port.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/core/process.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/core/python/code.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/core/python/env.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/core/python/exec.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/core/python/index.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/core/python/interpreter.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/core/random.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/core/string.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/core/text.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/core/uri.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/core/vscode/association.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/core/wait.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/core/workspace.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/hooks/hooks.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/hooks/index.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/hooks/preview.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/inspect/index.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/inspect/logs.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/inspect/props.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/inspect/version.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/active-task/active-task-command.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/active-task/active-task-provider.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/activity-bar-provider.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/env-config-provider.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/log-listing/log-directory-selector.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/log-listing/log-listing-data.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/log-listing/log-listing-mru.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/log-listing/log-listing-provider.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/log-listing/log-listing.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/task-config-commands.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/task-config-provider.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/task-outline-commands.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/task-outline-provider.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/webview/env-config-webview.css +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/webview/env-config-webview.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/webview/task-config-webview.css +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/webview/task-config-webview.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/webview/vscode-controls.css +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/webview/webview-utils.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/codelens/codelens-provider.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/inspect/inspect-commands.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/inspect/inspect-constants.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/inspect/inspect-eval-commands.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/inspect/inspect-eval.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/inspect/inspect-logs-watcher.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/inspect/inspect-manager.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/inspect/inspect-view-server.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/lognotify.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/logview/commands.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/logview/logview-editor.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/logview/logview-link-provider.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/logview/logview-state.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/logview/logview-view.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/logview/logview.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/openlog.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/protocol-handler.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/settings/inspect-settings.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/settings/user-settings.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/statusbar.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/workspace/workspace-env-commands.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/workspace/workspace-env-provider.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/workspace/workspace-init.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/workspace/workspace-state-provider.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/providers/workspace/workspace-task-provider.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/src/test/extension.test.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/tools/ts-to-mjs/.gitignore +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/tools/ts-to-mjs/package.json +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/tools/ts-to-mjs/rollup.config.js +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/tools/ts-to-mjs/src/index.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/tools/ts-to-mjs/src/jsonrpc.ts +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/tools/ts-to-mjs/yarn.lock +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/tsconfig.json +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/webpack.config.js +0 -0
- {inspect_ai-0.3.52 → inspect_ai-0.3.54}/tools/vscode/yarn.lock +0 -0
@@ -1,5 +1,35 @@
|
|
1
1
|
# Changelog
|
2
2
|
|
3
|
+
## v0.3.54 (26 December 2024)
|
4
|
+
|
5
|
+
- [Action tracing](https://github.com/UKGovernmentBEIS/inspect_ai/pull/1038) for diagnosing runs with unterminated actions (e.g. model calls, docker commands).
|
6
|
+
- Provide default timeout/retry for docker compose commands to mitigate unreliability in some configurations.
|
7
|
+
- Switch to sync S3 writes to overcome unreliability observed when using async interface.
|
8
|
+
- Task display: Added `--no-score-display` option to disable realtime scoring metrics.
|
9
|
+
- Bugfix: Fix failure to fully clone samples that have message lists as input.
|
10
|
+
- llama-cpp-python: Support for `logprobs`.
|
11
|
+
|
12
|
+
## v0.3.53 (20 December 2024)
|
13
|
+
|
14
|
+
- OpenAI: Support for o1 including native tool calling and `reasoning_effort` generation option.
|
15
|
+
- Task API: Introduce `setup` step that always runs even if `solver` is replaced.
|
16
|
+
- Bedrock: Support for tool calling on Nova models.
|
17
|
+
- Bedrock: Support for custom `model_args` passed through to `session.Client`.
|
18
|
+
- Bedrock: Support for `jpeg` images.
|
19
|
+
- Bedrock: Correct max_tokens for llama3-8b, llama3-70b models on Bedrock.
|
20
|
+
- Inspect View: Various improvements to appearance of tool calls in transcript.
|
21
|
+
- Task display: Ensure that widths of progress elements are kept consistent across tasks.
|
22
|
+
- Sandboxes: New `max_sandboxes` option for (per-provider) maximum number of running sandboxes.
|
23
|
+
- Sandboxes: Remove use of aiofiles to mitigate potential for threading deadlocks.
|
24
|
+
- Concurrency: Do not use `max_tasks` as a lower bound for `max_samples`.
|
25
|
+
- Log recorder: Always re-open log buffer for `eval` format logs.
|
26
|
+
- Bugfix: Proper handling of text find for eval raw JSON display
|
27
|
+
- Bugfix: Correct handling for `--sample-id` integer comparisons.
|
28
|
+
- Bugfix: Proper removal of model_args with falsey values (explicit check for `None`)
|
29
|
+
- Bugfix: Properly handle custom metrics that return dictionaries or lists
|
30
|
+
- Bugfix: Proper sample count display when retrying an evaluation
|
31
|
+
- Bugfix: Fix inability to define and run tasks in a notebook.
|
32
|
+
|
3
33
|
## v0.3.52 (13 December 2024)
|
4
34
|
|
5
35
|
- Eval: `--sample-id` option for evaluating specific sample id(s).
|
@@ -26,10 +56,10 @@
|
|
26
56
|
- Task display: Resolve issue where task display would lose mouse input after VS Code reload.
|
27
57
|
- Datasets: Validate that all IDs in datasets are unique (as several downstream problems occur w/ duplicate IDs).
|
28
58
|
- Inspect View: Fix issue with incorrectly displayed custom tool views.
|
29
|
-
- Human approval: Use
|
59
|
+
- Human approval: Use fullscreen display (makes approval UI async and enables rapid processing of approvals via the `Enter` key).
|
30
60
|
- Added `input_panel()` API for adding custom panels to the fullscreen task display.
|
31
61
|
- Log recorder: Methods are now async which will improve performance for fsspec filesystems with async implementations (e.g. S3)
|
32
|
-
- Log recorder: Improve `.eval` log reading performance for remote filesystem (
|
62
|
+
- Log recorder: Improve `.eval` log reading performance for remote filesystem (eagerly fetch log to local buffer).
|
33
63
|
- Add `token_usage` property to `TaskState` which has current total tokens used across all calls to `generate()` (same value that is used for enforcing token limits).
|
34
64
|
- Add `time` field to `ModelOutput` that records total time spent within call to ModelAPI `generate()`.
|
35
65
|
- Web browser: Remove base64 images from web page contents (prevent filling up model context with large images).
|
@@ -42,7 +72,7 @@
|
|
42
72
|
- Bugfix: Correct rate limit error display when running in fullscreen mode.
|
43
73
|
- Bugfix: `hf_dataset` now explicitly requires the `split` argument (previously, it would crash when not specified).
|
44
74
|
- Bugfix: Prevent cascading textual error when an error occurs during task initialisation.
|
45
|
-
- Bugfix: Correctly restore sample summaries from log file after
|
75
|
+
- Bugfix: Correctly restore sample summaries from log file after amend.
|
46
76
|
- Bugfix: Report errors that occur during task finalisation.
|
47
77
|
|
48
78
|
## v0.3.49 (03 December 2024)
|
@@ -50,9 +80,9 @@
|
|
50
80
|
- Logging: Only call CreateBucket on Amazon S3 when the bucket does not already exist.
|
51
81
|
- Improve cancellation feedback and prevent multiple cancellations when using fullscreen display.
|
52
82
|
- Inspect View: Prevent circular reference error when rendering complex tool input.
|
53
|
-
- Inspect View: Resolve display issue with sorting by sample then epoch.
|
83
|
+
- Inspect View: Resolve display issue with sorting by sample then epoch.
|
54
84
|
|
55
|
-
## v0.3.48 (01 December 2024)
|
85
|
+
## v0.3.48 (01 December 2024)
|
56
86
|
|
57
87
|
- [Realtime display](https://github.com/UKGovernmentBEIS/inspect_ai/pull/865) of sample transcripts (including ability to cancel running samples).
|
58
88
|
- Scoring: When using a dictionary to map metrics to score value dictionaries, you may now use globs as keys. See our [scorer documentation](https://inspect.ai-safety-institute.org.uk/scorers.html#sec-multiple-scorers) for more information.
|
@@ -64,9 +94,9 @@
|
|
64
94
|
- Google: Support for tools/functions that have no parameters.
|
65
95
|
- Google/Vertex: Support for `logprobs` and other new 1.5 (002 series) options.
|
66
96
|
- AzureAI: Change default max_tokens for Llama models to 2048 (4096 currently yields an error w/ Llama 3.1).
|
67
|
-
- Mistral: Various
|
97
|
+
- Mistral: Various compatibility changes for their client and tool calling implementation.
|
68
98
|
- Handle exponents in numeric normalisation for match, include, and answer scorers.
|
69
|
-
- hf_dataset: Added `cached` argument to control whether to use a previously cached version of the dataset if available (defaults to `True`).
|
99
|
+
- hf_dataset: Added `cached` argument to control whether to use a previously cached version of the dataset if available (defaults to `True`).
|
70
100
|
- hf_dataset: Added `revision` option to load a specific branch or commit SHA (when using `revision` datasets are always revalidated on Hugging Face, i.e. `cached` is ignored).
|
71
101
|
- Log viewer: Display sample ids rather than indexes.
|
72
102
|
- Log viewer: Add timestamps to transcript events.
|
@@ -74,9 +104,9 @@
|
|
74
104
|
- Log viewer: Show custom tool call views in messages display.
|
75
105
|
- Bugfix: Correctly read and forward image detail property.
|
76
106
|
- Bugfix: Correct resolution of global eval override of task or sample sandboxes.
|
77
|
-
- Bugfix: Don't do eval log listing on background threads (s3fs can deadlock when run from
|
107
|
+
- Bugfix: Don't do eval log listing on background threads (s3fs can deadlock when run from multiple threads).
|
78
108
|
|
79
|
-
## v0.3.47 (18 November 2024)
|
109
|
+
## v0.3.47 (18 November 2024)
|
80
110
|
|
81
111
|
- Basic agent: Ensure that the scorer is only run once when max_attempts = 1.
|
82
112
|
- Basic agent: Support custom function for incorrect_message reply to model.
|
@@ -87,7 +117,7 @@
|
|
87
117
|
- Scoring: When using a dictionary to map metrics to score value dictionaries, you may now use globs as keys. See our [scorer documentation](https://inspect.ai-safety-institute.org.uk/scorers.html#sec-multiple-scorers) for more information.
|
88
118
|
- Sample limit events will now appear in the transcript if a limit (e.g. message, token, or time limit) halts a sample. The sample list and sample detail also display the limit, if applicable.
|
89
119
|
|
90
|
-
## v0.3.46 (12 November 2024)
|
120
|
+
## v0.3.46 (12 November 2024)
|
91
121
|
|
92
122
|
- [eval](https://inspect.ai-safety-institute.org.uk/eval-logs.html#sec-log-format) is now the default log format (use `--log-format=json` to use old format).
|
93
123
|
- Base 64 images are now logged by default for all log formats (disable with `--no-log-images`).
|
@@ -112,7 +142,7 @@
|
|
112
142
|
- Log model calls when model providers return bad request errors
|
113
143
|
- Better lay out large numbers of configuration and parameters when displaying log files.
|
114
144
|
- The log viewer now properly displays sample scores for running tasks.
|
115
|
-
- Add `metadata` field to `ModelOutput` and provide
|
145
|
+
- Add `metadata` field to `ModelOutput` and provide various fields for the Groq provider.
|
116
146
|
|
117
147
|
## v0.3.44 (04 November 2024)
|
118
148
|
|
@@ -128,7 +158,7 @@
|
|
128
158
|
- View: properly render complex score objects in transcript.
|
129
159
|
- Write custom tool call views into transcript for use by Inspect View.
|
130
160
|
- Use `casefold()` for case-insensitive compare in `includes()`, `match()`, `exact()`, and `f1()` scorers.
|
131
|
-
- OpenAI: eliminate use of `strict` tool calling (sporadically supported across models and we already
|
161
|
+
- OpenAI: eliminate use of `strict` tool calling (sporadically supported across models and we already internally validate).
|
132
162
|
- Mistral: fix bug where base_url was not respected when passing both an api_key and base_url.
|
133
163
|
- Don't include package scope for task name part of log files.
|
134
164
|
- Improve performance of write_file for Docker sandboxes.
|
@@ -181,7 +211,7 @@
|
|
181
211
|
- Correct llama3 and o1 tool calling when empty arguments passed.
|
182
212
|
- Allow resolution of any sandbox name when there is only a single environment.
|
183
213
|
- Introduce `--log-level-transcript` option for separate control of log entries recorded in the eval log file
|
184
|
-
- Improve mime type detection for image content encoding (fixes issues w/ webp images).
|
214
|
+
- Improve mime type detection for image content encoding (fixes issues w/ webp images).
|
185
215
|
- Fix memory leak in Inspect View worker-based JSON parsing.
|
186
216
|
- Add `fail_on_error` option for `eval_retry()` and `inspect eval-retry`.
|
187
217
|
- Defer resolving helper models in `self_critique()` and `model_graded_qa()`.
|
@@ -204,7 +234,7 @@
|
|
204
234
|
## v0.3.39 (3 October 2024)
|
205
235
|
|
206
236
|
- The sample transcript will now display the target for scoring in the Score Event (for newly run evaluations).
|
207
|
-
- Provide setter for `max_messages` on `TaskState`.
|
237
|
+
- Provide setter for `max_messages` on `TaskState`.
|
208
238
|
- Provide `max_messages` option for `basic_agent()` (defaulting to 50) and use it rather than any task `max_messages` defined.
|
209
239
|
- Improved implementation of disabling parallel tool calling (also fixes a transcript issue introduced by the original implementation).
|
210
240
|
- Improve quality of error messages when a model API key environment variable is missing.
|
@@ -215,7 +245,7 @@
|
|
215
245
|
- Rename `web_browser_tools()` to `web_browser()`, and don't export individual web browsing tools.
|
216
246
|
- Add `parallel` option to `@tool` decorator and specify `parallel=False` for web browsing tools.
|
217
247
|
- Improve prompting for web browser tools using more explicit examples.
|
218
|
-
- Improve prompting for `</tool_call>` end sequence for Llama models.
|
248
|
+
- Improve prompting for `</tool_call>` end sequence for Llama models.
|
219
249
|
- Fix issue with failure to execute sample setup scripts.
|
220
250
|
|
221
251
|
## v0.3.37 (2 October 2024)
|
@@ -224,7 +254,7 @@
|
|
224
254
|
|
225
255
|
## v0.3.36 (2 October 2024)
|
226
256
|
|
227
|
-
- [Web Browser](https://inspect.ai-safety-institute.org.uk/tools.html#sec-web-browser) tool which provides a headless
|
257
|
+
- [Web Browser](https://inspect.ai-safety-institute.org.uk/tools.html#sec-web-browser) tool which provides a headless Chromium browser that supports navigation, history, and mouse/keyboard interactions.
|
228
258
|
- `auto_id` option for dataset readers to assign an auto-incrementing ID to records.
|
229
259
|
- Task args: don't attempt to serialise registry objects that don't have captured parameters.
|
230
260
|
|
@@ -242,7 +272,7 @@
|
|
242
272
|
|
243
273
|
- Support for `max_tokens` on OpenAI o1 models (map to `max_completion_tokens`).
|
244
274
|
- Fix regression of log and debug options on `inspect view`
|
245
|
-
- Improved focus management for
|
275
|
+
- Improved focus management for Inspect View
|
246
276
|
- Raise error if `epochs` is less than 1
|
247
277
|
- Improve code parsing for HumanEval (compatibility with Llama model output)
|
248
278
|
|
@@ -253,9 +283,9 @@
|
|
253
283
|
- Option to disable ANSI terminal output with `--no-ansi` or `INSPECT_NO_ANSI`
|
254
284
|
- Add chain of thought option to `multiple_choice()` and export `MultipleChoiceTemplate` enumeration
|
255
285
|
- Allow Docker sandboxes configured with `x-default` to be referred to by their declared service name.
|
256
|
-
- Improved error messages for
|
286
|
+
- Improved error messages for Docker sandbox initialisation.
|
257
287
|
- Improve legibility of Docker sandbox log entries (join rather than displaying as array)
|
258
|
-
- Display user message immediately
|
288
|
+
- Display user message immediately preceding assistant message in model call transcripts.
|
259
289
|
- Display images created by tool calls in the Viewer.
|
260
290
|
- Fix duplicated tool call output display in Viewer for Gemini and Llama models.
|
261
291
|
- Require a `max_messages` for use of `basic_agent()` (as without it, the agent could end up in an infinite loop).
|
@@ -270,8 +300,8 @@
|
|
270
300
|
|
271
301
|
- Fix issue w/ subtasks not getting a fresh store() (regression from introduction of `fork()` in v0.3.30)
|
272
302
|
- Fix issue w/ subtasks that return None invalidating the log file.
|
273
|
-
- Make subtasks
|
274
|
-
- Improved error reporting for missing `web_search()` provider environment variables.
|
303
|
+
- Make subtasks collapsible in Inspect View.
|
304
|
+
- Improved error reporting for missing `web_search()` provider environment variables.
|
275
305
|
|
276
306
|
## v0.3.31 (24 September 2024)
|
277
307
|
|
@@ -309,7 +339,7 @@
|
|
309
339
|
- Don't log base64 images by default (re-enable logging with `--log-images`).
|
310
340
|
- Provide unique tool id when parsing tool calls for models that don't support native tool usage.
|
311
341
|
- Fix bug that prevented `epoch_reducer` from being used in eval-retry.
|
312
|
-
- Fix bug that prevented eval() level `epoch` from overriding task level `epoch`.
|
342
|
+
- Fix bug that prevented eval() level `epoch` from overriding task level `epoch`.
|
313
343
|
|
314
344
|
## v0.3.28 (14 September 2024)
|
315
345
|
|
@@ -353,7 +383,7 @@
|
|
353
383
|
- Add optional user parameter to SandboxEnvironment.exec for specifying the user. Currently only DockerSandboxEnvironment is supported.
|
354
384
|
- Fix issue with resolving Docker configuration files when not running from the task directory.
|
355
385
|
- Only populate Docker compose config metadata values when they are used in the file.
|
356
|
-
- Treat Sandbox exec `cwd` that are relative paths as relative to sample working
|
386
|
+
- Treat Sandbox exec `cwd` that are relative paths as relative to sample working directory.
|
357
387
|
- Filter base64 encoded images out of model API call logs.
|
358
388
|
- Raise error when a Solver does not return a TaskState.
|
359
389
|
- Only run tests that use model APIs when the `--runapi` flag is passed to `pytest` (prevents unintended token usage)
|
@@ -362,7 +392,6 @@
|
|
362
392
|
- Only enable `strict` mode for OpenAI tool calls when all function parameters are required.
|
363
393
|
- Added [MMMU](https://github.com/UKGovernmentBEIS/inspect_evals/tree/main/src/inspect_evals/mmmu), [CommonsenseQA](https://github.com/UKGovernmentBEIS/inspect_evals/tree/main/src/inspect_evals/commonsense_qa), [MMLU-Pro](https://github.com/UKGovernmentBEIS/inspect_evals/tree/main/src/inspect_evals/mmlu_pro), and [XSTest](https://github.com/UKGovernmentBEIS/inspect_evals/tree/main/src/inspect_evals/xstest) benchmarks.
|
364
394
|
|
365
|
-
|
366
395
|
## v0.3.25 (25 August 2024)
|
367
396
|
|
368
397
|
- [Store](https://inspect.ai-safety-institute.org.uk/agents-api.html#sharing-state) for manipulating arbitrary sample state from within solvers and tools.
|
@@ -383,7 +412,7 @@
|
|
383
412
|
## v0.3.23 (16 August 2024)
|
384
413
|
|
385
414
|
- Support for tool calling for Llama 3.1 models on Azure AI and CloudFlare.
|
386
|
-
-
|
415
|
+
- Increase default `max_tokens` from 1024 to 2048.
|
387
416
|
- Record individual sample reductions along with results for multi-epoch evals.
|
388
417
|
- Change default to not log base64 encoded versions of images, as this often resulted in extremely large log files (use `--log-images` to opt back in).
|
389
418
|
- Update to new Mistral API (v1.0.1 of `mistralai` is now required).
|
@@ -405,13 +434,13 @@
|
|
405
434
|
- Set Claude default `max_tokens` to 4096
|
406
435
|
- Combine user and assistant messages for Vertex models.
|
407
436
|
- Warn when using the `name` parameter with task created from `@task` decorated function.
|
408
|
-
- Make sample `metadata` available in prompt, grading, and self-
|
437
|
+
- Make sample `metadata` available in prompt, grading, and self-critique templates.
|
409
438
|
- Retry on several additional OpenAI errors (APIConnectionError | APITimeoutError | InternalServerError)
|
410
439
|
- Fix a regression which would cause the 'answer' to be improperly recorded when scoring a sample.
|
411
440
|
|
412
441
|
## v0.3.20 (03 August 2024)
|
413
442
|
|
414
|
-
- `Epochs` data type for specifying epochs and reducers together (deprecated `epochs_reducer` argument).
|
443
|
+
- `Epochs` data type for specifying epochs and reducers together (deprecated `epochs_reducer` argument).
|
415
444
|
- Enable customisation of model generation cache dir via `INSPECT_CACHE_DIR` environment variable.
|
416
445
|
- Use doc comment description rather than `prompt` attribute of `@tool` for descriptions.
|
417
446
|
- Include examples section from doc comments in tool descriptions.
|
@@ -464,8 +493,6 @@
|
|
464
493
|
- Set maximum rate limit backoff time to 30 minutes
|
465
494
|
- Retry with exponential backoff for web_search Google provider.
|
466
495
|
|
467
|
-
|
468
|
-
|
469
496
|
## v0.3.18 (14 July 2024)
|
470
497
|
|
471
498
|
- [Multiple Scorers](https://inspect.ai-safety-institute.org.uk/scorers.html#sec-multiple-scorers) are now supported for evaluation tasks.
|
@@ -474,7 +501,7 @@
|
|
474
501
|
- Improved handling of very large (> 100MB) log files in Inspect View.
|
475
502
|
- Use `network_mode: none` for disabling networking by default in Docker tool environments.
|
476
503
|
- Shorten the default shutdown grace period for Docker container cleanup to 1 second.
|
477
|
-
- Allow sandbox
|
504
|
+
- Allow sandbox environment providers to specify a default `max_samples` (set to 25 for the Docker provider).
|
478
505
|
- Prevent concurrent calls to `eval_async()` (unsafe because of need to change directories for tasks). Parallel task evaluation will instead be implemented as a top-level feature of `eval()` and `eval_async()`.
|
479
506
|
- Match scorers now return answers consistently even when there is no match.
|
480
507
|
- Relocate tool related types into a new top-level `inspect_ai.tool` module (previous imports still work for now, but result in a runtime deprecation warning).
|
@@ -485,7 +512,7 @@
|
|
485
512
|
|
486
513
|
- Optional increased control over the tool use loop via the `call_tools()` function and new `tool_calls` parameter for `generate()`.
|
487
514
|
- New `per_epoch` option for `CachePolicy` to allow caching to ignore epochs.
|
488
|
-
- Correctly handle `choices` and `files` when converting `Sample` images to base64.
|
515
|
+
- Correctly handle `choices` and `files` when converting `Sample` images to base64.
|
489
516
|
|
490
517
|
## v0.3.16 (24 June 2024)
|
491
518
|
|
@@ -564,7 +591,7 @@
|
|
564
591
|
- Add `multi_scorer()` and `majority_vote()` functions for combining multiple scorers into a single score.
|
565
592
|
- Add support for multiple model graders in `model_graded_qa()`.
|
566
593
|
- Raise `TypeError` for solvers and scorers not declared as `async`.
|
567
|
-
- Fallback to standard
|
594
|
+
- Fallback to standard parse if `NaN` or `Inf` is encountered while reading log file header.
|
568
595
|
- Remove deprecated support for matching partial model names (e.g. "gpt" or "claude").
|
569
596
|
|
570
597
|
## v0.3.8 (07 May 2024)
|
@@ -596,7 +623,7 @@
|
|
596
623
|
- `write_eval_log()` now ignores unserializable objects in metadata fields.
|
597
624
|
- `read_eval_log()` now takes a `str` or `FileInfo` (for compatibility w/ list returned from `list_eval_logs()`).
|
598
625
|
- Registry name lookups are now case sensitive (fixes issue w/ loading tasks w/ mixed case names).
|
599
|
-
-
|
626
|
+
- Resiliency to Python syntax errors that occur when enumerating tasks in a directory.
|
600
627
|
- Do not throw error if unable to parse or load `.ipynb` file due to lack of dependencies (e.g. `nbformat`).
|
601
628
|
- Various additions to log viewer display (log file name, dataset/scorer in listing, filter by complex score types).
|
602
629
|
- Improvements to markdown rendering in log viewer (don't render intraword underscores, escape html tags).
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: inspect_ai
|
3
|
-
Version: 0.3.
|
3
|
+
Version: 0.3.54
|
4
4
|
Summary: Framework for large language model evaluations
|
5
5
|
Author: UK AI Safety Institute
|
6
6
|
License: MIT License
|
@@ -20,7 +20,6 @@ Classifier: Operating System :: OS Independent
|
|
20
20
|
Requires-Python: >=3.10
|
21
21
|
Description-Content-Type: text/markdown
|
22
22
|
License-File: LICENSE
|
23
|
-
Requires-Dist: aiofiles
|
24
23
|
Requires-Dist: aiohttp>=3.9.0
|
25
24
|
Requires-Dist: anyio>=4.4.0
|
26
25
|
Requires-Dist: beautifulsoup4
|
@@ -71,7 +70,6 @@ Requires-Dist: pytest-xdist; extra == "dev"
|
|
71
70
|
Requires-Dist: ruff==0.8.3; extra == "dev"
|
72
71
|
Requires-Dist: textual-dev>=0.86.2; extra == "dev"
|
73
72
|
Requires-Dist: types-PyYAML; extra == "dev"
|
74
|
-
Requires-Dist: types-aiofiles; extra == "dev"
|
75
73
|
Requires-Dist: types-beautifulsoup4; extra == "dev"
|
76
74
|
Requires-Dist: types-aioboto3; extra == "dev"
|
77
75
|
Requires-Dist: types-boto3; extra == "dev"
|
@@ -98,22 +96,22 @@ To get started with Inspect, please see the documentation at <https://inspect.ai
|
|
98
96
|
|
99
97
|
***
|
100
98
|
|
101
|
-
|
102
|
-
|
103
99
|
To work on development of Inspect, clone the repository and install with the `-e` flag and `[dev]` optional dependencies:
|
104
100
|
|
105
101
|
```bash
|
106
|
-
|
107
|
-
|
108
|
-
|
102
|
+
git clone https://github.com/UKGovernmentBEIS/inspect_ai.git
|
103
|
+
cd inspect_ai
|
104
|
+
pip install -e ".[dev]"
|
109
105
|
```
|
110
106
|
|
111
107
|
Optionally install pre-commit hooks via
|
108
|
+
|
112
109
|
```bash
|
113
110
|
make hooks
|
114
111
|
```
|
115
112
|
|
116
113
|
Run linting, formatting, and tests via
|
114
|
+
|
117
115
|
```bash
|
118
116
|
make check
|
119
117
|
make test
|
@@ -8,22 +8,22 @@ To get started with Inspect, please see the documentation at <https://inspect.ai
|
|
8
8
|
|
9
9
|
***
|
10
10
|
|
11
|
-
|
12
|
-
|
13
11
|
To work on development of Inspect, clone the repository and install with the `-e` flag and `[dev]` optional dependencies:
|
14
12
|
|
15
13
|
```bash
|
16
|
-
|
17
|
-
|
18
|
-
|
14
|
+
git clone https://github.com/UKGovernmentBEIS/inspect_ai.git
|
15
|
+
cd inspect_ai
|
16
|
+
pip install -e ".[dev]"
|
19
17
|
```
|
20
18
|
|
21
19
|
Optionally install pre-commit hooks via
|
20
|
+
|
22
21
|
```bash
|
23
22
|
make hooks
|
24
23
|
```
|
25
24
|
|
26
25
|
Run linting, formatting, and tests via
|
26
|
+
|
27
27
|
```bash
|
28
28
|
make check
|
29
29
|
make test
|
@@ -90,7 +90,7 @@ If you do need to interact with the underlying JSON (e.g., when reading logs fro
|
|
90
90
|
|
91
91
|
## Image Logging
|
92
92
|
|
93
|
-
By default, full base64 encoded copies of images are included in the log file. Image logging will not create performance problems when using `.eval` logs, however if you are using `.json` logs then large numbers of images could become
|
93
|
+
By default, full base64 encoded copies of images are included in the log file. Image logging will not create performance problems when using `.eval` logs, however if you are using `.json` logs then large numbers of images could become unwieldy (i.e. if your `.json` log file grows to 100mb or larger as a result).
|
94
94
|
|
95
95
|
You can disable this using the `--no-log-images` flag. For example, here we enable the `.json` log format and disable image logging:
|
96
96
|
|
@@ -125,6 +125,10 @@ class PodmanSandboxEnvironment(SandboxEnvironment):
|
|
125
125
|
def config_files(cls) -> list[str]:
|
126
126
|
...
|
127
127
|
|
128
|
+
@classmethod
|
129
|
+
def default_concurrency(cls) -> int | None:
|
130
|
+
...
|
131
|
+
|
128
132
|
@classmethod
|
129
133
|
async def task_init(
|
130
134
|
cls, task_name: str, config: SandboxEnvironmentConfigType | None
|
@@ -180,6 +184,7 @@ The class methods take care of various stages of initialisation, setup, and tear
|
|
180
184
|
| Method | Lifecycle | Purpose |
|
181
185
|
|-------------------|-------------------|----------------------------------|
|
182
186
|
| `config_files()` | Called once to determine the names of 'default' config files for this provider (e.g. 'compose.yaml'). | |
|
187
|
+
| `default_concurrency()` | Called once to determine the default maximum number of sandboxes to run in parallel. Return `None` for no limit (the default behavior). | |
|
183
188
|
| `task_init()` | Called once for each unique sandbox environment config before executing the tasks in an `eval()` run. | Expensive initialisation operations (e.g. pulling or building images) |
|
184
189
|
| `sample_init()` | Called at the beginning of each `Sample`. | Create `SandboxEnvironment` instances for the sample. |
|
185
190
|
| `sample_cleanup()` | Called at the end of each `Sample` | Cleanup `SandboxEnvironment` instances for the sample. |
|
@@ -319,7 +324,7 @@ The `_registry.py` file serves a place to import things that you wan't registere
|
|
319
324
|
from .approvers import auto_approver
|
320
325
|
```
|
321
326
|
|
322
|
-
You can then register your `auto_approver` Inspect extension (and
|
327
|
+
You can then register your `auto_approver` Inspect extension (and anything else imported into `_registry.py`) like this in `pyproject.toml`:
|
323
328
|
|
324
329
|
::: {.panel-tabset group="entry-points"}
|
325
330
|
## Setuptools
|
Binary file
|
@@ -122,13 +122,15 @@ This code will evaluate a total of 12 tasks (6 temperature variations against 2
|
|
122
122
|
|
123
123
|
[Sandbox Environments](agents.qmd#sec-sandbox-environments) (e.g. Docker containers) often allocate resources on a per-sample basis, and also make use of the Inspect `subprocess()` function for executing commands within the environment.
|
124
124
|
|
125
|
-
### Max
|
125
|
+
### Max Sandboxes
|
126
126
|
|
127
|
-
The `
|
127
|
+
The `max_sandboxes` option determines how many sandboxes can be executed in parallel. Individual sandbox providers can establish their own default limits (for example, the Docker provider has a default of `2 * os.cpu_count()`). You can modify this option as required, but be aware that container runtimes have resource limits, and pushing up against and beyond them can lead to instability and failed evaluations.
|
128
128
|
|
129
|
-
|
129
|
+
When a `max_sandboxes` limit is applied, an indicator at the bottom of the task status screen will be shown:
|
130
130
|
|
131
|
-
|
131
|
+

|
132
|
+
|
133
|
+
Note that when `max_sandboxes` is applied this effectively creates a global `max_samples` limit that is equal to the `max_sandboxes`.
|
132
134
|
|
133
135
|
### Max Subprocesses
|
134
136
|
|
@@ -0,0 +1,23 @@
|
|
1
|
+
#!/bin/bash
|
2
|
+
|
3
|
+
files=("index" "tutorial" "workflow" "log-viewer" "vscode" "solvers" "tools" "agents" "agents-api" "scorers" "datasets" "models" "eval-sets" "errors-and-limits" "caching" "parallelism" "interactivity" "approval" "eval-logs" "extensions")
|
4
|
+
|
5
|
+
|
6
|
+
if [ "$QUARTO_PROJECT_RENDER_ALL" = "1" ]; then
|
7
|
+
llms_full="_site/llms-full.txt"
|
8
|
+
rm -f "${llms_full}"
|
9
|
+
mv _quarto.yml _quarto.yml.bak
|
10
|
+
for file in "${files[@]}"; do
|
11
|
+
echo "llms: ${file}.qmd"
|
12
|
+
quarto render "${file}.qmd" --to gfm --quiet --no-execute
|
13
|
+
output_file="${file}.md"
|
14
|
+
cat "${output_file}" >> "${llms_full}"
|
15
|
+
echo "" >> "${llms_full}"
|
16
|
+
mv $output_file "_site/${file}.html.md"
|
17
|
+
done
|
18
|
+
mv _quarto.yml.bak _quarto.yml
|
19
|
+
fi
|
20
|
+
|
21
|
+
|
22
|
+
|
23
|
+
|
@@ -20,7 +20,7 @@ Inspect has several built-in tools, including:
|
|
20
20
|
|
21
21
|
- [Bash and Python](#sec-bash-and-python) for executing arbitrary shell and Python code.
|
22
22
|
|
23
|
-
- [Web Browser](#sec-web-browser), which provides the model with a headless
|
23
|
+
- [Web Browser](#sec-web-browser), which provides the model with a headless Chromium web browser that supports navigation, history, and mouse/keyboard interactions.
|
24
24
|
|
25
25
|
- [Web Search](#sec-web-search), which uses the Google Search API to execute and summarise web searches.
|
26
26
|
|
@@ -100,11 +100,11 @@ If you do not explicitly handle errors, then Inspect provides some default error
|
|
100
100
|
|
101
101
|
- `UnicodeDecodeError` — Occurs when the output from executing a process or reading a file is binary rather than text.
|
102
102
|
|
103
|
-
- `OutputLimitExceededError` - Occurs when one or both of the output streams from `sandbox().exec()` exceed
|
103
|
+
- `OutputLimitExceededError` — Occurs when one or both of the output streams from `sandbox().exec()` exceed 10 MiB or when attempting to read a file over 100 MiB in size.
|
104
104
|
|
105
105
|
- `ToolError` — Special error thrown by tools to indicate they'd like to report an error to the model.
|
106
106
|
|
107
|
-
These are all errors that are *expected* (in fact the `
|
107
|
+
These are all errors that are *expected* (in fact the `SandboxEnvironment` interface documents them as such) and possibly recoverable by the model (try a different command, read a different file, etc.). Unexpected errors (e.g. a network error communicating with a remote service or container runtime) on the other hand are not automatically handled and result in the `Sample` failing with an error.
|
108
108
|
|
109
109
|
Many tools can simply rely on the default handling to provide reasonable behaviour around both expected and unexpected errors.
|
110
110
|
|
@@ -120,7 +120,7 @@ Another type of explicit handling is re-raising an error to bypass Inspect's def
|
|
120
120
|
|
121
121
|
``` python
|
122
122
|
try:
|
123
|
-
result = await
|
123
|
+
result = await sandbox().exec(
|
124
124
|
cmd=["decode", file],
|
125
125
|
timeout=timeout
|
126
126
|
)
|
@@ -314,7 +314,7 @@ See the [Agents](#sec-agents) section for more details on how to build evaluatio
|
|
314
314
|
|
315
315
|
## Web Browser {#sec-web-browser}
|
316
316
|
|
317
|
-
The web browser tools
|
317
|
+
The web browser tools provide models with the ability to browse the web using a headless Chromium browser. Navigation, history, and mouse/keyboard interactions are all supported.
|
318
318
|
|
319
319
|
### Configuration
|
320
320
|
|
@@ -408,7 +408,7 @@ RUN pip install playwright
|
|
408
408
|
RUN playwright install
|
409
409
|
RUN playwright install-deps
|
410
410
|
|
411
|
-
# Install other
|
411
|
+
# Install other dependencies
|
412
412
|
RUN pip install dm-env-rpc pillow bs4 lxml
|
413
413
|
|
414
414
|
# Copy Python files alongside the Dockerfile
|
@@ -78,7 +78,7 @@ inspect eval security_guide.py
|
|
78
78
|
|
79
79
|
[HellaSwag](https://rowanzellers.com/hellaswag/) is a dataset designed to test commonsense natural language inference (NLI) about physical situations. It includes samples that are adversarially constructed to violate common sense about the physical world, so can be a challenge for some language models.
|
80
80
|
|
81
|
-
For example, here is one of the questions in the dataset along with its set of possible
|
81
|
+
For example, here is one of the questions in the dataset along with its set of possible answers (the correct answer is C):
|
82
82
|
|
83
83
|
> In home pet groomers demonstrate how to groom a pet. the person
|
84
84
|
>
|
@@ -570,4 +570,4 @@ def ctf_agent(max_attempts=3, message_limit=30):
|
|
570
570
|
|
571
571
|
The `basic_agent()` provides a ReAct tool loop with support for retries and encouraging the model to continue if it gives up or gets stuck. The `bash()` and `python()` tools are provided to the model with a 3-minute timeout to prevent long-running commands from getting the evaluation stuck.
|
572
572
|
|
573
|
-
See the [full source code](https://github.com/UKGovernmentBEIS/inspect_evals/tree/main/src/inspect_evals/gdm_capabilities/intercode_ctf) of the Intercode CTF example to explore the dataset and evaluation code in more depth.
|
573
|
+
See the [full source code](https://github.com/UKGovernmentBEIS/inspect_evals/tree/main/src/inspect_evals/gdm_capabilities/intercode_ctf) of the Intercode CTF example to explore the dataset and evaluation code in more depth.
|