inspect-ai 0.3.53__tar.gz → 0.3.54__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/CHANGELOG.md +40 -34
- {inspect_ai-0.3.53/src/inspect_ai.egg-info → inspect_ai-0.3.54}/PKG-INFO +6 -6
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/README.md +5 -5
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/eval-logs.qmd +1 -1
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/extensions.qmd +1 -1
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/tools.qmd +5 -5
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/tutorial.qmd +2 -2
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_cli/eval.py +26 -1
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_cli/main.py +2 -0
- inspect_ai-0.3.54/src/inspect_ai/_cli/trace.py +244 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_display/textual/app.py +5 -1
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_display/textual/widgets/tasks.py +13 -3
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_eval/eval.py +17 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_eval/task/images.py +4 -14
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_eval/task/run.py +26 -10
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/constants.py +3 -3
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/display.py +1 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/logger.py +34 -8
- inspect_ai-0.3.54/src/inspect_ai/_util/trace.py +275 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/log/_log.py +3 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/log/_message.py +2 -2
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/log/_recorders/eval.py +6 -17
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/log/_recorders/json.py +19 -17
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_cache.py +22 -16
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_call_tools.py +9 -1
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_generate_config.py +2 -2
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_model.py +11 -12
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/bedrock.py +1 -1
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_web_browser.py +1 -1
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/context.py +6 -1
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/docker/compose.py +58 -19
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/docker/docker.py +11 -11
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/docker/util.py +0 -6
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/service.py +17 -7
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/util/_subprocess.py +6 -1
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/util/_subtask.py +8 -2
- {inspect_ai-0.3.53 → inspect_ai-0.3.54/src/inspect_ai.egg-info}/PKG-INFO +6 -6
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai.egg-info/SOURCES.txt +2 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/tools/test_tool_types.py +39 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/.github/dependabot.yml +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/.github/pull_request_template.md +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/.github/workflows/build.yml +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/.github/workflows/docs.yml +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/.github/workflows/log_viewer.yml +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/.github/workflows/pypi.yml +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/.github/workflows/vscode.yml +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/.gitignore +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/.pre-commit-config.yaml +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/.vscode/extensions.json +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/.vscode/settings.json +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/CITATION.cff +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/LICENSE +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/Makefile +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/.gitignore +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/CNAME +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/_errors_and_retries.md +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/_quarto.yml +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/_sample-preservation.md +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/_sandboxenv-interface.md +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/_tools-annotations-required.md +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/_tools-scaffold.md +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/_trace.md +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/_variables.yml +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/agents-api.qmd +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/agents.qmd +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/approval.qmd +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/caching.qmd +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/datasets.qmd +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/errors-and-limits.qmd +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/eval-sets.qmd +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/examples/examples.bib +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/examples/examples.css +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/examples/examples.ejs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/examples/examples.yml +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/examples/index.qmd +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/aisi-logo.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/eval-log.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/inspect-activity-bar.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/inspect-multiple-models.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/inspect-view-answers.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/inspect-view-filter.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/inspect-view-history.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/inspect-view-home.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/inspect-view-info.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/inspect-view-logging-console.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/inspect-view-logging.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/inspect-view-main.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/inspect-view-messages.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/inspect-view-metadata.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/inspect-view-scoring.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/inspect-view-sort.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/inspect-view-splash.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/inspect-vscode-config.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/inspect-vscode-install.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/inspect-vscode-logview.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/inspect-vscode-output-channel.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/inspect-vscode-run-task.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/inspect.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/logs-drop-down.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/logs-open-button.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/logs.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/popularity.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/python-tool-view.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/rate-limit.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/running-theory.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/task-max-sandboxes.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/toolenv-no-cleanup.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/images/web-browser-tool-view.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/index.qmd +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/interactivity.qmd +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/llms.txt +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/log-viewer.qmd +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/models.qmd +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/parallelism.qmd +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/scorers.qmd +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/scripts/post-render.sh +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/solvers.qmd +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/theme.scss +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/vscode.qmd +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/docs/workflow.qmd +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/approval/README.md +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/approval/approval.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/approval/approval.yaml +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/biology_qa.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/browser/browser.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/browser/compose.yaml +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/cache.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/evalset.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/hello_world.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/images/ballons.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/images/bike.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/images/images.jsonl +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/images/images.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/intervention/Dockerfile +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/intervention/README.md +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/intervention/compose.yaml +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/intervention/intervention.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/langchain/.env.example +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/langchain/.gitignore +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/langchain/README.md +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/langchain/inspect_langchain.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/langchain/requirements.txt +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/langchain/wikipedia.jsonl +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/langchain/wikipedia.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/popularity.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/security_guide.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/theory_of_mind.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/examples/tool_use.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/pyproject.toml +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/requirements.txt +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/setup.cfg +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/__init__.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/__main__.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_cli/cache.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_cli/common.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_cli/info.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_cli/list.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_cli/log.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_cli/sandbox.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_cli/score.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_cli/util.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_cli/view.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_display/__init__.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_display/core/active.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_display/core/config.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_display/core/display.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_display/core/footer.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_display/core/group.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_display/core/panel.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_display/core/progress.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_display/core/results.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_display/core/rich.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_display/core/textual.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_display/rich/__init__.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_display/rich/display.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_display/textual/app.tcss +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_display/textual/display.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_display/textual/theme.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_display/textual/widgets/clock.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_display/textual/widgets/console.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_display/textual/widgets/footer.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_display/textual/widgets/samples.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_display/textual/widgets/task_detail.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_display/textual/widgets/titlebar.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_display/textual/widgets/toggle.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_display/textual/widgets/transcript.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_eval/context.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_eval/evalset.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_eval/list.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_eval/loader.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_eval/registry.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_eval/run.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_eval/score.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_eval/task/__init__.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_eval/task/constants.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_eval/task/epochs.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_eval/task/error.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_eval/task/generate.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_eval/task/log.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_eval/task/results.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_eval/task/rundir.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_eval/task/sandbox.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_eval/task/task.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_eval/task/util.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/_async.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/appdirs.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/config.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/content.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/datetime.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/decorator.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/deprecation.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/dev.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/dict.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/dotenv.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/entrypoints.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/environ.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/error.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/file.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/format.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/git.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/hash.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/hooks.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/html.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/http.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/images.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/json.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/list.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/notebook.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/package.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/path.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/pattern.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/platform.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/registry.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/retry.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/rich.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/samples.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/terminal.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/text.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/throttle.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/timeouts.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/transcript.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/url.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_util/version.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/notify.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/schema.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/server.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/view.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/.gitignore +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/.prettierignore +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/.tool-versions +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/App.css +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/README.md +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/dist/assets/favicon.svg +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/dist/assets/index.css +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/dist/assets/index.js +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/dist/index.html +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/eslint.config.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/favicon.svg +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/index.html +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/jsconfig.json +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/log-schema.json +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/package.json +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/postcss.config.cjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/App.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/Register.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/Types.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/api/Types.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/api/api-browser.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/api/api-http.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/api/api-shared.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/api/api-vscode.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/api/client-api.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/api/index.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/api/jsonrpc.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/appearance/Colors.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/appearance/Fonts.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/appearance/Icons.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/appearance/Styles.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/AnsiDisplay.css +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/AnsiDisplay.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/AppErrorBoundary.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/Browser.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/Card.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/ChatView.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/CopyButton.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/Dialog.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/DownloadButton.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/DownloadPanel.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/EmptyPanel.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/ErrorPanel.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/ExpandablePanel.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/FindBand.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/JsonPanel.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/LabeledValue.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/LargeModal.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/MarkdownDiv.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/MessageBand.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/MessageContent.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/MetaDataGrid.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/MetaDataView.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/MorePopOver.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/NavPills.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/ProgressBar.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/RenderedContent/ChatMessageRenderer.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/RenderedContent/RenderedContent.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/RenderedContent/Types.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/TabSet.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/ToolButton.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/Tools.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/VirtualList.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/components/ansi-output.js +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/constants.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/index.js +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/json/JsonTab.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/log/remoteLogFile.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/log-reader/Log-Reader.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/log-reader/Native-Log-Reader.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/log-reader/Open-AI-Log-Reader.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/navbar/Navbar.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/navbar/SecondaryBar.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/plan/PlanCard.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/SampleDialog.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/SampleDisplay.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/SampleError.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/SampleLimit.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/SampleList.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/SampleScoreView.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/SampleScores.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/SampleTranscript.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/SamplesDescriptor.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/SamplesTab.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/SamplesTools.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/tools/EpochFilter.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/tools/SampleFilter.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/tools/SelectScorer.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/tools/SortFilter.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/tools/filters.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/ApprovalEventView.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/ErrorEventView.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/EventPanel.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/EventRow.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/EventSection.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/InfoEventView.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/InputEventView.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/LoggerEventView.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/ModelEventView.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/SampleInitEventView.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/SampleLimitEventView.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/ScoreEventView.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/StepEventView.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/SubtaskEventView.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/ToolEventView.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/TranscriptState.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/TranscriptView.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/Types.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/state/StateDiffView.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/state/StateEventRenderers.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/samples/transcript/state/StateEventView.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/sidebar/Sidebar.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/types/jsondiffpatch.d.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/types/log.d.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/types/prism.d.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/usage/ModelTokenTable.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/usage/UsageCard.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/Base64.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/Format.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/Git.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/Html.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/Json.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/Path.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/Print.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/Type.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/attachments.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/debugging.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/http.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/queue.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/remoteZipFile.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/sync.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/utils/vscode.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/workspace/TaskErrorPanel.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/src/workspace/WorkSpace.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/tsconfig.json +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/vite.config.js +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/_view/www/yarn.lock +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/approval/__init__.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/approval/_apply.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/approval/_approval.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/approval/_approver.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/approval/_auto.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/approval/_call.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/approval/_human/approver.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/approval/_human/console.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/approval/_human/manager.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/approval/_human/panel.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/approval/_human/util.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/approval/_policy.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/approval/_registry.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/dataset/__init__.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/dataset/_dataset.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/dataset/_examples/bias_detection.jsonl +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/dataset/_examples/biology_qa.jsonl +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/dataset/_examples/popularity.jsonl +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/dataset/_examples/security_guide.jsonl +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/dataset/_examples/theory_of_mind.jsonl +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/dataset/_sources/csv.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/dataset/_sources/example.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/dataset/_sources/file.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/dataset/_sources/hf.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/dataset/_sources/json.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/dataset/_sources/util.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/dataset/_util.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/log/__init__.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/log/_bundle.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/log/_condense.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/log/_convert.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/log/_file.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/log/_recorders/__init__.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/log/_recorders/create.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/log/_recorders/file.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/log/_recorders/recorder.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/log/_retry.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/log/_samples.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/log/_transcript.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/__init__.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_chat_message.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_image.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_model_call.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_model_output.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/anthropic.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/azureai.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/cloudflare.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/google.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/grok.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/groq.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/hf.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/llama_cpp_python.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/mistral.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/mockllm.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/ollama.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/openai.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/openai_o1.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/providers.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/together.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/util/__init__.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/util/chatapi.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/util/hf_handler.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/util/llama31.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/util/util.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/vertex.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_providers/vllm.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_registry.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_render.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/model/_trace.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/py.typed +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/scorer/__init__.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_answer.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_choice.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_classification.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_common.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_match.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_metric.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_metrics/__init__.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_metrics/accuracy.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_metrics/mean.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_metrics/std.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_model.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_multi.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_pattern.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_reducer/__init__.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_reducer/reducer.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_reducer/registry.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_reducer/types.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_score.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_scorer.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/scorer/_target.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/solver/__init__.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/solver/_basic_agent.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/solver/_chain.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/solver/_critique.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/solver/_fork.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/solver/_multiple_choice.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/solver/_plan.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/solver/_prompt.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/solver/_solver.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/solver/_task_state.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/solver/_transcript.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/solver/_use_tools.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/solver/_util.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/__init__.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tool.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tool_call.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tool_choice.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tool_def.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tool_description.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tool_info.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tool_params.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tool_transcript.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tool_with.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_execute.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/__init__.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/Dockerfile +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/README.md +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/accessibility_node.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/dm_env_servicer.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/images/usage_diagram.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/mock_environment.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/playwright_crawler.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/test_accessibility_node.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/test_dm_env_servicer.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/test_playwright_crawler.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/test_web_environment.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/web_client.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/web_client_new_session.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/web_environment.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_browser/_resources/web_server.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/tool/_tools/_web_search.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/util/__init__.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/util/_concurrency.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/util/_console.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/util/_panel.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/util/_resource.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/__init__.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/docker/cleanup.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/docker/config.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/docker/internal.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/docker/prereqs.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/environment.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/limits.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/local.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/registry.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/util/_sandbox/self_check.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/util/_store.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai/util/_trace.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai.egg-info/dependency_links.txt +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai.egg-info/entry_points.txt +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai.egg-info/requires.txt +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/src/inspect_ai.egg-info/top_level.txt +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/approval/approve.yaml +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/approval/escalate.yaml +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/approval/modify.yaml +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/approval/reject.yaml +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/approval/terminate.yaml +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/approval/test_approval.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/conftest.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/dataset/test_dataset/dataset.jsonl +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/dataset/test_dataset/images/ballons.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/dataset/test_dataset/images.jsonl +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/dataset/test_dataset/samples-md.csv +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/dataset/test_dataset/samples-md.json +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/dataset/test_dataset/samples-md.jsonl +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/dataset/test_dataset/samples.csv +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/dataset/test_dataset/samples.json +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/dataset/test_dataset/samples.jsonl +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/dataset/test_dataset.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/log/test_eval_log/log_formats.json +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/log/test_eval_log/log_images.json +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/log/test_eval_log/log_images_tc.json +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/log/test_eval_log/log_invalid.txt +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/log/test_eval_log/log_length_stop_reason.txt +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/log/test_eval_log/log_streaming.eval +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/log/test_eval_log/log_valid.txt +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/log/test_eval_log/log_version_3.txt +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/log/test_eval_log/log_with_nan.txt +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/log/test_eval_log.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/log/test_list_logs/2024-11-05T13-31-45-05-00_input-task_8zXjbRzCWrL9GXiXo2vus9.json +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/log/test_list_logs/2024-11-05T13-32-37-05-00_input-task_hxs4q9azL3ySGkjJirypKZ.eval +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/log/test_list_logs/custom.eval +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/log/test_list_logs/ignore.json +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/log/test_list_logs.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/log/test_log_attachments.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/log/test_log_formats.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/log/test_log_level.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/log/test_log_streaming.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/log/test_log_tags.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/model/providers/test_anthropic.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/model/providers/test_azureai.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/model/providers/test_cloudflare.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/model/providers/test_google.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/model/providers/test_grok.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/model/providers/test_groq.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/model/providers/test_hf.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/model/providers/test_llama_cpp_python.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/model/providers/test_openai.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/model/providers/test_openai_o1.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/model/providers/test_vertex.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/model/providers/test_vllm.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/model/test_api_key.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/model/test_collapse_assistant_message.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/model/test_collapse_user_message.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/model/test_disable.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/model/test_logprobs.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/model/test_mock_model_llm.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/model/test_num_choices.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/model/test_parse_tool_call.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/model/test_stop_reason.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/scorer/test_answer.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/scorer/test_choice.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/scorer/test_classification.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/scorer/test_match.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/scorer/test_metric.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/scorer/test_model_graded.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/scorer/test_multiscorer.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/scorer/test_pattern.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/scorer/test_reducers.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/scorer/test_scorer.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/scorer/test_value_to_float.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/solver/test_basic_agent.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/solver/test_chain.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/solver/test_fork.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/solver/test_multiple_choice.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/solver/test_prompt.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/solver/test_setup.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/solver/test_solver.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/solver/test_solver_decorator.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/solver/test_solver_spec.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/solver/test_store.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/solver/test_subtask.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/solver/test_transcript.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_eval.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_eval_config/model.yaml +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_eval_config/solver.yaml +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_eval_config/task.yaml +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_eval_config.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_eval_set/2024-08-29T15-11-17+00-00_popularity_5EAmX6wjMFqea6WY7XHzZp.json +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_eval_set/2024-08-29T15-11-18+00-00_popularity_5EAmX6wjMFqea6WY7XHzZp.json +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_eval_set.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_examples.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_extensions.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_fail_on_error.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_helpers/__init__.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_helpers/tasks.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_helpers/tool_call_utils.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_helpers/tools.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_helpers/utils.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_list_task.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_log_dir/example_task/example_task.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_log_dir/test_log_dir.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_package/.gitignore +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_package/inspect_package/__init__.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_package/inspect_package/_registry.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_package/inspect_package/approvers/renamer.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_package/inspect_package/modelapi/custom.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_package/inspect_package/py.typed +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_package/inspect_package/sandboxenv/podman.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_package/inspect_package/score/scorer.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_package/inspect_package/solvers/cot.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_package/pyproject.toml +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_retry.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_run_dir/task1/task1.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_run_dir/task2/task2.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_run_dir.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_sample_id.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_sample_limits.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_task_attr.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_task_list/__init__.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_task_list/attribs.ipynb +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_task_list/multiple.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_task_list/multiple_dir/_decoy/testit.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_task_list/multiple_dir/_decoy2.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_task_list/multiple_dir/bar.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_task_list/multiple_dir/foo.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_task_list/recurse/.folder3/epsilon.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_task_list/recurse/folder1/_decoy.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_task_list/recurse/folder1/theta.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_task_list/recurse/folder2/.folder3/epsilon.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_task_list/recurse/folder2/another.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/test_task_list/recurse/folder2/first.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/tools/docker-compose-context/Dockerfile +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/tools/docker-compose-context-alpine/Dockerfile +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/tools/test_bash_tool.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/tools/test_max_exec_output.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/tools/test_max_tool_output.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/tools/test_python_tool.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/tools/test_sandbox_compose.yaml +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/tools/test_sandbox_compose_alpine.yaml +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/tools/test_sandbox_docker_and_local.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/tools/test_sandbox_dockerfile.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/tools/test_sandbox_tool_eval.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/tools/test_tool_def.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/tools/test_tool_parse.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/tools/test_tool_view.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/tools/test_tool_with.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/tools/test_tools.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/tools/test_use_tools.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/tools/test_web_browser.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/tools/test_web_browser_compose.yaml +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/util/sandbox/docker_compose_multiple_services/docker-compose.yaml +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/util/sandbox/sandbox_setup.sh +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/util/sandbox/test_docker_compose_multiple_services.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/util/sandbox/test_sandbox_service.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/util/sandbox/test_sandbox_setup.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/util/test_file.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/util/test_images/images.jsonl +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/util/test_images.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/util/test_package.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/util/test_registry.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/util/test_str_to_float.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/util/test_subprocess.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tests/view/test_bundle.py +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/.eslintrc.json +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/.gitignore +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/.vscode/extensions.json +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/.vscode/launch.json +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/.vscode/settings.json +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/.vscode/tasks.json +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/.vscode-test.mjs +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/.vscodeignore +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/.yarnrc +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/CHANGELOG.md +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/LICENSE +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/README.md +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/assets/icon/eval-treeview.svg +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/assets/icon/eval.svg +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/assets/logo/inspect.png +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/assets/logo/inspect.svg +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/assets/templates/task.py.template +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/assets/www/codicon/codicon.css +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/assets/www/codicon/codicon.ttf +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/assets/www/view/view-overrides.css +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/package.json +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/@types/hooks.d.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/@types/log.d.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/components/document.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/components/error.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/components/focus.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/components/notebook.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/components/symbol.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/components/task.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/components/templates.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/components/webview.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/core/appdirs.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/core/command.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/core/dispose.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/core/env.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/core/file.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/core/git.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/core/jsonrpc.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/core/log.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/core/nonce.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/core/path.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/core/port.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/core/process.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/core/python/code.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/core/python/env.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/core/python/exec.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/core/python/index.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/core/python/interpreter.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/core/random.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/core/string.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/core/text.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/core/uri.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/core/vscode/association.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/core/wait.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/core/workspace.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/extension.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/hooks/hooks.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/hooks/index.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/hooks/preview.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/inspect/index.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/inspect/logs.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/inspect/props.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/inspect/version.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/active-task/active-task-command.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/active-task/active-task-provider.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/activity-bar-provider.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/env-config-provider.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/log-listing/log-directory-selector.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/log-listing/log-listing-data.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/log-listing/log-listing-mru.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/log-listing/log-listing-provider.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/log-listing/log-listing.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/task-config-commands.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/task-config-provider.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/task-outline-commands.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/task-outline-provider.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/webview/env-config-webview.css +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/webview/env-config-webview.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/webview/task-config-webview.css +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/webview/task-config-webview.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/webview/vscode-controls.css +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/activity-bar/webview/webview-utils.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/codelens/codelens-provider.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/inspect/inspect-commands.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/inspect/inspect-constants.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/inspect/inspect-eval-commands.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/inspect/inspect-eval.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/inspect/inspect-logs-watcher.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/inspect/inspect-manager.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/inspect/inspect-view-server.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/lognotify.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/logview/commands.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/logview/logview-editor.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/logview/logview-link-provider.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/logview/logview-panel.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/logview/logview-state.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/logview/logview-view.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/logview/logview.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/openlog.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/protocol-handler.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/settings/inspect-settings.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/settings/user-settings.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/statusbar.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/workspace/workspace-env-commands.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/workspace/workspace-env-provider.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/workspace/workspace-init.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/workspace/workspace-state-provider.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/providers/workspace/workspace-task-provider.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/src/test/extension.test.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/tools/ts-to-mjs/.gitignore +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/tools/ts-to-mjs/package.json +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/tools/ts-to-mjs/rollup.config.js +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/tools/ts-to-mjs/src/index.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/tools/ts-to-mjs/src/jsonrpc.ts +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/tools/ts-to-mjs/yarn.lock +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/tsconfig.json +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/webpack.config.js +0 -0
- {inspect_ai-0.3.53 → inspect_ai-0.3.54}/tools/vscode/yarn.lock +0 -0
@@ -1,5 +1,14 @@
|
|
1
1
|
# Changelog
|
2
2
|
|
3
|
+
## v0.3.54 (26 December 2024)
|
4
|
+
|
5
|
+
- [Action tracing](https://github.com/UKGovernmentBEIS/inspect_ai/pull/1038) for diagnosing runs with unterminated actions (e.g. model calls, docker commands, etc.).
|
6
|
+
- Provide default timeout/retry for docker compose commands to mitigate unreliability in some configurations.
|
7
|
+
- Switch to sync S3 writes to overcome unreliability observed when using async interface.
|
8
|
+
- Task display: Added `--no-score-display` option to disable realtime scoring metrics.
|
9
|
+
- Bugfix: Fix failure to fully clone samples that have message lists as input.
|
10
|
+
- llama-cpp-python: Support for `logprobs`.
|
11
|
+
|
3
12
|
## v0.3.53 (20 December 2024)
|
4
13
|
|
5
14
|
- OpenAI: Support for o1 including native tool calling and `reasoning_effort` generation option.
|
@@ -9,7 +18,7 @@
|
|
9
18
|
- Bedrock: Support for `jpeg` images.
|
10
19
|
- Bedrock: Correct max_tokens for llama3-8b, llama3-70b models on Bedrock.
|
11
20
|
- Inspect View: Various improvements to appearance of tool calls in transcript.
|
12
|
-
- Task display: Ensure that widths of progress elements are kept
|
21
|
+
- Task display: Ensure that widths of progress elements are kept consistent across tasks.
|
13
22
|
- Sandboxes: New `max_sandboxes` option for (per-provider) maximum number of running sandboxes.
|
14
23
|
- Sandboxes: Remove use of aiofiles to mitigate potential for threading deadlocks.
|
15
24
|
- Concurrency: Do not use `max_tasks` as a lower bound for `max_samples`.
|
@@ -47,10 +56,10 @@
|
|
47
56
|
- Task display: Resolve issue where task display would lose mouse input after VS Code reload.
|
48
57
|
- Datasets: Validate that all IDs in datasets are unique (as several downstream problems occur w/ duplicate IDs).
|
49
58
|
- Inspect View: Fix issue with incorrectly displayed custom tool views.
|
50
|
-
- Human approval: Use
|
59
|
+
- Human approval: Use fullscreen display (makes approval UI async and enables rapid processing of approvals via the `Enter` key).
|
51
60
|
- Added `input_panel()` API for adding custom panels to the fullscreen task display.
|
52
61
|
- Log recorder: Methods are now async which will improve performance for fsspec filesystems with async implementations (e.g. S3)
|
53
|
-
- Log recorder: Improve `.eval` log reading performance for remote filesystem (
|
62
|
+
- Log recorder: Improve `.eval` log reading performance for remote filesystem (eagerly fetch log to local buffer).
|
54
63
|
- Add `token_usage` property to `TaskState` which has current total tokens used across all calls to `generate()` (same value that is used for enforcing token limits).
|
55
64
|
- Add `time` field to `ModelOutput` that records total time spent within call to ModelAPI `generate()`.
|
56
65
|
- Web browser: Remove base64 images from web page contents (prevent filling up model context with large images).
|
@@ -63,7 +72,7 @@
|
|
63
72
|
- Bugfix: Correct rate limit error display when running in fullscreen mode.
|
64
73
|
- Bugfix: `hf_dataset` now explicitly requires the `split` argument (previously, it would crash when not specified).
|
65
74
|
- Bugfix: Prevent cascading textual error when an error occurs during task initialisation.
|
66
|
-
- Bugfix: Correctly restore sample summaries from log file after
|
75
|
+
- Bugfix: Correctly restore sample summaries from log file after amend.
|
67
76
|
- Bugfix: Report errors that occur during task finalisation.
|
68
77
|
|
69
78
|
## v0.3.49 (03 December 2024)
|
@@ -71,9 +80,9 @@
|
|
71
80
|
- Logging: Only call CreateBucket on Amazon S3 when the bucket does not already exist.
|
72
81
|
- Improve cancellation feedback and prevent multiple cancellations when using fullscreen display.
|
73
82
|
- Inspect View: Prevent circular reference error when rendering complex tool input.
|
74
|
-
- Inspect View: Resolve display issue with sorting by sample then epoch.
|
83
|
+
- Inspect View: Resolve display issue with sorting by sample then epoch.
|
75
84
|
|
76
|
-
## v0.3.48 (01 December 2024)
|
85
|
+
## v0.3.48 (01 December 2024)
|
77
86
|
|
78
87
|
- [Realtime display](https://github.com/UKGovernmentBEIS/inspect_ai/pull/865) of sample transcripts (including ability to cancel running samples).
|
79
88
|
- Scoring: When using a dictionary to map metrics to score value dictionaries, you may now use globs as keys. See our [scorer documentation](https://inspect.ai-safety-institute.org.uk/scorers.html#sec-multiple-scorers) for more information.
|
@@ -85,9 +94,9 @@
|
|
85
94
|
- Google: Support for tools/functions that have no parameters.
|
86
95
|
- Google/Vertex: Support for `logprobs` and other new 1.5 (002 series) options.
|
87
96
|
- AzureAI: Change default max_tokens for Llama models to 2048 (4096 currently yields an error w/ Llama 3.1).
|
88
|
-
- Mistral: Various
|
97
|
+
- Mistral: Various compatibility changes for their client and tool calling implementation.
|
89
98
|
- Handle exponents in numeric normalisation for match, include, and answer scorers.
|
90
|
-
- hf_dataset: Added `cached` argument to control whether to use a previously cached version of the dataset if available (defaults to `True`).
|
99
|
+
- hf_dataset: Added `cached` argument to control whether to use a previously cached version of the dataset if available (defaults to `True`).
|
91
100
|
- hf_dataset: Added `revision` option to load a specific branch or commit SHA (when using `revision` datasets are always revalidated on Hugging Face, i.e. `cached` is ignored).
|
92
101
|
- Log viewer: Display sample ids rather than indexes.
|
93
102
|
- Log viewer: Add timestamps to transcript events.
|
@@ -95,9 +104,9 @@
|
|
95
104
|
- Log viewer: Show custom tool call views in messages display.
|
96
105
|
- Bugfix: Correctly read and forward image detail property.
|
97
106
|
- Bugfix: Correct resolution of global eval override of task or sample sandboxes.
|
98
|
-
- Bugfix: Don't do eval log listing on background threads (s3fs can deadlock when run from
|
107
|
+
- Bugfix: Don't do eval log listing on background threads (s3fs can deadlock when run from multiple threads).
|
99
108
|
|
100
|
-
## v0.3.47 (18 November 2024)
|
109
|
+
## v0.3.47 (18 November 2024)
|
101
110
|
|
102
111
|
- Basic agent: Ensure that the scorer is only run once when max_attempts = 1.
|
103
112
|
- Basic agent: Support custom function for incorrect_message reply to model.
|
@@ -108,7 +117,7 @@
|
|
108
117
|
- Scoring: When using a dictionary to map metrics to score value dictionaries, you may now use globs as keys. See our [scorer documentation](https://inspect.ai-safety-institute.org.uk/scorers.html#sec-multiple-scorers) for more information.
|
109
118
|
- Sample limit events will now appear in the transcript if a limit (e.g. message, token, or time limit) halts a sample. The sample list and sample detail also display the limit, if applicable.
|
110
119
|
|
111
|
-
## v0.3.46 (12 November 2024)
|
120
|
+
## v0.3.46 (12 November 2024)
|
112
121
|
|
113
122
|
- [eval](https://inspect.ai-safety-institute.org.uk/eval-logs.html#sec-log-format) is now the default log format (use `--log-format=json` to use old format).
|
114
123
|
- Base 64 images are now logged by default for all log formats (disable with `--no-log-images`).
|
@@ -133,7 +142,7 @@
|
|
133
142
|
- Log model calls when model providers return bad request errors
|
134
143
|
- Better lay out large numbers of configuration and parameters when displaying log files.
|
135
144
|
- The log viewer now properly displays sample scores for running tasks.
|
136
|
-
- Add `metadata` field to `ModelOutput` and provide
|
145
|
+
- Add `metadata` field to `ModelOutput` and provide various fields for the Groq provider.
|
137
146
|
|
138
147
|
## v0.3.44 (04 November 2024)
|
139
148
|
|
@@ -149,7 +158,7 @@
|
|
149
158
|
- View: properly render complex score objects in transcript.
|
150
159
|
- Write custom tool call views into transcript for use by Inspect View.
|
151
160
|
- Use `casefold()` for case-insensitive compare in `includes()`, `match()`, `exact()`, and `f1()` scorers.
|
152
|
-
- OpenAI: eliminate use of `strict` tool calling (sporadically supported across models and we already
|
161
|
+
- OpenAI: eliminate use of `strict` tool calling (sporadically supported across models and we already internally validate).
|
153
162
|
- Mistral: fix bug where base_url was not respected when passing both an api_key and base_url.
|
154
163
|
- Don't include package scope for task name part of log files.
|
155
164
|
- Improve performance of write_file for Docker sandboxes.
|
@@ -202,7 +211,7 @@
|
|
202
211
|
- Correct llama3 and o1 tool calling when empty arguments passed.
|
203
212
|
- Allow resolution of any sandbox name when there is only a single environment.
|
204
213
|
- Introduce `--log-level-transcript` option for separate control of log entries recorded in the eval log file
|
205
|
-
- Improve mime type detection for image content encoding (fixes issues w/ webp images).
|
214
|
+
- Improve mime type detection for image content encoding (fixes issues w/ webp images).
|
206
215
|
- Fix memory leak in Inspect View worker-based JSON parsing.
|
207
216
|
- Add `fail_on_error` option for `eval_retry()` and `inspect eval-retry`.
|
208
217
|
- Defer resolving helper models in `self_critique()` and `model_graded_qa()`.
|
@@ -225,7 +234,7 @@
|
|
225
234
|
## v0.3.39 (3 October 2024)
|
226
235
|
|
227
236
|
- The sample transcript will now display the target for scoring in the Score Event (for newly run evaluations).
|
228
|
-
- Provide setter for `max_messages` on `TaskState`.
|
237
|
+
- Provide setter for `max_messages` on `TaskState`.
|
229
238
|
- Provide `max_messages` option for `basic_agent()` (defaulting to 50) and use it rather than any task `max_messages` defined.
|
230
239
|
- Improved implementation of disabling parallel tool calling (also fixes a transcript issue introduced by the original implementation).
|
231
240
|
- Improve quality of error messages when a model API key environment variable is missing.
|
@@ -236,7 +245,7 @@
|
|
236
245
|
- Rename `web_browser_tools()` to `web_browser()`, and don't export individual web browsing tools.
|
237
246
|
- Add `parallel` option to `@tool` decorator and specify `parallel=False` for web browsing tools.
|
238
247
|
- Improve prompting for web browser tools using more explicit examples.
|
239
|
-
- Improve prompting for `</tool_call>` end sequence for Llama models.
|
248
|
+
- Improve prompting for `</tool_call>` end sequence for Llama models.
|
240
249
|
- Fix issue with failure to execute sample setup scripts.
|
241
250
|
|
242
251
|
## v0.3.37 (2 October 2024)
|
@@ -245,7 +254,7 @@
|
|
245
254
|
|
246
255
|
## v0.3.36 (2 October 2024)
|
247
256
|
|
248
|
-
- [Web Browser](https://inspect.ai-safety-institute.org.uk/tools.html#sec-web-browser) tool which provides a headless
|
257
|
+
- [Web Browser](https://inspect.ai-safety-institute.org.uk/tools.html#sec-web-browser) tool which provides a headless Chromium browser that supports navigation, history, and mouse/keyboard interactions.
|
249
258
|
- `auto_id` option for dataset readers to assign an auto-incrementing ID to records.
|
250
259
|
- Task args: don't attempt to serialise registry objects that don't have captured parameters.
|
251
260
|
|
@@ -263,7 +272,7 @@
|
|
263
272
|
|
264
273
|
- Support for `max_tokens` on OpenAI o1 models (map to `max_completion_tokens`).
|
265
274
|
- Fix regression of log and debug options on `inspect view`
|
266
|
-
- Improved focus management for
|
275
|
+
- Improved focus management for Inspect View
|
267
276
|
- Raise error if `epochs` is less than 1
|
268
277
|
- Improve code parsing for HumanEval (compatibility with Llama model output)
|
269
278
|
|
@@ -274,9 +283,9 @@
|
|
274
283
|
- Option to disable ANSI terminal output with `--no-ansi` or `INSPECT_NO_ANSI`
|
275
284
|
- Add chain of thought option to `multiple_choice()` and export `MultipleChoiceTemplate` enumeration
|
276
285
|
- Allow Docker sandboxes configured with `x-default` to be referred to by their declared service name.
|
277
|
-
- Improved error messages for
|
286
|
+
- Improved error messages for Docker sandbox initialisation.
|
278
287
|
- Improve legibility of Docker sandbox log entries (join rather than displaying as array)
|
279
|
-
- Display user message immediately
|
288
|
+
- Display user message immediately preceding assistant message in model call transcripts.
|
280
289
|
- Display images created by tool calls in the Viewer.
|
281
290
|
- Fix duplicated tool call output display in Viewer for Gemini and Llama models.
|
282
291
|
- Require a `max_messages` for use of `basic_agent()` (as without it, the agent could end up in an infinite loop).
|
@@ -291,8 +300,8 @@
|
|
291
300
|
|
292
301
|
- Fix issue w/ subtasks not getting a fresh store() (regression from introduction of `fork()` in v0.3.30)
|
293
302
|
- Fix issue w/ subtasks that return None invalidating the log file.
|
294
|
-
- Make subtasks
|
295
|
-
- Improved error reporting for missing `web_search()` provider environment variables.
|
303
|
+
- Make subtasks collapsible in Inspect View.
|
304
|
+
- Improved error reporting for missing `web_search()` provider environment variables.
|
296
305
|
|
297
306
|
## v0.3.31 (24 September 2024)
|
298
307
|
|
@@ -330,7 +339,7 @@
|
|
330
339
|
- Don't log base64 images by default (re-enable logging with `--log-images`).
|
331
340
|
- Provide unique tool id when parsing tool calls for models that don't support native tool usage.
|
332
341
|
- Fix bug that prevented `epoch_reducer` from being used in eval-retry.
|
333
|
-
- Fix bug that prevented eval() level `epoch` from overriding task level `epoch`.
|
342
|
+
- Fix bug that prevented eval() level `epoch` from overriding task level `epoch`.
|
334
343
|
|
335
344
|
## v0.3.28 (14 September 2024)
|
336
345
|
|
@@ -374,7 +383,7 @@
|
|
374
383
|
- Add optional user parameter to SandboxEnvironment.exec for specifying the user. Currently only DockerSandboxEnvironment is supported.
|
375
384
|
- Fix issue with resolving Docker configuration files when not running from the task directory.
|
376
385
|
- Only populate Docker compose config metadata values when they are used in the file.
|
377
|
-
- Treat Sandbox exec `cwd` that are relative paths as relative to sample working
|
386
|
+
- Treat Sandbox exec `cwd` that are relative paths as relative to sample working directory.
|
378
387
|
- Filter base64 encoded images out of model API call logs.
|
379
388
|
- Raise error when a Solver does not return a TaskState.
|
380
389
|
- Only run tests that use model APIs when the `--runapi` flag is passed to `pytest` (prevents unintended token usage)
|
@@ -383,7 +392,6 @@
|
|
383
392
|
- Only enable `strict` mode for OpenAI tool calls when all function parameters are required.
|
384
393
|
- Added [MMMU](https://github.com/UKGovernmentBEIS/inspect_evals/tree/main/src/inspect_evals/mmmu), [CommonsenseQA](https://github.com/UKGovernmentBEIS/inspect_evals/tree/main/src/inspect_evals/commonsense_qa), [MMLU-Pro](https://github.com/UKGovernmentBEIS/inspect_evals/tree/main/src/inspect_evals/mmlu_pro), and [XSTest](https://github.com/UKGovernmentBEIS/inspect_evals/tree/main/src/inspect_evals/xstest) benchmarks.
|
385
394
|
|
386
|
-
|
387
395
|
## v0.3.25 (25 August 2024)
|
388
396
|
|
389
397
|
- [Store](https://inspect.ai-safety-institute.org.uk/agents-api.html#sharing-state) for manipulating arbitrary sample state from within solvers and tools.
|
@@ -404,7 +412,7 @@
|
|
404
412
|
## v0.3.23 (16 August 2024)
|
405
413
|
|
406
414
|
- Support for tool calling for Llama 3.1 models on Azure AI and CloudFlare.
|
407
|
-
-
|
415
|
+
- Increase default `max_tokens` from 1024 to 2048.
|
408
416
|
- Record individual sample reductions along with results for multi-epoch evals.
|
409
417
|
- Change default to not log base64 encoded versions of images, as this often resulted in extremely large log files (use `--log-images` to opt back in).
|
410
418
|
- Update to new Mistral API (v1.0.1 of `mistralai` is now required).
|
@@ -426,13 +434,13 @@
|
|
426
434
|
- Set Claude default `max_tokens` to 4096
|
427
435
|
- Combine user and assistant messages for Vertex models.
|
428
436
|
- Warn when using the `name` parameter with task created from `@task` decorated function.
|
429
|
-
- Make sample `metadata` available in prompt, grading, and self-
|
437
|
+
- Make sample `metadata` available in prompt, grading, and self-critique templates.
|
430
438
|
- Retry on several additional OpenAI errors (APIConnectionError | APITimeoutError | InternalServerError)
|
431
439
|
- Fix a regression which would cause the 'answer' to be improperly recorded when scoring a sample.
|
432
440
|
|
433
441
|
## v0.3.20 (03 August 2024)
|
434
442
|
|
435
|
-
- `Epochs` data type for specifying epochs and reducers together (deprecated `epochs_reducer` argument).
|
443
|
+
- `Epochs` data type for specifying epochs and reducers together (deprecated `epochs_reducer` argument).
|
436
444
|
- Enable customisation of model generation cache dir via `INSPECT_CACHE_DIR` environment variable.
|
437
445
|
- Use doc comment description rather than `prompt` attribute of `@tool` for descriptions.
|
438
446
|
- Include examples section from doc comments in tool descriptions.
|
@@ -485,8 +493,6 @@
|
|
485
493
|
- Set maximum rate limit backoff time to 30 minutes
|
486
494
|
- Retry with exponential backoff for web_search Google provider.
|
487
495
|
|
488
|
-
|
489
|
-
|
490
496
|
## v0.3.18 (14 July 2024)
|
491
497
|
|
492
498
|
- [Multiple Scorers](https://inspect.ai-safety-institute.org.uk/scorers.html#sec-multiple-scorers) are now supported for evaluation tasks.
|
@@ -495,7 +501,7 @@
|
|
495
501
|
- Improved handling of very large (> 100MB) log files in Inspect View.
|
496
502
|
- Use `network_mode: none` for disabling networking by default in Docker tool environments.
|
497
503
|
- Shorten the default shutdown grace period for Docker container cleanup to 1 second.
|
498
|
-
- Allow sandbox
|
504
|
+
- Allow sandbox environment providers to specify a default `max_samples` (set to 25 for the Docker provider).
|
499
505
|
- Prevent concurrent calls to `eval_async()` (unsafe because of need to change directories for tasks). Parallel task evaluation will instead be implemented as a top-level feature of `eval()` and `eval_async()`.
|
500
506
|
- Match scorers now return answers consistently even when there is no match.
|
501
507
|
- Relocate tool related types into a new top-level `inspect_ai.tool` module (previous imports still work for now, but result in a runtime deprecation warning).
|
@@ -506,7 +512,7 @@
|
|
506
512
|
|
507
513
|
- Optional increased control over the tool use loop via the `call_tools()` function and new `tool_calls` parameter for `generate()`.
|
508
514
|
- New `per_epoch` option for `CachePolicy` to allow caching to ignore epochs.
|
509
|
-
- Correctly handle `choices` and `files` when converting `Sample` images to base64.
|
515
|
+
- Correctly handle `choices` and `files` when converting `Sample` images to base64.
|
510
516
|
|
511
517
|
## v0.3.16 (24 June 2024)
|
512
518
|
|
@@ -585,7 +591,7 @@
|
|
585
591
|
- Add `multi_scorer()` and `majority_vote()` functions for combining multiple scorers into a single score.
|
586
592
|
- Add support for multiple model graders in `model_graded_qa()`.
|
587
593
|
- Raise `TypeError` for solvers and scorers not declared as `async`.
|
588
|
-
- Fallback to standard
|
594
|
+
- Fallback to standard parse if `NaN` or `Inf` is encountered while reading log file header.
|
589
595
|
- Remove deprecated support for matching partial model names (e.g. "gpt" or "claude").
|
590
596
|
|
591
597
|
## v0.3.8 (07 May 2024)
|
@@ -617,7 +623,7 @@
|
|
617
623
|
- `write_eval_log()` now ignores unserializable objects in metadata fields.
|
618
624
|
- `read_eval_log()` now takes a `str` or `FileInfo` (for compatibility w/ list returned from `list_eval_logs()`).
|
619
625
|
- Registry name lookups are now case sensitive (fixes issue w/ loading tasks w/ mixed case names).
|
620
|
-
-
|
626
|
+
- Resiliency to Python syntax errors that occur when enumerating tasks in a directory.
|
621
627
|
- Do not throw error if unable to parse or load `.ipynb` file due to lack of dependencies (e.g. `nbformat`).
|
622
628
|
- Various additions to log viewer display (log file name, dataset/scorer in listing, filter by complex score types).
|
623
629
|
- Improvements to markdown rendering in log viewer (don't render intraword underscores, escape html tags).
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: inspect_ai
|
3
|
-
Version: 0.3.
|
3
|
+
Version: 0.3.54
|
4
4
|
Summary: Framework for large language model evaluations
|
5
5
|
Author: UK AI Safety Institute
|
6
6
|
License: MIT License
|
@@ -96,22 +96,22 @@ To get started with Inspect, please see the documentation at <https://inspect.ai
|
|
96
96
|
|
97
97
|
***
|
98
98
|
|
99
|
-
|
100
|
-
|
101
99
|
To work on development of Inspect, clone the repository and install with the `-e` flag and `[dev]` optional dependencies:
|
102
100
|
|
103
101
|
```bash
|
104
|
-
|
105
|
-
|
106
|
-
|
102
|
+
git clone https://github.com/UKGovernmentBEIS/inspect_ai.git
|
103
|
+
cd inspect_ai
|
104
|
+
pip install -e ".[dev]"
|
107
105
|
```
|
108
106
|
|
109
107
|
Optionally install pre-commit hooks via
|
108
|
+
|
110
109
|
```bash
|
111
110
|
make hooks
|
112
111
|
```
|
113
112
|
|
114
113
|
Run linting, formatting, and tests via
|
114
|
+
|
115
115
|
```bash
|
116
116
|
make check
|
117
117
|
make test
|
@@ -8,22 +8,22 @@ To get started with Inspect, please see the documentation at <https://inspect.ai
|
|
8
8
|
|
9
9
|
***
|
10
10
|
|
11
|
-
|
12
|
-
|
13
11
|
To work on development of Inspect, clone the repository and install with the `-e` flag and `[dev]` optional dependencies:
|
14
12
|
|
15
13
|
```bash
|
16
|
-
|
17
|
-
|
18
|
-
|
14
|
+
git clone https://github.com/UKGovernmentBEIS/inspect_ai.git
|
15
|
+
cd inspect_ai
|
16
|
+
pip install -e ".[dev]"
|
19
17
|
```
|
20
18
|
|
21
19
|
Optionally install pre-commit hooks via
|
20
|
+
|
22
21
|
```bash
|
23
22
|
make hooks
|
24
23
|
```
|
25
24
|
|
26
25
|
Run linting, formatting, and tests via
|
26
|
+
|
27
27
|
```bash
|
28
28
|
make check
|
29
29
|
make test
|
@@ -90,7 +90,7 @@ If you do need to interact with the underlying JSON (e.g., when reading logs fro
|
|
90
90
|
|
91
91
|
## Image Logging
|
92
92
|
|
93
|
-
By default, full base64 encoded copies of images are included in the log file. Image logging will not create performance problems when using `.eval` logs, however if you are using `.json` logs then large numbers of images could become
|
93
|
+
By default, full base64 encoded copies of images are included in the log file. Image logging will not create performance problems when using `.eval` logs, however if you are using `.json` logs then large numbers of images could become unwieldy (i.e. if your `.json` log file grows to 100mb or larger as a result).
|
94
94
|
|
95
95
|
You can disable this using the `--no-log-images` flag. For example, here we enable the `.json` log format and disable image logging:
|
96
96
|
|
@@ -324,7 +324,7 @@ The `_registry.py` file serves a place to import things that you wan't registere
|
|
324
324
|
from .approvers import auto_approver
|
325
325
|
```
|
326
326
|
|
327
|
-
You can then register your `auto_approver` Inspect extension (and
|
327
|
+
You can then register your `auto_approver` Inspect extension (and anything else imported into `_registry.py`) like this in `pyproject.toml`:
|
328
328
|
|
329
329
|
::: {.panel-tabset group="entry-points"}
|
330
330
|
## Setuptools
|
@@ -20,7 +20,7 @@ Inspect has several built-in tools, including:
|
|
20
20
|
|
21
21
|
- [Bash and Python](#sec-bash-and-python) for executing arbitrary shell and Python code.
|
22
22
|
|
23
|
-
- [Web Browser](#sec-web-browser), which provides the model with a headless
|
23
|
+
- [Web Browser](#sec-web-browser), which provides the model with a headless Chromium web browser that supports navigation, history, and mouse/keyboard interactions.
|
24
24
|
|
25
25
|
- [Web Search](#sec-web-search), which uses the Google Search API to execute and summarise web searches.
|
26
26
|
|
@@ -104,7 +104,7 @@ If you do not explicitly handle errors, then Inspect provides some default error
|
|
104
104
|
|
105
105
|
- `ToolError` — Special error thrown by tools to indicate they'd like to report an error to the model.
|
106
106
|
|
107
|
-
These are all errors that are *expected* (in fact the `
|
107
|
+
These are all errors that are *expected* (in fact the `SandboxEnvironment` interface documents them as such) and possibly recoverable by the model (try a different command, read a different file, etc.). Unexpected errors (e.g. a network error communicating with a remote service or container runtime) on the other hand are not automatically handled and result in the `Sample` failing with an error.
|
108
108
|
|
109
109
|
Many tools can simply rely on the default handling to provide reasonable behaviour around both expected and unexpected errors.
|
110
110
|
|
@@ -120,7 +120,7 @@ Another type of explicit handling is re-raising an error to bypass Inspect's def
|
|
120
120
|
|
121
121
|
``` python
|
122
122
|
try:
|
123
|
-
result = await
|
123
|
+
result = await sandbox().exec(
|
124
124
|
cmd=["decode", file],
|
125
125
|
timeout=timeout
|
126
126
|
)
|
@@ -314,7 +314,7 @@ See the [Agents](#sec-agents) section for more details on how to build evaluatio
|
|
314
314
|
|
315
315
|
## Web Browser {#sec-web-browser}
|
316
316
|
|
317
|
-
The web browser tools
|
317
|
+
The web browser tools provide models with the ability to browse the web using a headless Chromium browser. Navigation, history, and mouse/keyboard interactions are all supported.
|
318
318
|
|
319
319
|
### Configuration
|
320
320
|
|
@@ -408,7 +408,7 @@ RUN pip install playwright
|
|
408
408
|
RUN playwright install
|
409
409
|
RUN playwright install-deps
|
410
410
|
|
411
|
-
# Install other
|
411
|
+
# Install other dependencies
|
412
412
|
RUN pip install dm-env-rpc pillow bs4 lxml
|
413
413
|
|
414
414
|
# Copy Python files alongside the Dockerfile
|
@@ -78,7 +78,7 @@ inspect eval security_guide.py
|
|
78
78
|
|
79
79
|
[HellaSwag](https://rowanzellers.com/hellaswag/) is a dataset designed to test commonsense natural language inference (NLI) about physical situations. It includes samples that are adversarially constructed to violate common sense about the physical world, so can be a challenge for some language models.
|
80
80
|
|
81
|
-
For example, here is one of the questions in the dataset along with its set of possible
|
81
|
+
For example, here is one of the questions in the dataset along with its set of possible answers (the correct answer is C):
|
82
82
|
|
83
83
|
> In home pet groomers demonstrate how to groom a pet. the person
|
84
84
|
>
|
@@ -570,4 +570,4 @@ def ctf_agent(max_attempts=3, message_limit=30):
|
|
570
570
|
|
571
571
|
The `basic_agent()` provides a ReAct tool loop with support for retries and encouraging the model to continue if it gives up or gets stuck. The `bash()` and `python()` tools are provided to the model with a 3-minute timeout to prevent long running commands from getting the evaluation stuck.
|
572
572
|
|
573
|
-
See the [full source code](https://github.com/UKGovernmentBEIS/inspect_evals/tree/main/src/inspect_evals/gdm_capabilities/intercode_ctf) of the Intercode CTF example to explore the dataset and evaluation code in more depth.
|
573
|
+
See the [full source code](https://github.com/UKGovernmentBEIS/inspect_evals/tree/main/src/inspect_evals/gdm_capabilities/intercode_ctf) of the Intercode CTF example to explore the dataset and evaluation code in more depth.
|
@@ -42,6 +42,7 @@ LOG_BUFFER_HELP = "Number of samples to buffer before writing log file. If not s
|
|
42
42
|
NO_SCORE_HELP = (
|
43
43
|
"Do not score model output (use the inspect score command to score output later)"
|
44
44
|
)
|
45
|
+
NO_SCORE_DISPLAY = "Do not display scoring metrics in realtime."
|
45
46
|
MAX_CONNECTIONS_HELP = f"Maximum number of concurrent connections to Model API (defaults to {DEFAULT_MAX_CONNECTIONS})"
|
46
47
|
MAX_RETRIES_HELP = (
|
47
48
|
f"Maximum number of times to retry request (defaults to {DEFAULT_MAX_RETRIES})"
|
@@ -257,6 +258,13 @@ def eval_options(func: Callable[..., Any]) -> Callable[..., click.Context]:
|
|
257
258
|
help=NO_SCORE_HELP,
|
258
259
|
envvar="INSPECT_EVAL_NO_SCORE",
|
259
260
|
)
|
261
|
+
@click.option(
|
262
|
+
"--no-score-display",
|
263
|
+
type=bool,
|
264
|
+
is_flag=True,
|
265
|
+
help=NO_SCORE_DISPLAY,
|
266
|
+
envvar="INSPECT_EVAL_SCORE_DISPLAY",
|
267
|
+
)
|
260
268
|
@click.option(
|
261
269
|
"--max-tokens",
|
262
270
|
type=int,
|
@@ -339,7 +347,7 @@ def eval_options(func: Callable[..., Any]) -> Callable[..., click.Context]:
|
|
339
347
|
"--logprobs",
|
340
348
|
type=bool,
|
341
349
|
is_flag=True,
|
342
|
-
help="Return log probabilities of the output tokens. OpenAI, Google, Grok, TogetherAI, Huggingface, vLLM only.",
|
350
|
+
help="Return log probabilities of the output tokens. OpenAI, Google, Grok, TogetherAI, Huggingface, llama-cpp-python, and vLLM only.",
|
343
351
|
envvar="INSPECT_EVAL_LOGPROBS",
|
344
352
|
)
|
345
353
|
@click.option(
|
@@ -446,6 +454,7 @@ def eval_command(
|
|
446
454
|
log_images: bool | None,
|
447
455
|
log_buffer: int | None,
|
448
456
|
no_score: bool | None,
|
457
|
+
no_score_display: bool | None,
|
449
458
|
log_format: Literal["eval", "json"] | None,
|
450
459
|
**common: Unpack[CommonOptions],
|
451
460
|
) -> None:
|
@@ -495,6 +504,7 @@ def eval_command(
|
|
495
504
|
log_images=log_images,
|
496
505
|
log_buffer=log_buffer,
|
497
506
|
no_score=no_score,
|
507
|
+
no_score_display=no_score_display,
|
498
508
|
is_eval_set=False,
|
499
509
|
**config,
|
500
510
|
)
|
@@ -603,6 +613,7 @@ def eval_set_command(
|
|
603
613
|
log_images: bool | None,
|
604
614
|
log_buffer: int | None,
|
605
615
|
no_score: bool | None,
|
616
|
+
no_score_display: bool | None,
|
606
617
|
bundle_dir: str | None,
|
607
618
|
bundle_overwrite: bool | None,
|
608
619
|
log_format: Literal["eval", "json"] | None,
|
@@ -654,6 +665,7 @@ def eval_set_command(
|
|
654
665
|
log_images=log_images,
|
655
666
|
log_buffer=log_buffer,
|
656
667
|
no_score=no_score,
|
668
|
+
no_score_display=no_score_display,
|
657
669
|
is_eval_set=True,
|
658
670
|
retry_attempts=retry_attempts,
|
659
671
|
retry_wait=retry_wait,
|
@@ -706,6 +718,7 @@ def eval_exec(
|
|
706
718
|
log_images: bool | None,
|
707
719
|
log_buffer: int | None,
|
708
720
|
no_score: bool | None,
|
721
|
+
no_score_display: bool | None,
|
709
722
|
is_eval_set: bool = False,
|
710
723
|
retry_attempts: int | None = None,
|
711
724
|
retry_wait: int | None = None,
|
@@ -746,6 +759,7 @@ def eval_exec(
|
|
746
759
|
log_images = False if log_images is False else None
|
747
760
|
trace = True if trace else None
|
748
761
|
score = False if no_score else True
|
762
|
+
score_display = False if no_score_display else None
|
749
763
|
|
750
764
|
# build params
|
751
765
|
params: dict[str, Any] = (
|
@@ -781,6 +795,7 @@ def eval_exec(
|
|
781
795
|
log_images=log_images,
|
782
796
|
log_buffer=log_buffer,
|
783
797
|
score=score,
|
798
|
+
score_display=score_display,
|
784
799
|
)
|
785
800
|
| kwargs
|
786
801
|
)
|
@@ -915,6 +930,13 @@ def parse_comma_separated(value: str | None) -> list[str] | None:
|
|
915
930
|
help=NO_SCORE_HELP,
|
916
931
|
envvar="INSPECT_EVAL_SCORE",
|
917
932
|
)
|
933
|
+
@click.option(
|
934
|
+
"--no-score-display",
|
935
|
+
type=bool,
|
936
|
+
is_flag=True,
|
937
|
+
help=NO_SCORE_DISPLAY,
|
938
|
+
envvar="INSPECT_EVAL_SCORE_DISPLAY",
|
939
|
+
)
|
918
940
|
@click.option(
|
919
941
|
"--max-connections",
|
920
942
|
type=int,
|
@@ -940,6 +962,7 @@ def eval_retry_command(
|
|
940
962
|
log_images: bool | None,
|
941
963
|
log_buffer: int | None,
|
942
964
|
no_score: bool | None,
|
965
|
+
no_score_display: bool | None,
|
943
966
|
max_connections: int | None,
|
944
967
|
max_retries: int | None,
|
945
968
|
timeout: int | None,
|
@@ -954,6 +977,7 @@ def eval_retry_command(
|
|
954
977
|
log_samples = False if no_log_samples else None
|
955
978
|
log_images = False if log_images is False else None
|
956
979
|
score = False if no_score else True
|
980
|
+
score_display = False if no_score_display else None
|
957
981
|
|
958
982
|
# resolve fail_on_error
|
959
983
|
if no_fail_on_error is True:
|
@@ -984,6 +1008,7 @@ def eval_retry_command(
|
|
984
1008
|
log_images=log_images,
|
985
1009
|
log_buffer=log_buffer,
|
986
1010
|
score=score,
|
1011
|
+
score_display=score_display,
|
987
1012
|
max_retries=max_retries,
|
988
1013
|
timeout=timeout,
|
989
1014
|
max_connections=max_connections,
|
@@ -11,6 +11,7 @@ from .list import list_command
|
|
11
11
|
from .log import log_command
|
12
12
|
from .sandbox import sandbox_command
|
13
13
|
from .score import score_command
|
14
|
+
from .trace import trace_command
|
14
15
|
from .view import view_command
|
15
16
|
|
16
17
|
|
@@ -46,6 +47,7 @@ inspect.add_command(log_command)
|
|
46
47
|
inspect.add_command(score_command)
|
47
48
|
inspect.add_command(view_command)
|
48
49
|
inspect.add_command(sandbox_command)
|
50
|
+
inspect.add_command(trace_command)
|
49
51
|
|
50
52
|
|
51
53
|
def main() -> None:
|