inspect-ai 0.3.49__py3-none-any.whl → 0.3.51__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- inspect_ai/_cli/info.py +2 -2
- inspect_ai/_cli/log.py +2 -2
- inspect_ai/_cli/score.py +2 -2
- inspect_ai/_display/core/display.py +19 -0
- inspect_ai/_display/core/panel.py +37 -7
- inspect_ai/_display/core/progress.py +29 -2
- inspect_ai/_display/core/results.py +79 -40
- inspect_ai/_display/core/textual.py +21 -0
- inspect_ai/_display/rich/display.py +28 -8
- inspect_ai/_display/textual/app.py +107 -1
- inspect_ai/_display/textual/display.py +1 -1
- inspect_ai/_display/textual/widgets/samples.py +132 -91
- inspect_ai/_display/textual/widgets/task_detail.py +236 -0
- inspect_ai/_display/textual/widgets/tasks.py +74 -6
- inspect_ai/_display/textual/widgets/toggle.py +32 -0
- inspect_ai/_eval/context.py +2 -0
- inspect_ai/_eval/eval.py +4 -3
- inspect_ai/_eval/loader.py +1 -1
- inspect_ai/_eval/run.py +35 -2
- inspect_ai/_eval/task/log.py +13 -11
- inspect_ai/_eval/task/results.py +12 -3
- inspect_ai/_eval/task/run.py +139 -36
- inspect_ai/_eval/task/sandbox.py +2 -1
- inspect_ai/_util/_async.py +30 -1
- inspect_ai/_util/file.py +31 -4
- inspect_ai/_util/html.py +3 -0
- inspect_ai/_util/logger.py +6 -5
- inspect_ai/_util/platform.py +5 -6
- inspect_ai/_util/registry.py +1 -1
- inspect_ai/_view/server.py +9 -9
- inspect_ai/_view/www/App.css +2 -2
- inspect_ai/_view/www/dist/assets/index.css +2 -2
- inspect_ai/_view/www/dist/assets/index.js +352 -294
- inspect_ai/_view/www/log-schema.json +13 -0
- inspect_ai/_view/www/package.json +1 -0
- inspect_ai/_view/www/src/components/MessageBand.mjs +1 -1
- inspect_ai/_view/www/src/components/Tools.mjs +16 -13
- inspect_ai/_view/www/src/samples/SampleDisplay.mjs +1 -3
- inspect_ai/_view/www/src/samples/SampleScoreView.mjs +52 -77
- inspect_ai/_view/www/src/samples/SamplesDescriptor.mjs +38 -13
- inspect_ai/_view/www/src/samples/transcript/ModelEventView.mjs +15 -2
- inspect_ai/_view/www/src/samples/transcript/state/StateEventRenderers.mjs +4 -2
- inspect_ai/_view/www/src/types/log.d.ts +2 -0
- inspect_ai/_view/www/src/workspace/WorkSpace.mjs +2 -0
- inspect_ai/_view/www/yarn.lock +9 -4
- inspect_ai/approval/__init__.py +1 -1
- inspect_ai/approval/_human/approver.py +35 -0
- inspect_ai/approval/_human/console.py +62 -0
- inspect_ai/approval/_human/manager.py +108 -0
- inspect_ai/approval/_human/panel.py +233 -0
- inspect_ai/approval/_human/util.py +51 -0
- inspect_ai/dataset/_sources/hf.py +2 -2
- inspect_ai/dataset/_sources/util.py +1 -1
- inspect_ai/log/_file.py +106 -36
- inspect_ai/log/_recorders/eval.py +226 -158
- inspect_ai/log/_recorders/file.py +9 -6
- inspect_ai/log/_recorders/json.py +35 -12
- inspect_ai/log/_recorders/recorder.py +15 -15
- inspect_ai/log/_samples.py +52 -0
- inspect_ai/model/_model.py +14 -0
- inspect_ai/model/_model_output.py +4 -0
- inspect_ai/model/_providers/azureai.py +1 -1
- inspect_ai/model/_providers/hf.py +106 -4
- inspect_ai/model/_providers/util/__init__.py +2 -0
- inspect_ai/model/_providers/util/hf_handler.py +200 -0
- inspect_ai/scorer/_common.py +1 -1
- inspect_ai/solver/_plan.py +0 -8
- inspect_ai/solver/_task_state.py +18 -1
- inspect_ai/solver/_use_tools.py +9 -1
- inspect_ai/tool/_tool_def.py +2 -2
- inspect_ai/tool/_tool_info.py +14 -2
- inspect_ai/tool/_tool_params.py +2 -1
- inspect_ai/tool/_tools/_execute.py +1 -1
- inspect_ai/tool/_tools/_web_browser/_web_browser.py +6 -0
- inspect_ai/util/__init__.py +5 -6
- inspect_ai/util/_panel.py +91 -0
- inspect_ai/util/_sandbox/__init__.py +2 -6
- inspect_ai/util/_sandbox/context.py +4 -3
- inspect_ai/util/_sandbox/docker/compose.py +12 -2
- inspect_ai/util/_sandbox/docker/docker.py +19 -9
- inspect_ai/util/_sandbox/docker/util.py +10 -2
- inspect_ai/util/_sandbox/environment.py +47 -41
- inspect_ai/util/_sandbox/local.py +15 -10
- inspect_ai/util/_subprocess.py +43 -3
- {inspect_ai-0.3.49.dist-info → inspect_ai-0.3.51.dist-info}/METADATA +2 -2
- {inspect_ai-0.3.49.dist-info → inspect_ai-0.3.51.dist-info}/RECORD +90 -82
- inspect_ai/_view/www/node_modules/flatted/python/flatted.py +0 -149
- inspect_ai/_view/www/node_modules/flatted/python/test.py +0 -63
- inspect_ai/approval/_human.py +0 -123
- {inspect_ai-0.3.49.dist-info → inspect_ai-0.3.51.dist-info}/LICENSE +0 -0
- {inspect_ai-0.3.49.dist-info → inspect_ai-0.3.51.dist-info}/WHEEL +0 -0
- {inspect_ai-0.3.49.dist-info → inspect_ai-0.3.51.dist-info}/entry_points.txt +0 -0
- {inspect_ai-0.3.49.dist-info → inspect_ai-0.3.51.dist-info}/top_level.txt +0 -0
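The detailed hunks below cover the three log recorder modules (`inspect_ai/log/_recorders/eval.py`, `file.py`, and `json.py`). The headline change is that the recorder interface became async in 0.3.51: `log_init`, `log_start`, `log_sample`, `flush`, `log_finish`, `read_log`, `read_log_sample`, and `write_log` are now coroutines. A minimal usage sketch based only on the signatures shown in the diffs (the module path is private API and the log path is hypothetical):

```python
# Sketch: EvalRecorder.read_log is an async classmethod in 0.3.51
# (it was sync in 0.3.49), so direct callers now need an event loop.
import asyncio

from inspect_ai.log._recorders.eval import EvalRecorder


async def main() -> None:
    # header_only=True skips loading the individual samples from the zip
    log = await EvalRecorder.read_log("./logs/example.eval", header_only=True)
    print(log.status)


asyncio.run(main())
```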
inspect_ai/log/_recorders/eval.py

```diff
@@ -1,8 +1,13 @@
+import asyncio
 import json
+import os
 import tempfile
+from contextlib import _AsyncGeneratorContextManager
+from logging import getLogger
 from typing import Any, BinaryIO, Literal, cast
 from zipfile import ZIP_DEFLATED, ZipFile
 
+from fsspec.asyn import AsyncFileSystem  # type: ignore
 from pydantic import BaseModel, Field
 from pydantic_core import to_json
 from typing_extensions import override
@@ -10,7 +15,7 @@ from typing_extensions import override
 from inspect_ai._util.constants import LOG_SCHEMA_VERSION
 from inspect_ai._util.content import ContentImage, ContentText
 from inspect_ai._util.error import EvalError
-from inspect_ai._util.file import dirname, file
+from inspect_ai._util.file import FileSystem, async_fileystem, dirname, file, filesystem
 from inspect_ai._util.json import jsonable_python
 from inspect_ai.model._chat_message import ChatMessage
 from inspect_ai.scorer._metric import Score
@@ -27,15 +32,17 @@ from .._log import (
 )
 from .file import FileRecorder
 
+logger = getLogger(__name__)
+
 
 class SampleSummary(BaseModel):
     id: int | str
     epoch: int
     input: str | list[ChatMessage]
     target: str | list[str]
-    scores: dict[str, Score] | None
-    error: str | None
-    limit: str | None
+    scores: dict[str, Score] | None = Field(default=None)
+    error: str | None = Field(default=None)
+    limit: str | None = Field(default=None)
 
 
 class LogStart(BaseModel):
@@ -82,55 +89,54 @@ class EvalRecorder(FileRecorder):
         self.data: dict[str, ZipLogFile] = {}
 
     @override
-    def log_init(self, eval: EvalSpec, location: str | None = None) -> str:
-        # file
-
+    async def log_init(self, eval: EvalSpec, location: str | None = None) -> str:
+        # if the file exists then read summaries
+        if location is not None and self.fs.exists(location):
+            with file(location, "rb") as f:
+                with ZipFile(f, "r") as zip:
+                    log_start = _read_start(zip)
+                    summary_counter = _read_summary_counter(zip)
+                    summaries = _read_all_summaries(zip, summary_counter)
+        else:
+            log_start = None
+            summary_counter = 0
+            summaries = []
 
         # create zip wrapper
-
-
-
-        summary_counter = _read_summary_counter(zip_log_file.zip)
-        summaries = _read_all_summaries(zip_log_file.zip, summary_counter)
-
-        # Initialize the eval header (without results)
-        log_start = _read_start(zip_log_file.zip)
-
-        # The zip log file
-        zip_log_file.init(log_start, summary_counter, summaries)
+        zip_file = location or self._log_file_path(eval)
+        zip_log_file = ZipLogFile(file=zip_file)
+        await zip_log_file.init(log_start, summary_counter, summaries)
 
         # track zip
         self.data[self._log_file_key(eval)] = zip_log_file
 
         # return file path
-        return
+        return zip_file
 
     @override
-    def log_start(self, eval: EvalSpec, plan: EvalPlan) -> None:
+    async def log_start(self, eval: EvalSpec, plan: EvalPlan) -> None:
+        log = self.data[self._log_file_key(eval)]
         start = LogStart(version=LOG_SCHEMA_VERSION, eval=eval, plan=plan)
-
-
-        log = self.data[self._log_file_key(eval)]  # noqa: F841
-        log.log_start = start
+        await log.start(start)
 
     @override
-    def log_sample(self, eval: EvalSpec, sample: EvalSample) -> None:
-        log = self.data[self._log_file_key(eval)]
-        log.
+    async def log_sample(self, eval: EvalSpec, sample: EvalSample) -> None:
+        log = self.data[self._log_file_key(eval)]
+        await log.buffer_sample(sample)
 
     @override
-    def flush(self, eval: EvalSpec) -> None:
+    async def flush(self, eval: EvalSpec) -> None:
         # get the zip log
         log = self.data[self._log_file_key(eval)]
 
         # write the buffered samples
-
+        await log.write_buffered_samples()
 
         # flush to underlying stream
-        log.flush()
+        await log.flush()
 
     @override
-    def log_finish(
+    async def log_finish(
         self,
         eval: EvalSpec,
         status: Literal["started", "success", "cancelled", "error"],
@@ -144,18 +150,14 @@ class EvalRecorder(FileRecorder):
         log = self.data[key]
 
         # write the buffered samples
-
+        await log.write_buffered_samples()
 
         # write consolidated summaries
-
+        await log.write(SUMMARIES_JSON, log._summaries)
 
         # write reductions
         if reductions is not None:
-
-            eval,
-            REDUCTIONS_JSON,
-            reductions,
-        )
+            await log.write(REDUCTIONS_JSON, reductions)
 
         # Get the results
         log_results = LogResults(
@@ -165,7 +167,7 @@ class EvalRecorder(FileRecorder):
         # add the results to the original eval log from start.json
         log_start = log.log_start
         if log_start is None:
-            raise RuntimeError("
+            raise RuntimeError("Log not properly initialised")
 
         eval_header = EvalLog(
             version=log_start.version,
@@ -176,50 +178,39 @@ class EvalRecorder(FileRecorder):
             status=log_results.status,
             error=log_results.error,
         )
-
-        # write the results
-        self._write(eval, HEADER_JSON, eval_header)
-
-        # close the file
-        log.close()
+        await log.write(HEADER_JSON, eval_header)
 
         # stop tracking this eval
         del self.data[key]
 
-        #
-
+        # flush and write the results
+        await log.flush()
+        return await log.close()
 
     @classmethod
     @override
-    def read_log(cls, location: str, header_only: bool = False) -> EvalLog:
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-        ".json"
-        ):
-            with zip.open(name, "r") as f:
-                samples.append(EvalSample(**json.load(f)))
-        sort_samples(samples)
-        evalLog.samples = samples
-        return evalLog
+    async def read_log(cls, location: str, header_only: bool = False) -> EvalLog:
+        # if the log is not stored in the local filesystem then download it first,
+        # and then read it from a temp file (eliminates the possiblity of hundreds
+        # of small fetches from the zip file streams)
+        temp_log: str | None = None
+        fs = filesystem(location)
+        if not fs.is_local():
+            with tempfile.NamedTemporaryFile(delete=False) as temp:
+                temp_log = temp.name
+                fs.get_file(location, temp_log)
+
+        # read log (use temp_log if we have it)
+        try:
+            with file(temp_log or location, "rb") as z:
+                return _read_log(z, location, header_only)
+        finally:
+            if temp_log:
+                os.unlink(temp_log)
 
     @override
     @classmethod
-    def read_log_sample(
+    async def read_log_sample(
         cls, location: str, id: str | int, epoch: int = 1
     ) -> EvalSample:
         with file(location, "rb") as z:
@@ -234,67 +225,17 @@ class EvalRecorder(FileRecorder):
 
     @classmethod
     @override
-    def write_log(cls, location: str, log: EvalLog) -> None:
+    async def write_log(cls, location: str, log: EvalLog) -> None:
         # write using the recorder (so we get all of the extra streams)
         recorder = EvalRecorder(dirname(location))
-        recorder.log_init(log.eval, location)
-        recorder.log_start(log.eval, log.plan)
+        await recorder.log_init(log.eval, location)
+        await recorder.log_start(log.eval, log.plan)
         for sample in log.samples or []:
-            recorder.log_sample(log.eval, sample)
-        recorder.log_finish(
+            await recorder.log_sample(log.eval, sample)
+        await recorder.log_finish(
             log.eval, log.status, log.stats, log.results, log.reductions, log.error
         )
 
-    # write to the zip file
-    def _write(self, eval: EvalSpec, filename: str, data: Any) -> None:
-        log = self.data[self._log_file_key(eval)]
-        zip_write(log.zip, filename, data)
-
-    # write buffered samples to the zip file
-    def _write_buffered_samples(self, eval: EvalSpec) -> None:
-        # get the log
-        log = self.data[self._log_file_key(eval)]
-
-        # Write the buffered samples
-        summaries: list[SampleSummary] = []
-        for sample in log.samples:
-            # Write the sample
-            self._write(eval, _sample_filename(sample.id, sample.epoch), sample)
-
-            # Capture the summary
-            summaries.append(
-                SampleSummary(
-                    id=sample.id,
-                    epoch=sample.epoch,
-                    input=text_inputs(sample.input),
-                    target=sample.target,
-                    scores=sample.scores,
-                    error=sample.error.message if sample.error is not None else None,
-                    limit=f"{sample.limit.type}" if sample.limit is not None else None,
-                )
-            )
-        log.samples.clear()
-
-        # write intermediary summaries and add to master list
-        if len(summaries) > 0:
-            log.summary_counter += 1
-            summary_file = _journal_summary_file(log.summary_counter)
-            summary_path = _journal_summary_path(summary_file)
-            self._write(eval, summary_path, summaries)
-            log.summaries.extend(summaries)
-
-
-def zip_write(zip: ZipFile, filename: str, data: Any) -> None:
-    zip.writestr(
-        filename,
-        to_json(
-            value=jsonable_python(data),
-            indent=2,
-            exclude_none=True,
-            fallback=lambda _x: None,
-        ),
-    )
-
 
 
 def text_inputs(inputs: str | list[ChatMessage]) -> str | list[ChatMessage]:
     # Clean the input of any images
@@ -317,52 +258,179 @@ def text_inputs(inputs: str | list[ChatMessage]) -> str | list[ChatMessage]:
 
 
 class ZipLogFile:
-
-
-
-
+    _zip: ZipFile
+    _temp_file: BinaryIO
+    _fs: FileSystem
+    _async_fs_context: _AsyncGeneratorContextManager[AsyncFileSystem] | None = None
+    _async_fs: AsyncFileSystem | None = None
 
     def __init__(self, file: str) -> None:
-        self.
-        self.
-
-
-
-        self.
-        self.
-        self.
-
-
-
-    def init(
+        self._file = file
+        self._fs = filesystem(file)
+        self._lock = asyncio.Lock()
+        self._temp_file = tempfile.TemporaryFile()
+        self._samples: list[EvalSample] = []
+        self._summary_counter = 0
+        self._summaries: list[SampleSummary] = []
+        self._log_start: LogStart | None = None
+
+    async def init(
         self,
         log_start: LogStart | None,
         summary_counter: int,
         summaries: list[SampleSummary],
     ) -> None:
-        self.
-
-
+        async with self._lock:
+            # connect to async filesystem if we can
+            if self._fs.is_async():
+                self._async_fs_context = async_fileystem(self._file)
+                self._async_fs = await self._async_fs_context.__aenter__()
+
+            self._open()
+            self._summary_counter = summary_counter
+            self._summaries = summaries
+            self._log_start = log_start
+
+    @property
+    def log_start(self) -> LogStart | None:
+        return self._log_start
+
+    async def start(self, start: LogStart) -> None:
+        async with self._lock:
+            self._log_start = start
+            self._zip_writestr(_journal_path(START_JSON), start)
+
+    async def buffer_sample(self, sample: EvalSample) -> None:
+        async with self._lock:
+            self._samples.append(sample)
+
+    async def write_buffered_samples(self) -> None:
+        async with self._lock:
+            # Write the buffered samples
+            summaries: list[SampleSummary] = []
+            for sample in self._samples:
+                # Write the sample
+                self._zip_writestr(_sample_filename(sample.id, sample.epoch), sample)
+
+                # Capture the summary
+                summaries.append(
+                    SampleSummary(
+                        id=sample.id,
+                        epoch=sample.epoch,
+                        input=text_inputs(sample.input),
+                        target=sample.target,
+                        scores=sample.scores,
+                        error=sample.error.message
+                        if sample.error is not None
+                        else None,
+                        limit=f"{sample.limit.type}"
+                        if sample.limit is not None
+                        else None,
+                    )
+                )
+            self._samples.clear()
+
+            # write intermediary summaries and add to master list
+            if len(summaries) > 0:
+                self._summary_counter += 1
+                summary_file = _journal_summary_file(self._summary_counter)
+                summary_path = _journal_summary_path(summary_file)
+                self._zip_writestr(summary_path, summaries)
+                self._summaries.extend(summaries)
+
+    async def write(self, filename: str, data: Any) -> None:
+        async with self._lock:
+            self._zip_writestr(filename, data)
+
+    async def flush(self) -> None:
+        async with self._lock:
+            # close the zip file so it is flushed
+            self._zip.close()
+
+            # read the temp_file (leaves pointer at end for subsequent appends)
+            self._temp_file.seek(0)
+            log_bytes = self._temp_file.read()
+
+            # attempt async write
+            written = False
+            try:
+                if self._async_fs:
+                    await self._async_fs._pipe_file(self._file, log_bytes)
+                    written = True
+            except Exception as ex:
+                logger.warning(
+                    f"Error occurred during async write to {self._file}: {ex}. Falling back to sync write."
+                )
 
-
-
-
-
-
-
+            # write sync if we need to
+            if not written:
+                with file(self._file, "wb") as f:
+                    f.write(log_bytes)
+
+            # re-open zip file w/ self.temp_file pointer at end
+            self._open()
+
+    async def close(self) -> EvalLog:
+        async with self._lock:
+            # close the async context if we have one
+            try:
+                if self._async_fs_context:
+                    await self._async_fs_context.__aexit__(None, None, None)
+            except Exception as ex:
+                logger.warning(
+                    f"Error occurred while closing async fs for {self._file}: {ex}"
+                )
 
-
-
-
+            # read the log from the temp file then close it
+            try:
+                self._temp_file.seek(0)
+                return _read_log(self._temp_file, self._file)
+            finally:
+                self._temp_file.close()
 
     def _open(self) -> None:
-        self.
-        self.
+        self._zip = ZipFile(
+            self._temp_file,
             mode="a",
             compression=ZIP_DEFLATED,
             compresslevel=5,
         )
 
+    # raw unsynchronized version of write
+    def _zip_writestr(self, filename: str, data: Any) -> None:
+        self._zip.writestr(
+            filename,
+            to_json(
+                value=jsonable_python(data),
+                indent=2,
+                exclude_none=True,
+                fallback=lambda _x: None,
+            ),
+        )
+
+
+def _read_log(log: BinaryIO, location: str, header_only: bool = False) -> EvalLog:
+    with ZipFile(log, mode="r") as zip:
+        evalLog = _read_header(zip, location)
+        if REDUCTIONS_JSON in zip.namelist():
+            with zip.open(REDUCTIONS_JSON, "r") as f:
+                reductions = [
+                    EvalSampleReductions(**reduction) for reduction in json.load(f)
+                ]
+                if evalLog.results is not None:
+                    evalLog.reductions = reductions
+
+        samples: list[EvalSample] | None = None
+        if not header_only:
+            samples = []
+            for name in zip.namelist():
+                if name.startswith(f"{SAMPLES_DIR}/") and name.endswith(".json"):
+                    with zip.open(name, "r") as f:
+                        samples.append(EvalSample(**json.load(f)))
            sort_samples(samples)
+            evalLog.samples = samples
+        return evalLog
+
 
 def _read_start(zip: ZipFile) -> LogStart | None:
     start_path = _journal_path(START_JSON)
```
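The rewritten `ZipLogFile` above serializes all archive access behind an `asyncio.Lock` and accumulates the zip in a local temp file: `flush` closes the `ZipFile` (forcing the central directory to be written), reads the accumulated bytes, and writes them to the destination in a single operation before re-opening the archive in append mode. A simplified sketch of that buffering pattern, with invented names and only the sync write path (the shipped class also handles async filesystems, sample buffering, and summaries):

```python
import asyncio
import tempfile
from zipfile import ZIP_DEFLATED, ZipFile


class BufferedZipLog:
    def __init__(self, dest: str) -> None:
        self._dest = dest
        self._lock = asyncio.Lock()
        # the archive accumulates here, not at the destination
        self._temp = tempfile.TemporaryFile()
        self._open()

    def _open(self) -> None:
        # append mode lets us re-open the same temp file after a flush
        self._zip = ZipFile(self._temp, mode="a", compression=ZIP_DEFLATED)

    async def write(self, name: str, payload: bytes) -> None:
        async with self._lock:
            self._zip.writestr(name, payload)

    async def flush(self) -> None:
        async with self._lock:
            self._zip.close()  # closing forces the central directory out
            self._temp.seek(0)
            data = self._temp.read()  # pointer is left at end for later appends
            with open(self._dest, "wb") as f:
                f.write(data)  # one whole-buffer write to the destination
            self._open()  # re-open for subsequent writes
```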
inspect_ai/log/_recorders/file.py

```diff
@@ -1,15 +1,16 @@
+from logging import getLogger
 from typing import Any
 
 from typing_extensions import override
 
-from inspect_ai._util.file import (
-    filesystem,
-)
+from inspect_ai._util.file import filesystem
 from inspect_ai._util.registry import registry_unqualified_name
 
 from .._log import EvalLog, EvalSample, EvalSpec
 from .recorder import Recorder
 
+logger = getLogger(__name__)
+
 
 class FileRecorder(Recorder):
     __last_read_sample_log: tuple[str, EvalLog] | None = None
@@ -18,23 +19,25 @@ class FileRecorder(Recorder):
         self, log_dir: str, suffix: str, fs_options: dict[str, Any] = {}
     ) -> None:
         self.log_dir = log_dir.rstrip("/\\")
+        self.suffix = suffix
+
+        # initialise filesystem
         self.fs = filesystem(log_dir, fs_options)
         self.fs.mkdir(self.log_dir, exist_ok=True)
-        self.suffix = suffix
 
     def is_local(self) -> bool:
         return self.fs.is_local()
 
     @override
     @classmethod
-    def read_log_sample(
+    async def read_log_sample(
        cls, location: str, id: str | int, epoch: int = 1
     ) -> EvalSample:
         # establish the log to read from (might be cached)
         if cls.__last_read_sample_log and (cls.__last_read_sample_log[0] == "location"):
             eval_log = cls.__last_read_sample_log[1]
         else:
-            eval_log = cls.read_log(location)
+            eval_log = await cls.read_log(location)
             cls.__last_read_sample_log = (location, eval_log)
 
         # throw if no samples
```
inspect_ai/log/_recorders/json.py

```diff
@@ -1,3 +1,4 @@
+from logging import getLogger
 from typing import Any, Literal, get_args
 
 import ijson  # type: ignore
@@ -10,7 +11,9 @@ from inspect_ai._util.constants import LOG_SCHEMA_VERSION
 from inspect_ai._util.error import EvalError
 from inspect_ai._util.file import (
     absolute_file_path,
+    async_fileystem,
     file,
+    filesystem,
 )
 
 from .._log import (
@@ -25,6 +28,8 @@ from .._log import (
 )
 from .file import FileRecorder
 
+logger = getLogger(__name__)
+
 
 class JSONRecorder(FileRecorder):
     @override
@@ -57,7 +62,7 @@ class JSONRecorder(FileRecorder):
         self.data: dict[str, JSONRecorder.JSONLogFile] = {}
 
     @override
-    def log_init(self, eval: EvalSpec, location: str | None = None) -> str:
+    async def log_init(self, eval: EvalSpec, location: str | None = None) -> str:
         # initialize file log for this eval
         # compute an absolute path if it's a relative ref
         # (so that the writes go to the correct place even
@@ -75,19 +80,19 @@ class JSONRecorder(FileRecorder):
         return file
 
     @override
-    def log_start(self, eval: EvalSpec, plan: EvalPlan) -> None:
+    async def log_start(self, eval: EvalSpec, plan: EvalPlan) -> None:
         log = self.data[self._log_file_key(eval)]
         log.data.plan = plan
 
     @override
-    def log_sample(self, eval: EvalSpec, sample: EvalSample) -> None:
+    async def log_sample(self, eval: EvalSpec, sample: EvalSample) -> None:
         log = self.data[self._log_file_key(eval)]
         if log.data.samples is None:
             log.data.samples = []
         log.data.samples.append(sample)
 
     @override
-    def log_finish(
+    async def log_finish(
         self,
         spec: EvalSpec,
         status: Literal["started", "success", "cancelled", "error"],
@@ -104,7 +109,7 @@ class JSONRecorder(FileRecorder):
         log.data.error = error
         if reductions:
             log.data.reductions = reductions
-        self.write_log(log.file, log.data)
+        await self.write_log(log.file, log.data)
         log.data.location = log.file
 
         # stop tracking this data
@@ -114,13 +119,13 @@ class JSONRecorder(FileRecorder):
         return log.data
 
     @override
-    def flush(self, eval: EvalSpec) -> None:
+    async def flush(self, eval: EvalSpec) -> None:
         log = self.data[self._log_file_key(eval)]
-        self.write_log(log.file, log.data)
+        await self.write_log(log.file, log.data)
 
     @override
     @classmethod
-    def read_log(cls, location: str, header_only: bool = False) -> EvalLog:
+    async def read_log(cls, location: str, header_only: bool = False) -> EvalLog:
         if header_only:
             try:
                 return _read_header_streaming(location)
@@ -138,7 +143,7 @@ class JSONRecorder(FileRecorder):
         else:
             raise ValueError(f"Unable to read log file: {location}") from ex
 
-        #
+        # full reads (and fallback to streaing reads if they encounter invalid json characters)
         with file(location, "r") as f:
             # parse w/ pydantic
             raw_data = from_json(f.read())
@@ -166,15 +171,33 @@ class JSONRecorder(FileRecorder):
 
     @override
     @classmethod
-    def write_log(cls, location: str, log: EvalLog) -> None:
+    async def write_log(cls, location: str, log: EvalLog) -> None:
         from inspect_ai.log._file import eval_log_json
 
         # sort samples before writing as they can come in out of order
         if log.samples:
             sort_samples(log.samples)
 
-
-
+        # get log as bytes
+        log_bytes = eval_log_json(log)
+
+        # try to write async for async filesystems
+        written = False
+        try:
+            fs = filesystem(location)
+            if fs.is_async():
+                async with async_fileystem(location) as async_fs:
+                    await async_fs._pipe_file(location, log_bytes)
+                    written = True
+        except Exception as ex:
+            logger.warning(
+                f"Error occurred during async write to {location}: {ex}. Falling back to sync write."
+            )
+
+        # otherwise use sync
+        if not written:
+            with file(location, "wb") as f:
+                f.write(log_bytes)
 
 
 def _validate_version(ver: int) -> None:
```