biblicus-1.0.0-py3-none-any.whl → biblicus-1.1.1-py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- biblicus/__init__.py +5 -5
- biblicus/analysis/__init__.py +1 -1
- biblicus/analysis/base.py +10 -10
- biblicus/analysis/markov.py +78 -68
- biblicus/analysis/models.py +47 -47
- biblicus/analysis/profiling.py +58 -48
- biblicus/analysis/topic_modeling.py +56 -51
- biblicus/cli.py +224 -177
- biblicus/{recipes.py → configuration.py} +14 -14
- biblicus/constants.py +2 -2
- biblicus/context_engine/assembler.py +49 -19
- biblicus/context_engine/retrieval.py +46 -42
- biblicus/corpus.py +116 -108
- biblicus/errors.py +3 -3
- biblicus/evaluation.py +27 -25
- biblicus/extraction.py +103 -98
- biblicus/extraction_evaluation.py +26 -26
- biblicus/extractors/deepgram_stt.py +7 -7
- biblicus/extractors/docling_granite_text.py +11 -11
- biblicus/extractors/docling_smol_text.py +11 -11
- biblicus/extractors/markitdown_text.py +4 -4
- biblicus/extractors/openai_stt.py +7 -7
- biblicus/extractors/paddleocr_vl_text.py +20 -18
- biblicus/extractors/pipeline.py +8 -8
- biblicus/extractors/rapidocr_text.py +3 -3
- biblicus/extractors/unstructured_text.py +3 -3
- biblicus/hooks.py +4 -4
- biblicus/knowledge_base.py +33 -31
- biblicus/models.py +78 -78
- biblicus/retrieval.py +47 -40
- biblicus/retrievers/__init__.py +50 -0
- biblicus/retrievers/base.py +65 -0
- biblicus/{backends → retrievers}/embedding_index_common.py +44 -41
- biblicus/{backends → retrievers}/embedding_index_file.py +87 -58
- biblicus/{backends → retrievers}/embedding_index_inmemory.py +88 -59
- biblicus/retrievers/hybrid.py +301 -0
- biblicus/{backends → retrievers}/scan.py +83 -73
- biblicus/{backends → retrievers}/sqlite_full_text_search.py +115 -101
- biblicus/{backends → retrievers}/tf_vector.py +87 -77
- biblicus/text/prompts.py +16 -8
- biblicus/text/tool_loop.py +63 -5
- {biblicus-1.0.0.dist-info → biblicus-1.1.1.dist-info}/METADATA +52 -43
- biblicus-1.1.1.dist-info/RECORD +91 -0
- biblicus/backends/__init__.py +0 -50
- biblicus/backends/base.py +0 -65
- biblicus/backends/hybrid.py +0 -292
- biblicus-1.0.0.dist-info/RECORD +0 -91
- {biblicus-1.0.0.dist-info → biblicus-1.1.1.dist-info}/WHEEL +0 -0
- {biblicus-1.0.0.dist-info → biblicus-1.1.1.dist-info}/entry_points.txt +0 -0
- {biblicus-1.0.0.dist-info → biblicus-1.1.1.dist-info}/licenses/LICENSE +0 -0
- {biblicus-1.0.0.dist-info → biblicus-1.1.1.dist-info}/top_level.txt +0 -0
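The most visible change in this release is the rename of the biblicus/backends package to biblicus/retrievers (and of recipes.py to configuration.py). A minimal sketch of what that likely means for downstream imports, assuming the new modules are importable under the same top-level package; the evaluation.py diff below shows get_backend being replaced by get_retriever:

    # biblicus 1.0.0 (old import path)
    from biblicus.backends import get_backend

    # biblicus 1.1.1 (new import path)
    from biblicus.retrievers import get_retriever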
biblicus/corpus.py
CHANGED
@@ -20,10 +20,10 @@ from .constants import (
     ANALYSIS_RUNS_DIR_NAME,
     CORPUS_DIR_NAME,
     DEFAULT_RAW_DIR,
-    …
-    RUNS_DIR_NAME,
+    EXTRACTION_SNAPSHOTS_DIR_NAME,
     SCHEMA_VERSION,
     SIDECAR_SUFFIX,
+    SNAPSHOTS_DIR_NAME,
 )
 from .errors import IngestCollisionError
 from .frontmatter import parse_front_matter, render_front_matter
@@ -34,10 +34,10 @@ from .models import (
     CatalogItem,
     CorpusCatalog,
     CorpusConfig,
-    …
-    …
+    ExtractionSnapshotListEntry,
+    ExtractionSnapshotReference,
     IngestResult,
-    …
+    RetrievalSnapshot,
 )
 from .sources import load_source
 from .time import utc_now_iso
@@ -539,7 +539,7 @@ class Corpus:
             generated_at=utc_now_iso(),
             corpus_uri=normalize_corpus_uri(self.root),
             raw_dir=DEFAULT_RAW_DIR,
-            …
+            latest_snapshot_id=None,
             items={},
             order=[],
         )
@@ -602,69 +602,71 @@ class Corpus:
         return None

     @property
-    def …
+    def snapshots_dir(self) -> Path:
         """
-        Location of retrieval …
+        Location of retrieval snapshot manifests.

-        :return: Path to the …
+        :return: Path to the snapshots directory.
         :rtype: Path
         """
-        return self.meta_dir / …
+        return self.meta_dir / SNAPSHOTS_DIR_NAME

     @property
-    def …
+    def extraction_snapshots_dir(self) -> Path:
         """
-        Location of extraction …
+        Location of extraction snapshot artifacts.

-        :return: Path to the extraction …
+        :return: Path to the extraction snapshots directory.
         :rtype: Path
         """
-        return self.…
+        return self.snapshots_dir / EXTRACTION_SNAPSHOTS_DIR_NAME

     @property
     def analysis_runs_dir(self) -> Path:
         """
-        Location of analysis …
+        Location of analysis snapshot artifacts.

-        :return: Path to the analysis …
+        :return: Path to the analysis snapshots directory.
         :rtype: Path
         """
-        return self.…
+        return self.snapshots_dir / ANALYSIS_RUNS_DIR_NAME

-    def …
+    def extraction_snapshot_dir(self, *, extractor_id: str, snapshot_id: str) -> Path:
         """
-        Resolve an extraction …
+        Resolve an extraction snapshot directory.

         :param extractor_id: Extractor plugin identifier.
         :type extractor_id: str
-        :param …
-        :type …
-        :return: Extraction …
+        :param snapshot_id: Extraction snapshot identifier.
+        :type snapshot_id: str
+        :return: Extraction snapshot directory.
         :rtype: Path
         """
-        return self.…
+        return self.extraction_snapshots_dir / extractor_id / snapshot_id

-    def analysis_run_dir(self, *, analysis_id: str, …
+    def analysis_run_dir(self, *, analysis_id: str, snapshot_id: str) -> Path:
         """
-        Resolve an analysis …
+        Resolve an analysis snapshot directory.

         :param analysis_id: Analysis backend identifier.
         :type analysis_id: str
-        :param …
-        :type …
-        :return: Analysis …
+        :param snapshot_id: Analysis snapshot identifier.
+        :type snapshot_id: str
+        :return: Analysis snapshot directory.
         :rtype: Path
         """
-        return self.analysis_runs_dir / analysis_id / …
+        return self.analysis_runs_dir / analysis_id / snapshot_id

-    def read_extracted_text(…
+    def read_extracted_text(
+        self, *, extractor_id: str, snapshot_id: str, item_id: str
+    ) -> Optional[str]:
         """
-        Read extracted text for an item from an extraction …
+        Read extracted text for an item from an extraction snapshot, when present.

         :param extractor_id: Extractor plugin identifier.
         :type extractor_id: str
-        :param …
-        :type …
+        :param snapshot_id: Extraction snapshot identifier.
+        :type snapshot_id: str
         :param item_id: Item identifier.
         :type item_id: str
         :return: Extracted text or None if the artifact does not exist.
@@ -672,7 +674,7 @@ class Corpus:
         :raises OSError: If the file exists but cannot be read.
         """
         path = (
-            self.…
+            self.extraction_snapshot_dir(extractor_id=extractor_id, snapshot_id=snapshot_id)
             / "text"
             / f"{item_id}.txt"
         )
@@ -680,72 +682,73 @@ class Corpus:
             return None
         return path.read_text(encoding="utf-8")

-    def …
+    def load_extraction_snapshot_manifest(self, *, extractor_id: str, snapshot_id: str):
         """
-        Load an extraction …
+        Load an extraction snapshot manifest from the corpus.

         :param extractor_id: Extractor plugin identifier.
         :type extractor_id: str
-        :param …
-        :type …
-        :return: Parsed extraction …
-        :rtype: biblicus.extraction.…
+        :param snapshot_id: Extraction snapshot identifier.
+        :type snapshot_id: str
+        :return: Parsed extraction snapshot manifest.
+        :rtype: biblicus.extraction.ExtractionSnapshotManifest
         :raises FileNotFoundError: If the manifest file does not exist.
         :raises ValueError: If the manifest data is invalid.
         """
-        from .extraction import …
+        from .extraction import ExtractionSnapshotManifest

         manifest_path = (
-            self.…
+            self.extraction_snapshot_dir(extractor_id=extractor_id, snapshot_id=snapshot_id)
+            / "manifest.json"
         )
         if not manifest_path.is_file():
-            raise FileNotFoundError(f"Missing extraction …
+            raise FileNotFoundError(f"Missing extraction snapshot manifest: {manifest_path}")
         data = json.loads(manifest_path.read_text(encoding="utf-8"))
-        return …
+        return ExtractionSnapshotManifest.model_validate(data)

-    def …
+    def list_extraction_snapshots(
         self, *, extractor_id: Optional[str] = None
-    ) -> List[…
+    ) -> List[ExtractionSnapshotListEntry]:
         """
-        List extraction …
+        List extraction snapshots stored under the corpus.

         :param extractor_id: Optional extractor identifier filter.
         :type extractor_id: str or None
-        :return: Summary list entries for each …
-        :rtype: list[biblicus.models.…
+        :return: Summary list entries for each snapshot.
+        :rtype: list[biblicus.models.ExtractionSnapshotListEntry]
         """
-        …
-        if not …
+        snapshots_root = self.extraction_snapshots_dir
+        if not snapshots_root.is_dir():
            return []

         extractor_dirs: List[Path]
         if extractor_id is None:
-            extractor_dirs = [path for path in sorted(…
+            extractor_dirs = [path for path in sorted(snapshots_root.iterdir()) if path.is_dir()]
         else:
-            extractor_path = …
+            extractor_path = snapshots_root / extractor_id
             extractor_dirs = [extractor_path] if extractor_path.is_dir() else []

-        entries: List[…
+        entries: List[ExtractionSnapshotListEntry] = []
         for extractor_dir in extractor_dirs:
-            for …
-                if not …
+            for snapshot_dir in sorted(extractor_dir.iterdir()):
+                if not snapshot_dir.is_dir():
                     continue
-                manifest_path = …
+                manifest_path = snapshot_dir / "manifest.json"
                 if not manifest_path.is_file():
                     continue
                 try:
-                    manifest = self.…
+                    manifest = self.load_extraction_snapshot_manifest(
                         extractor_id=extractor_dir.name,
-                        …
+                        snapshot_id=snapshot_dir.name,
                     )
                 except (FileNotFoundError, ValueError):
                     continue
                 entries.append(
-                    …
+                    ExtractionSnapshotListEntry(
                         extractor_id=extractor_dir.name,
-                        …
-                        …
-                        …
+                        snapshot_id=snapshot_dir.name,
+                        configuration_id=manifest.configuration.configuration_id,
+                        configuration_name=manifest.configuration.name,
                         catalog_generated_at=manifest.catalog_generated_at,
                         created_at=manifest.created_at,
                         stats=dict(manifest.stats),
@@ -753,95 +756,100 @@ class Corpus:
                 )

         entries.sort(
-            key=lambda entry: (entry.created_at, entry.extractor_id, entry.…
+            key=lambda entry: (entry.created_at, entry.extractor_id, entry.snapshot_id),
+            reverse=True,
         )
         return entries

-    def …
+    def latest_extraction_snapshot_reference(
         self, *, extractor_id: Optional[str] = None
-    ) -> Optional[…
+    ) -> Optional[ExtractionSnapshotReference]:
         """
-        Return the most recent extraction …
+        Return the most recent extraction snapshot reference.

         :param extractor_id: Optional extractor identifier filter.
         :type extractor_id: str or None
-        :return: Latest extraction …
-        :rtype: biblicus.models.…
+        :return: Latest extraction snapshot reference or None when no snapshots exist.
+        :rtype: biblicus.models.ExtractionSnapshotReference or None
         """
-        entries = self.…
+        entries = self.list_extraction_snapshots(extractor_id=extractor_id)
         if not entries:
             return None
         latest = entries[0]
-        return …
+        return ExtractionSnapshotReference(
+            extractor_id=latest.extractor_id, snapshot_id=latest.snapshot_id
+        )

-    def …
+    def delete_extraction_snapshot(self, *, extractor_id: str, snapshot_id: str) -> None:
         """
-        Delete an extraction …
+        Delete an extraction snapshot directory and its derived artifacts.

         :param extractor_id: Extractor plugin identifier.
         :type extractor_id: str
-        :param …
-        :type …
+        :param snapshot_id: Extraction snapshot identifier.
+        :type snapshot_id: str
         :return: None.
         :rtype: None
-        :raises FileNotFoundError: If the extraction …
+        :raises FileNotFoundError: If the extraction snapshot directory does not exist.
         """
-        …
-        …
-        …
-        …
+        snapshot_dir = self.extraction_snapshot_dir(
+            extractor_id=extractor_id, snapshot_id=snapshot_id
+        )
+        if not snapshot_dir.is_dir():
+            raise FileNotFoundError(f"Missing extraction snapshot directory: {snapshot_dir}")
+        shutil.rmtree(snapshot_dir)

-    def …
+    def _ensure_snapshots_dir(self) -> None:
         """
-        Ensure the retrieval …
+        Ensure the retrieval snapshots directory exists.

         :return: None.
         :rtype: None
         """
-        self.…
+        self.snapshots_dir.mkdir(parents=True, exist_ok=True)

-    def …
+    def write_snapshot(self, snapshot: RetrievalSnapshot) -> None:
         """
-        Persist a retrieval …
+        Persist a retrieval snapshot manifest and update the catalog pointer.

-        :param …
-        :type …
+        :param snapshot: Snapshot manifest to persist.
+        :type snapshot: RetrievalSnapshot
         :return: None.
         :rtype: None
         """
-        self.…
-        path = self.…
-        path.write_text(…
+        self._ensure_snapshots_dir()
+        path = self.snapshots_dir / f"{snapshot.snapshot_id}.json"
+        path.write_text(snapshot.model_dump_json(indent=2) + "\n", encoding="utf-8")
         catalog = self._load_catalog()
-        catalog.…
+        catalog.latest_snapshot_id = snapshot.snapshot_id
         catalog.generated_at = utc_now_iso()
         self._write_catalog(catalog)

-    def …
+    def load_snapshot(self, snapshot_id: str) -> RetrievalSnapshot:
         """
-        Load a retrieval …
+        Load a retrieval snapshot manifest by identifier.

-        :param …
-        :type …
-        :return: Parsed …
-        :rtype: …
-        :raises FileNotFoundError: If the …
+        :param snapshot_id: Snapshot identifier.
+        :type snapshot_id: str
+        :return: Parsed snapshot manifest.
+        :rtype: RetrievalSnapshot
+        :raises FileNotFoundError: If the snapshot manifest does not exist.
         """
-        path = self.…
+        path = self.snapshots_dir / f"{snapshot_id}.json"
         if not path.is_file():
-            raise FileNotFoundError(f"Missing …
+            raise FileNotFoundError(f"Missing snapshot manifest: {path}")
         data = json.loads(path.read_text(encoding="utf-8"))
-        return …
+        return RetrievalSnapshot.model_validate(data)

     @property
-    def …
+    def latest_snapshot_id(self) -> Optional[str]:
         """
-        Latest retrieval …
+        Latest retrieval snapshot identifier recorded in the catalog.

-        :return: Latest …
+        :return: Latest snapshot identifier or None.
         :rtype: str or None
         """
-        return self._load_catalog().…
+        return self._load_catalog().latest_snapshot_id

     def _upsert_catalog_item(self, item: CatalogItem) -> None:
         """
@@ -860,7 +868,7 @@ class Corpus:
         ordered_ids.insert(0, item.id)
         catalog.order = ordered_ids
         catalog.generated_at = utc_now_iso()
-        catalog.…
+        catalog.latest_snapshot_id = None

         self._write_catalog(catalog)

@@ -1621,7 +1629,7 @@ class Corpus:
             generated_at=utc_now_iso(),
             corpus_uri=normalize_corpus_uri(self.root),
             raw_dir=DEFAULT_RAW_DIR,
-            …
+            latest_snapshot_id=None,
             items=new_items,
             order=order,
         )
@@ -1673,7 +1681,7 @@ class Corpus:
             generated_at=utc_now_iso(),
             corpus_uri=normalize_corpus_uri(self.root),
             raw_dir=DEFAULT_RAW_DIR,
-            …
+            latest_snapshot_id=None,
             items={},
             order=[],
         )
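Taken together, these hunks replace the 1.0.0 "run" vocabulary with "snapshot" throughout the Corpus API. A minimal usage sketch against the new method names shown above; how the corpus object itself is constructed is not part of this diff, so that step and the item_id value are assumptions:

    # assumes an existing Corpus instance named `corpus`
    reference = corpus.latest_extraction_snapshot_reference()
    if reference is not None:
        text = corpus.read_extracted_text(
            extractor_id=reference.extractor_id,
            snapshot_id=reference.snapshot_id,
            item_id="some-item-id",  # assumed identifier, for illustration only
        )

    # retrieval snapshots are keyed by the catalog's latest_snapshot_id
    snapshot_id = corpus.latest_snapshot_id
    if snapshot_id is not None:
        snapshot = corpus.load_snapshot(snapshot_id)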
biblicus/errors.py
CHANGED
@@ -5,13 +5,13 @@ Error types for Biblicus.
 from __future__ import annotations


-class …
+class ExtractionSnapshotFatalError(RuntimeError):
     """
-    Fatal extraction …
+    Fatal extraction snapshot error that should abort the entire snapshot.

     This exception is used for conditions that indicate a configuration or environment problem
     rather than a per-item extraction failure. For example, a selection extractor that depends
-    on referenced extraction …
+    on referenced extraction snapshot manifests treats missing manifests as fatal.
     """


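errors.py keeps a single public exception but renames it to the snapshot vocabulary; it still derives from RuntimeError. A hedged sketch of how calling code might treat it; build_extraction_snapshot is a hypothetical stand-in, since the real call site is not part of this diff:

    from biblicus.errors import ExtractionSnapshotFatalError

    try:
        build_extraction_snapshot()  # hypothetical entry point, not shown in this diff
    except ExtractionSnapshotFatalError as error:
        # configuration or environment problem: abort the whole snapshot rather than skip items
        raise SystemExit(f"extraction snapshot aborted: {error}")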
biblicus/evaluation.py
CHANGED
@@ -1,5 +1,5 @@
 """
-Evaluation utilities for Biblicus retrieval …
+Evaluation utilities for Biblicus retrieval snapshots.
 """

 from __future__ import annotations
@@ -11,10 +11,10 @@ from typing import Dict, List, Optional

 from pydantic import BaseModel, ConfigDict, Field, model_validator

-from .backends import get_backend
 from .constants import DATASET_SCHEMA_VERSION
 from .corpus import Corpus
-from .models import QueryBudget, RetrievalResult, …
+from .models import QueryBudget, RetrievalResult, RetrievalSnapshot
+from .retrievers import get_retriever
 from .time import utc_now_iso


@@ -85,10 +85,10 @@ class EvaluationResult(BaseModel):

     :ivar dataset: Dataset metadata.
     :vartype dataset: dict[str, object]
-    :ivar …
-    :vartype …
-    :ivar …
-    :vartype …
+    :ivar retriever_id: Retriever identifier.
+    :vartype retriever_id: str
+    :ivar snapshot_id: Retrieval snapshot identifier.
+    :vartype snapshot_id: str
     :ivar evaluated_at: International Organization for Standardization 8601 evaluation timestamp.
     :vartype evaluated_at: str
     :ivar metrics: Quality metrics for retrieval.
@@ -100,8 +100,8 @@ class EvaluationResult(BaseModel):
     model_config = ConfigDict(extra="forbid")

     dataset: Dict[str, object]
-    …
-    …
+    retriever_id: str
+    snapshot_id: str
     evaluated_at: str
     metrics: Dict[str, float]
     system: Dict[str, float]
@@ -120,20 +120,20 @@ def load_dataset(path: Path) -> EvaluationDataset:
     return EvaluationDataset.model_validate(data)


-def …
+def evaluate_snapshot(
     *,
     corpus: Corpus,
-    …
+    snapshot: RetrievalSnapshot,
     dataset: EvaluationDataset,
     budget: QueryBudget,
 ) -> EvaluationResult:
     """
-    Evaluate a retrieval …
+    Evaluate a retrieval snapshot against a dataset.

-    :param corpus: Corpus associated with the …
+    :param corpus: Corpus associated with the snapshot.
     :type corpus: Corpus
-    :param …
-    :type …
+    :param snapshot: Retrieval snapshot manifest.
+    :type snapshot: RetrievalSnapshot
     :param dataset: Evaluation dataset.
     :type dataset: EvaluationDataset
     :param budget: Evidence selection budget.
@@ -141,14 +141,16 @@ def evaluate_run(
     :return: Evaluation result bundle.
     :rtype: EvaluationResult
     """
-    …
+    retriever = get_retriever(snapshot.configuration.retriever_id)
     latency_seconds: List[float] = []
     hit_count = 0
     reciprocal_ranks: List[float] = []

     for query in dataset.queries:
         timer_start = time.perf_counter()
-        result = …
+        result = retriever.query(
+            corpus, snapshot=snapshot, query_text=query.query_text, budget=budget
+        )
         elapsed_seconds = time.perf_counter() - timer_start
         latency_seconds.append(elapsed_seconds)
         expected_rank = _expected_rank(result, query)
@@ -172,7 +174,7 @@
     system = {
         "average_latency_milliseconds": _average_latency_milliseconds(latency_seconds),
         "percentile_95_latency_milliseconds": _percentile_95_latency_milliseconds(latency_seconds),
-        "index_bytes": float(…
+        "index_bytes": float(_snapshot_artifact_bytes(corpus, snapshot)),
     }
     dataset_meta = {
         "name": dataset.name,
@@ -181,8 +183,8 @@
     }
     return EvaluationResult(
         dataset=dataset_meta,
-        …
-        …
+        retriever_id=snapshot.configuration.retriever_id,
+        snapshot_id=snapshot.snapshot_id,
         evaluated_at=utc_now_iso(),
         metrics=metrics,
         system=system,
@@ -238,19 +240,19 @@ def _percentile_95_latency_milliseconds(latencies: List[float]) -> float:
     return sorted_latencies[percentile_index] * 1000.0


-def …
+def _snapshot_artifact_bytes(corpus: Corpus, snapshot: RetrievalSnapshot) -> int:
     """
-    Sum artifact sizes for a retrieval …
+    Sum artifact sizes for a retrieval snapshot.

     :param corpus: Corpus that owns the artifacts.
     :type corpus: Corpus
-    :param …
-    :type …
+    :param snapshot: Retrieval snapshot manifest.
+    :type snapshot: RetrievalSnapshot
     :return: Total artifact bytes.
     :rtype: int
     """
     total_bytes = 0
-    for artifact_relpath in …
+    for artifact_relpath in snapshot.snapshot_artifacts:
         artifact_path = corpus.root / artifact_relpath
         if artifact_path.exists():
             total_bytes += artifact_path.stat().st_size