orca-sdk 0.1.9__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- orca_sdk/__init__.py +30 -0
- orca_sdk/_shared/__init__.py +10 -0
- orca_sdk/_shared/metrics.py +634 -0
- orca_sdk/_shared/metrics_test.py +570 -0
- orca_sdk/_utils/__init__.py +0 -0
- orca_sdk/_utils/analysis_ui.py +196 -0
- orca_sdk/_utils/analysis_ui_style.css +51 -0
- orca_sdk/_utils/auth.py +65 -0
- orca_sdk/_utils/auth_test.py +31 -0
- orca_sdk/_utils/common.py +37 -0
- orca_sdk/_utils/data_parsing.py +129 -0
- orca_sdk/_utils/data_parsing_test.py +244 -0
- orca_sdk/_utils/pagination.py +126 -0
- orca_sdk/_utils/pagination_test.py +132 -0
- orca_sdk/_utils/prediction_result_ui.css +18 -0
- orca_sdk/_utils/prediction_result_ui.py +110 -0
- orca_sdk/_utils/tqdm_file_reader.py +12 -0
- orca_sdk/_utils/value_parser.py +45 -0
- orca_sdk/_utils/value_parser_test.py +39 -0
- orca_sdk/async_client.py +4104 -0
- orca_sdk/classification_model.py +1165 -0
- orca_sdk/classification_model_test.py +887 -0
- orca_sdk/client.py +4096 -0
- orca_sdk/conftest.py +382 -0
- orca_sdk/credentials.py +217 -0
- orca_sdk/credentials_test.py +121 -0
- orca_sdk/datasource.py +576 -0
- orca_sdk/datasource_test.py +463 -0
- orca_sdk/embedding_model.py +712 -0
- orca_sdk/embedding_model_test.py +206 -0
- orca_sdk/job.py +343 -0
- orca_sdk/job_test.py +108 -0
- orca_sdk/memoryset.py +3811 -0
- orca_sdk/memoryset_test.py +1150 -0
- orca_sdk/regression_model.py +841 -0
- orca_sdk/regression_model_test.py +595 -0
- orca_sdk/telemetry.py +742 -0
- orca_sdk/telemetry_test.py +119 -0
- orca_sdk-0.1.9.dist-info/METADATA +98 -0
- orca_sdk-0.1.9.dist-info/RECORD +41 -0
- orca_sdk-0.1.9.dist-info/WHEEL +4 -0
|
@@ -0,0 +1,206 @@
|
|
|
1
|
+
import logging
|
|
2
|
+
from typing import get_args
|
|
3
|
+
from uuid import uuid4
|
|
4
|
+
|
|
5
|
+
import pytest
|
|
6
|
+
|
|
7
|
+
from .datasource import Datasource
|
|
8
|
+
from .embedding_model import (
|
|
9
|
+
ClassificationMetrics,
|
|
10
|
+
FinetunedEmbeddingModel,
|
|
11
|
+
PretrainedEmbeddingModel,
|
|
12
|
+
PretrainedEmbeddingModelName,
|
|
13
|
+
)
|
|
14
|
+
from .job import Status
|
|
15
|
+
from .memoryset import LabeledMemoryset
|
|
16
|
+
|
|
17
|
+
|
|
18
|
+
def test_open_pretrained_model():
    """Pretrained model handles are singletons with fixed metadata."""
    gte = PretrainedEmbeddingModel.GTE_BASE
    assert gte is not None
    assert isinstance(gte, PretrainedEmbeddingModel)
    assert (gte.name, gte.embedding_dim, gte.max_seq_length) == ("GTE_BASE", 768, 8192)
    # accessing the class attribute again must yield the very same object
    assert gte is PretrainedEmbeddingModel.GTE_BASE
|
|
26
|
+
|
|
27
|
+
|
|
28
|
+
def test_open_pretrained_model_unauthenticated(unauthenticated_client):
    """Embedding without a valid API key is rejected."""
    with unauthenticated_client.use(), pytest.raises(ValueError, match="Invalid API key"):
        PretrainedEmbeddingModel.GTE_BASE.embed("I love this airline")
|
|
32
|
+
|
|
33
|
+
|
|
34
|
+
def test_open_pretrained_model_not_found():
    """Looking up a model name that does not exist raises LookupError."""
    with pytest.raises(LookupError):
        PretrainedEmbeddingModel._get("INVALID_MODEL")  # type: ignore
|
|
37
|
+
|
|
38
|
+
|
|
39
|
+
def test_all_pretrained_models():
    """Every name in PretrainedEmbeddingModelName is served by all()."""
    available = PretrainedEmbeddingModel.all()
    assert len(available) > 1
    exposed_names = get_args(PretrainedEmbeddingModelName)
    if len(available) != len(exposed_names):
        logging.warning("Please regenerate the SDK client! Some pretrained model names are not exposed yet.")
    served_names = {model.name for model in available}
    # the API may serve more models than the generated client exposes, never fewer
    assert set(exposed_names) <= served_names
|
|
46
|
+
|
|
47
|
+
|
|
48
|
+
def test_embed_text():
    """embed() returns a 768-dimensional list of floats."""
    vector = PretrainedEmbeddingModel.GTE_BASE.embed("I love this airline", max_seq_length=32)
    assert vector is not None
    assert isinstance(vector, list)
    assert len(vector) == 768
    assert isinstance(vector[0], float)
|
|
54
|
+
|
|
55
|
+
|
|
56
|
+
def test_embed_text_unauthenticated(unauthenticated_client):
    """embed() with explicit max_seq_length still requires authentication."""
    with unauthenticated_client.use(), pytest.raises(ValueError, match="Invalid API key"):
        PretrainedEmbeddingModel.GTE_BASE.embed("I love this airline", max_seq_length=32)
|
|
60
|
+
|
|
61
|
+
|
|
62
|
+
def test_evaluate_pretrained_model(datasource: Datasource):
    """Evaluating a pretrained model yields classification metrics above chance."""
    result = PretrainedEmbeddingModel.GTE_BASE.evaluate(datasource=datasource, label_column="label")
    assert result is not None
    assert isinstance(result, ClassificationMetrics)
    assert result.accuracy > 0.5
|
|
67
|
+
|
|
68
|
+
|
|
69
|
+
@pytest.fixture(scope="session")
def finetuned_model(datasource) -> FinetunedEmbeddingModel:
    """Session-scoped DISTILBERT finetune shared by the tests below."""
    return PretrainedEmbeddingModel.DISTILBERT.finetune("test_finetuned_model", datasource)
|
|
72
|
+
|
|
73
|
+
|
|
74
|
+
def test_finetune_model_with_datasource(finetuned_model: FinetunedEmbeddingModel):
    """A datasource-based finetune completes and inherits DISTILBERT's dimensions."""
    model = finetuned_model
    assert model is not None
    assert model.name == "test_finetuned_model"
    assert model.base_model == PretrainedEmbeddingModel.DISTILBERT
    assert (model.embedding_dim, model.max_seq_length) == (768, 512)
    assert model._status == Status.COMPLETED
|
|
81
|
+
|
|
82
|
+
|
|
83
|
+
def test_finetune_model_with_memoryset(readonly_memoryset: LabeledMemoryset):
    """Finetuning also accepts a memoryset as the training data source."""
    model = PretrainedEmbeddingModel.DISTILBERT.finetune(
        "test_finetuned_model_from_memoryset", readonly_memoryset
    )
    assert model is not None
    assert model.name == "test_finetuned_model_from_memoryset"
    assert model.base_model == PretrainedEmbeddingModel.DISTILBERT
    assert (model.embedding_dim, model.max_seq_length) == (768, 512)
    assert model._status == Status.COMPLETED
|
|
93
|
+
|
|
94
|
+
|
|
95
|
+
def test_finetune_model_already_exists_error(datasource: Datasource, finetuned_model):
    """Reusing an existing finetuned model name raises by default."""
    with pytest.raises(ValueError):
        PretrainedEmbeddingModel.DISTILBERT.finetune("test_finetuned_model", datasource)
|
|
98
|
+
|
|
99
|
+
|
|
100
|
+
def test_finetune_model_already_exists_return(datasource: Datasource, finetuned_model):
    """if_exists="open" returns the existing model — but only under the matching base model."""
    # opening under a different base model is still an error
    with pytest.raises(ValueError):
        PretrainedEmbeddingModel.GTE_BASE.finetune("test_finetuned_model", datasource, if_exists="open")

    reopened = PretrainedEmbeddingModel.DISTILBERT.finetune("test_finetuned_model", datasource, if_exists="open")
    assert reopened is not None
    assert reopened.name == "test_finetuned_model"
    assert reopened.base_model == PretrainedEmbeddingModel.DISTILBERT
    assert (reopened.embedding_dim, reopened.max_seq_length) == (768, 512)
    assert reopened._status == Status.COMPLETED
|
|
111
|
+
|
|
112
|
+
|
|
113
|
+
def test_finetune_model_unauthenticated(unauthenticated_client, datasource: Datasource):
    """Finetuning requires a valid API key."""
    with unauthenticated_client.use(), pytest.raises(ValueError, match="Invalid API key"):
        PretrainedEmbeddingModel.DISTILBERT.finetune("test_finetuned_model_unauthenticated", datasource)
|
|
117
|
+
|
|
118
|
+
|
|
119
|
+
def test_use_finetuned_model_in_memoryset(datasource: Datasource, finetuned_model: FinetunedEmbeddingModel):
    """A finetuned model can back a newly created memoryset."""
    created = LabeledMemoryset.create(
        "test_memoryset_finetuned_model",
        datasource=datasource,
        embedding_model=finetuned_model,
    )
    assert created is not None
    assert created.name == "test_memoryset_finetuned_model"
    assert created.embedding_model == finetuned_model
    # every datasource row should have been inserted
    assert created.length == datasource.length
|
|
129
|
+
|
|
130
|
+
|
|
131
|
+
def test_open_finetuned_model(finetuned_model: FinetunedEmbeddingModel):
    """open() round-trips to an equal handle on the same model."""
    reopened = FinetunedEmbeddingModel.open(finetuned_model.name)
    assert isinstance(reopened, FinetunedEmbeddingModel)
    assert (reopened.id, reopened.name) == (finetuned_model.id, finetuned_model.name)
    assert reopened.base_model == PretrainedEmbeddingModel.DISTILBERT
    assert (reopened.embedding_dim, reopened.max_seq_length) == (768, 512)
    assert reopened == finetuned_model
|
|
140
|
+
|
|
141
|
+
|
|
142
|
+
def test_embed_finetuned_model(finetuned_model: FinetunedEmbeddingModel):
    """A finetuned model embeds text into a 768-dim float vector."""
    vector = finetuned_model.embed("I love this airline")
    assert vector is not None
    assert isinstance(vector, list)
    assert len(vector) == 768
    assert isinstance(vector[0], float)
|
|
148
|
+
|
|
149
|
+
|
|
150
|
+
def test_all_finetuned_models(finetuned_model: FinetunedEmbeddingModel):
    """all() lists the session's finetuned model."""
    listed = FinetunedEmbeddingModel.all()
    assert len(listed) > 0
    assert finetuned_model.name in {m.name for m in listed}
|
|
154
|
+
|
|
155
|
+
|
|
156
|
+
def test_all_finetuned_models_unauthenticated(unauthenticated_client):
    """Listing finetuned models requires a valid API key."""
    with unauthenticated_client.use(), pytest.raises(ValueError, match="Invalid API key"):
        FinetunedEmbeddingModel.all()
|
|
160
|
+
|
|
161
|
+
|
|
162
|
+
def test_all_finetuned_models_unauthorized(unauthorized_client, finetuned_model: FinetunedEmbeddingModel):
    """Models owned by another org are hidden from all()."""
    with unauthorized_client.use():
        listed = FinetunedEmbeddingModel.all()
        assert finetuned_model not in listed
|
|
165
|
+
|
|
166
|
+
|
|
167
|
+
def test_drop_finetuned_model(datasource: Datasource):
    """drop() removes a model so that open() no longer finds it."""
    name = "finetuned_model_to_delete"
    PretrainedEmbeddingModel.DISTILBERT.finetune(name, datasource)
    assert FinetunedEmbeddingModel.open(name)
    FinetunedEmbeddingModel.drop(name)
    with pytest.raises(LookupError):
        FinetunedEmbeddingModel.open(name)
|
|
173
|
+
|
|
174
|
+
|
|
175
|
+
def test_drop_finetuned_model_unauthenticated(unauthenticated_client, datasource: Datasource):
    """Dropping a finetuned model requires a valid API key.

    Bug fix: the original body was a copy of the finetune-unauthenticated test
    and called `finetune` instead of `drop`, so `drop`'s auth check was never
    exercised. The auth check runs before any existence lookup, mirroring the
    other unauthenticated tests in this module.
    """
    with unauthenticated_client.use():
        with pytest.raises(ValueError, match="Invalid API key"):
            FinetunedEmbeddingModel.drop("finetuned_model_to_delete")
|
|
179
|
+
|
|
180
|
+
|
|
181
|
+
def test_drop_finetuned_model_not_found():
    """Dropping an unknown id raises unless if_not_exists="ignore" is passed."""
    missing_id = str(uuid4())
    with pytest.raises(LookupError):
        FinetunedEmbeddingModel.drop(missing_id)
    # ignores error if specified
    FinetunedEmbeddingModel.drop(missing_id, if_not_exists="ignore")
|
|
186
|
+
|
|
187
|
+
|
|
188
|
+
def test_drop_finetuned_model_unauthorized(unauthorized_client, finetuned_model: FinetunedEmbeddingModel):
    """Another org cannot drop a model it does not own; it appears nonexistent."""
    with unauthorized_client.use(), pytest.raises(LookupError):
        FinetunedEmbeddingModel.drop(finetuned_model.id)
|
|
192
|
+
|
|
193
|
+
|
|
194
|
+
def test_supports_instructions():
    """Only instruction-tuned models report supports_instructions."""
    assert not PretrainedEmbeddingModel.GTE_BASE.supports_instructions
    assert PretrainedEmbeddingModel.BGE_BASE.supports_instructions
|
|
200
|
+
|
|
201
|
+
|
|
202
|
+
def test_use_explicit_instruction_prompt():
    """Passing an explicit instruction prompt changes the resulting embedding."""
    bge = PretrainedEmbeddingModel.BGE_BASE
    assert bge.supports_instructions
    text = "Hello world"
    prompted = bge.embed(text, prompt="Represent this sentence for sentiment retrieval:")
    assert prompted != bge.embed(text)
|
orca_sdk/job.py
ADDED
|
@@ -0,0 +1,343 @@
|
|
|
1
|
+
from __future__ import annotations
|
|
2
|
+
|
|
3
|
+
import time
|
|
4
|
+
from datetime import datetime, timedelta
|
|
5
|
+
from enum import Enum
|
|
6
|
+
from typing import Callable, Generic, TypedDict, TypeVar, cast
|
|
7
|
+
|
|
8
|
+
from tqdm.auto import tqdm
|
|
9
|
+
|
|
10
|
+
from .client import OrcaClient
|
|
11
|
+
|
|
12
|
+
|
|
13
|
+
class JobConfig(TypedDict):
    """Global polling configuration shared by all jobs (see Job.config / Job.set_config)."""

    # seconds to wait between polling the job status
    refresh_interval: int
    # whether Job.wait renders a tqdm progress bar
    show_progress: bool
    # maximum seconds to wait for a job before timing out
    max_wait: int
|
|
17
|
+
|
|
18
|
+
|
|
19
|
+
class Status(Enum):
    """Status of a cloud job in the job queue"""

    # the INITIALIZED state should never be returned by the API
    INITIALIZED = "INITIALIZED"
    """The job has been initialized"""

    DISPATCHED = "DISPATCHED"
    """The job has been queued and is waiting to be processed"""

    WAITING = "WAITING"
    """The job is waiting for dependencies to complete"""

    PROCESSING = "PROCESSING"
    """The job is being processed"""

    # terminal state: success
    COMPLETED = "COMPLETED"
    """The job has been completed successfully"""

    # terminal state: failure (see Job.exception for the cause)
    FAILED = "FAILED"
    """The job has failed"""

    ABORTING = "ABORTING"
    """The job is being aborted"""

    # terminal state: cancelled via Job.abort
    ABORTED = "ABORTED"
    """The job has been aborted"""
|
|
46
|
+
|
|
47
|
+
|
|
48
|
+
TResult = TypeVar("TResult")
|
|
49
|
+
|
|
50
|
+
|
|
51
|
+
class Job(Generic[TResult]):
    """
    Handle to a job that is run in the OrcaCloud

    Attributes:
        id: Unique identifier for the job
        type: Type of the job
        status: Current status of the job
        steps_total: Total number of steps in the job, present if the job started processing
        steps_completed: Number of steps completed in the job, present if the job started processing
        completion: Percentage of the job that has been completed, present if the job started processing
        exception: Exception that occurred during the job, present if the status is `FAILED`
        value: Value of the result of the job, present if the status is `COMPLETED`
        created_at: When the job was queued for processing
        updated_at: When the job was last updated
        refreshed_at: When the job status was last refreshed

    Note:
        Accessing status and related attributes will refresh the job status in the background.
    """

    id: str
    type: str
    status: Status
    steps_total: int | None
    steps_completed: int | None
    exception: str | None
    value: TResult | None
    updated_at: datetime
    created_at: datetime
    refreshed_at: datetime

    @property
    def completion(self) -> float:
        """
        Percentage of the job that has been completed, present if the job started processing
        """
        # Guard against steps_total being 0 as well as None: a zero total would
        # otherwise raise ZeroDivisionError (e.g. when __repr__ formats completion).
        if not self.steps_total:
            return 0
        return (self.steps_completed or 0) / self.steps_total

    # Global configuration for all jobs
    config: JobConfig = {
        "refresh_interval": 3,
        "show_progress": True,
        "max_wait": 60 * 60,
    }

    def __repr__(self) -> str:
        return "Job({" + f" type: {self.type}, status: {self.status}, completion: {self.completion:.0%} " + "})"

    @classmethod
    def set_config(
        cls, *, refresh_interval: int | None = None, show_progress: bool | None = None, max_wait: int | None = None
    ):
        """
        Set global configuration for running jobs

        Args:
            refresh_interval: Time to wait between polling the job status in seconds, default is 3
            show_progress: Whether to show a progress bar when calling the wait method, default is True
            max_wait: Maximum time to wait for the job to complete in seconds, default is 1 hour
        """
        if refresh_interval is not None:
            cls.config["refresh_interval"] = refresh_interval
        if show_progress is not None:
            cls.config["show_progress"] = show_progress
        if max_wait is not None:
            cls.config["max_wait"] = max_wait

    @classmethod
    def _from_api(cls, data: dict) -> Job:
        """
        Build a job handle from an API response payload without issuing any API
        calls, so `query` can materialize a whole page from a single request.
        """
        job = cls.__new__(cls)
        job.id = data["id"]
        job.type = data["type"]
        job.status = Status(data["status"])
        job.steps_total = data["steps_total"]
        job.steps_completed = data["steps_completed"]
        job.exception = data["exception"]
        job.value = cast(TResult, data["result"]) if data["result"] is not None else None
        job.updated_at = datetime.fromisoformat(data["updated_at"])
        job.created_at = datetime.fromisoformat(data["created_at"])
        job.refreshed_at = datetime.now()

        # Bug fix: jobs built by query() previously lacked _get_value, so a later
        # refresh() on a job that reached COMPLETED raised AttributeError; install
        # the same default resolver the constructor uses.
        def default_get_value() -> TResult | None:
            client = OrcaClient._resolve_client()
            return cast(TResult | None, client.GET("/job/{job_id}", params={"job_id": job.id})["result"])

        job._get_value = default_get_value
        return job

    @classmethod
    def query(
        cls,
        status: Status | list[Status] | None = None,
        type: str | list[str] | None = None,
        limit: int = 100,
        offset: int = 0,
        start: datetime | None = None,
        end: datetime | None = None,
    ) -> list[Job]:
        """
        Query the job queue for jobs matching the given filters

        Args:
            status: Optional status or list of statuses to filter by
            type: Optional type or list of types to filter by
            limit: Maximum number of jobs to return
            offset: Offset into the list of jobs to return
            start: Optional minimum creation time of the jobs to query for
            end: Optional maximum creation time of the jobs to query for

        Returns:
            List of jobs matching the given filters
        """
        client = OrcaClient._resolve_client()
        paginated_jobs = client.GET(
            "/job",
            params={
                "status": (
                    [s.value for s in status]
                    if isinstance(status, list)
                    else status.value if isinstance(status, Status) else None
                ),
                "type": type,
                "limit": limit,
                "offset": offset,
                "start_timestamp": start.isoformat() if start is not None else None,
                "end_timestamp": end.isoformat() if end is not None else None,
            },
        )

        # can't use the constructor because it makes an API call per job, so we
        # build the handles directly from the returned payloads
        return [cls._from_api(item) for item in paginated_jobs["items"]]

    def __init__(self, id: str, get_value: Callable[[], TResult | None] | None = None):
        """
        Create a handle to a job in the job queue

        Args:
            id: Unique identifier for the job
            get_value: Optional function to customize how the value is resolved, if not provided the result will be a dict
        """
        self.id = id
        client = OrcaClient._resolve_client()
        job = client.GET("/job/{job_id}", params={"job_id": id})

        def default_get_value():
            client = OrcaClient._resolve_client()
            return cast(TResult | None, client.GET("/job/{job_id}", params={"job_id": id})["result"])

        self._get_value = get_value or default_get_value
        self.type = job["type"]
        self.status = Status(job["status"])
        self.steps_total = job["steps_total"]
        self.steps_completed = job["steps_completed"]
        self.exception = job["exception"]
        self.value = (
            None
            if job["status"] != "COMPLETED"
            else (
                get_value()
                if get_value is not None
                else cast(TResult, job["result"]) if job["result"] is not None else None
            )
        )
        self.updated_at = datetime.fromisoformat(job["updated_at"])
        self.created_at = datetime.fromisoformat(job["created_at"])
        self.refreshed_at = datetime.now()

    def refresh(self, throttle: float = 0):
        """
        Refresh the status and progress of the job

        Params:
            throttle: Minimum time in seconds between refreshes
        """
        current_time = datetime.now()
        # Skip refresh if last refresh was too recent
        if (current_time - self.refreshed_at) < timedelta(seconds=throttle):
            return
        self.refreshed_at = current_time

        client = OrcaClient._resolve_client()
        status_info = client.GET("/job/{job_id}/status", params={"job_id": self.id})
        self.status = Status(status_info["status"])
        # only overwrite progress counters when the API actually reports them
        if status_info["steps_total"] is not None:
            self.steps_total = status_info["steps_total"]
        if status_info["steps_completed"] is not None:
            self.steps_completed = status_info["steps_completed"]

        self.exception = status_info["exception"]
        self.updated_at = datetime.fromisoformat(status_info["updated_at"])

        if status_info["status"] == "COMPLETED":
            self.value = self._get_value()

    def __getattribute__(self, name: str):
        # if the attribute is not immutable, refresh the job if it hasn't been refreshed recently
        if name in ["status", "updated_at", "steps_total", "steps_completed", "exception", "value"]:
            self.refresh(self.config["refresh_interval"])
        return super().__getattribute__(name)

    def wait(
        self, show_progress: bool | None = None, refresh_interval: int | None = None, max_wait: int | None = None
    ) -> None:
        """
        Block until the job is complete

        Params:
            show_progress: Show a progress bar while waiting for the job to complete
            refresh_interval: Polling interval in seconds while waiting for the job to complete
            max_wait: Maximum time to wait for the job to complete in seconds

        Note:
            The defaults for the config parameters can be set globally using the
            [`set_config`][orca_sdk.Job.set_config] method.

            This method will not return the result or raise an exception if the job fails. Call
            [`result`][orca_sdk.Job.result] instead if you want to get the result.

        Raises:
            RuntimeError: If the job times out
        """
        start_time = time.time()
        show_progress = show_progress if show_progress is not None else self.config["show_progress"]
        refresh_interval = refresh_interval if refresh_interval is not None else self.config["refresh_interval"]
        max_wait = max_wait if max_wait is not None else self.config["max_wait"]
        pbar = None
        while True:
            # setup progress bar if steps total is known
            if not pbar and self.steps_total is not None and show_progress:
                desc = " ".join(self.type.split("_")).lower()
                pbar = tqdm(total=self.steps_total, desc=desc)

            # return if job is complete
            if self.status in [Status.COMPLETED, Status.FAILED, Status.ABORTED]:
                if pbar:
                    pbar.update(self.steps_total - pbar.n)
                    pbar.close()
                return

            # raise error if job timed out
            if (time.time() - start_time) > max_wait:
                raise RuntimeError(f"Job {self.id} timed out after {max_wait}s")

            # update progress bar
            if pbar and self.steps_completed is not None:
                pbar.update(self.steps_completed - pbar.n)

            # sleep before retrying
            time.sleep(refresh_interval)

    def result(
        self, show_progress: bool | None = None, refresh_interval: int | None = None, max_wait: int | None = None
    ) -> TResult:
        """
        Block until the job is complete and return the result value

        Params:
            show_progress: Show a progress bar while waiting for the job to complete
            refresh_interval: Polling interval in seconds while waiting for the job to complete
            max_wait: Maximum time to wait for the job to complete in seconds

        Note:
            The defaults for the config parameters can be set globally using the
            [`set_config`][orca_sdk.Job.set_config] method.

            This method will raise an exception if the job fails. Use [`wait`][orca_sdk.Job.wait]
            if you just want to wait for the job to complete without raising errors on failure.

        Returns:
            The result value of the job

        Raises:
            RuntimeError: If the job fails or times out
        """
        # short-circuit: value is already resolved for completed jobs
        if self.value is not None:
            return self.value
        self.wait(show_progress, refresh_interval, max_wait)
        if self.status != Status.COMPLETED:
            raise RuntimeError(f"Job failed with exception: {self.exception}")
        assert self.value is not None
        return self.value

    def abort(self, show_progress: bool = False, refresh_interval: int = 1, max_wait: int = 20) -> None:
        """
        Abort the job

        Params:
            show_progress: Optionally show a progress bar while waiting for the job to abort
            refresh_interval: Polling interval in seconds while waiting for the job to abort
            max_wait: Maximum time to wait for the job to abort in seconds
        """
        client = OrcaClient._resolve_client()
        client.DELETE("/job/{job_id}/abort", params={"job_id": self.id})
        # block until the server confirms the job left the running states
        self.wait(show_progress, refresh_interval, max_wait)
|
orca_sdk/job_test.py
ADDED
|
@@ -0,0 +1,108 @@
|
|
|
1
|
+
import time
|
|
2
|
+
|
|
3
|
+
import pytest
|
|
4
|
+
from datasets import Dataset
|
|
5
|
+
|
|
6
|
+
from .classification_model import ClassificationModel
|
|
7
|
+
from .datasource import Datasource
|
|
8
|
+
from .job import Job, Status
|
|
9
|
+
|
|
10
|
+
|
|
11
|
+
@pytest.fixture(scope="session")
def datasource_without_nones(hf_dataset: Dataset):
    """Datasource built from hf_dataset with unlabeled rows filtered out."""
    labeled_rows = hf_dataset.filter(lambda row: row["label"] is not None)
    return Datasource.from_hf_dataset("test_datasource_without_nones", labeled_rows)
|
|
16
|
+
|
|
17
|
+
|
|
18
|
+
def wait_for_jobs_status(job_ids, expected_statuses, timeout=10, poll_interval=0.2):
    """
    Poll until every job in *job_ids* reaches one of *expected_statuses*.

    Raises:
        TimeoutError: if the jobs do not all converge within *timeout* seconds.
    """
    deadline = time.time() + timeout
    while time.time() < deadline:
        if all(Job(job_id).status in expected_statuses for job_id in job_ids):
            return
        time.sleep(poll_interval)
    raise TimeoutError(f"Jobs did not reach statuses {expected_statuses} within {timeout} seconds")
|
|
29
|
+
|
|
30
|
+
|
|
31
|
+
def test_job_creation(classification_model: ClassificationModel, datasource_without_nones: Datasource):
    """A background evaluation enqueues an EVALUATE_MODEL job with timestamps set."""
    job = classification_model.evaluate(datasource_without_nones, background=True)
    assert job.id is not None
    assert job.type == "EVALUATE_MODEL"
    assert job.status in (Status.DISPATCHED, Status.PROCESSING)
    for timestamp in (job.created_at, job.updated_at, job.refreshed_at):
        assert timestamp is not None
    assert len(Job.query(limit=5, type="EVALUATE_MODEL")) >= 1
|
|
40
|
+
|
|
41
|
+
|
|
42
|
+
def test_job_result(classification_model: ClassificationModel, datasource_without_nones: Datasource):
    """result() blocks until completion and returns a non-None value."""
    job = classification_model.evaluate(datasource_without_nones, background=True)
    outcome = job.result(show_progress=False)
    assert outcome is not None
    assert job.status == Status.COMPLETED
    assert job.steps_completed is not None
    assert job.steps_completed == job.steps_total
|
|
49
|
+
|
|
50
|
+
|
|
51
|
+
def test_job_wait(classification_model: ClassificationModel, datasource_without_nones: Datasource):
    """wait() blocks until the job completes and its value is populated."""
    job = classification_model.evaluate(datasource_without_nones, background=True)
    job.wait(show_progress=False)
    assert job.status == Status.COMPLETED
    assert job.steps_completed is not None
    assert job.steps_completed == job.steps_total
    assert job.value is not None
|
|
58
|
+
|
|
59
|
+
|
|
60
|
+
def test_job_refresh(classification_model: ClassificationModel, datasource_without_nones: Datasource):
    """Attribute access auto-refreshes after the interval; refresh() is immediate."""
    job = classification_model.evaluate(datasource_without_nones, background=True)
    before = job.refreshed_at
    # accessing the status attribute should refresh the job after the refresh interval
    Job.set_config(refresh_interval=1)
    time.sleep(1)
    job.status
    assert job.refreshed_at > before
    before = job.refreshed_at
    # calling refresh() should immediately refresh the job
    job.refresh()
    assert job.refreshed_at > before
|
|
72
|
+
|
|
73
|
+
|
|
74
|
+
def test_job_query_pagination(classification_model: ClassificationModel, datasource_without_nones: Datasource):
    """Test pagination with Job.query() method"""
    # enqueue several jobs so there is something to paginate over
    created_ids = [
        classification_model.evaluate(datasource_without_nones, background=True).id for _ in range(3)
    ]

    # Wait for jobs to be at least PROCESSING or COMPLETED
    wait_for_jobs_status(created_ids, expected_statuses=[Status.PROCESSING, Status.COMPLETED])

    # basic pagination with limit, then the same limit shifted by one
    first_page = Job.query(type="EVALUATE_MODEL", limit=2)
    assert len(first_page) == 2
    second_page = Job.query(type="EVALUATE_MODEL", limit=2, offset=1)
    assert len(second_page) == 2

    # pages overlap by one slot, so (allowing for timing) at least one id differs
    first_ids = {job.id for job in first_page}
    second_ids = {job.id for job in second_page}
    assert len(first_ids.symmetric_difference(second_ids)) > 0

    # filtering by a single status
    for job in Job.query(status=Status.PROCESSING, limit=10):
        assert job.status == Status.PROCESSING

    # filtering by multiple statuses
    for job in Job.query(status=[Status.PROCESSING, Status.COMPLETED], limit=10):
        assert job.status in [Status.PROCESSING, Status.COMPLETED]
|