PyPI - driftless - Versions diffs - 0.2.7__tar.gz → 0.2.9__tar.gz - Mend

driftless 0.2.7.tar.gz → 0.2.9.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (89) hide show

{driftless-0.2.7 → driftless-0.2.9}/CHANGELOG.md RENAMED Viewed

@@ -17,6 +17,27 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 ---
+## [0.2.9] - 2026-07-01
+### Added
+- **P5.2 endpoint concurrency** — optional `run.endpoint_concurrency` (1–32,
+  default 1) runs endpoint POSTs in parallel via `ThreadPoolExecutor`; output
+  line order always matches the input file.
+---
+## [0.2.8] - 2026-07-01
+### Added
+- **P1.1 provider model discovery** — `tools/fetch_provider_models.py` queries
+  OpenAI and Anthropic `/models` APIs and emits new catalog entries only (never
+  overwrites lifecycle on existing ids). The scheduled `refresh-catalog.yml`
+  job merges discoveries when API keys are configured.
+---
 ## [0.2.7] - 2026-07-01
 ### Added
@@ -153,9 +174,9 @@ First public release on [PyPI](https://pypi.org/project/driftless/0.1.0/).
 - **Docs** — project overview, repair algorithm spec, 2×2 migration methodology,
   Poetry + Dependabot product framing.
-[Unreleased]: https://github.com/driftless-dev/driftless/compare/v0.2.7...HEAD
-[0.2.7]: https://github.com/driftless-dev/driftless/releases/tag/v0.2.7
-[0.2.6]: https://github.com/driftless-dev/driftless/compare/v0.2.6...v0.2.7
+[Unreleased]: https://github.com/driftless-dev/driftless/compare/v0.2.9...HEAD
+[0.2.9]: https://github.com/driftless-dev/driftless/releases/tag/v0.2.9
+[0.2.8]: https://github.com/driftless-dev/driftless/compare/v0.2.8...v0.2.9
 [0.2.4]: https://github.com/driftless-dev/driftless/compare/v0.2.4...v0.2.5
 [0.2.3]: https://github.com/driftless-dev/driftless/compare/v0.2.3...v0.2.4
 [0.2.2]: https://github.com/driftless-dev/driftless/compare/v0.2.2...v0.2.3

{driftless-0.2.7 → driftless-0.2.9}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: driftless
-Version: 0.2.7
+Version: 0.2.9
 Summary: Keep prompts in sync when model or eval data changes — Poetry-style lock regeneration, Dependabot-style PRs.
 Project-URL: Homepage, https://github.com/driftless-dev/driftless
 Project-URL: Repository, https://github.com/driftless-dev/driftless
@@ -133,7 +133,7 @@ can run in CI. See `.github/workflows/` for a scheduled deprecation scan, weekly
 `plan --act` triage, and manually-triggered migration workflows.
 ```yaml
-- uses: driftless-dev/driftless@v0.2.7
+- uses: driftless-dev/driftless@v0.2.9
   with:
     command: scan
 ```

{driftless-0.2.7 → driftless-0.2.9}/README.md RENAMED Viewed

@@ -94,7 +94,7 @@ can run in CI. See `.github/workflows/` for a scheduled deprecation scan, weekly
 `plan --act` triage, and manually-triggered migration workflows.
 ```yaml
-- uses: driftless-dev/driftless@v0.2.7
+- uses: driftless-dev/driftless@v0.2.9
   with:
     command: scan
 ```

{driftless-0.2.7 → driftless-0.2.9}/docs/RELEASE.md RENAMED Viewed

@@ -153,7 +153,7 @@ After a release, users can pin the composite Action by release tag
 (`action.yml` lives at the repo root — no `/action` path segment):
 ```yaml
-- uses: driftless-dev/driftless@v0.2.7
+- uses: driftless-dev/driftless@v0.2.9
   with:
     command: scan
 ```
@@ -161,9 +161,9 @@ After a release, users can pin the composite Action by release tag
 Or pin the PyPI package in the Action input:
 ```yaml
-- uses: driftless-dev/driftless@v0.2.7
+- uses: driftless-dev/driftless@v0.2.9
   with:
-    version: "==0.2.7"
+    version: "==0.2.9"
     command: migrate
 ```
@@ -171,7 +171,7 @@ Optionally maintain a floating **`v1`** tag on the latest stable minor release
 (point it at the current release tag after each publish):
 ```bash
-git tag -f v1 v0.2.7 && git push origin v1 --force
+git tag -f v1 v0.2.9 && git push origin v1 --force
 ```
 Update [`action.yml`](../action.yml) default `version` input when cutting releases.

{driftless-0.2.7 → driftless-0.2.9}/site/docs.html RENAMED Viewed

@@ -428,7 +428,7 @@ driftless view -w support_classifier</code></pre>
     <span class="tok-k">runs-on</span>: ubuntu-latest
     <span class="tok-k">steps</span>:
       - <span class="tok-k">uses</span>: actions/checkout@v4
-      - <span class="tok-k">uses</span>: driftless-dev/driftless@v0.2.7
+      - <span class="tok-k">uses</span>: driftless-dev/driftless@v0.2.9
         <span class="tok-k">with</span>:
           <span class="tok-k">command</span>: <span class="tok-s">plan</span></code></pre>
         <p>A scheduled <code class="inline">plan</code> gates CI when a deprecated model needs attention; a manually-triggered <code class="inline">migrate</code> opens a PR (or an issue when blocked) with the evidence attached.</p>

{driftless-0.2.7 → driftless-0.2.9}/src/driftless/__init__.py RENAMED Viewed

@@ -1,3 +1,3 @@
 """driftless: Dependabot for LLM models."""
-__version__ = "0.2.7"
+__version__ = "0.2.9"

{driftless-0.2.7 → driftless-0.2.9}/src/driftless/contract.py RENAMED Viewed

@@ -68,6 +68,9 @@ class RunSpec(StrictModel):
     # the shell runner, which uses ``{{ model }}`` substitution / env_var).
     model_param: str | None = None
     timeout_seconds: int = 1800
+    # For endpoints: max parallel POSTs (1 = sequential). Output order always
+    # matches input order regardless of completion order.
+    endpoint_concurrency: int = 1
     @field_validator("command", "endpoint")
     @classmethod
@@ -76,6 +79,13 @@ class RunSpec(StrictModel):
             raise ValueError("must not be blank")
         return v
+    @field_validator("endpoint_concurrency")
+    @classmethod
+    def _endpoint_concurrency_range(cls, v: int) -> int:
+        if v < 1 or v > 32:
+            raise ValueError("run.endpoint_concurrency must be between 1 and 32")
+        return v
     @model_validator(mode="after")
     def _one_runner(self) -> "RunSpec":
         if not self.command and not self.endpoint:

{driftless-0.2.7 → driftless-0.2.9}/src/driftless/harness.py RENAMED Viewed

@@ -16,6 +16,7 @@ import sys
 import time
 import urllib.error
 import urllib.request
+from concurrent.futures import ThreadPoolExecutor
 from dataclasses import dataclass, field
 from pathlib import Path
@@ -198,6 +199,52 @@ def _read_jsonl(path: Path) -> list[dict]:
     return records
+def _endpoint_post_record(
+    index: int,
+    rec: dict,
+    *,
+    endpoint: str,
+    model: str,
+    model_param: str,
+    headers: dict[str, str],
+    timeout: float,
+    id_field: str | None,
+) -> str:
+    """POST one input record and return the output JSONL line."""
+    body = dict(rec)
+    body[model_param] = model
+    try:
+        text = _http_post(
+            endpoint, json.dumps(body).encode("utf-8"), headers, timeout
+        )
+    except urllib.error.HTTPError as exc:
+        raise HarnessError(
+            f"endpoint returned HTTP {exc.code} on record {index}",
+            hint=_tail(exc.read().decode("utf-8", "replace")) if exc.fp else str(exc),
+        ) from exc
+    except (urllib.error.URLError, TimeoutError, OSError) as exc:
+        raise HarnessError(
+            f"endpoint request failed on record {index}: {endpoint}",
+            hint=str(getattr(exc, "reason", exc)),
+        ) from exc
+    try:
+        obj = json.loads(text)
+    except json.JSONDecodeError as exc:
+        raise HarnessError(
+            f"endpoint returned non-JSON on record {index}",
+            hint=_tail(text) or "expected a JSON object per record",
+        ) from exc
+    if not isinstance(obj, dict):
+        raise HarnessError(
+            f"endpoint response on record {index} must be a JSON object",
+            hint=f"got {type(obj).__name__}",
+        )
+    if id_field and id_field not in obj and id_field in rec:
+        obj[id_field] = rec[id_field]
+    return json.dumps(obj)
 def _run_endpoint(
     workflow: Workflow, model: str, *, cwd: Path, output_path: Path
 ) -> RunResult:
@@ -207,7 +254,8 @@ def _run_endpoint(
     ``run.model_param`` (default ``"model"``); the JSON response object is written
     as the corresponding output record. When ``eval.id_field`` is set and the
     response omits it, the input's id is copied through so output<->label
-    alignment still works.
+    alignment still works. Use ``run.endpoint_concurrency`` (>1) to POST in
+    parallel; output line order always matches the input file.
     """
     run = workflow.run
     input_path = (cwd / run.input_path).resolve()
@@ -225,48 +273,39 @@ def _run_endpoint(
     if token:
         headers["Authorization"] = f"Bearer {token}"
-    out_lines: list[str] = []
+    endpoint = run.endpoint
+    if endpoint is None:
+        raise HarnessError(
+            "no endpoint URL is configured",
+            hint="set run.endpoint in the contract",
+        )
+    concurrency = run.endpoint_concurrency
+    timeout = float(run.timeout_seconds)
     start = time.monotonic()
-    for i, rec in enumerate(records, start=1):
-        body = dict(rec)
-        body[model_param] = model
-        endpoint = run.endpoint
-        if endpoint is None:
-            raise HarnessError(
-                "no endpoint URL is configured",
-                hint="set run.endpoint in the contract",
-            )
-        try:
-            text = _http_post(
-                endpoint, json.dumps(body).encode("utf-8"), headers, run.timeout_seconds
-            )
-        except urllib.error.HTTPError as exc:
-            raise HarnessError(
-                f"endpoint returned HTTP {exc.code} on record {i}",
-                hint=_tail(exc.read().decode("utf-8", "replace")) if exc.fp else str(exc),
-            ) from exc
-        except (urllib.error.URLError, TimeoutError, OSError) as exc:
-            raise HarnessError(
-                f"endpoint request failed on record {i}: {run.endpoint}",
-                hint=str(getattr(exc, "reason", exc)),
-            ) from exc
-        try:
-            obj = json.loads(text)
-        except json.JSONDecodeError as exc:
-            raise HarnessError(
-                f"endpoint returned non-JSON on record {i}",
-                hint=_tail(text) or "expected a JSON object per record",
-            ) from exc
-        if not isinstance(obj, dict):
-            raise HarnessError(
-                f"endpoint response on record {i} must be a JSON object",
-                hint=f"got {type(obj).__name__}",
-            )
-        if id_field and id_field not in obj and id_field in rec:
-            obj[id_field] = rec[id_field]
-        out_lines.append(json.dumps(obj))
+    def post_one(index: int, rec: dict) -> tuple[int, str]:
+        line = _endpoint_post_record(
+            index,
+            rec,
+            endpoint=endpoint,
+            model=model,
+            model_param=model_param,
+            headers=headers,
+            timeout=timeout,
+            id_field=id_field,
+        )
+        return index, line
+    if concurrency <= 1 or len(records) <= 1:
+        indexed_lines = [post_one(i, rec) for i, rec in enumerate(records, start=1)]
+    else:
+        workers = min(concurrency, len(records))
+        pairs = [(i, rec) for i, rec in enumerate(records, start=1)]
+        with ThreadPoolExecutor(max_workers=workers) as pool:
+            indexed_lines = list(pool.map(lambda pair: post_one(pair[0], pair[1]), pairs))
+    out_lines = [line for _, line in indexed_lines]
     duration = time.monotonic() - start
     output_path.write_text("\n".join(out_lines) + "\n", encoding="utf-8")
     return RunResult(
@@ -274,7 +313,7 @@ def _run_endpoint(
         output_path=output_path,
         returncode=0,
         duration_seconds=duration,
-        stdout=f"{len(out_lines)} records via {run.endpoint}",
+        stdout=f"{len(out_lines)} records via {endpoint} (concurrency={concurrency})",
         stderr="",
         env_overrides={},
     )

{driftless-0.2.7 → driftless-0.2.9}/tests/test_endpoint.py RENAMED Viewed

@@ -118,3 +118,48 @@ def test_run_rejects_both_command_and_endpoint():
         RunSpec.model_validate(
             {"command": "echo hi", "endpoint": "http://x", "input_path": "i", "output_path": "o"}
         )
+def test_endpoint_concurrency_must_be_in_range():
+    with pytest.raises(ValueError, match="endpoint_concurrency"):
+        RunSpec.model_validate(
+            {
+                "endpoint": "http://x",
+                "input_path": "i",
+                "output_path": "o",
+                "endpoint_concurrency": 0,
+            }
+        )
+def test_endpoint_concurrency_preserves_order_and_parallelizes(tmp_path, monkeypatch):
+    import threading
+    import time
+    records = [{"id": str(i), "text": "x"} for i in range(8)]
+    _write_inputs(tmp_path, records)
+    lock = threading.Lock()
+    in_flight = 0
+    max_in_flight = 0
+    def fake_post(url, payload, headers, timeout):
+        nonlocal in_flight, max_in_flight
+        body = json.loads(payload.decode("utf-8"))
+        with lock:
+            in_flight += 1
+            max_in_flight = max(max_in_flight, in_flight)
+        time.sleep(0.03)
+        with lock:
+            in_flight -= 1
+        return json.dumps({"id": body["id"], "label": "ok"})
+    monkeypatch.setattr(harness, "_http_post", fake_post)
+    result = run_workflow(
+        _endpoint_workflow(endpoint_concurrency=4), "m1", cwd=tmp_path
+    )
+    assert result.ok
+    assert max_in_flight >= 3
+    rows = _read_out(result.output_path)
+    assert [r["id"] for r in rows] == [str(i) for i in range(8)]
+    assert "concurrency=4" in result.stdout

driftless-0.2.9/tests/test_fetch_provider_models.py ADDED Viewed

@@ -0,0 +1,111 @@
+import json
+import sys
+from pathlib import Path
+import pytest
+sys.path.insert(0, str(Path(__file__).resolve().parent.parent / "tools"))
+import fetch_provider_models as fpm  # noqa: E402
+def _catalog(models) -> Path:
+    import tempfile
+    p = Path(tempfile.mkdtemp()) / "cat.json"
+    p.write_text(json.dumps({"models": models}), encoding="utf-8")
+    return p
+def test_discover_new_models_skips_known_and_filters_openai(tmp_path):
+    cat = _catalog(
+        [
+            {"model": "gpt-4o", "provider": "openai"},
+            {"model": "claude-3-5-sonnet", "provider": "anthropic"},
+        ]
+    )
+    def fake_fetch(_key):
+        return [
+            "gpt-4o",  # known
+            "gpt-5-mini",  # new
+            "ft:gpt-4o:org:123",  # fine-tune — skip
+            "tts-1",  # infra — skip
+            "whisper-1",
+        ]
+    updates = fpm.discover_new_models(
+        provider="openai",
+        catalog_path=cat,
+        fetch_ids=fake_fetch,
+        keep=fpm._keep_openai,
+        api_key="k",
+    )
+    assert [u["model"] for u in updates] == ["gpt-5-mini"]
+    assert updates[0]["status"] == "active"
+def test_discover_new_models_anthropic_claude_only(tmp_path):
+    cat = _catalog([{"model": "claude-3-5-sonnet", "provider": "anthropic"}])
+    updates = fpm.discover_new_models(
+        provider="anthropic",
+        catalog_path=cat,
+        fetch_ids=lambda _k: ["claude-3-5-sonnet", "claude-3-7-sonnet", "not-a-model"],
+        keep=fpm._keep_anthropic,
+        api_key="k",
+    )
+    assert [u["model"] for u in updates] == ["claude-3-7-sonnet"]
+def test_fetch_updates_merges_providers_and_skips_missing_keys(tmp_path, monkeypatch):
+    cat = _catalog([{"model": "gpt-4o", "provider": "openai"}])
+    monkeypatch.delenv("OPENAI_API_KEY", raising=False)
+    monkeypatch.delenv("ANTHROPIC_API_KEY", raising=False)
+    updates = fpm.fetch_updates(["openai", "anthropic"], catalog_path=cat)
+    assert updates == []
+def test_fetch_updates_openai(monkeypatch, tmp_path):
+    cat = _catalog([{"model": "gpt-4o", "provider": "openai"}])
+    monkeypatch.setenv("OPENAI_API_KEY", "sekret")
+    monkeypatch.setattr(
+        fpm,
+        "_openai_model_ids",
+        lambda key: (["gpt-4o", "o3-mini"] if key == "sekret" else []),
+    )
+    updates = fpm.fetch_updates(["openai"], catalog_path=cat)
+    assert [u["model"] for u in updates] == ["o3-mini"]
+def test_cli_writes_output(tmp_path, monkeypatch):
+    cat = tmp_path / "cat.json"
+    cat.write_text(json.dumps({"models": []}), encoding="utf-8")
+    out = tmp_path / "updates.json"
+    monkeypatch.setattr(
+        fpm,
+        "fetch_updates",
+        lambda providers, catalog_path: [
+            {"model": "gpt-5", "provider": "openai", "status": "active"}
+        ],
+    )
+    assert fpm.main(["--provider", "openai", "--catalog", str(cat), "-o", str(out)]) == 0
+    data = json.loads(out.read_text(encoding="utf-8"))
+    assert data[0]["model"] == "gpt-5"
+def test_http_get_json_raises_on_http_error(monkeypatch):
+    import urllib.error
+    class FakeHTTPError(urllib.error.HTTPError):
+        def __init__(self):
+            super().__init__(url="http://x", code=401, msg="nope", hdrs={}, fp=None)
+    def boom(*a, **k):
+        raise FakeHTTPError()
+    monkeypatch.setattr(fpm.urllib.request, "urlopen", boom)
+    with pytest.raises(RuntimeError, match="HTTP 401"):
+        fpm._http_get_json("http://x", {})