lm-deluge 0.0.88__py3-none-any.whl → 0.0.90__py3-none-any.whl

This diff shows the contents of publicly released package versions as they appear in their respective public registries, and is provided for informational purposes only.

Potentially problematic release.


This version of lm-deluge might be problematic.

Files changed (41)
  1. lm_deluge/__init__.py +0 -24
  2. lm_deluge/api_requests/anthropic.py +25 -5
  3. lm_deluge/api_requests/base.py +37 -0
  4. lm_deluge/api_requests/bedrock.py +23 -2
  5. lm_deluge/api_requests/gemini.py +36 -10
  6. lm_deluge/api_requests/openai.py +31 -4
  7. lm_deluge/batches.py +15 -45
  8. lm_deluge/client.py +27 -1
  9. lm_deluge/models/__init__.py +2 -0
  10. lm_deluge/models/anthropic.py +12 -12
  11. lm_deluge/models/google.py +13 -0
  12. lm_deluge/models/minimax.py +9 -1
  13. lm_deluge/models/openrouter.py +48 -0
  14. lm_deluge/models/zai.py +50 -1
  15. lm_deluge/pipelines/gepa/docs/samples.py +19 -10
  16. lm_deluge/prompt.py +333 -68
  17. lm_deluge/server/__init__.py +24 -0
  18. lm_deluge/server/__main__.py +144 -0
  19. lm_deluge/server/adapters.py +369 -0
  20. lm_deluge/server/app.py +388 -0
  21. lm_deluge/server/auth.py +71 -0
  22. lm_deluge/server/model_policy.py +215 -0
  23. lm_deluge/server/models_anthropic.py +172 -0
  24. lm_deluge/server/models_openai.py +175 -0
  25. lm_deluge/skills/anthropic.py +0 -0
  26. lm_deluge/skills/compat.py +0 -0
  27. lm_deluge/tool/__init__.py +13 -1
  28. lm_deluge/tool/prefab/sandbox/__init__.py +19 -0
  29. lm_deluge/tool/prefab/sandbox/daytona_sandbox.py +483 -0
  30. lm_deluge/tool/prefab/sandbox/docker_sandbox.py +609 -0
  31. lm_deluge/tool/prefab/sandbox/fargate_sandbox.py +546 -0
  32. lm_deluge/tool/prefab/sandbox/modal_sandbox.py +469 -0
  33. lm_deluge/tool/prefab/sandbox/seatbelt_sandbox.py +827 -0
  34. lm_deluge/tool/prefab/skills.py +0 -0
  35. {lm_deluge-0.0.88.dist-info → lm_deluge-0.0.90.dist-info}/METADATA +4 -3
  36. {lm_deluge-0.0.88.dist-info → lm_deluge-0.0.90.dist-info}/RECORD +39 -24
  37. lm_deluge/mock_openai.py +0 -643
  38. lm_deluge/tool/prefab/sandbox.py +0 -1621
  39. {lm_deluge-0.0.88.dist-info → lm_deluge-0.0.90.dist-info}/WHEEL +0 -0
  40. {lm_deluge-0.0.88.dist-info → lm_deluge-0.0.90.dist-info}/licenses/LICENSE +0 -0
  41. {lm_deluge-0.0.88.dist-info → lm_deluge-0.0.90.dist-info}/top_level.txt +0 -0
lm_deluge/models/zai.py CHANGED
@@ -1 +1,50 @@
- ZAI_MODELS = {}
+ ZAI_MODELS = {
+     "glm-4.7": {
+         "id": "glm-4.7",
+         "name": "glm-4.7",
+         "api_base": "https://api.z.ai/api/anthropic/v1",
+         "api_key_env_var": "ZAI_API_KEY",
+         "supports_json": True,
+         "api_spec": "anthropic",
+         "input_cost": 0.6,
+         "cached_input_cost": 0.6,
+         "cache_write_cost": 0.6,
+         "output_cost": 2.20,
+     },
+     "glm-4.6": {
+         "id": "glm-4.6",
+         "name": "glm-4.6",
+         "api_base": "https://api.z.ai/api/anthropic/v1",
+         "api_key_env_var": "ZAI_API_KEY",
+         "supports_json": True,
+         "api_spec": "anthropic",
+         "input_cost": 0.6,
+         "cached_input_cost": 0.6,
+         "cache_write_cost": 0.6,
+         "output_cost": 2.20,
+     },
+     "glm-4.5": {
+         "id": "glm-4.5",
+         "name": "glm-4.5",
+         "api_base": "https://api.z.ai/api/anthropic/v1",
+         "api_key_env_var": "ZAI_API_KEY",
+         "supports_json": True,
+         "api_spec": "anthropic",
+         "input_cost": 0.6,
+         "cached_input_cost": 0.6,
+         "cache_write_cost": 0.6,
+         "output_cost": 2.20,
+     },
+     "glm-4.5-air": {
+         "id": "glm-4.5-air",
+         "name": "glm-4.5-air",
+         "api_base": "https://api.z.ai/api/anthropic/v1",
+         "api_key_env_var": "ZAI_API_KEY",
+         "supports_json": True,
+         "api_spec": "anthropic",
+         "input_cost": 0.6,
+         "cached_input_cost": 0.6,
+         "cache_write_cost": 0.6,
+         "output_cost": 2.20,
+     },
+ }
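
The new ZAI_MODELS entries register Z.ai's GLM models against their Anthropic-compatible endpoint, each declaring an api_base, api_spec, cost fields, and the ZAI_API_KEY environment variable. A minimal sketch of pointing a client at one of the new entries, assuming ZAI_API_KEY is exported and that the registry keys are accepted as model names by LLMClient (mirroring the constructor call the GEPA sample below uses for its reflection model; request-dispatch methods are not part of this diff, so only construction is shown):

    import os

    from lm_deluge.client import LLMClient

    # The registry entry above declares api_key_env_var="ZAI_API_KEY",
    # so the key must be present in the environment.
    assert os.environ.get("ZAI_API_KEY"), "export ZAI_API_KEY first"

    # "glm-4.7" is assumed to resolve through the model registry shown above;
    # requests would then target https://api.z.ai/api/anthropic/v1.
    client = LLMClient("glm-4.7", progress="tqdm")
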
lm_deluge/pipelines/gepa/docs/samples.py CHANGED
@@ -6,7 +6,11 @@ Features:
  - Selects a parent (best-by-val), mutates a single component, and accepts only if
    minibatch reward improves; accepted candidates get a full val eval and join the pool.
  - Components: system_prompt, search_docstring, fetch_docstring.
- - Rollouts are run via verifiers + MockAsyncOpenAI (lm-deluge-backed); reflection uses LLMClient.
+ - Rollouts are run via verifiers + OpenAI SDK (pointing to lm-deluge proxy server); reflection uses LLMClient.
+
+ Prerequisites:
+   Start the lm-deluge proxy server first:
+     python -m lm_deluge.server --port 8000

  Run:
    uv run python gepa_lm_deluge_full.py --corpus-file ... --queries-file ... --env-file ...
@@ -31,8 +35,9 @@ from fts_bench import ( # type: ignore
  )
  from verifiers.utils.tool_utils import convert_func_to_oai_tool # type: ignore

- from lm_deluge.client import LLMClient, _LLMClient # type: ignore
- from lm_deluge.mock_openai import MockAsyncOpenAI # type: ignore
+ from openai import AsyncOpenAI # type: ignore
+
+ from lm_deluge.client import LLMClient # type: ignore
  from lm_deluge.util.json import try_load_json # type: ignore

  # ---------------------- Helpers ---------------------- #
@@ -362,7 +367,12 @@ def parse_args() -> argparse.Namespace:
      parser.add_argument(
          "--model",
          default="claude-5-mini",
-         help="Model for rollouts via MockAsyncOpenAI.",
+         help="Model for rollouts via lm-deluge proxy server.",
+     )
+     parser.add_argument(
+         "--proxy-url",
+         default="http://localhost:8000/v1",
+         help="URL of the lm-deluge proxy server.",
      )
      parser.add_argument(
          "--reflection-model",
@@ -437,7 +447,8 @@ def main() -> None:
      val_records = [val_ds[i] for i in range(len(val_ds))]
      question_key = _question_key_from_records(train_records or val_records) # noqa

-     rollout_client = MockAsyncOpenAI(model=args.model)
+     # Create OpenAI client pointing to lm-deluge proxy server
+     rollout_client = AsyncOpenAI(base_url=args.proxy_url, api_key="not-needed")
      reflection_client = LLMClient(args.reflection_model, progress="tqdm")

      seed_candidate = {
@@ -478,11 +489,9 @@ def main() -> None:
      merges_tested = 0
      frontier = compute_val_frontier(population)

-     def print_rollout_usage(rollout_client: MockAsyncOpenAI):
-         key = list(rollout_client._clients.keys())[0]
-         client_obj: _LLMClient = rollout_client._clients[key]
-         print("Rollout client usage:")
-         client_obj.print_usage()
+     def print_rollout_usage(rollout_client: AsyncOpenAI):
+         # Usage tracking not available via proxy - would need server-side tracking
+         print("Rollout client: using lm-deluge proxy server")

      for it in range(1, args.iterations + 1):
          print(f"=== Starting iteration {it} ===")