PyPI - argo-proxy - Versions diffs - 3.0.2__tar.gz → 3.0.4__tar.gz - Mend

argo-proxy 3.0.2__tar.gz → 3.0.4__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (75) hide show

{argo_proxy-3.0.2/src/argo_proxy.egg-info → argo_proxy-3.0.4}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: argo-proxy
-Version: 3.0.2
+Version: 3.0.4
 Summary: Proxy server to Argo API, OpenAI format compatible
 Author-email: Peng Ding <oaklight@gmx.com>
 License-Expression: MIT

{argo_proxy-3.0.2 → argo_proxy-3.0.4/src/argo_proxy.egg-info}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: argo-proxy
-Version: 3.0.2
+Version: 3.0.4
 Summary: Proxy server to Argo API, OpenAI format compatible
 Author-email: Peng Ding <oaklight@gmx.com>
 License-Expression: MIT

argo_proxy-3.0.4/src/argoproxy/__init__.py ADDED Viewed

	@@ -0,0 +1 @@
1	+ __version__ = "3.0.4"

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/endpoints/dispatch.py RENAMED Viewed

@@ -1025,6 +1025,7 @@ async def _convert_non_streaming(
     _ensure_user_field(target_body, config.user)
     _downgrade_developer_role(target_body)
     _normalize_null_content(target_body)
+    _normalize_thinking_for_upstream(target_body)
     _debug_dump("2_request_converted", target_body, config)
     # Log the converted body
@@ -1146,6 +1147,7 @@ async def _convert_buffered_streaming(
     _ensure_user_field(target_body, config.user)
     _downgrade_developer_role(target_body)
     _normalize_null_content(target_body)
+    _normalize_thinking_for_upstream(target_body)
     # 3. Inject stream flags and update headers for streaming
     target_body = _inject_stream_flags(target_body, target_provider)
@@ -1317,6 +1319,7 @@ async def _convert_streaming(
     _ensure_user_field(target_body, config.user)
     _downgrade_developer_role(target_body)
     _normalize_null_content(target_body)
+    _normalize_thinking_for_upstream(target_body)
     format_sse = _SSE_FORMATTERS[source_provider]

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/utils/transports.py RENAMED Viewed

@@ -131,15 +131,20 @@ async def validate_api_async(
     raise ValueError("API validation failed after all attempts")
-async def _fetch_first_model(
+async def _fetch_validation_models(
     models_url: str,
     timeout: int = 5,
     resolver_overrides: dict[str, str] | None = None,
-) -> str | None:
-    """Fetch the first available model ID from an OpenAI-compatible ``/models`` endpoint.
+) -> list[str]:
+    """Fetch candidate model IDs for validation from an OpenAI-compatible
+    ``/models`` endpoint.
+    Returns a list of model ID strings sorted by preference: lightweight
+    models (nano, mini) come first to minimise token cost during validation.
+    Embedding-only models are excluded because they cannot serve chat requests.
     Returns:
-        A model ID string, or None if the request fails.
+        Sorted list of model IDs, or empty list if the request fails.
     """
     from ..performance import StaticOverrideResolver
@@ -155,15 +160,39 @@ async def _fetch_first_model(
         ) as session:
             async with session.get(models_url) as resp:
                 if resp.status != 200:
-                    return None
+                    return []
                 data = await resp.json()
                 models = data.get("data", [])
-                if models:
-                    m = models[0]
-                    return m.get("internal_id") or m.get("id")
     except Exception:
-        pass
-    return None
+        return []
+    # Filter out embedding models (they can't serve chat completions)
+    _EMBEDDING_KEYWORDS = {"embedding", "ada", "v3small", "v3large"}
+    chat_models = []
+    for m in models:
+        iid = (m.get("internal_id") or m.get("id") or "").lower()
+        display_id = (m.get("id") or "").lower()
+        if any(kw in iid or kw in display_id for kw in _EMBEDDING_KEYWORDS):
+            continue
+        chat_models.append(m)
+    # Sort: nano first (cheapest), then mini, then others
+    def _sort_key(m: dict) -> int:
+        iid = (m.get("internal_id") or m.get("id") or "").lower()
+        if "nano" in iid:
+            return 0
+        if "mini" in iid:
+            return 1
+        return 2
+    chat_models.sort(key=_sort_key)
+    result: list[str] = []
+    for m in chat_models:
+        model_id = m.get("internal_id") or m.get("id")
+        if model_id:
+            result.append(model_id)
+    return result
 async def validate_user_async(
@@ -196,57 +225,71 @@ async def validate_user_async(
     from ..performance import StaticOverrideResolver
     from .misc import contains_argo_auth_warning, extract_text_from_response
-    # Auto-detect a valid model name from the upstream
+    # Auto-detect valid model names from the upstream, sorted by preference
     models_url = chat_url.rsplit("/chat/completions", 1)[0] + "/models"
-    model = await _fetch_first_model(
+    candidate_models = await _fetch_validation_models(
         models_url, timeout=timeout, resolver_overrides=resolver_overrides
     )
-    if not model:
-        model = "gpt-4o-latest"  # fallback
-    payload = {
-        "model": model,
-        "messages": [{"role": "user", "content": "say ok"}],
-        "user": user,
-        "max_tokens": 5,
-    }
-    connector = None
-    if resolver_overrides:
-        resolver = StaticOverrideResolver(resolver_overrides)
-        connector = aiohttp.TCPConnector(resolver=resolver)
+    if not candidate_models:
+        candidate_models = ["gpt41nano"]  # lightweight fallback
     client_timeout = aiohttp.ClientTimeout(total=timeout)
     last_err: Exception | None = None
-    for attempt in range(attempts + 1):
-        try:
-            async with aiohttp.ClientSession(
-                connector=connector,
-                timeout=client_timeout,
-            ) as session:
-                async with session.post(
-                    chat_url,
-                    json=payload,
-                    headers={
-                        "Content-Type": "application/json",
-                        "Authorization": f"Bearer {user}",
-                    },
-                ) as response:
-                    if response.status != 200:
-                        raise ValueError(f"API returned status code {response.status}")
-                    data = await response.json()
-                    text = extract_text_from_response(data, "openai")
-                    return not contains_argo_auth_warning(text)
-        except Exception as e:
-            last_err = e
-            if attempt < attempts:
-                await asyncio.sleep(0.5)
-            if resolver_overrides and attempt < attempts:
-                resolver = StaticOverrideResolver(resolver_overrides)
-                connector = aiohttp.TCPConnector(resolver=resolver)
-            else:
-                connector = None
+    for model in candidate_models:
+        payload = {
+            "model": model,
+            "messages": [{"role": "user", "content": "say ok"}],
+            "user": user,
+            "max_tokens": 5,
+        }
+        connector = None
+        if resolver_overrides:
+            resolver = StaticOverrideResolver(resolver_overrides)
+            connector = aiohttp.TCPConnector(resolver=resolver)
+        for attempt in range(attempts + 1):
+            try:
+                async with aiohttp.ClientSession(
+                    connector=connector,
+                    timeout=client_timeout,
+                ) as session:
+                    async with session.post(
+                        chat_url,
+                        json=payload,
+                        headers={
+                            "Content-Type": "application/json",
+                            "Authorization": f"Bearer {user}",
+                        },
+                    ) as response:
+                        if response.status == 400:
+                            # Model rejected — try the next candidate
+                            body = await response.json()
+                            err_code = (
+                                body.get("error", {}).get("code", "")
+                                if isinstance(body, dict)
+                                else ""
+                            )
+                            if err_code == "model_not_found":
+                                last_err = ValueError(f"Model '{model}' not accepted")
+                                break  # skip to next model
+                        if response.status != 200:
+                            raise ValueError(
+                                f"API returned status code {response.status}"
+                            )
+                        data = await response.json()
+                        text = extract_text_from_response(data, "openai")
+                        return not contains_argo_auth_warning(text)
+            except Exception as e:
+                last_err = e
+                if attempt < attempts:
+                    await asyncio.sleep(0.5)
+                if resolver_overrides and attempt < attempts:
+                    resolver = StaticOverrideResolver(resolver_overrides)
+                    connector = aiohttp.TCPConnector(resolver=resolver)
+                else:
+                    connector = None
     if last_err is not None:
         raise last_err

argo_proxy-3.0.2/src/argoproxy/__init__.py DELETED Viewed

	@@ -1 +0,0 @@
1	- __version__ = "3.0.2"

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/LICENSE RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/README.md RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/pyproject.toml RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/setup.cfg RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argo_proxy.egg-info/SOURCES.txt RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argo_proxy.egg-info/dependency_links.txt RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argo_proxy.egg-info/entry_points.txt RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argo_proxy.egg-info/requires.txt RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argo_proxy.egg-info/top_level.txt RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_legacy/__init__.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_legacy/endpoints/__init__.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_legacy/endpoints/chat.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_legacy/endpoints/completions.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_legacy/endpoints/embed.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_legacy/endpoints/native_anthropic.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_legacy/endpoints/native_openai.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_legacy/endpoints/responses.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_legacy/tool_calls/deprecated.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_legacy/tool_calls/google_helpers.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_legacy/tool_calls/handler.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_legacy/tool_calls/input_handle.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_legacy/tool_calls/leaked_tool_parser.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_legacy/tool_calls/output_handle.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_legacy/tool_calls/tool_prompts.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_legacy/types/__init__.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_legacy/types/chat_completion.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_legacy/types/completions.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_legacy/types/embedding.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_legacy/types/function_call.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_legacy/types/responses.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_legacy/utils/__init__.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_legacy/utils/input_handle.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_legacy/utils/models.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_legacy/utils/stream_decoder.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_legacy/utils/tokens.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_legacy/utils/usage.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_vendor/__init__.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_vendor/semver.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/_vendor/yaml.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/app.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/cli/__init__.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/cli/display.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/cli/handlers.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/cli/parser.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/config/__init__.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/config/interactive.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/config/io.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/config/model.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/config/validation.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/endpoints/dev_proxy.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/endpoints/extras.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/endpoints/passthrough.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/models.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/performance.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/py.typed RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/utils/attack_logger.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/utils/image_processing.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/utils/logging.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/utils/misc.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/utils/models.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/src/argoproxy/utils/tool_calls.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/test/test_chat_completions.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/test/test_embeddings.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/test/test_function_calling_multiple.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/test/test_function_calling_single.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/test/test_leaked_tool_parser.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/test/test_legacy_completions.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/test/test_model_resolution.py RENAMED Viewed

File without changes

{argo_proxy-3.0.2 → argo_proxy-3.0.4}/tests/test_config_migrate.py RENAMED Viewed

File without changes

argo-proxy 3.0.2__tar.gz → 3.0.4__tar.gz

argo-proxy 3.0.2__tar.gz → 3.0.4__tar.gz