PyPI - coderouter-cli - Versions diffs - 1.8.1__py3-none-any.whl → 1.8.3__py3-none-any.whl - Mend

coderouter-cli 1.8.1__py3-none-any.whl → 1.8.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (8) hide show

coderouter/adapters/openai_compat.py CHANGED Viewed

@@ -48,14 +48,25 @@ logger = get_logger(__name__)
 _RETRYABLE_STATUSES = {404, 408, 425, 429, 500, 502, 503, 504}
+# v1.8.3: non-standard reasoning fields emitted by various upstreams.
+# Different runtimes use different field names for the same concept:
+#   * ``reasoning``         — OpenRouter free models (gpt-oss-120b:free
+#                             confirmed 2026-04-20), Ollama
+#   * ``reasoning_content`` — llama.cpp ``llama-server`` (Qwen3.6 etc.,
+#                             confirmed 2026-04-26 with Unsloth GGUF)
+# Strict OpenAI clients reject either as an unknown key. The strip
+# function below removes both at the adapter boundary so downstream
+# layers never see them, regardless of which runtime fronts the model.
+_NON_STANDARD_REASONING_KEYS = ("reasoning", "reasoning_content")
 def _strip_reasoning_field(choices: list[dict[str, Any]] | None, *, delta_key: bool) -> bool:
-    """Remove non-standard ``reasoning`` keys from a choices list, in place.
+    """Remove non-standard reasoning keys from a choices list, in place.
-    v0.5-C: Some OpenRouter free models (confirmed on
-    ``openai/gpt-oss-120b:free`` 2026-04-20) return a ``reasoning`` field
-    alongside ``content`` on each choice. The field is not in the OpenAI
-    Chat Completions spec and strict clients can reject the unknown key.
-    We strip it at the adapter boundary so downstream layers never see it.
+    v0.5-C originally targeted OpenRouter's ``reasoning`` field. v1.8.3
+    extends the strip to ``reasoning_content`` (llama.cpp ``llama-server``
+    naming) since both denote the same hidden chain-of-thought trace and
+    neither is part of the OpenAI Chat Completions spec.
     Args:
         choices: The ``choices`` list from the response body or stream chunk.
@@ -64,7 +75,7 @@ def _strip_reasoning_field(choices: list[dict[str, Any]] | None, *, delta_key: b
             ``False`` for non-streaming responses (look in ``choice["message"]``).
     Returns:
-        True iff at least one ``reasoning`` key was removed. Callers use
+        True iff at least one reasoning key was removed. Callers use
         this to decide whether to emit a one-shot log line.
     """
     if not choices:
@@ -75,9 +86,12 @@ def _strip_reasoning_field(choices: list[dict[str, Any]] | None, *, delta_key: b
         if not isinstance(choice, dict):
             continue
         inner = choice.get(inner_key)
-        if isinstance(inner, dict) and "reasoning" in inner:
-            inner.pop("reasoning", None)
-            stripped = True
+        if not isinstance(inner, dict):
+            continue
+        for key in _NON_STANDARD_REASONING_KEYS:
+            if key in inner:
+                inner.pop(key, None)
+                stripped = True
     return stripped
@@ -235,15 +249,17 @@ class OpenAICompatAdapter(BaseAdapter):
                 retryable=False,
             ) from exc
-        # v0.5-C: passive strip of non-standard `reasoning` field on choices.
-        # No-op when the provider opted into passthrough.
+        # v0.5-C / v1.8.3: passive strip of non-standard reasoning fields
+        # on choices (covers both Ollama/OpenRouter ``reasoning`` and
+        # llama.cpp ``reasoning_content``). No-op when the provider opted
+        # into passthrough.
         if not self.config.capabilities.reasoning_passthrough and _strip_reasoning_field(
             data.get("choices"), delta_key=False
         ):
             log_capability_degraded(
                 logger,
                 provider=self.name,
-                dropped=["reasoning"],
+                dropped=list(_NON_STANDARD_REASONING_KEYS),
                 reason="non-standard-field",
             )
@@ -344,7 +360,7 @@ class OpenAICompatAdapter(BaseAdapter):
                             log_capability_degraded(
                                 logger,
                                 provider=self.name,
-                                dropped=["reasoning"],
+                                dropped=list(_NON_STANDARD_REASONING_KEYS),
                                 reason="non-standard-field",
                             )
                             reasoning_logged = True

coderouter/data/model-capabilities.yaml CHANGED Viewed

@@ -176,47 +176,59 @@ rules:
   # 「Claude Code 代替として最高」「local champ」と評価されている。
   #
   # ただし v1.8.0 までで `claude_code_suitability: ok` を declare していた
-  # のは note 記事の伝聞ベースの先回り宣言で、v1.8.1 (2026-04-26) の
-  # 実機検証 (M3 Max 32GB / Ollama 0.21.2) で次の課題が判明:
-  #   - num_ctx を declare 32768 しても Ollama 側で silent に縮められる
-  #     (canary echo-back probe 失敗)
+  # のは note 記事の伝聞ベースの先回り宣言で、v1.8.1 〜 v1.8.2
+  # (2026-04-26) の実機検証 (M3 Max 64GB / Ollama 0.21.2) で:
+  #   - num_ctx と streaming の NEEDS_TUNING は v1.8.2 で thinking モデル
+  #     用 probe バジェット拡大により偽陽性と判明 (doctor 側の課題)
   #   - tool_calls probe が native tool_calls / 修復可能 JSON のいずれも
-  #     返さず NEEDS_TUNING
-  #   - streaming probe が finish_reason='length' で 0 chars 打ち切り
-  # これらは Ollama 経由特有の問題で、HF / vLLM 直接ロードなら違う可能性。
-  # 確証ない以上、`claude_code_suitability` は撤回し `tools` 宣言だけ残す。
+  #     返さない真の課題が残る (Qwen3.6 系の Ollama 経由 tool 仕様未成熟)
+  # tool_calls 不全が解消されるまで `claude_code_suitability` は撤回。
   # 実機で動いたユーザーは `~/.coderouter/model-capabilities.yaml` で
   # `claude_code_suitability: ok` を上書きできる。
   # ------------------------------------------------------------------
+  # v1.8.2: thinking: true は doctor probe (num_ctx / streaming) が reasoning
+  # トークン消費分の max_tokens 余裕を確保するためのヒント。Qwen3 系は
+  # /think モードで thinking トークンを吐く設計なので true 宣言。
   - match: "qwen3.6:*"
     kind: openai_compat
     capabilities:
       tools: true
+      thinking: true
   - match: "qwen/qwen3.6-*"
     kind: openai_compat
     capabilities:
       tools: true
+      thinking: true
   # ------------------------------------------------------------------
-  # Gemma 4 family (v1.7-B 追加)
+  # Gemma 4 family (v1.7-B 追加、v1.8.2 で thinking: true 宣言)
   #
   # Google 公式 Gemma 4。Ollama 公式 tag は gemma4:e2b / e4b / 26b / 31b、
   # 全 variant が tools+vision+thinking 対応、E2B/E4B は audio もサポート。
   # MoE (26b は active 3.8B / total 25.2B)。note 記事で「日常・バランスの
   # 王者」と評価。Claude Haiku 互換性に近い簡潔な応答スタイル。
+  #
+  # v1.8.2 (2026-04-26): 実機検証 (M3 Max 64GB / Ollama 0.21.2 / gemma4:26b)
+  # で `reasoning` フィールドにかなりの量のトークンを吐く thinking モデル
+  # と確認。doctor probe の max_tokens=32 / 128 が thinking トークンに
+  # 食い切られて偽陽性 NEEDS_TUNING を出していた。registry で
+  # `thinking: true` を宣言すると doctor が probe バジェットを 1024 まで
+  # 引き上げて偽陽性を回避する。
   # ------------------------------------------------------------------
   - match: "gemma4:*"
     kind: openai_compat
     capabilities:
       tools: true
+      thinking: true
   - match: "google/gemma-4*"
     kind: openai_compat
     capabilities:
       tools: true
+      thinking: true
   # ------------------------------------------------------------------
   # GLM family (Z.AI / Zhipu AI、v1.7-B 追加)

coderouter/doctor.py CHANGED Viewed

@@ -433,6 +433,43 @@ _STREAMING_PROBE_USER_PROMPT = (
 # truncated". "1\n2\n...\n30" is ~80 chars; 40 chars covers the halfway
 # mark (1..20) which is already obviously-truncated territory.
 _STREAMING_PROBE_MIN_EXPECTED_CHARS = 40
+# v1.8.2: probe response budgets.
+#
+# Both num_ctx and streaming probes ask the model for a *short* answer
+# (the canary token / "1..30"). The original budgets (32 / 128 tokens)
+# assumed a non-thinking model that emits the answer immediately. On a
+# thinking model — Gemma 4 26B, Qwen3.6, gpt-oss, deepseek-r1 — the
+# upstream burns the entire budget on a hidden ``reasoning`` field
+# *before* emitting any visible ``content``, producing a false-positive
+# NEEDS_TUNING (canary missing / 0 chars streamed). Bumping the budget
+# is the cleanest fix: non-thinking models stop early at their natural
+# stop token (no waste), thinking models get headroom for the reasoning
+# trace plus the actual answer.
+#
+# Numbers picked from the v1.8.1 reality-check session
+# (docs/articles/note-v1-8-1-reality-check.md):
+#   * Gemma 4 26B reasoning prefix observed at ~150-300 tokens before
+#     content starts → 1024 covers reasoning + 30-line count comfortably.
+#   * Non-thinking baseline kept conservative-but-non-tight (256/512) to
+#     absorb stylistic preambles ("Sure, the answer is...") without
+#     burning extra cloud quota when the operator probes a paid endpoint.
+_NUM_CTX_PROBE_MAX_TOKENS_DEFAULT = 256
+_NUM_CTX_PROBE_MAX_TOKENS_THINKING = 1024
+_STREAMING_PROBE_MAX_TOKENS_DEFAULT = 512
+_STREAMING_PROBE_MAX_TOKENS_THINKING = 1024
+# v1.8.3: tool_calls probe also needs thinking-aware budget. The
+# pre-v1.8.3 default of 64 was tight even for non-thinking models
+# (the assistant often emits a brief preamble before the JSON tool
+# call), and on thinking models (Qwen3.6, Gemma 4, gpt-oss, deepseek-r1)
+# the entire 64-token budget gets consumed by ``reasoning_content``
+# before any ``tool_calls`` can surface — producing a false-positive
+# NEEDS_TUNING with the WRONG remediation (suggested patch flips
+# ``tools`` to false even though the model supports them perfectly).
+# 256/1024 brings the budget into line with the num_ctx / streaming
+# probes (same _is_reasoning_model gate).
+_TOOL_CALLS_PROBE_MAX_TOKENS_DEFAULT = 256
+_TOOL_CALLS_PROBE_MAX_TOKENS_THINKING = 1024
 # Default ``num_predict`` suggested in the emitted patch. -1 would be
 # optimal (uncapped) but "4096" communicates intent more clearly to
 # operators unfamiliar with Ollama's sentinel value, and covers Claude
@@ -475,6 +512,40 @@ def _declared_num_ctx(provider: ProviderConfig) -> int | None:
     return val if isinstance(val, int) else None
+def _is_reasoning_model(
+    provider: ProviderConfig, resolved: ResolvedCapabilities
+) -> bool:
+    """v1.8.2: True iff the model is known to emit a hidden reasoning trace.
+    Thinking models (Gemma 4, Qwen3-with-/think, gpt-oss, deepseek-r1,
+    Claude Sonnet 4.5+ in extended-thinking mode) burn output tokens on a
+    ``reasoning`` field before any visible ``content`` is produced. The
+    num_ctx / streaming probes use small response budgets that get fully
+    consumed by the reasoning prefix, producing a false-positive
+    NEEDS_TUNING. Callers use this to choose a generous probe budget.
+    Three signals fire:
+      * provider declared ``capabilities.thinking: true`` in providers.yaml
+      * provider declared ``capabilities.reasoning_passthrough: true``
+        (the operator opted in to passing the raw reasoning to the client,
+        which is only meaningful for models that emit it)
+      * registry resolved ``thinking: true`` for this (kind, model) pair
+    Conservative bias — when both provider declaration and registry are
+    silent, treat as non-reasoning. The probe still completes for thinking
+    models in that case (they just hit ``finish_reason='length'`` like
+    they did pre-v1.8.2), but at least the new generous default budget
+    (256 / 512) gives more headroom than the old 32 / 128.
+    """
+    if provider.capabilities.thinking is True:
+        return True
+    if provider.capabilities.reasoning_passthrough is True:
+        return True
+    if resolved.thinking is True:
+        return True
+    return resolved.reasoning_passthrough is True
 _PROBE_BASIC_USER_PROMPT = "Reply with exactly the single word: PONG"
 _PROBE_TOOLS_USER_PROMPT = (
     "You have one tool named `echo`. Call it with the argument "
@@ -617,7 +688,9 @@ def _extract_openai_assistant_choice(
     return msg if isinstance(msg, dict) else None
-async def _probe_num_ctx(provider: ProviderConfig) -> ProbeResult:
+async def _probe_num_ctx(
+    provider: ProviderConfig, resolved: ResolvedCapabilities
+) -> ProbeResult:
     """v1.0-B Probe — direct detection of Ollama ``num_ctx`` truncation.
     Addresses plan.md §9.4 symptom #1 (空応答 / 意味不明応答). Prior to
@@ -683,11 +756,21 @@ async def _probe_num_ctx(provider: ProviderConfig) -> ProbeResult:
     # whatever ``options.num_ctx`` the operator has declared. Request
     # fields win over extra_body, matching the adapter's merge order.
     body: dict[str, Any] = dict(provider.extra_body)
+    # v1.8.2: thinking models burn output tokens on a hidden ``reasoning``
+    # trace before emitting any ``content``. The pre-v1.8.2 default of 32
+    # was tight for any preamble at all; on Gemma 4 26B it caused
+    # ``finish_reason='length'`` with content="" before the canary could
+    # surface, producing a false-positive NEEDS_TUNING.
+    max_tokens = (
+        _NUM_CTX_PROBE_MAX_TOKENS_THINKING
+        if _is_reasoning_model(provider, resolved)
+        else _NUM_CTX_PROBE_MAX_TOKENS_DEFAULT
+    )
     body.update(
         {
             "model": provider.model,
             "messages": [{"role": "user", "content": user_prompt}],
-            "max_tokens": 32,
+            "max_tokens": max_tokens,
             "temperature": 0,
         }
     )
@@ -799,7 +882,9 @@ async def _probe_num_ctx(provider: ProviderConfig) -> ProbeResult:
     )
-async def _probe_streaming(provider: ProviderConfig) -> ProbeResult:
+async def _probe_streaming(
+    provider: ProviderConfig, resolved: ResolvedCapabilities
+) -> ProbeResult:
     """v1.0-C Probe — streaming completion path integrity.
     Addresses plan.md §9.4 symptom #1 from the **output** side. The v1.0-B
@@ -868,11 +953,18 @@ async def _probe_streaming(provider: ProviderConfig) -> ProbeResult:
     # probing. Top-level probe fields win on collision, matching adapter
     # merge order.
     body: dict[str, Any] = dict(provider.extra_body)
+    # v1.8.2: same thinking-model rationale as num_ctx probe — give
+    # reasoning a budget so the visible content has a chance to surface.
+    max_tokens = (
+        _STREAMING_PROBE_MAX_TOKENS_THINKING
+        if _is_reasoning_model(provider, resolved)
+        else _STREAMING_PROBE_MAX_TOKENS_DEFAULT
+    )
     body.update(
         {
             "model": provider.model,
             "messages": [{"role": "user", "content": _STREAMING_PROBE_USER_PROMPT}],
-            "max_tokens": 128,
+            "max_tokens": max_tokens,
             "temperature": 0,
             "stream": True,
         }
@@ -1011,6 +1103,16 @@ async def _probe_tool_calls(
           If declaration says True → NEEDS_TUNING (flip to False). If
           False → OK.
     """
+    # v1.8.3: thinking-aware budget — the pre-v1.8.3 default of 64 was
+    # consumed by ``reasoning_content`` on thinking models (Qwen3.6,
+    # Gemma 4, gpt-oss, deepseek-r1) before any ``tool_calls`` could
+    # surface, producing a false-positive NEEDS_TUNING that recommended
+    # flipping ``tools`` to false — the exact opposite of what's needed.
+    max_tokens = (
+        _TOOL_CALLS_PROBE_MAX_TOKENS_THINKING
+        if _is_reasoning_model(provider, resolved)
+        else _TOOL_CALLS_PROBE_MAX_TOKENS_DEFAULT
+    )
     if provider.kind == "anthropic":
         # Anthropic native tools use a different wire shape; we probe
         # via the messages API. A capable model returns content blocks
@@ -1022,7 +1124,7 @@ async def _probe_tool_calls(
             "messages": [
                 {"role": "user", "content": _PROBE_TOOLS_USER_PROMPT},
             ],
-            "max_tokens": 64,
+            "max_tokens": max_tokens,
             "tools": [_PROBE_TOOL_SPEC_ANTHROPIC],
         }
     else:
@@ -1033,7 +1135,7 @@ async def _probe_tool_calls(
             "messages": [
                 {"role": "user", "content": _PROBE_TOOLS_USER_PROMPT},
             ],
-            "max_tokens": 64,
+            "max_tokens": max_tokens,
             "temperature": 0,
             "tools": [_PROBE_TOOL_SPEC_OPENAI],
         }
@@ -1357,7 +1459,12 @@ async def _probe_reasoning_leak(
         )
     msg = _extract_openai_assistant_choice(parsed)
-    has_reasoning = bool(msg and "reasoning" in msg)
+    # v1.8.3: detect llama.cpp's ``reasoning_content`` alongside Ollama /
+    # OpenRouter's ``reasoning`` — they're the same concept under different
+    # field names, and the openai_compat adapter strips both since v1.8.3.
+    has_reasoning = bool(
+        msg and ("reasoning" in msg or "reasoning_content" in msg)
+    )
     # v1.0-A: content-embedded marker detection.
     content = (msg.get("content") if isinstance(msg, dict) else None) or ""
@@ -1506,11 +1613,11 @@ async def check_model(
     # declaration probes (tool_calls / thinking / reasoning-leak) should
     # dominate the report — streaming is the output-side sibling of
     # num_ctx and its NEEDS_TUNING verdict is orthogonal to the others.
-    report.results.append(await _probe_num_ctx(provider))
+    report.results.append(await _probe_num_ctx(provider, resolved))
     report.results.append(await _probe_tool_calls(provider, resolved))
     report.results.append(await _probe_thinking(provider, resolved))
     report.results.append(await _probe_reasoning_leak(provider, resolved))
-    report.results.append(await _probe_streaming(provider))
+    report.results.append(await _probe_streaming(provider, resolved))
     return report

{coderouter_cli-1.8.1.dist-info → coderouter_cli-1.8.3.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: coderouter-cli
-Version: 1.8.1
+Version: 1.8.3
 Summary: Local-first, free-first, fallback-built-in LLM router. Claude Code / OpenAI compatible.
 Project-URL: Homepage, https://github.com/zephel01/CodeRouter
 Project-URL: Repository, https://github.com/zephel01/CodeRouter
@@ -60,7 +60,7 @@ Description-Content-Type: text/markdown
 <p align="center">
   <a href="https://github.com/zephel01/CodeRouter/actions/workflows/ci.yml"><img src="https://github.com/zephel01/CodeRouter/actions/workflows/ci.yml/badge.svg?branch=main" alt="CI"></a>
   <a href=""><img src="https://img.shields.io/badge/status-stable-brightgreen" alt="status"></a>
-  <a href=""><img src="https://img.shields.io/badge/version-1.8.0-blue" alt="version"></a>
+  <a href=""><img src="https://img.shields.io/badge/version-1.8.3-blue" alt="version"></a>
   <a href=""><img src="https://img.shields.io/badge/python-3.12%2B-blue" alt="python"></a>
   <a href=""><img src="https://img.shields.io/badge/runtime%20deps-5-brightgreen" alt="deps"></a>
   <a href=""><img src="https://img.shields.io/badge/license-MIT-yellow" alt="license"></a>
@@ -100,7 +100,7 @@ Description-Content-Type: text/markdown
 | **要るか判断する** | [要否判定ガイド](./docs/when-do-i-need-coderouter.md) | エージェント × モデルの詳細マトリクスで「そもそも自分に必要か」を決める |
 | **詰まったとき** | [トラブルシューティング](./docs/troubleshooting.md) | `doctor` の使い方、`.env` の export 必須、Ollama サイレント失敗 5 症状、Claude Code 連携の罠 |
 | **安全に使う** | [セキュリティ方針](./docs/security.md) | 脅威モデル・秘密情報の扱い・脆弱性報告経路 |
-| **履歴** | [CHANGELOG](./CHANGELOG.md) | 全リリース履歴（最新: v1.8.0 — 用途別 4 プロファイル + GLM/Gemma 4/Qwen3.6 公式化 + apply 自動化） |
+| **履歴** | [CHANGELOG](./CHANGELOG.md) | 全リリース履歴（最新: v1.8.3 — tool_calls probe も thinking 対応 + adapter で `reasoning_content` strip / llama.cpp 直叩き対応） |
 | **設計を追う** | [plan.md](./plan.md) | 設計不変項・マイルストーン・今後のロードマップ |
 English versions: [Quickstart](./docs/quickstart.en.md) · [Usage guide](./docs/usage-guide.en.md) · [Free-tier guide](./docs/free-tier-guide.en.md) · [When you need it](./docs/when-do-i-need-coderouter.en.md) · [Troubleshooting](./docs/troubleshooting.en.md) · [Security](./docs/security.en.md)
@@ -175,7 +175,7 @@ OpenAI 互換エージェント + お行儀の良いモデル + フォールバ
 ## クイックスタート（3 コマンド）
-**v1.7.0 で PyPI 公開**、**v1.8.0 で用途別 4 プロファイル + Z.AI/GLM 連携**を追加しました。`uvx` 一発で動きます (Python 3.12 以上必須):
+**v1.7.0 で PyPI 公開**、**v1.8.0 で用途別 4 プロファイル + Z.AI/GLM 連携**を追加、**v1.8.2 で doctor probe を thinking モデル対応**にしました。`uvx` 一発で動きます (Python 3.12 以上必須):
 ```bash
 # 1. サンプル設定を置く
@@ -205,7 +205,7 @@ uv run coderouter serve --port 8088
 > **注**: PyPI 上のパッケージ名は `coderouter-cli` ですが、コマンド名と Python import 名は `coderouter` のままです。詳しくは [CHANGELOG `[v1.7.0]`](./CHANGELOG.md#v170--2026-04-25-pypi-公開-uvx-coderouter-cli-一発で動く) 参照。
 >
-> **v1.8.0 の `--apply` 自動化を使う場合**: `ruamel.yaml` を optional dep として一緒に入れます (`pip install 'coderouter-cli[doctor]'` または `uv pip install ruamel.yaml`)。基本機能には不要です。
+> **`--apply` 自動化を使う場合** (v1.8.0+): `ruamel.yaml` を optional dep として一緒に入れます (`pip install 'coderouter-cli[doctor]'` または `uv pip install ruamel.yaml`)。基本機能には不要です。
 あとは任意の OpenAI クライアントを `http://127.0.0.1:8088` に向けるだけです:

{coderouter_cli-1.8.1.dist-info → coderouter_cli-1.8.3.dist-info}/RECORD RENAMED Viewed

@@ -2,7 +2,7 @@ coderouter/__init__.py,sha256=ghdjPrLtnRzY8fyQ4CJZI1UJKADyNTLtA3G7se8H7Ns,696
 coderouter/__main__.py,sha256=-LCgxJnvgUV240HjQKv7ly-mn2NuKHpC4nCpvTHjeSU,130
 coderouter/cli.py,sha256=vI1-dv10t4-xG6Zpt7zi_3U8xGgq54Qa8XIMUYpfOV8,19859
 coderouter/cli_stats.py,sha256=ae20xUr_hjX09Ms3fBZGZsUS52o44JC57EpbWLBOCO0,27750
-coderouter/doctor.py,sha256=Uf4R1t2-50hRx6UpV9UBe_UeiJ2UYBg7e7zkPUHegWE,64217
+coderouter/doctor.py,sha256=F6f9vl99KTGgCja6N9w_QlDIFFCEqY0mxoAhKEI5yTI,69643
 coderouter/doctor_apply.py,sha256=r_J6xbu5-HivofPNriw4_vjNYs_VRs7GsGTS0oMEX10,24209
 coderouter/env_security.py,sha256=FEBZnXfJ0xE39kmMMn39zk0W_DRRnmcB_REmP9f4xWo,14796
 coderouter/errors.py,sha256=Xmq67lheyw8iv3Ox39jh2c4tvNI5RcUR4QkoxVDN6l4,1130
@@ -11,7 +11,7 @@ coderouter/output_filters.py,sha256=rI4YgKVv5vviDBl3Xkf7rp6LaSSkdWyEV004q6HrkB0,
 coderouter/adapters/__init__.py,sha256=7dIDSZ-FE_0iSqLSDc_lK1idRdLTKcM2hP9tCJipgPI,463
 coderouter/adapters/anthropic_native.py,sha256=qfdjxy4YyLt-0Fj7hUYn1oi1SFjEEbSvpaRBUC2hMf4,21903
 coderouter/adapters/base.py,sha256=H4uM6r_-95Xs1hCM_X4Zv3tq-xN3cXWLj83F-QjPNLw,8265
-coderouter/adapters/openai_compat.py,sha256=EC9zNYPGgSOVZyaH1dXRXO1VMN1RjBX5FZ2vEgTkVD8,17100
+coderouter/adapters/openai_compat.py,sha256=9qoJfLR2vVnyM8isb9G4j-Dk5QBHFlneOaBSY-P4UAg,17941
 coderouter/adapters/registry.py,sha256=Syt3eDljWZAK5mfiJGvUMKaZYAfCRScp7PvV6pYt7mc,683
 coderouter/config/__init__.py,sha256=FODEn74fN-qZnt4INPSHswqhOlEgpL6-_onxsitSx8g,274
 coderouter/config/capability_registry.py,sha256=oypl6Z-YjvNoC87AdSIm1C7XE_MZoFq_7Ivm3eRH3cI,14379
@@ -19,7 +19,7 @@ coderouter/config/env_file.py,sha256=CoMK27fuAXm-NtoLzXb8yN2E-wDFjHQuFwiIlmgTBQw
 coderouter/config/loader.py,sha256=FUEe8m4Tnmj_aul0vSctD8vKvNW-oLRoMRbTpSKqSmc,4077
 coderouter/config/schemas.py,sha256=NMWKstAzDKc6DT7qKr-GKlUFrsfE4HtEG7zkz9Pnq78,21597
 coderouter/data/__init__.py,sha256=uNyfD9jaCvTWsBAWtaw1Fr25OSxzv3psGMfBjT1z0Cc,328
-coderouter/data/model-capabilities.yaml,sha256=8g11ysbjEwt9Rc9Q9o4VCA0de2RmnH-mJEbnsueET_A,13949
+coderouter/data/model-capabilities.yaml,sha256=9f9CDIoWBJYtppMRh1BOS8FzRKzICV4uT-uANovGmzs,14718
 coderouter/ingress/__init__.py,sha256=WQsCH2CGJCAhy0mS6GSEdeYZRkkQu2OHDsP4CJWTLug,155
 coderouter/ingress/anthropic_routes.py,sha256=vuylsn7klFN-Dz3cBS7LrhnnSRGr6agipgMrr9gxq7k,8261
 coderouter/ingress/app.py,sha256=b9s6NpBGckaTQJCaw-6MZaY7Eq3rxgtX_cCkgWq-0Ig,6620
@@ -37,8 +37,8 @@ coderouter/translation/__init__.py,sha256=PYXN7XVEwpG1uC8RLy6fvnGbzEZhhrEuUapH8I
 coderouter/translation/anthropic.py,sha256=JpvIWNXHUPVqOGvps7o_6ZADhXuJuvpU7RdMqQFtwwM,6421
 coderouter/translation/convert.py,sha256=-qyzFzmmr9hhQV6_Sg75kJnvCZvHe3n7vRdaZtk_JqQ,47269
 coderouter/translation/tool_repair.py,sha256=fyxDb4kWHytO5JWq5y0i4tinJUtWqhMCkyfoCf5BjeM,8314
-coderouter_cli-1.8.1.dist-info/METADATA,sha256=sb0tldZ1vqseJCuO-oExjVXwnmOslwQt9MN9Rh5PVS8,44136
-coderouter_cli-1.8.1.dist-info/WHEEL,sha256=QccIxa26bgl1E6uMy58deGWi-0aeIkkangHcxk2kWfw,87
-coderouter_cli-1.8.1.dist-info/entry_points.txt,sha256=-dnLfD1YZ2WjH2zSdNCvlO65wYltM9bsHt9Fhg3yGss,51
-coderouter_cli-1.8.1.dist-info/licenses/LICENSE,sha256=wkEzoR86jFw33jvfOHjULqmkGEfxTFMgMaJnpR8mPRw,1065
-coderouter_cli-1.8.1.dist-info/RECORD,,
+coderouter_cli-1.8.3.dist-info/METADATA,sha256=Nm6kOVjXop9D5aISl3H0OcH-gi4fkGT0fmhuyoKTcHU,44221
+coderouter_cli-1.8.3.dist-info/WHEEL,sha256=QccIxa26bgl1E6uMy58deGWi-0aeIkkangHcxk2kWfw,87
+coderouter_cli-1.8.3.dist-info/entry_points.txt,sha256=-dnLfD1YZ2WjH2zSdNCvlO65wYltM9bsHt9Fhg3yGss,51
+coderouter_cli-1.8.3.dist-info/licenses/LICENSE,sha256=wkEzoR86jFw33jvfOHjULqmkGEfxTFMgMaJnpR8mPRw,1065
+coderouter_cli-1.8.3.dist-info/RECORD,,

{coderouter_cli-1.8.1.dist-info → coderouter_cli-1.8.3.dist-info}/WHEEL RENAMED Viewed

File without changes

{coderouter_cli-1.8.1.dist-info → coderouter_cli-1.8.3.dist-info}/entry_points.txt RENAMED Viewed

File without changes

{coderouter_cli-1.8.1.dist-info → coderouter_cli-1.8.3.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

coderouter-cli 1.8.1__py3-none-any.whl → 1.8.3__py3-none-any.whl

coderouter-cli 1.8.1__py3-none-any.whl → 1.8.3__py3-none-any.whl