PyPI - cat-stack - Versions diffs - 1.6.1__tar.gz → 1.6.2__tar.gz - Mend

cat-stack 1.6.1__tar.gz → 1.6.2__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (44) hide show

{cat_stack-1.6.1 → cat_stack-1.6.2}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: cat-stack
-Version: 1.6.1
+Version: 1.6.2
 Summary: Domain-agnostic text, image, PDF, and DOCX classification engine powered by LLMs
 Project-URL: Documentation, https://github.com/chrissoria/cat-stack#readme
 Project-URL: Issues, https://github.com/chrissoria/cat-stack/issues

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/__about__.py RENAMED Viewed

@@ -1,7 +1,7 @@
 # SPDX-FileCopyrightText: 2025-present Christopher Soria <chrissoria@berkeley.edu>
 #
 # SPDX-License-Identifier: GPL-3.0-or-later
-__version__ = "1.6.1"
+__version__ = "1.6.2"
 __author__ = "Chris Soria"
 __email__ = "chrissoria@berkeley.edu"
 __title__ = "cat-stack"

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/_providers.py RENAMED Viewed

@@ -59,6 +59,26 @@ def _openai_reasoning_effort_floor(model: str) -> str:
             return floor
     return "minimal"
+# ---------------------------------------------------------------------------
+# HuggingFace `chat_template_kwargs={"enable_thinking": False}` is the knob
+# to suppress Qwen3-family `<think>` blocks. Other model families don't
+# expose an `enable_thinking` template variable, and strict HF backends
+# (Fireworks, Groq) reject the unknown field with 400 — forcing a wasted
+# retry. Restrict injection to families that actually honor the flag.
+#
+# The runtime fallback in `complete()` (strip-on-400) stays as a safety
+# net for unexpected cases — e.g. if a Qwen variant lands on a router
+# whose validator doesn't accept the field.
+# ---------------------------------------------------------------------------
+_HF_NEEDS_ENABLE_THINKING_OFF = (
+    "Qwen/Qwen3",   # covers Qwen3, Qwen3.5, Qwen3.6, …
+)
+def _hf_model_needs_enable_thinking_off(model: str) -> bool:
+    return any(model.startswith(p) for p in _HF_NEEDS_ENABLE_THINKING_OFF)
 __all__ = [
     # Main client
     "UnifiedLLMClient",
@@ -449,9 +469,20 @@ class UnifiedLLMClient:
         elif creativity is not None:
             payload["temperature"] = creativity
-        # HuggingFace: disable thinking for models that reason by default (e.g., Qwen3)
-        # when thinking_budget is explicitly set to 0
-        if self.provider in ("huggingface", "huggingface-together") and thinking_budget is not None and thinking_budget == 0:
+        # HuggingFace: disable thinking on model families whose chat
+        # template honors `enable_thinking` (Qwen3-family). Other HF-routed
+        # models don't need the kwarg, and strict-validator backends
+        # (Fireworks, Groq) reject the unknown field outright — sending it
+        # to a non-Qwen model just buys a wasted retry. See
+        # `_hf_model_needs_enable_thinking_off()`. The runtime fallback in
+        # `complete()` still strips on 400 if a router rejects the kwarg
+        # even for a model we expected to support it.
+        if (
+            self.provider in ("huggingface", "huggingface-together")
+            and thinking_budget is not None
+            and thinking_budget == 0
+            and _hf_model_needs_enable_thinking_off(self.model)
+        ):
             payload["chat_template_kwargs"] = {"enable_thinking": False}
         return payload

{cat_stack-1.6.1 → cat_stack-1.6.2}/.gitignore RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/LICENSE RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/README.md RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/pyproject.toml RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/cat_stack/__init__.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/__init__.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/_batch.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/_category_analysis.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/_chunked.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/_embeddings.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/_formatter.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/_pilot_test.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/_prompts.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/_review_ui.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/_tiebreaker.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/_utils.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/_web_fetch.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/_wrapper_helpers.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/calls/CoVe.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/calls/__init__.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/calls/image_CoVe.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/calls/image_stepback.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/calls/pdf_CoVe.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/calls/pdf_stepback.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/calls/stepback.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/calls/top_n.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/classify.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/explore.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/extract.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/image_functions.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/images/circle.png RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/images/cube.png RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/images/diamond.png RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/images/overlapping_pentagons.png RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/images/rectangles.png RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/model_reference_list.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/pdf_functions.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/prompt_tune.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/summarize.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/text_functions.py RENAMED Viewed

File without changes

{cat_stack-1.6.1 → cat_stack-1.6.2}/src/catstack/text_functions_ensemble.py RENAMED Viewed

File without changes

cat-stack 1.6.1__tar.gz → 1.6.2__tar.gz

cat-stack 1.6.1__tar.gz → 1.6.2__tar.gz