abstractcore 2.6.9__py3-none-any.whl → 2.9.1__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- abstractcore/apps/summarizer.py +69 -27
- abstractcore/architectures/detection.py +190 -25
- abstractcore/assets/architecture_formats.json +129 -6
- abstractcore/assets/model_capabilities.json +803 -141
- abstractcore/config/main.py +2 -2
- abstractcore/config/manager.py +3 -1
- abstractcore/events/__init__.py +7 -1
- abstractcore/mcp/__init__.py +30 -0
- abstractcore/mcp/client.py +213 -0
- abstractcore/mcp/factory.py +64 -0
- abstractcore/mcp/naming.py +28 -0
- abstractcore/mcp/stdio_client.py +336 -0
- abstractcore/mcp/tool_source.py +164 -0
- abstractcore/processing/__init__.py +2 -2
- abstractcore/processing/basic_deepsearch.py +1 -1
- abstractcore/processing/basic_summarizer.py +379 -93
- abstractcore/providers/anthropic_provider.py +91 -10
- abstractcore/providers/base.py +540 -16
- abstractcore/providers/huggingface_provider.py +17 -8
- abstractcore/providers/lmstudio_provider.py +170 -25
- abstractcore/providers/mlx_provider.py +13 -10
- abstractcore/providers/ollama_provider.py +42 -26
- abstractcore/providers/openai_compatible_provider.py +87 -22
- abstractcore/providers/openai_provider.py +12 -9
- abstractcore/providers/streaming.py +201 -39
- abstractcore/providers/vllm_provider.py +78 -21
- abstractcore/server/app.py +116 -30
- abstractcore/structured/retry.py +20 -7
- abstractcore/tools/__init__.py +46 -24
- abstractcore/tools/abstractignore.py +166 -0
- abstractcore/tools/arg_canonicalizer.py +61 -0
- abstractcore/tools/common_tools.py +2443 -742
- abstractcore/tools/core.py +109 -13
- abstractcore/tools/handler.py +17 -3
- abstractcore/tools/parser.py +894 -159
- abstractcore/tools/registry.py +122 -18
- abstractcore/tools/syntax_rewriter.py +68 -6
- abstractcore/tools/tag_rewriter.py +186 -1
- abstractcore/utils/jsonish.py +111 -0
- abstractcore/utils/version.py +1 -1
- {abstractcore-2.6.9.dist-info → abstractcore-2.9.1.dist-info}/METADATA +56 -2
- {abstractcore-2.6.9.dist-info → abstractcore-2.9.1.dist-info}/RECORD +46 -37
- {abstractcore-2.6.9.dist-info → abstractcore-2.9.1.dist-info}/WHEEL +0 -0
- {abstractcore-2.6.9.dist-info → abstractcore-2.9.1.dist-info}/entry_points.txt +0 -0
- {abstractcore-2.6.9.dist-info → abstractcore-2.9.1.dist-info}/licenses/LICENSE +0 -0
- {abstractcore-2.6.9.dist-info → abstractcore-2.9.1.dist-info}/top_level.txt +0 -0
abstractcore/apps/summarizer.py
CHANGED

@@ -6,23 +6,39 @@ Usage:
     python -m abstractcore.apps.summarizer <file_path> [options]

 Options:
-    --style <style>
-    --length <length>
-    --focus <focus>
-    --output <output>
-    --chunk-size <size>
-    --provider <provider>
-    --model <model>
-    --max-tokens <tokens> Maximum total tokens for LLM context (default:
-
-
-    --
+    --style <style>                    Summary style (structured, narrative, objective, analytical, executive, conversational)
+    --length <length>                  Summary length (brief, standard, detailed, comprehensive)
+    --focus <focus>                    Specific focus area for summarization
+    --output <output>                  Output file path (optional, prints to console if not provided)
+    --chunk-size <size>                Chunk size in characters (default: 8000, max: 32000)
+    --provider <provider>              LLM provider (requires --model)
+    --model <model>                    LLM model (requires --provider)
+    --max-tokens <tokens|auto>         Maximum total tokens for LLM context (default: auto)
+                                       - 'auto' or -1: Uses model's full context window
+                                       - Specific number: Hard limit for deployment constraint (GPU/RAM)
+    --max-output-tokens <tokens|auto>  Maximum tokens for LLM output (default: auto)
+    --verbose                          Show detailed progress information
+    --help                             Show this help message
+
+Memory Management:
+    --max-tokens controls token budget:
+    - Use 'auto' (default): Automatically uses model's full capability
+    - Use specific value: Hard limit for memory-constrained environments (e.g., --max-tokens 16000)
+
+    Example: 8GB GPU → --max-tokens 16000, 16GB GPU → --max-tokens 32000

 Examples:
+    # Auto mode (uses model's full capability)
     python -m abstractcore.apps.summarizer document.pdf
-
-
-    python -m abstractcore.apps.summarizer
+
+    # Memory-constrained (8GB GPU)
+    python -m abstractcore.apps.summarizer report.txt --max-tokens 16000
+
+    # Large document with specific style
+    python -m abstractcore.apps.summarizer data.md --style executive --length brief
+
+    # Custom model with hard limit
+    python -m abstractcore.apps.summarizer large.txt --provider openai --model gpt-4o-mini --max-tokens 24000
 """

 import argparse

@@ -239,16 +255,14 @@ Default model setup:

     parser.add_argument(
         '--max-tokens',
-
-        default
-        help='Maximum total tokens for LLM context (default: 32000)'
+        default='auto',
+        help='Maximum total tokens for LLM context (default: auto). Use "auto" or -1 for model\'s full capability, or specific number for hard limit (e.g., 16000 for 8GB GPU)'
     )

     parser.add_argument(
         '--max-output-tokens',
-
-        default
-        help='Maximum tokens for LLM output generation (default: 8000)'
+        default='auto',
+        help='Maximum tokens for LLM output generation (default: auto). Use "auto" or -1 for model\'s capability, or specific number'
     )

     parser.add_argument(

@@ -329,19 +343,40 @@ Default model setup:
         provider, model = get_app_defaults('summarizer')
         config_source = "configured defaults"

-    #
-    max_tokens
+    # Parse max_tokens (support 'auto', -1, or specific number)
+    if args.max_tokens in ('auto', 'Auto', 'AUTO'):
+        max_tokens = -1
+    else:
+        try:
+            max_tokens = int(args.max_tokens)
+        except ValueError:
+            print(f"Error: --max-tokens must be 'auto' or a number, got: {args.max_tokens}")
+            sys.exit(1)
+
+    # Parse max_output_tokens (support 'auto', -1, or specific number)
+    if args.max_output_tokens in ('auto', 'Auto', 'AUTO'):
+        max_output_tokens = -1
+    else:
+        try:
+            max_output_tokens = int(args.max_output_tokens)
+        except ValueError:
+            print(f"Error: --max-output-tokens must be 'auto' or a number, got: {args.max_output_tokens}")
+            sys.exit(1)

     if args.verbose:
-
+        max_tokens_display = "AUTO" if max_tokens == -1 else str(max_tokens)
+        max_output_display = "AUTO" if max_output_tokens == -1 else str(max_output_tokens)
+        print(f"Initializing summarizer ({provider}, {model}, {max_tokens_display} token context, {max_output_display} output tokens) - using {config_source}...")

     if args.debug:
+        max_tokens_display = "AUTO" if max_tokens == -1 else str(max_tokens)
+        max_output_display = "AUTO" if max_output_tokens == -1 else str(max_output_tokens)
         print(f"🐛 Debug - Configuration details:")
         print(f"  Provider: {provider}")
         print(f"  Model: {model}")
         print(f"  Config source: {config_source}")
-        print(f"  Max tokens: {
-        print(f"  Max output tokens: {
+        print(f"  Max tokens: {max_tokens_display}")
+        print(f"  Max output tokens: {max_output_display}")
         print(f"  Chunk size: {args.chunk_size}")
         print(f"  Timeout: {args.timeout}")
         print(f"  Style: {args.style}")

@@ -349,12 +384,19 @@ Default model setup:
         print(f"  Focus: {args.focus}")

     try:
-
+        # When using auto mode (-1), don't pass to create_llm (let provider use defaults)
+        llm_kwargs = {'timeout': args.timeout}
+        if max_tokens != -1:
+            llm_kwargs['max_tokens'] = max_tokens
+        if max_output_tokens != -1:
+            llm_kwargs['max_output_tokens'] = max_output_tokens
+
+        llm = create_llm(provider, model=model, **llm_kwargs)
         summarizer = BasicSummarizer(
             llm,
             max_chunk_size=args.chunk_size,
             max_tokens=max_tokens,
-            max_output_tokens=
+            max_output_tokens=max_output_tokens,
             timeout=args.timeout
         )
     except Exception as e:
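The behavioural contract behind the new --max-tokens/--max-output-tokens flags is easiest to see outside the argparse plumbing. The sketch below restates the rule the diff implements; parse_token_budget and build_llm_kwargs are hypothetical names used only for illustration, not part of the package:

    # 'auto' (any casing) or -1 means "defer to the model's own limits";
    # anything else must parse as an integer hard limit, mirroring the CLI error path.
    def parse_token_budget(raw: str) -> int:
        if raw.strip().lower() == "auto":
            return -1
        return int(raw)  # ValueError here corresponds to the CLI's error-and-exit branch

    def build_llm_kwargs(timeout: float, max_tokens: int, max_output_tokens: int) -> dict:
        # -1 (auto) is never forwarded, so the provider keeps its own defaults.
        kwargs = {"timeout": timeout}
        if max_tokens != -1:
            kwargs["max_tokens"] = max_tokens
        if max_output_tokens != -1:
            kwargs["max_output_tokens"] = max_output_tokens
        return kwargs

    assert parse_token_budget("auto") == -1
    assert parse_token_budget("16000") == 16000
    assert build_llm_kwargs(120.0, -1, 8000) == {"timeout": 120.0, "max_output_tokens": 8000}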
abstractcore/architectures/detection.py
CHANGED

@@ -20,6 +20,41 @@ _model_capabilities: Optional[Dict[str, Any]] = None
 # Cache for resolved model names and architectures to reduce redundant logging
 _resolved_aliases_cache: Dict[str, str] = {}
 _detected_architectures_cache: Dict[str, str] = {}
+# Cache to avoid repeating default-capabilities warnings for the same unknown model.
+_default_capabilities_warning_cache: set[str] = set()
+
+
+# Some callers pass provider/model as a single string (e.g. "lmstudio/qwen/qwen3-next-80b").
+# For capability lookup we want the underlying model id, not the provider prefix.
+_KNOWN_PROVIDER_PREFIXES = {
+    "anthropic",
+    "azure",
+    "bedrock",
+    "fireworks",
+    "gemini",
+    "google",
+    "groq",
+    "huggingface",
+    "lmstudio",
+    "local",
+    "mlx",
+    "nvidia",
+    "ollama",
+    "openai",
+    "openai-compatible",
+    "together",
+    "vllm",
+}
+
+
+def _strip_provider_prefix(model_name: str) -> str:
+    s = str(model_name or "").strip()
+    if not s or "/" not in s:
+        return s
+    head, rest = s.split("/", 1)
+    if head.strip().lower() in _KNOWN_PROVIDER_PREFIXES and rest.strip():
+        return rest.strip()
+    return s


 def _load_json_assets():

@@ -72,16 +107,36 @@ def detect_architecture(model_name: str) -> str:
         _detected_architectures_cache[model_name] = "generic"
         return "generic"

-
+    # Normalize model names for better pattern matching:
+    # - HuggingFace cache names use `--` as `/` separators (models--org--name).
+    # - Claude versions sometimes appear as `claude-3-5-sonnet` (normalize to `claude-3.5-sonnet`).
+    model_lower = model_name.lower().replace("--", "/")
+    import re
+    model_lower = re.sub(r'(claude-\d+)-(\d+)(?=-|$)', r'\1.\2', model_lower)
+
+    # Choose the most specific matching architecture.
+    # Many architectures include broad patterns (e.g. "gpt") that can accidentally
+    # match more specific models (e.g. "gpt-oss"). We resolve this by selecting the
+    # longest matching pattern across all architectures.
+    best_arch = "generic"
+    best_pattern = ""

-    # Check each architecture's patterns
     for arch_name, arch_config in _architecture_formats["architectures"].items():
         patterns = arch_config.get("patterns", [])
         for pattern in patterns:
-
-
-
-
+            pat = str(pattern).lower()
+            if not pat:
+                continue
+            if pat in model_lower and len(pat) > len(best_pattern):
+                best_arch = arch_name
+                best_pattern = pat
+
+    if best_arch != "generic":
+        logger.debug(
+            f"Detected architecture '{best_arch}' for model '{model_name}' (pattern: '{best_pattern}')"
+        )
+        _detected_architectures_cache[model_name] = best_arch
+        return best_arch

     # Fallback to generic
     logger.debug(f"No specific architecture detected for '{model_name}', using generic")
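The selection rule introduced in detect_architecture is worth restating in isolation: every pattern of every architecture is tested as a substring, and the longest match wins, so a broad pattern such as "gpt" can no longer shadow a more specific one such as "gpt-oss". A toy sketch of that rule (the pattern table is an illustrative subset, not the real architecture_formats.json):

    # Illustrative subset: one pattern per architecture instead of the real pattern lists.
    PATTERNS = {
        "gpt": "gpt",
        "gpt_oss": "gpt-oss",
        "glm4_moe": "glm-4.5",
    }

    def pick_architecture(model_name: str) -> str:
        # Longest matching pattern wins; ties keep the first one seen.
        name = model_name.lower().replace("--", "/")
        best_arch, best_pattern = "generic", ""
        for arch, pattern in PATTERNS.items():
            if pattern in name and len(pattern) > len(best_pattern):
                best_arch, best_pattern = arch, pattern
        return best_arch

    assert pick_architecture("openai/gpt-oss-20b") == "gpt_oss"  # not shadowed by the broader "gpt"
    assert pick_architecture("gpt-4o-mini") == "gpt"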
@@ -147,22 +202,69 @@ def resolve_model_alias(model_name: str, models: Dict[str, Any]) -> str:
     if normalized_model_name != model_name:
         logger.debug(f"Normalized model name '{model_name}' to '{normalized_model_name}'")

-    #
-
-
-
-
-
+    # Also support "provider/model" strings by stripping known provider prefixes.
+    stripped_model_name = _strip_provider_prefix(model_name)
+    stripped_normalized_name = _strip_provider_prefix(normalized_model_name)
+
+    def _tail(name: str) -> str:
+        s = str(name or "").strip()
+        if not s or "/" not in s:
+            return s
+        return s.split("/")[-1].strip()
+
+    def _candidates(*names: str) -> List[str]:
+        out: List[str] = []
+        for n in names:
+            s = str(n or "").strip()
+            if not s:
+                continue
+            out.append(s)
+            t = _tail(s)
+            if t and t != s:
+                out.append(t)
+        # Deduplicate while preserving order
+        uniq: List[str] = []
+        seen: set[str] = set()
+        for s in out:
+            if s in seen:
+                continue
+            seen.add(s)
+            uniq.append(s)
+        return uniq
+
+    # Check if any normalized/stripped name is a canonical name.
+    for candidate in _candidates(normalized_model_name, stripped_normalized_name, stripped_model_name):
+        if candidate in models:
+            _resolved_aliases_cache[model_name] = candidate
+            return candidate
+
+    # Check if it's an alias of any model (try both original and normalized).
+    # Some JSON entries intentionally share aliases (e.g. base + variant). Prefer the
+    # most specific canonical model name deterministically.
+    alias_matches: List[str] = []
     for canonical_name, model_info in models.items():
         aliases = model_info.get("aliases", [])
-        if
-
-
-
+        if not isinstance(aliases, list) or not aliases:
+            continue
+        candidates = _candidates(model_name, normalized_model_name, stripped_model_name, stripped_normalized_name)
+        alias_set = {str(a).strip().lower() for a in aliases if isinstance(a, str) and str(a).strip()}
+        cand_set = {str(c).strip().lower() for c in candidates if isinstance(c, str) and str(c).strip()}
+        if alias_set and cand_set and alias_set.intersection(cand_set):
+            alias_matches.append(canonical_name)
+
+    if alias_matches:
+        best = max(alias_matches, key=lambda n: (len(str(n)), str(n)))
+        logger.debug(f"Resolved alias '{model_name}' to canonical name '{best}'")
+        _resolved_aliases_cache[model_name] = best
+        return best

     # Return normalized name if no alias found
-
-
+    fallback = stripped_normalized_name or normalized_model_name
+    fallback_tail = _tail(fallback)
+    if fallback_tail:
+        fallback = fallback_tail
+    _resolved_aliases_cache[model_name] = fallback
+    return fallback


 def get_model_capabilities(model_name: str) -> Dict[str, Any]:
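resolve_model_alias now tries several spellings of the incoming name against canonical names and aliases: the raw string, the string with a known provider prefix stripped, and the bare path tail. A simplified sketch of that candidate generation (KNOWN_PREFIXES and candidates are illustrative stand-ins, not the module's actual helpers):

    KNOWN_PREFIXES = {"lmstudio", "ollama", "openai", "anthropic"}  # subset for illustration

    def candidates(model_name: str) -> list[str]:
        out = [model_name]
        head, _, rest = model_name.partition("/")
        if head.lower() in KNOWN_PREFIXES and rest:
            out.append(rest)                  # provider prefix stripped
        tail = model_name.rsplit("/", 1)[-1]
        if tail not in out:
            out.append(tail)                  # bare tail, e.g. for org/model ids
        return out

    assert candidates("lmstudio/qwen/qwen3-next-80b") == [
        "lmstudio/qwen/qwen3-next-80b",
        "qwen/qwen3-next-80b",
        "qwen3-next-80b",
    ]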
@@ -199,15 +301,44 @@ def get_model_capabilities(model_name: str) -> Dict[str, Any]:
     # Step 3: Try partial matches for common model naming patterns
     # Use canonical_name (which has been normalized) for better matching
     canonical_lower = canonical_name.lower()
-
-
+    candidates_name_in_key: List[tuple[int, int, str]] = []
+    candidates_key_in_name: List[tuple[int, str]] = []
+    for model_key in models.keys():
+        if not isinstance(model_key, str) or not model_key.strip():
+            continue
+        key_lower = model_key.lower()
+
+        # Prefer a close "superstring" match where the canonical name is missing a suffix.
+        # Example: "qwen3-next-80b" -> "qwen3-next-80b-a3b"
+        if canonical_lower and canonical_lower in key_lower:
+            extra = max(0, len(key_lower) - len(canonical_lower))
+            candidates_name_in_key.append((extra, len(key_lower), model_key))
+            continue
+
+        # Otherwise, prefer the most specific substring match (e.g. provider/model prefixes).
+        if key_lower in canonical_lower:
+            candidates_key_in_name.append((len(key_lower), model_key))
+
+    best_key: Optional[str] = None
+    best_mode: Optional[str] = None
+    if candidates_name_in_key:
+        candidates_name_in_key.sort(key=lambda x: (x[0], -x[1]))
+        best_key = candidates_name_in_key[0][2]
+        best_mode = "name_in_key"
+    elif candidates_key_in_name:
+        best_key = max(candidates_key_in_name, key=lambda x: x[0])[1]
+        best_mode = "key_in_name"
+
+    if best_key is not None:
+        capabilities = models.get(best_key)
+        if isinstance(capabilities, dict):
             result = capabilities.copy()
             # Remove alias-specific fields
             result.pop("canonical_name", None)
             result.pop("aliases", None)
             if "architecture" not in result:
                 result["architecture"] = detect_architecture(model_name)
-            logger.debug(f"Using capabilities from '{
+            logger.debug(f"Using capabilities from '{best_key}' for '{model_name}' (partial match: {best_mode})")
             return result

     # Step 4: Fallback to default capabilities based on architecture

@@ -215,16 +346,50 @@ def get_model_capabilities(model_name: str) -> Dict[str, Any]:
     default_caps = _model_capabilities.get("default_capabilities", {}).copy()
     default_caps["architecture"] = architecture

-    # Enhance defaults based on architecture
+    # Enhance defaults based on architecture.
+    #
+    # NOTE: `architecture_formats.json.tool_format` describes the *prompted transcript syntax*
+    # for tool calls (e.g. XML-wrapped, <|tool_call|> blocks, etc). Some architectures/models
+    # also support *native tool APIs* (provider-level `tools` payloads) even when their prompted
+    # transcript format is non-native. For those cases, architectures can set an explicit
+    # `default_tool_support` to avoid relying on tool_format heuristics.
     arch_format = get_architecture_format(architecture)
-
+
+    explicit_support = str(arch_format.get("default_tool_support") or "").strip().lower()
+    if explicit_support in {"native", "prompted", "none"}:
+        default_caps["tool_support"] = explicit_support
+    elif arch_format.get("tool_format") == "native":
         default_caps["tool_support"] = "native"
-    elif arch_format.get("tool_format") in ["special_token", "json", "xml", "pythonic"]:
+    elif arch_format.get("tool_format") in ["special_token", "json", "xml", "pythonic", "glm_xml"]:
         default_caps["tool_support"] = "prompted"
     else:
         default_caps["tool_support"] = "none"

+    # Propagate architecture-level output wrappers into default capabilities.
+    wrappers = arch_format.get("output_wrappers")
+    if isinstance(wrappers, dict) and wrappers:
+        default_caps["output_wrappers"] = dict(wrappers)
+
     logger.debug(f"Using default capabilities for '{model_name}' (architecture: {architecture})")
+
+    # Emit a one-time warning for unknown models to keep model_capabilities.json up to date.
+    try:
+        raw_name = str(model_name).strip()
+    except Exception:
+        raw_name = ""
+
+    if raw_name and raw_name not in _default_capabilities_warning_cache:
+        _default_capabilities_warning_cache.add(raw_name)
+        logger.warning(
+            "Model not found in model_capabilities.json; falling back to architecture defaults",
+            model_name=raw_name,
+            detected_architecture=architecture,
+            default_tool_support=default_caps.get("tool_support"),
+            next_steps=(
+                "Add this model (or an alias) to abstractcore/abstractcore/assets/model_capabilities.json "
+                "or email contact@abstractcore.ai with the exact model id and provider."
+            ),
+        )
     return default_caps
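The fallback path above leaves an architecture with one of three tool-support values: an explicit default_tool_support always wins, otherwise a native tool_format implies "native", and the prompted transcript formats (now including glm_xml) imply "prompted". A compact restatement under those assumptions (infer_tool_support is an illustrative helper, not library code):

    def infer_tool_support(arch_format: dict) -> str:
        # Explicit architecture-level override takes precedence over tool_format heuristics.
        explicit = str(arch_format.get("default_tool_support") or "").strip().lower()
        if explicit in {"native", "prompted", "none"}:
            return explicit
        if arch_format.get("tool_format") == "native":
            return "native"
        if arch_format.get("tool_format") in ["special_token", "json", "xml", "pythonic", "glm_xml"]:
            return "prompted"
        return "none"

    # The claude architecture keeps its prompted XML transcript format but now reports
    # native tool support via the explicit override added in this release:
    assert infer_tool_support({"tool_format": "xml", "default_tool_support": "native"}) == "native"
    assert infer_tool_support({"tool_format": "glm_xml"}) == "prompted"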
@@ -539,4 +704,4 @@ def check_vision_model_compatibility(model_name: str, provider: str = None) -> D
         result['warnings'].append("No max_image_tokens specified")
         result['recommendations'].append("Add max_image_tokens to model capabilities")

-    return result
+    return result
abstractcore/assets/architecture_formats.json
CHANGED

@@ -88,7 +88,7 @@
       "patterns": ["qwen3-next"]
     },
     "qwen3_vl": {
-      "description": "Alibaba's Qwen3-VL multimodal architecture (
+      "description": "Alibaba's Qwen3-VL multimodal architecture (May 2025)",
       "message_format": "im_start_end",
       "system_prefix": "<|im_start|>system\n",
       "system_suffix": "<|im_end|>\n",

@@ -96,8 +96,20 @@
       "user_suffix": "<|im_end|>\n",
       "assistant_prefix": "<|im_start|>assistant\n",
       "assistant_suffix": "<|im_end|>\n",
-      "tool_format": "
-      "patterns": ["qwen3-vl"]
+      "tool_format": "native",
+      "patterns": ["qwen3-vl-2b", "qwen3-vl-4b", "qwen3-vl-8b"]
+    },
+    "qwen3_vl_moe": {
+      "description": "Alibaba's Qwen3-VL MoE multimodal architecture (May 2025)",
+      "message_format": "im_start_end",
+      "system_prefix": "<|im_start|>system\n",
+      "system_suffix": "<|im_end|>\n",
+      "user_prefix": "<|im_start|>user\n",
+      "user_suffix": "<|im_end|>\n",
+      "assistant_prefix": "<|im_start|>assistant\n",
+      "assistant_suffix": "<|im_end|>\n",
+      "tool_format": "native",
+      "patterns": ["qwen3-vl-30b-a3b", "qwen3-vl-235b-a22b"]
     },
     "qwen3_moe": {
       "description": "Alibaba's Qwen3 MoE architecture (April 2025)",

@@ -211,6 +223,30 @@
       "tool_format": "native",
       "patterns": ["codestral"]
     },
+    "mistral3": {
+      "description": "Mistral AI Mistral 3 architecture with rope-scaling (December 2024)",
+      "message_format": "inst",
+      "system_prefix": "",
+      "system_suffix": "\n\n",
+      "user_prefix": "[INST] ",
+      "user_suffix": " [/INST]",
+      "assistant_prefix": "",
+      "assistant_suffix": "",
+      "tool_format": "native",
+      "patterns": ["mistral-small-3", "devstral-small-2"]
+    },
+    "ministral3": {
+      "description": "Mistral AI Ministral 3 architecture (December 2024)",
+      "message_format": "inst",
+      "system_prefix": "",
+      "system_suffix": "\n\n",
+      "user_prefix": "[INST] ",
+      "user_suffix": " [/INST]",
+      "assistant_prefix": "",
+      "assistant_suffix": "",
+      "tool_format": "native",
+      "patterns": ["devstral-2-123b"]
+    },
     "phi": {
       "description": "Microsoft's Phi architecture family",
       "message_format": "basic",

@@ -295,6 +331,26 @@
       "tool_format": "none",
       "patterns": ["gemma-2b", "gemma-7b"]
     },
+    "glm4v_moe": {
+      "description": "Zhipu AI's GLM-4.6V multimodal MoE architecture (May 2025)",
+      "message_format": "glm_special_tokens",
+      "system_prefix": "<|system|>\n",
+      "system_suffix": "\n",
+      "user_prefix": "<|user|>\n",
+      "user_suffix": "\n",
+      "assistant_prefix": "<|assistant|>\n",
+      "assistant_suffix": "\n",
+      "tool_format": "glm_xml",
+      "tool_calling_format": "<tool_call>function_name\n<arg_key>key</arg_key>\n<arg_value>value</arg_value>\n</tool_call>",
+      "output_wrappers": {
+        "start": "<|begin_of_box|>",
+        "end": "<|end_of_box|>"
+      },
+      "thinking_output_field": "reasoning_content",
+      "thinking_tags": ["<think>", "</think>"],
+      "thinking_control": "/nothink",
+      "patterns": ["glm-4.6v", "glm4.6v", "zai-org/glm-4.6v", "glm-4.6v-flash", "glm-4.6v-fp8", "glm-4.6v-flash-fp8"]
+    },
     "glm4_moe": {
       "description": "Zhipu AI's GLM-4.5+ MoE architecture (July 2025)",
       "message_format": "im_start_end",
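For reference, the glm_xml tool_calling_format string added for glm4v_moe expands to one <tool_call> block per call with alternating <arg_key>/<arg_value> pairs. A hedged sketch of a renderer that produces that shape (render_glm_tool_call is illustrative only, not the formatter or parser the package ships):

    def render_glm_tool_call(name: str, args: dict) -> str:
        # Follows the template: <tool_call>function_name\n<arg_key>key</arg_key>\n<arg_value>value</arg_value>\n</tool_call>
        parts = [f"<tool_call>{name}"]
        for key, value in args.items():
            parts.append(f"<arg_key>{key}</arg_key>")
            parts.append(f"<arg_value>{value}</arg_value>")
        parts.append("</tool_call>")
        return "\n".join(parts)

    print(render_glm_tool_call("get_weather", {"city": "Paris"}))
    # <tool_call>get_weather
    # <arg_key>city</arg_key>
    # <arg_value>Paris</arg_value>
    # </tool_call>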
@@ -306,7 +362,7 @@
       "assistant_suffix": "\n",
       "tool_format": "special_token",
       "tool_prefix": "<|tool_call|>",
-      "patterns": ["glm-4.
+      "patterns": ["glm-4.7", "glm-4.6", "glm-4.5", "glm-4.5-air"]
     },
     "glm4v": {
       "description": "Zhipu AI's GLM-4V multimodal architecture (June 2024)",

@@ -345,6 +401,19 @@
       "tool_prefix": "<|tool_call|>",
       "patterns": ["granite", "granite3.3:2b"]
     },
+    "granitemoehybrid": {
+      "description": "IBM's Granite 4.0 hybrid MoE architecture with Mamba2 (October 2025)",
+      "message_format": "special_tokens",
+      "system_prefix": "<|system|>\n",
+      "system_suffix": "\n",
+      "user_prefix": "<|user|>\n",
+      "user_suffix": "\n",
+      "assistant_prefix": "<|assistant|>\n",
+      "assistant_suffix": "\n",
+      "tool_format": "native",
+      "tool_prefix": "<|tool_call|>",
+      "patterns": ["granite-4.0-h", "granite-h-tiny", "granite-h-micro"]
+    },
     "deepseek": {
       "description": "DeepSeek architecture family",
       "message_format": "im_start_end",

@@ -357,6 +426,32 @@
       "tool_format": "json",
       "patterns": ["deepseek"]
     },
+    "minimax_m2_1": {
+      "description": "MiniMax M2.1 enhanced MoE architecture with improved coding and agentic capabilities (December 2024)",
+      "message_format": "im_start_end",
+      "system_prefix": "<|im_start|>system\n",
+      "system_suffix": "<|im_end|>\n",
+      "user_prefix": "<|im_start|>user\n",
+      "user_suffix": "<|im_end|>\n",
+      "assistant_prefix": "<|im_start|>assistant\n",
+      "assistant_suffix": "<|im_end|>\n",
+      "tool_format": "native",
+      "thinking_format": "<think>...</think>",
+      "patterns": ["minimax-m2.1", "minimaxai/minimax-m2.1", "minimax/minimax-m2.1"]
+    },
+    "minimax_m2": {
+      "description": "MiniMax M2 MoE architecture with interleaved thinking (January 2025)",
+      "message_format": "im_start_end",
+      "system_prefix": "<|im_start|>system\n",
+      "system_suffix": "<|im_end|>\n",
+      "user_prefix": "<|im_start|>user\n",
+      "user_suffix": "<|im_end|>\n",
+      "assistant_prefix": "<|im_start|>assistant\n",
+      "assistant_suffix": "<|im_end|>\n",
+      "tool_format": "native",
+      "thinking_format": "<think>...</think>",
+      "patterns": ["minimax-m2", "minimaxai/minimax-m2", "minimax/minimax-m2"]
+    },
     "seed_oss": {
       "description": "ByteDance's Seed-OSS long-context architecture (August 2025)",
       "message_format": "im_start_end",

@@ -390,6 +485,7 @@
       "user_suffix": "\n",
       "assistant_prefix": "Assistant: ",
       "assistant_suffix": "\n",
+      "default_tool_support": "native",
       "tool_format": "xml",
       "patterns": ["claude", "claude-3", "claude-4", "claude-4.1", "claude-4.5"]
     },

@@ -399,6 +495,32 @@
       "tool_format": "openai_functions",
       "patterns": ["gpt", "chatgpt", "gpt-5"]
     },
+    "gpt_oss": {
+      "description": "OpenAI GPT-OSS open-weight MoE architecture with harmony format (August 2025)",
+      "message_format": "harmony",
+      "system_prefix": "<|system|>\n",
+      "system_suffix": "\n",
+      "user_prefix": "<|user|>\n",
+      "user_suffix": "\n",
+      "assistant_prefix": "<|assistant|>\n",
+      "assistant_suffix": "\n",
+      "tool_format": "native",
+      "reasoning_levels": ["low", "medium", "high"],
+      "patterns": ["gpt-oss", "openai/gpt-oss"]
+    },
+    "nemotron_hybrid_moe": {
+      "description": "NVIDIA Nemotron-3-Nano hybrid MoE architecture with Mamba-2 and Attention layers (December 2025)",
+      "message_format": "im_start_end",
+      "system_prefix": "<|im_start|>system\n",
+      "system_suffix": "<|im_end|>\n",
+      "user_prefix": "<|im_start|>user\n",
+      "user_suffix": "<|im_end|>\n",
+      "assistant_prefix": "<|im_start|>assistant\n",
+      "assistant_suffix": "<|im_end|>\n",
+      "tool_format": "json",
+      "reasoning_support": true,
+      "patterns": ["nemotron-3-nano", "nemotron-nano", "nvidia/nemotron"]
+    },
     "generic": {
       "description": "Generic/unknown architecture fallback",
       "message_format": "basic",

@@ -420,7 +542,8 @@
     "human_assistant": "Human/Assistant format",
     "openai_chat": "OpenAI chat completion format",
     "llama3_header": "LLaMA 3+ format with <|start_header_id|> and <|eot_id|>",
-    "glm_special_tokens": "GLM format with <|system|>, <|user|>, <|assistant|> tokens"
+    "glm_special_tokens": "GLM format with <|system|>, <|user|>, <|assistant|> tokens",
+    "harmony": "OpenAI harmony response format for GPT-OSS models"
   },
   "tool_formats": {
     "pythonic": "Python function call syntax: [func(arg=val)]",

@@ -432,4 +555,4 @@
     "prompted": "Tool use through careful prompting",
     "none": "No tool support"
   }
-}
+}