abstractcore-2.4.2-py3-none-any.whl → abstractcore-2.4.4-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (34)
  1. abstractcore/apps/app_config_utils.py +19 -0
  2. abstractcore/apps/summarizer.py +85 -56
  3. abstractcore/architectures/detection.py +15 -4
  4. abstractcore/assets/architecture_formats.json +1 -1
  5. abstractcore/assets/model_capabilities.json +420 -11
  6. abstractcore/core/interface.py +2 -0
  7. abstractcore/core/session.py +4 -0
  8. abstractcore/embeddings/manager.py +54 -16
  9. abstractcore/media/__init__.py +116 -148
  10. abstractcore/media/auto_handler.py +363 -0
  11. abstractcore/media/base.py +456 -0
  12. abstractcore/media/capabilities.py +335 -0
  13. abstractcore/media/types.py +300 -0
  14. abstractcore/media/vision_fallback.py +260 -0
  15. abstractcore/providers/anthropic_provider.py +18 -1
  16. abstractcore/providers/base.py +187 -0
  17. abstractcore/providers/huggingface_provider.py +111 -12
  18. abstractcore/providers/lmstudio_provider.py +88 -5
  19. abstractcore/providers/mlx_provider.py +33 -1
  20. abstractcore/providers/ollama_provider.py +37 -3
  21. abstractcore/providers/openai_provider.py +18 -1
  22. abstractcore/server/app.py +1390 -104
  23. abstractcore/tools/common_tools.py +12 -8
  24. abstractcore/utils/__init__.py +9 -5
  25. abstractcore/utils/cli.py +199 -17
  26. abstractcore/utils/message_preprocessor.py +182 -0
  27. abstractcore/utils/structured_logging.py +117 -16
  28. abstractcore/utils/version.py +1 -1
  29. {abstractcore-2.4.2.dist-info → abstractcore-2.4.4.dist-info}/METADATA +214 -20
  30. {abstractcore-2.4.2.dist-info → abstractcore-2.4.4.dist-info}/RECORD +34 -27
  31. {abstractcore-2.4.2.dist-info → abstractcore-2.4.4.dist-info}/entry_points.txt +1 -0
  32. {abstractcore-2.4.2.dist-info → abstractcore-2.4.4.dist-info}/WHEEL +0 -0
  33. {abstractcore-2.4.2.dist-info → abstractcore-2.4.4.dist-info}/licenses/LICENSE +0 -0
  34. {abstractcore-2.4.2.dist-info → abstractcore-2.4.4.dist-info}/top_level.txt +0 -0
abstractcore/apps/app_config_utils.py
@@ -0,0 +1,19 @@
+"""
+Shared configuration utilities for AbstractCore apps.
+"""
+
+def get_app_defaults(app_name: str) -> tuple[str, str]:
+    """Get default provider and model for an app."""
+    try:
+        from ..config import get_config_manager
+        config_manager = get_config_manager()
+        return config_manager.get_app_default(app_name)
+    except Exception:
+        # Fallback to hardcoded defaults if config unavailable
+        hardcoded_defaults = {
+            'summarizer': ('huggingface', 'unsloth/Qwen3-4B-Instruct-2507-GGUF'),
+            'extractor': ('huggingface', 'unsloth/Qwen3-4B-Instruct-2507-GGUF'),
+            'judge': ('huggingface', 'unsloth/Qwen3-4B-Instruct-2507-GGUF'),
+            'cli': ('huggingface', 'unsloth/Qwen3-4B-Instruct-2507-GGUF'),
+        }
+        return hardcoded_defaults.get(app_name, ('huggingface', 'unsloth/Qwen3-4B-Instruct-2507-GGUF'))
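
For orientation, a minimal sketch of how an app consumes this helper. The call site is hypothetical; the import paths are assumed from the file list above and from the "from ..core.factory import create_llm" import visible in summarizer.py below:

    from abstractcore.apps.app_config_utils import get_app_defaults
    from abstractcore.core.factory import create_llm

    # Resolves the configured default, falling back to
    # ('huggingface', 'unsloth/Qwen3-4B-Instruct-2507-GGUF') whenever
    # the config manager is unavailable.
    provider, model = get_app_defaults('summarizer')
    llm = create_llm(provider, model=model)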
abstractcore/apps/summarizer.py
@@ -35,6 +35,23 @@ from ..processing import BasicSummarizer, SummaryStyle, SummaryLength
 from ..core.factory import create_llm
 
 
+def get_app_defaults(app_name: str) -> tuple[str, str]:
+    """Get default provider and model for an app."""
+    try:
+        from ..config import get_config_manager
+        config_manager = get_config_manager()
+        return config_manager.get_app_default(app_name)
+    except Exception:
+        # Fallback to hardcoded defaults if config unavailable
+        hardcoded_defaults = {
+            'summarizer': ('huggingface', 'unsloth/Qwen3-4B-Instruct-2507-GGUF'),
+            'extractor': ('huggingface', 'unsloth/Qwen3-4B-Instruct-2507-GGUF'),
+            'judge': ('huggingface', 'unsloth/Qwen3-4B-Instruct-2507-GGUF'),
+            'cli': ('huggingface', 'unsloth/Qwen3-4B-Instruct-2507-GGUF'),
+        }
+        return hardcoded_defaults.get(app_name, ('huggingface', 'unsloth/Qwen3-4B-Instruct-2507-GGUF'))
+
+
 def read_file_content(file_path: str) -> str:
     """
     Read content from various file types
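
(This is the same helper just added in app_config_utils.py, duplicated verbatim in summarizer.py rather than imported.)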
@@ -168,9 +185,9 @@ Examples:
 Supported file types: .txt, .md, .py, .js, .html, .json, .csv, and most text-based files
 
 Default model setup:
-  - Requires Ollama: https://ollama.com/
-  - Download model: ollama pull gemma3:1b-it-qat
-  - Or use --provider and --model for other providers
+  - Fresh installs use: huggingface/unsloth/Qwen3-4B-Instruct-2507-GGUF (HuggingFace local model)
+  - Configure defaults: abstractcore --set-app-default summarizer <provider> <model>
+  - Or use --provider and --model for explicit override
 """
 )
 
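
(The help text drops the hard Ollama dependency: fresh installs no longer need an Ollama daemon and a gemma3:1b-it-qat pull, matching the HuggingFace fallback in get_app_defaults above.)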
@@ -240,6 +257,12 @@ Default model setup:
         help='Show detailed progress information'
     )
 
+    parser.add_argument(
+        '--debug',
+        action='store_true',
+        help='Enable debug logging and show detailed diagnostics'
+    )
+
     parser.add_argument(
         '--timeout',
         default=None,
@@ -249,6 +272,17 @@ Default model setup:
     # Parse arguments
     args = parser.parse_args()
 
+    # Configure logging based on arguments (--debug overrides config defaults)
+    if args.debug:
+        from ..utils.structured_logging import configure_logging
+        import logging
+        configure_logging(
+            console_level=logging.DEBUG,
+            file_level=logging.DEBUG,
+            verbatim_enabled=True
+        )
+        print("🐛 Debug logging enabled")
+
     try:
         # Validate chunk size
        if args.chunk_size < 1000:
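
The same opt-in pattern can be reproduced outside the CLI. A minimal sketch reusing the configure_logging signature visible in this hunk (the effect of verbatim_enabled is assumed from its name; it is not documented in this diff):

    import logging
    from abstractcore.utils.structured_logging import configure_logging

    # Mirror the --debug branch: route DEBUG to both console and file
    # handlers, and turn on verbatim logging (assumed: raw prompt/response
    # capture, per the structured_logging changes listed in this release).
    configure_logging(
        console_level=logging.DEBUG,
        file_level=logging.DEBUG,
        verbatim_enabled=True,
    )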
@@ -285,66 +319,61 @@ Default model setup:
         style = parse_style(args.style)
         length = parse_length(args.length)
 
-        # Initialize LLM and summarizer
+        # Get provider and model using centralized configuration
         if args.provider and args.model:
-            # Custom provider/model with max_tokens adjusted for chunk size
-            max_tokens = max(16000, args.chunk_size)  # Ensure max_tokens >= chunk_size
-            if args.verbose:
-                print(f"Initializing summarizer ({args.provider}, {args.model}, {args.max_tokens} token context, {args.max_output_tokens} output tokens)...")
+            # Use explicit parameters
+            provider, model = args.provider, args.model
+            config_source = "explicit parameters"
+        else:
+            # Use configured defaults
+            provider, model = get_app_defaults('summarizer')
+            config_source = "configured defaults"
+
+        # Adjust max_tokens based on chunk size
+        max_tokens = max(args.max_tokens, args.chunk_size)
+
+        if args.verbose:
+            print(f"Initializing summarizer ({provider}, {model}, {max_tokens} token context, {args.max_output_tokens} output tokens) - using {config_source}...")
+
+        if args.debug:
+            print(f"🐛 Debug - Configuration details:")
+            print(f"   Provider: {provider}")
+            print(f"   Model: {model}")
+            print(f"   Config source: {config_source}")
+            print(f"   Max tokens: {max_tokens}")
+            print(f"   Max output tokens: {args.max_output_tokens}")
+            print(f"   Chunk size: {args.chunk_size}")
+            print(f"   Timeout: {args.timeout}")
+            print(f"   Style: {args.style}")
+            print(f"   Length: {args.length}")
+            print(f"   Focus: {args.focus}")
 
-        llm = create_llm(args.provider, model=args.model, max_tokens=args.max_tokens, max_output_tokens=args.max_output_tokens, timeout=args.timeout)
+        try:
+            llm = create_llm(provider, model=model, max_tokens=max_tokens, max_output_tokens=args.max_output_tokens, timeout=args.timeout)
             summarizer = BasicSummarizer(
-            llm,
+                llm,
                 max_chunk_size=args.chunk_size,
-            max_tokens=args.max_tokens,
+                max_tokens=max_tokens,
                 max_output_tokens=args.max_output_tokens,
                 timeout=args.timeout
             )
-        else:
-            # Default configuration with chunk size override
-            if args.chunk_size != 8000:
-                # Custom chunk size, need to adjust max_tokens if necessary
-                max_tokens = max(16000, args.chunk_size)
-                if args.verbose:
-                    print(f"Initializing summarizer (ollama, gemma3:1b-it-qat, {args.max_tokens} token context, {args.max_output_tokens} output tokens, {args.chunk_size} chunk size)...")
-
-                try:
-                    llm = create_llm("ollama", model="gemma3:1b-it-qat", max_tokens=args.max_tokens, max_output_tokens=args.max_output_tokens, timeout=args.timeout)
-                    summarizer = BasicSummarizer(
-                        llm,
-                        max_chunk_size=args.chunk_size,
-                        max_tokens=args.max_tokens,
-                        max_output_tokens=args.max_output_tokens,
-                        timeout=args.timeout
-                    )
-                except Exception as e:
-                    # Handle default model not available
-                    print(f"\n❌ Failed to initialize default Ollama model 'gemma3:1b-it-qat': {e}")
-                    print("\n💡 To use the default model, please:")
-                    print("   1. Install Ollama from: https://ollama.com/")
-                    print("   2. Download the model: ollama pull gemma3:1b-it-qat")
-                    print("   3. Start Ollama service")
-                    print("\n🚀 Alternatively, specify a different provider:")
-                    print("   - Example: summarizer document.txt --provider openai --model gpt-4o-mini")
-                    sys.exit(1)
-            else:
-                # Default configuration
-                if args.verbose:
-                    print(f"Initializing summarizer (ollama, gemma3:1b-it-qat, {args.max_tokens} token context, {args.max_output_tokens} output tokens, {args.chunk_size} chunk size)...")
-                try:
-                    summarizer = BasicSummarizer(
-                        max_chunk_size=args.chunk_size,
-                        max_tokens=args.max_tokens,
-                        max_output_tokens=args.max_output_tokens,
-                        timeout=args.timeout
-                    )
-                except RuntimeError as e:
-                    # Handle default model not available
-                    print(f"\n{e}")
-                    print("\n🚀 Quick alternatives to get started:")
-                    print("   - Use --provider and --model to specify an available provider")
-                    print("   - Example: summarizer document.txt --provider openai --model gpt-4o-mini")
-                    sys.exit(1)
+        except Exception as e:
+            # Handle model initialization failure
+            print(f"\n❌ Failed to initialize LLM '{provider}/{model}': {e}")
+
+            print(f"\n💡 Solutions:")
+            if provider == "ollama":
+                print(f"   - Install Ollama: https://ollama.com/")
+                print(f"   - Download the model: ollama pull {model}")
+                print(f"   - Verify with: ollama list")
+
+            print(f"\n🚀 Alternatively, specify a different provider:")
+            print(f"   - Example: summarizer document.txt --provider openai --model gpt-4o-mini")
+            print(f"   - Example: summarizer document.txt --provider anthropic --model claude-3-5-haiku-20241022")
+            print(f"\n🔧 Or configure a different default:")
+            print(f"   - abstractcore --set-app-default summarizer openai gpt-4o-mini")
+            print(f"   - abstractcore --status")
+            sys.exit(1)
 
         # Generate summary
         if args.verbose:
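
Two behavioral changes ride along with this consolidation: the context floor moves from max(16000, args.chunk_size) to max(args.max_tokens, args.chunk_size), so an explicit --max-tokens below 16000 is now honored as long as it covers the chunk size; and initialization failures for any provider now get recovery guidance, with the Ollama-specific pull instructions printed only when provider == "ollama".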
abstractcore/architectures/detection.py
@@ -100,6 +100,8 @@ def resolve_model_alias(model_name: str, models: Dict[str, Any]) -> str:
     """
     Resolve a model name to its canonical name by checking aliases.
 
+    Automatically converts "--" to "/" for HuggingFace cache format compatibility.
+
     Args:
         model_name: Model name that might be an alias
         models: Models dictionary from capabilities JSON
@@ -111,15 +113,24 @@ def resolve_model_alias(model_name: str, models: Dict[str, Any]) -> str:
     if model_name in models:
         return model_name
 
-    # Check if it's an alias of any model
+    # Convert "--" to "/" for HuggingFace cache format compatibility
+    normalized_model_name = model_name.replace("--", "/")
+    if normalized_model_name != model_name:
+        logger.debug(f"Normalized model name '{model_name}' to '{normalized_model_name}'")
+
+    # Check if normalized name is a canonical name
+    if normalized_model_name in models:
+        return normalized_model_name
+
+    # Check if it's an alias of any model (try both original and normalized)
     for canonical_name, model_info in models.items():
         aliases = model_info.get("aliases", [])
-        if model_name in aliases:
+        if model_name in aliases or normalized_model_name in aliases:
             logger.debug(f"Resolved alias '{model_name}' to canonical name '{canonical_name}'")
             return canonical_name
 
-    # Return original name if no alias found
-    return model_name
+    # Return normalized name if no alias found
+    return normalized_model_name
 
 
 def get_model_capabilities(model_name: str) -> Dict[str, Any]:
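
A toy reproduction of the normalization this hunk introduces; the models dict below is illustrative, not taken from the shipped capabilities JSON:

    # HuggingFace caches repos as directories like "models--org--repo",
    # so cache-derived names arrive with "--" where the repo id has "/".
    models = {
        "unsloth/Qwen3-4B-Instruct-2507-GGUF": {"aliases": ["qwen3-4b"]},
    }

    name = "unsloth--Qwen3-4B-Instruct-2507-GGUF"
    normalized = name.replace("--", "/")
    assert normalized in models  # resolves where the raw name would not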
abstractcore/assets/architecture_formats.json
@@ -233,7 +233,7 @@
       "assistant_prefix": "Assistant: ",
       "assistant_suffix": "\n",
       "tool_format": "native",
-      "patterns": ["gemma3n", "gemma3n:e4b", "gemma3n:e2b"]
+      "patterns": ["gemma3n", "gemma3n:e4b", "gemma3n:e2b", "gemma-3n", "google/gemma-3n"]
     },
     "paligemma": {
       "description": "Google's PaliGemma vision-language architecture",