chat-console 0.3.9 → 0.3.94 (py3-none-any.whl)

This diff compares publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between versions as they appear in their respective public registries.
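
Taken together, the new code in this diff rewrites `generate_conversation_title` to always fall back to a timestamped default title (preferring an OpenAI or Anthropic client when an API key is configured) and splits the old monolithic streaming worker into per-provider helpers (`_generate_openai_stream`, `_generate_anthropic_stream`, `_generate_ollama_stream`, plus a generic fallback) that `generate_streaming_response` dispatches to, with a shared `asyncio.Lock` serializing UI callbacks. All four helpers repeat the same chunk-buffering loop; the sketch below distills that pattern into a standalone form. The function name, the `fake_stream` generator, and the demo harness are illustrative only, not code from the package.

```python
import asyncio
import time
from typing import AsyncIterator, Awaitable, Callable

async def stream_with_buffered_updates(
    chunks: AsyncIterator[str],
    callback: Callable[[str], Awaitable[None]],
    update_lock: asyncio.Lock,
    update_interval: float = 0.03,
) -> str:
    """Accumulate stream chunks and flush them to a UI callback at a throttled rate."""
    full_response = ""
    buffer: list[str] = []
    last_update = time.time()

    async for chunk in chunks:
        if not chunk:
            continue
        buffer.append(str(chunk))
        now = time.time()
        # Mirror the diff's flush rule: time-based, size-based, or eager for the first ~50 chars.
        if (now - last_update >= update_interval
                or len("".join(buffer)) > 5
                or len(full_response) < 50):
            full_response += "".join(buffer)
            async with update_lock:  # one lock serializes UI updates across tasks
                await callback(full_response)
            buffer, last_update = [], now
            await asyncio.sleep(0.02)

    if buffer:  # flush any trailing content
        full_response += "".join(buffer)
        async with update_lock:
            await callback(full_response)
    return full_response

async def _demo() -> None:
    async def fake_stream() -> AsyncIterator[str]:
        for word in ("Streaming ", "works ", "here."):
            yield word
            await asyncio.sleep(0.01)

    async def show(text: str) -> None:
        print(text)

    await stream_with_buffered_updates(fake_stream(), show, asyncio.Lock())

if __name__ == "__main__":
    asyncio.run(_demo())
```
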
app/utils.py CHANGED
@@ -27,458 +27,648 @@ async def generate_conversation_title(message: str, model: str, client: Any) ->
27
27
 
28
28
  debug_log(f"Starting title generation with model: {model}, client type: {type(client).__name__}")
29
29
 
30
- # --- Choose a specific, reliable model for title generation ---
31
- # First, determine if we have a valid client
32
- if client is None:
33
- debug_log("Client is None, will use default title")
34
- return f"Conversation ({datetime.now().strftime('%Y-%m-%d %H:%M')})"
35
-
36
- # Determine the best model to use for title generation
37
- title_model_id = None
30
+ # For safety, always use a default title first
31
+ default_title = f"Conversation ({datetime.now().strftime('%Y-%m-%d %H:%M')})"
38
32
 
39
- # Check if client is Anthropic
40
- is_anthropic = 'anthropic' in str(type(client)).lower()
41
- if is_anthropic:
42
- debug_log("Using Anthropic client for title generation")
43
- # Try to get available models safely
44
- try:
45
- available_anthropic_models = client.get_available_models()
46
- debug_log(f"Found {len(available_anthropic_models)} Anthropic models")
33
+ # Try-except the entire function to ensure we always return a title
34
+ try:
35
+ # Pick a reliable title generation model - prefer OpenAI if available
36
+ from ..config import OPENAI_API_KEY, ANTHROPIC_API_KEY
37
+
38
+ if OPENAI_API_KEY:
39
+ from ..api.openai import OpenAIClient
40
+ title_client = await OpenAIClient.create()
41
+ title_model = "gpt-3.5-turbo"
42
+ debug_log("Using OpenAI for title generation")
43
+ elif ANTHROPIC_API_KEY:
44
+ from ..api.anthropic import AnthropicClient
45
+ title_client = await AnthropicClient.create()
46
+ title_model = "claude-3-haiku-20240307"
47
+ debug_log("Using Anthropic for title generation")
48
+ else:
49
+ # Use the passed client if no API keys available
50
+ title_client = client
51
+ title_model = model
52
+ debug_log(f"Using provided {type(client).__name__} for title generation")
53
+
54
+ # Create a special prompt for title generation
55
+ title_prompt = [
56
+ {
57
+ "role": "system",
58
+ "content": "Generate a brief, descriptive title (maximum 40 characters) for a conversation that starts with the following message. Return only the title text with no additional explanation or formatting."
59
+ },
60
+ {
61
+ "role": "user",
62
+ "content": message
63
+ }
64
+ ]
65
+
66
+ # Generate title
67
+ debug_log(f"Sending title generation request to {title_model}")
68
+ title = await title_client.generate_completion(
69
+ messages=title_prompt,
70
+ model=title_model,
71
+ temperature=0.7,
72
+ max_tokens=60
73
+ )
74
+
75
+ # Sanitize the title
76
+ title = title.strip().strip('"\'').strip()
77
+ if len(title) > 40:
78
+ title = title[:37] + "..."
47
79
 
48
- # Try Claude 3 Haiku first (fastest)
49
- haiku_id = "claude-3-haiku-20240307"
50
- if any(m.get("id") == haiku_id for m in available_anthropic_models):
51
- title_model_id = haiku_id
52
- debug_log(f"Using Anthropic Haiku for title generation: {title_model_id}")
53
- else:
54
- # If Haiku not found, try Sonnet
55
- sonnet_id = "claude-3-sonnet-20240229"
56
- if any(m.get("id") == sonnet_id for m in available_anthropic_models):
57
- title_model_id = sonnet_id
58
- debug_log(f"Using Anthropic Sonnet for title generation: {title_model_id}")
59
- else:
60
- debug_log("Neither Haiku nor Sonnet found in Anthropic models list")
61
- except Exception as e:
62
- debug_log(f"Error getting Anthropic models: {str(e)}")
80
+ debug_log(f"Generated title: {title}")
81
+ return title
82
+
83
+ except Exception as e:
84
+ # Log the error and return default title
85
+ debug_log(f"Title generation failed: {str(e)}")
86
+ logger.error(f"Title generation failed: {str(e)}")
87
+ return default_title
63
88
 
64
- # Check if client is OpenAI
65
- is_openai = 'openai' in str(type(client)).lower()
66
- if is_openai:
67
- debug_log("Using OpenAI client for title generation")
68
- # Use GPT-3.5 for title generation (fast and cost-effective)
69
- title_model_id = "gpt-3.5-turbo"
70
- debug_log(f"Using OpenAI model for title generation: {title_model_id}")
71
- # For OpenAI, we'll always use their model, not fall back to the passed model
72
- # This prevents trying to use Ollama models with OpenAI client
89
+ # Helper function for OpenAI streaming
90
+ async def _generate_openai_stream(
91
+ app: 'SimpleChatApp',
92
+ messages: List[Dict],
93
+ model: str,
94
+ style: str,
95
+ client: Any,
96
+ callback: Callable[[str], Awaitable[None]],
97
+ update_lock: asyncio.Lock
98
+ ) -> Optional[str]:
99
+ """Generate streaming response using OpenAI provider."""
100
+ try:
101
+ from app.main import debug_log
102
+ except ImportError:
103
+ debug_log = lambda msg: None
73
104
 
74
- # Check if client is Ollama
75
- is_ollama = 'ollama' in str(type(client)).lower()
76
- if is_ollama and not title_model_id:
77
- debug_log("Using Ollama client for title generation")
78
- # For Ollama, check if the model exists before using it
79
- try:
80
- # Try a quick test request to check if model exists
81
- debug_log(f"Testing if Ollama model exists: {model}")
82
- import aiohttp
83
- async with aiohttp.ClientSession() as session:
84
- try:
85
- base_url = "http://localhost:11434"
86
- async with session.post(
87
- f"{base_url}/api/generate",
88
- json={"model": model, "prompt": "test", "stream": False},
89
- timeout=2
90
- ) as response:
91
- if response.status == 200:
92
- # Model exists, use it
93
- title_model_id = model
94
- debug_log(f"Ollama model {model} exists, using it for title generation")
95
- else:
96
- debug_log(f"Ollama model {model} returned status {response.status}, falling back to default")
97
- # Fall back to a common model
98
- title_model_id = "llama3"
99
- except Exception as e:
100
- debug_log(f"Error testing Ollama model: {str(e)}, falling back to default")
101
- # Fall back to a common model
102
- title_model_id = "llama3"
103
- except Exception as e:
104
- debug_log(f"Error checking Ollama model: {str(e)}")
105
- # Fall back to a common model
106
- title_model_id = "llama3"
105
+ debug_log(f"Using OpenAI-specific streaming for model: {model}")
107
106
 
108
- # Fallback logic if no specific model was found
109
- if not title_model_id:
110
- # Use a safe default based on client type
111
- if is_openai:
112
- title_model_id = "gpt-3.5-turbo"
113
- elif is_anthropic:
114
- title_model_id = "claude-3-haiku-20240307"
115
- elif is_ollama:
116
- title_model_id = "llama3" # Common default
117
- else:
118
- # Last resort - use the originally passed model
119
- title_model_id = model
120
-
121
- debug_log(f"No specific model found, using fallback model for title generation: {title_model_id}")
107
+ # Initialize variables for response tracking
108
+ full_response = ""
109
+ buffer = []
110
+ last_update = time.time()
111
+ update_interval = 0.03 # Responsive updates for OpenAI
122
112
 
123
- logger.info(f"Generating title for conversation using model: {title_model_id}")
124
- debug_log(f"Final model selected for title generation: {title_model_id}")
113
+ try:
114
+ # Initialize stream generator
115
+ debug_log("Initializing OpenAI stream generator")
116
+ stream_generator = client.generate_stream(messages, model, style)
117
+
118
+ # Process stream chunks
119
+ debug_log("Beginning to process OpenAI stream chunks")
120
+ async for chunk in stream_generator:
121
+ # Check for task cancellation
122
+ if asyncio.current_task().cancelled():
123
+ debug_log("Task cancellation detected during OpenAI chunk processing")
124
+ if hasattr(client, 'cancel_stream'):
125
+ await client.cancel_stream()
126
+ raise asyncio.CancelledError()
127
+
128
+ # Process chunk content
129
+ if chunk:
130
+ if not isinstance(chunk, str):
131
+ try:
132
+ chunk = str(chunk)
133
+ except Exception:
134
+ continue
135
+
136
+ buffer.append(chunk)
137
+ current_time = time.time()
138
+
139
+ # Update UI with new content
140
+ if (current_time - last_update >= update_interval or
141
+ len(''.join(buffer)) > 5 or
142
+ len(full_response) < 50):
143
+
144
+ new_content = ''.join(buffer)
145
+ full_response += new_content
146
+
147
+ try:
148
+ async with update_lock:
149
+ await callback(full_response)
150
+ if hasattr(app, 'refresh'):
151
+ app.refresh(layout=True)
152
+ except Exception as callback_err:
153
+ logger.error(f"Error in OpenAI UI callback: {str(callback_err)}")
154
+
155
+ buffer = []
156
+ last_update = current_time
157
+ await asyncio.sleep(0.02)
158
+
159
+ # Process any remaining buffer content
160
+ if buffer:
161
+ new_content = ''.join(buffer)
162
+ full_response += new_content
163
+
164
+ try:
165
+ async with update_lock:
166
+ await callback(full_response)
167
+ if hasattr(app, 'refresh'):
168
+ app.refresh(layout=True)
169
+ await asyncio.sleep(0.02)
170
+ try:
171
+ messages_container = app.query_one("#messages-container")
172
+ if messages_container:
173
+ messages_container.scroll_end(animate=False)
174
+ except Exception:
175
+ pass
176
+ except Exception as callback_err:
177
+ logger.error(f"Error in final OpenAI UI callback: {str(callback_err)}")
178
+
179
+ # Final refresh to ensure everything is displayed correctly
180
+ try:
181
+ await asyncio.sleep(0.05)
182
+ async with update_lock:
183
+ await callback(full_response)
184
+ if hasattr(app, 'refresh'):
185
+ app.refresh(layout=True)
186
+ except Exception:
187
+ pass
188
+
189
+ return full_response
190
+
191
+ except asyncio.CancelledError:
192
+ logger.info(f"OpenAI streaming cancelled. Partial response length: {len(full_response)}")
193
+ if hasattr(client, 'cancel_stream'):
194
+ await client.cancel_stream()
195
+ return full_response
196
+
197
+ except Exception as e:
198
+ logger.error(f"Error during OpenAI streaming: {str(e)}")
199
+ if hasattr(client, 'cancel_stream'):
200
+ await client.cancel_stream()
201
+ raise
125
202
 
126
- # Create a special prompt for title generation
127
- title_prompt = [
128
- {
129
- "role": "system",
130
- "content": "Generate a brief, descriptive title (maximum 40 characters) for a conversation that starts with the following message. The title should be concise and reflect the main topic or query. Return only the title text with no additional explanation or formatting."
131
- },
132
- {
133
- "role": "user",
134
- "content": message
135
- }
136
- ]
203
+ # Helper function for Anthropic streaming
204
+ async def _generate_anthropic_stream(
205
+ app: 'SimpleChatApp',
206
+ messages: List[Dict],
207
+ model: str,
208
+ style: str,
209
+ client: Any,
210
+ callback: Callable[[str], Awaitable[None]],
211
+ update_lock: asyncio.Lock
212
+ ) -> Optional[str]:
213
+ """Generate streaming response using Anthropic provider."""
214
+ try:
215
+ from app.main import debug_log
216
+ except ImportError:
217
+ debug_log = lambda msg: None
137
218
 
138
- tries = 2 # Number of retries
139
- last_error = None
219
+ debug_log(f"Using Anthropic-specific streaming for model: {model}")
140
220
 
141
- while tries > 0:
142
- try:
143
- debug_log(f"Attempt {3-tries} to generate title")
144
- # First try generate_completion if available
145
- if hasattr(client, 'generate_completion'):
146
- debug_log("Using generate_completion method")
147
- try:
148
- title = await client.generate_completion(
149
- messages=title_prompt,
150
- model=title_model_id,
151
- temperature=0.7,
152
- max_tokens=60 # Titles should be short
153
- )
154
- debug_log(f"Title generated successfully: {title}")
155
- except Exception as completion_error:
156
- debug_log(f"Error in generate_completion: {str(completion_error)}")
157
- raise # Re-raise to be caught by outer try/except
158
- # Fall back to generate_stream if completion not available
159
- elif hasattr(client, 'generate_stream'):
160
- debug_log("Using generate_stream method")
161
- title_chunks = []
162
- try:
163
- async for chunk in client.generate_stream(title_prompt, title_model_id, style=""):
164
- if chunk is not None:
165
- title_chunks.append(chunk)
166
- debug_log(f"Received chunk of length: {len(chunk)}")
221
+ # Initialize variables for response tracking
222
+ full_response = ""
223
+ buffer = []
224
+ last_update = time.time()
225
+ update_interval = 0.03 # Responsive updates for Anthropic
226
+
227
+ try:
228
+ # Initialize stream generator
229
+ debug_log("Initializing Anthropic stream generator")
230
+ stream_generator = client.generate_stream(messages, model, style)
231
+
232
+ # Process stream chunks
233
+ debug_log("Beginning to process Anthropic stream chunks")
234
+ async for chunk in stream_generator:
235
+ # Check for task cancellation
236
+ if asyncio.current_task().cancelled():
237
+ debug_log("Task cancellation detected during Anthropic chunk processing")
238
+ if hasattr(client, 'cancel_stream'):
239
+ await client.cancel_stream()
240
+ raise asyncio.CancelledError()
241
+
242
+ # Process chunk content
243
+ if chunk:
244
+ if not isinstance(chunk, str):
245
+ try:
246
+ chunk = str(chunk)
247
+ except Exception:
248
+ continue
249
+
250
+ buffer.append(chunk)
251
+ current_time = time.time()
252
+
253
+ # Update UI with new content
254
+ if (current_time - last_update >= update_interval or
255
+ len(''.join(buffer)) > 5 or
256
+ len(full_response) < 50):
167
257
 
168
- title = "".join(title_chunks)
169
- debug_log(f"Combined title from chunks: {title}")
258
+ new_content = ''.join(buffer)
259
+ full_response += new_content
170
260
 
171
- # If we didn't get any content, use a default
172
- if not title.strip():
173
- debug_log("Empty title received, using default")
174
- title = f"Conversation ({datetime.now().strftime('%Y-%m-%d %H:%M')})"
175
- except Exception as stream_error:
176
- debug_log(f"Error during title stream processing: {str(stream_error)}")
177
- raise # Re-raise to be caught by outer try/except
178
- else:
179
- debug_log("Client does not support any title generation method")
180
- raise NotImplementedError("Client does not support a suitable method for title generation.")
181
-
182
- # Sanitize and limit the title
183
- title = title.strip().strip('"\'').strip()
184
- if len(title) > 40: # Set a maximum title length
185
- title = title[:37] + "..."
261
+ try:
262
+ async with update_lock:
263
+ await callback(full_response)
264
+ if hasattr(app, 'refresh'):
265
+ app.refresh(layout=True)
266
+ except Exception as callback_err:
267
+ logger.error(f"Error in Anthropic UI callback: {str(callback_err)}")
268
+
269
+ buffer = []
270
+ last_update = current_time
271
+ await asyncio.sleep(0.02)
272
+
273
+ # Process any remaining buffer content
274
+ if buffer:
275
+ new_content = ''.join(buffer)
276
+ full_response += new_content
277
+
278
+ try:
279
+ async with update_lock:
280
+ await callback(full_response)
281
+ if hasattr(app, 'refresh'):
282
+ app.refresh(layout=True)
283
+ await asyncio.sleep(0.02)
284
+ try:
285
+ messages_container = app.query_one("#messages-container")
286
+ if messages_container:
287
+ messages_container.scroll_end(animate=False)
288
+ except Exception:
289
+ pass
290
+ except Exception as callback_err:
291
+ logger.error(f"Error in final Anthropic UI callback: {str(callback_err)}")
186
292
 
187
- logger.info(f"Generated title: {title}")
188
- debug_log(f"Final sanitized title: {title}")
189
- return title # Return successful title
293
+ # Final refresh to ensure everything is displayed correctly
294
+ try:
295
+ await asyncio.sleep(0.05)
296
+ async with update_lock:
297
+ await callback(full_response)
298
+ if hasattr(app, 'refresh'):
299
+ app.refresh(layout=True)
300
+ except Exception:
301
+ pass
190
302
 
191
- except Exception as e:
192
- last_error = str(e)
193
- debug_log(f"Error generating title (tries left: {tries-1}): {last_error}")
194
- logger.error(f"Error generating title (tries left: {tries-1}): {last_error}")
195
- tries -= 1
196
- if tries > 0: # Only sleep if there are more retries
197
- await asyncio.sleep(1) # Small delay before retry
198
-
199
- # If all retries fail, log the error and return a default title
200
- debug_log(f"Failed to generate title after multiple retries. Using default title.")
201
- logger.error(f"Failed to generate title after multiple retries. Last error: {last_error}")
202
- return f"Conversation ({datetime.now().strftime('%Y-%m-%d %H:%M')})"
303
+ return full_response
304
+
305
+ except asyncio.CancelledError:
306
+ logger.info(f"Anthropic streaming cancelled. Partial response length: {len(full_response)}")
307
+ if hasattr(client, 'cancel_stream'):
308
+ await client.cancel_stream()
309
+ return full_response
310
+
311
+ except Exception as e:
312
+ logger.error(f"Error during Anthropic streaming: {str(e)}")
313
+ if hasattr(client, 'cancel_stream'):
314
+ await client.cancel_stream()
315
+ raise
203
316
 
204
- # Worker function for streaming response generation
205
- async def generate_streaming_response(
317
+ # Helper function for Ollama streaming
318
+ async def _generate_ollama_stream(
206
319
  app: 'SimpleChatApp',
207
320
  messages: List[Dict],
208
321
  model: str,
209
322
  style: str,
210
323
  client: Any,
211
- callback: Callable[[str], Awaitable[None]]
324
+ callback: Callable[[str], Awaitable[None]],
325
+ update_lock: asyncio.Lock
212
326
  ) -> Optional[str]:
213
- """
214
- Generate a streaming response from the model (as a Textual worker).
215
- Refactored to be a coroutine, not an async generator.
216
- """
327
+ """Generate streaming response using Ollama provider."""
217
328
  try:
218
329
  from app.main import debug_log
219
330
  except ImportError:
220
331
  debug_log = lambda msg: None
221
-
222
- logger.info(f"Starting streaming response with model: {model}")
223
- debug_log(f"Starting streaming response with model: '{model}', client type: {type(client).__name__}")
224
-
225
- # Validate messages
226
- if not messages:
227
- debug_log("Error: messages list is empty")
228
- raise ValueError("Messages list cannot be empty")
229
-
230
- # Ensure all messages have required fields
231
- for i, msg in enumerate(messages):
232
- try:
233
- debug_log(f"Message {i}: role={msg.get('role', 'missing')}, content_len={len(msg.get('content', ''))}")
234
- if 'role' not in msg:
235
- debug_log(f"Adding missing 'role' to message {i}")
236
- msg['role'] = 'user'
237
- if 'content' not in msg:
238
- debug_log(f"Adding missing 'content' to message {i}")
239
- msg['content'] = ''
240
- except Exception as e:
241
- debug_log(f"Error checking message {i}: {str(e)}")
242
- messages[i] = {
243
- 'role': 'user',
244
- 'content': str(msg) if msg else ''
245
- }
246
- debug_log(f"Repaired message {i}")
247
-
332
+
333
+ debug_log(f"Using Ollama-specific streaming for model: {model}")
334
+
248
335
  # Initialize variables for response tracking
249
336
  full_response = ""
250
337
  buffer = []
251
338
  last_update = time.time()
252
- update_interval = 0.05 # Reduced interval for more frequent updates
253
-
339
+ update_interval = 0.03 # Responsive updates for Ollama
340
+
254
341
  try:
255
- # Validate client
256
- if client is None:
257
- debug_log("Error: client is None, cannot proceed with streaming")
258
- raise ValueError("Model client is None, cannot proceed with streaming")
259
-
260
- if not hasattr(client, 'generate_stream'):
261
- debug_log(f"Error: client {type(client).__name__} does not have generate_stream method")
262
- raise ValueError(f"Client {type(client).__name__} does not support streaming")
263
-
264
- # Determine client type
265
- is_ollama = 'ollama' in str(type(client)).lower()
266
- is_openai = 'openai' in str(type(client)).lower()
267
- is_anthropic = 'anthropic' in str(type(client)).lower()
268
-
269
- debug_log(f"Client types - Ollama: {is_ollama}, OpenAI: {is_openai}, Anthropic: {is_anthropic}")
270
-
271
- # Only show loading indicator for Ollama (which may need to load models)
272
- # This prevents Ollama-specific UI elements from showing when using other providers
273
- if is_ollama and hasattr(app, 'query_one'):
342
+ # Show loading indicator for Ollama (which may need to load models)
343
+ if hasattr(app, 'query_one'):
274
344
  try:
275
345
  debug_log("Showing initial model loading indicator for Ollama")
276
- logger.info("Showing initial model loading indicator for Ollama")
277
346
  loading = app.query_one("#loading-indicator")
278
347
  loading.add_class("model-loading")
279
348
  loading.update("⚙️ Loading Ollama model...")
280
349
  except Exception as e:
281
350
  debug_log(f"Error setting initial Ollama loading state: {str(e)}")
282
- logger.error(f"Error setting initial Ollama loading state: {str(e)}")
283
-
284
- debug_log(f"Starting stream generation with messages length: {len(messages)}")
285
- logger.info(f"Starting stream generation for model: {model}")
286
-
351
+
287
352
  # Initialize stream generator
288
- try:
289
- debug_log("Calling client.generate_stream()")
290
- stream_generator = client.generate_stream(messages, model, style)
291
- debug_log("Successfully obtained stream generator")
292
- except Exception as stream_init_error:
293
- debug_log(f"Error initializing stream generator: {str(stream_init_error)}")
294
- logger.error(f"Error initializing stream generator: {str(stream_init_error)}")
295
- raise
296
-
297
- # Update UI if model is ready (Ollama specific)
298
- # Only check is_loading_model for Ollama clients to prevent errors with other providers
299
- if is_ollama and hasattr(client, 'is_loading_model') and not client.is_loading_model() and hasattr(app, 'query_one'):
353
+ debug_log("Initializing Ollama stream generator")
354
+ stream_generator = client.generate_stream(messages, model, style)
355
+
356
+ # Update UI if model is ready
357
+ if hasattr(client, 'is_loading_model') and not client.is_loading_model() and hasattr(app, 'query_one'):
300
358
  try:
301
359
  debug_log("Ollama model is ready for generation, updating UI")
302
- logger.info("Ollama model is ready for generation, updating UI")
303
360
  loading = app.query_one("#loading-indicator")
304
361
  loading.remove_class("model-loading")
305
362
  loading.update("▪▪▪ Generating response...")
306
363
  except Exception as e:
307
- debug_log(f"Error updating UI after stream init: {str(e)}")
308
- logger.error(f"Error updating UI after stream init: {str(e)}")
309
-
364
+ debug_log(f"Error updating UI after Ollama stream init: {str(e)}")
365
+
310
366
  # Process stream chunks
311
- debug_log("Beginning to process stream chunks")
312
- try:
313
- async for chunk in stream_generator:
314
- # Check for task cancellation
315
- if asyncio.current_task().cancelled():
316
- debug_log("Task cancellation detected during chunk processing")
317
- logger.info("Task cancellation detected during chunk processing")
318
- if hasattr(client, 'cancel_stream'):
319
- debug_log("Calling client.cancel_stream() due to task cancellation")
320
- await client.cancel_stream()
321
- raise asyncio.CancelledError()
322
-
323
- # Handle Ollama model loading state changes - only for Ollama clients
324
- if is_ollama and hasattr(client, 'is_loading_model'):
325
- try:
326
- model_loading = client.is_loading_model()
327
- debug_log(f"Ollama model loading state: {model_loading}")
328
- if hasattr(app, 'query_one'):
329
- try:
330
- loading = app.query_one("#loading-indicator")
331
- if model_loading and hasattr(loading, 'has_class') and not loading.has_class("model-loading"):
332
- debug_log("Ollama model loading started during streaming")
333
- logger.info("Ollama model loading started during streaming")
334
- loading.add_class("model-loading")
335
- loading.update("⚙️ Loading Ollama model...")
336
- elif not model_loading and hasattr(loading, 'has_class') and loading.has_class("model-loading"):
337
- debug_log("Ollama model loading finished during streaming")
338
- logger.info("Ollama model loading finished during streaming")
339
- loading.remove_class("model-loading")
340
- loading.update("▪▪▪ Generating response...")
341
- except Exception as ui_e:
342
- debug_log(f"Error updating UI elements: {str(ui_e)}")
343
- logger.error(f"Error updating UI elements: {str(ui_e)}")
344
- except Exception as e:
345
- debug_log(f"Error checking Ollama model loading state: {str(e)}")
346
- logger.error(f"Error checking Ollama model loading state: {str(e)}")
347
-
348
- # Process chunk content
349
- if chunk:
350
- if not isinstance(chunk, str):
351
- debug_log(f"WARNING: Received non-string chunk of type: {type(chunk).__name__}")
367
+ debug_log("Beginning to process Ollama stream chunks")
368
+ async for chunk in stream_generator:
369
+ # Check for task cancellation
370
+ if asyncio.current_task().cancelled():
371
+ debug_log("Task cancellation detected during Ollama chunk processing")
372
+ if hasattr(client, 'cancel_stream'):
373
+ await client.cancel_stream()
374
+ raise asyncio.CancelledError()
375
+
376
+ # Handle Ollama model loading state changes
377
+ if hasattr(client, 'is_loading_model'):
378
+ try:
379
+ model_loading = client.is_loading_model()
380
+ if hasattr(app, 'query_one'):
352
381
  try:
353
- chunk = str(chunk)
354
- debug_log(f"Successfully converted chunk to string, length: {len(chunk)}")
355
- except Exception as e:
356
- debug_log(f"Error converting chunk to string: {str(e)}")
357
- continue
358
-
359
- debug_log(f"Received chunk of length: {len(chunk)}")
360
- buffer.append(chunk)
361
- current_time = time.time()
362
-
363
- # Update UI with new content
364
- # Always update immediately for the first few chunks for better responsiveness
365
- if (current_time - last_update >= update_interval or
366
- len(''.join(buffer)) > 5 or # Reduced buffer size threshold
367
- len(full_response) < 50): # More aggressive updates for early content
368
-
369
- new_content = ''.join(buffer)
370
- full_response += new_content
371
- debug_log(f"Updating UI with content length: {len(full_response)}")
372
-
373
- # Enhanced debug logging
374
- print(f"STREAM DEBUG: +{len(new_content)} chars, total: {len(full_response)}")
375
- # Print first few characters of content for debugging
376
- if len(full_response) < 100:
377
- print(f"STREAM CONTENT: '{full_response}'")
382
+ loading = app.query_one("#loading-indicator")
383
+ if model_loading and hasattr(loading, 'has_class') and not loading.has_class("model-loading"):
384
+ debug_log("Ollama model loading started during streaming")
385
+ loading.add_class("model-loading")
386
+ loading.update("⚙️ Loading Ollama model...")
387
+ elif not model_loading and hasattr(loading, 'has_class') and loading.has_class("model-loading"):
388
+ debug_log("Ollama model loading finished during streaming")
389
+ loading.remove_class("model-loading")
390
+ loading.update("▪▪▪ Generating response...")
391
+ except Exception:
392
+ pass
393
+ except Exception:
394
+ pass
395
+
396
+ # Process chunk content
397
+ if chunk:
398
+ if not isinstance(chunk, str):
399
+ try:
400
+ chunk = str(chunk)
401
+ except Exception:
402
+ continue
378
403
 
379
- try:
380
- # Call the UI callback with the full response so far
381
- debug_log("Calling UI callback with content")
404
+ buffer.append(chunk)
405
+ current_time = time.time()
406
+
407
+ # Update UI with new content
408
+ if (current_time - last_update >= update_interval or
409
+ len(''.join(buffer)) > 5 or
410
+ len(full_response) < 50):
411
+
412
+ new_content = ''.join(buffer)
413
+ full_response += new_content
414
+
415
+ try:
416
+ async with update_lock:
382
417
  await callback(full_response)
383
- debug_log("UI callback completed successfully")
384
-
385
- # Force app refresh after each update
386
418
  if hasattr(app, 'refresh'):
387
- debug_log("Forcing app refresh")
388
- app.refresh(layout=True) # Force layout refresh
389
- except Exception as callback_err:
390
- debug_log(f"Error in UI callback: {str(callback_err)}")
391
- logger.error(f"Error in UI callback: {str(callback_err)}")
392
- print(f"STREAM ERROR: Error updating UI: {str(callback_err)}")
393
-
394
- buffer = []
395
- last_update = current_time
419
+ app.refresh(layout=True)
420
+ except Exception as callback_err:
421
+ logger.error(f"Error in Ollama UI callback: {str(callback_err)}")
396
422
 
397
- # Shorter sleep between updates for more responsive streaming
398
- await asyncio.sleep(0.02)
399
- except asyncio.CancelledError:
400
- debug_log("CancelledError in stream processing")
401
- raise
402
- except Exception as chunk_error:
403
- debug_log(f"Error processing stream chunks: {str(chunk_error)}")
404
- logger.error(f"Error processing stream chunks: {str(chunk_error)}")
405
- raise
406
-
423
+ buffer = []
424
+ last_update = current_time
425
+ await asyncio.sleep(0.02)
426
+
427
+ # Process any remaining buffer content
407
428
  if buffer:
408
429
  new_content = ''.join(buffer)
409
430
  full_response += new_content
410
- debug_log(f"Sending final content, total length: {len(full_response)}")
431
+
411
432
  try:
412
- await callback(full_response)
413
- debug_log("Final UI callback completed successfully")
414
-
415
- debug_log("Forcing final UI refresh sequence for all models")
416
- try:
433
+ async with update_lock:
434
+ await callback(full_response)
417
435
  if hasattr(app, 'refresh'):
418
- app.refresh(layout=False)
436
+ app.refresh(layout=True)
419
437
  await asyncio.sleep(0.02)
420
438
  try:
421
439
  messages_container = app.query_one("#messages-container")
422
- if messages_container and hasattr(messages_container, 'scroll_end'):
440
+ if messages_container:
423
441
  messages_container.scroll_end(animate=False)
424
442
  except Exception:
425
443
  pass
444
+ except Exception as callback_err:
445
+ logger.error(f"Error in final Ollama UI callback: {str(callback_err)}")
446
+
447
+ # Final refresh to ensure everything is displayed correctly
448
+ try:
449
+ await asyncio.sleep(0.05)
450
+ async with update_lock:
451
+ await callback(full_response)
452
+ if hasattr(app, 'refresh'):
453
+ app.refresh(layout=True)
454
+ except Exception:
455
+ pass
456
+
457
+ return full_response
458
+
459
+ except asyncio.CancelledError:
460
+ logger.info(f"Ollama streaming cancelled. Partial response length: {len(full_response)}")
461
+ if hasattr(client, 'cancel_stream'):
462
+ await client.cancel_stream()
463
+ return full_response
464
+
465
+ except Exception as e:
466
+ logger.error(f"Error during Ollama streaming: {str(e)}")
467
+ if hasattr(client, 'cancel_stream'):
468
+ await client.cancel_stream()
469
+ raise
470
+
471
+ # Generic fallback streaming implementation
472
+ async def _generate_generic_stream(
473
+ app: 'SimpleChatApp',
474
+ messages: List[Dict],
475
+ model: str,
476
+ style: str,
477
+ client: Any,
478
+ callback: Callable[[str], Awaitable[None]],
479
+ update_lock: asyncio.Lock
480
+ ) -> Optional[str]:
481
+ """Generic fallback implementation for streaming responses."""
482
+ try:
483
+ from app.main import debug_log
484
+ except ImportError:
485
+ debug_log = lambda msg: None
486
+
487
+ debug_log(f"Using generic streaming for model: {model}, client type: {type(client).__name__}")
488
+
489
+ # Initialize variables for response tracking
490
+ full_response = ""
491
+ buffer = []
492
+ last_update = time.time()
493
+ update_interval = 0.03 # Responsive updates
494
+
495
+ try:
496
+ # Initialize stream generator
497
+ debug_log("Initializing generic stream generator")
498
+ stream_generator = client.generate_stream(messages, model, style)
499
+
500
+ # Process stream chunks
501
+ debug_log("Beginning to process generic stream chunks")
502
+ async for chunk in stream_generator:
503
+ # Check for task cancellation
504
+ if asyncio.current_task().cancelled():
505
+ debug_log("Task cancellation detected during generic chunk processing")
506
+ if hasattr(client, 'cancel_stream'):
507
+ await client.cancel_stream()
508
+ raise asyncio.CancelledError()
509
+
510
+ # Process chunk content
511
+ if chunk:
512
+ if not isinstance(chunk, str):
513
+ try:
514
+ chunk = str(chunk)
515
+ except Exception:
516
+ continue
517
+
518
+ buffer.append(chunk)
519
+ current_time = time.time()
520
+
521
+ # Update UI with new content
522
+ if (current_time - last_update >= update_interval or
523
+ len(''.join(buffer)) > 5 or
524
+ len(full_response) < 50):
525
+
526
+ new_content = ''.join(buffer)
527
+ full_response += new_content
528
+
529
+ try:
530
+ async with update_lock:
531
+ await callback(full_response)
532
+ if hasattr(app, 'refresh'):
533
+ app.refresh(layout=True)
534
+ except Exception as callback_err:
535
+ logger.error(f"Error in generic UI callback: {str(callback_err)}")
536
+
537
+ buffer = []
538
+ last_update = current_time
539
+ await asyncio.sleep(0.02)
540
+
541
+ # Process any remaining buffer content
542
+ if buffer:
543
+ new_content = ''.join(buffer)
544
+ full_response += new_content
545
+
546
+ try:
547
+ async with update_lock:
548
+ await callback(full_response)
549
+ if hasattr(app, 'refresh'):
426
550
  app.refresh(layout=True)
427
551
  await asyncio.sleep(0.02)
428
552
  try:
429
553
  messages_container = app.query_one("#messages-container")
430
- if messages_container and hasattr(messages_container, 'scroll_end'):
554
+ if messages_container:
431
555
  messages_container.scroll_end(animate=False)
432
556
  except Exception:
433
557
  pass
434
- except Exception as refresh_err:
435
- debug_log(f"Error forcing final UI refresh: {str(refresh_err)}")
436
558
  except Exception as callback_err:
437
- debug_log(f"Error in final UI callback: {str(callback_err)}")
438
- logger.error(f"Error in final UI callback: {str(callback_err)}")
439
-
559
+ logger.error(f"Error in final generic UI callback: {str(callback_err)}")
560
+
561
+ # Final refresh to ensure everything is displayed correctly
440
562
  try:
441
563
  await asyncio.sleep(0.05)
442
- debug_log("Sending one final callback to ensure UI refresh")
443
- await callback(full_response)
444
- if hasattr(app, 'refresh'):
445
- app.refresh(layout=True)
446
- except Exception as final_err:
447
- debug_log(f"Error in final extra callback: {str(final_err)}")
448
-
449
- debug_log(f"Streaming response completed successfully. Response length: {len(full_response)}")
450
- logger.info(f"Streaming response completed successfully. Response length: {len(full_response)}")
564
+ async with update_lock:
565
+ await callback(full_response)
566
+ if hasattr(app, 'refresh'):
567
+ app.refresh(layout=True)
568
+ except Exception:
569
+ pass
570
+
451
571
  return full_response
452
-
572
+
453
573
  except asyncio.CancelledError:
454
- debug_log(f"Streaming response task cancelled. Partial response length: {len(full_response)}")
455
- logger.info(f"Streaming response task cancelled. Partial response length: {len(full_response)}")
574
+ logger.info(f"Generic streaming cancelled. Partial response length: {len(full_response)}")
456
575
  if hasattr(client, 'cancel_stream'):
457
- debug_log("Calling client.cancel_stream() after cancellation")
458
- try:
459
- await client.cancel_stream()
460
- debug_log("Successfully cancelled client stream")
461
- except Exception as cancel_err:
462
- debug_log(f"Error cancelling client stream: {str(cancel_err)}")
576
+ await client.cancel_stream()
463
577
  return full_response
464
-
578
+
465
579
  except Exception as e:
466
- debug_log(f"Error during streaming response: {str(e)}")
467
- logger.error(f"Error during streaming response: {str(e)}")
580
+ logger.error(f"Error during generic streaming: {str(e)}")
468
581
  if hasattr(client, 'cancel_stream'):
469
- debug_log("Attempting to cancel client stream after error")
470
- try:
471
- await client.cancel_stream()
472
- debug_log("Successfully cancelled client stream after error")
473
- except Exception as cancel_err:
474
- debug_log(f"Error cancelling client stream after error: {str(cancel_err)}")
582
+ await client.cancel_stream()
475
583
  raise
476
584
 
477
- finally:
478
- debug_log("generate_streaming_response worker finished or errored.")
479
- if 'full_response' in locals():
480
- return full_response
481
- return None
585
+ # Worker function for streaming response generation
586
+ async def generate_streaming_response(
587
+ app: 'SimpleChatApp',
588
+ messages: List[Dict],
589
+ model: str,
590
+ style: str,
591
+ client: Any,
592
+ callback: Callable[[str], Awaitable[None]]
593
+ ) -> Optional[str]:
594
+ """
595
+ Generate a streaming response from the model (as a Textual worker).
596
+ Refactored to be a coroutine, not an async generator.
597
+ """
598
+ try:
599
+ from app.main import debug_log
600
+ except ImportError:
601
+ debug_log = lambda msg: None
602
+
603
+ logger.info(f"Starting streaming response with model: {model}")
604
+ debug_log(f"Starting streaming response with model: '{model}', client type: {type(client).__name__}")
605
+
606
+ # Validate messages
607
+ if not messages:
608
+ debug_log("Error: messages list is empty")
609
+ raise ValueError("Messages list cannot be empty")
610
+
611
+ # Ensure all messages have required fields
612
+ for i, msg in enumerate(messages):
613
+ try:
614
+ debug_log(f"Message {i}: role={msg.get('role', 'missing')}, content_len={len(msg.get('content', ''))}")
615
+ if 'role' not in msg:
616
+ debug_log(f"Adding missing 'role' to message {i}")
617
+ msg['role'] = 'user'
618
+ if 'content' not in msg:
619
+ debug_log(f"Adding missing 'content' to message {i}")
620
+ msg['content'] = ''
621
+ except Exception as e:
622
+ debug_log(f"Error checking message {i}: {str(e)}")
623
+ messages[i] = {
624
+ 'role': 'user',
625
+ 'content': str(msg) if msg else ''
626
+ }
627
+ debug_log(f"Repaired message {i}")
628
+
629
+ # Create a lock for synchronizing UI updates
630
+ update_lock = asyncio.Lock()
631
+
632
+ # Validate client
633
+ if client is None:
634
+ debug_log("Error: client is None, cannot proceed with streaming")
635
+ raise ValueError("Model client is None, cannot proceed with streaming")
636
+
637
+ if not hasattr(client, 'generate_stream'):
638
+ debug_log(f"Error: client {type(client).__name__} does not have generate_stream method")
639
+ raise ValueError(f"Client {type(client).__name__} does not support streaming")
640
+
641
+ # Explicitly check provider type first
642
+ is_ollama = 'ollama' in str(type(client)).lower()
643
+ is_openai = 'openai' in str(type(client)).lower()
644
+ is_anthropic = 'anthropic' in str(type(client)).lower()
645
+
646
+ debug_log(f"Client types - Ollama: {is_ollama}, OpenAI: {is_openai}, Anthropic: {is_anthropic}")
647
+
648
+ # Use separate implementations for each provider
649
+ try:
650
+ if is_openai:
651
+ debug_log("Using OpenAI-specific streaming implementation")
652
+ return await _generate_openai_stream(app, messages, model, style, client, callback, update_lock)
653
+ elif is_anthropic:
654
+ debug_log("Using Anthropic-specific streaming implementation")
655
+ return await _generate_anthropic_stream(app, messages, model, style, client, callback, update_lock)
656
+ elif is_ollama:
657
+ debug_log("Using Ollama-specific streaming implementation")
658
+ return await _generate_ollama_stream(app, messages, model, style, client, callback, update_lock)
659
+ else:
660
+ # Generic fallback
661
+ debug_log("Using generic streaming implementation")
662
+ return await _generate_generic_stream(app, messages, model, style, client, callback, update_lock)
663
+ except asyncio.CancelledError:
664
+ debug_log("Task cancellation detected in main streaming function")
665
+ if hasattr(client, 'cancel_stream'):
666
+ await client.cancel_stream()
667
+ raise
668
+ except Exception as e:
669
+ debug_log(f"Error in streaming implementation: {str(e)}")
670
+ logger.error(f"Error in streaming implementation: {str(e)}")
671
+ raise
482
672
 
483
673
  async def ensure_ollama_running() -> bool:
484
674
  """
@@ -555,6 +745,22 @@ def resolve_model_id(model_id_or_name: str) -> str:
555
745
  input_lower = model_id_or_name.lower().strip()
556
746
  logger.info(f"Attempting to resolve model identifier: '{input_lower}'")
557
747
 
748
+ # Add special case handling for common OpenAI models
749
+ openai_model_aliases = {
750
+ "04-mini": "gpt-4-mini", # Fix "04-mini" typo to "gpt-4-mini"
751
+ "04": "gpt-4",
752
+ "04-vision": "gpt-4-vision",
753
+ "04-turbo": "gpt-4-turbo",
754
+ "035": "gpt-3.5-turbo",
755
+ "35-turbo": "gpt-3.5-turbo",
756
+ "35": "gpt-3.5-turbo"
757
+ }
758
+
759
+ if input_lower in openai_model_aliases:
760
+ resolved = openai_model_aliases[input_lower]
761
+ logger.info(f"Resolved '{input_lower}' to '{resolved}' via OpenAI model alias")
762
+ return resolved
763
+
558
764
  # Special case handling for common typos and model name variations
559
765
  typo_corrections = {
560
766
  "o4-mini": "04-mini",