chat-console 0.2.99__tar.gz → 0.3.0__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {chat_console-0.2.99 → chat_console-0.3.0}/PKG-INFO +1 -1
- {chat_console-0.2.99 → chat_console-0.3.0}/app/__init__.py +1 -1
- {chat_console-0.2.99 → chat_console-0.3.0}/app/api/anthropic.py +96 -72
- {chat_console-0.2.99 → chat_console-0.3.0}/app/api/base.py +2 -2
- {chat_console-0.2.99 → chat_console-0.3.0}/app/api/ollama.py +21 -10
- {chat_console-0.2.99 → chat_console-0.3.0}/app/api/openai.py +71 -24
- {chat_console-0.2.99 → chat_console-0.3.0}/app/main.py +55 -14
- {chat_console-0.2.99 → chat_console-0.3.0}/app/ui/chat_interface.py +43 -4
- {chat_console-0.2.99 → chat_console-0.3.0}/app/ui/model_selector.py +24 -11
- {chat_console-0.2.99 → chat_console-0.3.0}/app/utils.py +65 -11
- {chat_console-0.2.99 → chat_console-0.3.0}/chat_console.egg-info/PKG-INFO +1 -1
- {chat_console-0.2.99 → chat_console-0.3.0}/LICENSE +0 -0
- {chat_console-0.2.99 → chat_console-0.3.0}/README.md +0 -0
- {chat_console-0.2.99 → chat_console-0.3.0}/app/api/__init__.py +0 -0
- {chat_console-0.2.99 → chat_console-0.3.0}/app/config.py +0 -0
- {chat_console-0.2.99 → chat_console-0.3.0}/app/database.py +0 -0
- {chat_console-0.2.99 → chat_console-0.3.0}/app/models.py +0 -0
- {chat_console-0.2.99 → chat_console-0.3.0}/app/ui/__init__.py +0 -0
- {chat_console-0.2.99 → chat_console-0.3.0}/app/ui/chat_list.py +0 -0
- {chat_console-0.2.99 → chat_console-0.3.0}/app/ui/model_browser.py +0 -0
- {chat_console-0.2.99 → chat_console-0.3.0}/app/ui/search.py +0 -0
- {chat_console-0.2.99 → chat_console-0.3.0}/app/ui/styles.py +0 -0
- {chat_console-0.2.99 → chat_console-0.3.0}/chat_console.egg-info/SOURCES.txt +0 -0
- {chat_console-0.2.99 → chat_console-0.3.0}/chat_console.egg-info/dependency_links.txt +0 -0
- {chat_console-0.2.99 → chat_console-0.3.0}/chat_console.egg-info/entry_points.txt +0 -0
- {chat_console-0.2.99 → chat_console-0.3.0}/chat_console.egg-info/requires.txt +0 -0
- {chat_console-0.2.99 → chat_console-0.3.0}/chat_console.egg-info/top_level.txt +0 -0
- {chat_console-0.2.99 → chat_console-0.3.0}/setup.cfg +0 -0
- {chat_console-0.2.99 → chat_console-0.3.0}/setup.py +0 -0
{chat_console-0.2.99 → chat_console-0.3.0}/PKG-INFO
@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: chat-console
-Version: 0.2.99
+Version: 0.3.0
 Summary: A command-line interface for chatting with LLMs, storing chats and (future) rag interactions
 Home-page: https://github.com/wazacraftrfid/chat-console
 Author: Johnathan Greenaway

{chat_console-0.2.99 → chat_console-0.3.0}/app/api/anthropic.py
@@ -144,86 +144,110 @@ class AnthropicClient(BaseModelClient):
        except ImportError:
            debug_log = lambda msg: None
 
+        # Always include a reliable fallback list in case API calls fail
+        fallback_models = [
+            {"id": "claude-3-opus-20240229", "name": "Claude 3 Opus"},
+            {"id": "claude-3-sonnet-20240229", "name": "Claude 3 Sonnet"},
+            {"id": "claude-3-haiku-20240307", "name": "Claude 3 Haiku"},
+            {"id": "claude-3-5-sonnet-20240620", "name": "Claude 3.5 Sonnet"},
+            {"id": "claude-3-7-sonnet-20250219", "name": "Claude 3.7 Sonnet"},
+        ]
+
+        # If no client is initialized, return fallback immediately
+        if not self.client:
+            debug_log("Anthropic: No client initialized, using fallback models")
+            return fallback_models
+
        try:
            debug_log("Anthropic: Fetching models from API...")
-            # …
+
+            # Try using the models.list method if available in newer SDK versions
+            if hasattr(self.client, 'models') and hasattr(self.client.models, 'list'):
+                try:
+                    debug_log("Anthropic: Using client.models.list() method")
+                    models_response = await self.client.models.list()
+                    if hasattr(models_response, 'data') and isinstance(models_response.data, list):
+                        formatted_models = [
+                            {"id": model.id, "name": getattr(model, "name", model.id)}
+                            for model in models_response.data
+                        ]
+                        debug_log(f"Anthropic: Found {len(formatted_models)} models via SDK")
+                        return formatted_models
+                except Exception as sdk_err:
+                    debug_log(f"Anthropic: Error using models.list(): {str(sdk_err)}")
+                    # Continue to next method
+
+            # Try direct HTTP request if client exposes the underlying HTTP client
            if hasattr(self.client, '_client') and hasattr(self.client._client, 'get'):
-                …
+                try:
+                    debug_log("Anthropic: Using direct HTTP request to /v1/models")
+                    response = await self.client._client.get(
+                        "/v1/models",
+                        headers={"anthropic-version": "2023-06-01"}
+                    )
+                    response.raise_for_status()
+                    models_data = response.json()
+
+                    if 'data' in models_data and isinstance(models_data['data'], list):
+                        formatted_models = [
+                            {"id": model.get("id"), "name": model.get("display_name", model.get("id"))}
+                            for model in models_data['data']
+                            if model.get("id")
+                        ]
+                        debug_log(f"Anthropic: Found {len(formatted_models)} models via HTTP request")
+                        return formatted_models
+                    else:
+                        debug_log("Anthropic: Unexpected API response format")
+                except Exception as http_err:
+                    debug_log(f"Anthropic: HTTP request error: {str(http_err)}")
+                    # Continue to fallback
+
+            # If we reach here, both methods failed
+            debug_log("Anthropic: All API methods failed, using fallback models")
+            return fallback_models
 
        except Exception as e:
            debug_log(f"Anthropic: Failed to fetch models from API: {str(e)}")
-
-            # Include Claude 3.7 Sonnet with the correct full ID
-            fallback_models = [
-                {"id": "claude-3-opus-20240229", "name": "Claude 3 Opus"},
-                {"id": "claude-3-sonnet-20240229", "name": "Claude 3 Sonnet"},
-                {"id": "claude-3-haiku-20240307", "name": "Claude 3 Haiku"},
-                {"id": "claude-3-5-sonnet-20240620", "name": "Claude 3.5 Sonnet"},
-                {"id": "claude-3-7-sonnet-20250219", "name": "Claude 3.7 Sonnet"},  # Add Claude 3.7 Sonnet
-            ]
-            debug_log("Anthropic: Using fallback model list:")
-            for model in fallback_models:
-                debug_log(f"  - ID: {model['id']}, Name: {model['name']}")
+            debug_log("Anthropic: Using fallback model list")
            return fallback_models
 
-    # Keep this synchronous for now, but make it call the async fetcher
-    # Note: This is slightly awkward. Ideally, config loading would be async.
-    # For now, we'll run the async fetcher within the sync method using asyncio.run()
-    # This is NOT ideal for performance but avoids larger refactoring of config loading.
    def get_available_models(self) -> List[Dict[str, Any]]:
        """Get list of available Claude models by fetching from API."""
+        # Reliable fallback list that doesn't depend on async operations
+        fallback_models = [
+            {"id": "claude-3-opus-20240229", "name": "Claude 3 Opus"},
+            {"id": "claude-3-sonnet-20240229", "name": "Claude 3 Sonnet"},
+            {"id": "claude-3-haiku-20240307", "name": "Claude 3 Haiku"},
+            {"id": "claude-3-5-sonnet-20240620", "name": "Claude 3.5 Sonnet"},
+            {"id": "claude-3-7-sonnet-20250219", "name": "Claude 3.7 Sonnet"},
+        ]
+
        try:
-            # …
+            # Check if we're already in an event loop
+            try:
+                loop = asyncio.get_running_loop()
+                in_loop = True
+            except RuntimeError:
+                in_loop = False
+
+            if in_loop:
+                # We're already in an event loop, create a future
+                try:
+                    from app.main import debug_log
+                except ImportError:
+                    debug_log = lambda msg: None
+
+                debug_log("Anthropic: Already in event loop, using fallback models")
+                return fallback_models
+            else:
+                # Not in an event loop, we can use asyncio.run
+                models = asyncio.run(self._fetch_models_from_api())
+                return models
+        except Exception as e:
+            try:
+                from app.main import debug_log
+            except ImportError:
+                debug_log = lambda msg: None
+
+            debug_log(f"Anthropic: Error in get_available_models: {str(e)}")
+            return fallback_models

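
The rewritten get_available_models() above hinges on one guard: asyncio.run() is only safe when no event loop is already running, otherwise the method falls back to the static list. A minimal standalone sketch of that guard follows; fetch_models() and FALLBACK are illustrative stand-ins, not the package's own names.

import asyncio
from typing import Any, Dict, List

# Illustrative fallback list; the real one lives inside AnthropicClient.
FALLBACK: List[Dict[str, Any]] = [{"id": "claude-3-haiku-20240307", "name": "Claude 3 Haiku"}]

async def fetch_models() -> List[Dict[str, Any]]:
    # Stand-in for the real async API call.
    await asyncio.sleep(0)
    return [{"id": "claude-3-opus-20240229", "name": "Claude 3 Opus"}]

def get_models_sync() -> List[Dict[str, Any]]:
    try:
        asyncio.get_running_loop()
    except RuntimeError:
        # No loop running: safe to drive the coroutine to completion ourselves.
        return asyncio.run(fetch_models())
    # A loop is already running (e.g. inside the TUI): asyncio.run() would
    # raise, so return the static fallback instead of blocking the loop.
    return FALLBACK

if __name__ == "__main__":
    print(get_models_sync())
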
{chat_console-0.2.99 → chat_console-0.3.0}/app/api/base.py
@@ -120,8 +120,8 @@ class BaseModelClient(ABC):
        if provider == "ollama":
            return await OllamaClient.create()
        elif provider == "openai":
-            return OpenAIClient()
+            return await OpenAIClient.create()
        elif provider == "anthropic":
-            return AnthropicClient()
+            return await AnthropicClient.create()
        else:
            raise ValueError(f"Unknown provider: {provider}")

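
base.py now awaits a create() factory for every provider instead of calling the constructor directly, which lets a client finish async setup before it is handed back. A generic sketch of that async-factory pattern, with ExampleClient and _initialize() invented here for illustration:

import asyncio

class ExampleClient:
    def __init__(self) -> None:
        self.ready = False

    @classmethod
    async def create(cls) -> "ExampleClient":
        # Build the instance, then run any async initialisation
        # (connection checks, key validation, model discovery, ...).
        self = cls()
        await self._initialize()
        return self

    async def _initialize(self) -> None:
        await asyncio.sleep(0)  # placeholder for real async setup
        self.ready = True

async def main() -> None:
    client = await ExampleClient.create()
    print("client ready:", client.ready)

if __name__ == "__main__":
    asyncio.run(main())
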
{chat_console-0.2.99 → chat_console-0.3.0}/app/api/ollama.py
@@ -369,6 +369,10 @@ class OllamaClient(BaseModelClient):
 
                    # Use a simpler async iteration pattern that's less error-prone
                    debug_log("Starting to process response stream")
+
+                    # Set a flag to track if we've yielded any content
+                    has_yielded_content = False
+
                    async for line in response.content:
                        # Check cancellation periodically
                        if self._active_stream_session is None:
@@ -378,31 +382,38 @@ class OllamaClient(BaseModelClient):
                        try:
                            # Process the chunk
                            if line:
-                                chunk = line.decode().strip()
                                chunk_str = line.decode().strip()
                                # Check if it looks like JSON before trying to parse
                                if chunk_str.startswith('{') and chunk_str.endswith('}'):
                                    try:
                                        data = json.loads(chunk_str)
                                        if isinstance(data, dict) and "response" in data:
-                                            …
+                                            response_text = data["response"]
+                                            if response_text:  # Only yield non-empty responses
+                                                has_yielded_content = True
+                                                chunk_length = len(response_text)
+                                                # Only log occasionally to reduce console spam
+                                                if chunk_length % 20 == 0:
+                                                    debug_log(f"Yielding chunk of length: {chunk_length}")
+                                                yield response_text
                                        else:
-                                            debug_log(f"JSON chunk missing 'response' key: {chunk_str}")
+                                            debug_log(f"JSON chunk missing 'response' key: {chunk_str[:100]}")
                                    except json.JSONDecodeError:
-                                        debug_log(f"JSON decode error for chunk: {chunk_str}")
+                                        debug_log(f"JSON decode error for chunk: {chunk_str[:100]}")
                                else:
                                    # Log unexpected non-JSON lines but don't process them
-                                    if chunk_str:
-                                        debug_log(f"Received unexpected non-JSON line: {chunk_str}")
-                                    # Continue processing next line regardless of parsing success/failure of current line
-                                    continue
+                                    if chunk_str and len(chunk_str) > 5:  # Avoid logging empty or tiny lines
+                                        debug_log(f"Received unexpected non-JSON line: {chunk_str[:100]}")
                        except Exception as chunk_err:
                            debug_log(f"Error processing chunk: {str(chunk_err)}")
                            # Continue instead of breaking to try processing more chunks
                            continue
 
+                    # If we didn't yield any content, yield a default message
+                    if not has_yielded_content:
+                        debug_log("No content was yielded from stream, providing fallback response")
+                        yield "I'm sorry, but I couldn't generate a response. Please try again or try a different model."
+
                    logger.info("Streaming completed successfully")
                    debug_log("Streaming completed successfully")
                    return

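
Ollama streams newline-delimited JSON, and the change above tracks whether any 'response' text was actually yielded so the stream never ends empty. A self-contained sketch of the same parsing loop over plain byte lines (parse_ollama_stream and the fake in-memory stream are illustrative; no HTTP session is involved here):

import json
from typing import Iterable, Iterator

def parse_ollama_stream(lines: Iterable[bytes]) -> Iterator[str]:
    """Yield 'response' text from newline-delimited JSON chunks."""
    has_yielded_content = False
    for line in lines:
        chunk_str = line.decode().strip()
        # Only attempt JSON parsing on lines that look like JSON objects.
        if not (chunk_str.startswith("{") and chunk_str.endswith("}")):
            continue
        try:
            data = json.loads(chunk_str)
        except json.JSONDecodeError:
            continue
        if isinstance(data, dict) and data.get("response"):
            has_yielded_content = True
            yield data["response"]
    if not has_yielded_content:
        # Fallback so the consumer always receives something to display.
        yield "I'm sorry, but I couldn't generate a response."

if __name__ == "__main__":
    fake_stream = [b'{"response": "Hel"}', b'{"response": "lo"}', b"not json"]
    print("".join(parse_ollama_stream(fake_stream)))
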
{chat_console-0.2.99 → chat_console-0.3.0}/app/api/openai.py
@@ -1,4 +1,5 @@
 from openai import AsyncOpenAI
+import asyncio
 from typing import List, Dict, Any, Optional, Generator, AsyncGenerator
 from .base import BaseModelClient
 from ..config import OPENAI_API_KEY

@@ -84,41 +85,87 @@ class OpenAIClient(BaseModelClient):
                    debug_log(f"OpenAI: skipping invalid message: {m}")
 
            debug_log(f"OpenAI: prepared {len(api_messages)} valid messages")
+
+            # Check for empty or very short prompts and enhance them slightly
+            # This helps with the "hi" case where OpenAI might not generate a meaningful response
+            if api_messages and len(api_messages) > 0:
+                last_message = api_messages[-1]
+                if last_message["role"] == "user" and len(last_message["content"].strip()) <= 3:
+                    debug_log(f"OpenAI: Enhancing very short user prompt: '{last_message['content']}'")
+                    last_message["content"] = f"{last_message['content']} - Please respond conversationally."
+                    debug_log(f"OpenAI: Enhanced to: '{last_message['content']}'")
+
        except Exception as msg_error:
            debug_log(f"OpenAI: error preparing messages: {str(msg_error)}")
            # Fallback to a simpler message format if processing fails
            api_messages = [{"role": "user", "content": "Please respond to my request."}]
 
        debug_log("OpenAI: requesting stream")
-        stream = await self.client.chat.completions.create(
-            model=model,
-            messages=api_messages,
-            temperature=temperature,
-            max_tokens=max_tokens,
-            stream=True,
-        )
 
-        …
+        # Use more robust error handling with retry for connection issues
+        max_retries = 2
+        retry_count = 0
+
+        while retry_count <= max_retries:
            try:
-                …
-                continue
+                stream = await self.client.chat.completions.create(
+                    model=model,
+                    messages=api_messages,
+                    temperature=temperature,
+                    max_tokens=max_tokens,
+                    stream=True,
+                )
+                debug_log("OpenAI: stream created successfully")
+
+                # Yield a small padding token at the beginning for very short prompts
+                # This ensures the UI sees immediate content updates
+                if any(m["role"] == "user" and len(m["content"].strip()) <= 3 for m in api_messages):
+                    debug_log("OpenAI: Adding initial padding token for short message")
+                    yield ""  # Empty string to trigger UI update cycle
 
+                # Process stream chunks
+                chunk_count = 0
+                debug_log("OpenAI: starting to process chunks")
+
+                async for chunk in stream:
+                    chunk_count += 1
+                    try:
+                        if chunk.choices and hasattr(chunk.choices[0], 'delta') and hasattr(chunk.choices[0].delta, 'content'):
+                            content = chunk.choices[0].delta.content
+                            if content is not None:
+                                # Ensure we're returning a string
+                                text = str(content)
+                                debug_log(f"OpenAI: yielding chunk {chunk_count} of length: {len(text)}")
+                                yield text
+                            else:
+                                debug_log(f"OpenAI: skipping None content chunk {chunk_count}")
+                        else:
+                            debug_log(f"OpenAI: skipping chunk {chunk_count} with missing content")
+                    except Exception as chunk_error:
+                        debug_log(f"OpenAI: error processing chunk {chunk_count}: {str(chunk_error)}")
+                        # Skip problematic chunks but continue processing
+                        continue
+
+                debug_log(f"OpenAI: stream completed successfully with {chunk_count} chunks")
+
+                # If we reach this point, we've successfully processed the stream
+                break
+
+            except Exception as e:
+                debug_log(f"OpenAI: error in attempt {retry_count+1}/{max_retries+1}: {str(e)}")
+                retry_count += 1
+                if retry_count <= max_retries:
+                    debug_log(f"OpenAI: retrying after error (attempt {retry_count+1})")
+                    # Simple exponential backoff
+                    await asyncio.sleep(1 * retry_count)
+                else:
+                    debug_log("OpenAI: max retries reached, raising exception")
+                    raise Exception(f"OpenAI streaming error after {max_retries+1} attempts: {str(e)}")
+
        except Exception as e:
            debug_log(f"OpenAI: error in generate_stream: {str(e)}")
+            # Yield a simple error message as a last resort to ensure UI updates
+            yield f"Error: {str(e)}"
            raise Exception(f"OpenAI streaming error: {str(e)}")
 
    def get_available_models(self) -> List[Dict[str, Any]]:

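
The new retry loop in generate_stream retries the whole stream creation, not individual chunks, and sleeps a little longer after each failure. A reduced sketch of that control flow; open_stream() is a hypothetical stand-in for client.chat.completions.create():

import asyncio
from typing import AsyncIterator

async def open_stream(attempt: int) -> AsyncIterator[str]:
    # Hypothetical stand-in for the real API call; fails on the first attempt.
    if attempt == 0:
        raise ConnectionError("transient network error")
    for token in ["Hello", ", ", "world"]:
        yield token

async def stream_with_retry(max_retries: int = 2) -> AsyncIterator[str]:
    retry_count = 0
    while retry_count <= max_retries:
        try:
            async for token in open_stream(retry_count):
                yield token
            return  # success: stop retrying
        except Exception:
            retry_count += 1
            if retry_count > max_retries:
                raise
            # Simple backoff that grows with each failed attempt.
            await asyncio.sleep(0.1 * retry_count)

async def main() -> None:
    print("".join([t async for t in stream_with_retry()]))

if __name__ == "__main__":
    asyncio.run(main())
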
{chat_console-0.2.99 → chat_console-0.3.0}/app/main.py
@@ -23,6 +23,8 @@ file_handler.setFormatter(logging.Formatter('%(asctime)s - %(name)s - %(levelnam
 debug_logger = logging.getLogger("chat-cli-debug")
 debug_logger.setLevel(logging.DEBUG)
 debug_logger.addHandler(file_handler)
+# Prevent propagation to the root logger (which would print to console)
+debug_logger.propagate = False
 
 # Add a convenience function to log to this file
 def debug_log(message):

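
Setting debug_logger.propagate = False is what keeps debug output in the log file instead of echoing through the root logger to the console. A small standalone configuration showing the effect (the logger name and file path here are illustrative, not the package's own):

import logging
import os
import tempfile

# File handler that receives everything the debug logger emits.
log_path = os.path.join(tempfile.gettempdir(), "chat-cli-debug-example.log")
file_handler = logging.FileHandler(log_path)
file_handler.setFormatter(logging.Formatter("%(asctime)s - %(name)s - %(levelname)s - %(message)s"))

debug_logger = logging.getLogger("chat-cli-debug-example")
debug_logger.setLevel(logging.DEBUG)
debug_logger.addHandler(file_handler)
# Without this, records also bubble up to the root logger, whose handlers
# typically write to the console.
debug_logger.propagate = False

debug_logger.debug("this line goes to the log file only")
print("wrote debug output to", log_path)
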
@@ -642,9 +644,10 @@ class SimpleChatApp(App): # Keep SimpleChatApp class definition
            await self.update_messages_ui()
 
            # If this is the first message and dynamic titles are enabled, generate one
-            if …
+            # Only attempt title generation if the message has sufficient content (at least 3 characters)
+            if is_first_message and self.current_conversation and CONFIG.get("generate_dynamic_titles", True) and len(content) >= 3:
                log("First message detected, generating title...")
-                debug_log("First message detected…
+                debug_log(f"First message detected with length {len(content)}, generating conversation title")
                title_generation_in_progress = True  # Use a local flag
                loading = self.query_one("#loading-indicator")
                loading.remove_class("hidden")  # Show loading for title gen

@@ -942,30 +945,40 @@ class SimpleChatApp(App): # Keep SimpleChatApp class definition
 
                            # Update UI with the content - this no longer triggers refresh itself
                            await message_display.update_content(content)
+
+                            # Force a refresh after each update to ensure content is visible
+                            # This is critical for streaming to work properly
+                            self.refresh(layout=False)
 
+                            # Scroll after each content update to ensure it's visible
+                            messages_container.scroll_end(animate=False)
+
                            # Much more aggressive throttling of UI updates to eliminate visual jitter
                            # By using a larger modulo value, we significantly reduce refresh frequency
                            # This improves stability at the cost of slightly choppier animations
                            content_length = len(content)
 
-                            # Define some key refresh points
+                            # Define some key refresh points - more frequent than before
                            new_paragraph = content.endswith("\n") and content.count("\n") > 0
+                            code_block = "```" in content
                            do_refresh = (
-                                content_length < … or
-                                content_length % 64 == 0 or
-                                new_paragraph  # Refresh on paragraph breaks
+                                content_length < 10 or  # More frequent on first few tokens
+                                content_length % 32 == 0 or  # More frequent periodic updates (32 vs 64)
+                                new_paragraph or  # Refresh on paragraph breaks
+                                code_block  # Refresh when code blocks are detected
                            )
 
-                            # Check if it's been enough time since last refresh (250ms)
+                            # Check if it's been enough time since last refresh (reduced to 200ms from 250ms)
                            current_time = time.time()
                            time_since_refresh = current_time - last_refresh_time
 
-                            if do_refresh and time_since_refresh > 0.25:
+                            if do_refresh and time_since_refresh > 0.2:
                                # Store the time we did the refresh
                                last_refresh_time = current_time
-                                # …
-                                # Just ensure content is still visible by scrolling
+                                # Ensure content is still visible by scrolling
                                messages_container.scroll_end(animate=False)
+                                # Force a more thorough refresh periodically
+                                self.refresh(layout=True)
                    except Exception as e:
                        debug_log(f"Error updating UI: {str(e)}")
                        log.error(f"Error updating UI: {str(e)}")

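
The refresh logic above reduces to a pure decision: refresh while the response is still tiny, at fixed length intervals, on paragraph breaks or code fences, and only if at least 200 ms have passed. Pulled out as a standalone helper for clarity; should_refresh is our name, while the thresholds mirror the new values in the diff:

import time
from typing import Optional

def should_refresh(content: str, last_refresh_time: float, now: Optional[float] = None) -> bool:
    """Decide whether the streaming UI should refresh for this content snapshot."""
    now = time.time() if now is None else now
    content_length = len(content)
    new_paragraph = content.endswith("\n") and content.count("\n") > 0
    code_block = "```" in content
    wants_refresh = (
        content_length < 10            # first few tokens: refresh eagerly
        or content_length % 32 == 0    # periodic refresh as content grows
        or new_paragraph               # refresh on paragraph breaks
        or code_block                  # refresh once a code fence appears
    )
    # Throttle: never refresh more often than every 200 ms.
    return wants_refresh and (now - last_refresh_time) > 0.2

if __name__ == "__main__":
    print(should_refresh("Hello", last_refresh_time=0.0))           # short content: True
    print(should_refresh("x" * 32, last_refresh_time=time.time()))  # length trigger but throttled: False
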
@@ -1054,6 +1067,21 @@ class SimpleChatApp(App): # Keep SimpleChatApp class definition
                # Update the final message object content (optional, UI should be up-to-date)
                if self.messages and self.messages[-1].role == "assistant":
                    self.messages[-1].content = full_response
+
+                    # Force a UI refresh with the message display to ensure it's fully rendered
+                    try:
+                        # Get the message display for the assistant message
+                        messages_container = self.query_one("#messages-container")
+                        message_displays = messages_container.query("MessageDisplay")
+                        # Check if we found any message displays
+                        if message_displays and len(message_displays) > 0:
+                            # Get the last message display which should be our assistant message
+                            last_message_display = message_displays[-1]
+                            debug_log("Forcing final content update on message display")
+                            # Force a final content update
+                            await last_message_display.update_content(full_response)
+                    except Exception as disp_err:
+                        debug_log(f"Error updating final message display: {str(disp_err)}")
                else:
                    debug_log("Worker finished successfully but response was empty or invalid.")
                    # Handle case where 'Thinking...' might still be the last message

@@ -1061,11 +1089,24 @@ class SimpleChatApp(App): # Keep SimpleChatApp class definition
                        self.messages.pop() # Remove 'Thinking...' if no content arrived
                        await self.update_messages_ui()
 
-                # …
-                # Use layout=False to prevent UI jumping at the end
-                self.refresh(layout=False)
-                await asyncio.sleep(0.1) # Allow UI to stabilize
+                # Force a full UI refresh to ensure content is visible
                messages_container = self.query_one("#messages-container")
+
+                # Sequence of UI refreshes to ensure content is properly displayed
+                # 1. First do a lightweight refresh
+                self.refresh(layout=False)
+
+                # 2. Short delay to allow the UI to process
+                await asyncio.sleep(0.1)
+
+                # 3. Ensure we're scrolled to the end
+                messages_container.scroll_end(animate=False)
+
+                # 4. Full layout refresh
+                self.refresh(layout=True)
+
+                # 5. Final delay and scroll to ensure everything is visible
+                await asyncio.sleep(0.1)
                messages_container.scroll_end(animate=False)
 
            except Exception as e:

{chat_console-0.2.99 → chat_console-0.3.0}/app/ui/chat_interface.py
@@ -136,13 +136,52 @@ class MessageDisplay(Static): # Inherit from Static instead of RichLog
        # This allows parent to control refresh timing and avoid flickering
        self.update(formatted_content, refresh=False)
 
-        # …
-        # …
+        # Always force a minimal refresh to ensure content is visible
+        # This is critical for streaming to work properly
+        self.refresh(layout=False)
+
+        # For Ollama responses, we need more aggressive refresh
+        # Check if this is likely an Ollama response by looking at the parent app
+        try:
+            app = self.app
+            if app and hasattr(app, 'selected_model'):
+                model = app.selected_model
+                if model and ('llama' in model.lower() or 'mistral' in model.lower() or
+                              'gemma' in model.lower() or 'phi' in model.lower() or
+                              'ollama' in model.lower()):
+                    # This is likely an Ollama model, force a more thorough refresh
+                    # Without doing a full layout recalculation
+                    self.refresh(layout=True)
+
+                    # Force parent container to scroll to end
+                    try:
+                        parent = self.parent
+                        if parent and hasattr(parent, 'scroll_end'):
+                            parent.scroll_end(animate=False)
+                    except Exception:
+                        pass
+        except Exception:
+            # Ignore any errors in this detection logic
+            pass
 
    def _format_content(self, content: str) -> str:
-        """Format message content with timestamp"""
+        """Format message content with timestamp and handle markdown links"""
        timestamp = datetime.now().strftime("%H:%M")
-        …
+
+        # Fix markdown-style links that cause markup errors
+        # Convert [text](url) to a safe format for Textual markup
+        content = re.sub(
+            r'\[([^\]]+)\]\(([^)]+)\)',
+            lambda m: f"{m.group(1)} ({m.group(2)})",
+            content
+        )
+
+        # Escape any other potential markup characters
+        content = content.replace("[", "\\[").replace("]", "\\]")
+        # But keep our timestamp markup
+        timestamp_markup = f"[dim]{timestamp}[/dim]"
+
+        return f"{timestamp_markup} {content}"
 
 class InputWithFocus(Input):
    """Enhanced Input that better handles focus and maintains cursor position"""

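
_format_content() now rewrites [text](url) links as plain 'text (url)' and escapes leftover square brackets, so message content can no longer be misread as Textual markup while the [dim] timestamp tag stays live. The same transformation in isolation, as a plain function for illustration:

import re
from datetime import datetime

def format_content(content: str) -> str:
    # Convert markdown links [text](url) to "text (url)".
    content = re.sub(
        r"\[([^\]]+)\]\(([^)]+)\)",
        lambda m: f"{m.group(1)} ({m.group(2)})",
        content,
    )
    # Escape any leftover brackets so they are not parsed as markup.
    content = content.replace("[", "\\[").replace("]", "\\]")
    timestamp = datetime.now().strftime("%H:%M")
    return f"[dim]{timestamp}[/dim] {content}"

if __name__ == "__main__":
    print(format_content("see [the docs](https://example.com) [sic]"))
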
{chat_console-0.2.99 → chat_console-0.3.0}/app/ui/model_selector.py
@@ -243,12 +243,14 @@ class ModelSelector(Container):
 
                # Set the model if we found one
                if first_model and len(first_model) >= 2:
-                    # …
+                    # Get the original ID from the model option
                    original_id = first_model[1]
+                    # Resolve the model ID for internal use and messaging
                    resolved_id = resolve_model_id(original_id)
                    logger.info(f"on_select_changed (provider): Original ID '{original_id}' resolved to '{resolved_id}'")
                    self.selected_model = resolved_id
-                    …
+                    # Use the original ID for the select widget to avoid invalid value errors
+                    model_select.value = original_id
                    model_select.remove_class("hide")
                    self.query_one("#custom-model-input").add_class("hide")
                    self.post_message(self.ModelSelected(resolved_id))

@@ -310,24 +312,35 @@ class ModelSelector(Container):
    def set_selected_model(self, model_id: str) -> None:
        """Set the selected model, ensuring it's properly resolved"""
        # First resolve the model ID to ensure we're using the full ID
+        original_id = model_id
        resolved_id = resolve_model_id(model_id)
-        logger.info(f"set_selected_model: Original ID '{…
+        logger.info(f"set_selected_model: Original ID '{original_id}' resolved to '{resolved_id}'")
 
-        # Store the resolved ID
+        # Store the resolved ID internally
        self.selected_model = resolved_id
 
        # Update the UI based on whether this is a known model or custom
-        if …
-            …
+        # Check if the original ID is in the available options
+        model_select = self.query_one("#model-select", Select)
+        available_options = [opt[1] for opt in model_select.options]
+
+        if original_id in available_options:
+            # Use the original ID for the select widget
+            custom_input = self.query_one("#custom-model-input")
+            model_select.value = original_id
+            model_select.remove_class("hide")
+            custom_input.add_class("hide")
+        elif resolved_id in available_options:
+            # If the resolved ID is in options, use that
            custom_input = self.query_one("#custom-model-input")
-            …
-            …
+            model_select.value = resolved_id
+            model_select.remove_class("hide")
            custom_input.add_class("hide")
        else:
-            …
+            # Use custom input for models not in the select options
            custom_input = self.query_one("#custom-model-input")
-            …
-            …
+            model_select.value = "custom"
+            model_select.add_class("hide")
            custom_input.value = resolved_id
            custom_input.remove_class("hide")
 
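
set_selected_model() now distinguishes three cases: the original ID is a known option, only the resolved ID is, or neither is and the custom input takes over. The branch logic, separated from the Textual widgets into a hypothetical helper of our own naming, looks roughly like this:

from typing import List, Tuple

def choose_widget_state(original_id: str, resolved_id: str, options: List[str]) -> Tuple[str, str]:
    """Return (widget, value): which control to show and what value to set on it."""
    if original_id in options:
        return ("select", original_id)   # keep the user's original choice
    if resolved_id in options:
        return ("select", resolved_id)   # fall back to the resolved full ID
    return ("custom", resolved_id)       # unknown model: use the free-form input

if __name__ == "__main__":
    opts = ["claude-3-opus-20240229", "claude-3-haiku-20240307"]
    print(choose_widget_state("claude-3-opus-20240229", "claude-3-opus-20240229", opts))
    print(choose_widget_state("my-local-model", "my-local-model", opts))
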
{chat_console-0.2.99 → chat_console-0.3.0}/app/utils.py
@@ -291,16 +291,35 @@ async def generate_streaming_response(
                buffer.append(chunk)
                current_time = time.time()
 
-                # Update UI …
-                …
+                # Update UI with every chunk for short messages, or throttle for longer ones
+                # This is especially important for short messages like "hi" that might otherwise not trigger updates
+                if (current_time - last_update >= update_interval or
+                        len(''.join(buffer)) > 10 or  # Much more aggressive buffer flush threshold
+                        len(full_response) < 20):  # Always update for very short responses
+
                    new_content = ''.join(buffer)
                    full_response += new_content
                    # Send content to UI
                    debug_log(f"Updating UI with content length: {len(full_response)}")
-                    …
+                    try:
+                        await callback(full_response)
+                        debug_log("UI callback completed successfully")
+                    except Exception as callback_err:
+                        debug_log(f"Error in UI callback: {str(callback_err)}")
+                        logger.error(f"Error in UI callback: {str(callback_err)}")
                    buffer = []
                    last_update = current_time
 
+                    # Force UI refresh after each update for Ollama responses
+                    if is_ollama:
+                        debug_log("Forcing UI refresh for Ollama response")
+                        try:
+                            # Ensure the app refreshes the UI
+                            if hasattr(app, 'refresh'):
+                                app.refresh(layout=False)
+                        except Exception as refresh_err:
+                            debug_log(f"Error forcing UI refresh: {str(refresh_err)}")
+
                    # Small delay to let UI catch up
                    await asyncio.sleep(0.05)
            except asyncio.CancelledError:

@@ -316,7 +335,22 @@ async def generate_streaming_response(
            new_content = ''.join(buffer)
            full_response += new_content
            debug_log(f"Sending final content, total length: {len(full_response)}")
-            …
+            try:
+                await callback(full_response)
+                debug_log("Final UI callback completed successfully")
+
+                # Force final UI refresh for Ollama responses
+                if is_ollama:
+                    debug_log("Forcing final UI refresh for Ollama response")
+                    try:
+                        # Ensure the app refreshes the UI
+                        if hasattr(app, 'refresh'):
+                            app.refresh(layout=True)  # Use layout=True for final refresh
+                    except Exception as refresh_err:
+                        debug_log(f"Error forcing final UI refresh: {str(refresh_err)}")
+            except Exception as callback_err:
+                debug_log(f"Error in final UI callback: {str(callback_err)}")
+                logger.error(f"Error in final UI callback: {str(callback_err)}")
 
        debug_log(f"Streaming response completed successfully. Response length: {len(full_response)}")
        logger.info(f"Streaming response completed successfully. Response length: {len(full_response)}")

@@ -442,7 +476,27 @@ def resolve_model_id(model_id_or_name: str) -> str:
        logger.warning("No available_models found in CONFIG to resolve against.")
        return model_id_or_name # Return original if no models to check
 
-    # …
+    # Special case for Ollama models with version format (model:version)
+    if ":" in input_lower and not input_lower.startswith("claude-"):
+        logger.info(f"Input '{input_lower}' appears to be an Ollama model with version, returning as-is")
+        return model_id_or_name
+
+    # Handle special cases for common model formats
+    # 1. Handle Ollama models with dot notation (e.g., phi3.latest, llama3.1)
+    if "." in input_lower and not input_lower.startswith("claude-"):
+        # This is likely an Ollama model with dot notation
+        logger.info(f"Input '{input_lower}' appears to be an Ollama model with dot notation")
+        # Convert dots to colons for Ollama format if needed
+        if ":" not in input_lower:
+            parts = input_lower.split(".")
+            if len(parts) == 2:
+                base_model, version = parts
+                ollama_format = f"{base_model}:{version}"
+                logger.info(f"Converting '{input_lower}' to Ollama format: '{ollama_format}'")
+                return ollama_format
+        return model_id_or_name
+
+    # 2. Check if the input is already a valid full ID (must contain a date suffix)
    # Full Claude IDs should have format like "claude-3-opus-20240229" with a date suffix
    for full_id in available_models:
        if full_id.lower() == input_lower:

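
The new early exits in resolve_model_id() treat anything containing a colon as an already-tagged Ollama model and rewrite single-dot names such as phi3.latest into colon form. Extracted into a small illustrative helper (normalize_ollama_id is our name, not the package's):

def normalize_ollama_id(model_id: str) -> str:
    """Mirror the early-exit rules: keep 'model:version' as-is,
    rewrite a single 'model.version' into 'model:version'."""
    lower = model_id.lower()
    if lower.startswith("claude-"):
        return model_id  # Claude IDs are handled by the later matching rules
    if ":" in lower:
        return model_id  # already in Ollama's model:version form
    if "." in lower:
        parts = lower.split(".")
        if len(parts) == 2:
            base_model, version = parts
            return f"{base_model}:{version}"
    return model_id

if __name__ == "__main__":
    print(normalize_ollama_id("phi3.latest"))        # -> phi3:latest
    print(normalize_ollama_id("llama3:8b"))          # unchanged
    print(normalize_ollama_id("claude-3.7-sonnet"))  # unchanged, resolved elsewhere
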
@@ -460,7 +514,7 @@ def resolve_model_id(model_id_or_name: str) -> str:
    best_match = None
    match_type = "None"
 
-    # …
+    # 3. Iterate through available models for other matches
    for full_id, model_info in available_models.items():
        full_id_lower = full_id.lower()
        display_name = model_info.get("display_name", "")

@@ -468,12 +522,12 @@ def resolve_model_id(model_id_or_name: str) -> str:
 
        logger.debug(f"Comparing '{input_lower}' against '{full_id_lower}' (Display: '{display_name}')")
 
-        # …
+        # 3a. Exact match on display name (case-insensitive)
        if display_name_lower == input_lower:
            logger.info(f"Resolved '{model_id_or_name}' to '{full_id}' via exact display name match.")
            return full_id # Exact display name match is high confidence
 
-        # …
+        # 3b. Check if input is a known short alias (handle common cases explicitly)
        # Special case for Claude 3.7 Sonnet which seems to be causing issues
        if input_lower == "claude-3.7-sonnet":
            # Hardcoded resolution for this specific model

@@ -501,7 +555,7 @@ def resolve_model_id(model_id_or_name: str) -> str:
            # This is also high confidence
            return full_id
 
-        # …
+        # 3c. Check if input is a prefix of the full ID (more general, lower confidence)
        if full_id_lower.startswith(input_lower):
            logger.debug(f"Potential prefix match: '{input_lower}' vs '{full_id_lower}'")
            # Don't return immediately, might find a better match (e.g., display name or alias)

@@ -510,7 +564,7 @@ def resolve_model_id(model_id_or_name: str) -> str:
                match_type = "Prefix"
                logger.debug(f"Setting best_match to '{full_id}' based on prefix.")
 
-        # …
+        # 3d. Check derived short name from display name (less reliable, keep as lower priority)
        # Normalize display name: lower, replace space and dot with hyphen
        derived_short_name = display_name_lower.replace(" ", "-").replace(".", "-")
        if derived_short_name == input_lower:

@@ -521,7 +575,7 @@ def resolve_model_id(model_id_or_name: str) -> str:
                match_type = "Derived Short Name"
                logger.debug(f"Updating best_match to '{full_id}' based on derived name.")
 
-    # …
+    # 4. Return best match found or original input
    if best_match:
        logger.info(f"Returning best match found for '{model_id_or_name}': '{best_match}' (Type: {match_type})")
        return best_match

{chat_console-0.2.99 → chat_console-0.3.0}/chat_console.egg-info/PKG-INFO
@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: chat-console
-Version: 0.2.99
+Version: 0.3.0
 Summary: A command-line interface for chatting with LLMs, storing chats and (future) rag interactions
 Home-page: https://github.com/wazacraftrfid/chat-console
 Author: Johnathan Greenaway