speedy-utils 1.1.47__tar.gz → 1.1.48__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/PKG-INFO +1 -1
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/pyproject.toml +1 -1
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/__init__.py +1 -3
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/chat_format/__init__.py +0 -2
- speedy_utils-1.1.48/src/llm_utils/chat_format/display.py +384 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/lm/llm.py +21 -10
- speedy_utils-1.1.47/src/llm_utils/chat_format/display.py +0 -465
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/.githooks/pre-push +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/.github/copilot-instructions.md +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/.github/prompts/improveParallelErrorHandling.prompt.md +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/.github/skills/caching-utilities/SKILL.md +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/.github/skills/caching-utilities/examples/caching_example.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/.github/skills/dataset-processing-multiprocessing/CONFIG_REFERENCE.md +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/.github/skills/dataset-processing-multiprocessing/SKILL.md +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/.github/skills/dataset-processing-multiprocessing/example_tokenize_pack.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/.github/skills/edit-llm-inference-style/SKILL.md +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/.github/skills/io-utilities/SKILL.md +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/.github/skills/io-utilities/examples/io_example.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/.github/skills/llm-integration/SKILL.md +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/.github/skills/llm-integration/examples/llm_example.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/.github/skills/multi-threading-processing/SKILL.md +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/.github/skills/ray-distributed-computing/SKILL.md +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/.github/skills/skill-creation/SKILL.md +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/.github/skills/vision-utilities/SKILL.md +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/.github/skills/vision-utilities/examples/vision_example.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/.github/workflows/publish.yml +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/.gitignore +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/.pre-commit-config.yaml +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/AGENTS.md +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/README.md +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/bumpversion.sh +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/debug/debug_generate_response.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/debug/debug_n_param.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/debug/debug_n_structure.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/debug/integration_test.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/debug/test_decode_api.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/debug/test_endpoints.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/debug/test_generate.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/debug/test_generate_endpoint.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/docs/GENERATE_QUICKREF.md +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/docs/IMPLEMENTATION.md +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/docs/QUICKSTART.md +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/docs/SKILL.md +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/docs/TOKENIZATION.md +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/docs/TOKENIZATION_IMPLEMENTATION.md +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/docs/zero_copy_sharing.md +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/examples/generate_example.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/examples/llm_ray_example.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/examples/pytorch_large_model.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/examples/shared_kwargs_example.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/examples/temperature_range_example.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/examples/test_parallel_gpu.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/examples/test_share_ray.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/examples/tokenization_example.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/examples/vision_utils_example.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/experiments/exp1/dockerfile +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/experiments/exp1/run_in_docker.sh +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/experiments/exp1/test.png +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/experiments/test_read_image.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/notebooks/README.ipynb +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/notebooks/llm_utils/llm_as_a_judge.ipynb +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/notebooks/parallel_gpu_pool.ipynb +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/notebooks/ray_tutorial.ipynb +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/notebooks/test_multi_thread.ipynb +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/ruff.toml +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/scripts/bug.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/scripts/bug_simple.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/scripts/debug_import_time.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/scripts/deploy.sh +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/scripts/imports.sh +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/scripts/test.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/scripts/test_both_backends.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/scripts/test_error_handling.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/scripts/test_import_time_vision.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/scripts/test_locals.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/scripts/test_ray_locals.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/scripts/test_ray_mp.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/setup.cfg +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/datasets_utils/convert_to_arrow.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/chat_format/transform.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/chat_format/utils.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/group_messages.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/llm_ray.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/lm/__init__.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/lm/async_lm/__init__.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/lm/async_lm/_utils.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/lm/async_lm/async_llm_task.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/lm/async_lm/async_lm.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/lm/async_lm/async_lm_base.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/lm/async_lm/lm_specific.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/lm/base_prompt_builder.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/lm/llm_signature.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/lm/lm_base.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/lm/mixins.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/lm/openai_memoize.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/lm/signature.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/lm/utils.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/scripts/README.md +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/scripts/fast_vllm.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/scripts/vllm_load_balancer.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/scripts/vllm_serve.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/vector_cache/__init__.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/vector_cache/cli.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/vector_cache/core.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/vector_cache/types.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/llm_utils/vector_cache/utils.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/__imports.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/__init__.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/common/__init__.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/common/clock.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/common/function_decorator.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/common/logger.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/common/notebook_utils.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/common/patcher.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/common/report_manager.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/common/utils_cache.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/common/utils_error.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/common/utils_io.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/common/utils_misc.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/common/utils_print.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/multi_worker/__init__.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/multi_worker/_multi_process.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/multi_worker/_multi_process_ray.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/multi_worker/common.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/multi_worker/dataset_ray.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/multi_worker/dataset_sharding.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/multi_worker/parallel_gpu_pool.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/multi_worker/process.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/multi_worker/progress.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/multi_worker/thread.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/scripts/__init__.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/scripts/kill_mpython.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/scripts/mpython.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/speedy_utils/scripts/openapi_client_codegen.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/vision_utils/README.md +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/vision_utils/__init__.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/vision_utils/io_utils.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/src/vision_utils/plot.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/test.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/tests/import_all.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/tests/import_time_report.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/tests/integration_test.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/tests/llm_utils/test_llm_mixins.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/tests/sample_objects.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/tests/test.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/tests/test_logger.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/tests/test_logger_format.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/tests/test_memoize_typing.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/tests/test_mpython.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/tests/test_multithread_error_trace.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/tests/test_process.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/tests/test_process_update.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/tests/test_pytorch_sharing.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/tests/test_shared_kwargs.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/tests/test_thread.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/tests/test_tokenization.py +0 -0
- {speedy_utils-1.1.47 → speedy_utils-1.1.48}/uv.lock +0 -0
src/llm_utils/__init__.py

@@ -1,3 +1,4 @@
+from llm_utils.llm_ray import LLMRay
 from llm_utils.lm import (
     LLM,
     AsyncLLMTask,
@@ -12,7 +13,6 @@ from llm_utils.lm import (
 from llm_utils.lm.base_prompt_builder import BasePromptBuilder
 from llm_utils.lm.lm_base import get_model_name
 from llm_utils.lm.openai_memoize import MOpenAI
-from llm_utils.llm_ray import LLMRay
 from llm_utils.vector_cache import VectorCache


@@ -37,7 +37,6 @@ from llm_utils.chat_format import (
     format_msgs,
     get_conversation_one_turn,
     show_chat,
-    show_chat_v2,
     show_string_diff,
     transform_messages,
     transform_messages_to_chatml,
@@ -54,7 +53,6 @@ __all__ = [
     "build_chatml_input",
     "format_msgs",
     "display_chat_messages_as_html",
-    "show_chat_v2",
     "AsyncLM",
     "AsyncLLMTask",
     "LLM",
src/llm_utils/chat_format/__init__.py

@@ -4,7 +4,6 @@ from .display import (
     get_conversation_one_turn,
     highlight_diff_chars,
     show_chat,
-    show_chat_v2,
     show_string_diff,
 )
 from .transform import (
@@ -32,5 +31,4 @@ __all__ = [
     "show_string_diff",
     "display_conversations",
     "display_chat_messages_as_html",
-    "show_chat_v2",
 ]
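Both `__init__.py` hunks drop `show_chat_v2` from the imports and from `__all__`, leaving `show_chat` (re-exported at the package root) as the single display entry point. A minimal migration sketch, assuming callers only need the rename; the new `show_chat` signature appears in `display.py` below:

```python
# Hedged sketch: show_chat_v2 is gone from the public API in 1.1.48;
# show_chat auto-detects notebook vs terminal rendering.
from llm_utils import show_chat

messages = [
    {'role': 'user', 'content': 'Hello!'},
    {'role': 'assistant', 'content': 'Hi!'},
]
show_chat(messages)  # replaces show_chat_v2(...) call sites
```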
src/llm_utils/chat_format/display.py (new file)

@@ -0,0 +1,384 @@
+from __future__ import annotations
+
+import json
+from difflib import SequenceMatcher
+from typing import Any
+
+from IPython.display import HTML, display
+
+
+def _preprocess_as_json(content: str) -> str:
+    """Preprocess content as JSON with proper formatting."""
+    try:
+        parsed = json.loads(content)
+        return json.dumps(parsed, indent=2, ensure_ascii=False)
+    except (json.JSONDecodeError, TypeError):
+        return content
+
+
+def _preprocess_as_markdown(content: str) -> str:
+    """Preprocess content as markdown with proper formatting."""
+    lines = content.split('\n')
+    processed_lines = []
+
+    for line in lines:
+        # Convert **bold** to span with bold styling
+        while '**' in line:
+            first_pos = line.find('**')
+            if first_pos == -1:
+                break
+            second_pos = line.find('**', first_pos + 2)
+            if second_pos == -1:
+                break
+            before = line[:first_pos]
+            bold_text = line[first_pos + 2 : second_pos]
+            after = line[second_pos + 2 :]
+            line = f'{before}<span style="font-weight: bold;">{bold_text}</span>{after}'
+
+        # Convert *italic* to span with italic styling
+        while '*' in line and line.count('*') >= 2:
+            first_pos = line.find('*')
+            if first_pos == -1:
+                break
+            second_pos = line.find('*', first_pos + 1)
+            if second_pos == -1:
+                break
+            before = line[:first_pos]
+            italic_text = line[first_pos + 1 : second_pos]
+            after = line[second_pos + 1 :]
+            line = (
+                f'{before}<span style="font-style: italic;">{italic_text}</span>{after}'
+            )
+
+        # Convert # headers to bold headers
+        if line.strip().startswith('#'):
+            level = len(line) - len(line.lstrip('#'))
+            header_text = line.lstrip('# ').strip()
+            line = f'<span style="font-weight: bold; font-size: 1.{min(4, level)}em;">{header_text}</span>'
+
+        processed_lines.append(line)
+
+    return '\n'.join(processed_lines)
+
+
+def _truncate_text(text: str, max_length: int, head_ratio: float = 0.3) -> str:
+    """
+    Truncate text if it exceeds max_length, showing head and tail with skip indicator.
+
+    Args:
+        text: Text to truncate
+        max_length: Maximum length before truncation
+        head_ratio: Ratio of max_length to show at the head (default 0.3)
+
+    Returns:
+        Original text if within limit, otherwise truncated with [SKIP n chars] indicator
+    """
+    if len(text) <= max_length:
+        return text
+
+    head_len = int(max_length * head_ratio)
+    tail_len = max_length - head_len
+    skip_len = len(text) - head_len - tail_len
+
+    return f'{text[:head_len]}\n...[SKIP {skip_len} chars]...\n{text[-tail_len:]}'
+
+
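A worked example of the `_truncate_text` arithmetic above (illustrative only; the values follow directly from the function body):

```python
# For 100 chars of input with max_length=10 and the default head_ratio=0.3:
text = 'x' * 100
head_len = int(10 * 0.3)              # 3 chars kept from the head
tail_len = 10 - head_len              # 7 chars kept from the tail
skip_len = 100 - head_len - tail_len  # 90 chars elided
# _truncate_text(text, 10) -> 'xxx\n...[SKIP 90 chars]...\nxxxxxxx'
```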
+def _format_reasoning_content(
+    reasoning: str, max_reasoning_length: int | None = None
+) -> str:
+    """
+    Format reasoning content with <think> tags.
+
+    Args:
+        reasoning: The reasoning content
+        max_reasoning_length: Max length before truncation (None = no truncation)
+
+    Returns:
+        Formatted reasoning with <think> tags
+    """
+    if max_reasoning_length is not None:
+        reasoning = _truncate_text(reasoning, max_reasoning_length)
+    return f'<think>\n{reasoning}\n</think>'
+
+
+def _escape_html(content: str) -> str:
+    """Escape HTML special characters and convert whitespace for display."""
+    return (
+        content.replace('&', '&amp;')
+        .replace('<', '&lt;')
+        .replace('>', '&gt;')
+        .replace('\n', '<br>')
+        .replace('\t', '&nbsp;&nbsp;&nbsp;&nbsp;')
+        .replace(' ', '&nbsp;')
+    )
+
+
+def _is_notebook() -> bool:
+    """Detect if running in a notebook environment."""
+    try:
+        from IPython.core.getipython import get_ipython
+
+        ipython = get_ipython()
+        return ipython is not None and 'IPKernelApp' in ipython.config
+    except (ImportError, AttributeError):
+        return False
+
+
+# Color configurations
+ROLE_COLORS_HTML = {
+    'system': 'red',
+    'user': 'darkorange',
+    'assistant': 'green',
+}
+
+ROLE_COLORS_TERMINAL = {
+    'system': '\033[91m',  # Red
+    'user': '\033[38;5;208m',  # Orange
+    'assistant': '\033[92m',  # Green
+}
+
+ROLE_LABELS = {
+    'system': 'System Instruction:',
+    'user': 'User:',
+    'assistant': 'Assistant:',
+}
+
+TERMINAL_RESET = '\033[0m'
+TERMINAL_BOLD = '\033[1m'
+TERMINAL_GRAY = '\033[90m'
+TERMINAL_DIM = '\033[2m'  # Dim text for reasoning
+
+# HTML colors
+HTML_REASONING_COLOR = '#AAAAAA'  # Lighter gray for better readability
+
+
+def _build_assistant_content_parts(
+    msg: dict[str, Any], max_reasoning_length: int | None
+) -> tuple[str | None, str]:
+    """
+    Build display content parts for assistant message.
+
+    Returns:
+        Tuple of (reasoning_formatted, answer_content)
+        reasoning_formatted is None if no reasoning present
+    """
+    content = msg.get('content', '')
+    reasoning = msg.get('reasoning_content')
+
+    if reasoning:
+        formatted_reasoning = _format_reasoning_content(reasoning, max_reasoning_length)
+        return formatted_reasoning, content
+
+    return None, content
+
+
+def _show_chat_html(
+    messages: list[dict[str, Any]], max_reasoning_length: int | None
+) -> None:
+    """Display chat messages as HTML in notebook."""
+    html_parts = [
+        "<div style='font-family:monospace; line-height:1.6em; white-space:pre-wrap;'>"
+    ]
+    separator = "<div style='color:#888; margin:0.5em 0;'>───────────────────────────────────────────────────</div>"
+
+    for i, msg in enumerate(messages):
+        role = msg.get('role', 'unknown').lower()
+        color = ROLE_COLORS_HTML.get(role, 'black')
+        label = ROLE_LABELS.get(role, f'{role.capitalize()}:')
+
+        if role == 'assistant':
+            reasoning, answer = _build_assistant_content_parts(
+                msg, max_reasoning_length
+            )
+            html_parts.append(
+                f"<div><strong style='color:{color}'>{label}</strong><br>"
+            )
+            if reasoning:
+                escaped_reasoning = _escape_html(reasoning)
+                html_parts.append(
+                    f"<span style='color:{HTML_REASONING_COLOR}'>{escaped_reasoning}</span><br><br>"
+                )
+            if answer:
+                escaped_answer = _escape_html(answer)
+                html_parts.append(
+                    f"<span style='color:{color}'>{escaped_answer}</span>"
+                )
+            html_parts.append('</div>')
+        else:
+            content = msg.get('content', '')
+            escaped_content = _escape_html(content)
+            html_parts.append(
+                f"<div style='color:{color}'><strong>{label}</strong><br>{escaped_content}</div>"
+            )
+
+        if i < len(messages) - 1:
+            html_parts.append(separator)
+
+    html_parts.append('</div>')
+    display(HTML(''.join(html_parts)))
+
+
+def _show_chat_terminal(
+    messages: list[dict[str, Any]], max_reasoning_length: int | None
+) -> None:
+    """Display chat messages with ANSI colors in terminal."""
+    separator = f'{TERMINAL_GRAY}─────────────────────────────────────────────────────────{TERMINAL_RESET}'
+
+    for i, msg in enumerate(messages):
+        role = msg.get('role', 'unknown').lower()
+        color = ROLE_COLORS_TERMINAL.get(role, '')
+        label = ROLE_LABELS.get(role, f'{role.capitalize()}:')
+
+        print(f'{color}{TERMINAL_BOLD}{label}{TERMINAL_RESET}')
+
+        if role == 'assistant':
+            reasoning, answer = _build_assistant_content_parts(
+                msg, max_reasoning_length
+            )
+            if reasoning:
+                # Use lighter gray without dim for better readability
+                print(f'\033[38;5;246m{reasoning.strip()}{TERMINAL_RESET}')
+                if answer:
+                    print()  # Blank line between reasoning and answer
+            if answer:
+                print(f'{color}{answer.strip()}{TERMINAL_RESET}')
+        else:
+            content = msg.get('content', '')
+            print(f'{color}{content}{TERMINAL_RESET}')
+
+        if i < len(messages) - 1:
+            print(separator)
+
+
+def show_chat(
+    messages: list[dict[str, Any]], max_reasoning_length: int | None = 2000
+) -> None:
+    """
+    Display chat messages with colored formatting.
+
+    Automatically detects notebook vs terminal environment and formats accordingly.
+    Handles reasoning_content in assistant messages, formatting it with <think> tags.
+
+    Args:
+        messages: List of message dicts with 'role', 'content', and optionally 'reasoning_content'
+        max_reasoning_length: Max chars for reasoning before truncation (None = no limit)
+
+    Example:
+        >>> messages = [
+        ...     {"role": "system", "content": "You are helpful."},
+        ...     {"role": "user", "content": "Hello!"},
+        ...     {"role": "assistant", "content": "Hi!", "reasoning_content": "User greeted me..."},
+        ... ]
+        >>> show_chat(messages)
+    """
+    if _is_notebook():
+        _show_chat_html(messages, max_reasoning_length)
+    else:
+        _show_chat_terminal(messages, max_reasoning_length)
+
+
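Because `max_reasoning_length` defaults to 2000, a long `reasoning_content` is wrapped in `<think>` tags and pushed through `_truncate_text` before rendering. A small illustrative call (the message content here is made up):

```python
# Illustrative only: the reasoning trace below exceeds the limit, so the
# rendered output shows its head and tail around a '[SKIP n chars]' marker.
from llm_utils import show_chat

messages = [
    {'role': 'user', 'content': 'Summarize the report.'},
    {
        'role': 'assistant',
        'content': 'Here is the summary...',
        'reasoning_content': 'step one... ' * 500,  # ~6000 chars
    },
]
show_chat(messages, max_reasoning_length=500)
```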
+def get_conversation_one_turn(
+    system_msg: str | None = None,
+    user_msg: str | None = None,
+    assistant_msg: str | None = None,
+    assistant_prefix: str | None = None,
+    return_format: str = 'chatml',
+) -> Any:
+    """Build a one-turn conversation."""
+    messages: list[dict[str, str]] = []
+
+    if system_msg is not None:
+        messages.append({'role': 'system', 'content': system_msg})
+    if user_msg is not None:
+        messages.append({'role': 'user', 'content': user_msg})
+    if assistant_msg is not None:
+        messages.append({'role': 'assistant', 'content': assistant_msg})
+
+    if assistant_prefix is not None:
+        if return_format == 'chatml':
+            raise ValueError('Change return_format to "text" to use assistant_prefix')
+        if not messages or messages[-1]['role'] != 'user':
+            raise ValueError(
+                'Last message must be from user when using assistant_prefix'
+            )
+
+        from .transform import transform_messages
+
+        msg = transform_messages(messages, 'chatml', 'text', add_generation_prompt=True)
+        return str(msg) + assistant_prefix
+
+    if return_format != 'chatml':
+        raise ValueError(f'Unsupported return_format: {return_format}')
+
+    return messages
+
+
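The branches above give `get_conversation_one_turn` two usage modes: the default returns a ChatML list, while `assistant_prefix` requires `return_format='text'` and a trailing user message. A sketch of both (the exact rendered text depends on `transform_messages`):

```python
from llm_utils import get_conversation_one_turn

# Mode 1 (default): returns a list of ChatML message dicts.
conv = get_conversation_one_turn(
    system_msg='You are helpful.',
    user_msg='Hello!',
)

# Mode 2: prefill the assistant reply; return_format='chatml' would raise.
prompt = get_conversation_one_turn(
    user_msg='Continue the story:',
    assistant_prefix='Once upon a time',
    return_format='text',
)
# -> rendered chat-template string ending with 'Once upon a time'
```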
+def highlight_diff_chars(text1: str, text2: str) -> str:
+    """Return a string with deletions in red and additions in green."""
+    matcher = SequenceMatcher(None, text1, text2)
+    html_parts: list[str] = []
+
+    for tag, i1, i2, j1, j2 in matcher.get_opcodes():
+        if tag == 'equal':
+            html_parts.append(text1[i1:i2])
+        elif tag == 'replace':
+            if i1 != i2:
+                html_parts.append(
+                    f'<span style="background-color:#ffd6d6; color:#b20000;">{text1[i1:i2]}</span>'
+                )
+            if j1 != j2:
+                html_parts.append(
+                    f'<span style="background-color:#d6ffd6; color:#006600;">{text2[j1:j2]}</span>'
+                )
+        elif tag == 'delete':
+            html_parts.append(
+                f'<span style="background-color:#ffd6d6; color:#b20000;">{text1[i1:i2]}</span>'
+            )
+        elif tag == 'insert':
+            html_parts.append(
+                f'<span style="background-color:#d6ffd6; color:#006600;">{text2[j1:j2]}</span>'
+            )
+
+    return ''.join(html_parts)
+
+
+def show_string_diff(old: str, new: str) -> None:
+    """Display a visual diff between two strings (old -> new)."""
+    display(HTML(highlight_diff_chars(old, new)))
+
+
+def display_conversations(data1: Any, data2: Any) -> None:
+    """Display two conversations side by side. Deprecated."""
+    import warnings
+
+    warnings.warn(
+        'display_conversations is deprecated and will be removed.',
+        DeprecationWarning,
+        stacklevel=2,
+    )
+    print('=== Conversation 1 ===')
+    show_chat(data1)
+    print('\n=== Conversation 2 ===')
+    show_chat(data2)
+
+
+def display_chat_messages_as_html(*args, **kwargs):
+    """Deprecated alias for show_chat."""
+    import warnings
+
+    warnings.warn(
+        'display_chat_messages_as_html is deprecated, use show_chat instead.',
+        DeprecationWarning,
+        stacklevel=2,
+    )
+    return show_chat(*args, **kwargs)
+
+
+__all__ = [
+    'show_chat',
+    'get_conversation_one_turn',
+    'highlight_diff_chars',
+    'show_string_diff',
+    'display_conversations',
+    'display_chat_messages_as_html',
+]
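`show_string_diff` is the notebook-facing wrapper; `highlight_diff_chars` returns the raw HTML and can be used on its own. A short usage sketch:

```python
from llm_utils.chat_format import highlight_diff_chars, show_string_diff

# In a notebook this renders inline: deletions in red, insertions in green.
show_string_diff('the quick brown fox', 'the quick red fox')

# Outside IPython, the HTML string itself is still usable.
html = highlight_diff_chars('colour', 'color')
print(html)  # span-wrapped markup around the changed characters
```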
src/llm_utils/lm/llm.py

@@ -9,12 +9,12 @@ from typing import Any, Dict, List, Optional, cast

 from httpx import Timeout
 from loguru import logger
-from openai import AuthenticationError, BadRequestError, OpenAI, RateLimitError
+from openai import AuthenticationError, BadRequestError, OpenAI, RateLimitError, APITimeoutError
 from openai.types.chat import ChatCompletionMessageParam
 from pydantic import BaseModel

-from speedy_utils.common.utils_io import jdumps
 from speedy_utils import clean_traceback
+from speedy_utils.common.utils_io import jdumps

 from .base_prompt_builder import BasePromptBuilder
 from .mixins import (
@@ -173,34 +173,45 @@ class LLM(
             )
             # Store raw response from client
             self.last_ai_response = completion
+        except APITimeoutError as exc:
+            error_msg = f'OpenAI API timeout ({api_kwargs['timeout']}) error: {exc} for model {model_name}'
+            logger.error(error_msg)
+            raise
         except (AuthenticationError, RateLimitError, BadRequestError) as exc:
             error_msg = f'OpenAI API error ({type(exc).__name__}): {exc}'
             logger.error(error_msg)
             raise
+        except ValueError as exc:
+            logger.error(f'ValueError during API call: {exc}')
+            raise
         except Exception as e:
             is_length_error = 'Length' in str(e) or 'maximum context length' in str(e)
             if is_length_error:
                 raise ValueError(
                     f'Input too long for model {model_name}. Error: {str(e)[:100]}...'
                 ) from e
-            # Re-raise all other exceptions
             raise
         # print(completion)

         results: list[dict[str, Any]] = []
         for choice in completion.choices:
+            assistant_message = [{'role': 'assistant', 'content': choice.message.content}]
+            try:
+                reasoning_content = choice.message.reasoning
+            except:
+                reasoning_content = None
+            if reasoning_content:
+                assistant_message[0]['reasoning_content'] = reasoning_content
+
             choice_messages = cast(
                 Messages,
-                messages +
+                messages + assistant_message,
             )
             result_dict = {
                 'parsed': choice.message.content,
                 'messages': choice_messages,
             }

-            # Add reasoning content if this is a reasoning model
-            if self.is_reasoning_model and hasattr(choice.message, 'reasoning_content'):
-                result_dict['reasoning_content'] = choice.message.reasoning_content

             results.append(result_dict)
         return results
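With this hunk, timeouts surface as a distinct `APITimeoutError` (logged with the configured timeout), and each returned choice now carries the appended assistant turn, including any `reasoning_content`, in its `messages` list. A hedged caller-side sketch; the `llm(messages)` call style is an assumption, not shown in this diff:

```python
from typing import Any

from openai import APITimeoutError


def call_with_retry(llm: Any, messages: list[dict[str, Any]]) -> list[dict[str, Any]]:
    """Retry once on timeout; per this hunk the timeout is already logged."""
    try:
        return llm(messages)  # hypothetical call style for the LLM wrapper
    except APITimeoutError:
        return llm(messages)


def print_reasoning(results: list[dict[str, Any]]) -> None:
    """Per this hunk, the appended assistant message may carry reasoning_content."""
    for r in results:
        last = r['messages'][-1]
        if 'reasoning_content' in last:
            print(last['reasoning_content'])
```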
@@ -394,12 +405,12 @@ class LLM(
     ) -> list[dict[str, Any]]:
         """Inspect the message history of a specific response choice."""
         if hasattr(self, '_last_conversations'):
-            from llm_utils import
+            from llm_utils import show_chat

             conv = self._last_conversations[idx]
             if k_last_messages > 0:
                 conv = conv[-k_last_messages:]
-            return
+            return show_chat(conv)
         raise ValueError('No message history available. Make a call first.')

     def __inner_call__(
@@ -442,7 +453,7 @@ class LLM(
         is_reasoning_model: bool = False,
         lora_path: str | None = None,
         vllm_cmd: str | None = None,
-        vllm_timeout: int =
+        vllm_timeout: int = 0.1,
         vllm_reuse: bool = True,
         timeout: float | Timeout | None = None,
         **model_kwargs,
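For reference, these keyword arguments sit in the `LLM` constructor signature; a hedged sketch in which only the parameter names and defaults visible in this hunk are taken from the source, and everything else about construction is assumed:

```python
# Hedged sketch: how the LLM class consumes these is not shown here.
vllm_kwargs = dict(
    is_reasoning_model=False,
    lora_path=None,
    vllm_cmd=None,
    vllm_timeout=0.1,  # default shown in this hunk
    vllm_reuse=True,
    timeout=None,
)
# llm = LLM(..., **vllm_kwargs)  # remaining required arguments are unknowns
```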
|