PyPI - kash-shell - Versions diffs - 0.3.17__py3-none-any.whl → 0.3.20__py3-none-any.whl - Mend

kash-shell 0.3.17__py3-none-any.whl → 0.3.20__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (49)

kash/actions/core/{markdownify.py → markdownify_html.py} +3 -6
kash/actions/core/minify_html.py +41 -0
kash/commands/base/show_command.py +11 -1
kash/commands/workspace/workspace_commands.py +10 -88
kash/config/colors.py +6 -2
kash/docs/markdown/topics/a1_what_is_kash.md +52 -23
kash/docs/markdown/topics/a2_installation.md +17 -30
kash/docs/markdown/topics/a3_getting_started.md +5 -19
kash/exec/__init__.py +3 -0
kash/exec/action_exec.py +3 -3
kash/exec/fetch_url_items.py +109 -0
kash/exec/precondition_registry.py +3 -3
kash/file_storage/file_store.py +24 -1
kash/file_storage/store_filenames.py +4 -0
kash/help/function_param_info.py +1 -1
kash/help/help_pages.py +1 -1
kash/help/help_printing.py +1 -1
kash/llm_utils/llm_features.py +5 -1
kash/llm_utils/llms.py +18 -8
kash/media_base/media_cache.py +48 -24
kash/media_base/media_services.py +63 -14
kash/media_base/services/local_file_media.py +9 -1
kash/model/items_model.py +22 -8
kash/model/media_model.py +9 -1
kash/model/params_model.py +9 -3
kash/utils/common/function_inspect.py +97 -1
kash/utils/common/parse_docstring.py +347 -0
kash/utils/common/testing.py +58 -0
kash/utils/common/url_slice.py +329 -0
kash/utils/file_utils/file_formats.py +1 -1
kash/utils/text_handling/markdown_utils.py +424 -16
kash/web_content/web_extract.py +34 -15
kash/web_content/web_page_model.py +10 -1
kash/web_gen/templates/base_styles.css.jinja +137 -15
kash/web_gen/templates/base_webpage.html.jinja +13 -17
kash/web_gen/templates/components/toc_scripts.js.jinja +319 -0
kash/web_gen/templates/components/toc_styles.css.jinja +284 -0
kash/web_gen/templates/components/tooltip_scripts.js.jinja +730 -0
kash/web_gen/templates/components/tooltip_styles.css.jinja +482 -0
kash/web_gen/templates/content_styles.css.jinja +13 -8
kash/web_gen/templates/simple_webpage.html.jinja +15 -481
kash/workspaces/workspaces.py +10 -1
{kash_shell-0.3.17.dist-info → kash_shell-0.3.20.dist-info}/METADATA +75 -72
{kash_shell-0.3.17.dist-info → kash_shell-0.3.20.dist-info}/RECORD +47 -40
kash/exec/fetch_url_metadata.py +0 -72
kash/help/docstring_utils.py +0 -111
{kash_shell-0.3.17.dist-info → kash_shell-0.3.20.dist-info}/WHEEL +0 -0
{kash_shell-0.3.17.dist-info → kash_shell-0.3.20.dist-info}/entry_points.txt +0 -0
{kash_shell-0.3.17.dist-info → kash_shell-0.3.20.dist-info}/licenses/LICENSE +0 -0

kash/model/params_model.py CHANGED Viewed

@@ -206,10 +206,10 @@ A list of parameter declarations, possibly with default values.
 # These are the default models for typical use cases.
 # The user may override them with parameters.
-DEFAULT_CAREFUL_LLM = LLM.o1_preview
+DEFAULT_CAREFUL_LLM = LLM.o3
 DEFAULT_STRUCTURED_LLM = LLM.gpt_4o
-DEFAULT_STANDARD_LLM = LLM.claude_3_7_sonnet
-DEFAULT_FAST_LLM = LLM.claude_3_5_haiku
+DEFAULT_STANDARD_LLM = LLM.claude_4_sonnet
+DEFAULT_FAST_LLM = LLM.o1_mini
 # Parameters set globally such as in the workspace.
@@ -262,6 +262,12 @@ COMMON_ACTION_PARAMS: dict[str, Param] = {
         valid_str_values=list(LLM),
         is_open_ended=True,
     ),
+    "model_list": Param(
+        "model_list",
+        "A list of LLMs to use, as names separated by commas.",
+        type=str,
+        default_value=None,
+    ),
     "language": Param(
         "language",
         "The language of the input audio or text.",

kash/utils/common/function_inspect.py CHANGED Viewed

@@ -4,7 +4,14 @@ from collections.abc import Callable
 from dataclasses import dataclass
 from enum import Enum
 from inspect import Parameter
-from typing import Any, Union, cast, get_args, get_origin  # pyright: ignore[reportDeprecated]
+from typing import (
+    Any,
+    Literal,
+    Union,  # pyright: ignore[reportDeprecated]
+    cast,
+    get_args,
+    get_origin,
+)
 NO_DEFAULT = Parameter.empty  # Alias for clarity
@@ -90,6 +97,23 @@ def _resolve_type_details(annotation: Any) -> tuple[type | None, type | None, bo
             return (type(None), None, True)
         # If multiple non_none_args (e.g., int | str), current_annotation remains the Union for now.
+    # Handle Literal types
+    if origin is Literal:
+        if args:
+            # Determine the common type of all literal values
+            literal_types = {type(arg) for arg in args}
+            if len(literal_types) == 1:
+                # All literals are the same type
+                final_effective_type = literal_types.pop()
+            else:
+                # Mixed types, fall back to the most common base type or str if all are basic types
+                if all(isinstance(arg, (str, int, float, bool)) for arg in args):
+                    # For mixed basic types, use str as the effective type
+                    final_effective_type = str
+                else:
+                    final_effective_type = None
+            return final_effective_type, None, is_optional_flag
     #  Determine effective_type and inner_type from (potentially unwrapped) current_annotation
     final_effective_type: type | None = None
     final_inner_type: type | None = None
@@ -426,3 +450,75 @@ def test_inspect_function_parameters_updated():
             is_explicitly_optional=True,
         )
     ]
+def test_literal_types():
+    """Test Literal type support in function parameter inspection."""
+    # Test string literals
+    def func_string_literal(converter: Literal["markitdown", "marker"] = "markitdown"):
+        return converter
+    params = inspect_function_params(func_string_literal)
+    assert len(params) == 1
+    param = params[0]
+    assert param.name == "converter"
+    assert param.effective_type is str
+    assert param.default == "markitdown"
+    assert param.is_explicitly_optional is False
+    # Test integer literals
+    def func_int_literal(count: Literal[1, 2, 3] = 1):
+        return count
+    params = inspect_function_params(func_int_literal)
+    assert len(params) == 1
+    param = params[0]
+    assert param.name == "count"
+    assert param.effective_type is int
+    assert param.default == 1
+    # Test mixed type literals (should default to str)
+    def func_mixed_literal(value: Literal["auto", 42]):
+        return value
+    params = inspect_function_params(func_mixed_literal)
+    assert len(params) == 1
+    param = params[0]
+    assert param.name == "value"
+    assert param.effective_type is str
+    assert param.default == NO_DEFAULT
+    # Test Literal directly (without TypeAlias to avoid scope issues)
+    def func_direct_literal(converter: Literal["markitdown", "marker"] = "markitdown"):
+        return converter
+    params = inspect_function_params(func_direct_literal)
+    assert len(params) == 1
+    param = params[0]
+    assert param.name == "converter"
+    assert param.effective_type is str
+    assert param.default == "markitdown"
+    # Test optional literal
+    def func_optional_literal(mode: Literal["fast", "slow"] | None = None):
+        return mode
+    params = inspect_function_params(func_optional_literal)
+    assert len(params) == 1
+    param = params[0]
+    assert param.name == "mode"
+    assert param.effective_type is str
+    assert param.is_explicitly_optional is True
+    assert param.default is None
+    # Test boolean literals
+    def func_bool_literal(flag: Literal[True, False] = True):
+        return flag
+    params = inspect_function_params(func_bool_literal)
+    assert len(params) == 1
+    param = params[0]
+    assert param.name == "flag"
+    assert param.effective_type is bool
+    assert param.default is True

kash/utils/common/parse_docstring.py ADDED Viewed

@@ -0,0 +1,347 @@
+import re
+from dataclasses import dataclass, field
+from textwrap import dedent
+@dataclass
+class Docstring:
+    """
+    A parsed docstring.
+    """
+    body: str = ""
+    param: dict[str, str] = field(default_factory=dict)
+    type: dict[str, str] = field(default_factory=dict)
+    returns: str = ""
+    rtype: str = ""
+def parse_docstring(docstring: str) -> Docstring:
+    """
+    Parse a docstring in either reStructuredText or Google style format.
+    Supports two formats:
+    - reStructuredText style: `:param name: description`, `:type name: type`, etc.
+    - Google style: `Args:` section with `name (type): description` format
+    The parser automatically detects which format is used based on the presence
+    of `:param` directives or `Args:` sections.
+    """
+    docstring = dedent(docstring).strip()
+    if not docstring:
+        return Docstring()
+    # Detect format based on content
+    if ":param " in docstring or ":type " in docstring or ":return" in docstring:
+        return _parse_rst_docstring(docstring)
+    elif re.search(r"\b(Args|Arguments|Returns?):", docstring):
+        return _parse_google_docstring(docstring)
+    else:
+        # No special formatting, just treat as body
+        return Docstring(body=docstring)
+def _parse_rst_docstring(docstring: str) -> Docstring:
+    """
+    Parse reStructuredText-style docstring with :param: and :type: directives.
+    """
+    lines = docstring.split("\n")
+    result = Docstring()
+    body_lines = []
+    for line in lines:
+        if line.strip().startswith(":"):
+            break
+        body_lines.append(line)
+    result.body = "\n".join(body_lines).strip()
+    _parse_rst_fields(lines[len(body_lines) :], result)
+    return result
+def _parse_google_docstring(docstring: str) -> Docstring:
+    """
+    Parse Google-style docstring with Args: and Returns: sections.
+    """
+    lines = docstring.split("\n")
+    result = Docstring()
+    # Find sections using regex
+    sections = {}
+    for i, line in enumerate(lines):
+        stripped = line.strip()
+        if re.match(r"^(Args|Arguments):\s*$", stripped, re.IGNORECASE):
+            sections["args"] = i
+        elif re.match(r"^Returns?:\s*$", stripped, re.IGNORECASE):
+            sections["returns"] = i
+    # Body is everything before the first section
+    body_end = min(sections.values()) if sections else len(lines)
+    result.body = "\n".join(lines[:body_end]).strip()
+    # Parse each section
+    if "args" in sections:
+        _parse_google_args_section(lines, sections["args"] + 1, result, sections)
+    if "returns" in sections:
+        _parse_google_returns_section(lines, sections["returns"] + 1, result, sections)
+    return result
+def _parse_google_args_section(
+    lines: list[str], start_idx: int, result: Docstring, sections: dict[str, int]
+) -> None:
+    """
+    Parse the Args: section of a Google-style docstring.
+    """
+    # Find the end of this section
+    end_idx = len(lines)
+    for section_start in sections.values():
+        if section_start > start_idx:
+            end_idx = min(end_idx, section_start)
+    # Determine base indentation from first non-empty line
+    base_indent = None
+    for i in range(start_idx, end_idx):
+        line = lines[i]
+        if line.strip():
+            base_indent = len(line) - len(line.lstrip())
+            break
+    if base_indent is None:
+        return
+    i = start_idx
+    while i < end_idx:
+        line = lines[i]
+        # Skip empty lines
+        if not line.strip():
+            i += 1
+            continue
+        # Check if this line is at the base indentation level (parameter line)
+        line_indent = len(line) - len(line.lstrip())
+        if line_indent == base_indent:
+            param_line = line.strip()
+            # More robust regex that allows underscores and handles various formats
+            # Match: name (type): description
+            match = re.match(r"([a-zA-Z_]\w*)\s*\(([^)]+)\)\s*:\s*(.*)", param_line)
+            if match:
+                name, param_type, description = match.groups()
+                result.param[name] = description.strip()
+                result.type[name] = param_type.strip()
+            else:
+                # Match: name: description
+                match = re.match(r"([a-zA-Z_]\w*)\s*:\s*(.*)", param_line)
+                if match:
+                    name, description = match.groups()
+                    result.param[name] = description.strip()
+            # Collect continuation lines (more indented than base)
+            i += 1
+            continuation_lines = []
+            while i < end_idx:
+                if not lines[i].strip():
+                    i += 1
+                    continue
+                next_indent = len(lines[i]) - len(lines[i].lstrip())
+                if next_indent > base_indent:
+                    continuation_lines.append(lines[i].strip())
+                    i += 1
+                else:
+                    break
+            # Add continuation to the last parameter
+            if continuation_lines and result.param:
+                last_param = list(result.param.keys())[-1]
+                result.param[last_param] += " " + " ".join(continuation_lines)
+        else:
+            i += 1
+def _parse_google_returns_section(
+    lines: list[str], start_idx: int, result: Docstring, sections: dict[str, int]
+) -> None:
+    """
+    Parse the Returns: section of a Google-style docstring.
+    """
+    # Find the end of this section
+    end_idx = len(lines)
+    for section_start in sections.values():
+        if section_start > start_idx:
+            end_idx = min(end_idx, section_start)
+    # Collect all content from this section
+    content_lines = []
+    for i in range(start_idx, end_idx):
+        line = lines[i]
+        if line.strip():
+            content_lines.append(line.strip())
+    if content_lines:
+        content = " ".join(content_lines).strip()
+        # Try to parse "type: description" format
+        if ":" in content and not content.startswith(":"):
+            parts = content.split(":", 1)
+            if len(parts) == 2 and parts[0].strip():
+                result.rtype = parts[0].strip()
+                result.returns = parts[1].strip()
+            else:
+                result.returns = content
+        else:
+            result.returns = content
+def _parse_rst_fields(lines: list[str], result: Docstring) -> None:
+    """Parse reStructuredText-style field directives."""
+    current_field = None
+    current_content = []
+    def save_current_field():
+        if current_field and current_content:
+            content = " ".join(current_content).strip()
+            if current_field.startswith("param "):
+                result.param[current_field[6:]] = content
+            elif current_field.startswith("type "):
+                result.type[current_field[5:]] = content
+            elif current_field == "return":
+                result.returns = content
+            elif current_field == "rtype":
+                result.rtype = content
+    for line in lines:
+        if line.strip().startswith(":"):
+            save_current_field()
+            current_field, _, content = line.strip()[1:].partition(":")
+            current_content = [content.strip()]
+        else:
+            current_content.append(line.strip())
+    save_current_field()
+## Tests
+def test_parse_rst_docstring():
+    rst_docstring = """
+    Search for a string in files at the given paths and return their store paths.
+    Useful to find all docs or resources matching a string or regex.
+    :param sort: How to sort results. Can be `path` or `score`.
+    :param ignore_case: Ignore case when searching.
+    :type sort: str
+    :type ignore_case: bool
+    :return: The search results.
+    :rtype: CommandOutput
+    """
+    parsed = parse_docstring(rst_docstring)
+    assert (
+        parsed.body
+        == "Search for a string in files at the given paths and return their store paths.\nUseful to find all docs or resources matching a string or regex."
+    )
+    assert parsed.param == {
+        "sort": "How to sort results. Can be `path` or `score`.",
+        "ignore_case": "Ignore case when searching.",
+    }
+    assert parsed.type == {"sort": "str", "ignore_case": "bool"}
+    assert parsed.returns == "The search results."
+    assert parsed.rtype == "CommandOutput"
+def test_parse_google_docstring_with_types():
+    google_docstring = """
+    Search for a string in files at the given paths and return their store paths.
+    Useful to find all docs or resources matching a string or regex.
+    Args:
+        sort (str): How to sort results. Can be `path` or `score`.
+        ignore_case (bool): Ignore case when searching.
+    Returns:
+        CommandOutput: The search results.
+    """
+    parsed = parse_docstring(google_docstring)
+    assert (
+        parsed.body
+        == "Search for a string in files at the given paths and return their store paths.\nUseful to find all docs or resources matching a string or regex."
+    )
+    assert parsed.param == {
+        "sort": "How to sort results. Can be `path` or `score`.",
+        "ignore_case": "Ignore case when searching.",
+    }
+    assert parsed.type == {"sort": "str", "ignore_case": "bool"}
+    assert parsed.returns == "The search results."
+    assert parsed.rtype == "CommandOutput"
+def test_parse_google_docstring_without_types():
+    google_no_types = """
+    Process the data.
+    Args:
+        data: The input data to process.
+        verbose: Whether to print verbose output.
+    Returns:
+        The processed result.
+    """
+    parsed = parse_docstring(google_no_types)
+    assert parsed.body == "Process the data."
+    assert parsed.param == {
+        "data": "The input data to process.",
+        "verbose": "Whether to print verbose output.",
+    }
+    assert parsed.type == {}
+    assert parsed.returns == "The processed result."
+    assert parsed.rtype == ""
+def test_parse_simple_docstring():
+    simple_docstring = """Some text."""
+    parsed = parse_docstring(simple_docstring)
+    assert parsed.body == "Some text."
+    assert parsed.param == {}
+    assert parsed.type == {}
+    assert parsed.returns == ""
+    assert parsed.rtype == ""
+def test_parse_docstring_with_underscores():
+    docstring = """
+    Test function.
+    Args:
+        some_param (str): A parameter with underscores.
+        another_param_name: Another parameter without type.
+    """
+    parsed = parse_docstring(docstring)
+    assert parsed.param == {
+        "some_param": "A parameter with underscores.",
+        "another_param_name": "Another parameter without type.",
+    }
+    assert parsed.type == {"some_param": "str"}
+def test_parse_empty_docstring():
+    """Test empty docstring handling."""
+    parsed = parse_docstring("")
+    assert parsed.body == ""
+    assert parsed.param == {}
+    assert parsed.type == {}
+    assert parsed.returns == ""
+    assert parsed.rtype == ""

kash/utils/common/testing.py ADDED Viewed

@@ -0,0 +1,58 @@
+from __future__ import annotations
+import os
+from collections.abc import Callable
+from functools import wraps
+from typing import Literal, TypeAlias
+TestMarker: TypeAlias = Literal["online", "integration"]
+"""
+Valid markers for tests. Currently just marking online tests (e.g. LLM APIs that
+that require keys) and more complex integration tests.
+"""
+def enable_if(marker: TestMarker) -> Callable:
+    """
+    Mark a test as having external dependencies.
+    Test runs only if the corresponding environment variable is set, e.g.
+    for the marker "online", checks for ENABLE_TESTS_ONLINE=1.
+    Automatically sets pytest markers when pytest is available, but safe to use in
+    runtime code as well.
+    Example usage:
+    ```
+    def test_foo():
+        ...
+    @enable_if("online")  # Only runs if ENABLE_TESTS_ONLINE=1
+    def test_bar():
+        ...
+    ```
+    """
+    def decorator(func: Callable) -> Callable:
+        @wraps(func)
+        def wrapper(*args, **kwargs):
+            env_var = f"ENABLE_TESTS_{marker.upper()}"
+            if not os.getenv(env_var):
+                print(f"Skipping test function: {func.__name__} (set {env_var}=1 to enable)")
+                return
+            return func(*args, **kwargs)
+        # Set pytest markers automatically if pytest is available
+        try:
+            import pytest
+            wrapper = pytest.mark.integration(wrapper)
+            wrapper = getattr(pytest.mark, marker)(wrapper)
+        except ImportError:
+            # Pytest not available, which is fine for non-test runs
+            pass
+        return wrapper
+    return decorator

kash-shell 0.3.17__py3-none-any.whl → 0.3.20__py3-none-any.whl

kash-shell 0.3.17__py3-none-any.whl → 0.3.20__py3-none-any.whl