yamlgraph 0.3.9__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (185) hide show
  1. examples/__init__.py +1 -0
  2. examples/codegen/__init__.py +5 -0
  3. examples/codegen/models/__init__.py +13 -0
  4. examples/codegen/models/schemas.py +76 -0
  5. examples/codegen/tests/__init__.py +1 -0
  6. examples/codegen/tests/test_ai_helpers.py +235 -0
  7. examples/codegen/tests/test_ast_analysis.py +174 -0
  8. examples/codegen/tests/test_code_analysis.py +134 -0
  9. examples/codegen/tests/test_code_context.py +301 -0
  10. examples/codegen/tests/test_code_nav.py +89 -0
  11. examples/codegen/tests/test_dependency_tools.py +119 -0
  12. examples/codegen/tests/test_example_tools.py +185 -0
  13. examples/codegen/tests/test_git_tools.py +112 -0
  14. examples/codegen/tests/test_impl_agent_schemas.py +193 -0
  15. examples/codegen/tests/test_impl_agent_v4_graph.py +94 -0
  16. examples/codegen/tests/test_jedi_analysis.py +226 -0
  17. examples/codegen/tests/test_meta_tools.py +250 -0
  18. examples/codegen/tests/test_plan_discovery_prompt.py +98 -0
  19. examples/codegen/tests/test_syntax_tools.py +85 -0
  20. examples/codegen/tests/test_synthesize_prompt.py +94 -0
  21. examples/codegen/tests/test_template_tools.py +244 -0
  22. examples/codegen/tools/__init__.py +80 -0
  23. examples/codegen/tools/ai_helpers.py +420 -0
  24. examples/codegen/tools/ast_analysis.py +92 -0
  25. examples/codegen/tools/code_context.py +180 -0
  26. examples/codegen/tools/code_nav.py +52 -0
  27. examples/codegen/tools/dependency_tools.py +120 -0
  28. examples/codegen/tools/example_tools.py +188 -0
  29. examples/codegen/tools/git_tools.py +151 -0
  30. examples/codegen/tools/impl_executor.py +614 -0
  31. examples/codegen/tools/jedi_analysis.py +311 -0
  32. examples/codegen/tools/meta_tools.py +202 -0
  33. examples/codegen/tools/syntax_tools.py +26 -0
  34. examples/codegen/tools/template_tools.py +356 -0
  35. examples/fastapi_interview.py +167 -0
  36. examples/npc/api/__init__.py +1 -0
  37. examples/npc/api/app.py +100 -0
  38. examples/npc/api/routes/__init__.py +5 -0
  39. examples/npc/api/routes/encounter.py +182 -0
  40. examples/npc/api/session.py +330 -0
  41. examples/npc/demo.py +387 -0
  42. examples/npc/nodes/__init__.py +5 -0
  43. examples/npc/nodes/image_node.py +92 -0
  44. examples/npc/run_encounter.py +230 -0
  45. examples/shared/__init__.py +0 -0
  46. examples/shared/replicate_tool.py +238 -0
  47. examples/storyboard/__init__.py +1 -0
  48. examples/storyboard/generate_videos.py +335 -0
  49. examples/storyboard/nodes/__init__.py +12 -0
  50. examples/storyboard/nodes/animated_character_node.py +248 -0
  51. examples/storyboard/nodes/animated_image_node.py +138 -0
  52. examples/storyboard/nodes/character_node.py +162 -0
  53. examples/storyboard/nodes/image_node.py +118 -0
  54. examples/storyboard/nodes/replicate_tool.py +49 -0
  55. examples/storyboard/retry_images.py +118 -0
  56. scripts/demo_async_executor.py +212 -0
  57. scripts/demo_interview_e2e.py +200 -0
  58. scripts/demo_streaming.py +140 -0
  59. scripts/run_interview_demo.py +94 -0
  60. scripts/test_interrupt_fix.py +26 -0
  61. tests/__init__.py +1 -0
  62. tests/conftest.py +178 -0
  63. tests/integration/__init__.py +1 -0
  64. tests/integration/test_animated_storyboard.py +63 -0
  65. tests/integration/test_cli_commands.py +242 -0
  66. tests/integration/test_colocated_prompts.py +139 -0
  67. tests/integration/test_map_demo.py +50 -0
  68. tests/integration/test_memory_demo.py +283 -0
  69. tests/integration/test_npc_api/__init__.py +1 -0
  70. tests/integration/test_npc_api/test_routes.py +357 -0
  71. tests/integration/test_npc_api/test_session.py +216 -0
  72. tests/integration/test_pipeline_flow.py +105 -0
  73. tests/integration/test_providers.py +163 -0
  74. tests/integration/test_resume.py +75 -0
  75. tests/integration/test_subgraph_integration.py +295 -0
  76. tests/integration/test_subgraph_interrupt.py +106 -0
  77. tests/unit/__init__.py +1 -0
  78. tests/unit/test_agent_nodes.py +355 -0
  79. tests/unit/test_async_executor.py +346 -0
  80. tests/unit/test_checkpointer.py +212 -0
  81. tests/unit/test_checkpointer_factory.py +212 -0
  82. tests/unit/test_cli.py +121 -0
  83. tests/unit/test_cli_package.py +81 -0
  84. tests/unit/test_compile_graph_map.py +132 -0
  85. tests/unit/test_conditions_routing.py +253 -0
  86. tests/unit/test_config.py +93 -0
  87. tests/unit/test_conversation_memory.py +276 -0
  88. tests/unit/test_database.py +145 -0
  89. tests/unit/test_deprecation.py +104 -0
  90. tests/unit/test_executor.py +172 -0
  91. tests/unit/test_executor_async.py +179 -0
  92. tests/unit/test_export.py +149 -0
  93. tests/unit/test_expressions.py +178 -0
  94. tests/unit/test_feature_brainstorm.py +194 -0
  95. tests/unit/test_format_prompt.py +145 -0
  96. tests/unit/test_generic_report.py +200 -0
  97. tests/unit/test_graph_commands.py +327 -0
  98. tests/unit/test_graph_linter.py +627 -0
  99. tests/unit/test_graph_loader.py +357 -0
  100. tests/unit/test_graph_schema.py +193 -0
  101. tests/unit/test_inline_schema.py +151 -0
  102. tests/unit/test_interrupt_node.py +182 -0
  103. tests/unit/test_issues.py +164 -0
  104. tests/unit/test_jinja2_prompts.py +85 -0
  105. tests/unit/test_json_extract.py +134 -0
  106. tests/unit/test_langsmith.py +600 -0
  107. tests/unit/test_langsmith_tools.py +204 -0
  108. tests/unit/test_llm_factory.py +109 -0
  109. tests/unit/test_llm_factory_async.py +118 -0
  110. tests/unit/test_loops.py +403 -0
  111. tests/unit/test_map_node.py +144 -0
  112. tests/unit/test_no_backward_compat.py +56 -0
  113. tests/unit/test_node_factory.py +348 -0
  114. tests/unit/test_passthrough_node.py +126 -0
  115. tests/unit/test_prompts.py +324 -0
  116. tests/unit/test_python_nodes.py +198 -0
  117. tests/unit/test_reliability.py +298 -0
  118. tests/unit/test_result_export.py +234 -0
  119. tests/unit/test_router.py +296 -0
  120. tests/unit/test_sanitize.py +99 -0
  121. tests/unit/test_schema_loader.py +295 -0
  122. tests/unit/test_shell_tools.py +229 -0
  123. tests/unit/test_state_builder.py +331 -0
  124. tests/unit/test_state_builder_map.py +104 -0
  125. tests/unit/test_state_config.py +197 -0
  126. tests/unit/test_streaming.py +307 -0
  127. tests/unit/test_subgraph.py +596 -0
  128. tests/unit/test_template.py +190 -0
  129. tests/unit/test_tool_call_integration.py +164 -0
  130. tests/unit/test_tool_call_node.py +178 -0
  131. tests/unit/test_tool_nodes.py +129 -0
  132. tests/unit/test_websearch.py +234 -0
  133. yamlgraph/__init__.py +35 -0
  134. yamlgraph/builder.py +110 -0
  135. yamlgraph/cli/__init__.py +159 -0
  136. yamlgraph/cli/__main__.py +6 -0
  137. yamlgraph/cli/commands.py +231 -0
  138. yamlgraph/cli/deprecation.py +92 -0
  139. yamlgraph/cli/graph_commands.py +541 -0
  140. yamlgraph/cli/validators.py +37 -0
  141. yamlgraph/config.py +67 -0
  142. yamlgraph/constants.py +70 -0
  143. yamlgraph/error_handlers.py +227 -0
  144. yamlgraph/executor.py +290 -0
  145. yamlgraph/executor_async.py +288 -0
  146. yamlgraph/graph_loader.py +451 -0
  147. yamlgraph/map_compiler.py +150 -0
  148. yamlgraph/models/__init__.py +36 -0
  149. yamlgraph/models/graph_schema.py +181 -0
  150. yamlgraph/models/schemas.py +124 -0
  151. yamlgraph/models/state_builder.py +236 -0
  152. yamlgraph/node_factory.py +768 -0
  153. yamlgraph/routing.py +87 -0
  154. yamlgraph/schema_loader.py +240 -0
  155. yamlgraph/storage/__init__.py +20 -0
  156. yamlgraph/storage/checkpointer.py +72 -0
  157. yamlgraph/storage/checkpointer_factory.py +123 -0
  158. yamlgraph/storage/database.py +320 -0
  159. yamlgraph/storage/export.py +269 -0
  160. yamlgraph/tools/__init__.py +1 -0
  161. yamlgraph/tools/agent.py +320 -0
  162. yamlgraph/tools/graph_linter.py +388 -0
  163. yamlgraph/tools/langsmith_tools.py +125 -0
  164. yamlgraph/tools/nodes.py +126 -0
  165. yamlgraph/tools/python_tool.py +179 -0
  166. yamlgraph/tools/shell.py +205 -0
  167. yamlgraph/tools/websearch.py +242 -0
  168. yamlgraph/utils/__init__.py +48 -0
  169. yamlgraph/utils/conditions.py +157 -0
  170. yamlgraph/utils/expressions.py +245 -0
  171. yamlgraph/utils/json_extract.py +104 -0
  172. yamlgraph/utils/langsmith.py +416 -0
  173. yamlgraph/utils/llm_factory.py +118 -0
  174. yamlgraph/utils/llm_factory_async.py +105 -0
  175. yamlgraph/utils/logging.py +104 -0
  176. yamlgraph/utils/prompts.py +171 -0
  177. yamlgraph/utils/sanitize.py +98 -0
  178. yamlgraph/utils/template.py +102 -0
  179. yamlgraph/utils/validators.py +181 -0
  180. yamlgraph-0.3.9.dist-info/METADATA +1105 -0
  181. yamlgraph-0.3.9.dist-info/RECORD +185 -0
  182. yamlgraph-0.3.9.dist-info/WHEEL +5 -0
  183. yamlgraph-0.3.9.dist-info/entry_points.txt +2 -0
  184. yamlgraph-0.3.9.dist-info/licenses/LICENSE +33 -0
  185. yamlgraph-0.3.9.dist-info/top_level.txt +4 -0
@@ -0,0 +1,104 @@
1
+ """Extract JSON from LLM output with various formats.
2
+
3
+ LLMs often wrap JSON responses in markdown code blocks or add
4
+ explanatory text. This module provides robust extraction.
5
+
6
+ FR-B: JSON Extraction feature.
7
+ """
8
+
9
+ import json
10
+ import re
11
+
12
+
13
+ def extract_json(text: str) -> dict | list | str:
14
+ """Extract JSON from LLM response.
15
+
16
+ Extraction order:
17
+ 1. Parse as raw JSON (handles both objects and arrays)
18
+ 2. Extract from ```json ... ``` code block
19
+ 3. Extract from ``` ... ``` code block (any language)
20
+ 4. Extract first {...} or [...] pattern
21
+ 5. Return original text if no JSON found
22
+
23
+ Args:
24
+ text: Raw LLM response
25
+
26
+ Returns:
27
+ Parsed JSON (dict/list) or original string if extraction fails
28
+
29
+ Examples:
30
+ >>> extract_json('{"key": "value"}')
31
+ {'key': 'value'}
32
+
33
+ >>> extract_json('```json\\n{"key": "value"}\\n```')
34
+ {'key': 'value'}
35
+
36
+ >>> extract_json('Result: {"x": 1} found')
37
+ {'x': 1}
38
+ """
39
+ if not text:
40
+ return text
41
+
42
+ text = text.strip()
43
+
44
+ # 1. Try raw JSON first
45
+ try:
46
+ return json.loads(text)
47
+ except json.JSONDecodeError:
48
+ pass
49
+
50
+ # 2. Try ```json ... ``` block
51
+ match = re.search(r"```json\s*\n?(.*?)\n?```", text, re.DOTALL | re.IGNORECASE)
52
+ if match:
53
+ try:
54
+ return json.loads(match.group(1).strip())
55
+ except json.JSONDecodeError:
56
+ pass
57
+
58
+ # 3. Try ``` ... ``` block (any language)
59
+ match = re.search(r"```\s*\n?(.*?)\n?```", text, re.DOTALL)
60
+ if match:
61
+ try:
62
+ return json.loads(match.group(1).strip())
63
+ except json.JSONDecodeError:
64
+ pass
65
+
66
+ # 4. Try {...} or [...] pattern
67
+ # Find all potential JSON objects/arrays and try parsing each
68
+ # Use non-greedy matching to find smallest valid JSON structures
69
+ for pattern in [
70
+ r"\{[^{}]*\}", # Simple object: {key: value}
71
+ r"\[[^\[\]]*\]", # Simple array: [1, 2, 3]
72
+ ]:
73
+ for match in re.finditer(pattern, text):
74
+ try:
75
+ return json.loads(match.group(0))
76
+ except json.JSONDecodeError:
77
+ continue
78
+
79
+ # 5. Try nested structures (greedy, last resort)
80
+ # Find balanced braces manually
81
+ for start_char, end_char in [("{", "}"), ("[", "]")]:
82
+ start_idx = text.find(start_char)
83
+ if start_idx == -1:
84
+ continue
85
+
86
+ # Find matching closing bracket
87
+ depth = 0
88
+ for i, c in enumerate(text[start_idx:], start=start_idx):
89
+ if c == start_char:
90
+ depth += 1
91
+ elif c == end_char:
92
+ depth -= 1
93
+ if depth == 0:
94
+ candidate = text[start_idx : i + 1]
95
+ try:
96
+ return json.loads(candidate)
97
+ except json.JSONDecodeError:
98
+ break # Try next start position
99
+
100
+ # 6. Return original text
101
+ return text
102
+
103
+
104
+ __all__ = ["extract_json"]
@@ -0,0 +1,416 @@
1
+ """LangSmith Utilities - Tracing and observability helpers.
2
+
3
+ Provides functions for interacting with LangSmith traces,
4
+ printing execution trees, and logging run information.
5
+ """
6
+
7
+ import logging
8
+ import os
9
+ from datetime import datetime
10
+ from typing import Any
11
+
12
+ logger = logging.getLogger(__name__)
13
+
14
+
15
+ def get_client() -> Any | None:
16
+ """Get a LangSmith client if available.
17
+
18
+ Returns:
19
+ LangSmith Client instance or None if not configured
20
+ """
21
+ try:
22
+ from langsmith import Client
23
+
24
+ # Support both LANGCHAIN_* and LANGSMITH_* env vars
25
+ api_key = os.environ.get("LANGCHAIN_API_KEY") or os.environ.get(
26
+ "LANGSMITH_API_KEY"
27
+ )
28
+ if not api_key:
29
+ return None
30
+
31
+ endpoint = (
32
+ os.environ.get("LANGCHAIN_ENDPOINT")
33
+ or os.environ.get("LANGSMITH_ENDPOINT")
34
+ or "https://api.smith.langchain.com"
35
+ )
36
+ return Client(api_url=endpoint, api_key=api_key)
37
+ except ImportError:
38
+ logger.debug("LangSmith package not installed, client unavailable")
39
+ return None
40
+
41
+
42
def get_project_name() -> str:
    """Get the current LangSmith project name.

    Checks LANGCHAIN_PROJECT first, then LANGSMITH_PROJECT; empty
    values are ignored.

    Returns:
        Project name from environment, or the default "yamlgraph"
    """
    for var in ("LANGCHAIN_PROJECT", "LANGSMITH_PROJECT"):
        name = os.environ.get(var)
        if name:
            return name
    return "yamlgraph"
53
+
54
+
55
def is_tracing_enabled() -> bool:
    """Check if LangSmith tracing is enabled.

    Returns:
        True if either LANGCHAIN_TRACING_V2 or LANGSMITH_TRACING is set
        to "true" (case-insensitive).
    """
    return any(
        os.environ.get(var, "").lower() == "true"
        for var in ("LANGCHAIN_TRACING_V2", "LANGSMITH_TRACING")
    )
65
+
66
+
67
def get_latest_run_id(project_name: str | None = None) -> str | None:
    """Get the ID of the most recent run.

    Args:
        project_name: Optional project name (uses default if not provided)

    Returns:
        Run ID string or None
    """
    client = get_client()
    if not client:
        return None

    project = project_name or get_project_name()

    try:
        # limit=1 means at most one run comes back; return its ID if present
        for run in client.list_runs(project_name=project, limit=1):
            return str(run.id)
    except Exception as e:
        logger.warning("Could not get latest run: %s", e)

    return None
90
+
91
+
92
def share_run(run_id: str | None = None) -> str | None:
    """Create a public share link for a run.

    Args:
        run_id: Run ID (uses latest if not provided)

    Returns:
        Public URL string or None if failed

    Example:
        >>> url = share_run()
        >>> print(url)
        https://eu.smith.langchain.com/public/abc123.../r
    """
    client = get_client()
    if not client:
        return None

    # Fall back to the most recent run when no ID was supplied
    target = run_id or get_latest_run_id()
    if not target:
        return None

    try:
        # Delegate to the LangSmith SDK's share_run endpoint
        return client.share_run(target)
    except Exception as e:
        logger.warning("Could not share run: %s", e)
        return None
122
+
123
+
124
def read_run_shared_link(run_id: str) -> str | None:
    """Get existing share link for a run if it exists.

    Args:
        run_id: The run ID to check

    Returns:
        Public URL string or None if not shared
    """
    client = get_client()
    if client:
        try:
            return client.read_run_shared_link(run_id)
        except Exception as e:
            # Debug level: an unshared run is an expected condition
            logger.debug("Could not read run shared link for %s: %s", run_id, e)
    return None
142
+
143
+
144
def print_run_tree(run_id: str | None = None, verbose: bool = False) -> None:
    """Print an execution tree for a run.

    Args:
        run_id: Specific run ID (uses latest if not provided)
        verbose: Include timing and status details
    """
    client = get_client()
    if not client:
        logger.warning("LangSmith client not available")
        return

    target = run_id or get_latest_run_id()
    if not target:
        logger.warning("No run found")
        return

    try:
        root = client.read_run(target)
        _print_run_node(root, client, verbose=verbose, indent=0)
    except Exception as e:
        logger.warning("Error reading run: %s", e)
168
+
169
+
170
def _print_run_node(
    run,
    client,
    verbose: bool = False,
    indent: int = 0,
    is_last: bool = True,
    prefix: str = "",
):
    """Recursively print a run node and its children in tree format.

    Output goes through logger.info, one line per run, with box-drawing
    connectors and status/duration decorations.

    Args:
        run: The LangSmith run object
        client: LangSmith client
        verbose: Include timing details
            (NOTE(review): currently unused in the body — timing is always
            shown; it is only propagated to recursive calls)
        indent: Current indentation level (0 == root node)
        is_last: Whether this is the last sibling
        prefix: Prefix string for tree drawing
    """
    # Status emoji
    if run.status == "success":
        status = "✅"
    elif run.status == "error":
        status = "❌"
    else:
        status = "⏳"

    # Timing: only shown when the run has completed (both timestamps set)
    timing = ""
    if run.end_time and run.start_time:
        duration = (run.end_time - run.start_time).total_seconds()
        timing = f" ({duration:.1f}s)"

    # Tree connectors: root gets a chart marker, children get branch glyphs
    if indent == 0:
        connector = "📊 "
        new_prefix = ""
    else:
        connector = "└─ " if is_last else "├─ "
        # Continuation prefix for this node's own children
        new_prefix = prefix + (" " if is_last else "│ ")

    # Clean up run name for display (decorate with a category emoji)
    display_name = run.name
    if display_name.startswith("Chat"):
        display_name = f"🤖 {display_name}"
    elif "generate" in display_name.lower():
        display_name = f"📝 {display_name}"
    elif "analyze" in display_name.lower():
        display_name = f"🔍 {display_name}"
    elif "summarize" in display_name.lower():
        display_name = f"📊 {display_name}"

    logger.info("%s%s%s%s %s", prefix, connector, display_name, timing, status)

    # Get child runs (capped at 50 per node)
    try:
        children = list(
            client.list_runs(
                parent_run_id=run.id,
                limit=50,
            )
        )
        # Sort by start time to show in execution order
        # NOTE(review): datetime.min is naive; if start_time is ever
        # timezone-aware the comparison raises TypeError, which is then
        # swallowed by the except below — confirm runs use naive times.
        children.sort(key=lambda r: r.start_time or datetime.min)

        for i, child in enumerate(children):
            child_is_last = i == len(children) - 1
            _print_run_node(
                child,
                client,
                verbose=verbose,
                indent=indent + 1,
                is_last=child_is_last,
                prefix=new_prefix,
            )
    except Exception as e:
        logger.debug("Could not fetch child runs for %s: %s", run.id, e)
246
+
247
+
248
def get_run_url(run_id: str | None = None) -> str | None:
    """Get the LangSmith URL for a run.

    Args:
        run_id: Run ID (uses latest if not provided)

    Returns:
        URL string or None
    """
    if not run_id:
        run_id = get_latest_run_id()

    if not run_id:
        return None

    # Support both LANGCHAIN_* and LANGSMITH_* env var names, consistent
    # with get_client() (previously only LANGCHAIN_ENDPOINT was honored).
    endpoint = (
        os.environ.get("LANGCHAIN_ENDPOINT")
        or os.environ.get("LANGSMITH_ENDPOINT")
        or "https://api.smith.langchain.com"
    )
    project = get_project_name()

    # Convert API endpoint to web URL (strip the "api." host prefix or a
    # trailing "/api" path segment)
    web_url = endpoint.replace("api.", "").replace("/api", "")
    if "smith.langchain" in web_url:
        return f"{web_url}/o/default/projects/p/{project}/runs/{run_id}"

    return f"{web_url}/projects/{project}/runs/{run_id}"
272
+
273
+
274
def get_run_details(run_id: str | None = None) -> dict | None:
    """Get detailed information about a run.

    Args:
        run_id: Run ID (uses latest if not provided)

    Returns:
        Dict with run details or None if failed:
        - id: Run ID
        - name: Run name
        - status: success/error/pending
        - error: Error message if any
        - start_time: ISO timestamp
        - end_time: ISO timestamp
        - inputs: Input data
        - outputs: Output data
        - run_type: chain/llm/tool etc.
    """
    client = get_client()
    if not client:
        return None

    target = run_id or get_latest_run_id()
    if not target:
        return None

    def _iso(ts):
        # Timestamps may be absent for in-flight runs
        return ts.isoformat() if ts else None

    try:
        run = client.read_run(target)
        return {
            "id": str(run.id),
            "name": run.name,
            "status": run.status,
            "error": run.error,
            "start_time": _iso(run.start_time),
            "end_time": _iso(run.end_time),
            "inputs": run.inputs,
            "outputs": run.outputs,
            "run_type": run.run_type,
        }
    except Exception as e:
        logger.warning("Could not get run details: %s", e)
        return None
318
+
319
+
320
def get_run_errors(run_id: str | None = None) -> list[dict]:
    """Get all errors from a run and its child runs.

    Args:
        run_id: Run ID (uses latest if not provided)

    Returns:
        List of error dicts with:
        - node: Name of the failed node
        - error: Error message
        - run_type: Type of run (llm/chain/tool)
    """
    client = get_client()
    if not client:
        return []

    target = run_id or get_latest_run_id()
    if not target:
        return []

    def _entry(r):
        # Same record shape for the parent run and its children
        return {"node": r.name, "error": r.error, "run_type": r.run_type}

    errors: list[dict] = []
    try:
        # Parent run first
        parent = client.read_run(target)
        if parent.error:
            errors.append(_entry(parent))

        # Child runs, server-filtered to errors (capped at 50); each is
        # double-checked before being recorded
        for child in client.list_runs(parent_run_id=target, error=True, limit=50):
            if child.error:
                errors.append(_entry(child))
    except Exception as e:
        logger.warning("Could not get run errors: %s", e)

    return errors
374
+
375
+
376
def get_failed_runs(
    project_name: str | None = None,
    limit: int = 10,
) -> list[dict]:
    """Get recent failed runs from a project.

    Args:
        project_name: Project name (uses default if not provided)
        limit: Maximum number of runs to return

    Returns:
        List of failed run summaries with:
        - id: Run ID
        - name: Run name
        - error: Error message
        - start_time: ISO timestamp
    """
    client = get_client()
    if not client:
        return []

    project = project_name or get_project_name()

    try:
        failed = client.list_runs(project_name=project, error=True, limit=limit)
        summaries = []
        for r in failed:
            summaries.append(
                {
                    "id": str(r.id),
                    "name": r.name,
                    "error": r.error,
                    "start_time": r.start_time.isoformat() if r.start_time else None,
                }
            )
        return summaries
    except Exception as e:
        logger.warning("Could not list failed runs: %s", e)
        return []
@@ -0,0 +1,118 @@
1
+ """LLM Factory - Multi-provider abstraction for language models.
2
+
3
+ This module provides a simple factory pattern for creating LLM instances
4
+ across different providers (Anthropic, Mistral, OpenAI).
5
+ """
6
+
7
+ import logging
8
+ import os
9
+ import threading
10
+ from typing import Literal
11
+
12
+ from langchain_core.language_models.chat_models import BaseChatModel
13
+
14
+ from yamlgraph.config import DEFAULT_MODELS
15
+
16
+ logger = logging.getLogger(__name__)
17
+
18
# Type alias for supported providers (the values create_llm accepts)
ProviderType = Literal["anthropic", "mistral", "openai"]

# Process-wide cache of LLM instances, keyed by (provider, model, temperature).
# All access is guarded by _cache_lock, making create_llm/clear_cache
# thread-safe.
_llm_cache: dict[tuple[str, str, float], BaseChatModel] = {}
_cache_lock = threading.Lock()
24
+
25
+
26
def create_llm(
    provider: ProviderType | None = None,
    model: str | None = None,
    temperature: float = 0.7,
) -> BaseChatModel:
    """Create an LLM instance with multi-provider support.

    Supports Anthropic (default), Mistral, and OpenAI providers.
    Provider can be specified via parameter or PROVIDER environment variable.
    Model can be specified via parameter or {PROVIDER}_MODEL environment variable.

    LLM instances are cached by (provider, model, temperature) to improve performance.

    Args:
        provider: LLM provider ("anthropic", "mistral", "openai").
            Defaults to PROVIDER env var or "anthropic".
        model: Model name. Defaults to {PROVIDER}_MODEL env var or provider default.
        temperature: Temperature for generation (0.0-1.0).

    Returns:
        Configured LLM instance.

    Raises:
        ValueError: If provider is invalid.

    Examples:
        >>> # Use default Anthropic
        >>> llm = create_llm(temperature=0.7)

        >>> # Override provider
        >>> llm = create_llm(provider="mistral", temperature=0.8)

        >>> # Custom model
        >>> llm = create_llm(provider="openai", model="gpt-4o-mini")
    """
    # Resolution order: explicit parameter > PROVIDER env var > "anthropic"
    selected_provider = provider or os.getenv("PROVIDER") or "anthropic"

    if selected_provider not in DEFAULT_MODELS:
        raise ValueError(
            f"Invalid provider: {selected_provider}. "
            f"Must be one of: {', '.join(DEFAULT_MODELS.keys())}"
        )

    # Resolution order: explicit parameter > provider default.
    # DEFAULT_MODELS already folds in any {PROVIDER}_MODEL env override
    # (handled in config.py).
    selected_model = model or DEFAULT_MODELS[selected_provider]

    cache_key = (selected_provider, selected_model, temperature)

    # All cache reads/writes happen under the lock
    with _cache_lock:
        cached = _llm_cache.get(cache_key)
        if cached is not None:
            logger.debug(
                f"Using cached LLM: {selected_provider}/{selected_model} (temp={temperature})"
            )
            return cached

        logger.info(
            f"Creating LLM: {selected_provider}/{selected_model} (temp={temperature})"
        )
        llm = _build_chat_model(selected_provider, selected_model, temperature)
        _llm_cache[cache_key] = llm
        return llm


def _build_chat_model(
    provider: str, model: str, temperature: float
) -> BaseChatModel:
    """Lazily import the provider package and construct its chat model."""
    if provider == "mistral":
        from langchain_mistralai import ChatMistralAI

        return ChatMistralAI(model=model, temperature=temperature)
    if provider == "openai":
        from langchain_openai import ChatOpenAI

        return ChatOpenAI(model=model, temperature=temperature)
    # anthropic is the default provider
    from langchain_anthropic import ChatAnthropic

    return ChatAnthropic(model=model, temperature=temperature)
109
+
110
+
111
def clear_cache() -> None:
    """Clear the LLM instance cache.

    Useful for testing or when you want to force recreation of LLM instances.
    """
    # Hold the lock so a concurrent create_llm() never observes a
    # half-cleared cache.
    with _cache_lock:
        _llm_cache.clear()
        logger.debug("LLM cache cleared")