PyPI - hexdag - Versions diffs - 0.5.0.dev1__py3-none-any.whl - Mend

hexdag 0.5.0.dev1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (261) hide show

hexdag/__init__.py +116 -0
hexdag/__main__.py +30 -0
hexdag/adapters/executors/__init__.py +5 -0
hexdag/adapters/executors/local_executor.py +316 -0
hexdag/builtin/__init__.py +6 -0
hexdag/builtin/adapters/__init__.py +51 -0
hexdag/builtin/adapters/anthropic/__init__.py +5 -0
hexdag/builtin/adapters/anthropic/anthropic_adapter.py +151 -0
hexdag/builtin/adapters/database/__init__.py +6 -0
hexdag/builtin/adapters/database/csv/csv_adapter.py +249 -0
hexdag/builtin/adapters/database/pgvector/__init__.py +5 -0
hexdag/builtin/adapters/database/pgvector/pgvector_adapter.py +478 -0
hexdag/builtin/adapters/database/sqlalchemy/sqlalchemy_adapter.py +252 -0
hexdag/builtin/adapters/database/sqlite/__init__.py +5 -0
hexdag/builtin/adapters/database/sqlite/sqlite_adapter.py +410 -0
hexdag/builtin/adapters/local/README.md +59 -0
hexdag/builtin/adapters/local/__init__.py +7 -0
hexdag/builtin/adapters/local/local_observer_manager.py +696 -0
hexdag/builtin/adapters/memory/__init__.py +47 -0
hexdag/builtin/adapters/memory/file_memory_adapter.py +297 -0
hexdag/builtin/adapters/memory/in_memory_memory.py +216 -0
hexdag/builtin/adapters/memory/schemas.py +57 -0
hexdag/builtin/adapters/memory/session_memory.py +178 -0
hexdag/builtin/adapters/memory/sqlite_memory_adapter.py +215 -0
hexdag/builtin/adapters/memory/state_memory.py +280 -0
hexdag/builtin/adapters/mock/README.md +89 -0
hexdag/builtin/adapters/mock/__init__.py +15 -0
hexdag/builtin/adapters/mock/hexdag.toml +50 -0
hexdag/builtin/adapters/mock/mock_database.py +225 -0
hexdag/builtin/adapters/mock/mock_embedding.py +223 -0
hexdag/builtin/adapters/mock/mock_llm.py +177 -0
hexdag/builtin/adapters/mock/mock_tool_adapter.py +192 -0
hexdag/builtin/adapters/mock/mock_tool_router.py +232 -0
hexdag/builtin/adapters/openai/__init__.py +5 -0
hexdag/builtin/adapters/openai/openai_adapter.py +634 -0
hexdag/builtin/adapters/secret/__init__.py +7 -0
hexdag/builtin/adapters/secret/local_secret_adapter.py +248 -0
hexdag/builtin/adapters/unified_tool_router.py +280 -0
hexdag/builtin/macros/__init__.py +17 -0
hexdag/builtin/macros/conversation_agent.py +390 -0
hexdag/builtin/macros/llm_macro.py +151 -0
hexdag/builtin/macros/reasoning_agent.py +423 -0
hexdag/builtin/macros/tool_macro.py +380 -0
hexdag/builtin/nodes/__init__.py +38 -0
hexdag/builtin/nodes/_discovery.py +123 -0
hexdag/builtin/nodes/agent_node.py +696 -0
hexdag/builtin/nodes/base_node_factory.py +242 -0
hexdag/builtin/nodes/composite_node.py +926 -0
hexdag/builtin/nodes/data_node.py +201 -0
hexdag/builtin/nodes/expression_node.py +487 -0
hexdag/builtin/nodes/function_node.py +454 -0
hexdag/builtin/nodes/llm_node.py +491 -0
hexdag/builtin/nodes/loop_node.py +920 -0
hexdag/builtin/nodes/mapped_input.py +518 -0
hexdag/builtin/nodes/port_call_node.py +269 -0
hexdag/builtin/nodes/tool_call_node.py +195 -0
hexdag/builtin/nodes/tool_utils.py +390 -0
hexdag/builtin/prompts/__init__.py +68 -0
hexdag/builtin/prompts/base.py +422 -0
hexdag/builtin/prompts/chat_prompts.py +303 -0
hexdag/builtin/prompts/error_correction_prompts.py +320 -0
hexdag/builtin/prompts/tool_prompts.py +160 -0
hexdag/builtin/tools/builtin_tools.py +84 -0
hexdag/builtin/tools/database_tools.py +164 -0
hexdag/cli/__init__.py +17 -0
hexdag/cli/__main__.py +7 -0
hexdag/cli/commands/__init__.py +27 -0
hexdag/cli/commands/build_cmd.py +812 -0
hexdag/cli/commands/create_cmd.py +208 -0
hexdag/cli/commands/docs_cmd.py +293 -0
hexdag/cli/commands/generate_types_cmd.py +252 -0
hexdag/cli/commands/init_cmd.py +188 -0
hexdag/cli/commands/pipeline_cmd.py +494 -0
hexdag/cli/commands/plugin_dev_cmd.py +529 -0
hexdag/cli/commands/plugins_cmd.py +441 -0
hexdag/cli/commands/studio_cmd.py +101 -0
hexdag/cli/commands/validate_cmd.py +221 -0
hexdag/cli/main.py +84 -0
hexdag/core/__init__.py +83 -0
hexdag/core/config/__init__.py +20 -0
hexdag/core/config/loader.py +479 -0
hexdag/core/config/models.py +150 -0
hexdag/core/configurable.py +294 -0
hexdag/core/context/__init__.py +37 -0
hexdag/core/context/execution_context.py +378 -0
hexdag/core/docs/__init__.py +26 -0
hexdag/core/docs/extractors.py +678 -0
hexdag/core/docs/generators.py +890 -0
hexdag/core/docs/models.py +120 -0
hexdag/core/domain/__init__.py +10 -0
hexdag/core/domain/dag.py +1225 -0
hexdag/core/exceptions.py +234 -0
hexdag/core/expression_parser.py +569 -0
hexdag/core/logging.py +449 -0
hexdag/core/models/__init__.py +17 -0
hexdag/core/models/base.py +138 -0
hexdag/core/orchestration/__init__.py +46 -0
hexdag/core/orchestration/body_executor.py +481 -0
hexdag/core/orchestration/components/__init__.py +97 -0
hexdag/core/orchestration/components/adapter_lifecycle_manager.py +113 -0
hexdag/core/orchestration/components/checkpoint_manager.py +134 -0
hexdag/core/orchestration/components/execution_coordinator.py +360 -0
hexdag/core/orchestration/components/health_check_manager.py +176 -0
hexdag/core/orchestration/components/input_mapper.py +143 -0
hexdag/core/orchestration/components/lifecycle_manager.py +583 -0
hexdag/core/orchestration/components/node_executor.py +377 -0
hexdag/core/orchestration/components/secret_manager.py +202 -0
hexdag/core/orchestration/components/wave_executor.py +158 -0
hexdag/core/orchestration/constants.py +17 -0
hexdag/core/orchestration/events/README.md +312 -0
hexdag/core/orchestration/events/__init__.py +104 -0
hexdag/core/orchestration/events/batching.py +330 -0
hexdag/core/orchestration/events/decorators.py +139 -0
hexdag/core/orchestration/events/events.py +573 -0
hexdag/core/orchestration/events/observers/__init__.py +30 -0
hexdag/core/orchestration/events/observers/core_observers.py +690 -0
hexdag/core/orchestration/events/observers/models.py +111 -0
hexdag/core/orchestration/events/taxonomy.py +269 -0
hexdag/core/orchestration/hook_context.py +237 -0
hexdag/core/orchestration/hooks.py +437 -0
hexdag/core/orchestration/models.py +418 -0
hexdag/core/orchestration/orchestrator.py +910 -0
hexdag/core/orchestration/orchestrator_factory.py +275 -0
hexdag/core/orchestration/port_wrappers.py +327 -0
hexdag/core/orchestration/prompt/__init__.py +32 -0
hexdag/core/orchestration/prompt/template.py +332 -0
hexdag/core/pipeline_builder/__init__.py +21 -0
hexdag/core/pipeline_builder/component_instantiator.py +386 -0
hexdag/core/pipeline_builder/include_tag.py +265 -0
hexdag/core/pipeline_builder/pipeline_config.py +133 -0
hexdag/core/pipeline_builder/py_tag.py +223 -0
hexdag/core/pipeline_builder/tag_discovery.py +268 -0
hexdag/core/pipeline_builder/yaml_builder.py +1196 -0
hexdag/core/pipeline_builder/yaml_validator.py +569 -0
hexdag/core/ports/__init__.py +65 -0
hexdag/core/ports/api_call.py +133 -0
hexdag/core/ports/database.py +489 -0
hexdag/core/ports/embedding.py +215 -0
hexdag/core/ports/executor.py +237 -0
hexdag/core/ports/file_storage.py +117 -0
hexdag/core/ports/healthcheck.py +87 -0
hexdag/core/ports/llm.py +551 -0
hexdag/core/ports/memory.py +70 -0
hexdag/core/ports/observer_manager.py +130 -0
hexdag/core/ports/secret.py +145 -0
hexdag/core/ports/tool_router.py +94 -0
hexdag/core/ports_builder.py +623 -0
hexdag/core/protocols.py +273 -0
hexdag/core/resolver.py +304 -0
hexdag/core/schema/__init__.py +9 -0
hexdag/core/schema/generator.py +742 -0
hexdag/core/secrets.py +242 -0
hexdag/core/types.py +413 -0
hexdag/core/utils/async_warnings.py +206 -0
hexdag/core/utils/schema_conversion.py +78 -0
hexdag/core/utils/sql_validation.py +86 -0
hexdag/core/validation/secure_json.py +148 -0
hexdag/core/yaml_macro.py +517 -0
hexdag/mcp_server.py +3120 -0
hexdag/studio/__init__.py +10 -0
hexdag/studio/build_ui.py +92 -0
hexdag/studio/server/__init__.py +1 -0
hexdag/studio/server/main.py +100 -0
hexdag/studio/server/routes/__init__.py +9 -0
hexdag/studio/server/routes/execute.py +208 -0
hexdag/studio/server/routes/export.py +558 -0
hexdag/studio/server/routes/files.py +207 -0
hexdag/studio/server/routes/plugins.py +419 -0
hexdag/studio/server/routes/validate.py +220 -0
hexdag/studio/ui/index.html +13 -0
hexdag/studio/ui/package-lock.json +2992 -0
hexdag/studio/ui/package.json +31 -0
hexdag/studio/ui/postcss.config.js +6 -0
hexdag/studio/ui/public/hexdag.svg +5 -0
hexdag/studio/ui/src/App.tsx +251 -0
hexdag/studio/ui/src/components/Canvas.tsx +408 -0
hexdag/studio/ui/src/components/ContextMenu.tsx +187 -0
hexdag/studio/ui/src/components/FileBrowser.tsx +123 -0
hexdag/studio/ui/src/components/Header.tsx +181 -0
hexdag/studio/ui/src/components/HexdagNode.tsx +193 -0
hexdag/studio/ui/src/components/NodeInspector.tsx +512 -0
hexdag/studio/ui/src/components/NodePalette.tsx +262 -0
hexdag/studio/ui/src/components/NodePortsSection.tsx +403 -0
hexdag/studio/ui/src/components/PluginManager.tsx +347 -0
hexdag/studio/ui/src/components/PortsEditor.tsx +481 -0
hexdag/studio/ui/src/components/PythonEditor.tsx +195 -0
hexdag/studio/ui/src/components/ValidationPanel.tsx +105 -0
hexdag/studio/ui/src/components/YamlEditor.tsx +196 -0
hexdag/studio/ui/src/components/index.ts +8 -0
hexdag/studio/ui/src/index.css +92 -0
hexdag/studio/ui/src/main.tsx +10 -0
hexdag/studio/ui/src/types/index.ts +123 -0
hexdag/studio/ui/src/vite-env.d.ts +1 -0
hexdag/studio/ui/tailwind.config.js +29 -0
hexdag/studio/ui/tsconfig.json +37 -0
hexdag/studio/ui/tsconfig.node.json +13 -0
hexdag/studio/ui/vite.config.ts +35 -0
hexdag/visualization/__init__.py +69 -0
hexdag/visualization/dag_visualizer.py +1020 -0
hexdag-0.5.0.dev1.dist-info/METADATA +369 -0
hexdag-0.5.0.dev1.dist-info/RECORD +261 -0
hexdag-0.5.0.dev1.dist-info/WHEEL +4 -0
hexdag-0.5.0.dev1.dist-info/entry_points.txt +4 -0
hexdag-0.5.0.dev1.dist-info/licenses/LICENSE +190 -0
hexdag_plugins/.gitignore +43 -0
hexdag_plugins/README.md +73 -0
hexdag_plugins/__init__.py +1 -0
hexdag_plugins/azure/LICENSE +21 -0
hexdag_plugins/azure/README.md +414 -0
hexdag_plugins/azure/__init__.py +21 -0
hexdag_plugins/azure/azure_blob_adapter.py +450 -0
hexdag_plugins/azure/azure_cosmos_adapter.py +383 -0
hexdag_plugins/azure/azure_keyvault_adapter.py +314 -0
hexdag_plugins/azure/azure_openai_adapter.py +415 -0
hexdag_plugins/azure/pyproject.toml +107 -0
hexdag_plugins/azure/tests/__init__.py +1 -0
hexdag_plugins/azure/tests/test_azure_blob_adapter.py +350 -0
hexdag_plugins/azure/tests/test_azure_cosmos_adapter.py +323 -0
hexdag_plugins/azure/tests/test_azure_keyvault_adapter.py +330 -0
hexdag_plugins/azure/tests/test_azure_openai_adapter.py +329 -0
hexdag_plugins/hexdag_etl/README.md +168 -0
hexdag_plugins/hexdag_etl/__init__.py +53 -0
hexdag_plugins/hexdag_etl/examples/01_simple_pandas_transform.py +270 -0
hexdag_plugins/hexdag_etl/examples/02_simple_pandas_only.py +149 -0
hexdag_plugins/hexdag_etl/examples/03_file_io_pipeline.py +109 -0
hexdag_plugins/hexdag_etl/examples/test_pandas_transform.py +84 -0
hexdag_plugins/hexdag_etl/hexdag.toml +25 -0
hexdag_plugins/hexdag_etl/hexdag_etl/__init__.py +48 -0
hexdag_plugins/hexdag_etl/hexdag_etl/nodes/__init__.py +13 -0
hexdag_plugins/hexdag_etl/hexdag_etl/nodes/api_extract.py +230 -0
hexdag_plugins/hexdag_etl/hexdag_etl/nodes/base_node_factory.py +181 -0
hexdag_plugins/hexdag_etl/hexdag_etl/nodes/file_io.py +415 -0
hexdag_plugins/hexdag_etl/hexdag_etl/nodes/outlook.py +492 -0
hexdag_plugins/hexdag_etl/hexdag_etl/nodes/pandas_transform.py +563 -0
hexdag_plugins/hexdag_etl/hexdag_etl/nodes/sql_extract_load.py +112 -0
hexdag_plugins/hexdag_etl/pyproject.toml +82 -0
hexdag_plugins/hexdag_etl/test_transform.py +54 -0
hexdag_plugins/hexdag_etl/tests/test_plugin_integration.py +62 -0
hexdag_plugins/mysql_adapter/LICENSE +21 -0
hexdag_plugins/mysql_adapter/README.md +224 -0
hexdag_plugins/mysql_adapter/__init__.py +6 -0
hexdag_plugins/mysql_adapter/mysql_adapter.py +408 -0
hexdag_plugins/mysql_adapter/pyproject.toml +93 -0
hexdag_plugins/mysql_adapter/tests/test_mysql_adapter.py +259 -0
hexdag_plugins/storage/README.md +184 -0
hexdag_plugins/storage/__init__.py +19 -0
hexdag_plugins/storage/file/__init__.py +5 -0
hexdag_plugins/storage/file/local.py +325 -0
hexdag_plugins/storage/ports/__init__.py +5 -0
hexdag_plugins/storage/ports/vector_store.py +236 -0
hexdag_plugins/storage/sql/__init__.py +7 -0
hexdag_plugins/storage/sql/base.py +187 -0
hexdag_plugins/storage/sql/mysql.py +27 -0
hexdag_plugins/storage/sql/postgresql.py +27 -0
hexdag_plugins/storage/tests/__init__.py +1 -0
hexdag_plugins/storage/tests/test_local_file_storage.py +161 -0
hexdag_plugins/storage/tests/test_sql_adapters.py +212 -0
hexdag_plugins/storage/vector/__init__.py +7 -0
hexdag_plugins/storage/vector/chromadb.py +223 -0
hexdag_plugins/storage/vector/in_memory.py +285 -0
hexdag_plugins/storage/vector/pgvector.py +502 -0

hexdag/core/docs/generators.py ADDED Viewed

@@ -0,0 +1,890 @@
+"""Guide generators for MCP documentation.
+This module generates documentation directly from extracted component
+documentation - no external templates needed.
+"""
+import json
+from pathlib import Path
+from typing import Any
+from hexdag.core.docs.models import AdapterDoc, NodeDoc, ToolDoc
+from hexdag.core.logging import get_logger
+# Module-level logger, named after this module.
+logger = get_logger(__name__)
+# Path to the generated schema: "schemas/pipeline-schema.json" under the
+# directory four levels above this file.
+# NOTE(review): the packaged file list shows no "schemas/" directory, so this
+# path presumably only exists in a source checkout - confirm for installed wheels.
+SCHEMA_PATH = Path(__file__).parent.parent.parent.parent / "schemas" / "pipeline-schema.json"
+class GuideGenerator:
+    """Generate documentation guides from extracted component docs.
+    All documentation is generated programmatically from code introspection,
+    ensuring it stays in sync with the actual implementation.
+    """
+    def generate_adapter_guide(self, adapters: list[AdapterDoc]) -> str:
+        """Generate adapter creation guide.
+        Parameters
+        ----------
+        adapters : list[AdapterDoc]
+            List of adapter documentation objects
+        Returns
+        -------
+        str
+            Complete adapter guide as markdown
+        """
+        # Group adapters by port type
+        adapters_by_port: dict[str, list[AdapterDoc]] = {}
+        for adapter in adapters:
+            port = adapter.port_type
+            if port not in adapters_by_port:
+                adapters_by_port[port] = []
+            adapters_by_port[port].append(adapter)
+        lines = [
+            "# Creating Custom Adapters in hexDAG",
+            "",
+            "## Overview",
+            "",
+            "hexDAG uses adapters to connect pipelines to external services like LLMs,",
+            "databases, and APIs. Adapters implement ports (interfaces) with async methods.",
+            "",
+            "## Quick Start",
+            "",
+            "### Simple Adapter (No Secrets)",
+            "",
+            "```python",
+            "class MemoryCacheAdapter:",
+            '    """Simple in-memory cache adapter."""',
+            "",
+            "    def __init__(self, max_size: int = 100, ttl: int = 3600):",
+            "        self.cache = {}",
+            "        self.max_size = max_size",
+            "        self.ttl = ttl",
+            "",
+            "    async def aget(self, key: str):",
+            "        return self.cache.get(key)",
+            "",
+            "    async def aset(self, key: str, value: any):",
+            "        self.cache[key] = value",
+            "```",
+            "",
+            "### Adapter with Secrets",
+            "",
+            "Use `secret()` in defaults to declare secrets that auto-resolve from environment:",
+            "",
+            "```python",
+            "from hexdag.core.secrets import secret",
+            "",
+            "class OpenAIAdapter:",
+            '    """OpenAI LLM adapter with automatic secret resolution."""',
+            "",
+            "    def __init__(",
+            "        self,",
+            '        api_key: str = secret(env="OPENAI_API_KEY"),  # Auto-resolved',
+            '        model: str = "gpt-4",',
+            "        temperature: float = 0.7",
+            "    ):",
+            "        self.api_key = api_key",
+            "        self.model = model",
+            "        self.temperature = temperature",
+            "",
+            "    async def aresponse(self, messages: list) -> str:",
+            "        # Your implementation using self.api_key",
+            "        ...",
+            "```",
+            "",
+            "## Secret Resolution",
+            "",
+            "Secrets declared with `secret()` are resolved in this order:",
+            "1. **Explicit kwargs** - Values passed directly to `__init__`",
+            "2. **Environment variables** - From the `env` parameter",
+            "3. **Memory port** - From orchestrator memory (with `secret:` prefix)",
+            "4. **Error** - If required and no default",
+            "",
+            "## Available Adapters",
+            "",
+        ]
+        # Generate adapter tables by port type
+        for port_type in sorted(adapters_by_port.keys()):
+            port_adapters = adapters_by_port[port_type]
+            lines.append(f"### {port_type}")
+            lines.append("")
+            lines.append("| Adapter | Description |")
+            lines.append("|---------|-------------|")
+            for adapter in port_adapters:
+                desc = adapter.description[:60]
+                if len(adapter.description) > 60:
+                    desc += "..."
+                lines.append(f"| `{adapter.name}` | {desc} |")
+            lines.append("")
+        # Add YAML usage section
+        lines.extend([
+            "## Using Adapters in YAML",
+            "",
+            "```yaml",
+            "apiVersion: hexdag/v1",
+            "kind: Pipeline",
+            "metadata:",
+            "  name: my-pipeline",
+            "spec:",
+            "  ports:",
+            "    llm:",
+            "      adapter: hexdag.builtin.adapters.openai.OpenAIAdapter",
+            "      config:",
+            "        api_key: ${OPENAI_API_KEY}",
+            "        model: gpt-4",
+            "",
+            "  nodes:",
+            "    - kind: llm_node",
+            "      metadata:",
+            "        name: analyzer",
+            "      spec:",
+            '        prompt_template: "Analyze: {{input}}"',
+            "      dependencies: []",
+            "```",
+            "",
+            "## Best Practices",
+            "",
+            "1. **Async First**: Use `async def` for I/O operations",
+            "2. **Type Hints**: Add type annotations for better tooling",
+            "3. **Docstrings**: Document your adapter's purpose and config",
+            "4. **Error Handling**: Wrap external calls in try/except",
+            "5. **Secrets**: Use `secret()` - never hardcode secrets",
+        ])
+        return "\n".join(lines)
+    def generate_node_guide(self, nodes: list[NodeDoc]) -> str:
+        """Generate node creation guide.
+        Parameters
+        ----------
+        nodes : list[NodeDoc]
+            List of node documentation objects
+        Returns
+        -------
+        str
+            Complete node guide as markdown
+        """
+        lines = [
+            "# Creating Custom Nodes in hexDAG",
+            "",
+            "## Overview",
+            "",
+            "Nodes are the building blocks of hexDAG pipelines. Each node performs a specific",
+            "task and can be connected to other nodes via dependencies.",
+            "",
+            "## Quick Start",
+            "",
+            "### Using FunctionNode (Simplest)",
+            "",
+            "Reference any Python function by module path:",
+            "",
+            "```yaml",
+            "- kind: function_node",
+            "  metadata:",
+            "    name: my_processor",
+            "  spec:",
+            "    fn: mycompany.processors.process_data",
+            "  dependencies: []",
+            "```",
+            "",
+            "```python",
+            "# mycompany/processors.py",
+            "def process_data(input_data: dict) -> dict:",
+            '    """Your processing logic."""',
+            '    return {"result": input_data["value"] * 2}',
+            "```",
+            "",
+            "## Available Node Types",
+            "",
+        ]
+        # Generate node documentation
+        for node in nodes:
+            lines.append(f"### {node.name}")
+            lines.append("")
+            lines.append(f"{node.description}")
+            lines.append("")
+            lines.append(f"**Kind**: `{node.kind}`")
+            lines.append("")
+            if node.parameters:
+                lines.append("| Parameter | Type | Required | Description |")
+                lines.append("|-----------|------|----------|-------------|")
+                for param in node.parameters:
+                    req = "Yes" if param.required else "No"
+                    desc = param.description[:50]
+                    if len(param.description) > 50:
+                        desc += "..."
+                    lines.append(f"| `{param.name}` | `{param.type_hint}` | {req} | {desc} |")
+                lines.append("")
+            if node.yaml_example:
+                lines.append("**Example:**")
+                lines.append("```yaml")
+                lines.append(node.yaml_example.strip())
+                lines.append("```")
+                lines.append("")
+        # Add custom node section
+        lines.extend([
+            "## Creating Custom Nodes",
+            "",
+            "```python",
+            "from hexdag.builtin.nodes import BaseNodeFactory",
+            "from hexdag.core.domain.dag import NodeSpec",
+            "",
+            "class CustomProcessorNode(BaseNodeFactory):",
+            '    """Custom node for specialized processing."""',
+            "",
+            "    def __call__(",
+            "        self,",
+            "        name: str,",
+            "        threshold: float = 0.5,",
+            "        **kwargs",
+            "    ) -> NodeSpec:",
+            "        async def process_fn(input_data: dict) -> dict:",
+            '            if input_data.get("score", 0) > threshold:',
+            '                return {"status": "pass"}',
+            '            return {"status": "fail"}',
+            "",
+            "        return NodeSpec(",
+            "            name=name,",
+            "            fn=process_fn,",
+            '            deps=frozenset(kwargs.get("deps", [])),',
+            "        )",
+            "```",
+            "",
+            "## Best Practices",
+            "",
+            "1. **Async Functions**: Use `async def` for the node function",
+            "2. **Immutable**: Don't modify input_data; return new dict",
+            "3. **Type Hints**: Add types for better IDE support",
+            "4. **Docstrings**: Document purpose and parameters",
+        ])
+        return "\n".join(lines)
+    def generate_tool_guide(self, tools: list[ToolDoc]) -> str:
+        """Generate tool creation guide.
+        Parameters
+        ----------
+        tools : list[ToolDoc]
+            List of tool documentation objects
+        Returns
+        -------
+        str
+            Complete tool guide as markdown
+        """
+        # Separate sync and async tools
+        async_tools = [t for t in tools if t.is_async]
+        sync_tools = [t for t in tools if not t.is_async]
+        lines = [
+            "# Creating Custom Tools for hexDAG Agents",
+            "",
+            "## Overview",
+            "",
+            "Tools are functions that agents can invoke during execution. They enable",
+            "agents to interact with external systems, perform calculations, or access data.",
+            "",
+            "## Quick Start",
+            "",
+            "```python",
+            "def calculate(expression: str) -> str:",
+            '    """Evaluate a mathematical expression.',
+            "",
+            "    Args:",
+            '        expression: Math expression like "2 + 2"',
+            "",
+            "    Returns:",
+            "        Result as a string",
+            '    """',
+            "    result = eval(expression)  # Use safe evaluation in production",
+            "    return str(result)",
+            "```",
+            "",
+            "## Built-in Tools",
+            "",
+        ]
+        # Generate tool documentation
+        for tool in tools:
+            lines.append(f"### {tool.name}")
+            lines.append("")
+            lines.append(tool.description)
+            lines.append("")
+            if tool.parameters:
+                lines.append("**Parameters:**")
+                for param in tool.parameters:
+                    opt = "" if param.required else ", optional"
+                    default = f" Default: `{param.default}`" if param.default else ""
+                    lines.append(
+                        f"- `{param.name}` (`{param.type_hint}`{opt}): {param.description}{default}"
+                    )
+                lines.append("")
+            lines.append(f"**Returns:** `{tool.return_type}`")
+            if tool.is_async:
+                lines.append("")
+                lines.append("*This is an async tool.*")
+            lines.append("")
+        # Add usage section
+        lines.extend([
+            "## Using Tools with Agents",
+            "",
+            "```yaml",
+            "- kind: agent_node",
+            "  metadata:",
+            "    name: research_agent",
+            "  spec:",
+            '    initial_prompt_template: "Research: {{topic}}"',
+            "    max_steps: 5",
+            "    tools:",
+            "      - hexdag.builtin.tools.builtin_tools.tool_end",
+            "      - mycompany.tools.search",
+            "  dependencies: []",
+            "```",
+            "",
+            "## Tool Invocation Format",
+            "",
+            "Agents invoke tools using:",
+            "```",
+            'INVOKE_TOOL: tool_name(param1="value", param2=123)',
+            "```",
+            "",
+            "## Tool Reference",
+            "",
+        ])
+        # Add reference tables
+        if sync_tools:
+            lines.append("### Synchronous Tools")
+            lines.append("")
+            lines.append("| Tool | Description | Return Type |")
+            lines.append("|------|-------------|-------------|")
+            for tool in sync_tools:
+                desc = tool.description[:40]
+                if len(tool.description) > 40:
+                    desc += "..."
+                lines.append(f"| `{tool.name}` | {desc} | `{tool.return_type}` |")
+            lines.append("")
+        if async_tools:
+            lines.append("### Asynchronous Tools")
+            lines.append("")
+            lines.append("| Tool | Description | Return Type |")
+            lines.append("|------|-------------|-------------|")
+            for tool in async_tools:
+                desc = tool.description[:40]
+                if len(tool.description) > 40:
+                    desc += "..."
+                lines.append(f"| `{tool.name}` | {desc} | `{tool.return_type}` |")
+            lines.append("")
+        lines.extend([
+            "## Best Practices",
+            "",
+            "1. **Type Hints**: Always add parameter and return types",
+            "2. **Docstrings**: Write clear descriptions for LLM understanding",
+            "3. **Error Handling**: Return error messages, don't raise exceptions",
+            "4. **Idempotent**: Tools should be safe to retry",
+        ])
+        return "\n".join(lines)
+    def generate_syntax_reference(self) -> str:
+        """Generate syntax reference guide.
+        The guide is a fixed markdown document returned as a literal; nothing
+        is introspected and no instance state is read. It covers ``$input``
+        references, ``{{node.field}}`` template references, ``${VAR}``
+        environment variables, input mapping, and a quick-reference table.
+        Returns
+        -------
+        str
+            Complete syntax reference as markdown
+        """
+        return """# hexDAG Variable Reference Syntax
+## 1. Initial Input Reference: $input
+Use `$input.field` in `input_mapping` to access the original pipeline input.
+```yaml
+nodes:
+  - kind: function_node
+    metadata:
+      name: processor
+    spec:
+      fn: myapp.process
+      input_mapping:
+        load_id: $input.load_id
+        carrier: $input.carrier_mc
+    dependencies: [extractor]
+```
+## 2. Node Output Reference: {{node.field}}
+Use Jinja2 syntax in prompt templates to reference previous node outputs.
+```yaml
+- kind: llm_node
+  metadata:
+    name: analyzer
+  spec:
+    prompt_template: |
+      Analyze this data:
+      {{extractor.result}}
+```
+## 3. Environment Variables: ${VAR}
+```yaml
+spec:
+  ports:
+    llm:
+      config:
+        model: ${MODEL}              # Resolved at build time
+        api_key: ${OPENAI_API_KEY}   # Secret - resolved at runtime
+```
+**Secret Patterns (deferred to runtime):**
+- `*_API_KEY`, `*_SECRET`, `*_TOKEN`, `*_PASSWORD`, `*_CREDENTIAL`, `SECRET_*`
+## 4. Input Mapping
+```yaml
+- kind: function_node
+  metadata:
+    name: merger
+  spec:
+    fn: myapp.merge_results
+    input_mapping:
+      request_id: $input.id          # From initial input
+      analysis: analyzer.result       # From dependency
+  dependencies: [analyzer]
+```
+## Quick Reference
+| Syntax | Location | Purpose |
+|--------|----------|---------|
+| `$input.field` | input_mapping | Access initial pipeline input |
+| `{{node.field}}` | prompt_template | Jinja2 template reference |
+| `${VAR}` | Any string | Environment variable |
+| `${VAR:default}` | Any string | Env var with default |
+| `node.path` | input_mapping | Dependency output extraction |
+"""
+    def generate_extension_guide(
+        self,
+        adapters: list[AdapterDoc],
+        nodes: list[NodeDoc],
+        tools: list[ToolDoc],
+    ) -> str:
+        """Generate extension overview guide.
+        Parameters
+        ----------
+        adapters : list[AdapterDoc]
+            List of adapter documentation objects
+        nodes : list[NodeDoc]
+            List of node documentation objects
+        tools : list[ToolDoc]
+            List of tool documentation objects
+        Returns
+        -------
+        str
+            Complete extension guide as markdown
+        """
+        lines = [
+            "# Extending hexDAG - Overview",
+            "",
+            "## Extension Points",
+            "",
+            "| Component | Purpose | Available |",
+            "|-----------|---------|-----------|",
+            f"| **Adapter** | Connect to external services | {len(adapters)} |",
+            f"| **Node** | Custom processing logic | {len(nodes)} |",
+            f"| **Tool** | Agent-callable functions | {len(tools)} |",
+            "",
+            "## Quick Reference",
+            "",
+            "### Adapters",
+            "Use `get_custom_adapter_guide()` for full documentation.",
+            "",
+            "### Nodes",
+            "Use `get_custom_node_guide()` for full documentation.",
+            "",
+            "### Tools",
+            "Use `get_custom_tool_guide()` for full documentation.",
+            "",
+            "## MCP Tools for Development",
+            "",
+            "| Tool | Purpose |",
+            "|------|---------|",
+            "| `list_nodes()` | See available nodes |",
+            "| `list_adapters()` | See available adapters |",
+            "| `list_tools()` | See available tools |",
+            "| `get_component_schema()` | Get config schema |",
+            "| `validate_yaml_pipeline()` | Validate your YAML |",
+            "| `get_pipeline_schema()` | Get full JSON schema |",
+        ]
+        return "\n".join(lines)
+    def generate_pipeline_schema_guide(self) -> str:
+        """Generate pipeline schema reference guide from JSON schema.
+        Reads the auto-generated pipeline-schema.json and produces
+        a human-readable markdown reference.
+        Returns
+        -------
+        str
+            Complete pipeline schema guide as markdown
+        """
+        lines = [
+            "# hexDAG Pipeline Schema Reference",
+            "",
+            "This reference is auto-generated from the pipeline JSON schema.",
+            "",
+            "## Overview",
+            "",
+            "hexDAG pipelines are defined in YAML using a Kubernetes-like structure.",
+            "The schema provides validation and IDE autocompletion support.",
+            "",
+            "## Pipeline Structure",
+            "",
+            "```yaml",
+            "apiVersion: hexdag/v1",
+            "kind: Pipeline",
+            "metadata:",
+            "  name: my-pipeline",
+            "  description: Pipeline description",
+            "spec:",
+            "  ports: {}     # Adapter configurations",
+            "  nodes: []     # Processing nodes",
+            "  events: {}    # Event handlers",
+            "```",
+            "",
+        ]
+        # Try to load and parse schema
+        try:
+            schema = self._load_schema()
+            if schema:
+                lines.extend(self._generate_node_types_section(schema))
+                lines.extend(self._generate_ports_section(schema))
+                lines.extend(self._generate_events_section(schema))
+        except Exception as e:
+            logger.warning(f"Could not load pipeline schema: {e}")
+            lines.extend([
+                "## Node Types",
+                "",
+                "*Schema not available. Run `scripts/generate_schemas.py` first.*",
+                "",
+            ])
+        # Add IDE setup section
+        lines.extend([
+            "## IDE Setup",
+            "",
+            "### VS Code",
+            "",
+            "Add to `.vscode/settings.json`:",
+            "",
+            "```json",
+            "{",
+            '  "yaml.schemas": {',
+            '    "./schemas/pipeline-schema.json": ["*.yaml", "pipelines/*.yaml"]',
+            "  }",
+            "}",
+            "```",
+            "",
+            "### Schema Location",
+            "",
+            (
+                "The schema file is at `schemas/pipeline-schema.json` and is "
+                "auto-generated from node `_yaml_schema` attributes."
+            ),
+        ])
+        return "\n".join(lines)
+    def _load_schema(self) -> dict[str, Any] | None:
+        """Load the pipeline schema JSON file.
+        Returns
+        -------
+        dict[str, Any] | None
+            Parsed schema or None if not found
+        """
+        if not SCHEMA_PATH.exists():
+            return None
+        return json.loads(SCHEMA_PATH.read_text())
+    def _generate_node_types_section(self, schema: dict[str, Any]) -> list[str]:
+        """Generate node types documentation from schema.
+        Parameters
+        ----------
+        schema : dict[str, Any]
+            Parsed JSON schema
+        Returns
+        -------
+        list[str]
+            Lines of markdown documentation
+        """
+        lines = ["## Node Types", ""]
+        defs = schema.get("$defs", {})
+        # Find all node specs
+        node_specs = [(name, spec) for name, spec in defs.items() if name.endswith("NodeSpec")]
+        if not node_specs:
+            lines.append("*No node types found in schema.*")
+            lines.append("")
+            return lines
+        # Generate table
+        lines.append("| Node Kind | Description |")
+        lines.append("|-----------|-------------|")
+        for name, spec in sorted(node_specs):
+            kind = name.replace("NodeSpec", "").lower()
+            # Convert CamelCase to snake_case
+            kind = "".join(f"_{c.lower()}" if c.isupper() else c for c in kind).lstrip("_")
+            # Get description from spec
+            desc = spec.get("description", "")
+            if not desc:
+                props = spec.get("properties", {})
+                spec_prop = props.get("spec", {})
+                desc = spec_prop.get("description", "No description")
+            # Truncate long descriptions
+            if len(desc) > 60:
+                desc = desc[:57] + "..."
+            lines.append(f"| `{kind}_node` | {desc} |")
+        lines.append("")
+        # Generate detailed sections for each node
+        for name, spec in sorted(node_specs):
+            lines.extend(self._generate_node_detail(name, spec))
+        return lines
+    def _generate_node_detail(self, name: str, spec: dict[str, Any]) -> list[str]:
+        """Generate detailed documentation for a single node type.
+        Parameters
+        ----------
+        name : str
+            Node spec name (e.g., "FunctionNodeSpec")
+        spec : dict[str, Any]
+            Node specification from schema
+        Returns
+        -------
+        list[str]
+            Lines of markdown documentation
+        """
+        kind = name.replace("NodeSpec", "").lower()
+        kind = "".join(f"_{c.lower()}" if c.isupper() else c for c in kind).lstrip("_")
+        lines = [f"### {kind}_node", ""]
+        # Get description
+        props = spec.get("properties", {})
+        spec_prop = props.get("spec", {})
+        desc = spec_prop.get("description", spec.get("description", ""))
+        if desc:
+            lines.append(desc)
+            lines.append("")
+        # Extract spec properties
+        spec_props = spec_prop.get("properties", {})
+        required = spec_prop.get("required", [])
+        if spec_props:
+            lines.append("**Parameters:**")
+            lines.append("")
+            lines.append("| Parameter | Type | Required | Description |")
+            lines.append("|-----------|------|----------|-------------|")
+            for param_name, param_spec in sorted(spec_props.items()):
+                param_type = self._get_type_from_schema(param_spec)
+                is_required = "Yes" if param_name in required else "No"
+                param_desc = param_spec.get("description", "")
+                if len(param_desc) > 40:
+                    param_desc = param_desc[:37] + "..."
+                lines.append(f"| `{param_name}` | {param_type} | {is_required} | {param_desc} |")
+            lines.append("")
+        # Add example
+        lines.append("**Example:**")
+        lines.append("")
+        lines.append("```yaml")
+        lines.append(f"- kind: {kind}_node")
+        lines.append("  metadata:")
+        lines.append(f"    name: my_{kind}")
+        lines.append("  spec:")
+        # Add required params as example (limit to first 3)
+        lines.extend(f"    {param_name}: # required" for param_name in required[:3])
+        lines.append("  dependencies: []")
+        lines.append("```")
+        lines.append("")
+        return lines
+    def _get_type_from_schema(self, spec: dict[str, Any]) -> str:
+        """Extract type string from JSON schema property.
+        Parameters
+        ----------
+        spec : dict[str, Any]
+            Property specification
+        Returns
+        -------
+        str
+            Human-readable type string
+        """
+        if "const" in spec:
+            return f'`"{spec["const"]}"`'
+        if "enum" in spec:
+            return " | ".join(f'`"{v}`"' for v in spec["enum"][:3])
+        if "anyOf" in spec:
+            types = [self._get_type_from_schema(s) for s in spec["anyOf"][:2]]
+            return " | ".join(types)
+        type_val = spec.get("type")
+        if isinstance(type_val, list):
+            return " | ".join(type_val)
+        if type_val == "array":
+            items = spec.get("items", {})
+            item_type = items.get("type", "any")
+            return f"list[{item_type}]"
+        if type_val:
+            return type_val
+        return "any"
+    def _generate_ports_section(self, schema: dict[str, Any]) -> list[str]:
+        """Generate ports documentation from schema.
+        Parameters
+        ----------
+        schema : dict[str, Any]
+            Parsed JSON schema
+        Returns
+        -------
+        list[str]
+            Lines of markdown documentation
+        """
+        return [
+            "## Ports Configuration",
+            "",
+            "Ports connect pipelines to external services:",
+            "",
+            "```yaml",
+            "spec:",
+            "  ports:",
+            "    llm:",
+            "      adapter: hexdag.builtin.adapters.openai.OpenAIAdapter",
+            "      config:",
+            "        api_key: ${OPENAI_API_KEY}",
+            "        model: gpt-4",
+            "    memory:",
+            "      adapter: hexdag.builtin.adapters.memory.InMemoryMemory",
+            "    database:",
+            "      adapter: hexdag.builtin.adapters.database.sqlite.SQLiteAdapter",
+            "      config:",
+            "        db_path: ./data.db",
+            "```",
+            "",
+            "### Available Port Types",
+            "",
+            "| Port | Purpose |",
+            "|------|---------|",
+            "| `llm` | Language model interactions |",
+            "| `memory` | Persistent agent memory |",
+            "| `database` | Data persistence |",
+            "| `secret` | Secret/credential management |",
+            "| `tool_router` | Tool invocation routing |",
+            "",
+        ]
+    def _generate_events_section(self, schema: dict[str, Any]) -> list[str]:
+        """Generate events documentation from schema.
+        Parameters
+        ----------
+        schema : dict[str, Any]
+            Parsed JSON schema
+        Returns
+        -------
+        list[str]
+            Lines of markdown documentation
+        """
+        return [
+            "## Events Configuration",
+            "",
+            "Configure event handlers for observability:",
+            "",
+            "```yaml",
+            "spec:",
+            "  events:",
+            "    node_failed:",
+            "      - type: alert",
+            "        target: pagerduty",
+            "        severity: high",
+            "    pipeline_completed:",
+            "      - type: metrics",
+            "        target: datadog",
+            "```",
+            "",
+            "### Event Types",
+            "",
+            "| Event | When Triggered |",
+            "|-------|----------------|",
+            "| `pipeline_started` | Pipeline execution begins |",
+            "| `pipeline_completed` | Pipeline execution finishes |",
+            "| `node_started` | Node execution begins |",
+            "| `node_completed` | Node execution finishes |",
+            "| `node_failed` | Node execution fails |",
+            "",
+            "### Handler Types",
+            "",
+            "| Type | Purpose |",
+            "|------|---------|",
+            "| `alert` | Send alerts (PagerDuty, Slack) |",
+            "| `metrics` | Emit metrics (Datadog, Prometheus) |",
+            "| `log` | Write to logs |",
+            "| `webhook` | Call external webhooks |",
+            "| `callback` | Execute Python callbacks |",
+            "",
+        ]