htmlgraph 0.9.3__py3-none-any.whl → 0.27.5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (331)
  1. htmlgraph/.htmlgraph/.session-warning-state.json +6 -0
  2. htmlgraph/.htmlgraph/agents.json +72 -0
  3. htmlgraph/.htmlgraph/htmlgraph.db +0 -0
  4. htmlgraph/__init__.py +173 -17
  5. htmlgraph/__init__.pyi +123 -0
  6. htmlgraph/agent_detection.py +127 -0
  7. htmlgraph/agent_registry.py +45 -30
  8. htmlgraph/agents.py +160 -107
  9. htmlgraph/analytics/__init__.py +9 -2
  10. htmlgraph/analytics/cli.py +190 -51
  11. htmlgraph/analytics/cost_analyzer.py +391 -0
  12. htmlgraph/analytics/cost_monitor.py +664 -0
  13. htmlgraph/analytics/cost_reporter.py +675 -0
  14. htmlgraph/analytics/cross_session.py +617 -0
  15. htmlgraph/analytics/dependency.py +192 -100
  16. htmlgraph/analytics/pattern_learning.py +771 -0
  17. htmlgraph/analytics/session_graph.py +707 -0
  18. htmlgraph/analytics/strategic/__init__.py +80 -0
  19. htmlgraph/analytics/strategic/cost_optimizer.py +611 -0
  20. htmlgraph/analytics/strategic/pattern_detector.py +876 -0
  21. htmlgraph/analytics/strategic/preference_manager.py +709 -0
  22. htmlgraph/analytics/strategic/suggestion_engine.py +747 -0
  23. htmlgraph/analytics/work_type.py +190 -14
  24. htmlgraph/analytics_index.py +135 -51
  25. htmlgraph/api/__init__.py +3 -0
  26. htmlgraph/api/cost_alerts_websocket.py +416 -0
  27. htmlgraph/api/main.py +2498 -0
  28. htmlgraph/api/static/htmx.min.js +1 -0
  29. htmlgraph/api/static/style-redesign.css +1344 -0
  30. htmlgraph/api/static/style.css +1079 -0
  31. htmlgraph/api/templates/dashboard-redesign.html +1366 -0
  32. htmlgraph/api/templates/dashboard.html +794 -0
  33. htmlgraph/api/templates/partials/activity-feed-hierarchical.html +326 -0
  34. htmlgraph/api/templates/partials/activity-feed.html +1100 -0
  35. htmlgraph/api/templates/partials/agents-redesign.html +317 -0
  36. htmlgraph/api/templates/partials/agents.html +317 -0
  37. htmlgraph/api/templates/partials/event-traces.html +373 -0
  38. htmlgraph/api/templates/partials/features-kanban-redesign.html +509 -0
  39. htmlgraph/api/templates/partials/features.html +578 -0
  40. htmlgraph/api/templates/partials/metrics-redesign.html +346 -0
  41. htmlgraph/api/templates/partials/metrics.html +346 -0
  42. htmlgraph/api/templates/partials/orchestration-redesign.html +443 -0
  43. htmlgraph/api/templates/partials/orchestration.html +198 -0
  44. htmlgraph/api/templates/partials/spawners.html +375 -0
  45. htmlgraph/api/templates/partials/work-items.html +613 -0
  46. htmlgraph/api/websocket.py +538 -0
  47. htmlgraph/archive/__init__.py +24 -0
  48. htmlgraph/archive/bloom.py +234 -0
  49. htmlgraph/archive/fts.py +297 -0
  50. htmlgraph/archive/manager.py +583 -0
  51. htmlgraph/archive/search.py +244 -0
  52. htmlgraph/atomic_ops.py +560 -0
  53. htmlgraph/attribute_index.py +208 -0
  54. htmlgraph/bounded_paths.py +539 -0
  55. htmlgraph/builders/__init__.py +14 -0
  56. htmlgraph/builders/base.py +118 -29
  57. htmlgraph/builders/bug.py +150 -0
  58. htmlgraph/builders/chore.py +119 -0
  59. htmlgraph/builders/epic.py +150 -0
  60. htmlgraph/builders/feature.py +31 -6
  61. htmlgraph/builders/insight.py +195 -0
  62. htmlgraph/builders/metric.py +217 -0
  63. htmlgraph/builders/pattern.py +202 -0
  64. htmlgraph/builders/phase.py +162 -0
  65. htmlgraph/builders/spike.py +52 -19
  66. htmlgraph/builders/track.py +148 -72
  67. htmlgraph/cigs/__init__.py +81 -0
  68. htmlgraph/cigs/autonomy.py +385 -0
  69. htmlgraph/cigs/cost.py +475 -0
  70. htmlgraph/cigs/messages_basic.py +472 -0
  71. htmlgraph/cigs/messaging.py +365 -0
  72. htmlgraph/cigs/models.py +771 -0
  73. htmlgraph/cigs/pattern_storage.py +427 -0
  74. htmlgraph/cigs/patterns.py +503 -0
  75. htmlgraph/cigs/posttool_analyzer.py +234 -0
  76. htmlgraph/cigs/reporter.py +818 -0
  77. htmlgraph/cigs/tracker.py +317 -0
  78. htmlgraph/cli/.htmlgraph/.session-warning-state.json +6 -0
  79. htmlgraph/cli/.htmlgraph/agents.json +72 -0
  80. htmlgraph/cli/.htmlgraph/htmlgraph.db +0 -0
  81. htmlgraph/cli/__init__.py +42 -0
  82. htmlgraph/cli/__main__.py +6 -0
  83. htmlgraph/cli/analytics.py +1424 -0
  84. htmlgraph/cli/base.py +685 -0
  85. htmlgraph/cli/constants.py +206 -0
  86. htmlgraph/cli/core.py +954 -0
  87. htmlgraph/cli/main.py +147 -0
  88. htmlgraph/cli/models.py +475 -0
  89. htmlgraph/cli/templates/__init__.py +1 -0
  90. htmlgraph/cli/templates/cost_dashboard.py +399 -0
  91. htmlgraph/cli/work/__init__.py +239 -0
  92. htmlgraph/cli/work/browse.py +115 -0
  93. htmlgraph/cli/work/features.py +568 -0
  94. htmlgraph/cli/work/orchestration.py +676 -0
  95. htmlgraph/cli/work/report.py +728 -0
  96. htmlgraph/cli/work/sessions.py +466 -0
  97. htmlgraph/cli/work/snapshot.py +559 -0
  98. htmlgraph/cli/work/tracks.py +486 -0
  99. htmlgraph/cli_commands/__init__.py +1 -0
  100. htmlgraph/cli_commands/feature.py +195 -0
  101. htmlgraph/cli_framework.py +115 -0
  102. htmlgraph/collections/__init__.py +18 -0
  103. htmlgraph/collections/base.py +415 -98
  104. htmlgraph/collections/bug.py +53 -0
  105. htmlgraph/collections/chore.py +53 -0
  106. htmlgraph/collections/epic.py +53 -0
  107. htmlgraph/collections/feature.py +12 -26
  108. htmlgraph/collections/insight.py +100 -0
  109. htmlgraph/collections/metric.py +92 -0
  110. htmlgraph/collections/pattern.py +97 -0
  111. htmlgraph/collections/phase.py +53 -0
  112. htmlgraph/collections/session.py +194 -0
  113. htmlgraph/collections/spike.py +56 -16
  114. htmlgraph/collections/task_delegation.py +241 -0
  115. htmlgraph/collections/todo.py +511 -0
  116. htmlgraph/collections/traces.py +487 -0
  117. htmlgraph/config/cost_models.json +56 -0
  118. htmlgraph/config.py +190 -0
  119. htmlgraph/context_analytics.py +344 -0
  120. htmlgraph/converter.py +216 -28
  121. htmlgraph/cost_analysis/__init__.py +5 -0
  122. htmlgraph/cost_analysis/analyzer.py +438 -0
  123. htmlgraph/dashboard.html +2406 -307
  124. htmlgraph/dashboard.html.backup +6592 -0
  125. htmlgraph/dashboard.html.bak +7181 -0
  126. htmlgraph/dashboard.html.bak2 +7231 -0
  127. htmlgraph/dashboard.html.bak3 +7232 -0
  128. htmlgraph/db/__init__.py +38 -0
  129. htmlgraph/db/queries.py +790 -0
  130. htmlgraph/db/schema.py +1788 -0
  131. htmlgraph/decorators.py +317 -0
  132. htmlgraph/dependency_models.py +19 -2
  133. htmlgraph/deploy.py +142 -125
  134. htmlgraph/deployment_models.py +474 -0
  135. htmlgraph/docs/API_REFERENCE.md +841 -0
  136. htmlgraph/docs/HTTP_API.md +750 -0
  137. htmlgraph/docs/INTEGRATION_GUIDE.md +752 -0
  138. htmlgraph/docs/ORCHESTRATION_PATTERNS.md +717 -0
  139. htmlgraph/docs/README.md +532 -0
  140. htmlgraph/docs/__init__.py +77 -0
  141. htmlgraph/docs/docs_version.py +55 -0
  142. htmlgraph/docs/metadata.py +93 -0
  143. htmlgraph/docs/migrations.py +232 -0
  144. htmlgraph/docs/template_engine.py +143 -0
  145. htmlgraph/docs/templates/_sections/cli_reference.md.j2 +52 -0
  146. htmlgraph/docs/templates/_sections/core_concepts.md.j2 +29 -0
  147. htmlgraph/docs/templates/_sections/sdk_basics.md.j2 +69 -0
  148. htmlgraph/docs/templates/base_agents.md.j2 +78 -0
  149. htmlgraph/docs/templates/example_user_override.md.j2 +47 -0
  150. htmlgraph/docs/version_check.py +163 -0
  151. htmlgraph/edge_index.py +182 -27
  152. htmlgraph/error_handler.py +544 -0
  153. htmlgraph/event_log.py +100 -52
  154. htmlgraph/event_migration.py +13 -4
  155. htmlgraph/exceptions.py +49 -0
  156. htmlgraph/file_watcher.py +101 -28
  157. htmlgraph/find_api.py +75 -63
  158. htmlgraph/git_events.py +145 -63
  159. htmlgraph/graph.py +1122 -106
  160. htmlgraph/hooks/.htmlgraph/.session-warning-state.json +6 -0
  161. htmlgraph/hooks/.htmlgraph/agents.json +72 -0
  162. htmlgraph/hooks/.htmlgraph/index.sqlite +0 -0
  163. htmlgraph/hooks/__init__.py +45 -0
  164. htmlgraph/hooks/bootstrap.py +169 -0
  165. htmlgraph/hooks/cigs_pretool_enforcer.py +354 -0
  166. htmlgraph/hooks/concurrent_sessions.py +208 -0
  167. htmlgraph/hooks/context.py +350 -0
  168. htmlgraph/hooks/drift_handler.py +525 -0
  169. htmlgraph/hooks/event_tracker.py +1314 -0
  170. htmlgraph/hooks/git_commands.py +175 -0
  171. htmlgraph/hooks/hooks-config.example.json +12 -0
  172. htmlgraph/hooks/installer.py +343 -0
  173. htmlgraph/hooks/orchestrator.py +674 -0
  174. htmlgraph/hooks/orchestrator_reflector.py +223 -0
  175. htmlgraph/hooks/post-checkout.sh +28 -0
  176. htmlgraph/hooks/post-commit.sh +24 -0
  177. htmlgraph/hooks/post-merge.sh +26 -0
  178. htmlgraph/hooks/post_tool_use_failure.py +273 -0
  179. htmlgraph/hooks/post_tool_use_handler.py +257 -0
  180. htmlgraph/hooks/posttooluse.py +408 -0
  181. htmlgraph/hooks/pre-commit.sh +94 -0
  182. htmlgraph/hooks/pre-push.sh +28 -0
  183. htmlgraph/hooks/pretooluse.py +819 -0
  184. htmlgraph/hooks/prompt_analyzer.py +637 -0
  185. htmlgraph/hooks/session_handler.py +668 -0
  186. htmlgraph/hooks/session_summary.py +395 -0
  187. htmlgraph/hooks/state_manager.py +504 -0
  188. htmlgraph/hooks/subagent_detection.py +202 -0
  189. htmlgraph/hooks/subagent_stop.py +369 -0
  190. htmlgraph/hooks/task_enforcer.py +255 -0
  191. htmlgraph/hooks/task_validator.py +177 -0
  192. htmlgraph/hooks/validator.py +628 -0
  193. htmlgraph/ids.py +41 -27
  194. htmlgraph/index.d.ts +286 -0
  195. htmlgraph/learning.py +767 -0
  196. htmlgraph/mcp_server.py +69 -23
  197. htmlgraph/models.py +1586 -87
  198. htmlgraph/operations/README.md +62 -0
  199. htmlgraph/operations/__init__.py +79 -0
  200. htmlgraph/operations/analytics.py +339 -0
  201. htmlgraph/operations/bootstrap.py +289 -0
  202. htmlgraph/operations/events.py +244 -0
  203. htmlgraph/operations/fastapi_server.py +231 -0
  204. htmlgraph/operations/hooks.py +350 -0
  205. htmlgraph/operations/initialization.py +597 -0
  206. htmlgraph/operations/initialization.py.backup +228 -0
  207. htmlgraph/operations/server.py +303 -0
  208. htmlgraph/orchestration/__init__.py +58 -0
  209. htmlgraph/orchestration/claude_launcher.py +179 -0
  210. htmlgraph/orchestration/command_builder.py +72 -0
  211. htmlgraph/orchestration/headless_spawner.py +281 -0
  212. htmlgraph/orchestration/live_events.py +377 -0
  213. htmlgraph/orchestration/model_selection.py +327 -0
  214. htmlgraph/orchestration/plugin_manager.py +140 -0
  215. htmlgraph/orchestration/prompts.py +137 -0
  216. htmlgraph/orchestration/spawner_event_tracker.py +383 -0
  217. htmlgraph/orchestration/spawners/__init__.py +16 -0
  218. htmlgraph/orchestration/spawners/base.py +194 -0
  219. htmlgraph/orchestration/spawners/claude.py +173 -0
  220. htmlgraph/orchestration/spawners/codex.py +435 -0
  221. htmlgraph/orchestration/spawners/copilot.py +294 -0
  222. htmlgraph/orchestration/spawners/gemini.py +471 -0
  223. htmlgraph/orchestration/subprocess_runner.py +36 -0
  224. htmlgraph/orchestration/task_coordination.py +343 -0
  225. htmlgraph/orchestration.md +563 -0
  226. htmlgraph/orchestrator-system-prompt-optimized.txt +863 -0
  227. htmlgraph/orchestrator.py +669 -0
  228. htmlgraph/orchestrator_config.py +357 -0
  229. htmlgraph/orchestrator_mode.py +328 -0
  230. htmlgraph/orchestrator_validator.py +133 -0
  231. htmlgraph/parallel.py +646 -0
  232. htmlgraph/parser.py +160 -35
  233. htmlgraph/path_query.py +608 -0
  234. htmlgraph/pattern_matcher.py +636 -0
  235. htmlgraph/planning.py +147 -52
  236. htmlgraph/pydantic_models.py +476 -0
  237. htmlgraph/quality_gates.py +350 -0
  238. htmlgraph/query_builder.py +109 -72
  239. htmlgraph/query_composer.py +509 -0
  240. htmlgraph/reflection.py +443 -0
  241. htmlgraph/refs.py +344 -0
  242. htmlgraph/repo_hash.py +512 -0
  243. htmlgraph/repositories/__init__.py +292 -0
  244. htmlgraph/repositories/analytics_repository.py +455 -0
  245. htmlgraph/repositories/analytics_repository_standard.py +628 -0
  246. htmlgraph/repositories/feature_repository.py +581 -0
  247. htmlgraph/repositories/feature_repository_htmlfile.py +668 -0
  248. htmlgraph/repositories/feature_repository_memory.py +607 -0
  249. htmlgraph/repositories/feature_repository_sqlite.py +858 -0
  250. htmlgraph/repositories/filter_service.py +620 -0
  251. htmlgraph/repositories/filter_service_standard.py +445 -0
  252. htmlgraph/repositories/shared_cache.py +621 -0
  253. htmlgraph/repositories/shared_cache_memory.py +395 -0
  254. htmlgraph/repositories/track_repository.py +552 -0
  255. htmlgraph/repositories/track_repository_htmlfile.py +619 -0
  256. htmlgraph/repositories/track_repository_memory.py +508 -0
  257. htmlgraph/repositories/track_repository_sqlite.py +711 -0
  258. htmlgraph/routing.py +8 -19
  259. htmlgraph/scripts/deploy.py +1 -2
  260. htmlgraph/sdk/__init__.py +398 -0
  261. htmlgraph/sdk/__init__.pyi +14 -0
  262. htmlgraph/sdk/analytics/__init__.py +19 -0
  263. htmlgraph/sdk/analytics/engine.py +155 -0
  264. htmlgraph/sdk/analytics/helpers.py +178 -0
  265. htmlgraph/sdk/analytics/registry.py +109 -0
  266. htmlgraph/sdk/base.py +484 -0
  267. htmlgraph/sdk/constants.py +216 -0
  268. htmlgraph/sdk/core.pyi +308 -0
  269. htmlgraph/sdk/discovery.py +120 -0
  270. htmlgraph/sdk/help/__init__.py +12 -0
  271. htmlgraph/sdk/help/mixin.py +699 -0
  272. htmlgraph/sdk/mixins/__init__.py +15 -0
  273. htmlgraph/sdk/mixins/attribution.py +113 -0
  274. htmlgraph/sdk/mixins/mixin.py +410 -0
  275. htmlgraph/sdk/operations/__init__.py +12 -0
  276. htmlgraph/sdk/operations/mixin.py +427 -0
  277. htmlgraph/sdk/orchestration/__init__.py +17 -0
  278. htmlgraph/sdk/orchestration/coordinator.py +203 -0
  279. htmlgraph/sdk/orchestration/spawner.py +204 -0
  280. htmlgraph/sdk/planning/__init__.py +19 -0
  281. htmlgraph/sdk/planning/bottlenecks.py +93 -0
  282. htmlgraph/sdk/planning/mixin.py +211 -0
  283. htmlgraph/sdk/planning/parallel.py +186 -0
  284. htmlgraph/sdk/planning/queue.py +210 -0
  285. htmlgraph/sdk/planning/recommendations.py +87 -0
  286. htmlgraph/sdk/planning/smart_planning.py +319 -0
  287. htmlgraph/sdk/session/__init__.py +19 -0
  288. htmlgraph/sdk/session/continuity.py +57 -0
  289. htmlgraph/sdk/session/handoff.py +110 -0
  290. htmlgraph/sdk/session/info.py +309 -0
  291. htmlgraph/sdk/session/manager.py +103 -0
  292. htmlgraph/sdk/strategic/__init__.py +26 -0
  293. htmlgraph/sdk/strategic/mixin.py +563 -0
  294. htmlgraph/server.py +685 -180
  295. htmlgraph/services/__init__.py +10 -0
  296. htmlgraph/services/claiming.py +199 -0
  297. htmlgraph/session_hooks.py +300 -0
  298. htmlgraph/session_manager.py +1392 -175
  299. htmlgraph/session_registry.py +587 -0
  300. htmlgraph/session_state.py +436 -0
  301. htmlgraph/session_warning.py +201 -0
  302. htmlgraph/sessions/__init__.py +23 -0
  303. htmlgraph/sessions/handoff.py +756 -0
  304. htmlgraph/setup.py +34 -17
  305. htmlgraph/spike_index.py +143 -0
  306. htmlgraph/sync_docs.py +12 -15
  307. htmlgraph/system_prompts.py +450 -0
  308. htmlgraph/templates/AGENTS.md.template +366 -0
  309. htmlgraph/templates/CLAUDE.md.template +97 -0
  310. htmlgraph/templates/GEMINI.md.template +87 -0
  311. htmlgraph/templates/orchestration-view.html +350 -0
  312. htmlgraph/track_builder.py +146 -15
  313. htmlgraph/track_manager.py +69 -21
  314. htmlgraph/transcript.py +890 -0
  315. htmlgraph/transcript_analytics.py +699 -0
  316. htmlgraph/types.py +323 -0
  317. htmlgraph/validation.py +115 -0
  318. htmlgraph/watch.py +8 -5
  319. htmlgraph/work_type_utils.py +3 -2
  320. {htmlgraph-0.9.3.data → htmlgraph-0.27.5.data}/data/htmlgraph/dashboard.html +2406 -307
  321. htmlgraph-0.27.5.data/data/htmlgraph/templates/AGENTS.md.template +366 -0
  322. htmlgraph-0.27.5.data/data/htmlgraph/templates/CLAUDE.md.template +97 -0
  323. htmlgraph-0.27.5.data/data/htmlgraph/templates/GEMINI.md.template +87 -0
  324. {htmlgraph-0.9.3.dist-info → htmlgraph-0.27.5.dist-info}/METADATA +97 -64
  325. htmlgraph-0.27.5.dist-info/RECORD +337 -0
  326. {htmlgraph-0.9.3.dist-info → htmlgraph-0.27.5.dist-info}/entry_points.txt +1 -1
  327. htmlgraph/cli.py +0 -2688
  328. htmlgraph/sdk.py +0 -709
  329. htmlgraph-0.9.3.dist-info/RECORD +0 -61
  330. {htmlgraph-0.9.3.data → htmlgraph-0.27.5.data}/data/htmlgraph/styles.css +0 -0
  331. {htmlgraph-0.9.3.dist-info → htmlgraph-0.27.5.dist-info}/WHEEL +0 -0
htmlgraph/graph.py CHANGED
@@ -6,18 +6,193 @@ Provides:
  - CSS selector queries
  - Graph algorithms (BFS, shortest path, dependency analysis)
  - Bottleneck detection
+ - Transaction/snapshot support for concurrency
  """

+ import hashlib
+ import os
+ import time
  from collections import defaultdict, deque
+ from collections.abc import Callable, Iterator
+ from contextlib import contextmanager
+ from dataclasses import dataclass, field
+ from datetime import datetime
  from pathlib import Path
- from typing import Any, Callable, Iterator
+ from typing import Any, cast

- from htmlgraph.models import Node, Edge
- from htmlgraph.converter import html_to_node, node_to_html, NodeConverter
- from htmlgraph.parser import HtmlParser
+ from htmlgraph.attribute_index import AttributeIndex
+ from htmlgraph.converter import NodeConverter
  from htmlgraph.edge_index import EdgeIndex, EdgeRef
- from htmlgraph.query_builder import QueryBuilder
+ from htmlgraph.exceptions import NodeNotFoundError
  from htmlgraph.find_api import FindAPI
+ from htmlgraph.models import Node
+ from htmlgraph.parser import HtmlParser
+ from htmlgraph.query_builder import QueryBuilder
+
+
+ @dataclass
+ class CompiledQuery:
+ """
+ Pre-compiled CSS selector query for efficient reuse.
+
+ While justhtml doesn't support native selector pre-compilation,
+ this class provides:
+ - Cached selector string to avoid string manipulation overhead
+ - Reusable query execution with metrics tracking
+ - Integration with query cache for performance
+
+ Example:
+ >>> graph = HtmlGraph("features/")
+ >>> compiled = graph.compile_query("[data-status='blocked']")
+ >>> results = graph.query_compiled(compiled) # Fast on reuse
+ >>> results2 = graph.query_compiled(compiled) # Uses cache
+ """
+
+ selector: str
+ _compiled_at: datetime = field(default_factory=datetime.now)
+ _use_count: int = field(default=0, init=False)
+
+ def matches(self, node: Node) -> bool:
+ """
+ Check if a node matches this compiled query.
+
+ Args:
+ node: Node to check
+
+ Returns:
+ True if node matches selector
+ """
+ try:
+ # Convert node to HTML in-memory
+ html_content = node.to_html()
+
+ # Parse the HTML string
+ parser = HtmlParser.from_string(html_content)
+
+ # Check if selector matches
+ return bool(parser.query(f"article{self.selector}"))
+ except Exception:
+ return False
+
+ def execute(self, nodes: dict[str, Node]) -> list[Node]:
+ """
+ Execute this compiled query on a set of nodes.
+
+ Args:
+ nodes: Dict of nodes to query
+
+ Returns:
+ List of matching nodes
+ """
+ self._use_count += 1
+ return [node for node in nodes.values() if self.matches(node)]
+
+
+ class GraphSnapshot:
+ """
+ Immutable snapshot of graph state at a point in time.
+
+ Provides read-only access to graph data without affecting the original graph.
+ Safe to use across multiple agents or threads.
+
+ Example:
+ snapshot = graph.snapshot()
+ node = snapshot.get("feature-001") # Read-only access
+ results = snapshot.query("[data-status='blocked']")
+ """
+
+ def __init__(self, nodes: dict[str, Node], directory: Path):
+ """
+ Create a snapshot of graph nodes.
+
+ Args:
+ nodes: Dictionary of nodes to snapshot
+ directory: Graph directory (for context)
+ """
+ # Deep copy to prevent external mutations
+ self._nodes = {
+ node_id: node.model_copy(deep=True) for node_id, node in nodes.items()
+ }
+ self._directory = directory
+
+ def get(self, node_id: str) -> Node | None:
+ """
+ Get a node by ID from the snapshot.
+
+ Args:
+ node_id: Node identifier
+
+ Returns:
+ Node instance or None if not found
+ """
+ node = self._nodes.get(node_id)
+ # Return a copy to prevent mutation of snapshot
+ return node.model_copy(deep=True) if node else None
+
+ def query(self, selector: str) -> list[Node]:
+ """
+ Query nodes using CSS selector.
+
+ Args:
+ selector: CSS selector string
+
+ Returns:
+ List of matching nodes (copies)
+ """
+ matching = []
+
+ for node in self._nodes.values():
+ try:
+ # Convert node to HTML in-memory
+ html_content = node.to_html()
+
+ # Parse the HTML string
+ parser = HtmlParser.from_string(html_content)
+
+ # Check if selector matches
+ if parser.query(f"article{selector}"):
+ # Return copy to prevent mutation
+ matching.append(node.model_copy(deep=True))
+ except Exception:
+ # Skip nodes that fail to parse
+ continue
+
+ return matching
+
+ def filter(self, predicate: Callable[[Node], bool]) -> list[Node]:
+ """
+ Filter nodes using a predicate function.
+
+ Args:
+ predicate: Function that takes Node and returns bool
+
+ Returns:
+ List of matching nodes (copies)
+ """
+ return [
+ node.model_copy(deep=True)
+ for node in self._nodes.values()
+ if predicate(node)
+ ]
+
+ def __len__(self) -> int:
+ """Get number of nodes in snapshot."""
+ return len(self._nodes)
+
+ def __contains__(self, node_id: str) -> bool:
+ """Check if node exists in snapshot."""
+ return node_id in self._nodes
+
+ def __iter__(self) -> Iterator[Node]:
+ """Iterate over nodes in snapshot (returns copies)."""
+ return iter(node.model_copy(deep=True) for node in self._nodes.values())
+
+ @property
+ def nodes(self) -> dict[str, Node]:
+ """Get all nodes as a dict (returns copies)."""
+ return {
+ node_id: node.model_copy(deep=True) for node_id, node in self._nodes.items()
+ }


  class HtmlGraph:
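A note on the two classes added above: they are exercised through HtmlGraph methods that appear later in this diff (compile_query, query_compiled, snapshot). The following is an illustrative sketch only, not part of the package diff; it assumes HtmlGraph is imported from htmlgraph.graph as defined in this file, and the selector and node ID are placeholder values.

    from htmlgraph.graph import HtmlGraph

    graph = HtmlGraph("features/")

    # Compile a selector once and reuse it; repeated executions also hit the query cache.
    blocked_q = graph.compile_query("[data-status='blocked']")
    blocked = graph.query_compiled(blocked_q)

    # Take an immutable, deep-copied snapshot; later writes to the graph do not affect it.
    snap = graph.snapshot()
    if "feature-001" in snap:
        frozen = snap.get("feature-001")  # returns a copy, safe to read concurrently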
@@ -38,8 +213,8 @@ class HtmlGraph:
  self,
  directory: Path | str,
  stylesheet_path: str = "../styles.css",
- auto_load: bool = True,
- pattern: str | list[str] = "*.html"
+ auto_load: bool = False,
+ pattern: str | list[str] = "*.html",
  ):
  """
  Initialize graph from a directory.
@@ -47,7 +222,7 @@ class HtmlGraph:
  Args:
  directory: Directory containing HTML node files
  stylesheet_path: Default stylesheet path for new files
- auto_load: Whether to load all nodes on init
+ auto_load: Whether to load all nodes on init (default: False for lazy loading)
  pattern: Glob pattern(s) for node files. Can be a single pattern or list.
  Examples: "*.html", ["*.html", "*/index.html"]
  """
@@ -59,10 +234,84 @@ class HtmlGraph:
  self._nodes: dict[str, Node] = {}
  self._converter = NodeConverter(directory, stylesheet_path)
  self._edge_index = EdgeIndex()
+ self._attr_index = AttributeIndex()
+ self._query_cache: dict[str, list[Node]] = {}
+ self._adjacency_cache: dict[str, dict[str, list[str]]] | None = None
+ self._cache_enabled: bool = True
+ self._explicitly_loaded: bool = False
+ self._file_hashes: dict[str, str] = {} # Track file content hashes
+
+ # Query compilation cache (LRU cache with max 100 compiled queries)
+ self._compiled_queries: dict[str, CompiledQuery] = {}
+ self._compiled_query_max_size: int = 100
+
+ # Performance metrics
+ self._metrics = {
+ "query_count": 0,
+ "cache_hits": 0,
+ "cache_misses": 0,
+ "reload_count": 0,
+ "single_reload_count": 0,
+ "total_query_time_ms": 0.0,
+ "slowest_query_ms": 0.0,
+ "slowest_query_selector": "",
+ "last_reload_time_ms": 0.0,
+ "compiled_queries": 0,
+ "compiled_query_hits": 0,
+ "auto_compiled_count": 0,
+ }
+
+ # Check for env override (backwards compatibility)
+ if os.environ.get("HTMLGRAPH_EAGER_LOAD") == "1":
+ auto_load = True

  if auto_load:
  self.reload()

+ def _invalidate_cache(self) -> None:
+ """Clear query, adjacency, attribute, and compiled query caches. Called when graph is modified."""
+ self._query_cache.clear()
+ self._compiled_queries.clear()
+ self._adjacency_cache = None
+ self._attr_index.clear()
+
+ def _compute_file_hash(self, filepath: Path) -> str:
+ """
+ Compute MD5 hash of file content.
+
+ Args:
+ filepath: Path to file to hash
+
+ Returns:
+ MD5 hash as hex string
+ """
+ try:
+ content = filepath.read_bytes()
+ return hashlib.md5(content).hexdigest()
+ except Exception:
+ return ""
+
+ def has_file_changed(self, filepath: Path | str) -> bool:
+ """
+ Check if a file has changed since it was last loaded.
+
+ Args:
+ filepath: Path to file to check
+
+ Returns:
+ True if file changed or not yet loaded, False if unchanged
+ """
+ filepath = Path(filepath)
+ if not filepath.exists():
+ return True
+
+ filepath_str = str(filepath)
+ current_hash = self._compute_file_hash(filepath)
+ stored_hash = self._file_hashes.get(filepath_str)
+
+ # If no stored hash or hash changed, file has changed
+ return stored_hash is None or current_hash != stored_hash
+
  def reload(self) -> int:
  """
  Reload all nodes from disk.
@@ -70,14 +319,70 @@ class HtmlGraph:
  Returns:
  Number of nodes loaded
  """
- self._nodes.clear()
- for node in self._converter.load_all(self.pattern):
- self._nodes[node.id] = node
+ start = time.perf_counter()
+ self._cache_enabled = False # Disable during reload
+ try:
+ self._nodes.clear()
+ self._file_hashes.clear()
+
+ # Load all nodes and compute file hashes
+ for node in self._converter.load_all(self.pattern):
+ self._nodes[node.id] = node
+
+ # Find and hash the node file
+ filepath = self._find_node_file(node.id)
+ if filepath:
+ file_hash = self._compute_file_hash(filepath)
+ self._file_hashes[str(filepath)] = file_hash
+
+ # Rebuild edge index for O(1) reverse lookups
+ # Rebuild attribute index for O(1) attribute lookups
+ self._attr_index.rebuild(self._nodes)
+ self._edge_index.rebuild(self._nodes)
+
+ self._explicitly_loaded = True
+
+ # Track metrics
+ elapsed_ms = (time.perf_counter() - start) * 1000
+ reload_count: int = int(self._metrics.get("reload_count", 0)) # type: ignore[call-overload]
+ self._metrics["reload_count"] = reload_count + 1
+ self._metrics["last_reload_time_ms"] = elapsed_ms
+
+ return len(self._nodes)
+ finally:
+ self._cache_enabled = True
+ self._invalidate_cache()
+
+ def _ensure_loaded(self) -> None:
+ """Ensure nodes are loaded. Called lazily on first access."""
+ if not self._explicitly_loaded and not self._nodes:
+ self.reload()

- # Rebuild edge index for O(1) reverse lookups
- self._edge_index.rebuild(self._nodes)
+ def _get_node_files(self) -> list[Path]:
+ """
+ Get all node files matching the configured pattern(s).

- return len(self._nodes)
+ Returns:
+ List of Path objects for node files
+ """
+ files: list[Path] = []
+ patterns = [self.pattern] if isinstance(self.pattern, str) else self.pattern
+ for pattern in patterns:
+ files.extend(self.directory.glob(pattern))
+ return files
+
+ def _filepath_to_node_id(self, filepath: Path) -> str:
+ """
+ Extract node ID from a filepath.
+
+ Handles:
+ - Flat files: features/node-id.html -> "node-id"
+ - Directory-based: features/node-id/index.html -> "node-id"
+ """
+ if filepath.name == "index.html":
+ return filepath.parent.name
+ else:
+ return filepath.stem

  @property
  def nodes(self) -> dict[str, Node]:
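With auto_load now defaulting to False, nodes are parsed only on first access; node_count (added further below) globs files without parsing, and the MD5 file hashes recorded above let callers skip redundant reloads. An illustrative sketch only, based on helpers shown elsewhere in this diff; the environment variable comes from the hunk above, while the directory and file name are placeholders.

    import os

    os.environ.pop("HTMLGRAPH_EAGER_LOAD", None)  # unset -> lazy loading (the new default)
    graph = HtmlGraph("features/")                # nothing is parsed yet
    total = graph.node_count                      # counts node files via glob only
    node = graph.get("feature-001")               # first access triggers a lazy reload()

    # Hash-based change detection: reload only when the file content actually changed.
    if graph.has_file_changed(graph.directory / "feature-001.html"):
        graph.reload()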
@@ -85,18 +390,272 @@ class HtmlGraph:
  return self._nodes.copy()

  def __len__(self) -> int:
- """Number of nodes in graph."""
+ """
+ Get the number of nodes in the graph.
+
+ Enables using len() on graph instances.
+
+ Returns:
+ int: Total number of nodes
+
+ Example:
+ >>> graph = HtmlGraph("features/")
+ >>> print(f"Graph has {len(graph)} nodes")
+ Graph has 42 nodes
+ """
  return len(self._nodes)

  def __contains__(self, node_id: str) -> bool:
- """Check if node exists."""
+ """
+ Check if a node exists in the graph.
+
+ Enables using 'in' operator on graph instances.
+
+ Args:
+ node_id: Node identifier to check
+
+ Returns:
+ bool: True if node exists, False otherwise
+
+ Example:
+ >>> graph = HtmlGraph("features/")
+ >>> if "feature-001" in graph:
+ ... print("Feature exists!")
+ Feature exists!
+ >>> if "nonexistent" not in graph:
+ ... print("Not found")
+ Not found
+ """
  return node_id in self._nodes

  def __iter__(self) -> Iterator[Node]:
- """Iterate over all nodes."""
+ """
+ Iterate over all nodes in the graph.
+
+ Enables using graphs in for loops and other iteration contexts.
+
+ Yields:
+ Node: Each node in the graph (in arbitrary order)
+
+ Example:
+ >>> graph = HtmlGraph("features/")
+ >>> for node in graph:
+ ... print(f"{node.id}: {node.title} [{node.status}]")
+ feature-001: User Auth [in-progress]
+ feature-002: Database [done]
+
+ >>> # Works with list comprehensions
+ >>> todo_titles = [n.title for n in graph if n.status == "todo"]
+ >>>
+ >>> # Works with any iterable operation
+ >>> high_priority = list(filter(lambda n: n.priority == "high", graph))
+ """
+ self._ensure_loaded()
  return iter(self._nodes.values())

  # =========================================================================
+ # Memory-Efficient Loading (for large graphs 10K+ nodes)
+ # =========================================================================
+
+ def load_chunked(self, chunk_size: int = 100) -> Iterator[list[Node]]:
+ """
+ Yield nodes in chunks for memory-efficient processing.
+
+ Loads nodes in batches without loading the entire graph into memory.
+ Useful for large graphs (10K+ nodes).
+
+ Args:
+ chunk_size: Number of nodes per chunk (default: 100)
+
+ Yields:
+ List of nodes (up to chunk_size per batch)
+
+ Example:
+ >>> graph = HtmlGraph("features/")
+ >>> for chunk in graph.load_chunked(chunk_size=50):
+ ... # Process 50 nodes at a time
+ ... for node in chunk:
+ ... print(node.title)
+ """
+ files = self._get_node_files()
+
+ # Yield nodes in chunks
+ for i in range(0, len(files), chunk_size):
+ chunk = []
+ for filepath in files[i : i + chunk_size]:
+ try:
+ node_id = self._filepath_to_node_id(filepath)
+ node = self._converter.load(node_id)
+ if node:
+ chunk.append(node)
+ except Exception:
+ # Skip files that fail to parse
+ continue
+ if chunk:
+ yield chunk
+
+ def iter_nodes(self) -> Iterator[Node]:
+ """
+ Iterate over all nodes without loading all into memory.
+
+ Memory-efficient iteration for large graphs. Loads nodes one at a time
+ instead of loading the entire graph.
+
+ Yields:
+ Node: Individual nodes from the graph
+
+ Example:
+ >>> graph = HtmlGraph("features/")
+ >>> for node in graph.iter_nodes():
+ ... if node.status == "blocked":
+ ... print(f"Blocked: {node.title}")
+ """
+ for filepath in self._get_node_files():
+ try:
+ node_id = self._filepath_to_node_id(filepath)
+ node = self._converter.load(node_id)
+ if node:
+ yield node
+ except Exception:
+ # Skip files that fail to parse
+ continue
+
+ @property
+ def node_count(self) -> int:
+ """
+ Count nodes without loading them.
+
+ Efficient count by globbing files without parsing HTML.
+
+ Returns:
+ Number of nodes in the graph
+
+ Example:
+ >>> graph = HtmlGraph("features/")
+ >>> print(f"Graph has {graph.node_count} nodes")
+ Graph has 42 nodes
+ """
+ return len(self._get_node_files())
+
+ # =========================================================================
+
+ # =========================================================================
+ # Transaction & Snapshot Support
+ # =========================================================================
+
+ def snapshot(self) -> GraphSnapshot:
+ """
+ Create an immutable snapshot of the current graph state.
+
+ The snapshot is a frozen copy that won't be affected by subsequent
+ changes to the graph. Useful for:
+ - Concurrent read operations
+ - Comparing graph state before/after changes
+ - Safe multi-agent scenarios
+
+ Returns:
+ GraphSnapshot: Immutable view of current graph state
+
+ Example:
+ # Agent 1 takes snapshot
+ snapshot = graph.snapshot()
+
+ # Agent 2 modifies graph
+ graph.update(node)
+
+ # Agent 1's snapshot is unchanged
+ old_node = snapshot.get("feature-001")
+ """
+ self._ensure_loaded()
+ return GraphSnapshot(self._nodes, self.directory)
+
+ @contextmanager
+ def transaction(self) -> Iterator[Any]:
+ """
+ Context manager for atomic multi-operation transactions.
+
+ Operations performed within the transaction are batched and applied
+ atomically. If any exception occurs, no changes are persisted.
+
+ Yields:
+ TransactionContext: Context for collecting operations
+
+ Raises:
+ Exception: Any exception from operations causes rollback
+
+ Example:
+ # All-or-nothing batch update
+ with graph.transaction() as tx:
+ tx.add(node1)
+ tx.update(node2)
+ tx.delete("feature-003")
+ # All changes persisted atomically
+
+ # Failed transaction (rollback)
+ try:
+ with graph.transaction() as tx:
+ tx.add(node1)
+ tx.update(invalid_node) # Raises error
+ except Exception:
+ pass # No changes persisted
+ """
+ # Create snapshot before transaction
+ snapshot_nodes = {
+ node_id: node.model_copy(deep=True) for node_id, node in self._nodes.items()
+ }
+ snapshot_file_hashes = self._file_hashes.copy()
+
+ # Transaction context for collecting operations
+ class TransactionContext:
+ def __init__(self, graph: "HtmlGraph"):
+ self._graph = graph
+ self._operations: list[Callable[[], Any]] = []
+
+ def add(self, node: Node, overwrite: bool = False) -> "TransactionContext":
+ """Queue an add operation."""
+ self._operations.append(
+ lambda: self._graph.add(node, overwrite=overwrite)
+ )
+ return self
+
+ def update(self, node: Node) -> "TransactionContext":
+ """Queue an update operation."""
+ self._operations.append(lambda: self._graph.update(node))
+ return self
+
+ def delete(self, node_id: str) -> "TransactionContext":
+ """Queue a delete operation."""
+ self._operations.append(lambda: self._graph.delete(node_id))
+ return self
+
+ def remove(self, node_id: str) -> "TransactionContext":
+ """Queue a remove operation (alias for delete)."""
+ return self.delete(node_id)
+
+ def _commit(self) -> None:
+ """Execute all queued operations."""
+ for operation in self._operations:
+ operation()
+
+ tx = TransactionContext(self)
+
+ try:
+ yield tx
+ # Commit all operations if no exceptions
+ tx._commit()
+ except Exception:
+ # Rollback: restore snapshot state
+ self._nodes = snapshot_nodes
+ self._file_hashes = snapshot_file_hashes
+ self._invalidate_cache()
+
+ # Rebuild indexes from restored state
+ self._edge_index.rebuild(self._nodes)
+ self._attr_index.rebuild(self._nodes)
+
+ # Re-raise exception
+ raise
+
  # CRUD Operations
  # =========================================================================

@@ -117,18 +676,28 @@ class HtmlGraph:
  if node.id in self._nodes and not overwrite:
  raise ValueError(f"Node already exists: {node.id}")

- # If overwriting, remove old edges from index first
+ # If overwriting, remove old node from indexes first
  if overwrite and node.id in self._nodes:
+ old_node = self._nodes[node.id]
  self._edge_index.remove_node(node.id)
+ self._attr_index.remove_node(node.id, old_node)

  filepath = self._converter.save(node)
  self._nodes[node.id] = node

+ # Update file hash
+ file_hash = self._compute_file_hash(filepath)
+ self._file_hashes[str(filepath)] = file_hash
+
  # Add new edges to index
  for relationship, edges in node.edges.items():
  for edge in edges:
  self._edge_index.add(node.id, edge.target_id, edge.relationship)

+ # Add node to attribute index
+ self._attr_index.add_node(node.id, node)
+
+ self._invalidate_cache()
  return filepath

  def update(self, node: Node) -> Path:
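The transaction() context manager added a little earlier in this diff queues add/update/delete calls and applies them only when the with-block exits without an exception; on failure the in-memory nodes, file hashes, and both indexes are restored from the pre-transaction snapshot. A sketch of the intended call pattern, illustrative only; node_a and node_b are placeholder Node instances.

    try:
        with graph.transaction() as tx:
            tx.add(node_a).update(node_b)  # operations are queued, not applied yet
            tx.delete("feature-003")
        # leaving the block cleanly commits the queued operations in order
    except Exception:
        # any error rolls the in-memory graph state back; nothing is committed
        pass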
@@ -142,10 +711,10 @@ class HtmlGraph:
  Path to updated HTML file

  Raises:
- KeyError: If node doesn't exist
+ NodeNotFoundError: If node doesn't exist
  """
  if node.id not in self._nodes:
- raise KeyError(f"Node not found: {node.id}")
+ raise NodeNotFoundError(node.type, node.id)

  # Get current outgoing edges from the edge index (source of truth)
  # This handles the case where node and self._nodes[node.id] are the same object
@@ -154,15 +723,27 @@ class HtmlGraph:
  # Remove all old OUTGOING edges (where this node is source)
  # DO NOT use remove_node() as it removes incoming edges too!
  for edge_ref in old_outgoing:
- self._edge_index.remove(edge_ref.source_id, edge_ref.target_id, edge_ref.relationship)
+ self._edge_index.remove(
+ edge_ref.source_id, edge_ref.target_id, edge_ref.relationship
+ )

  # Add new OUTGOING edges (where this node is source)
  for relationship, edges in node.edges.items():
  for edge in edges:
  self._edge_index.add(node.id, edge.target_id, edge.relationship)

+ # Update attribute index
+ old_node = self._nodes[node.id]
+ self._attr_index.update_node(node.id, old_node, node)
+
  filepath = self._converter.save(node)
  self._nodes[node.id] = node
+
+ # Update file hash
+ file_hash = self._compute_file_hash(filepath)
+ self._file_hashes[str(filepath)] = file_hash
+
+ self._invalidate_cache()
  return filepath

  def get(self, node_id: str) -> Node | None:
@@ -175,6 +756,7 @@ class HtmlGraph:
  Returns:
  Node instance or None if not found
  """
+ self._ensure_loaded()
  return self._nodes.get(node_id)

  def get_or_load(self, node_id: str) -> Node | None:
@@ -189,8 +771,104 @@ class HtmlGraph:
189
771
  node = self._converter.load(node_id)
190
772
  if node:
191
773
  self._nodes[node_id] = node
774
+ reload_count: int = int(self._metrics.get("single_reload_count", 0)) # type: ignore[call-overload]
775
+ self._metrics["single_reload_count"] = reload_count + 1
192
776
  return node
193
777
 
778
+ def reload_node(self, node_id: str) -> Node | None:
779
+ """
780
+ Reload a single node from disk without full graph reload.
781
+
782
+ Much faster than full reload() when only one node changed.
783
+ Updates the node in cache and refreshes its edges in the index.
784
+ Uses file hash to skip reload if content hasn't changed.
785
+
786
+ Args:
787
+ node_id: ID of the node to reload
788
+
789
+ Returns:
790
+ Updated node if found and loaded, None if not found
791
+
792
+ Example:
793
+ >>> graph.reload_node("feat-001") # Reload just this node
794
+ """
795
+ # Verify the node file exists
796
+ filepath = self._find_node_file(node_id)
797
+ if not filepath:
798
+ return None
799
+
800
+ # Check if file has actually changed
801
+ if not self.has_file_changed(filepath):
802
+ # File unchanged, return cached node if available
803
+ return self._nodes.get(node_id)
804
+
805
+ try:
806
+ # Remove old node's edges from index if exists
807
+ if node_id in self._nodes:
808
+ old_node = self._nodes[node_id]
809
+ self._edge_index.remove_node_edges(node_id, old_node)
810
+
811
+ # Load updated node from disk (converter.load expects node_id)
812
+ updated_node = self._converter.load(node_id)
813
+ if not updated_node:
814
+ return None
815
+
816
+ # Update cache
817
+ self._nodes[node_id] = updated_node
818
+
819
+ # Update file hash
820
+ file_hash = self._compute_file_hash(filepath)
821
+ self._file_hashes[str(filepath)] = file_hash
822
+
823
+ # Add new edges to index
824
+ self._edge_index.add_node_edges(node_id, updated_node)
825
+
826
+ # Invalidate query cache
827
+ self._invalidate_cache()
828
+
829
+ # Track metric
830
+ reload_count: int = int(self._metrics.get("single_reload_count", 0)) # type: ignore[call-overload]
831
+ self._metrics["single_reload_count"] = reload_count + 1
832
+
833
+ return updated_node
834
+ except Exception:
835
+ return None
836
+
837
+ def _find_node_file(self, node_id: str) -> Path | None:
838
+ """
839
+ Find the file path for a node by ID.
840
+
841
+ Checks common naming patterns for node files.
842
+
843
+ Args:
844
+ node_id: Node ID to find
845
+
846
+ Returns:
847
+ Path to node file, or None if not found
848
+ """
849
+ # Try direct match patterns
850
+ patterns = [
851
+ f"{node_id}.html",
852
+ f"{node_id}/index.html",
853
+ ]
854
+
855
+ for pattern in patterns:
856
+ filepath = self.directory / pattern
857
+ if filepath.exists():
858
+ return filepath
859
+
860
+ # Fall back to scanning (slower but thorough)
861
+ for filepath in self.directory.glob("*.html"):
862
+ try:
863
+ # Quick check of file content for ID
864
+ content = filepath.read_text()
865
+ if f'id="{node_id}"' in content or f"id='{node_id}'" in content:
866
+ return filepath
867
+ except Exception:
868
+ continue
869
+
870
+ return None
871
+
194
872
  def remove(self, node_id: str) -> bool:
195
873
  """
196
874
  Remove a node from the graph.
@@ -202,10 +880,19 @@ class HtmlGraph:
  True if node was removed
  """
  if node_id in self._nodes:
- # Remove all edges involving this node from index
+ # Find and remove file hash
+ filepath = self._find_node_file(node_id)
+ if filepath:
+ self._file_hashes.pop(str(filepath), None)
+
+ # Remove node from indexes
+ old_node = self._nodes[node_id]
  self._edge_index.remove_node(node_id)
+ self._attr_index.remove_node(node_id, old_node)
  del self._nodes[node_id]
- return self._converter.delete(node_id)
+ result = self._converter.delete(node_id)
+ self._invalidate_cache()
+ return result
  return False

  def delete(self, node_id: str) -> bool:
@@ -248,9 +935,10 @@ class HtmlGraph:

  def query(self, selector: str) -> list[Node]:
  """
- Query nodes using CSS selector.
+ Query nodes using CSS selector with caching and metrics.

  Selector is applied to article element of each node.
+ Uses cached nodes instead of re-parsing from disk for better performance.

  Args:
  selector: CSS selector string
@@ -262,21 +950,53 @@ class HtmlGraph:
262
950
  graph.query("[data-status='blocked']")
263
951
  graph.query("[data-priority='high'][data-type='feature']")
264
952
  """
953
+ self._ensure_loaded()
954
+ query_count: int = int(self._metrics.get("query_count", 0)) # type: ignore[call-overload]
955
+ self._metrics["query_count"] = query_count + 1
956
+
957
+ # Check cache first
958
+ if self._cache_enabled and selector in self._query_cache:
959
+ cache_hits: int = int(self._metrics.get("cache_hits", 0)) # type: ignore[call-overload]
960
+ self._metrics["cache_hits"] = cache_hits + 1
961
+ return self._query_cache[selector].copy() # Return copy to prevent mutation
962
+
963
+ cache_misses: int = int(self._metrics.get("cache_misses", 0)) # type: ignore[call-overload]
964
+ self._metrics["cache_misses"] = cache_misses + 1
965
+
966
+ # Time the query
967
+ start = time.perf_counter()
968
+
969
+ # Perform query using cached nodes instead of disk I/O
265
970
  matching = []
266
971
 
267
- patterns = [self.pattern] if isinstance(self.pattern, str) else self.pattern
268
- for pat in patterns:
269
- for filepath in self.directory.glob(pat):
270
- if filepath.is_file():
271
- try:
272
- parser = HtmlParser.from_file(filepath)
273
- # Query for article matching selector
274
- if parser.query(f"article{selector}"):
275
- node_id = parser.get_node_id()
276
- if node_id and node_id in self._nodes:
277
- matching.append(self._nodes[node_id])
278
- except Exception:
279
- continue
972
+ for node in self._nodes.values():
973
+ try:
974
+ # Convert node to HTML in-memory
975
+ html_content = node.to_html()
976
+
977
+ # Parse the HTML string
978
+ parser = HtmlParser.from_string(html_content)
979
+
980
+ # Check if selector matches
981
+ if parser.query(f"article{selector}"):
982
+ matching.append(node)
983
+ except Exception:
984
+ # Skip nodes that fail to parse
985
+ continue
986
+
987
+ # Track timing
988
+ elapsed_ms = (time.perf_counter() - start) * 1000
989
+ total_time: float = cast(float, self._metrics.get("total_query_time_ms", 0.0))
990
+ self._metrics["total_query_time_ms"] = total_time + elapsed_ms
991
+
992
+ slowest: float = cast(float, self._metrics.get("slowest_query_ms", 0.0))
993
+ if elapsed_ms > slowest:
994
+ self._metrics["slowest_query_ms"] = elapsed_ms
995
+ self._metrics["slowest_query_selector"] = selector
996
+
997
+ # Cache result
998
+ if self._cache_enabled:
999
+ self._query_cache[selector] = matching.copy()
280
1000
 
281
1001
  return matching
282
1002
 
@@ -285,6 +1005,99 @@ class HtmlGraph:
285
1005
  results = self.query(selector)
286
1006
  return results[0] if results else None
287
1007
 
1008
+ def compile_query(self, selector: str) -> CompiledQuery:
1009
+ """
1010
+ Pre-compile a CSS selector for reuse.
1011
+
1012
+ Creates a CompiledQuery object that can be reused multiple times
1013
+ with query_compiled() for better performance when the same selector
1014
+ is used frequently.
1015
+
1016
+ Args:
1017
+ selector: CSS selector string to compile
1018
+
1019
+ Returns:
1020
+ CompiledQuery object that can be reused
1021
+
1022
+ Example:
1023
+ >>> graph = HtmlGraph("features/")
1024
+ >>> compiled = graph.compile_query("[data-status='blocked']")
1025
+ >>> results1 = graph.query_compiled(compiled)
1026
+ >>> results2 = graph.query_compiled(compiled) # Reuses compilation
1027
+ """
1028
+ # Check if already compiled
1029
+ if selector in self._compiled_queries:
1030
+ hits: int = int(self._metrics.get("compiled_query_hits", 0)) # type: ignore[call-overload]
1031
+ self._metrics["compiled_query_hits"] = hits + 1
1032
+ return self._compiled_queries[selector]
1033
+
1034
+ # Create new compiled query
1035
+ compiled = CompiledQuery(selector=selector)
1036
+ compiled_count: int = int(self._metrics.get("compiled_queries", 0)) # type: ignore[call-overload]
1037
+ self._metrics["compiled_queries"] = compiled_count + 1
1038
+
1039
+ # Add to cache (with LRU eviction if needed)
1040
+ if len(self._compiled_queries) >= self._compiled_query_max_size:
1041
+ # Evict least recently used (first item in dict)
1042
+ first_key = next(iter(self._compiled_queries))
1043
+ del self._compiled_queries[first_key]
1044
+
1045
+ self._compiled_queries[selector] = compiled
1046
+ return compiled
1047
+
1048
+ def query_compiled(self, compiled: CompiledQuery) -> list[Node]:
1049
+ """
1050
+ Execute a pre-compiled query.
1051
+
1052
+ Uses the regular query cache if available, otherwise executes
1053
+ the compiled query and caches the result.
1054
+
1055
+ Args:
1056
+ compiled: CompiledQuery object from compile_query()
1057
+
1058
+ Returns:
1059
+ List of matching nodes
1060
+
1061
+ Example:
1062
+ >>> compiled = graph.compile_query("[data-priority='high']")
1063
+ >>> high_priority = graph.query_compiled(compiled)
1064
+ """
1065
+ self._ensure_loaded()
1066
+ selector = compiled.selector
1067
+ query_count: int = int(self._metrics.get("query_count", 0)) # type: ignore[call-overload]
1068
+ self._metrics["query_count"] = query_count + 1
1069
+
1070
+ # Check cache first (same cache as regular query())
1071
+ if self._cache_enabled and selector in self._query_cache:
1072
+ cache_hits: int = int(self._metrics.get("cache_hits", 0)) # type: ignore[call-overload]
1073
+ self._metrics["cache_hits"] = cache_hits + 1
1074
+ return self._query_cache[selector].copy()
1075
+
1076
+ cache_misses: int = int(self._metrics.get("cache_misses", 0)) # type: ignore[call-overload]
1077
+ self._metrics["cache_misses"] = cache_misses + 1
1078
+
1079
+ # Time the query
1080
+ start = time.perf_counter()
1081
+
1082
+ # Execute compiled query
1083
+ matching = compiled.execute(self._nodes)
1084
+
1085
+ # Track timing
1086
+ elapsed_ms = (time.perf_counter() - start) * 1000
1087
+ total_time: float = cast(float, self._metrics.get("total_query_time_ms", 0.0))
1088
+ self._metrics["total_query_time_ms"] = total_time + elapsed_ms
1089
+
1090
+ slowest: float = cast(float, self._metrics.get("slowest_query_ms", 0.0))
1091
+ if elapsed_ms > slowest:
1092
+ self._metrics["slowest_query_ms"] = elapsed_ms
1093
+ self._metrics["slowest_query_selector"] = selector
1094
+
1095
+ # Cache result
1096
+ if self._cache_enabled:
1097
+ self._query_cache[selector] = matching.copy()
1098
+
1099
+ return matching
1100
+
288
1101
  def filter(self, predicate: Callable[[Node], bool]) -> list[Node]:
289
1102
  """
290
1103
  Filter nodes using a Python predicate function.
@@ -298,19 +1111,104 @@ class HtmlGraph:
298
1111
  Example:
299
1112
  graph.filter(lambda n: n.status == "todo" and n.priority == "high")
300
1113
  """
1114
+ self._ensure_loaded()
301
1115
  return [node for node in self._nodes.values() if predicate(node)]
302
1116
 
303
1117
  def by_status(self, status: str) -> list[Node]:
304
- """Get all nodes with given status."""
305
- return self.filter(lambda n: n.status == status)
1118
+ """
1119
+ Get all nodes with given status (O(1) lookup via attribute index).
1120
+
1121
+ Uses the attribute index for efficient lookups instead of
1122
+ filtering all nodes.
1123
+
1124
+ Args:
1125
+ status: Status value to filter by
1126
+
1127
+ Returns:
1128
+ List of nodes with the given status
1129
+ """
1130
+ self._ensure_loaded()
1131
+ self._attr_index.ensure_built(self._nodes)
1132
+ node_ids = self._attr_index.get_by_status(status)
1133
+ return [self._nodes[node_id] for node_id in node_ids if node_id in self._nodes]
306
1134
 
307
1135
  def by_type(self, node_type: str) -> list[Node]:
308
- """Get all nodes with given type."""
309
- return self.filter(lambda n: n.type == node_type)
1136
+ """
1137
+ Get all nodes with given type (O(1) lookup via attribute index).
1138
+
1139
+ Uses the attribute index for efficient lookups instead of
1140
+ filtering all nodes.
1141
+
1142
+ Args:
1143
+ node_type: Node type to filter by
1144
+
1145
+ Returns:
1146
+ List of nodes with the given type
1147
+ """
1148
+ self._ensure_loaded()
1149
+ self._attr_index.ensure_built(self._nodes)
1150
+ node_ids = self._attr_index.get_by_type(node_type)
1151
+ return [self._nodes[node_id] for node_id in node_ids if node_id in self._nodes]
310
1152
 
311
1153
  def by_priority(self, priority: str) -> list[Node]:
312
- """Get all nodes with given priority."""
313
- return self.filter(lambda n: n.priority == priority)
1154
+ """
1155
+ Get all nodes with given priority (O(1) lookup via attribute index).
1156
+
1157
+ Uses the attribute index for efficient lookups instead of
1158
+ filtering all nodes.
1159
+
1160
+ Args:
1161
+ priority: Priority value to filter by
1162
+
1163
+ Returns:
1164
+ List of nodes with the given priority
1165
+ """
1166
+ self._ensure_loaded()
1167
+ self._attr_index.ensure_built(self._nodes)
1168
+ node_ids = self._attr_index.get_by_priority(priority)
1169
+ return [self._nodes[node_id] for node_id in node_ids if node_id in self._nodes]
1170
+
1171
+ def get_by_status(self, status: str) -> list[Node]:
1172
+ """
1173
+ Get all nodes with given status (O(1) lookup via attribute index).
1174
+
1175
+ Alias for by_status() with explicit name for clarity.
1176
+
1177
+ Args:
1178
+ status: Status value to filter by
1179
+
1180
+ Returns:
1181
+ List of nodes with the given status
1182
+ """
1183
+ return self.by_status(status)
1184
+
1185
+ def get_by_type(self, node_type: str) -> list[Node]:
1186
+ """
1187
+ Get all nodes with given type (O(1) lookup via attribute index).
1188
+
1189
+ Alias for by_type() with explicit name for clarity.
1190
+
1191
+ Args:
1192
+ node_type: Node type to filter by
1193
+
1194
+ Returns:
1195
+ List of nodes with the given type
1196
+ """
1197
+ return self.by_type(node_type)
1198
+
1199
+ def get_by_priority(self, priority: str) -> list[Node]:
1200
+ """
1201
+ Get all nodes with given priority (O(1) lookup via attribute index).
1202
+
1203
+ Alias for by_priority() with explicit name for clarity.
1204
+
1205
+ Args:
1206
+ priority: Priority value to filter by
1207
+
1208
+ Returns:
1209
+ List of nodes with the given priority
1210
+ """
1211
+ return self.by_priority(priority)
314
1212
 
315
1213
  def query_builder(self) -> QueryBuilder:
316
1214
  """
@@ -348,7 +1246,7 @@ class HtmlGraph:
  """
  return QueryBuilder(_graph=self)

- def find(self, type: str | None = None, **kwargs) -> Node | None:
+ def find(self, type: str | None = None, **kwargs: Any) -> Node | None:
  """
  Find the first node matching the given criteria.

@@ -374,7 +1272,9 @@ class HtmlGraph:
  """
  return FindAPI(self).find(type=type, **kwargs)

- def find_all(self, type: str | None = None, limit: int | None = None, **kwargs) -> list[Node]:
+ def find_all(
+ self, type: str | None = None, limit: int | None = None, **kwargs: Any
+ ) -> list[Node]:
  """
  Find all nodes matching the given criteria.

@@ -405,10 +1305,7 @@ class HtmlGraph:
  return FindAPI(self).find_all(type=type, limit=limit, **kwargs)

  def find_related(
- self,
- node_id: str,
- relationship: str | None = None,
- direction: str = "outgoing"
+ self, node_id: str, relationship: str | None = None, direction: str = "outgoing"
  ) -> list[Node]:
  """
  Find nodes related to a given node.
@@ -428,9 +1325,7 @@ class HtmlGraph:
  # =========================================================================

  def get_incoming_edges(
- self,
- node_id: str,
- relationship: str | None = None
+ self, node_id: str, relationship: str | None = None
  ) -> list[EdgeRef]:
  """
  Get all edges pointing TO a node (O(1) lookup).
@@ -455,9 +1350,7 @@ class HtmlGraph:
  return self._edge_index.get_incoming(node_id, relationship)

  def get_outgoing_edges(
- self,
- node_id: str,
- relationship: str | None = None
+ self, node_id: str, relationship: str | None = None
  ) -> list[EdgeRef]:
  """
  Get all edges pointing FROM a node (O(1) lookup).
@@ -472,10 +1365,7 @@ class HtmlGraph:
         return self._edge_index.get_outgoing(node_id, relationship)
 
     def get_neighbors(
-        self,
-        node_id: str,
-        relationship: str | None = None,
-        direction: str = "both"
+        self, node_id: str, relationship: str | None = None, direction: str = "both"
     ) -> set[str]:
         """
         Get all neighboring node IDs connected to a node (O(1) lookup).
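The three edge accessors above are thin wrappers over `self._edge_index`, so each call is an O(1) index lookup rather than a scan. An illustrative traversal (the node ID and relationship name are placeholders):

```python
# "feature-001" and "blocked_by" are placeholders, not guaranteed to exist in your graph.
node_id = "feature-001"
incoming = graph.get_incoming_edges(node_id, relationship="blocked_by")   # list[EdgeRef]
outgoing = graph.get_outgoing_edges(node_id, relationship="blocked_by")   # list[EdgeRef]
neighbors = graph.get_neighbors(node_id, direction="both")                # set[str]
print(f"{node_id}: {len(incoming)} in, {len(outgoing)} out, {len(neighbors)} neighbors")
```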
@@ -495,10 +1385,119 @@ class HtmlGraph:
         """Access the edge index for advanced queries."""
         return self._edge_index
 
+    @property
+    def attribute_index(self) -> AttributeIndex:
+        """
+        Access the attribute index for advanced queries.
+
+        The attribute index is lazy-built on first access.
+
+        Returns:
+            AttributeIndex instance
+
+        Example:
+            >>> stats = graph.attribute_index.stats()
+            >>> print(stats)
+        """
+        self._ensure_loaded()
+        self._attr_index.ensure_built(self._nodes)
+        return self._attr_index
+
+    @property
+    def cache_stats(self) -> dict:
+        """Get cache statistics."""
+        return {
+            "cached_queries": len(self._query_cache),
+            "cache_enabled": self._cache_enabled,
+        }
+
+    @property
+    def metrics(self) -> dict:
+        """
+        Get performance metrics.
+
+        Returns:
+            Dict with query counts, cache stats, timing info
+
+        Example:
+            >>> graph.metrics
+            {
+                'query_count': 42,
+                'cache_hits': 38,
+                'cache_hit_rate': '90.5%',
+                'avg_query_time_ms': 12.3,
+                ...
+            }
+        """
+        m = self._metrics.copy()
+
+        # Calculate derived metrics
+        query_count = cast(int, m["query_count"])
+        if query_count > 0:
+            cache_hits = cast(int, m["cache_hits"])
+            total_query_time_ms = cast(float, m["total_query_time_ms"])
+            m["cache_hit_rate"] = f"{cache_hits / query_count * 100:.1f}%"
+            m["avg_query_time_ms"] = total_query_time_ms / query_count
+        else:
+            m["cache_hit_rate"] = "N/A"
+            m["avg_query_time_ms"] = 0.0
+
+        # Add current state
+        m["nodes_loaded"] = len(self._nodes)
+        m["cached_queries"] = len(self._query_cache)
+        m["compiled_queries_cached"] = len(self._compiled_queries)
+
+        # Calculate compilation hit rate
+        compiled_queries = cast(int, m["compiled_queries"])
+        compiled_query_hits = cast(int, m["compiled_query_hits"])
+        total_compilations = compiled_queries + compiled_query_hits
+        if total_compilations > 0:
+            m["compilation_hit_rate"] = (
+                f"{compiled_query_hits / total_compilations * 100:.1f}%"
+            )
+        else:
+            m["compilation_hit_rate"] = "N/A"
+
+        return m
+
+    def reset_metrics(self) -> None:
+        """Reset all performance metrics to zero."""
+        for key in self._metrics:
+            if isinstance(self._metrics[key], (int, float)):
+                self._metrics[key] = 0 if isinstance(self._metrics[key], int) else 0.0
+            else:
+                self._metrics[key] = ""
+
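Together, `attribute_index`, `cache_stats`, `metrics`, and `reset_metrics()` form the new observability surface; only the reset mutates state. A read-only inspection sketch, assuming `graph` already exists (which operations bump the underlying counters is not shown in this hunk):

```python
m = graph.metrics
print(m["query_count"], m["cache_hit_rate"], m["avg_query_time_ms"])
print(graph.cache_stats)               # {'cached_queries': ..., 'cache_enabled': ...}
print(graph.attribute_index.stats())   # per the docstring example above
graph.reset_metrics()                  # zero the counters before a measurement run
```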
     # =========================================================================
     # Graph Algorithms
     # =========================================================================
 
+    def _get_adjacency_cache(self) -> dict[str, dict[str, list[str]]]:
+        """
+        Get or build the persistent adjacency cache.
+
+        Builds the cache on first access and returns it on subsequent calls.
+        Cache structure: {node_id: {"outgoing": [ids], "incoming": [ids]}}
+
+        Returns:
+            Dict mapping node_id to dict with "outgoing" and "incoming" neighbor lists
+        """
+        if self._adjacency_cache is None:
+            self._adjacency_cache = {}
+            for node_id in self._nodes:
+                # Use edge index for efficient O(1) lookups
+                outgoing = self._edge_index.get_neighbors(
+                    node_id, relationship=None, direction="outgoing"
+                )
+                incoming = self._edge_index.get_neighbors(
+                    node_id, relationship=None, direction="incoming"
+                )
+                self._adjacency_cache[node_id] = {
+                    "outgoing": list(outgoing),
+                    "incoming": list(incoming),
+                }
+        return self._adjacency_cache
+
     def _build_adjacency(self, relationship: str | None = None) -> dict[str, set[str]]:
         """
         Build adjacency list from edges.
@@ -521,10 +1520,7 @@ class HtmlGraph:
         return adj
 
     def shortest_path(
-        self,
-        from_id: str,
-        to_id: str,
-        relationship: str | None = None
+        self, from_id: str, to_id: str, relationship: str | None = None
     ) -> list[str] | None:
         """
         Find shortest path between two nodes using BFS.
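Only the signature is reflowed here; `shortest_path()` is still a BFS over the adjacency structure and returns `None` when no path exists. An illustrative call (node IDs are placeholders):

```python
path = graph.shortest_path("feature-001", "epic-010", relationship="blocked_by")
print(" -> ".join(path) if path else "no dependency path between the two nodes")
```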
@@ -563,9 +1559,7 @@ class HtmlGraph:
         return None
 
     def transitive_deps(
-        self,
-        node_id: str,
-        relationship: str = "blocked_by"
+        self, node_id: str, relationship: str = "blocked_by"
     ) -> set[str]:
         """
         Get all transitive dependencies of a node.
@@ -600,11 +1594,7 @@ class HtmlGraph:
 
         return deps
 
-    def dependents(
-        self,
-        node_id: str,
-        relationship: str = "blocked_by"
-    ) -> set[str]:
+    def dependents(self, node_id: str, relationship: str = "blocked_by") -> set[str]:
         """
         Find all nodes that depend on this node (O(1) lookup).
 
@@ -621,7 +1611,9 @@ class HtmlGraph:
         incoming = self._edge_index.get_incoming(node_id, relationship)
         return {ref.source_id for ref in incoming}
 
-    def find_bottlenecks(self, relationship: str = "blocked_by", top_n: int = 5) -> list[tuple[str, int]]:
+    def find_bottlenecks(
+        self, relationship: str = "blocked_by", top_n: int = 5
+    ) -> list[tuple[str, int]]:
         """
         Find nodes that block the most other nodes.
 
@@ -639,9 +1631,7 @@ class HtmlGraph:
                 blocked_count[edge.target_id] += 1
 
         sorted_bottlenecks = sorted(
-            blocked_count.items(),
-            key=lambda x: x[1],
-            reverse=True
+            blocked_count.items(), key=lambda x: x[1], reverse=True
        )
 
         return sorted_bottlenecks[:top_n]
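`transitive_deps()`, `dependents()`, and `find_bottlenecks()` compose into a small dependency-analysis toolkit over the default `blocked_by` relationship. A hedged sketch (the node ID is a placeholder):

```python
deps = graph.transitive_deps("feature-001")   # everything this node transitively waits on
blocked = graph.dependents("feature-001")     # everything waiting on this node
for node_id, count in graph.find_bottlenecks(top_n=3):
    print(f"{node_id} blocks {count} other nodes")
print(len(deps), len(blocked))
```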
@@ -725,7 +1715,7 @@ class HtmlGraph:
         self,
         node_id: str,
         relationship: str = "blocked_by",
-        max_depth: int | None = None
+        max_depth: int | None = None,
     ) -> list[str]:
         """
         Get all ancestor nodes (nodes that this node depends on).
@@ -773,7 +1763,7 @@ class HtmlGraph:
         self,
         node_id: str,
         relationship: str = "blocked_by",
-        max_depth: int | None = None
+        max_depth: int | None = None,
     ) -> list[str]:
         """
         Get all descendant nodes (nodes that depend on this node).
@@ -814,10 +1804,8 @@ class HtmlGraph:
         return descendants
 
     def subgraph(
-        self,
-        node_ids: list[str] | set[str],
-        include_edges: bool = True
-    ) -> 'HtmlGraph':
+        self, node_ids: list[str] | set[str], include_edges: bool = True
+    ) -> "HtmlGraph":
         """
         Extract a subgraph containing only the specified nodes.
 
@@ -835,7 +1823,6 @@ class HtmlGraph:
             sub = graph.subgraph(deps)
         """
         import tempfile
-        from htmlgraph.models import Edge
 
         # Create new graph in temp directory
         temp_dir = tempfile.mkdtemp(prefix="htmlgraph_subgraph_")
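Besides the reflowed signature and the dropped unused `Edge` import, `subgraph()` still materialises the selection into a temporary directory. A sketch that combines it with `transitive_deps()`, extending the docstring's own `graph.subgraph(deps)` example (the node ID is a placeholder):

```python
deps = graph.transitive_deps("feature-001")
sub = graph.subgraph(deps | {"feature-001"}, include_edges=True)
print(sub.stats()["total"], "nodes in the extracted subgraph")
```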
@@ -865,9 +1852,7 @@ class HtmlGraph:
         return subgraph
 
     def connected_component(
-        self,
-        node_id: str,
-        relationship: str | None = None
+        self, node_id: str, relationship: str | None = None
     ) -> set[str]:
         """
         Get all nodes in the same connected component as the given node.
@@ -907,19 +1892,30 @@ class HtmlGraph:
         from_id: str,
         to_id: str,
         relationship: str | None = None,
-        max_length: int | None = None
+        max_length: int | None = None,
+        max_paths: int = 100,
+        timeout_seconds: float = 5.0,
     ) -> list[list[str]]:
         """
         Find all paths between two nodes.
 
+        WARNING: This method has O(V!) worst-case complexity in dense graphs.
+        Use max_paths and timeout_seconds parameters to limit execution.
+        For most use cases, prefer shortest_path() instead.
+
         Args:
-            from_id: Starting node ID
+            from_id: Source node ID
             to_id: Target node ID
-            relationship: Optional filter to specific edge type
-            max_length: Maximum path length (None = unlimited, but recommended)
+            relationship: Optional edge type filter
+            max_length: Maximum path length
+            max_paths: Maximum number of paths to return (default 100)
+            timeout_seconds: Maximum execution time (default 5.0)
 
         Returns:
-            List of paths, each path is a list of node IDs
+            List of paths (each path is list of node IDs)
+
+        Raises:
+            TimeoutError: If execution exceeds timeout_seconds
         """
         if from_id not in self._nodes or to_id not in self._nodes:
             return []
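`all_paths()` now documents its exponential worst case and gains `max_paths` and `timeout_seconds` guards, raising `TimeoutError` instead of running unbounded. A hedged calling sketch (node IDs are placeholders; partial results are discarded when the timeout fires, per the Raises note above):

```python
try:
    paths = graph.all_paths(
        "feature-001", "epic-010",
        relationship="blocked_by",
        max_length=6, max_paths=50, timeout_seconds=2.0,
    )
    print(f"{len(paths)} paths found (capped at 50)")
except TimeoutError as exc:
    print(f"gave up: {exc}")
```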
@@ -929,8 +1925,20 @@ class HtmlGraph:
 
         paths: list[list[str]] = []
         adj = self._build_adjacency(relationship)
+        start_time = time.time()
+
+        def dfs(current: str, target: str, path: list[str], visited: set[str]) -> None:
+            # Check timeout periodically (every recursive call)
+            if time.time() - start_time > timeout_seconds:
+                raise TimeoutError(
+                    f"all_paths() exceeded timeout of {timeout_seconds}s "
+                    f"(found {len(paths)} paths so far)"
+                )
+
+            # Check if we've hit the max_paths limit
+            if len(paths) >= max_paths:
+                return
 
-        def dfs(current: str, target: str, path: list[str], visited: set[str]):
             if max_length and len(path) > max_length:
                 return
 
@@ -965,35 +1973,40 @@ class HtmlGraph:
             - completion_rate: Overall completion percentage
             - edge_count: Total number of edges
         """
-        stats = {
+        by_status: defaultdict[str, int] = defaultdict(int)
+        by_type: defaultdict[str, int] = defaultdict(int)
+        by_priority: defaultdict[str, int] = defaultdict(int)
+        edge_count = 0
+
+        stats: dict[str, Any] = {
             "total": len(self._nodes),
-            "by_status": defaultdict(int),
-            "by_type": defaultdict(int),
-            "by_priority": defaultdict(int),
-            "edge_count": 0,
+            "by_status": by_status,
+            "by_type": by_type,
+            "by_priority": by_priority,
+            "edge_count": edge_count,
         }
 
         done_count = 0
         for node in self._nodes.values():
-            stats["by_status"][node.status] += 1
-            stats["by_type"][node.type] += 1
-            stats["by_priority"][node.priority] += 1
+            by_status[node.status] += 1
+            by_type[node.type] += 1
+            by_priority[node.priority] += 1
 
             for edges in node.edges.values():
-                stats["edge_count"] += len(edges)
+                edge_count += len(edges)
 
             if node.status == "done":
                 done_count += 1
 
+        stats["edge_count"] = edge_count
         stats["completion_rate"] = (
-            round(done_count / len(self._nodes) * 100, 1)
-            if self._nodes else 0
+            round(done_count / len(self._nodes) * 100, 1) if self._nodes else 0
         )
 
         # Convert defaultdicts to regular dicts
-        stats["by_status"] = dict(stats["by_status"])
-        stats["by_type"] = dict(stats["by_type"])
-        stats["by_priority"] = dict(stats["by_priority"])
+        stats["by_status"] = dict(by_status)
+        stats["by_type"] = dict(by_type)
+        stats["by_priority"] = dict(by_priority)
 
         return stats
 
@@ -1009,7 +2022,9 @@ class HtmlGraph:
         """
         lines = ["# Graph Summary"]
         stats = self.stats()
-        lines.append(f"Total: {stats['total']} nodes | Done: {stats['completion_rate']}%")
+        lines.append(
+            f"Total: {stats['total']} nodes | Done: {stats['completion_rate']}%"
+        )
 
         # Status breakdown
         status_parts = [f"{s}: {c}" for s, c in stats["by_status"].items()]
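The `stats()` refactor swaps in local accumulators so the returned mapping holds plain dicts and an int rather than live `defaultdict`s; the report builder above is only reflowed. A consumption sketch using the keys documented in that hunk (the status names inside `by_status` depend on your data):

```python
stats = graph.stats()
print(f"{stats['total']} nodes, {stats['edge_count']} edges, "
      f"{stats['completion_rate']}% done")
for status, count in stats["by_status"].items():
    print(f"  {status}: {count}")
```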
@@ -1036,6 +2051,7 @@ class HtmlGraph:
     def to_json(self) -> list[dict[str, Any]]:
         """Export all nodes as JSON-serializable list."""
         from htmlgraph.converter import node_to_dict
+
         return [node_to_dict(node) for node in self._nodes.values()]
 
     def to_mermaid(self, relationship: str | None = None) -> str: