PyPI - codexa - Versions diffs - 0.4.0__py3-none-any.whl - Mend

codexa 0.4.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (189) hide show

codexa-0.4.0.dist-info/METADATA +650 -0
codexa-0.4.0.dist-info/RECORD +189 -0
codexa-0.4.0.dist-info/WHEEL +5 -0
codexa-0.4.0.dist-info/entry_points.txt +2 -0
codexa-0.4.0.dist-info/licenses/LICENSE +21 -0
codexa-0.4.0.dist-info/top_level.txt +1 -0
semantic_code_intelligence/__init__.py +5 -0
semantic_code_intelligence/analysis/__init__.py +21 -0
semantic_code_intelligence/analysis/ai_features.py +351 -0
semantic_code_intelligence/bridge/__init__.py +28 -0
semantic_code_intelligence/bridge/context_provider.py +245 -0
semantic_code_intelligence/bridge/protocol.py +167 -0
semantic_code_intelligence/bridge/server.py +348 -0
semantic_code_intelligence/bridge/vscode.py +271 -0
semantic_code_intelligence/ci/__init__.py +13 -0
semantic_code_intelligence/ci/hooks.py +98 -0
semantic_code_intelligence/ci/hotspots.py +272 -0
semantic_code_intelligence/ci/impact.py +246 -0
semantic_code_intelligence/ci/metrics.py +591 -0
semantic_code_intelligence/ci/pr.py +412 -0
semantic_code_intelligence/ci/quality.py +557 -0
semantic_code_intelligence/ci/templates.py +164 -0
semantic_code_intelligence/ci/trace.py +224 -0
semantic_code_intelligence/cli/__init__.py +0 -0
semantic_code_intelligence/cli/commands/__init__.py +0 -0
semantic_code_intelligence/cli/commands/ask_cmd.py +153 -0
semantic_code_intelligence/cli/commands/benchmark_cmd.py +303 -0
semantic_code_intelligence/cli/commands/chat_cmd.py +252 -0
semantic_code_intelligence/cli/commands/ci_gen_cmd.py +74 -0
semantic_code_intelligence/cli/commands/context_cmd.py +120 -0
semantic_code_intelligence/cli/commands/cross_refactor_cmd.py +113 -0
semantic_code_intelligence/cli/commands/deps_cmd.py +91 -0
semantic_code_intelligence/cli/commands/docs_cmd.py +101 -0
semantic_code_intelligence/cli/commands/doctor_cmd.py +147 -0
semantic_code_intelligence/cli/commands/evolve_cmd.py +171 -0
semantic_code_intelligence/cli/commands/explain_cmd.py +112 -0
semantic_code_intelligence/cli/commands/gate_cmd.py +135 -0
semantic_code_intelligence/cli/commands/grep_cmd.py +234 -0
semantic_code_intelligence/cli/commands/hotspots_cmd.py +119 -0
semantic_code_intelligence/cli/commands/impact_cmd.py +131 -0
semantic_code_intelligence/cli/commands/index_cmd.py +138 -0
semantic_code_intelligence/cli/commands/init_cmd.py +152 -0
semantic_code_intelligence/cli/commands/investigate_cmd.py +163 -0
semantic_code_intelligence/cli/commands/languages_cmd.py +101 -0
semantic_code_intelligence/cli/commands/lsp_cmd.py +49 -0
semantic_code_intelligence/cli/commands/mcp_cmd.py +50 -0
semantic_code_intelligence/cli/commands/metrics_cmd.py +264 -0
semantic_code_intelligence/cli/commands/models_cmd.py +157 -0
semantic_code_intelligence/cli/commands/plugin_cmd.py +275 -0
semantic_code_intelligence/cli/commands/pr_summary_cmd.py +178 -0
semantic_code_intelligence/cli/commands/quality_cmd.py +208 -0
semantic_code_intelligence/cli/commands/refactor_cmd.py +103 -0
semantic_code_intelligence/cli/commands/review_cmd.py +88 -0
semantic_code_intelligence/cli/commands/search_cmd.py +236 -0
semantic_code_intelligence/cli/commands/serve_cmd.py +117 -0
semantic_code_intelligence/cli/commands/suggest_cmd.py +100 -0
semantic_code_intelligence/cli/commands/summary_cmd.py +78 -0
semantic_code_intelligence/cli/commands/tool_cmd.py +282 -0
semantic_code_intelligence/cli/commands/trace_cmd.py +123 -0
semantic_code_intelligence/cli/commands/tui_cmd.py +58 -0
semantic_code_intelligence/cli/commands/viz_cmd.py +127 -0
semantic_code_intelligence/cli/commands/watch_cmd.py +72 -0
semantic_code_intelligence/cli/commands/web_cmd.py +61 -0
semantic_code_intelligence/cli/commands/workspace_cmd.py +250 -0
semantic_code_intelligence/cli/main.py +65 -0
semantic_code_intelligence/cli/router.py +92 -0
semantic_code_intelligence/config/__init__.py +0 -0
semantic_code_intelligence/config/settings.py +260 -0
semantic_code_intelligence/context/__init__.py +19 -0
semantic_code_intelligence/context/engine.py +429 -0
semantic_code_intelligence/context/memory.py +253 -0
semantic_code_intelligence/daemon/__init__.py +1 -0
semantic_code_intelligence/daemon/watcher.py +515 -0
semantic_code_intelligence/docs/__init__.py +1080 -0
semantic_code_intelligence/embeddings/__init__.py +0 -0
semantic_code_intelligence/embeddings/enhanced.py +131 -0
semantic_code_intelligence/embeddings/generator.py +149 -0
semantic_code_intelligence/embeddings/model_registry.py +100 -0
semantic_code_intelligence/evolution/__init__.py +1 -0
semantic_code_intelligence/evolution/budget_guard.py +111 -0
semantic_code_intelligence/evolution/commit_manager.py +88 -0
semantic_code_intelligence/evolution/context_builder.py +131 -0
semantic_code_intelligence/evolution/engine.py +249 -0
semantic_code_intelligence/evolution/patch_generator.py +229 -0
semantic_code_intelligence/evolution/task_selector.py +214 -0
semantic_code_intelligence/evolution/test_runner.py +111 -0
semantic_code_intelligence/indexing/__init__.py +0 -0
semantic_code_intelligence/indexing/chunker.py +174 -0
semantic_code_intelligence/indexing/parallel.py +86 -0
semantic_code_intelligence/indexing/scanner.py +146 -0
semantic_code_intelligence/indexing/semantic_chunker.py +337 -0
semantic_code_intelligence/llm/__init__.py +62 -0
semantic_code_intelligence/llm/cache.py +219 -0
semantic_code_intelligence/llm/cached_provider.py +145 -0
semantic_code_intelligence/llm/conversation.py +190 -0
semantic_code_intelligence/llm/cross_refactor.py +272 -0
semantic_code_intelligence/llm/investigation.py +274 -0
semantic_code_intelligence/llm/mock_provider.py +77 -0
semantic_code_intelligence/llm/ollama_provider.py +122 -0
semantic_code_intelligence/llm/openai_provider.py +100 -0
semantic_code_intelligence/llm/provider.py +92 -0
semantic_code_intelligence/llm/rate_limiter.py +164 -0
semantic_code_intelligence/llm/reasoning.py +438 -0
semantic_code_intelligence/llm/safety.py +110 -0
semantic_code_intelligence/llm/streaming.py +251 -0
semantic_code_intelligence/lsp/__init__.py +609 -0
semantic_code_intelligence/mcp/__init__.py +393 -0
semantic_code_intelligence/parsing/__init__.py +19 -0
semantic_code_intelligence/parsing/parser.py +375 -0
semantic_code_intelligence/plugins/__init__.py +255 -0
semantic_code_intelligence/plugins/examples/__init__.py +1 -0
semantic_code_intelligence/plugins/examples/code_quality.py +73 -0
semantic_code_intelligence/plugins/examples/search_annotator.py +56 -0
semantic_code_intelligence/scalability/__init__.py +205 -0
semantic_code_intelligence/search/__init__.py +0 -0
semantic_code_intelligence/search/formatter.py +123 -0
semantic_code_intelligence/search/grep.py +361 -0
semantic_code_intelligence/search/hybrid_search.py +170 -0
semantic_code_intelligence/search/keyword_search.py +311 -0
semantic_code_intelligence/search/section_expander.py +103 -0
semantic_code_intelligence/services/__init__.py +0 -0
semantic_code_intelligence/services/indexing_service.py +630 -0
semantic_code_intelligence/services/search_service.py +269 -0
semantic_code_intelligence/storage/__init__.py +0 -0
semantic_code_intelligence/storage/chunk_hash_store.py +86 -0
semantic_code_intelligence/storage/hash_store.py +66 -0
semantic_code_intelligence/storage/index_manifest.py +85 -0
semantic_code_intelligence/storage/index_stats.py +138 -0
semantic_code_intelligence/storage/query_history.py +160 -0
semantic_code_intelligence/storage/symbol_registry.py +209 -0
semantic_code_intelligence/storage/vector_store.py +297 -0
semantic_code_intelligence/tests/__init__.py +0 -0
semantic_code_intelligence/tests/test_ai_features.py +351 -0
semantic_code_intelligence/tests/test_chunker.py +119 -0
semantic_code_intelligence/tests/test_cli.py +188 -0
semantic_code_intelligence/tests/test_config.py +154 -0
semantic_code_intelligence/tests/test_context.py +381 -0
semantic_code_intelligence/tests/test_embeddings.py +73 -0
semantic_code_intelligence/tests/test_endtoend.py +1142 -0
semantic_code_intelligence/tests/test_enhanced_embeddings.py +92 -0
semantic_code_intelligence/tests/test_hash_store.py +79 -0
semantic_code_intelligence/tests/test_logging.py +55 -0
semantic_code_intelligence/tests/test_new_cli.py +138 -0
semantic_code_intelligence/tests/test_parser.py +495 -0
semantic_code_intelligence/tests/test_phase10.py +355 -0
semantic_code_intelligence/tests/test_phase11.py +593 -0
semantic_code_intelligence/tests/test_phase12.py +375 -0
semantic_code_intelligence/tests/test_phase13.py +663 -0
semantic_code_intelligence/tests/test_phase14.py +568 -0
semantic_code_intelligence/tests/test_phase15.py +814 -0
semantic_code_intelligence/tests/test_phase16.py +792 -0
semantic_code_intelligence/tests/test_phase17.py +815 -0
semantic_code_intelligence/tests/test_phase18.py +934 -0
semantic_code_intelligence/tests/test_phase19.py +986 -0
semantic_code_intelligence/tests/test_phase20.py +2753 -0
semantic_code_intelligence/tests/test_phase20b.py +2058 -0
semantic_code_intelligence/tests/test_phase20c.py +962 -0
semantic_code_intelligence/tests/test_phase21.py +428 -0
semantic_code_intelligence/tests/test_phase22.py +799 -0
semantic_code_intelligence/tests/test_phase23.py +783 -0
semantic_code_intelligence/tests/test_phase24.py +715 -0
semantic_code_intelligence/tests/test_phase25.py +496 -0
semantic_code_intelligence/tests/test_phase26.py +251 -0
semantic_code_intelligence/tests/test_phase27.py +531 -0
semantic_code_intelligence/tests/test_phase8.py +592 -0
semantic_code_intelligence/tests/test_phase9.py +643 -0
semantic_code_intelligence/tests/test_plugins.py +293 -0
semantic_code_intelligence/tests/test_priority_features.py +727 -0
semantic_code_intelligence/tests/test_router.py +41 -0
semantic_code_intelligence/tests/test_scalability.py +138 -0
semantic_code_intelligence/tests/test_scanner.py +125 -0
semantic_code_intelligence/tests/test_search.py +160 -0
semantic_code_intelligence/tests/test_semantic_chunker.py +255 -0
semantic_code_intelligence/tests/test_tools.py +182 -0
semantic_code_intelligence/tests/test_vector_store.py +151 -0
semantic_code_intelligence/tests/test_watcher.py +211 -0
semantic_code_intelligence/tools/__init__.py +442 -0
semantic_code_intelligence/tools/executor.py +232 -0
semantic_code_intelligence/tools/protocol.py +200 -0
semantic_code_intelligence/tui/__init__.py +454 -0
semantic_code_intelligence/utils/__init__.py +0 -0
semantic_code_intelligence/utils/logging.py +112 -0
semantic_code_intelligence/version.py +3 -0
semantic_code_intelligence/web/__init__.py +11 -0
semantic_code_intelligence/web/api.py +289 -0
semantic_code_intelligence/web/server.py +397 -0
semantic_code_intelligence/web/ui.py +659 -0
semantic_code_intelligence/web/visualize.py +226 -0
semantic_code_intelligence/workspace/__init__.py +427 -0

semantic_code_intelligence/tests/test_phase24.py ADDED Viewed

@@ -0,0 +1,715 @@
+"""Phase 24 — Self-Improving Development Loop.
+Tests verify:
+  1.  BudgetGuard — start, can_continue, record_tokens/iteration, stop_reason, summary
+  2.  TestRunner — parse_summary, TestResult
+  3.  CommitManager — git operations with mocked subprocess
+  4.  TaskSelector — priority selection, task builders
+  5.  ContextBuilder — system prompt, build sections, truncation, estimate_tokens
+  6.  PatchGenerator — diff extraction, diff parsing, safety limits
+  7.  EvolutionEngine — orchestrated loop with mocked components
+  8.  CLI command — evolve command exists, help text, options
+  9.  Module imports and version
+"""
+from __future__ import annotations
+import json
+import textwrap
+import time
+from pathlib import Path
+from unittest.mock import MagicMock, patch
+import pytest
+# ---------------------------------------------------------------------------
+# Imports under test
+# ---------------------------------------------------------------------------
+from semantic_code_intelligence.evolution.budget_guard import BudgetGuard
+from semantic_code_intelligence.evolution.test_runner import TestResult, TestRunner, _parse_summary
+from semantic_code_intelligence.evolution.commit_manager import CommitManager
+from semantic_code_intelligence.evolution.task_selector import (
+    TASK_ERROR_HANDLING,
+    TASK_FIX_TESTS,
+    TASK_REDUCE_DUPLICATION,
+    TASK_SMALL_OPTIMISATION,
+    TASK_TYPE_HINTS,
+    EvolutionTask,
+    TaskSelector,
+)
+from semantic_code_intelligence.evolution.context_builder import (
+    SYSTEM_PROMPT,
+    ContextBuilder,
+)
+from semantic_code_intelligence.evolution.patch_generator import (
+    PatchGenerator,
+    PatchResult,
+    _diff_files,
+    _diff_line_count,
+    _extract_diff,
+)
+from semantic_code_intelligence.evolution.engine import (
+    EvolutionEngine,
+    EvolutionResult,
+    IterationRecord,
+)
+from semantic_code_intelligence.llm.mock_provider import MockProvider
+from semantic_code_intelligence.llm.provider import LLMMessage, LLMResponse, MessageRole
+# Directory that contains the semantic_code_intelligence package:
+# parents[2] climbs from this file past tests/ and the package directory.
+_PROJECT_ROOT = Path(__file__).resolve().parents[2]
+# The semantic_code_intelligence package directory under that root.
+_SRC = _PROJECT_ROOT / "semantic_code_intelligence"
+# ═══════════════════════════════════════════════════════════════════════════
+# 1 — BudgetGuard
+# ═══════════════════════════════════════════════════════════════════════════
+class TestBudgetGuard:
+    """Exercise BudgetGuard's token, iteration, and wall-clock accounting."""
+    def test_defaults(self):
+        """A guard built without arguments exposes the default limits and zeroed counters."""
+        guard = BudgetGuard()
+        assert guard.max_tokens == 20_000
+        assert guard.max_iterations == 5
+        assert guard.max_seconds == 600.0
+        assert guard.tokens_used == 0
+        assert guard.iterations_done == 0
+    def test_can_continue_fresh(self):
+        """An untouched guard reports that work may continue."""
+        assert BudgetGuard().can_continue() is True
+    def test_record_tokens(self):
+        """Recorded tokens are added to the used count and subtracted from the remainder."""
+        guard = BudgetGuard(max_tokens=100)
+        guard.record_tokens(40)
+        assert guard.tokens_used == 40
+        assert guard.tokens_remaining == 60
+    def test_record_iteration(self):
+        """Each record_iteration() call bumps the done count and shrinks the remainder."""
+        guard = BudgetGuard(max_iterations=3)
+        for _ in range(2):
+            guard.record_iteration()
+        assert guard.iterations_done == 2
+        assert guard.iterations_remaining == 1
+    def test_stop_on_token_limit(self):
+        """Reaching max_tokens stops the guard with a token-related reason."""
+        guard = BudgetGuard(max_tokens=50)
+        guard.record_tokens(50)
+        assert guard.can_continue() is False
+        reason = guard.stop_reason()
+        assert "token" in reason.lower()
+    def test_stop_on_iteration_limit(self):
+        """Reaching max_iterations stops the guard with an iteration-related reason."""
+        guard = BudgetGuard(max_iterations=2)
+        for _ in range(2):
+            guard.record_iteration()
+        assert guard.can_continue() is False
+        reason = guard.stop_reason()
+        assert "iteration" in reason.lower()
+    def test_stop_on_time_limit(self):
+        """Sleeping past max_seconds after start() stops the guard with a time-related reason."""
+        guard = BudgetGuard(max_seconds=0.01)
+        guard.start()
+        # Sleep for twice the allowed budget so the limit is definitely exceeded.
+        time.sleep(0.02)
+        assert guard.can_continue() is False
+        reason = guard.stop_reason()
+        assert "time" in reason.lower()
+    def test_stop_reason_none_when_ok(self):
+        """A fresh guard has no stop reason."""
+        assert BudgetGuard().stop_reason() is None
+    def test_elapsed_without_start(self):
+        """elapsed_seconds is 0.0 when start() was never called."""
+        assert BudgetGuard().elapsed_seconds == 0.0
+    def test_summary(self):
+        """summary() reports usage, limits, and a float elapsed time."""
+        guard = BudgetGuard(max_tokens=1000, max_iterations=3, max_seconds=300)
+        guard.start()
+        guard.record_tokens(150)
+        guard.record_iteration()
+        report = guard.summary()
+        assert report["tokens_used"] == 150
+        assert report["tokens_max"] == 1000
+        assert report["iterations_done"] == 1
+        assert report["iterations_max"] == 3
+        assert isinstance(report["elapsed_seconds"], float)
+    def test_tokens_remaining_never_negative(self):
+        """Overspending the token budget leaves tokens_remaining at 0."""
+        guard = BudgetGuard(max_tokens=10)
+        guard.record_tokens(100)
+        assert guard.tokens_remaining == 0
+# ═══════════════════════════════════════════════════════════════════════════
+# 2 — TestRunner
+# ═══════════════════════════════════════════════════════════════════════════
+class TestTestResult:
+    """Check the one-line summaries produced by TestResult.summary_line()."""
+    def test_summary_line_pass(self):
+        """A passing result mentions PASS and the total test count."""
+        outcome = TestResult(passed=True, total=10, failures=0, errors=0)
+        rendered = outcome.summary_line()
+        assert "PASS" in rendered
+        assert "10 tests" in rendered
+    def test_summary_line_fail(self):
+        """A failing result mentions FAIL and the failure count."""
+        outcome = TestResult(passed=False, total=10, failures=2, errors=0)
+        rendered = outcome.summary_line()
+        assert "FAIL" in rendered
+        assert "2 failures" in rendered
+    def test_summary_line_errors(self):
+        """A result with errors mentions the error count."""
+        outcome = TestResult(passed=False, total=10, failures=1, errors=2)
+        assert "2 errors" in outcome.summary_line()
+class TestTestRunnerParsing:
+    """Tests for the module-level ``_parse_summary`` helper of ``test_runner``.
+    Each case passes a summary string such as ``"10 passed in 2.34s"`` and
+    checks the ``(total, failures, errors)`` triple that comes back.
+    """
+    def test_parse_all_passed(self):
+        """Only a passed count: total equals it, failures and errors are zero."""
+        total, failures, errors = _parse_summary("10 passed in 2.34s")
+        assert total == 10
+        assert failures == 0
+        assert errors == 0
+    def test_parse_mixed(self):
+        """Passed plus failed: total is their sum."""
+        total, failures, errors = _parse_summary("8 passed, 2 failed in 5.67s")
+        assert total == 10
+        assert failures == 2
+        assert errors == 0
+    def test_parse_errors(self):
+        """Passed, failed and errors all contribute to total."""
+        total, failures, errors = _parse_summary("5 passed, 1 failed, 2 errors in 3.0s")
+        assert total == 8
+        assert failures == 1
+        assert errors == 2
+    def test_parse_empty(self):
+        """An empty string yields all-zero counts."""
+        total, failures, errors = _parse_summary("")
+        assert total == 0
+        assert failures == 0
+        # Previously unpacked but never checked; pin it like the other cases.
+        assert errors == 0
+# ═══════════════════════════════════════════════════════════════════════════
+# 3 — CommitManager
+# ═══════════════════════════════════════════════════════════════════════════
+class TestCommitManager:
+    """Exercise CommitManager with ``subprocess.run`` replaced by a mock."""
+    def test_has_changes_true(self):
+        """Non-empty stdout from the mocked call makes has_changes() return True."""
+        manager = CommitManager(project_root=_PROJECT_ROOT)
+        fake_proc = MagicMock(stdout="M  foo.py\n", returncode=0)
+        with patch("subprocess.run", return_value=fake_proc):
+            assert manager.has_changes() is True
+    def test_has_changes_false(self):
+        """Empty stdout from the mocked call makes has_changes() return False."""
+        manager = CommitManager(project_root=_PROJECT_ROOT)
+        fake_proc = MagicMock(stdout="", returncode=0)
+        with patch("subprocess.run", return_value=fake_proc):
+            assert manager.has_changes() is False
+    def test_git_diff(self):
+        """git_diff() hands back text containing the mocked stdout lines."""
+        manager = CommitManager(project_root=_PROJECT_ROOT)
+        fake_proc = MagicMock(stdout="+added line\n-removed line\n", returncode=0)
+        with patch("subprocess.run", return_value=fake_proc):
+            produced = manager.git_diff()
+            assert "+added line" in produced
+    def test_commit_returns_sha(self):
+        """commit() returns the mocked stdout with the trailing newline removed."""
+        manager = CommitManager(project_root=_PROJECT_ROOT)
+        fake_proc = MagicMock(stdout="abc1234\n", returncode=0)
+        with patch("subprocess.run", return_value=fake_proc):
+            commit_id = manager.commit("test message")
+            assert commit_id == "abc1234"
+    def test_stage_files(self):
+        """stage_files() issues a command containing ``add`` and every file name."""
+        manager = CommitManager(project_root=_PROJECT_ROOT)
+        with patch("subprocess.run", return_value=MagicMock(returncode=0)) as run_mock:
+            manager.stage_files(["a.py", "b.py"])
+            # First positional argument of the most recent subprocess.run call.
+            command = run_mock.call_args.args[0]
+            for token in ("add", "a.py", "b.py"):
+                assert token in command
+    def test_revert_files(self):
+        """revert_files() issues a command containing ``checkout`` and the file name."""
+        manager = CommitManager(project_root=_PROJECT_ROOT)
+        with patch("subprocess.run", return_value=MagicMock(returncode=0)) as run_mock:
+            manager.revert_files(["c.py"])
+            command = run_mock.call_args.args[0]
+            for token in ("checkout", "c.py"):
+                assert token in command
+# ═══════════════════════════════════════════════════════════════════════════
+# 4 — TaskSelector
+# ═══════════════════════════════════════════════════════════════════════════
+class TestEvolutionTask:
+    """Check construction of the EvolutionTask record."""
+    def test_basic_construction(self):
+        """Fields passed in are stored; context_hint defaults to an empty string."""
+        fields = {
+            "category": TASK_TYPE_HINTS,
+            "description": "Add return types to foo.py",
+            "target_files": ["foo.py"],
+        }
+        task = EvolutionTask(**fields)
+        assert task.category == TASK_TYPE_HINTS
+        assert len(task.target_files) == 1
+        assert task.context_hint == ""
+class TestTaskSelector:
+    """Tests for priority-based task selection."""
+    @staticmethod
+    def _make_selector():
+        """Build a TaskSelector whose test runner and commit manager are mocks."""
+        return TaskSelector(
+            project_root=_PROJECT_ROOT,
+            test_runner=MagicMock(),
+            commit_manager=MagicMock(),
+        )
+    def test_fix_tests_has_highest_priority(self):
+        """A failing TestResult makes select() return a TASK_FIX_TESTS task."""
+        sel = self._make_selector()
+        failed_result = TestResult(
+            passed=False, total=7, failures=2, errors=0,
+            output="FAILED tests/test_foo.py::test_bar - AssertionError",
+            return_code=1,
+        )
+        task = sel.select(failed_result)
+        assert task.category == TASK_FIX_TESTS
+    def test_fallback_to_generic(self):
+        """With no test failures and no code issues -> small optimisation."""
+        sel = self._make_selector()
+        # ``passed`` is a flag (see the other TestResult constructions in this
+        # module), so pass True rather than the test count.
+        passing = TestResult(passed=True, total=10, failures=0, errors=0, return_code=0)
+        # Silence every specialised finder so only the generic fallback is left.
+        with patch.object(sel, "_find_type_hint_task", return_value=None), \
+             patch.object(sel, "_find_error_handling_task", return_value=None), \
+             patch.object(sel, "_find_duplication_task", return_value=None):
+            task = sel.select(passing)
+            assert task.category == TASK_SMALL_OPTIMISATION
+    def test_task_categories_are_strings(self):
+        """Every exported task-category constant is a ``str``."""
+        categories = (
+            TASK_FIX_TESTS,
+            TASK_TYPE_HINTS,
+            TASK_ERROR_HANDLING,
+            TASK_REDUCE_DUPLICATION,
+            TASK_SMALL_OPTIMISATION,
+        )
+        for category in categories:
+            assert isinstance(category, str)
+# ═══════════════════════════════════════════════════════════════════════════
+# 5 — ContextBuilder
+# ═══════════════════════════════════════════════════════════════════════════
+class TestContextBuilder:
+    """Exercise ContextBuilder's prompt constant, token estimate, and build()."""
+    def test_system_prompt_exists(self):
+        """SYSTEM_PROMPT is longer than 100 characters and mentions diffs."""
+        assert len(SYSTEM_PROMPT) > 100
+        assert "diff" in SYSTEM_PROMPT.lower()
+    def test_estimate_tokens(self):
+        """estimate_tokens() returns 2 for an 11-char string and 1 for a 2-char string."""
+        builder = ContextBuilder(project_root=_PROJECT_ROOT, commit_manager=MagicMock())
+        # 11 chars // 4 = 2 (floor division), min 1
+        assert builder.estimate_tokens("hello world") == 2
+        # min clamp
+        assert builder.estimate_tokens("hi") == 1
+    def test_build_includes_task(self):
+        """build() output contains both the task description and its category."""
+        commit_manager = MagicMock()
+        commit_manager.git_diff.return_value = ""
+        builder = ContextBuilder(project_root=_PROJECT_ROOT, commit_manager=commit_manager)
+        rendered = builder.build(
+            EvolutionTask(
+                category="test_cat",
+                description="Do something helpful",
+                target_files=[],
+            )
+        )
+        assert "Do something helpful" in rendered
+        assert "test_cat" in rendered
+    def test_build_truncates_large_content(self):
+        """With a 50-token cap, a 10000-char hint yields a shorter context."""
+        commit_manager = MagicMock()
+        commit_manager.git_diff.return_value = ""
+        builder = ContextBuilder(
+            project_root=_PROJECT_ROOT,
+            commit_manager=commit_manager,
+            max_context_tokens=50,
+        )
+        oversized = EvolutionTask(
+            category="demo",
+            description="truncation test",
+            target_files=[],
+            context_hint="A" * 10000,
+        )
+        rendered = builder.build(oversized)
+        assert len(rendered) < 10000
+# ═══════════════════════════════════════════════════════════════════════════
+# 6 — PatchGenerator — diff helpers
+# ═══════════════════════════════════════════════════════════════════════════
+class TestDiffExtraction:
+    """Check how ``_extract_diff`` pulls a unified diff out of LLM reply text."""
+    def test_fenced_diff_block(self):
+        """A diff inside a fenced ``diff`` block is extracted."""
+        reply = textwrap.dedent("""\
+            Here is the patch:
+            ```diff
+            --- a/foo.py
+            +++ b/foo.py
+            @@ -1,3 +1,3 @@
+            -old line
+            +new line
+             context
+            ```
+        """)
+        extracted = _extract_diff(reply)
+        for fragment in ("--- a/foo.py", "+new line"):
+            assert fragment in extracted
+    def test_raw_diff_without_fence(self):
+        """A bare diff with no code fence is extracted as well."""
+        reply = textwrap.dedent("""\
+            --- a/bar.py
+            +++ b/bar.py
+            @@ -10,4 +10,5 @@
+             context
+            -removed
+            +added
+            +another
+        """)
+        extracted = _extract_diff(reply)
+        for fragment in ("--- a/bar.py", "+added"):
+            assert fragment in extracted
+    def test_no_diff_returns_empty(self):
+        """Plain prose with no diff yields an empty string."""
+        extracted = _extract_diff("Just some regular text with no diff.")
+        assert extracted == ""
+class TestDiffFiles:
+    """Check which file paths ``_diff_files`` reports for a unified diff."""
+    def test_single_file(self):
+        """One file header pair yields exactly that file, without the a/ or b/ prefix."""
+        patch_text = "--- a/foo.py\n+++ b/foo.py\n@@ -1 +1 @@\n-x\n+y"
+        assert _diff_files(patch_text) == ["foo.py"]
+    def test_multiple_files(self):
+        """Two file sections yield both file names."""
+        first = "--- a/a.py\n+++ b/a.py\n@@ -1 +1 @@\n-x\n+y\n"
+        second = "--- a/b.py\n+++ b/b.py\n@@ -1 +1 @@\n-x\n+y"
+        reported = _diff_files(first + second)
+        for name in ("a.py", "b.py"):
+            assert name in reported
+    def test_dev_null_excluded(self):
+        """A /dev/null source side is not reported as a file."""
+        patch_text = "--- /dev/null\n+++ b/new.py\n@@ -0,0 +1 @@\n+new"
+        assert _diff_files(patch_text) == ["new.py"]
+class TestDiffLineCount:
+    """Check the changed-line tally computed by ``_diff_line_count``."""
+    def test_counts_adds_and_removes(self):
+        """One removed and one added line count as 2; context lines are not counted."""
+        header = "--- a/foo.py\n+++ b/foo.py\n@@ -1,3 +1,3 @@\n"
+        body = " ctx\n-removed\n+added\n ctx\n"
+        assert _diff_line_count(header + body) == 2
+    def test_ignores_header_lines(self):
+        """The ``---``/``+++`` header lines do not add to the count."""
+        patch_text = "--- a/foo.py\n+++ b/foo.py\n@@ -1 +1 @@\n-x\n+y"
+        assert _diff_line_count(patch_text) == 2
+class TestPatchResult:
+    """Check PatchResult defaults and its dict form."""
+    def test_default_is_failure(self):
+        """A PatchResult built with no arguments is unsuccessful and lists no files."""
+        blank = PatchResult()
+        assert blank.success is False
+        assert blank.files_changed == []
+    def test_to_dict(self):
+        """to_dict() carries over the success flag and the changed-file list."""
+        populated = PatchResult(success=True, files_changed=["a.py"], lines_changed=5)
+        payload = populated.to_dict()
+        assert payload["success"] is True
+        assert payload["files_changed"] == ["a.py"]
+class TestPatchGeneratorSafety:
+    """Exercise PatchGenerator's rejection paths using MockProvider as the LLM."""
+    @staticmethod
+    def _build_generator(provider, budget):
+        """Wire a PatchGenerator to *provider* and *budget* with a stubbed commit manager."""
+        commit_manager = MagicMock()
+        commit_manager.git_diff.return_value = ""
+        builder = ContextBuilder(project_root=_PROJECT_ROOT, commit_manager=commit_manager)
+        return PatchGenerator(
+            project_root=_PROJECT_ROOT,
+            provider=provider,
+            context_builder=builder,
+            budget=budget,
+        )
+    @staticmethod
+    def _placeholder_task():
+        """Return the minimal EvolutionTask shared by every case in this class."""
+        return EvolutionTask(category="test", description="test", target_files=[])
+    def test_rejects_too_many_files(self):
+        """A reply whose diff touches five files fails with an error mentioning files."""
+        provider = MockProvider()
+        lines = []
+        for i in range(5):
+            # One minimal single-line change per synthetic file.
+            lines.extend([
+                f"--- a/f{i}.py",
+                f"+++ b/f{i}.py",
+                "@@ -1 +1 @@",
+                f"-old{i}",
+                f"+new{i}",
+            ])
+        diff_text = "\n".join(lines)
+        provider.enqueue_response(f"```diff\n{diff_text}\n```")
+        generator = self._build_generator(provider, BudgetGuard(max_tokens=50000))
+        outcome = generator.generate_and_apply(self._placeholder_task())
+        assert outcome.success is False
+        assert "files" in outcome.error.lower()
+    def test_rejects_when_budget_exceeded(self):
+        """With the token budget already spent, the call fails with a budget error."""
+        provider = MockProvider()
+        spent = BudgetGuard(max_tokens=10)
+        spent.record_tokens(10)
+        generator = self._build_generator(provider, spent)
+        outcome = generator.generate_and_apply(self._placeholder_task())
+        assert outcome.success is False
+        assert "budget" in outcome.error.lower()
+    def test_handles_llm_returning_no_diff(self):
+        """A reply with no diff in it fails with an error mentioning 'valid' or 'diff'."""
+        provider = MockProvider()
+        provider.enqueue_response("Sorry, I cannot generate a diff for this.")
+        generator = self._build_generator(provider, BudgetGuard(max_tokens=50000))
+        outcome = generator.generate_and_apply(self._placeholder_task())
+        assert outcome.success is False
+        message = outcome.error.lower()
+        assert "valid" in message or "diff" in message
+# ═══════════════════════════════════════════════════════════════════════════
+# 7 — Engine — IterationRecord and EvolutionResult
+# ═══════════════════════════════════════════════════════════════════════════
+class TestIterationRecord:
+    """Check the dict form of an IterationRecord."""
+    def test_to_dict(self):
+        """to_dict() exposes the iteration number, commit flag, and commit SHA."""
+        fields = dict(
+            iteration=1,
+            task_category="type_hints",
+            task_description="Add types",
+            committed=True,
+            commit_sha="abc123",
+        )
+        payload = IterationRecord(**fields).to_dict()
+        assert payload["iteration"] == 1
+        assert payload["committed"] is True
+        assert payload["commit_sha"] == "abc123"
+class TestEvolutionResult:
+    """Check the dict form of the EvolutionResult aggregate."""
+    def test_to_dict(self):
+        """to_dict() exposes the iteration count, the commit list, and the revert count."""
+        aggregate = EvolutionResult(
+            iterations_completed=2,
+            commits=["abc", "def"],
+            reverts=1,
+            stop_reason="iteration limit reached (2)",
+        )
+        payload = aggregate.to_dict()
+        assert payload["iterations_completed"] == 2
+        assert len(payload["commits"]) == 2
+        assert payload["reverts"] == 1
+class TestEvolutionEngineOrchestration:
+    """Tests for the EvolutionEngine loop with mocked components.
+    ``TestRunner.run`` and ``CommitManager.has_changes`` are patched, and the
+    MockProvider only returns replies that contain no diff.
+    """
+    def test_engine_runs_iterations(self, tmp_path):
+        """Engine should run iterations and respect budget."""
+        provider = MockProvider()
+        # One canned reply per allowed iteration.
+        provider.enqueue_response("no diff here")
+        provider.enqueue_response("no diff here")
+        budget = BudgetGuard(max_tokens=50000, max_iterations=2, max_seconds=60)
+        with patch.object(TestRunner, "run") as mock_test_run, \
+             patch.object(CommitManager, "has_changes", return_value=False):
+            # ``passed`` is a flag (see the other TestResult constructions in
+            # this module), so pass True rather than the test count.
+            mock_test_run.return_value = TestResult(
+                passed=True, total=10, failures=0, errors=0, return_code=0,
+            )
+            engine = EvolutionEngine(
+                project_root=tmp_path,
+                provider=provider,
+                budget=budget,
+            )
+            result = engine.run()
+        assert result.iterations_completed == 2
+        assert result.stop_reason is not None
+        assert len(result.history) == 2
+    def test_engine_writes_history(self, tmp_path):
+        """Engine should persist evolution_history.json."""
+        provider = MockProvider()
+        provider.enqueue_response("no diff")
+        budget = BudgetGuard(max_tokens=50000, max_iterations=1, max_seconds=60)
+        with patch.object(TestRunner, "run") as mock_test_run, \
+             patch.object(CommitManager, "has_changes", return_value=False):
+            # Boolean flag, not a count — same reasoning as above.
+            mock_test_run.return_value = TestResult(
+                passed=True, total=5, failures=0, errors=0, return_code=0,
+            )
+            engine = EvolutionEngine(
+                project_root=tmp_path,
+                provider=provider,
+                budget=budget,
+            )
+            engine.run()
+        # The history file is expected under <project_root>/.codexa/.
+        history_file = tmp_path / ".codexa" / "evolution_history.json"
+        assert history_file.exists()
+        data = json.loads(history_file.read_text(encoding="utf-8"))
+        assert isinstance(data, list)
+        assert len(data) == 1
+# ═══════════════════════════════════════════════════════════════════════════
+# 8 — CLI command
+# ═══════════════════════════════════════════════════════════════════════════
+class TestEvolveCLI:
+    """Check the ``evolve`` CLI command object, its options, and its registration."""
+    def test_command_exists(self):
+        """The command object is importable and is named ``evolve``."""
+        from semantic_code_intelligence.cli.commands.evolve_cmd import evolve_cmd
+        assert evolve_cmd.name == "evolve"
+    def test_command_has_options(self):
+        """The command declares the iterations, budget, timeout, and path parameters."""
+        from semantic_code_intelligence.cli.commands.evolve_cmd import evolve_cmd
+        declared = [param.name for param in evolve_cmd.params]
+        for expected in ("iterations", "budget", "timeout", "path"):
+            assert expected in declared
+    def test_command_registered_in_router(self):
+        """register_commands() adds a command named ``evolve`` to the group."""
+        from semantic_code_intelligence.cli.router import register_commands
+        # A stand-in group that only exposes add_command.
+        fake_group = MagicMock(spec=["add_command"])
+        register_commands(fake_group)
+        registered = [
+            recorded.args[0].name
+            for recorded in fake_group.add_command.call_args_list
+        ]
+        assert "evolve" in registered
+    def test_help_mentions_evolve(self):
+        """``--help`` exits with code 0 and mentions 'self-improving' or 'evolve'."""
+        from click.testing import CliRunner
+        from semantic_code_intelligence.cli.commands.evolve_cmd import evolve_cmd
+        outcome = CliRunner().invoke(evolve_cmd, ["--help"])
+        assert outcome.exit_code == 0
+        help_text = outcome.output.lower()
+        assert "self-improving" in help_text or "evolve" in help_text
+# ═══════════════════════════════════════════════════════════════════════════
+# 9 — Module imports and version
+# ═══════════════════════════════════════════════════════════════════════════
+class TestModuleImports:
+    """Confirm each Phase 24 module imports and exposes its expected names."""
+    def test_import_budget_guard(self):
+        """budget_guard exposes BudgetGuard."""
+        from semantic_code_intelligence.evolution import budget_guard
+        assert hasattr(budget_guard, "BudgetGuard")
+    def test_import_test_runner(self):
+        """test_runner exposes TestRunner and TestResult."""
+        from semantic_code_intelligence.evolution import test_runner
+        for attr in ("TestRunner", "TestResult"):
+            assert hasattr(test_runner, attr)
+    def test_import_commit_manager(self):
+        """commit_manager exposes CommitManager."""
+        from semantic_code_intelligence.evolution import commit_manager
+        assert hasattr(commit_manager, "CommitManager")
+    def test_import_task_selector(self):
+        """task_selector exposes TaskSelector and EvolutionTask."""
+        from semantic_code_intelligence.evolution import task_selector
+        for attr in ("TaskSelector", "EvolutionTask"):
+            assert hasattr(task_selector, attr)
+    def test_import_context_builder(self):
+        """context_builder exposes ContextBuilder and SYSTEM_PROMPT."""
+        from semantic_code_intelligence.evolution import context_builder
+        for attr in ("ContextBuilder", "SYSTEM_PROMPT"):
+            assert hasattr(context_builder, attr)
+    def test_import_patch_generator(self):
+        """patch_generator exposes PatchGenerator and PatchResult."""
+        from semantic_code_intelligence.evolution import patch_generator
+        for attr in ("PatchGenerator", "PatchResult"):
+            assert hasattr(patch_generator, attr)
+    def test_import_engine(self):
+        """engine exposes EvolutionEngine, EvolutionResult, and IterationRecord."""
+        from semantic_code_intelligence.evolution import engine
+        for attr in ("EvolutionEngine", "EvolutionResult", "IterationRecord"):
+            assert hasattr(engine, attr)
+    def test_import_evolve_cmd(self):
+        """The evolve_cmd module exposes the evolve_cmd command object."""
+        from semantic_code_intelligence.cli.commands import evolve_cmd
+        assert hasattr(evolve_cmd, "evolve_cmd")
+class TestVersion:
+    """Verify the package's ``__version__`` string."""
+    # Named after the asserted value: the version is 0.4.0, whereas "24" is
+    # the development phase number, not part of the version.
+    def test_version_is_0_4_0(self):
+        """``semantic_code_intelligence.__version__`` equals ``"0.4.0"``."""
+        from semantic_code_intelligence import __version__
+        assert __version__ == "0.4.0"