PyPI - codexa - Versions diffs - 0.4.0__py3-none-any.whl - Mend

codexa 0.4.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (189)

codexa-0.4.0.dist-info/METADATA +650 -0
codexa-0.4.0.dist-info/RECORD +189 -0
codexa-0.4.0.dist-info/WHEEL +5 -0
codexa-0.4.0.dist-info/entry_points.txt +2 -0
codexa-0.4.0.dist-info/licenses/LICENSE +21 -0
codexa-0.4.0.dist-info/top_level.txt +1 -0
semantic_code_intelligence/__init__.py +5 -0
semantic_code_intelligence/analysis/__init__.py +21 -0
semantic_code_intelligence/analysis/ai_features.py +351 -0
semantic_code_intelligence/bridge/__init__.py +28 -0
semantic_code_intelligence/bridge/context_provider.py +245 -0
semantic_code_intelligence/bridge/protocol.py +167 -0
semantic_code_intelligence/bridge/server.py +348 -0
semantic_code_intelligence/bridge/vscode.py +271 -0
semantic_code_intelligence/ci/__init__.py +13 -0
semantic_code_intelligence/ci/hooks.py +98 -0
semantic_code_intelligence/ci/hotspots.py +272 -0
semantic_code_intelligence/ci/impact.py +246 -0
semantic_code_intelligence/ci/metrics.py +591 -0
semantic_code_intelligence/ci/pr.py +412 -0
semantic_code_intelligence/ci/quality.py +557 -0
semantic_code_intelligence/ci/templates.py +164 -0
semantic_code_intelligence/ci/trace.py +224 -0
semantic_code_intelligence/cli/__init__.py +0 -0
semantic_code_intelligence/cli/commands/__init__.py +0 -0
semantic_code_intelligence/cli/commands/ask_cmd.py +153 -0
semantic_code_intelligence/cli/commands/benchmark_cmd.py +303 -0
semantic_code_intelligence/cli/commands/chat_cmd.py +252 -0
semantic_code_intelligence/cli/commands/ci_gen_cmd.py +74 -0
semantic_code_intelligence/cli/commands/context_cmd.py +120 -0
semantic_code_intelligence/cli/commands/cross_refactor_cmd.py +113 -0
semantic_code_intelligence/cli/commands/deps_cmd.py +91 -0
semantic_code_intelligence/cli/commands/docs_cmd.py +101 -0
semantic_code_intelligence/cli/commands/doctor_cmd.py +147 -0
semantic_code_intelligence/cli/commands/evolve_cmd.py +171 -0
semantic_code_intelligence/cli/commands/explain_cmd.py +112 -0
semantic_code_intelligence/cli/commands/gate_cmd.py +135 -0
semantic_code_intelligence/cli/commands/grep_cmd.py +234 -0
semantic_code_intelligence/cli/commands/hotspots_cmd.py +119 -0
semantic_code_intelligence/cli/commands/impact_cmd.py +131 -0
semantic_code_intelligence/cli/commands/index_cmd.py +138 -0
semantic_code_intelligence/cli/commands/init_cmd.py +152 -0
semantic_code_intelligence/cli/commands/investigate_cmd.py +163 -0
semantic_code_intelligence/cli/commands/languages_cmd.py +101 -0
semantic_code_intelligence/cli/commands/lsp_cmd.py +49 -0
semantic_code_intelligence/cli/commands/mcp_cmd.py +50 -0
semantic_code_intelligence/cli/commands/metrics_cmd.py +264 -0
semantic_code_intelligence/cli/commands/models_cmd.py +157 -0
semantic_code_intelligence/cli/commands/plugin_cmd.py +275 -0
semantic_code_intelligence/cli/commands/pr_summary_cmd.py +178 -0
semantic_code_intelligence/cli/commands/quality_cmd.py +208 -0
semantic_code_intelligence/cli/commands/refactor_cmd.py +103 -0
semantic_code_intelligence/cli/commands/review_cmd.py +88 -0
semantic_code_intelligence/cli/commands/search_cmd.py +236 -0
semantic_code_intelligence/cli/commands/serve_cmd.py +117 -0
semantic_code_intelligence/cli/commands/suggest_cmd.py +100 -0
semantic_code_intelligence/cli/commands/summary_cmd.py +78 -0
semantic_code_intelligence/cli/commands/tool_cmd.py +282 -0
semantic_code_intelligence/cli/commands/trace_cmd.py +123 -0
semantic_code_intelligence/cli/commands/tui_cmd.py +58 -0
semantic_code_intelligence/cli/commands/viz_cmd.py +127 -0
semantic_code_intelligence/cli/commands/watch_cmd.py +72 -0
semantic_code_intelligence/cli/commands/web_cmd.py +61 -0
semantic_code_intelligence/cli/commands/workspace_cmd.py +250 -0
semantic_code_intelligence/cli/main.py +65 -0
semantic_code_intelligence/cli/router.py +92 -0
semantic_code_intelligence/config/__init__.py +0 -0
semantic_code_intelligence/config/settings.py +260 -0
semantic_code_intelligence/context/__init__.py +19 -0
semantic_code_intelligence/context/engine.py +429 -0
semantic_code_intelligence/context/memory.py +253 -0
semantic_code_intelligence/daemon/__init__.py +1 -0
semantic_code_intelligence/daemon/watcher.py +515 -0
semantic_code_intelligence/docs/__init__.py +1080 -0
semantic_code_intelligence/embeddings/__init__.py +0 -0
semantic_code_intelligence/embeddings/enhanced.py +131 -0
semantic_code_intelligence/embeddings/generator.py +149 -0
semantic_code_intelligence/embeddings/model_registry.py +100 -0
semantic_code_intelligence/evolution/__init__.py +1 -0
semantic_code_intelligence/evolution/budget_guard.py +111 -0
semantic_code_intelligence/evolution/commit_manager.py +88 -0
semantic_code_intelligence/evolution/context_builder.py +131 -0
semantic_code_intelligence/evolution/engine.py +249 -0
semantic_code_intelligence/evolution/patch_generator.py +229 -0
semantic_code_intelligence/evolution/task_selector.py +214 -0
semantic_code_intelligence/evolution/test_runner.py +111 -0
semantic_code_intelligence/indexing/__init__.py +0 -0
semantic_code_intelligence/indexing/chunker.py +174 -0
semantic_code_intelligence/indexing/parallel.py +86 -0
semantic_code_intelligence/indexing/scanner.py +146 -0
semantic_code_intelligence/indexing/semantic_chunker.py +337 -0
semantic_code_intelligence/llm/__init__.py +62 -0
semantic_code_intelligence/llm/cache.py +219 -0
semantic_code_intelligence/llm/cached_provider.py +145 -0
semantic_code_intelligence/llm/conversation.py +190 -0
semantic_code_intelligence/llm/cross_refactor.py +272 -0
semantic_code_intelligence/llm/investigation.py +274 -0
semantic_code_intelligence/llm/mock_provider.py +77 -0
semantic_code_intelligence/llm/ollama_provider.py +122 -0
semantic_code_intelligence/llm/openai_provider.py +100 -0
semantic_code_intelligence/llm/provider.py +92 -0
semantic_code_intelligence/llm/rate_limiter.py +164 -0
semantic_code_intelligence/llm/reasoning.py +438 -0
semantic_code_intelligence/llm/safety.py +110 -0
semantic_code_intelligence/llm/streaming.py +251 -0
semantic_code_intelligence/lsp/__init__.py +609 -0
semantic_code_intelligence/mcp/__init__.py +393 -0
semantic_code_intelligence/parsing/__init__.py +19 -0
semantic_code_intelligence/parsing/parser.py +375 -0
semantic_code_intelligence/plugins/__init__.py +255 -0
semantic_code_intelligence/plugins/examples/__init__.py +1 -0
semantic_code_intelligence/plugins/examples/code_quality.py +73 -0
semantic_code_intelligence/plugins/examples/search_annotator.py +56 -0
semantic_code_intelligence/scalability/__init__.py +205 -0
semantic_code_intelligence/search/__init__.py +0 -0
semantic_code_intelligence/search/formatter.py +123 -0
semantic_code_intelligence/search/grep.py +361 -0
semantic_code_intelligence/search/hybrid_search.py +170 -0
semantic_code_intelligence/search/keyword_search.py +311 -0
semantic_code_intelligence/search/section_expander.py +103 -0
semantic_code_intelligence/services/__init__.py +0 -0
semantic_code_intelligence/services/indexing_service.py +630 -0
semantic_code_intelligence/services/search_service.py +269 -0
semantic_code_intelligence/storage/__init__.py +0 -0
semantic_code_intelligence/storage/chunk_hash_store.py +86 -0
semantic_code_intelligence/storage/hash_store.py +66 -0
semantic_code_intelligence/storage/index_manifest.py +85 -0
semantic_code_intelligence/storage/index_stats.py +138 -0
semantic_code_intelligence/storage/query_history.py +160 -0
semantic_code_intelligence/storage/symbol_registry.py +209 -0
semantic_code_intelligence/storage/vector_store.py +297 -0
semantic_code_intelligence/tests/__init__.py +0 -0
semantic_code_intelligence/tests/test_ai_features.py +351 -0
semantic_code_intelligence/tests/test_chunker.py +119 -0
semantic_code_intelligence/tests/test_cli.py +188 -0
semantic_code_intelligence/tests/test_config.py +154 -0
semantic_code_intelligence/tests/test_context.py +381 -0
semantic_code_intelligence/tests/test_embeddings.py +73 -0
semantic_code_intelligence/tests/test_endtoend.py +1142 -0
semantic_code_intelligence/tests/test_enhanced_embeddings.py +92 -0
semantic_code_intelligence/tests/test_hash_store.py +79 -0
semantic_code_intelligence/tests/test_logging.py +55 -0
semantic_code_intelligence/tests/test_new_cli.py +138 -0
semantic_code_intelligence/tests/test_parser.py +495 -0
semantic_code_intelligence/tests/test_phase10.py +355 -0
semantic_code_intelligence/tests/test_phase11.py +593 -0
semantic_code_intelligence/tests/test_phase12.py +375 -0
semantic_code_intelligence/tests/test_phase13.py +663 -0
semantic_code_intelligence/tests/test_phase14.py +568 -0
semantic_code_intelligence/tests/test_phase15.py +814 -0
semantic_code_intelligence/tests/test_phase16.py +792 -0
semantic_code_intelligence/tests/test_phase17.py +815 -0
semantic_code_intelligence/tests/test_phase18.py +934 -0
semantic_code_intelligence/tests/test_phase19.py +986 -0
semantic_code_intelligence/tests/test_phase20.py +2753 -0
semantic_code_intelligence/tests/test_phase20b.py +2058 -0
semantic_code_intelligence/tests/test_phase20c.py +962 -0
semantic_code_intelligence/tests/test_phase21.py +428 -0
semantic_code_intelligence/tests/test_phase22.py +799 -0
semantic_code_intelligence/tests/test_phase23.py +783 -0
semantic_code_intelligence/tests/test_phase24.py +715 -0
semantic_code_intelligence/tests/test_phase25.py +496 -0
semantic_code_intelligence/tests/test_phase26.py +251 -0
semantic_code_intelligence/tests/test_phase27.py +531 -0
semantic_code_intelligence/tests/test_phase8.py +592 -0
semantic_code_intelligence/tests/test_phase9.py +643 -0
semantic_code_intelligence/tests/test_plugins.py +293 -0
semantic_code_intelligence/tests/test_priority_features.py +727 -0
semantic_code_intelligence/tests/test_router.py +41 -0
semantic_code_intelligence/tests/test_scalability.py +138 -0
semantic_code_intelligence/tests/test_scanner.py +125 -0
semantic_code_intelligence/tests/test_search.py +160 -0
semantic_code_intelligence/tests/test_semantic_chunker.py +255 -0
semantic_code_intelligence/tests/test_tools.py +182 -0
semantic_code_intelligence/tests/test_vector_store.py +151 -0
semantic_code_intelligence/tests/test_watcher.py +211 -0
semantic_code_intelligence/tools/__init__.py +442 -0
semantic_code_intelligence/tools/executor.py +232 -0
semantic_code_intelligence/tools/protocol.py +200 -0
semantic_code_intelligence/tui/__init__.py +454 -0
semantic_code_intelligence/utils/__init__.py +0 -0
semantic_code_intelligence/utils/logging.py +112 -0
semantic_code_intelligence/version.py +3 -0
semantic_code_intelligence/web/__init__.py +11 -0
semantic_code_intelligence/web/api.py +289 -0
semantic_code_intelligence/web/server.py +397 -0
semantic_code_intelligence/web/ui.py +659 -0
semantic_code_intelligence/web/visualize.py +226 -0
semantic_code_intelligence/workspace/__init__.py +427 -0

semantic_code_intelligence/tests/test_ai_features.py ADDED

@@ -0,0 +1,351 @@
+"""Tests for AI features — repository summary, AI context, code explanations."""
+import json
+import pytest
+from semantic_code_intelligence.analysis.ai_features import (
+    CodeExplanation,
+    LanguageStats,
+    RepoSummary,
+    explain_file,
+    explain_symbol,
+    generate_ai_context,
+    summarize_repository,
+)
+from semantic_code_intelligence.context.engine import ContextBuilder
+# ---------------------------------------------------------------------------
+# Sample code
+# ---------------------------------------------------------------------------
+# Python fixture source: two imports, module-level functions ``helper`` and
+# ``main`` (``main`` calls ``helper``), and a ``Worker`` class whose ``process``
+# method also calls ``helper``. Tests in this module index it as "app.py".
+PYTHON_SAMPLE = '''\
+import os
+from pathlib import Path
+def helper():
+    return 42
+def main():
+    result = helper()
+    print(result)
+class Worker:
+    def __init__(self):
+        self.data = []
+    def process(self):
+        result = helper()
+        return result
+'''
+# JavaScript fixture source: one import, functions ``parse`` and ``load``
+# (``load`` calls ``parse``), and a ``DataLoader`` class whose ``load`` method
+# calls the module-level ``load``. Tests in this module index it as "app.js".
+JS_SAMPLE = '''\
+import { readFile } from 'fs';
+function parse(data) {
+    return JSON.parse(data);
+}
+function load(path) {
+    const data = readFile(path);
+    return parse(data);
+}
+class DataLoader {
+    constructor(path) {
+        this.path = path;
+    }
+    load() {
+        return load(this.path);
+    }
+}
+'''
+# ---------------------------------------------------------------------------
+# RepoSummary
+# ---------------------------------------------------------------------------
+class TestRepoSummary:
+    @pytest.fixture(autouse=True)
+    def setup(self):
+        self.builder = ContextBuilder()
+        self.builder.index_file("app.py", PYTHON_SAMPLE)
+        self.builder.index_file("app.js", JS_SAMPLE)
+        self.summary = summarize_repository(self.builder)
+    def test_total_files(self):
+        assert self.summary.total_files == 2
+    def test_total_symbols(self):
+        assert self.summary.total_symbols > 0
+    def test_total_functions(self):
+        assert self.summary.total_functions >= 2  # helper, main, parse, load
+    def test_total_classes(self):
+        assert self.summary.total_classes >= 2  # Worker, DataLoader
+    def test_total_methods(self):
+        assert self.summary.total_methods >= 2
+    def test_total_imports(self):
+        assert self.summary.total_imports >= 2
+    def test_languages_listed(self):
+        lang_names = {l.language for l in self.summary.languages}
+        assert "python" in lang_names
+        assert "javascript" in lang_names
+    def test_top_functions(self):
+        assert len(self.summary.top_functions) > 0
+        assert "name" in self.summary.top_functions[0]
+    def test_top_classes(self):
+        assert len(self.summary.top_classes) > 0
+        assert "name" in self.summary.top_classes[0]
+    def test_to_dict(self):
+        d = self.summary.to_dict()
+        assert "total_files" in d
+        assert "languages" in d
+        assert "top_functions" in d
+    def test_to_json(self):
+        j = self.summary.to_json()
+        parsed = json.loads(j)
+        assert parsed["total_files"] == 2
+    def test_render(self):
+        text = self.summary.render()
+        assert "Repository Summary" in text
+        assert "Files:" in text
+        assert "Languages" in text
+class TestLanguageStats:
+    def test_to_dict(self):
+        stats = LanguageStats(
+            language="python",
+            file_count=5,
+            function_count=10,
+            class_count=3,
+        )
+        d = stats.to_dict()
+        assert d["language"] == "python"
+        assert d["file_count"] == 5
+        assert d["function_count"] == 10
+        assert d["class_count"] == 3
+class TestRepoSummaryEmpty:
+    def test_empty_builder(self):
+        builder = ContextBuilder()
+        summary = summarize_repository(builder)
+        assert summary.total_files == 0
+        assert summary.total_symbols == 0
+        assert summary.languages == []
+    def test_single_file(self):
+        builder = ContextBuilder()
+        builder.index_file("app.py", PYTHON_SAMPLE)
+        summary = summarize_repository(builder)
+        assert summary.total_files == 1
+        lang_names = {l.language for l in summary.languages}
+        assert "python" in lang_names
+# ---------------------------------------------------------------------------
+# AI Context Generation
+# ---------------------------------------------------------------------------
+class TestGenerateAIContext:
+    @pytest.fixture(autouse=True)
+    def setup(self):
+        self.builder = ContextBuilder()
+        self.builder.index_file("app.py", PYTHON_SAMPLE)
+        self.builder.index_file("app.js", JS_SAMPLE)
+    def test_basic_context(self):
+        ctx = generate_ai_context(self.builder)
+        assert "summary" in ctx
+        assert "call_graph" in ctx
+        assert "dependencies" in ctx
+    def test_context_with_symbol_focus(self):
+        ctx = generate_ai_context(self.builder, symbol_name="helper")
+        assert "focused_contexts" in ctx
+        assert len(ctx["focused_contexts"]) >= 1
+    def test_context_with_file_focus(self):
+        ctx = generate_ai_context(self.builder, file_path="app.py")
+        assert "file_symbols" in ctx
+        assert len(ctx["file_symbols"]) > 0
+    def test_context_without_call_graph(self):
+        ctx = generate_ai_context(self.builder, include_call_graph=False)
+        assert "call_graph" not in ctx
+    def test_context_without_dependencies(self):
+        ctx = generate_ai_context(self.builder, include_dependencies=False)
+        assert "dependencies" not in ctx
+    def test_context_is_json_serializable(self):
+        ctx = generate_ai_context(self.builder)
+        j = json.dumps(ctx)
+        assert len(j) > 0
+    def test_call_graph_has_edges(self):
+        ctx = generate_ai_context(self.builder)
+        assert ctx["call_graph"]["edge_count"] > 0
+    def test_dependencies_has_files(self):
+        ctx = generate_ai_context(self.builder)
+        assert "app.py" in ctx["dependencies"]
+# ---------------------------------------------------------------------------
+# Code Explanation
+# ---------------------------------------------------------------------------
+class TestExplainSymbol:
+    @pytest.fixture(autouse=True)
+    def setup(self):
+        self.builder = ContextBuilder()
+        self.builder.index_file("app.py", PYTHON_SAMPLE)
+        self.symbols = self.builder.get_all_symbols()
+    def test_explain_function(self):
+        func = next(s for s in self.symbols if s.name == "helper")
+        explanation = explain_symbol(func)
+        assert explanation.symbol_name == "helper"
+        assert explanation.symbol_kind == "function"
+        assert "Function" in explanation.summary
+        assert "helper" in explanation.summary
+    def test_explain_class(self):
+        cls = next(s for s in self.symbols if s.name == "Worker")
+        explanation = explain_symbol(cls)
+        assert explanation.symbol_name == "Worker"
+        assert "Class" in explanation.summary
+    def test_explain_method(self):
+        method = next(s for s in self.symbols if s.name == "process")
+        explanation = explain_symbol(method)
+        assert explanation.symbol_name == "process"
+        assert "Method" in explanation.summary
+        assert "Worker" in explanation.summary
+    def test_explain_import(self):
+        imp = next(s for s in self.symbols if s.kind == "import")
+        explanation = explain_symbol(imp)
+        assert "Import" in explanation.summary
+    def test_explain_with_builder_context(self):
+        func = next(s for s in self.symbols if s.name == "main")
+        explanation = explain_symbol(func, self.builder)
+        assert "related_symbols" in explanation.details or "file_imports" in explanation.details
+    def test_explanation_to_dict(self):
+        func = next(s for s in self.symbols if s.name == "helper")
+        explanation = explain_symbol(func)
+        d = explanation.to_dict()
+        assert "symbol_name" in d
+        assert "summary" in d
+        assert "details" in d
+    def test_explanation_render(self):
+        func = next(s for s in self.symbols if s.name == "helper")
+        explanation = explain_symbol(func)
+        text = explanation.render()
+        assert "helper" in text
+        assert "File:" in text
+    def test_explanation_render_with_details(self):
+        func = next(s for s in self.symbols if s.name == "main")
+        explanation = explain_symbol(func, self.builder)
+        text = explanation.render()
+        assert "main" in text
+class TestExplainFile:
+    def test_explain_python_file(self):
+        explanations = explain_file("app.py", PYTHON_SAMPLE)
+        assert len(explanations) > 0
+        # Should not include imports
+        for e in explanations:
+            assert e.symbol_kind != "import"
+    def test_explain_js_file(self):
+        explanations = explain_file("app.js", JS_SAMPLE)
+        assert len(explanations) > 0
+    def test_explain_empty_file(self):
+        explanations = explain_file("empty.py", "")
+        assert explanations == []
+    def test_explain_unsupported_file(self):
+        explanations = explain_file("style.css", "body { color: red; }")
+        assert explanations == []
+    def test_each_explanation_has_name(self):
+        explanations = explain_file("app.py", PYTHON_SAMPLE)
+        for e in explanations:
+            assert e.symbol_name
+            assert e.file_path == "app.py"
+class TestCodeExplanation:
+    def test_dataclass_fields(self):
+        exp = CodeExplanation(
+            symbol_name="foo",
+            symbol_kind="function",
+            file_path="test.py",
+            summary="A test function.",
+            details={"parameters": "a, b"},
+        )
+        assert exp.symbol_name == "foo"
+        assert exp.details["parameters"] == "a, b"
+    def test_render_empty_details(self):
+        exp = CodeExplanation(
+            symbol_name="foo",
+            symbol_kind="function",
+            file_path="test.py",
+            summary="A test function.",
+        )
+        text = exp.render()
+        assert "foo" in text
+        assert "Function" in text
+# ---------------------------------------------------------------------------
+# Edge cases
+# ---------------------------------------------------------------------------
+class TestAIFeaturesEdgeCases:
+    def test_summary_single_symbol(self):
+        builder = ContextBuilder()
+        builder.index_file("one.py", "def single(): pass\n")
+        summary = summarize_repository(builder)
+        assert summary.total_functions == 1
+        assert summary.total_files == 1
+    def test_ai_context_empty_builder(self):
+        builder = ContextBuilder()
+        ctx = generate_ai_context(builder)
+        assert ctx["summary"]["total_files"] == 0
+    def test_ai_context_nonexistent_symbol(self):
+        builder = ContextBuilder()
+        builder.index_file("app.py", PYTHON_SAMPLE)
+        ctx = generate_ai_context(builder, symbol_name="nonexistent")
+        assert ctx["focused_contexts"] == []
+    def test_ai_context_nonexistent_file(self):
+        builder = ContextBuilder()
+        builder.index_file("app.py", PYTHON_SAMPLE)
+        ctx = generate_ai_context(builder, file_path="nonexistent.py")
+        assert ctx["file_symbols"] == []

semantic_code_intelligence/tests/test_chunker.py ADDED

@@ -0,0 +1,119 @@
+"""Tests for the code chunker."""
+from __future__ import annotations
+from pathlib import Path
+import pytest
+from semantic_code_intelligence.indexing.chunker import (
+    CodeChunk,
+    chunk_code,
+    chunk_file,
+    detect_language,
+)
+class TestDetectLanguage:
+    """Tests for language detection."""
+    def test_python(self):
+        assert detect_language("main.py") == "python"
+    def test_javascript(self):
+        assert detect_language("app.js") == "javascript"
+    def test_typescript(self):
+        assert detect_language("component.tsx") == "typescript"
+    def test_java(self):
+        assert detect_language("Main.java") == "java"
+    def test_unknown(self):
+        assert detect_language("data.xyz") == "unknown"
+    def test_path_with_directory(self):
+        assert detect_language("/some/path/file.py") == "python"
+        assert detect_language("C:\\code\\file.js") == "javascript"
+class TestChunkCode:
+    """Tests for code chunking logic."""
+    def test_empty_content(self):
+        chunks = chunk_code("", "test.py")
+        assert chunks == []
+    def test_whitespace_only(self):
+        chunks = chunk_code("   \n  \n ", "test.py")
+        assert chunks == []
+    def test_small_file_single_chunk(self):
+        code = "def hello():\n    return 'world'\n"
+        chunks = chunk_code(code, "test.py", chunk_size=1000)
+        assert len(chunks) == 1
+        assert chunks[0].content == code
+        assert chunks[0].start_line == 1
+        assert chunks[0].end_line == 2
+        assert chunks[0].language == "python"
+        assert chunks[0].chunk_index == 0
+    def test_large_file_multiple_chunks(self):
+        lines = [f"line_{i} = {i}\n" for i in range(100)]
+        code = "".join(lines)
+        chunks = chunk_code(code, "test.py", chunk_size=200, chunk_overlap=50)
+        assert len(chunks) > 1
+    def test_chunks_cover_all_content(self):
+        lines = [f"x_{i} = {i}\n" for i in range(50)]
+        code = "".join(lines)
+        chunks = chunk_code(code, "test.py", chunk_size=100, chunk_overlap=20)
+        # Every line should appear in at least one chunk
+        all_chunk_text = "".join(c.content for c in chunks)
+        for line in lines:
+            assert line in all_chunk_text
+    def test_chunk_index_sequential(self):
+        lines = [f"var_{i} = {i}\n" for i in range(100)]
+        code = "".join(lines)
+        chunks = chunk_code(code, "test.py", chunk_size=150, chunk_overlap=30)
+        for i, chunk in enumerate(chunks):
+            assert chunk.chunk_index == i
+    def test_chunk_metadata(self):
+        code = "function hello() { return 1; }\n"
+        chunks = chunk_code(code, "app.js", chunk_size=1000)
+        assert chunks[0].file_path == "app.js"
+        assert chunks[0].language == "javascript"
+    def test_overlap_between_chunks(self):
+        lines = [f"line_{i:03d} = {i}\n" for i in range(100)]
+        code = "".join(lines)
+        chunks = chunk_code(code, "test.py", chunk_size=200, chunk_overlap=50)
+        if len(chunks) >= 2:
+            # Last lines of chunk N should appear in chunk N+1
+            chunk0_lines = set(chunks[0].content.splitlines())
+            chunk1_lines = set(chunks[1].content.splitlines())
+            overlap = chunk0_lines & chunk1_lines
+            assert len(overlap) > 0
+class TestChunkFile:
+    """Tests for file-based chunking."""
+    def test_chunk_existing_file(self, tmp_path: Path):
+        f = tmp_path / "test.py"
+        f.write_text("def hello():\n    pass\n", encoding="utf-8")
+        chunks = chunk_file(f, chunk_size=1000)
+        assert len(chunks) == 1
+    def test_chunk_nonexistent_file(self, tmp_path: Path):
+        f = tmp_path / "missing.py"
+        chunks = chunk_file(f)
+        assert chunks == []
+    def test_chunk_empty_file(self, tmp_path: Path):
+        f = tmp_path / "empty.py"
+        f.write_text("", encoding="utf-8")
+        chunks = chunk_file(f)
+        assert chunks == []

semantic_code_intelligence/tests/test_cli.py ADDED

@@ -0,0 +1,188 @@
+"""Tests for CLI commands and routing."""
+from __future__ import annotations
+import json
+from pathlib import Path
+import pytest
+from click.testing import CliRunner
+from semantic_code_intelligence.cli.main import cli
+@pytest.fixture
+def runner() -> CliRunner:
+    """Provide a Click test runner."""
+    return CliRunner()
+@pytest.fixture
+def initialized_project(tmp_path: Path) -> Path:
+    """Create an initialized project directory."""
+    runner = CliRunner()
+    with runner.isolated_filesystem(temp_dir=tmp_path) as td:
+        project = Path(td)
+        runner.invoke(cli, ["init", str(project)])
+        yield project
+class TestCLIMain:
+    """Tests for the main CLI group."""
+    def test_cli_help(self, runner: CliRunner):
+        result = runner.invoke(cli, ["--help"])
+        assert result.exit_code == 0
+        assert "Codex" in result.output
+    def test_cli_version(self, runner: CliRunner):
+        result = runner.invoke(cli, ["--version"])
+        assert result.exit_code == 0
+        assert "0.4.0" in result.output
+    def test_cli_verbose_flag(self, runner: CliRunner):
+        result = runner.invoke(cli, ["--verbose", "--help"])
+        assert result.exit_code == 0
+class TestInitCommand:
+    """Tests for the init command."""
+    def test_init_creates_project(self, runner: CliRunner, tmp_path: Path):
+        result = runner.invoke(cli, ["init", str(tmp_path)])
+        assert result.exit_code == 0
+        assert (tmp_path / ".codexa").is_dir()
+        assert (tmp_path / ".codexa" / "config.json").exists()
+        assert (tmp_path / ".codexa" / "index").is_dir()
+    def test_init_already_initialized(self, runner: CliRunner, tmp_path: Path):
+        # First init
+        runner.invoke(cli, ["init", str(tmp_path)])
+        # Second init should detect existing
+        result = runner.invoke(cli, ["init", str(tmp_path)])
+        assert result.exit_code == 0
+        assert "already initialized" in result.output
+    def test_init_default_path(self, runner: CliRunner):
+        with runner.isolated_filesystem() as td:
+            result = runner.invoke(cli, ["init"])
+            assert result.exit_code == 0
+            assert Path(td, ".codexa").is_dir()
+class TestIndexCommand:
+    """Tests for the index command."""
+    def test_index_without_init_fails(self, runner: CliRunner, tmp_path: Path):
+        result = runner.invoke(cli, ["index", str(tmp_path)])
+        assert result.exit_code != 0 or "not initialized" in result.output.lower()
+    def test_index_initialized_project(self, runner: CliRunner, tmp_path: Path):
+        # Initialize first
+        runner.invoke(cli, ["init", str(tmp_path)])
+        result = runner.invoke(cli, ["index", str(tmp_path)])
+        assert result.exit_code == 0
+        assert "Indexing" in result.output or "index" in result.output.lower()
+    def test_index_with_python_files(self, runner: CliRunner, tmp_path: Path):
+        # Create some Python files
+        (tmp_path / "main.py").write_text("def hello(): pass", encoding="utf-8")
+        (tmp_path / "utils.py").write_text("def helper(): pass", encoding="utf-8")
+        runner.invoke(cli, ["init", str(tmp_path)])
+        result = runner.invoke(cli, ["index", str(tmp_path)])
+        assert result.exit_code == 0
+        # Should find 2 py files (not counting files in .codexa)
+        assert "2 files" in result.output
+    def test_index_ignores_excluded_dirs(self, runner: CliRunner, tmp_path: Path):
+        # Create files in ignored directories
+        (tmp_path / "main.py").write_text("def hello(): pass", encoding="utf-8")
+        node_modules = tmp_path / "node_modules"
+        node_modules.mkdir()
+        (node_modules / "pkg.js").write_text("function f(){}", encoding="utf-8")
+        runner.invoke(cli, ["init", str(tmp_path)])
+        result = runner.invoke(cli, ["index", str(tmp_path)])
+        assert result.exit_code == 0
+        assert "1 files" in result.output
+    def test_index_force_flag(self, runner: CliRunner, tmp_path: Path):
+        runner.invoke(cli, ["init", str(tmp_path)])
+        result = runner.invoke(cli, ["index", str(tmp_path), "--force"])
+        assert result.exit_code == 0
+class TestSearchCommand:
+    """Tests for the search command."""
+    def test_search_without_init_fails(self, runner: CliRunner, tmp_path: Path):
+        result = runner.invoke(cli, ["search", "test query", "--path", str(tmp_path)])
+        assert result.exit_code != 0 or "not initialized" in result.output.lower()
+    def test_search_human_readable(self, runner: CliRunner, tmp_path: Path):
+        runner.invoke(cli, ["init", str(tmp_path)])
+        result = runner.invoke(
+            cli, ["search", "test query", "--path", str(tmp_path)]
+        )
+        assert result.exit_code == 0
+        # Without an index, shows empty index warning
+        assert "empty" in result.output.lower() or "no results" in result.output.lower()
+    def test_search_json_output(self, runner: CliRunner, tmp_path: Path):
+        runner.invoke(cli, ["init", str(tmp_path)])
+        result = runner.invoke(
+            cli, ["search", "jwt verification", "--json", "--no-auto-index", "--path", str(tmp_path)]
+        )
+        assert result.exit_code == 0
+        data = json.loads(result.output)
+        assert data["query"] == "jwt verification"
+        assert "results" in data
+        assert isinstance(data["results"], list)
+    def test_search_custom_top_k(self, runner: CliRunner, tmp_path: Path):
+        runner.invoke(cli, ["init", str(tmp_path)])
+        result = runner.invoke(
+            cli,
+            ["search", "query", "-k", "5", "--json", "--no-auto-index", "--path", str(tmp_path)],
+        )
+        assert result.exit_code == 0
+        data = json.loads(result.output)
+        assert data["top_k"] == 5
+    def test_search_default_top_k_from_config(self, runner: CliRunner, tmp_path: Path):
+        runner.invoke(cli, ["init", str(tmp_path)])
+        result = runner.invoke(
+            cli,
+            ["search", "query", "--json", "--no-auto-index", "--path", str(tmp_path)],
+        )
+        assert result.exit_code == 0
+        data = json.loads(result.output)
+        assert data["top_k"] == 10  # default from config
+class TestCommandRouting:
+    """Tests that all commands are properly registered and routable."""
+    def test_all_commands_registered(self, runner: CliRunner):
+        result = runner.invoke(cli, ["--help"])
+        assert result.exit_code == 0
+        # All Phase 1 commands should appear in help
+        for cmd_name in ["init", "index", "search"]:
+            assert cmd_name in result.output
+    def test_init_command_accessible(self, runner: CliRunner):
+        result = runner.invoke(cli, ["init", "--help"])
+        assert result.exit_code == 0
+    def test_index_command_accessible(self, runner: CliRunner):
+        result = runner.invoke(cli, ["index", "--help"])
+        assert result.exit_code == 0
+    def test_search_command_accessible(self, runner: CliRunner):
+        result = runner.invoke(cli, ["search", "--help"])
+        assert result.exit_code == 0
+    def test_unknown_command_fails(self, runner: CliRunner):
+        result = runner.invoke(cli, ["nonexistent"])
+        assert result.exit_code != 0