ai-coding-assistant 0.5.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (89)
  1. ai_coding_assistant-0.5.0.dist-info/METADATA +226 -0
  2. ai_coding_assistant-0.5.0.dist-info/RECORD +89 -0
  3. ai_coding_assistant-0.5.0.dist-info/WHEEL +4 -0
  4. ai_coding_assistant-0.5.0.dist-info/entry_points.txt +3 -0
  5. ai_coding_assistant-0.5.0.dist-info/licenses/LICENSE +21 -0
  6. coding_assistant/__init__.py +3 -0
  7. coding_assistant/__main__.py +19 -0
  8. coding_assistant/cli/__init__.py +1 -0
  9. coding_assistant/cli/app.py +158 -0
  10. coding_assistant/cli/commands/__init__.py +19 -0
  11. coding_assistant/cli/commands/ask.py +178 -0
  12. coding_assistant/cli/commands/config.py +438 -0
  13. coding_assistant/cli/commands/diagram.py +267 -0
  14. coding_assistant/cli/commands/document.py +410 -0
  15. coding_assistant/cli/commands/explain.py +192 -0
  16. coding_assistant/cli/commands/fix.py +249 -0
  17. coding_assistant/cli/commands/index.py +162 -0
  18. coding_assistant/cli/commands/refactor.py +245 -0
  19. coding_assistant/cli/commands/search.py +182 -0
  20. coding_assistant/cli/commands/serve_docs.py +128 -0
  21. coding_assistant/cli/repl.py +381 -0
  22. coding_assistant/cli/theme.py +90 -0
  23. coding_assistant/codebase/__init__.py +1 -0
  24. coding_assistant/codebase/crawler.py +93 -0
  25. coding_assistant/codebase/parser.py +266 -0
  26. coding_assistant/config/__init__.py +25 -0
  27. coding_assistant/config/config_manager.py +615 -0
  28. coding_assistant/config/settings.py +82 -0
  29. coding_assistant/context/__init__.py +19 -0
  30. coding_assistant/context/chunker.py +443 -0
  31. coding_assistant/context/enhanced_retriever.py +322 -0
  32. coding_assistant/context/hybrid_search.py +311 -0
  33. coding_assistant/context/ranker.py +355 -0
  34. coding_assistant/context/retriever.py +119 -0
  35. coding_assistant/context/window.py +362 -0
  36. coding_assistant/documentation/__init__.py +23 -0
  37. coding_assistant/documentation/agents/__init__.py +27 -0
  38. coding_assistant/documentation/agents/coordinator.py +510 -0
  39. coding_assistant/documentation/agents/module_documenter.py +111 -0
  40. coding_assistant/documentation/agents/synthesizer.py +139 -0
  41. coding_assistant/documentation/agents/task_delegator.py +100 -0
  42. coding_assistant/documentation/decomposition/__init__.py +21 -0
  43. coding_assistant/documentation/decomposition/context_preserver.py +477 -0
  44. coding_assistant/documentation/decomposition/module_detector.py +302 -0
  45. coding_assistant/documentation/decomposition/partitioner.py +621 -0
  46. coding_assistant/documentation/generators/__init__.py +14 -0
  47. coding_assistant/documentation/generators/dataflow_generator.py +440 -0
  48. coding_assistant/documentation/generators/diagram_generator.py +511 -0
  49. coding_assistant/documentation/graph/__init__.py +13 -0
  50. coding_assistant/documentation/graph/dependency_builder.py +468 -0
  51. coding_assistant/documentation/graph/module_analyzer.py +475 -0
  52. coding_assistant/documentation/writers/__init__.py +11 -0
  53. coding_assistant/documentation/writers/markdown_writer.py +322 -0
  54. coding_assistant/embeddings/__init__.py +0 -0
  55. coding_assistant/embeddings/generator.py +89 -0
  56. coding_assistant/embeddings/store.py +187 -0
  57. coding_assistant/exceptions/__init__.py +50 -0
  58. coding_assistant/exceptions/base.py +110 -0
  59. coding_assistant/exceptions/llm.py +249 -0
  60. coding_assistant/exceptions/recovery.py +263 -0
  61. coding_assistant/exceptions/storage.py +213 -0
  62. coding_assistant/exceptions/validation.py +230 -0
  63. coding_assistant/llm/__init__.py +1 -0
  64. coding_assistant/llm/client.py +277 -0
  65. coding_assistant/llm/gemini_client.py +181 -0
  66. coding_assistant/llm/groq_client.py +160 -0
  67. coding_assistant/llm/prompts.py +98 -0
  68. coding_assistant/llm/together_client.py +160 -0
  69. coding_assistant/operations/__init__.py +13 -0
  70. coding_assistant/operations/differ.py +369 -0
  71. coding_assistant/operations/generator.py +347 -0
  72. coding_assistant/operations/linter.py +430 -0
  73. coding_assistant/operations/validator.py +406 -0
  74. coding_assistant/storage/__init__.py +9 -0
  75. coding_assistant/storage/database.py +363 -0
  76. coding_assistant/storage/session.py +231 -0
  77. coding_assistant/utils/__init__.py +31 -0
  78. coding_assistant/utils/cache.py +477 -0
  79. coding_assistant/utils/hardware.py +132 -0
  80. coding_assistant/utils/keystore.py +206 -0
  81. coding_assistant/utils/logger.py +32 -0
  82. coding_assistant/utils/progress.py +311 -0
  83. coding_assistant/validation/__init__.py +13 -0
  84. coding_assistant/validation/files.py +305 -0
  85. coding_assistant/validation/inputs.py +335 -0
  86. coding_assistant/validation/params.py +280 -0
  87. coding_assistant/validation/sanitizers.py +243 -0
  88. coding_assistant/vcs/__init__.py +5 -0
  89. coding_assistant/vcs/git.py +269 -0
@@ -0,0 +1,362 @@
1
+ """Token window management for LLM context limits."""
2
+
3
+ from typing import List, Dict, Optional, Any
4
+ import tiktoken
5
+ from dataclasses import dataclass
6
+
7
+
8
@dataclass
class TokenBudget:
    """Token budget allocation for a single LLM request.

    Attributes:
        total: Full context-window size in tokens.
        system_prompt: Tokens consumed by the system prompt.
        query: Tokens consumed by the user query.
        history: Tokens consumed by conversation history.
        chunks: Tokens consumed by code chunks.
        response_reserved: Tokens held back for the model's response.
    """
    total: int
    system_prompt: int
    query: int
    history: int
    chunks: int
    response_reserved: int

    @property
    def used(self) -> int:
        """Total tokens used by all prompt components."""
        return self.system_prompt + self.query + self.history + self.chunks

    @property
    def available(self) -> int:
        """Tokens still available for the response (may be negative if over budget)."""
        return self.total - self.used - self.response_reserved

    @property
    def utilization(self) -> float:
        """Context window utilization (0-1).

        Fix: guard the denominator — when the response reserve consumes the
        whole window (total <= response_reserved) the old code raised
        ZeroDivisionError. In that degenerate case report 1.0 if anything
        was spent, else 0.0.
        """
        capacity = self.total - self.response_reserved
        if capacity <= 0:
            return 1.0 if self.used > 0 else 0.0
        return self.used / capacity
32
+
33
+
34
+ class TokenWindowManager:
35
+ """
36
+ Manages context within LLM token limits.
37
+
38
+ This class handles:
39
+ - Token counting for text
40
+ - Context prioritization
41
+ - Truncation when needed
42
+ - Budget allocation
43
+
44
+ Default allocations:
45
+ - System prompt: 5-10% (reserved)
46
+ - Response: 15-20% (reserved)
47
+ - Query: actual size
48
+ - History: up to 30%
49
+ - Code chunks: remaining space
50
+ """
51
+
52
+ def __init__(
53
+ self,
54
+ max_tokens: int = 150000, # Default for Claude Sonnet
55
+ reserved_response: int = 4000,
56
+ reserved_system: int = 1000,
57
+ max_history_ratio: float = 0.3, # Max 30% for history
58
+ encoding: str = "cl100k_base" # OpenAI compatible encoding
59
+ ):
60
+ """
61
+ Initialize token window manager.
62
+
63
+ Args:
64
+ max_tokens: Maximum context window size
65
+ reserved_response: Tokens reserved for LLM response
66
+ reserved_system: Tokens reserved for system prompt
67
+ max_history_ratio: Maximum ratio of tokens for history
68
+ encoding: Tiktoken encoding to use
69
+ """
70
+ self.max_tokens = max_tokens
71
+ self.reserved_response = reserved_response
72
+ self.reserved_system = reserved_system
73
+ self.max_history_ratio = max_history_ratio
74
+
75
+ try:
76
+ self.encoder = tiktoken.get_encoding(encoding)
77
+ except Exception:
78
+ # Fallback to basic estimation
79
+ self.encoder = None
80
+
81
+ def count_tokens(self, text: str) -> int:
82
+ """
83
+ Count tokens in text.
84
+
85
+ Args:
86
+ text: Text to count tokens for
87
+
88
+ Returns:
89
+ Number of tokens
90
+ """
91
+ if not text:
92
+ return 0
93
+
94
+ if self.encoder:
95
+ try:
96
+ return len(self.encoder.encode(text))
97
+ except Exception:
98
+ pass
99
+
100
+ # Fallback: rough estimation (1 token ≈ 4 characters)
101
+ return len(text) // 4
102
+
103
+ def build_context(
104
+ self,
105
+ query: str,
106
+ chunks: List[Dict[str, Any]],
107
+ history: Optional[List[Dict[str, str]]] = None,
108
+ system_prompt: Optional[str] = None
109
+ ) -> Dict[str, Any]:
110
+ """
111
+ Build context within token limit.
112
+
113
+ Args:
114
+ query: User query
115
+ chunks: Code chunks (must have 'content' key)
116
+ history: Conversation history (list of {role, content})
117
+ system_prompt: System prompt text
118
+
119
+ Returns:
120
+ Dict with selected context and token budget
121
+ """
122
+ history = history or []
123
+
124
+ # Count tokens for fixed components
125
+ query_tokens = self.count_tokens(query)
126
+ system_tokens = self.count_tokens(system_prompt) if system_prompt else self.reserved_system
127
+
128
+ # Available tokens for history and chunks
129
+ available = self.max_tokens - self.reserved_response - system_tokens - query_tokens
130
+
131
+ if available <= 0:
132
+ # Query too long!
133
+ return {
134
+ 'query': query,
135
+ 'history': [],
136
+ 'chunks': [],
137
+ 'budget': self._create_budget(
138
+ system_tokens, query_tokens, 0, 0
139
+ ),
140
+ 'truncated': True,
141
+ 'error': 'Query exceeds token limit'
142
+ }
143
+
144
+ # Allocate history (up to max_history_ratio)
145
+ max_history_tokens = int(available * self.max_history_ratio)
146
+ included_history, history_tokens = self._select_history(
147
+ history, max_history_tokens
148
+ )
149
+
150
+ # Remaining tokens for chunks
151
+ available_for_chunks = available - history_tokens
152
+
153
+ # Select chunks that fit
154
+ included_chunks, chunk_tokens = self._select_chunks(
155
+ chunks, available_for_chunks
156
+ )
157
+
158
+ budget = self._create_budget(
159
+ system_tokens, query_tokens, history_tokens, chunk_tokens
160
+ )
161
+
162
+ return {
163
+ 'query': query,
164
+ 'history': included_history,
165
+ 'chunks': included_chunks,
166
+ 'budget': budget,
167
+ 'truncated': len(included_chunks) < len(chunks) or len(included_history) < len(history)
168
+ }
169
+
170
+ def _select_history(
171
+ self,
172
+ history: List[Dict[str, str]],
173
+ max_tokens: int
174
+ ) -> tuple[List[Dict[str, str]], int]:
175
+ """
176
+ Select history messages that fit within token limit.
177
+
178
+ Prioritizes recent messages.
179
+
180
+ Args:
181
+ history: Full conversation history
182
+ max_tokens: Maximum tokens for history
183
+
184
+ Returns:
185
+ Tuple of (selected messages, total tokens)
186
+ """
187
+ if not history:
188
+ return [], 0
189
+
190
+ included = []
191
+ total_tokens = 0
192
+
193
+ # Start from most recent and work backwards
194
+ for msg in reversed(history[-20:]): # Consider last 20 messages
195
+ content = msg.get('content', '')
196
+ msg_tokens = self.count_tokens(content)
197
+
198
+ if total_tokens + msg_tokens <= max_tokens:
199
+ included.insert(0, msg) # Maintain chronological order
200
+ total_tokens += msg_tokens
201
+ else:
202
+ # Can't fit more messages
203
+ break
204
+
205
+ return included, total_tokens
206
+
207
+ def _select_chunks(
208
+ self,
209
+ chunks: List[Dict[str, Any]],
210
+ max_tokens: int
211
+ ) -> tuple[List[Dict[str, Any]], int]:
212
+ """
213
+ Select code chunks that fit within token limit.
214
+
215
+ Assumes chunks are already ranked by relevance.
216
+
217
+ Args:
218
+ chunks: Code chunks (ranked)
219
+ max_tokens: Maximum tokens for chunks
220
+
221
+ Returns:
222
+ Tuple of (selected chunks, total tokens)
223
+ """
224
+ if not chunks:
225
+ return [], 0
226
+
227
+ included = []
228
+ total_tokens = 0
229
+
230
+ for chunk in chunks:
231
+ content = chunk.get('content', '')
232
+ chunk_tokens = self.count_tokens(content)
233
+
234
+ if total_tokens + chunk_tokens <= max_tokens:
235
+ included.append(chunk)
236
+ total_tokens += chunk_tokens
237
+ else:
238
+ # Try to fit at least one chunk
239
+ if not included and chunk_tokens <= max_tokens * 1.2:
240
+ # Allow slight overflow for first chunk
241
+ included.append(chunk)
242
+ total_tokens += chunk_tokens
243
+ break
244
+
245
+ return included, total_tokens
246
+
247
+ def _create_budget(
248
+ self,
249
+ system_tokens: int,
250
+ query_tokens: int,
251
+ history_tokens: int,
252
+ chunk_tokens: int
253
+ ) -> TokenBudget:
254
+ """Create token budget summary."""
255
+ return TokenBudget(
256
+ total=self.max_tokens,
257
+ system_prompt=system_tokens,
258
+ query=query_tokens,
259
+ history=history_tokens,
260
+ chunks=chunk_tokens,
261
+ response_reserved=self.reserved_response
262
+ )
263
+
264
+ def estimate_response_tokens(self, response: str) -> int:
265
+ """
266
+ Estimate tokens in a response.
267
+
268
+ Args:
269
+ response: Response text
270
+
271
+ Returns:
272
+ Estimated token count
273
+ """
274
+ return self.count_tokens(response)
275
+
276
+ def can_fit(self, text: str, available_tokens: int) -> bool:
277
+ """
278
+ Check if text fits within token limit.
279
+
280
+ Args:
281
+ text: Text to check
282
+ available_tokens: Available token budget
283
+
284
+ Returns:
285
+ True if text fits
286
+ """
287
+ return self.count_tokens(text) <= available_tokens
288
+
289
+ def truncate_text(self, text: str, max_tokens: int) -> str:
290
+ """
291
+ Truncate text to fit within token limit.
292
+
293
+ Args:
294
+ text: Text to truncate
295
+ max_tokens: Maximum tokens allowed
296
+
297
+ Returns:
298
+ Truncated text
299
+ """
300
+ tokens = self.count_tokens(text)
301
+
302
+ if tokens <= max_tokens:
303
+ return text
304
+
305
+ # Binary search for the right length
306
+ if self.encoder:
307
+ encoded = self.encoder.encode(text)
308
+ truncated = encoded[:max_tokens]
309
+ return self.encoder.decode(truncated) + "..."
310
+
311
+ # Fallback: character-based truncation
312
+ ratio = max_tokens / tokens
313
+ char_limit = int(len(text) * ratio)
314
+ return text[:char_limit] + "..."
315
+
316
+ def get_model_limits(self, model_name: str) -> tuple[int, int]:
317
+ """
318
+ Get token limits for known models.
319
+
320
+ Args:
321
+ model_name: Model identifier
322
+
323
+ Returns:
324
+ Tuple of (max_tokens, recommended_response_reserve)
325
+ """
326
+ limits = {
327
+ 'claude-sonnet': (200000, 4000),
328
+ 'claude-opus': (200000, 4000),
329
+ 'gpt-4': (128000, 4000),
330
+ 'gpt-3.5': (16385, 2000),
331
+ 'ollama-default': (4096, 512),
332
+ }
333
+
334
+ # Match by substring
335
+ for key, (max_tok, reserve) in limits.items():
336
+ if key in model_name.lower():
337
+ return max_tok, reserve
338
+
339
+ # Conservative default
340
+ return 8000, 1000
341
+
342
+ def format_budget_summary(self, budget: TokenBudget) -> str:
343
+ """
344
+ Format budget for display.
345
+
346
+ Args:
347
+ budget: Token budget
348
+
349
+ Returns:
350
+ Formatted string
351
+ """
352
+ return f"""Token Budget:
353
+ Total Window: {budget.total:,} tokens
354
+ System Prompt: {budget.system_prompt:,} tokens ({budget.system_prompt/budget.total*100:.1f}%)
355
+ Query: {budget.query:,} tokens ({budget.query/budget.total*100:.1f}%)
356
+ History: {budget.history:,} tokens ({budget.history/budget.total*100:.1f}%)
357
+ Code Chunks: {budget.chunks:,} tokens ({budget.chunks/budget.total*100:.1f}%)
358
+ Reserved (Resp): {budget.response_reserved:,} tokens ({budget.response_reserved/budget.total*100:.1f}%)
359
+ ─────────────────────────────────────
360
+ Used: {budget.used:,} tokens ({budget.utilization*100:.1f}%)
361
+ Available: {budget.available:,} tokens
362
+ """
@@ -0,0 +1,23 @@
1
"""Documentation generation module for AI Coding Assistant.

This module provides CodeWiki-style automated documentation generation:
- Repository-level architecture understanding
- Hierarchical decomposition for scalability
- Multi-agent documentation generation
- Visual diagram creation (Mermaid)
- Incremental updates and continuous synchronization
"""

# Re-export the dependency-graph primitives so callers can import them
# directly from ``coding_assistant.documentation``.
from coding_assistant.documentation.graph.dependency_builder import (
    DependencyGraphBuilder,
    CodeEntity,
)
from coding_assistant.documentation.graph.module_analyzer import ModuleAnalyzer

# Explicit public API of this package.
__all__ = [
    'DependencyGraphBuilder',
    'CodeEntity',
    'ModuleAnalyzer',
]

# Package version string — presumably kept in sync with the wheel's
# distribution version (0.5.0); confirm against packaging metadata.
__version__ = '0.5.0'
@@ -0,0 +1,27 @@
1
"""Multi-agent documentation generation system.

This module implements parallel documentation generation using multiple LLM agents,
inspired by CodeWiki's recursive multi-agent approach.
"""

# Re-export the agent classes so callers can import them directly from
# ``coding_assistant.documentation.agents``.
from coding_assistant.documentation.agents.coordinator import (
    MultiAgentCoordinator,
    DocumentationTask,
)
from coding_assistant.documentation.agents.module_documenter import (
    ModuleDocumenter,
)
from coding_assistant.documentation.agents.synthesizer import (
    DocumentationSynthesizer,
)
from coding_assistant.documentation.agents.task_delegator import (
    TaskDelegator,
)

# Explicit public API of this package.
__all__ = [
    'MultiAgentCoordinator',
    'DocumentationTask',
    'ModuleDocumenter',
    'DocumentationSynthesizer',
    'TaskDelegator',
]