cite-agent: cite_agent-1.3.9-py3-none-any.whl → cite_agent-1.4.3-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (44)
  1. cite_agent/__init__.py +13 -13
  2. cite_agent/__version__.py +1 -1
  3. cite_agent/action_first_mode.py +150 -0
  4. cite_agent/adaptive_providers.py +413 -0
  5. cite_agent/archive_api_client.py +186 -0
  6. cite_agent/auth.py +0 -1
  7. cite_agent/auto_expander.py +70 -0
  8. cite_agent/cache.py +379 -0
  9. cite_agent/circuit_breaker.py +370 -0
  10. cite_agent/citation_network.py +377 -0
  11. cite_agent/cli.py +8 -16
  12. cite_agent/cli_conversational.py +113 -3
  13. cite_agent/confidence_calibration.py +381 -0
  14. cite_agent/deduplication.py +325 -0
  15. cite_agent/enhanced_ai_agent.py +689 -371
  16. cite_agent/error_handler.py +228 -0
  17. cite_agent/execution_safety.py +329 -0
  18. cite_agent/full_paper_reader.py +239 -0
  19. cite_agent/observability.py +398 -0
  20. cite_agent/offline_mode.py +348 -0
  21. cite_agent/paper_comparator.py +368 -0
  22. cite_agent/paper_summarizer.py +420 -0
  23. cite_agent/pdf_extractor.py +350 -0
  24. cite_agent/proactive_boundaries.py +266 -0
  25. cite_agent/quality_gate.py +442 -0
  26. cite_agent/request_queue.py +390 -0
  27. cite_agent/response_enhancer.py +257 -0
  28. cite_agent/response_formatter.py +458 -0
  29. cite_agent/response_pipeline.py +295 -0
  30. cite_agent/response_style_enhancer.py +259 -0
  31. cite_agent/self_healing.py +418 -0
  32. cite_agent/similarity_finder.py +524 -0
  33. cite_agent/streaming_ui.py +13 -9
  34. cite_agent/thinking_blocks.py +308 -0
  35. cite_agent/tool_orchestrator.py +416 -0
  36. cite_agent/trend_analyzer.py +540 -0
  37. cite_agent/unpaywall_client.py +226 -0
  38. {cite_agent-1.3.9.dist-info → cite_agent-1.4.3.dist-info}/METADATA +15 -1
  39. cite_agent-1.4.3.dist-info/RECORD +62 -0
  40. cite_agent-1.3.9.dist-info/RECORD +0 -32
  41. {cite_agent-1.3.9.dist-info → cite_agent-1.4.3.dist-info}/WHEEL +0 -0
  42. {cite_agent-1.3.9.dist-info → cite_agent-1.4.3.dist-info}/entry_points.txt +0 -0
  43. {cite_agent-1.3.9.dist-info → cite_agent-1.4.3.dist-info}/licenses/LICENSE +0 -0
  44. {cite_agent-1.3.9.dist-info → cite_agent-1.4.3.dist-info}/top_level.txt +0 -0
cite_agent/citation_network.py ADDED
@@ -0,0 +1,377 @@
+ """
+ Citation Network Mapper - Find foundational papers and research lineages
+
+ Provides tools for:
+ - Mapping citation networks
+ - Finding seminal papers
+ - Tracing research lineage
+ - Suggesting reading order
+ """
+
+ from typing import List, Dict, Any, Optional, Set, Tuple
+ import logging
+ from collections import defaultdict, deque
+
+ logger = logging.getLogger(__name__)
+
+
+ class CitationNetwork:
+     """Maps and analyzes citation networks between papers"""
+
+     def __init__(self, archive_client=None):
+         """
+         Initialize citation network mapper
+
+         Args:
+             archive_client: ArchiveAPIClient instance for fetching citation data
+         """
+         self.archive_client = archive_client
+         self._citation_cache = {}
+         self._reference_cache = {}
+
+     def map_citations(self, paper_id: str, depth: int = 1, max_papers: int = 50) -> Dict[str, Any]:
+         """
+         Map citation network for a paper
+
+         Args:
+             paper_id: DOI, arXiv ID, or Semantic Scholar ID
+             depth: How many citation levels to traverse (1-3)
+             max_papers: Maximum papers to include
+
+         Returns:
+             Dictionary with nodes (papers) and edges (citations)
+         """
+         if not self.archive_client:
+             logger.warning("No archive client provided - citation mapping unavailable")
+             return {"nodes": [], "edges": [], "error": "Archive client required"}
+
+         try:
+             # Get base paper
+             base_paper = self._fetch_paper(paper_id)
+             if not base_paper:
+                 return {"nodes": [], "edges": [], "error": f"Paper {paper_id} not found"}
+
+             nodes = []
+             edges = []
+             visited = set()
+
+             # BFS traversal
+             queue = deque([(base_paper, 0)])  # (paper, current_depth)
+
+             while queue and len(nodes) < max_papers:
+                 paper, current_depth = queue.popleft()
+                 paper_id = paper.get('paperId') or paper.get('id')
+
+                 if not paper_id or paper_id in visited:
+                     continue
+
+                 visited.add(paper_id)
+
+                 # Add node
+                 nodes.append({
+                     'id': paper_id,
+                     'title': paper.get('title', 'Unknown'),
+                     'year': paper.get('year'),
+                     'citationCount': paper.get('citationCount', 0),
+                     'authors': [a.get('name') for a in paper.get('authors', [])[:3]],
+                     'depth': current_depth
+                 })
+
+                 # Get citations if within depth limit
+                 if current_depth < depth:
+                     citations = self._fetch_citations(paper_id)
+                     for cited_paper in citations[:20]:  # Limit per paper
+                         cited_id = cited_paper.get('paperId') or cited_paper.get('id')
+                         if cited_id and cited_id not in visited:
+                             edges.append({
+                                 'source': paper_id,
+                                 'target': cited_id,
+                                 'type': 'cites'
+                             })
+                             queue.append((cited_paper, current_depth + 1))
+
+             return {
+                 'nodes': nodes,
+                 'edges': edges,
+                 'stats': {
+                     'total_papers': len(nodes),
+                     'total_citations': len(edges),
+                     'max_depth': depth,
+                     'most_cited': max(nodes, key=lambda x: x['citationCount']) if nodes else None
+                 }
+             }
+
+         except Exception as e:
+             logger.error(f"Error mapping citations: {e}")
+             return {"nodes": [], "edges": [], "error": str(e)}
+
+     def find_seminal_papers(self, topic: str, min_citations: int = 100, limit: int = 20) -> List[Dict[str, Any]]:
+         """
+         Find foundational/seminal papers in a field
+
+         Args:
+             topic: Research topic or query
+             min_citations: Minimum citation count
+             limit: Maximum papers to return
+
+         Returns:
+             List of highly-cited foundational papers
+         """
+         if not self.archive_client:
+             return []
+
+         try:
+             # Search for papers
+             results = self.archive_client.search_papers(
+                 query=topic,
+                 limit=limit * 2,  # Get more to filter
+                 fields=['title', 'authors', 'year', 'citationCount', 'abstract', 'paperId']
+             )
+
+             papers = results.get('data', [])
+
+             # Filter by citation count and sort
+             seminal = [p for p in papers if p.get('citationCount', 0) >= min_citations]
+             seminal.sort(key=lambda x: x.get('citationCount', 0), reverse=True)
+
+             # Enhance with network metrics
+             enhanced = []
+             for paper in seminal[:limit]:
+                 paper_id = paper.get('paperId') or paper.get('id')
+
+                 # Get citation velocity (citations per year)
+                 year = paper.get('year', 2024)
+                 age = max(1, 2025 - year)
+                 citations = paper.get('citationCount', 0)
+                 velocity = citations / age
+
+                 enhanced.append({
+                     'id': paper_id,
+                     'title': paper.get('title'),
+                     'authors': [a.get('name') for a in paper.get('authors', [])[:5]],
+                     'year': year,
+                     'citations': citations,
+                     'citation_velocity': round(velocity, 1),
+                     'abstract': paper.get('abstract', '')[:300],
+                     'influential': citations > min_citations * 2  # Highly influential
+                 })
+
+             return enhanced
+
+         except Exception as e:
+             logger.error(f"Error finding seminal papers: {e}")
+             return []
+
+     def trace_research_lineage(self, paper1_id: str, paper2_id: str, max_depth: int = 4) -> Dict[str, Any]:
+         """
+         Find citation path between two papers
+
+         Args:
+             paper1_id: First paper ID
+             paper2_id: Second paper ID
+             max_depth: Maximum path length to search
+
+         Returns:
+             Shortest citation path between papers
+         """
+         if not self.archive_client:
+             return {"path": [], "error": "Archive client required"}
+
+         try:
+             # BFS to find shortest path
+             queue = deque([(paper1_id, [paper1_id])])
+             visited = {paper1_id}
+
+             while queue:
+                 current_id, path = queue.popleft()
+
+                 if len(path) > max_depth:
+                     continue
+
+                 if current_id == paper2_id:
+                     # Found path! Get paper details
+                     detailed_path = []
+                     for pid in path:
+                         paper = self._fetch_paper(pid)
+                         if paper:
+                             detailed_path.append({
+                                 'id': pid,
+                                 'title': paper.get('title'),
+                                 'year': paper.get('year'),
+                                 'authors': [a.get('name') for a in paper.get('authors', [])[:3]]
+                             })
+
+                     return {
+                         'path': detailed_path,
+                         'length': len(path) - 1,
+                         'connection_type': 'direct' if len(path) == 2 else 'indirect'
+                     }
+
+                 # Explore citations and references
+                 citations = self._fetch_citations(current_id)
+                 references = self._fetch_references(current_id)
+
+                 for paper in citations + references:
+                     paper_id = paper.get('paperId') or paper.get('id')
+                     if paper_id and paper_id not in visited:
+                         visited.add(paper_id)
+                         queue.append((paper_id, path + [paper_id]))
+
+             return {
+                 'path': [],
+                 'error': f'No citation path found within {max_depth} steps'
+             }
+
+         except Exception as e:
+             logger.error(f"Error tracing lineage: {e}")
+             return {"path": [], "error": str(e)}
+
+     def suggest_reading_order(self, paper_ids: List[str]) -> List[Dict[str, Any]]:
+         """
+         Suggest optimal reading order based on citations
+
+         Args:
+             paper_ids: List of paper IDs to order
+
+         Returns:
+             Papers sorted by foundational-to-recent order
+         """
+         if not self.archive_client:
+             return []
+
+         try:
+             # Fetch all papers
+             papers = []
+             for pid in paper_ids:
+                 paper = self._fetch_paper(pid)
+                 if paper:
+                     papers.append(paper)
+
+             # Build citation graph
+             citation_graph = defaultdict(set)
+
+             for paper in papers:
+                 paper_id = paper.get('paperId') or paper.get('id')
+                 references = self._fetch_references(paper_id)
+
+                 for ref in references:
+                     ref_id = ref.get('paperId') or ref.get('id')
+                     if ref_id in paper_ids:
+                         citation_graph[paper_id].add(ref_id)
+
+             # Topological sort (foundational papers first)
+             ordered = []
+             visited = set()
+
+             def dfs(paper_id):
+                 if paper_id in visited:
+                     return
+                 visited.add(paper_id)
+
+                 # Visit dependencies first
+                 for dep_id in citation_graph.get(paper_id, []):
+                     dfs(dep_id)
+
+                 # Find paper details
+                 paper = next((p for p in papers if p.get('paperId') == paper_id or p.get('id') == paper_id), None)
+                 if paper and paper not in ordered:
+                     ordered.append(paper)
+
+             # Process all papers
+             for paper in papers:
+                 paper_id = paper.get('paperId') or paper.get('id')
+                 dfs(paper_id)
+
+             # Format output
+             result = []
+             for i, paper in enumerate(ordered, 1):
+                 result.append({
+                     'order': i,
+                     'id': paper.get('paperId') or paper.get('id'),
+                     'title': paper.get('title'),
+                     'year': paper.get('year'),
+                     'authors': [a.get('name') for a in paper.get('authors', [])[:3]],
+                     'reason': 'Foundational' if i <= len(ordered) // 3 else 'Recent' if i > 2 * len(ordered) // 3 else 'Core'
+                 })
+
+             return result
+
+         except Exception as e:
+             logger.error(f"Error suggesting reading order: {e}")
+             return []
+
+     def _fetch_paper(self, paper_id: str) -> Optional[Dict[str, Any]]:
+         """Fetch paper details from API or cache"""
+         if paper_id in self._citation_cache:
+             return self._citation_cache[paper_id]
+
+         if not self.archive_client:
+             return None
+
+         try:
+             result = self.archive_client.get_paper(
+                 paper_id,
+                 fields=['paperId', 'title', 'authors', 'year', 'citationCount', 'abstract']
+             )
+
+             if result:
+                 self._citation_cache[paper_id] = result
+                 return result
+
+         except Exception as e:
+             logger.warning(f"Could not fetch paper {paper_id}: {e}")
+
+         return None
+
+     def _fetch_citations(self, paper_id: str, limit: int = 50) -> List[Dict[str, Any]]:
+         """Fetch papers citing this paper"""
+         if paper_id in self._citation_cache:
+             cached = self._citation_cache[paper_id]
+             if 'citations' in cached:
+                 return cached['citations']
+
+         if not self.archive_client:
+             return []
+
+         try:
+             # Semantic Scholar API: /paper/{id}/citations
+             citations = self.archive_client.get_paper_citations(paper_id, limit=limit)
+             return citations if citations else []
+
+         except Exception as e:
+             logger.warning(f"Could not fetch citations for {paper_id}: {e}")
+             return []
+
+     def _fetch_references(self, paper_id: str, limit: int = 50) -> List[Dict[str, Any]]:
+         """Fetch papers referenced by this paper"""
+         if paper_id in self._reference_cache:
+             return self._reference_cache[paper_id]
+
+         if not self.archive_client:
+             return []
+
+         try:
+             # Semantic Scholar API: /paper/{id}/references
+             references = self.archive_client.get_paper_references(paper_id, limit=limit)
+
+             if references:
+                 self._reference_cache[paper_id] = references
+                 return references
+
+         except Exception as e:
+             logger.warning(f"Could not fetch references for {paper_id}: {e}")
+
+         return []
+
+
+ def get_citation_network(archive_client=None) -> CitationNetwork:
+     """
+     Get CitationNetwork instance
+
+     Args:
+         archive_client: ArchiveAPIClient instance
+
+     Returns:
+         CitationNetwork instance
+     """
+     return CitationNetwork(archive_client)
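
For orientation, here is a minimal usage sketch of the new module. It assumes an ArchiveAPIClient (added in this release as cite_agent/archive_api_client.py) exposing the search_papers, get_paper, get_paper_citations, and get_paper_references methods that CitationNetwork calls; the client construction and the example paper ID are illustrative, not taken from the package:

    from cite_agent.archive_api_client import ArchiveAPIClient
    from cite_agent.citation_network import get_citation_network

    client = ArchiveAPIClient()  # constructor arguments, if any, are not shown in this diff
    network = get_citation_network(client)

    # One-hop citation graph around a paper, capped at 50 nodes
    graph = network.map_citations("arXiv:1706.03762", depth=1, max_papers=50)
    print(graph["stats"]["total_papers"], "papers,",
          graph["stats"]["total_citations"], "citation edges")

    # Highly cited papers on a topic, ranked by raw citation count
    for paper in network.find_seminal_papers("citation network analysis",
                                             min_citations=200, limit=10):
        print(paper["year"], paper["citations"], paper["title"])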
cite_agent/cli.py CHANGED
@@ -225,7 +225,8 @@ class NocturnalCLI:
      def _show_ready_panel(self):
          panel = Panel(
              "Systems check complete.\n"
-             "Type [bold]help[/] for commands or [bold]tips[/] for power moves.",
+             "Type [bold]help[/] for commands or [bold]tips[/] for power moves.\n"
+             "[dim]Press Ctrl+C while the agent is thinking to interrupt and ask something else.[/dim]",
              title="✅ Cite Agent ready!",
              border_style="green",
              padding=(1, 2),
@@ -460,16 +461,9 @@ class NocturnalCLI:
              finally:
                  live.stop()

-             # Print response with typing effect for natural feel
+             # Print response immediately (no artificial typing delay)
              self.console.print("[bold violet]🤖 Agent[/]: ", end="", highlight=False)
-
-             # Character-by-character streaming (like ChatGPT) - faster for long responses
-             import time
-             for char in response.response:
-                 self.console.print(char, end="", style="white")
-                 time.sleep(0.003)  # 3ms per character (~333 chars/sec) - faster than before
-
-             self.console.print()  # Newline after response
+             self.console.print(response.response)

              # Save to history automatically
              self.workflow.save_query_result(
@@ -482,12 +476,10 @@ class NocturnalCLI:
                  }
              )

-             # Show usage stats occasionally
-             if hasattr(self.agent, 'daily_token_usage') and self.agent.daily_token_usage > 0:
-                 stats = self.agent.get_usage_stats()
-                 if stats['usage_percentage'] > 10:  # Show if >10% used
-                     self.console.print(f"\n📊 Usage: {stats['usage_percentage']:.1f}% of daily limit")
-
+         except KeyboardInterrupt:
+             live.stop()
+             self.console.print("\n[dim]⏹️ Interrupted. Ask another question when ready.[/dim]")
+             continue
          except Exception as e:
              self.console.print(f"\n[error]❌ Error: {e}[/error]")
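
The new KeyboardInterrupt branch follows the usual Rich pattern: stop the Live spinner first so the terminal state is restored, print a short notice, then continue the REPL loop. A minimal self-contained sketch of that shape (the loop and names below are illustrative, not the package's actual code):

    import time

    from rich.console import Console
    from rich.live import Live
    from rich.spinner import Spinner

    console = Console()

    while True:
        query = console.input("[bold]You[/]: ")
        if query.strip().lower() in {"quit", "exit"}:
            break

        live = Live(Spinner("dots", text="Thinking…"), console=console)
        live.start()
        try:
            time.sleep(5)  # stand-in for the real agent call
            live.stop()
            console.print("[bold violet]🤖 Agent[/]: (response here)")
        except KeyboardInterrupt:
            live.stop()  # restore the terminal before printing anything
            console.print("[dim]⏹️ Interrupted. Ask another question when ready.[/dim]")
            continue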
 
cite_agent/cli_conversational.py CHANGED
@@ -8,7 +8,7 @@ import asyncio
  import os
  import sys
  from pathlib import Path
- from typing import Optional
+ from typing import List, Optional

  # Add nocturnal_archive to path
  sys.path.insert(0, str(Path(__file__).parent))
@@ -93,6 +93,85 @@ Remember:

          # Store this for when we make requests
          self.jarvis_prompt = jarvis_system_prompt
+
+     async def _build_environment_snapshot(self, limit: int = 8) -> Optional[str]:
+         """Return a short summary of the current workspace."""
+         if not self.agent:
+             return None
+
+         try:
+             listing = await self.agent._get_workspace_listing(limit=limit)  # type: ignore[attr-defined]
+         except Exception:
+             listing = {"base": self.working_dir, "items": []}
+
+         base = listing.get("base") or self.working_dir
+         items = listing.get("items") or listing.get("entries") or []
+
+         lines: List[str] = [f"📂 Working directory: {base}"]
+
+         if items:
+             preview_count = min(len(items), 6)
+             preview_lines = [
+                 f"  • {item.get('name')} ({item.get('type', 'item')})"
+                 for item in items[:preview_count]
+             ]
+             if len(items) > preview_count:
+                 preview_lines.append(f"  • … {len(items) - preview_count} more")
+             lines.append("Contents snapshot:\n" + "\n".join(preview_lines))
+
+         if listing.get("error"):
+             lines.append(f"⚠️ Workspace note: {listing['error']}")
+
+         note = listing.get("note")
+         if note:
+             lines.append(note)
+
+         return "\n\n".join(lines)
+
+     @staticmethod
+     def _looks_like_grounding_question(text: str) -> bool:
+         lowered = text.lower().strip()
+         if not lowered:
+             return False
+         grounding_phrases = [
+             "where are we",
+             "where am i",
+             "what directory",
+             "current directory",
+             "pwd",
+             "show files",
+             "list files",
+             "where is this",
+         ]
+         return any(phrase in lowered for phrase in grounding_phrases)
+
+     @staticmethod
+     def _is_small_talk_probe(text: str) -> bool:
+         lowered = text.lower().strip()
+         return lowered in {"test", "hi", "hello", "hey", "ping"}
+
+     async def _respond_with_grounding(self) -> None:
+         snapshot = await self._build_environment_snapshot()
+         if not snapshot:
+             snapshot = "I can’t access the workspace details right now, but I’m ready to help."
+
+         async def snapshot_gen():
+             async for chunk in simulate_streaming(snapshot, chunk_size=4):
+                 yield chunk
+
+         await self.ui.stream_agent_response(snapshot_gen())
+
+     async def _respond_with_acknowledgement(self) -> None:
+         message = (
+             "Ready when you are. Try `help` for guidance or ask me to summarise a file like "
+             "`summarize README.md`."
+         )
+
+         async def ack_gen():
+             async for chunk in simulate_streaming(message, chunk_size=4):
+                 yield chunk
+
+         await self.ui.stream_agent_response(ack_gen())

      async def run(self):
          """Main conversation loop"""
@@ -121,6 +200,24 @@ Remember:
              yield chunk

          await self.ui.stream_agent_response(welcome_gen())
+
+         snapshot = await self._build_environment_snapshot()
+         if snapshot:
+             async def snapshot_gen():
+                 async for chunk in simulate_streaming(snapshot, chunk_size=4):
+                     yield chunk
+             await self.ui.stream_agent_response(snapshot_gen())
+
+         quick_tips = (
+             "Quick tips: `help` for options • `read_file README.md` to inspect docs • "
+             "`summarize docs/…` or `analyze data.csv` to get started."
+         )
+
+         async def tips_gen():
+             async for chunk in simulate_streaming(quick_tips, chunk_size=4):
+                 yield chunk
+
+         await self.ui.stream_agent_response(tips_gen())

          # Main conversation loop
          while self.conversation_active:
@@ -160,15 +257,28 @@ Remember:
          - Use appropriate tools
          - Stream response naturally
          """
+
+         stripped = user_input.strip()
+         if not stripped:
+             return
+
+         lowered = stripped.lower()
+
+         if self._is_small_talk_probe(stripped):
+             await self._respond_with_acknowledgement()
+             return
+         if self._looks_like_grounding_question(stripped):
+             await self._respond_with_grounding()
+             return

          # Determine if this is a web search request
-         is_web_search = any(keyword in user_input.lower() for keyword in [
+         is_web_search = any(keyword in lowered for keyword in [
              'google', 'search for', 'browse', 'look up', 'find on the web',
              'what does', 'who is', 'recent news'
          ])

          # Determine if this is a data analysis request
-         is_data_analysis = any(keyword in user_input.lower() for keyword in [
+         is_data_analysis = any(keyword in lowered for keyword in [
              'analyze', 'data', 'csv', 'plot', 'graph', 'test', 'regression',
              'correlation', 'statistics', 'mean', 'median', 'distribution'
          ])
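
Both checks are plain substring matching over the lowered input, the same heuristic the new grounding and small-talk probes use earlier in this file. The pattern generalises to a small keyword table; the dispatch helper below is an illustrative sketch, not code from the package (only the keyword lists are copied from the diff):

    INTENT_KEYWORDS = {
        "web_search": [
            'google', 'search for', 'browse', 'look up', 'find on the web',
            'what does', 'who is', 'recent news',
        ],
        "data_analysis": [
            'analyze', 'data', 'csv', 'plot', 'graph', 'test', 'regression',
            'correlation', 'statistics', 'mean', 'median', 'distribution',
        ],
    }

    def classify(user_input: str) -> str:
        # First matching keyword list wins; fall through to a general handler.
        lowered = user_input.lower().strip()
        for intent, keywords in INTENT_KEYWORDS.items():
            if any(keyword in lowered for keyword in keywords):
                return intent
        return "general"

    assert classify("please analyze results.csv") == "data_analysis"
    assert classify("recent news about open access") == "web_search"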