PyPI - amd-gaia - Versions diffs - 0.14.3__py3-none-any.whl → 0.15.1__py3-none-any.whl - Mend

amd-gaia 0.14.3 (py3-none-any.whl) → 0.15.1 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (181)

{amd_gaia-0.14.3.dist-info → amd_gaia-0.15.1.dist-info}/METADATA +223 -223
amd_gaia-0.15.1.dist-info/RECORD +178 -0
{amd_gaia-0.14.3.dist-info → amd_gaia-0.15.1.dist-info}/entry_points.txt +1 -0
{amd_gaia-0.14.3.dist-info → amd_gaia-0.15.1.dist-info}/licenses/LICENSE.md +20 -20
gaia/__init__.py +29 -29
gaia/agents/__init__.py +19 -19
gaia/agents/base/__init__.py +9 -9
gaia/agents/base/agent.py +2177 -2177
gaia/agents/base/api_agent.py +120 -120
gaia/agents/base/console.py +1841 -1841
gaia/agents/base/errors.py +237 -237
gaia/agents/base/mcp_agent.py +86 -86
gaia/agents/base/tools.py +83 -83
gaia/agents/blender/agent.py +556 -556
gaia/agents/blender/agent_simple.py +133 -135
gaia/agents/blender/app.py +211 -211
gaia/agents/blender/app_simple.py +41 -41
gaia/agents/blender/core/__init__.py +16 -16
gaia/agents/blender/core/materials.py +506 -506
gaia/agents/blender/core/objects.py +316 -316
gaia/agents/blender/core/rendering.py +225 -225
gaia/agents/blender/core/scene.py +220 -220
gaia/agents/blender/core/view.py +146 -146
gaia/agents/chat/__init__.py +9 -9
gaia/agents/chat/agent.py +835 -835
gaia/agents/chat/app.py +1058 -1058
gaia/agents/chat/session.py +508 -508
gaia/agents/chat/tools/__init__.py +15 -15
gaia/agents/chat/tools/file_tools.py +96 -96
gaia/agents/chat/tools/rag_tools.py +1729 -1729
gaia/agents/chat/tools/shell_tools.py +436 -436
gaia/agents/code/__init__.py +7 -7
gaia/agents/code/agent.py +549 -549
gaia/agents/code/cli.py +377 -0
gaia/agents/code/models.py +135 -135
gaia/agents/code/orchestration/__init__.py +24 -24
gaia/agents/code/orchestration/checklist_executor.py +1763 -1763
gaia/agents/code/orchestration/checklist_generator.py +713 -713
gaia/agents/code/orchestration/factories/__init__.py +9 -9
gaia/agents/code/orchestration/factories/base.py +63 -63
gaia/agents/code/orchestration/factories/nextjs_factory.py +118 -118
gaia/agents/code/orchestration/factories/python_factory.py +106 -106
gaia/agents/code/orchestration/orchestrator.py +841 -841
gaia/agents/code/orchestration/project_analyzer.py +391 -391
gaia/agents/code/orchestration/steps/__init__.py +67 -67
gaia/agents/code/orchestration/steps/base.py +188 -188
gaia/agents/code/orchestration/steps/error_handler.py +314 -314
gaia/agents/code/orchestration/steps/nextjs.py +828 -828
gaia/agents/code/orchestration/steps/python.py +307 -307
gaia/agents/code/orchestration/template_catalog.py +469 -469
gaia/agents/code/orchestration/workflows/__init__.py +14 -14
gaia/agents/code/orchestration/workflows/base.py +80 -80
gaia/agents/code/orchestration/workflows/nextjs.py +186 -186
gaia/agents/code/orchestration/workflows/python.py +94 -94
gaia/agents/code/prompts/__init__.py +11 -11
gaia/agents/code/prompts/base_prompt.py +77 -77
gaia/agents/code/prompts/code_patterns.py +2036 -2036
gaia/agents/code/prompts/nextjs_prompt.py +40 -40
gaia/agents/code/prompts/python_prompt.py +109 -109
gaia/agents/code/schema_inference.py +365 -365
gaia/agents/code/system_prompt.py +41 -41
gaia/agents/code/tools/__init__.py +42 -42
gaia/agents/code/tools/cli_tools.py +1138 -1138
gaia/agents/code/tools/code_formatting.py +319 -319
gaia/agents/code/tools/code_tools.py +769 -769
gaia/agents/code/tools/error_fixing.py +1347 -1347
gaia/agents/code/tools/external_tools.py +180 -180
gaia/agents/code/tools/file_io.py +845 -845
gaia/agents/code/tools/prisma_tools.py +190 -190
gaia/agents/code/tools/project_management.py +1016 -1016
gaia/agents/code/tools/testing.py +321 -321
gaia/agents/code/tools/typescript_tools.py +122 -122
gaia/agents/code/tools/validation_parsing.py +461 -461
gaia/agents/code/tools/validation_tools.py +806 -806
gaia/agents/code/tools/web_dev_tools.py +1758 -1758
gaia/agents/code/validators/__init__.py +16 -16
gaia/agents/code/validators/antipattern_checker.py +241 -241
gaia/agents/code/validators/ast_analyzer.py +197 -197
gaia/agents/code/validators/requirements_validator.py +145 -145
gaia/agents/code/validators/syntax_validator.py +171 -171
gaia/agents/docker/__init__.py +7 -7
gaia/agents/docker/agent.py +642 -642
gaia/agents/emr/__init__.py +8 -8
gaia/agents/emr/agent.py +1506 -1506
gaia/agents/emr/cli.py +1322 -1322
gaia/agents/emr/constants.py +475 -475
gaia/agents/emr/dashboard/__init__.py +4 -4
gaia/agents/emr/dashboard/server.py +1974 -1974
gaia/agents/jira/__init__.py +11 -11
gaia/agents/jira/agent.py +894 -894
gaia/agents/jira/jql_templates.py +299 -299
gaia/agents/routing/__init__.py +7 -7
gaia/agents/routing/agent.py +567 -570
gaia/agents/routing/system_prompt.py +75 -75
gaia/agents/summarize/__init__.py +11 -0
gaia/agents/summarize/agent.py +885 -0
gaia/agents/summarize/prompts.py +129 -0
gaia/api/__init__.py +23 -23
gaia/api/agent_registry.py +238 -238
gaia/api/app.py +305 -305
gaia/api/openai_server.py +575 -575
gaia/api/schemas.py +186 -186
gaia/api/sse_handler.py +373 -373
gaia/apps/__init__.py +4 -4
gaia/apps/llm/__init__.py +6 -6
gaia/apps/llm/app.py +173 -169
gaia/apps/summarize/app.py +116 -633
gaia/apps/summarize/html_viewer.py +133 -133
gaia/apps/summarize/pdf_formatter.py +284 -284
gaia/audio/__init__.py +2 -2
gaia/audio/audio_client.py +439 -439
gaia/audio/audio_recorder.py +269 -269
gaia/audio/kokoro_tts.py +599 -599
gaia/audio/whisper_asr.py +432 -432
gaia/chat/__init__.py +16 -16
gaia/chat/app.py +430 -430
gaia/chat/prompts.py +522 -522
gaia/chat/sdk.py +1228 -1225
gaia/cli.py +5481 -5621
gaia/database/__init__.py +10 -10
gaia/database/agent.py +176 -176
gaia/database/mixin.py +290 -290
gaia/database/testing.py +64 -64
gaia/eval/batch_experiment.py +2332 -2332
gaia/eval/claude.py +542 -542
gaia/eval/config.py +37 -37
gaia/eval/email_generator.py +512 -512
gaia/eval/eval.py +3179 -3179
gaia/eval/groundtruth.py +1130 -1130
gaia/eval/transcript_generator.py +582 -582
gaia/eval/webapp/README.md +167 -167
gaia/eval/webapp/package-lock.json +875 -875
gaia/eval/webapp/package.json +20 -20
gaia/eval/webapp/public/app.js +3402 -3402
gaia/eval/webapp/public/index.html +87 -87
gaia/eval/webapp/public/styles.css +3661 -3661
gaia/eval/webapp/server.js +415 -415
gaia/eval/webapp/test-setup.js +72 -72
gaia/llm/__init__.py +9 -2
gaia/llm/base_client.py +60 -0
gaia/llm/exceptions.py +12 -0
gaia/llm/factory.py +70 -0
gaia/llm/lemonade_client.py +3236 -3221
gaia/llm/lemonade_manager.py +294 -294
gaia/llm/providers/__init__.py +9 -0
gaia/llm/providers/claude.py +108 -0
gaia/llm/providers/lemonade.py +120 -0
gaia/llm/providers/openai_provider.py +79 -0
gaia/llm/vlm_client.py +382 -382
gaia/logger.py +189 -189
gaia/mcp/agent_mcp_server.py +245 -245
gaia/mcp/blender_mcp_client.py +138 -138
gaia/mcp/blender_mcp_server.py +648 -648
gaia/mcp/context7_cache.py +332 -332
gaia/mcp/external_services.py +518 -518
gaia/mcp/mcp_bridge.py +811 -550
gaia/mcp/servers/__init__.py +6 -6
gaia/mcp/servers/docker_mcp.py +83 -83
gaia/perf_analysis.py +361 -0
gaia/rag/__init__.py +10 -10
gaia/rag/app.py +293 -293
gaia/rag/demo.py +304 -304
gaia/rag/pdf_utils.py +235 -235
gaia/rag/sdk.py +2194 -2194
gaia/security.py +163 -163
gaia/talk/app.py +289 -289
gaia/talk/sdk.py +538 -538
gaia/testing/__init__.py +87 -87
gaia/testing/assertions.py +330 -330
gaia/testing/fixtures.py +333 -333
gaia/testing/mocks.py +493 -493
gaia/util.py +46 -46
gaia/utils/__init__.py +33 -33
gaia/utils/file_watcher.py +675 -675
gaia/utils/parsing.py +223 -223
gaia/version.py +100 -100
amd_gaia-0.14.3.dist-info/RECORD +0 -168
gaia/agents/code/app.py +0 -266
gaia/llm/llm_client.py +0 -729
{amd_gaia-0.14.3.dist-info → amd_gaia-0.15.1.dist-info}/WHEEL +0 -0
{amd_gaia-0.14.3.dist-info → amd_gaia-0.15.1.dist-info}/top_level.txt +0 -0

gaia/mcp/external_services.py CHANGED

@@ -1,518 +1,518 @@
-#!/usr/bin/env python
-#
-# Copyright(C) 2024-2025 Advanced Micro Devices, Inc. All rights reserved.
-# SPDX-License-Identifier: MIT
-"""
-External MCP Services Integration
-Provides wrappers for external MCP services like Context7 and Perplexity
-that run as separate processes via npx commands.
-"""
-import json
-import os
-import subprocess
-import time
-from typing import Any, Dict, List, Optional
-from gaia.logger import get_logger
-logger = get_logger(__name__)
-class ExternalMCPService:
-    """Base class for managing external MCP services via subprocess."""
-    def __init__(
-        self,
-        command: List[str],
-        env: Optional[Dict[str, str]] = None,
-        timeout: int = 30,
-    ):
-        """
-        Initialize external MCP service.
-        Args:
-            command: Command to start the MCP service (e.g., ["npx", "-y", "package"])
-            env: Additional environment variables
-            timeout: Timeout in seconds for subprocess calls
-        """
-        self.command = command
-        self.env = {**os.environ.copy(), **(env or {})}
-        self.timeout = timeout
-        self.process = None
-    def call_tool(self, tool_name: str, arguments: Dict[str, Any]) -> Dict[str, Any]:
-        """
-        Call a tool on the external MCP service.
-        Args:
-            tool_name: Name of the tool to call
-            arguments: Tool arguments as a dictionary
-        Returns:
-            Tool execution result
-        """
-        try:
-            # Create JSON-RPC request
-            request = {
-                "jsonrpc": "2.0",
-                "id": int(time.time() * 1000),
-                "method": "tools/call",
-                "params": {"name": tool_name, "arguments": arguments},
-            }
-            # Call the MCP service via subprocess
-            result = subprocess.run(
-                self.command,
-                input=json.dumps(request) + "\n",
-                capture_output=True,
-                text=True,
-                env=self.env,
-                timeout=self.timeout,
-            )
-            if result.returncode != 0:
-                logger.error(
-                    f"MCP service error (exit {result.returncode}): {result.stderr}"
-                )
-                return {"error": f"Service failed: {result.stderr or 'Unknown error'}"}
-            # Parse response
-            try:
-                response = json.loads(result.stdout)
-                # Extract result from JSON-RPC response
-                if "result" in response:
-                    return response["result"]
-                elif "error" in response:
-                    return {"error": response["error"].get("message", "Unknown error")}
-                else:
-                    return {"error": "Invalid response format"}
-            except json.JSONDecodeError as e:
-                logger.error(f"Failed to parse MCP response: {e}")
-                logger.debug(f"Raw output: {result.stdout}")
-                return {"error": f"Invalid JSON response: {str(e)}"}
-        except subprocess.TimeoutExpired:
-            logger.error(f"MCP service call timed out after {self.timeout}s")
-            return {"error": f"Request timed out after {self.timeout} seconds"}
-        except Exception as e:
-            logger.error(f"MCP service call failed: {e}")
-            return {"error": str(e)}
-    def list_tools(self) -> List[Dict[str, Any]]:
-        """
-        List available tools from the MCP service.
-        Returns:
-            List of tool definitions
-        """
-        try:
-            request = {"jsonrpc": "2.0", "id": 1, "method": "tools/list", "params": {}}
-            result = subprocess.run(
-                self.command,
-                input=json.dumps(request) + "\n",
-                capture_output=True,
-                text=True,
-                env=self.env,
-                timeout=self.timeout,
-            )
-            if result.returncode == 0:
-                response = json.loads(result.stdout)
-                return response.get("result", {}).get("tools", [])
-        except Exception as e:
-            logger.warning(f"Failed to list tools: {e}")
-        return []
-class Context7Service(ExternalMCPService):
-    """Context7 documentation search service with caching and rate protection.
-    This is an OPTIONAL service - the system works without it.
-    """
-    # Class-level availability tracking (cached after first check)
-    _availability_checked: bool = False
-    _is_available: bool = False
-    def __init__(self, api_key: Optional[str] = None):
-        """Initialize Context7 MCP service.
-        Args:
-            api_key: Optional Context7 API key (defaults to CONTEXT7_API_KEY env var)
-        """
-        # Get API key from parameter or environment
-        api_key = api_key or os.getenv("CONTEXT7_API_KEY")
-        env = {"CONTEXT7_API_KEY": api_key} if api_key else {}
-        super().__init__(command=["npx", "-y", "@upstash/context7-mcp"], env=env)
-        # Use persistent cache instead of session cache
-        from gaia.mcp.context7_cache import Context7Cache, Context7RateLimiter
-        self._cache = Context7Cache()
-        self._rate_limiter = Context7RateLimiter()
-    @classmethod
-    def check_availability(cls) -> bool:
-        """Check if Context7 can be used (npx available, package works).
-        This check is cached after the first call to avoid repeated slow checks.
-        Returns:
-            True if Context7 is available and working, False otherwise
-        """
-        if cls._availability_checked:
-            return cls._is_available
-        cls._availability_checked = True
-        # Check if npx is available
-        try:
-            import shutil
-            if not shutil.which("npx"):
-                logger.info("Context7 unavailable: npx not found in PATH")
-                cls._is_available = False
-                return False
-        except Exception as e:
-            logger.info(f"Context7 unavailable: failed to check for npx: {e}")
-            cls._is_available = False
-            return False
-        # Try a simple operation to verify Context7 works
-        try:
-            service = cls()
-            tools = service.list_tools()
-            cls._is_available = len(tools) > 0
-            if cls._is_available:
-                logger.info(f"Context7 available ({len(tools)} tools found)")
-            else:
-                logger.info("Context7 unavailable: no tools returned from service")
-        except Exception as e:
-            logger.info(f"Context7 unavailable: {type(e).__name__}: {e}")
-            cls._is_available = False
-        return cls._is_available
-    def _get_resolved_library_id(self, library: str) -> Optional[str]:
-        """Resolve a library name to Context7-compatible ID with persistent caching.
-        Args:
-            library: Library name (e.g., "nextjs") or full ID (e.g., "/vercel/next.js")
-        Returns:
-            Resolved library ID or None if resolution failed
-        """
-        # Already a full ID (has /org/project format)
-        if library.count("/") >= 2:
-            return library if library.startswith("/") else f"/{library}"
-        # Check persistent cache first
-        cached = self._cache.get_library_id(library)
-        if cached is not None:
-            logger.debug(f"Cache hit for library ID: {library} -> {cached}")
-            return cached
-        # Rate limit check before API call
-        can_proceed, reason = self._rate_limiter.can_make_request()
-        if not can_proceed:
-            logger.warning(f"Context7 rate limited: {reason}")
-            return None
-        # Resolve via API
-        logger.info(f"Resolving library ID for '{library}' via Context7 API")
-        self._rate_limiter.consume_token()
-        resolved_id = self.resolve_library_id(library)
-        # Record success/failure for circuit breaker
-        if resolved_id:
-            self._rate_limiter.record_success()
-            logger.info(f"Resolved '{library}' to '{resolved_id}'")
-        else:
-            self._rate_limiter.record_failure()
-            logger.warning(f"Could not resolve library ID for '{library}'")
-        # Cache result (even None to avoid repeated failures)
-        self._cache.set_library_id(library, resolved_id)
-        return resolved_id
-    def search_documentation(
-        self, query: str, library: Optional[str] = None
-    ) -> Dict[str, Any]:
-        """Search documentation using Context7 with caching and rate protection.
-        Args:
-            query: Search query (e.g., "how to use useState")
-            library: Optional library name to search in (e.g., "react")
-        Returns:
-            Documentation search results with code examples and references
-        """
-        # Check availability first (cached after first check)
-        if not self.check_availability():
-            return {
-                "success": False,
-                "documentation": "",
-                "error": "Context7 not available - use embedded knowledge",
-                "unavailable": True,  # Signal to LLM to use embedded patterns
-            }
-        # Resolve library ID first
-        resolved_id = None
-        if library:
-            resolved_id = self._get_resolved_library_id(library)
-            if not resolved_id:
-                logger.warning(f"Could not resolve library '{library}'")
-        # Check documentation cache
-        cache_key_lib = resolved_id or "global"
-        cached_docs = self._cache.get_documentation(cache_key_lib, query)
-        if cached_docs:
-            logger.info(f"Cache hit for documentation: {cache_key_lib}:{query[:30]}...")
-            return {
-                "success": True,
-                "documentation": cached_docs,
-                "cached": True,
-            }
-        # Rate limit check before API call
-        can_proceed, reason = self._rate_limiter.can_make_request()
-        if not can_proceed:
-            logger.warning(f"Context7 rate limited: {reason}")
-            return {
-                "success": False,
-                "error": reason,
-                "documentation": "",
-            }
-        # Make API call
-        self._rate_limiter.consume_token()
-        arguments = {"topic": query}
-        if resolved_id:
-            arguments["context7CompatibleLibraryID"] = resolved_id
-        result = self.call_tool("get-library-docs", arguments)
-        if "error" in result:
-            # Check if it's a rate limit error (HTTP 429)
-            is_rate_limit = "429" in str(result.get("error", ""))
-            self._rate_limiter.record_failure(is_rate_limit)
-            logger.error(f"Context7 search failed: {result['error']}")
-            return {
-                "success": False,
-                "error": result["error"],
-                "documentation": "",
-            }
-        # Success - cache and return
-        self._rate_limiter.record_success()
-        docs = (
-            result.get("content", [{}])[0].get("text", "")
-            if result.get("content")
-            else ""
-        )
-        self._cache.set_documentation(cache_key_lib, query, docs)
-        return {
-            "success": True,
-            "documentation": docs,
-            "cached": False,
-            "raw_result": result,
-        }
-    def resolve_library_id(self, library_name: str) -> Optional[str]:
-        """
-        Resolve a library name to Context7-compatible library ID.
-        Args:
-            library_name: Library name (e.g., "react", "tensorflow")
-        Returns:
-            Context7-compatible library ID (e.g., "/facebook/react") or None
-        """
-        result = self.call_tool("resolve-library-id", {"libraryName": library_name})
-        if "error" in result:
-            logger.warning(f"Failed to resolve library ID: {result['error']}")
-            return None
-        # Extract library ID from response
-        content = result.get("content", [])
-        if not content or len(content) == 0:
-            logger.warning("Empty content in Context7 response")
-            return None
-        text = content[0].get("text", "")
-        logger.debug(f"Context7 resolve-library-id response text:\n{text[:800]}")
-        import re
-        # Parse ALL libraries from response (separated by ----------)
-        # Multiple libraries may have the same title - need smart selection
-        libraries = []
-        blocks = text.split("----------")
-        for block in blocks:
-            if not block.strip():
-                continue
-            title_match = re.search(r"Title:\s*(.+)", block)
-            id_match = re.search(
-                r"Context7-compatible library ID:\s*(/[\w.-]+/[\w.-]+(?:/[\w.-]+)?)",
-                block,
-            )
-            score_match = re.search(r"Benchmark Score:\s*([\d.]+)", block)
-            versions_match = re.search(r"Versions:\s*(.+)", block)
-            if id_match:
-                libraries.append(
-                    {
-                        "title": title_match.group(1).strip() if title_match else "",
-                        "id": id_match.group(1),
-                        "score": float(score_match.group(1)) if score_match else 0,
-                        "has_versions": versions_match is not None,
-                    }
-                )
-        if not libraries:
-            logger.warning(f"No library IDs found in response for '{library_name}'")
-            return None
-        # Selection strategy (in order of priority):
-        # 1. Exact title match that has versions (indicates official repo)
-        # 2. Exact title match with highest score
-        # 3. Title contains search term, prefer ones with versions
-        # 4. Highest benchmark score overall
-        # Normalize for comparison (remove dots, spaces, dashes)
-        def normalize(s):
-            return s.lower().replace(".", "").replace("-", "").replace(" ", "")
-        normalized_search = normalize(library_name)
-        # Find exact matches (after normalization)
-        exact_matches = [
-            lib for lib in libraries if normalize(lib["title"]) == normalized_search
-        ]
-        if exact_matches:
-            # Prefer ones with versions (usually the official repo)
-            versioned = [lib for lib in exact_matches if lib["has_versions"]]
-            if versioned:
-                best = max(versioned, key=lambda x: x["score"])
-                logger.info(
-                    f"Resolved '{library_name}' to '{best['id']}' (exact match with versions, score={best['score']})"
-                )
-                return best["id"]
-            # No versions, pick highest score
-            best = max(exact_matches, key=lambda x: x["score"])
-            logger.info(
-                f"Resolved '{library_name}' to '{best['id']}' (exact match, score={best['score']})"
-            )
-            return best["id"]
-        # No exact match - look for title containing search term
-        partial_matches = [
-            lib for lib in libraries if normalized_search in normalize(lib["title"])
-        ]
-        if partial_matches:
-            versioned = [lib for lib in partial_matches if lib["has_versions"]]
-            if versioned:
-                best = max(versioned, key=lambda x: x["score"])
-                logger.info(
-                    f"Resolved '{library_name}' to '{best['id']}' (partial match with versions, score={best['score']})"
-                )
-                return best["id"]
-            best = max(partial_matches, key=lambda x: x["score"])
-            logger.info(
-                f"Resolved '{library_name}' to '{best['id']}' (partial match, score={best['score']})"
-            )
-            return best["id"]
-        # Fallback: highest score overall
-        best = max(libraries, key=lambda x: x["score"])
-        logger.info(
-            f"Resolved '{library_name}' to '{best['id']}' (fallback: highest score={best['score']})"
-        )
-        return best["id"]
-class PerplexityService(ExternalMCPService):
-    """Perplexity web search service."""
-    def __init__(self, api_key: Optional[str] = None):
-        """
-        Initialize Perplexity MCP service.
-        Args:
-            api_key: Perplexity API key (defaults to PERPLEXITY_API_KEY env var)
-        """
-        api_key = api_key or os.getenv("PERPLEXITY_API_KEY")
-        if not api_key:
-            logger.warning(
-                "PERPLEXITY_API_KEY not set - web search will not be available"
-            )
-        super().__init__(
-            command=["npx", "-y", "server-perplexity-ask"],
-            env={"PERPLEXITY_API_KEY": api_key} if api_key else {},
-        )
-    def search_web(self, query: str) -> Dict[str, Any]:
-        """
-        Search the web using Perplexity.
-        Args:
-            query: Search query
-        Returns:
-            Web search results with answer and sources
-        """
-        result = self.call_tool(
-            "perplexity_ask", {"messages": [{"role": "user", "content": query}]}
-        )
-        if "error" in result:
-            logger.error(f"Perplexity search failed: {result['error']}")
-            return {"success": False, "error": result["error"], "answer": ""}
-        # Extract answer from response
-        content = result.get("content", [])
-        answer = ""
-        if content and len(content) > 0:
-            answer = content[0].get("text", "")
-        return {"success": True, "answer": answer, "raw_result": result}
-# Singleton instances for reuse
-_context7_service: Optional[Context7Service] = None
-_perplexity_service: Optional[PerplexityService] = None
-def get_context7_service() -> Context7Service:
-    """Get or create Context7 service singleton."""
-    global _context7_service
-    if _context7_service is None:
-        _context7_service = Context7Service()
-    return _context7_service
-def get_perplexity_service() -> PerplexityService:
-    """Get or create Perplexity service singleton."""
-    global _perplexity_service
-    if _perplexity_service is None:
-        _perplexity_service = PerplexityService()
-    return _perplexity_service
+#!/usr/bin/env python
+#
+# Copyright(C) 2024-2025 Advanced Micro Devices, Inc. All rights reserved.
+# SPDX-License-Identifier: MIT
+"""
+External MCP Services Integration
+Provides wrappers for external MCP services like Context7 and Perplexity
+that run as separate processes via npx commands.
+"""
+import json
+import os
+import subprocess
+import time
+from typing import Any, Dict, List, Optional
+from gaia.logger import get_logger
+logger = get_logger(__name__)
+class ExternalMCPService:
+    """Base class for managing external MCP services via subprocess."""
+    def __init__(
+        self,
+        command: List[str],
+        env: Optional[Dict[str, str]] = None,
+        timeout: int = 30,
+    ):
+        """
+        Initialize external MCP service.
+        Args:
+            command: Command to start the MCP service (e.g., ["npx", "-y", "package"])
+            env: Additional environment variables
+            timeout: Timeout in seconds for subprocess calls
+        """
+        self.command = command
+        self.env = {**os.environ.copy(), **(env or {})}
+        self.timeout = timeout
+        self.process = None
+    def call_tool(self, tool_name: str, arguments: Dict[str, Any]) -> Dict[str, Any]:
+        """
+        Call a tool on the external MCP service.
+        Args:
+            tool_name: Name of the tool to call
+            arguments: Tool arguments as a dictionary
+        Returns:
+            Tool execution result
+        """
+        try:
+            # Create JSON-RPC request
+            request = {
+                "jsonrpc": "2.0",
+                "id": int(time.time() * 1000),
+                "method": "tools/call",
+                "params": {"name": tool_name, "arguments": arguments},
+            }
+            # Call the MCP service via subprocess
+            result = subprocess.run(
+                self.command,
+                input=json.dumps(request) + "\n",
+                capture_output=True,
+                text=True,
+                env=self.env,
+                timeout=self.timeout,
+            )
+            if result.returncode != 0:
+                logger.error(
+                    f"MCP service error (exit {result.returncode}): {result.stderr}"
+                )
+                return {"error": f"Service failed: {result.stderr or 'Unknown error'}"}
+            # Parse response
+            try:
+                response = json.loads(result.stdout)
+                # Extract result from JSON-RPC response
+                if "result" in response:
+                    return response["result"]
+                elif "error" in response:
+                    return {"error": response["error"].get("message", "Unknown error")}
+                else:
+                    return {"error": "Invalid response format"}
+            except json.JSONDecodeError as e:
+                logger.error(f"Failed to parse MCP response: {e}")
+                logger.debug(f"Raw output: {result.stdout}")
+                return {"error": f"Invalid JSON response: {str(e)}"}
+        except subprocess.TimeoutExpired:
+            logger.error(f"MCP service call timed out after {self.timeout}s")
+            return {"error": f"Request timed out after {self.timeout} seconds"}
+        except Exception as e:
+            logger.error(f"MCP service call failed: {e}")
+            return {"error": str(e)}
+    def list_tools(self) -> List[Dict[str, Any]]:
+        """
+        List available tools from the MCP service.
+        Returns:
+            List of tool definitions
+        """
+        try:
+            request = {"jsonrpc": "2.0", "id": 1, "method": "tools/list", "params": {}}
+            result = subprocess.run(
+                self.command,
+                input=json.dumps(request) + "\n",
+                capture_output=True,
+                text=True,
+                env=self.env,
+                timeout=self.timeout,
+            )
+            if result.returncode == 0:
+                response = json.loads(result.stdout)
+                return response.get("result", {}).get("tools", [])
+        except Exception as e:
+            logger.warning(f"Failed to list tools: {e}")
+        return []
+class Context7Service(ExternalMCPService):
+    """Context7 documentation search service with caching and rate protection.
+    This is an OPTIONAL service - the system works without it.
+    """
+    # Class-level availability tracking (cached after first check)
+    _availability_checked: bool = False
+    _is_available: bool = False
+    def __init__(self, api_key: Optional[str] = None):
+        """Initialize Context7 MCP service.
+        Args:
+            api_key: Optional Context7 API key (defaults to CONTEXT7_API_KEY env var)
+        """
+        # Get API key from parameter or environment
+        api_key = api_key or os.getenv("CONTEXT7_API_KEY")
+        env = {"CONTEXT7_API_KEY": api_key} if api_key else {}
+        super().__init__(command=["npx", "-y", "@upstash/context7-mcp"], env=env)
+        # Use persistent cache instead of session cache
+        from gaia.mcp.context7_cache import Context7Cache, Context7RateLimiter
+        self._cache = Context7Cache()
+        self._rate_limiter = Context7RateLimiter()
+    @classmethod
+    def check_availability(cls) -> bool:
+        """Check if Context7 can be used (npx available, package works).
+        This check is cached after the first call to avoid repeated slow checks.
+        Returns:
+            True if Context7 is available and working, False otherwise
+        """
+        if cls._availability_checked:
+            return cls._is_available
+        cls._availability_checked = True
+        # Check if npx is available
+        try:
+            import shutil
+            if not shutil.which("npx"):
+                logger.info("Context7 unavailable: npx not found in PATH")
+                cls._is_available = False
+                return False
+        except Exception as e:
+            logger.info(f"Context7 unavailable: failed to check for npx: {e}")
+            cls._is_available = False
+            return False
+        # Try a simple operation to verify Context7 works
+        try:
+            service = cls()
+            tools = service.list_tools()
+            cls._is_available = len(tools) > 0
+            if cls._is_available:
+                logger.info(f"Context7 available ({len(tools)} tools found)")
+            else:
+                logger.info("Context7 unavailable: no tools returned from service")
+        except Exception as e:
+            logger.info(f"Context7 unavailable: {type(e).__name__}: {e}")
+            cls._is_available = False
+        return cls._is_available
+    def _get_resolved_library_id(self, library: str) -> Optional[str]:
+        """Resolve a library name to Context7-compatible ID with persistent caching.
+        Args:
+            library: Library name (e.g., "nextjs") or full ID (e.g., "/vercel/next.js")
+        Returns:
+            Resolved library ID or None if resolution failed
+        """
+        # Already a full ID (has /org/project format)
+        if library.count("/") >= 2:
+            return library if library.startswith("/") else f"/{library}"
+        # Check persistent cache first
+        cached = self._cache.get_library_id(library)
+        if cached is not None:
+            logger.debug(f"Cache hit for library ID: {library} -> {cached}")
+            return cached
+        # Rate limit check before API call
+        can_proceed, reason = self._rate_limiter.can_make_request()
+        if not can_proceed:
+            logger.warning(f"Context7 rate limited: {reason}")
+            return None
+        # Resolve via API
+        logger.info(f"Resolving library ID for '{library}' via Context7 API")
+        self._rate_limiter.consume_token()
+        resolved_id = self.resolve_library_id(library)
+        # Record success/failure for circuit breaker
+        if resolved_id:
+            self._rate_limiter.record_success()
+            logger.info(f"Resolved '{library}' to '{resolved_id}'")
+        else:
+            self._rate_limiter.record_failure()
+            logger.warning(f"Could not resolve library ID for '{library}'")
+        # Cache result (even None to avoid repeated failures)
+        self._cache.set_library_id(library, resolved_id)
+        return resolved_id
+    def search_documentation(
+        self, query: str, library: Optional[str] = None
+    ) -> Dict[str, Any]:
+        """Search documentation using Context7 with caching and rate protection.
+        Args:
+            query: Search query (e.g., "how to use useState")
+            library: Optional library name to search in (e.g., "react")
+        Returns:
+            Documentation search results with code examples and references
+        """
+        # Check availability first (cached after first check)
+        if not self.check_availability():
+            return {
+                "success": False,
+                "documentation": "",
+                "error": "Context7 not available - use embedded knowledge",
+                "unavailable": True,  # Signal to LLM to use embedded patterns
+            }
+        # Resolve library ID first
+        resolved_id = None
+        if library:
+            resolved_id = self._get_resolved_library_id(library)
+            if not resolved_id:
+                logger.warning(f"Could not resolve library '{library}'")
+        # Check documentation cache
+        cache_key_lib = resolved_id or "global"
+        cached_docs = self._cache.get_documentation(cache_key_lib, query)
+        if cached_docs:
+            logger.info(f"Cache hit for documentation: {cache_key_lib}:{query[:30]}...")
+            return {
+                "success": True,
+                "documentation": cached_docs,
+                "cached": True,
+            }
+        # Rate limit check before API call
+        can_proceed, reason = self._rate_limiter.can_make_request()
+        if not can_proceed:
+            logger.warning(f"Context7 rate limited: {reason}")
+            return {
+                "success": False,
+                "error": reason,
+                "documentation": "",
+            }
+        # Make API call
+        self._rate_limiter.consume_token()
+        arguments = {"topic": query}
+        if resolved_id:
+            arguments["context7CompatibleLibraryID"] = resolved_id
+        result = self.call_tool("get-library-docs", arguments)
+        if "error" in result:
+            # Check if it's a rate limit error (HTTP 429)
+            is_rate_limit = "429" in str(result.get("error", ""))
+            self._rate_limiter.record_failure(is_rate_limit)
+            logger.error(f"Context7 search failed: {result['error']}")
+            return {
+                "success": False,
+                "error": result["error"],
+                "documentation": "",
+            }
+        # Success - cache and return
+        self._rate_limiter.record_success()
+        docs = (
+            result.get("content", [{}])[0].get("text", "")
+            if result.get("content")
+            else ""
+        )
+        self._cache.set_documentation(cache_key_lib, query, docs)
+        return {
+            "success": True,
+            "documentation": docs,
+            "cached": False,
+            "raw_result": result,
+        }
+    def resolve_library_id(self, library_name: str) -> Optional[str]:
+        """
+        Resolve a library name to Context7-compatible library ID.
+        Args:
+            library_name: Library name (e.g., "react", "tensorflow")
+        Returns:
+            Context7-compatible library ID (e.g., "/facebook/react") or None
+        """
+        result = self.call_tool("resolve-library-id", {"libraryName": library_name})
+        if "error" in result:
+            logger.warning(f"Failed to resolve library ID: {result['error']}")
+            return None
+        # Extract library ID from response
+        content = result.get("content", [])
+        if not content or len(content) == 0:
+            logger.warning("Empty content in Context7 response")
+            return None
+        text = content[0].get("text", "")
+        logger.debug(f"Context7 resolve-library-id response text:\n{text[:800]}")
+        import re
+        # Parse ALL libraries from response (separated by ----------)
+        # Multiple libraries may have the same title - need smart selection
+        libraries = []
+        blocks = text.split("----------")
+        for block in blocks:
+            if not block.strip():
+                continue
+            title_match = re.search(r"Title:\s*(.+)", block)
+            id_match = re.search(
+                r"Context7-compatible library ID:\s*(/[\w.-]+/[\w.-]+(?:/[\w.-]+)?)",
+                block,
+            )
+            score_match = re.search(r"Benchmark Score:\s*([\d.]+)", block)
+            versions_match = re.search(r"Versions:\s*(.+)", block)
+            if id_match:
+                libraries.append(
+                    {
+                        "title": title_match.group(1).strip() if title_match else "",
+                        "id": id_match.group(1),
+                        "score": float(score_match.group(1)) if score_match else 0,
+                        "has_versions": versions_match is not None,
+                    }
+                )
+        if not libraries:
+            logger.warning(f"No library IDs found in response for '{library_name}'")
+            return None
+        # Selection strategy (in order of priority):
+        # 1. Exact title match that has versions (indicates official repo)
+        # 2. Exact title match with highest score
+        # 3. Title contains search term, prefer ones with versions
+        # 4. Highest benchmark score overall
+        # Normalize for comparison (remove dots, spaces, dashes)
+        def normalize(s):
+            return s.lower().replace(".", "").replace("-", "").replace(" ", "")
+        normalized_search = normalize(library_name)
+        # Find exact matches (after normalization)
+        exact_matches = [
+            lib for lib in libraries if normalize(lib["title"]) == normalized_search
+        ]
+        if exact_matches:
+            # Prefer ones with versions (usually the official repo)
+            versioned = [lib for lib in exact_matches if lib["has_versions"]]
+            if versioned:
+                best = max(versioned, key=lambda x: x["score"])
+                logger.info(
+                    f"Resolved '{library_name}' to '{best['id']}' (exact match with versions, score={best['score']})"
+                )
+                return best["id"]
+            # No versions, pick highest score
+            best = max(exact_matches, key=lambda x: x["score"])
+            logger.info(
+                f"Resolved '{library_name}' to '{best['id']}' (exact match, score={best['score']})"
+            )
+            return best["id"]
+        # No exact match - look for title containing search term
+        partial_matches = [
+            lib for lib in libraries if normalized_search in normalize(lib["title"])
+        ]
+        if partial_matches:
+            versioned = [lib for lib in partial_matches if lib["has_versions"]]
+            if versioned:
+                best = max(versioned, key=lambda x: x["score"])
+                logger.info(
+                    f"Resolved '{library_name}' to '{best['id']}' (partial match with versions, score={best['score']})"
+                )
+                return best["id"]
+            best = max(partial_matches, key=lambda x: x["score"])
+            logger.info(
+                f"Resolved '{library_name}' to '{best['id']}' (partial match, score={best['score']})"
+            )
+            return best["id"]
+        # Fallback: highest score overall
+        best = max(libraries, key=lambda x: x["score"])
+        logger.info(
+            f"Resolved '{library_name}' to '{best['id']}' (fallback: highest score={best['score']})"
+        )
+        return best["id"]
+class PerplexityService(ExternalMCPService):
+    """Perplexity web search service."""
+    def __init__(self, api_key: Optional[str] = None):
+        """
+        Initialize Perplexity MCP service.
+        Args:
+            api_key: Perplexity API key (defaults to PERPLEXITY_API_KEY env var)
+        """
+        api_key = api_key or os.getenv("PERPLEXITY_API_KEY")
+        if not api_key:
+            logger.warning(
+                "PERPLEXITY_API_KEY not set - web search will not be available"
+            )
+        super().__init__(
+            command=["npx", "-y", "server-perplexity-ask"],
+            env={"PERPLEXITY_API_KEY": api_key} if api_key else {},
+        )
+    def search_web(self, query: str) -> Dict[str, Any]:
+        """
+        Search the web using Perplexity.
+        Args:
+            query: Search query
+        Returns:
+            Web search results with answer and sources
+        """
+        result = self.call_tool(
+            "perplexity_ask", {"messages": [{"role": "user", "content": query}]}
+        )
+        if "error" in result:
+            logger.error(f"Perplexity search failed: {result['error']}")
+            return {"success": False, "error": result["error"], "answer": ""}
+        # Extract answer from response
+        content = result.get("content", [])
+        answer = ""
+        if content and len(content) > 0:
+            answer = content[0].get("text", "")
+        return {"success": True, "answer": answer, "raw_result": result}
+# Singleton instances for reuse.
+# Both start as None and are created on first use by get_context7_service()
+# and get_perplexity_service() respectively.
+_context7_service: Optional[Context7Service] = None
+_perplexity_service: Optional[PerplexityService] = None
+def get_context7_service() -> Context7Service:
+    """Get or create Context7 service singleton."""
+    global _context7_service
+    if _context7_service is None:
+        _context7_service = Context7Service()
+    return _context7_service
+def get_perplexity_service() -> PerplexityService:
+    """Get or create Perplexity service singleton."""
+    global _perplexity_service
+    if _perplexity_service is None:
+        _perplexity_service = PerplexityService()
+    return _perplexity_service

amd-gaia 0.14.3__py3-none-any.whl → 0.15.1__py3-none-any.whl

amd-gaia 0.14.3py3-none-any.whl → 0.15.1py3-none-any.whl