PyPI - amd-gaia - Versions diffs - 0.15.0__py3-none-any.whl → 0.15.2__py3-none-any.whl - Mend

amd-gaia 0.15.0__py3-none-any.whl → 0.15.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (185) hide show

{amd_gaia-0.15.0.dist-info → amd_gaia-0.15.2.dist-info}/METADATA +222 -223
amd_gaia-0.15.2.dist-info/RECORD +182 -0
{amd_gaia-0.15.0.dist-info → amd_gaia-0.15.2.dist-info}/WHEEL +1 -1
{amd_gaia-0.15.0.dist-info → amd_gaia-0.15.2.dist-info}/entry_points.txt +1 -0
{amd_gaia-0.15.0.dist-info → amd_gaia-0.15.2.dist-info}/licenses/LICENSE.md +20 -20
gaia/__init__.py +29 -29
gaia/agents/__init__.py +19 -19
gaia/agents/base/__init__.py +9 -9
gaia/agents/base/agent.py +2132 -2177
gaia/agents/base/api_agent.py +119 -120
gaia/agents/base/console.py +1967 -1841
gaia/agents/base/errors.py +237 -237
gaia/agents/base/mcp_agent.py +86 -86
gaia/agents/base/tools.py +88 -83
gaia/agents/blender/__init__.py +7 -0
gaia/agents/blender/agent.py +553 -556
gaia/agents/blender/agent_simple.py +133 -135
gaia/agents/blender/app.py +211 -211
gaia/agents/blender/app_simple.py +41 -41
gaia/agents/blender/core/__init__.py +16 -16
gaia/agents/blender/core/materials.py +506 -506
gaia/agents/blender/core/objects.py +316 -316
gaia/agents/blender/core/rendering.py +225 -225
gaia/agents/blender/core/scene.py +220 -220
gaia/agents/blender/core/view.py +146 -146
gaia/agents/chat/__init__.py +9 -9
gaia/agents/chat/agent.py +809 -835
gaia/agents/chat/app.py +1065 -1058
gaia/agents/chat/session.py +508 -508
gaia/agents/chat/tools/__init__.py +15 -15
gaia/agents/chat/tools/file_tools.py +96 -96
gaia/agents/chat/tools/rag_tools.py +1744 -1729
gaia/agents/chat/tools/shell_tools.py +437 -436
gaia/agents/code/__init__.py +7 -7
gaia/agents/code/agent.py +549 -549
gaia/agents/code/cli.py +377 -0
gaia/agents/code/models.py +135 -135
gaia/agents/code/orchestration/__init__.py +24 -24
gaia/agents/code/orchestration/checklist_executor.py +1763 -1763
gaia/agents/code/orchestration/checklist_generator.py +713 -713
gaia/agents/code/orchestration/factories/__init__.py +9 -9
gaia/agents/code/orchestration/factories/base.py +63 -63
gaia/agents/code/orchestration/factories/nextjs_factory.py +118 -118
gaia/agents/code/orchestration/factories/python_factory.py +106 -106
gaia/agents/code/orchestration/orchestrator.py +841 -841
gaia/agents/code/orchestration/project_analyzer.py +391 -391
gaia/agents/code/orchestration/steps/__init__.py +67 -67
gaia/agents/code/orchestration/steps/base.py +188 -188
gaia/agents/code/orchestration/steps/error_handler.py +314 -314
gaia/agents/code/orchestration/steps/nextjs.py +828 -828
gaia/agents/code/orchestration/steps/python.py +307 -307
gaia/agents/code/orchestration/template_catalog.py +469 -469
gaia/agents/code/orchestration/workflows/__init__.py +14 -14
gaia/agents/code/orchestration/workflows/base.py +80 -80
gaia/agents/code/orchestration/workflows/nextjs.py +186 -186
gaia/agents/code/orchestration/workflows/python.py +94 -94
gaia/agents/code/prompts/__init__.py +11 -11
gaia/agents/code/prompts/base_prompt.py +77 -77
gaia/agents/code/prompts/code_patterns.py +2034 -2036
gaia/agents/code/prompts/nextjs_prompt.py +40 -40
gaia/agents/code/prompts/python_prompt.py +109 -109
gaia/agents/code/schema_inference.py +365 -365
gaia/agents/code/system_prompt.py +41 -41
gaia/agents/code/tools/__init__.py +42 -42
gaia/agents/code/tools/cli_tools.py +1138 -1138
gaia/agents/code/tools/code_formatting.py +319 -319
gaia/agents/code/tools/code_tools.py +769 -769
gaia/agents/code/tools/error_fixing.py +1347 -1347
gaia/agents/code/tools/external_tools.py +180 -180
gaia/agents/code/tools/file_io.py +845 -845
gaia/agents/code/tools/prisma_tools.py +190 -190
gaia/agents/code/tools/project_management.py +1016 -1016
gaia/agents/code/tools/testing.py +321 -321
gaia/agents/code/tools/typescript_tools.py +122 -122
gaia/agents/code/tools/validation_parsing.py +461 -461
gaia/agents/code/tools/validation_tools.py +806 -806
gaia/agents/code/tools/web_dev_tools.py +1758 -1758
gaia/agents/code/validators/__init__.py +16 -16
gaia/agents/code/validators/antipattern_checker.py +241 -241
gaia/agents/code/validators/ast_analyzer.py +197 -197
gaia/agents/code/validators/requirements_validator.py +145 -145
gaia/agents/code/validators/syntax_validator.py +171 -171
gaia/agents/docker/__init__.py +7 -7
gaia/agents/docker/agent.py +643 -642
gaia/agents/emr/__init__.py +8 -8
gaia/agents/emr/agent.py +1504 -1506
gaia/agents/emr/cli.py +1322 -1322
gaia/agents/emr/constants.py +475 -475
gaia/agents/emr/dashboard/__init__.py +4 -4
gaia/agents/emr/dashboard/server.py +1972 -1974
gaia/agents/jira/__init__.py +11 -11
gaia/agents/jira/agent.py +894 -894
gaia/agents/jira/jql_templates.py +299 -299
gaia/agents/routing/__init__.py +7 -7
gaia/agents/routing/agent.py +567 -570
gaia/agents/routing/system_prompt.py +75 -75
gaia/agents/summarize/__init__.py +11 -0
gaia/agents/summarize/agent.py +885 -0
gaia/agents/summarize/prompts.py +129 -0
gaia/api/__init__.py +23 -23
gaia/api/agent_registry.py +238 -238
gaia/api/app.py +305 -305
gaia/api/openai_server.py +575 -575
gaia/api/schemas.py +186 -186
gaia/api/sse_handler.py +373 -373
gaia/apps/__init__.py +4 -4
gaia/apps/llm/__init__.py +6 -6
gaia/apps/llm/app.py +184 -169
gaia/apps/summarize/app.py +116 -633
gaia/apps/summarize/html_viewer.py +133 -133
gaia/apps/summarize/pdf_formatter.py +284 -284
gaia/audio/__init__.py +2 -2
gaia/audio/audio_client.py +439 -439
gaia/audio/audio_recorder.py +269 -269
gaia/audio/kokoro_tts.py +599 -599
gaia/audio/whisper_asr.py +432 -432
gaia/chat/__init__.py +16 -16
gaia/chat/app.py +428 -430
gaia/chat/prompts.py +522 -522
gaia/chat/sdk.py +1228 -1225
gaia/cli.py +5659 -5632
gaia/database/__init__.py +10 -10
gaia/database/agent.py +176 -176
gaia/database/mixin.py +290 -290
gaia/database/testing.py +64 -64
gaia/eval/batch_experiment.py +2332 -2332
gaia/eval/claude.py +542 -542
gaia/eval/config.py +37 -37
gaia/eval/email_generator.py +512 -512
gaia/eval/eval.py +3179 -3179
gaia/eval/groundtruth.py +1130 -1130
gaia/eval/transcript_generator.py +582 -582
gaia/eval/webapp/README.md +167 -167
gaia/eval/webapp/package-lock.json +875 -875
gaia/eval/webapp/package.json +20 -20
gaia/eval/webapp/public/app.js +3402 -3402
gaia/eval/webapp/public/index.html +87 -87
gaia/eval/webapp/public/styles.css +3661 -3661
gaia/eval/webapp/server.js +415 -415
gaia/eval/webapp/test-setup.js +72 -72
gaia/installer/__init__.py +23 -0
gaia/installer/init_command.py +1275 -0
gaia/installer/lemonade_installer.py +619 -0
gaia/llm/__init__.py +10 -2
gaia/llm/base_client.py +60 -0
gaia/llm/exceptions.py +12 -0
gaia/llm/factory.py +70 -0
gaia/llm/lemonade_client.py +3421 -3221
gaia/llm/lemonade_manager.py +294 -294
gaia/llm/providers/__init__.py +9 -0
gaia/llm/providers/claude.py +108 -0
gaia/llm/providers/lemonade.py +118 -0
gaia/llm/providers/openai_provider.py +79 -0
gaia/llm/vlm_client.py +382 -382
gaia/logger.py +189 -189
gaia/mcp/agent_mcp_server.py +245 -245
gaia/mcp/blender_mcp_client.py +138 -138
gaia/mcp/blender_mcp_server.py +648 -648
gaia/mcp/context7_cache.py +332 -332
gaia/mcp/external_services.py +518 -518
gaia/mcp/mcp_bridge.py +811 -550
gaia/mcp/servers/__init__.py +6 -6
gaia/mcp/servers/docker_mcp.py +83 -83
gaia/perf_analysis.py +361 -0
gaia/rag/__init__.py +10 -10
gaia/rag/app.py +293 -293
gaia/rag/demo.py +304 -304
gaia/rag/pdf_utils.py +235 -235
gaia/rag/sdk.py +2194 -2194
gaia/security.py +183 -163
gaia/talk/app.py +287 -289
gaia/talk/sdk.py +538 -538
gaia/testing/__init__.py +87 -87
gaia/testing/assertions.py +330 -330
gaia/testing/fixtures.py +333 -333
gaia/testing/mocks.py +493 -493
gaia/util.py +46 -46
gaia/utils/__init__.py +33 -33
gaia/utils/file_watcher.py +675 -675
gaia/utils/parsing.py +223 -223
gaia/version.py +100 -100
amd_gaia-0.15.0.dist-info/RECORD +0 -168
gaia/agents/code/app.py +0 -266
gaia/llm/llm_client.py +0 -723
{amd_gaia-0.15.0.dist-info → amd_gaia-0.15.2.dist-info}/top_level.txt +0 -0

gaia/testing/mocks.py CHANGED Viewed

@@ -1,493 +1,493 @@
-# Copyright(C) 2025-2026 Advanced Micro Devices, Inc. All rights reserved.
-# SPDX-License-Identifier: MIT
-"""Mock providers for testing GAIA agents without real LLM/VLM services."""
-import logging
-import time
-from typing import Any, Dict, Iterator, List, Optional
-logger = logging.getLogger(__name__)
-class MockLLMProvider:
-    """
-    Mock LLM provider for testing agents without real API calls.
-    Returns pre-configured responses instead of calling a real LLM.
-    Tracks all calls for test assertions.
-    Example:
-        from gaia.testing import MockLLMProvider
-        mock_llm = MockLLMProvider(responses=["First response", "Second response"])
-        # Use in tests
-        result = mock_llm.generate("Test prompt")
-        assert result == "First response"
-        result = mock_llm.generate("Another prompt")
-        assert result == "Second response"
-        # Check call history
-        assert len(mock_llm.call_history) == 2
-        assert mock_llm.call_history[0]["prompt"] == "Test prompt"
-    """
-    def __init__(
-        self,
-        responses: Optional[List[str]] = None,
-        tool_responses: Optional[Dict[str, Any]] = None,
-        default_response: str = "Mock LLM response",
-    ):
-        """
-        Initialize mock LLM provider.
-        Args:
-            responses: List of responses to return in sequence.
-                      Cycles back to first if more calls than responses.
-            tool_responses: Dict mapping tool names to their mock results.
-                           Used when simulating tool calls.
-            default_response: Response when responses list is exhausted or empty.
-        """
-        self.responses = responses or []
-        self.tool_responses = tool_responses or {}
-        self.default_response = default_response
-        self.call_history: List[Dict[str, Any]] = []
-        self._response_index = 0
-    def generate(
-        self,
-        prompt: str,
-        system_prompt: Optional[str] = None,
-        temperature: float = 0.7,
-        max_tokens: Optional[int] = None,
-        **kwargs,
-    ) -> str:
-        """
-        Generate mock response.
-        Args:
-            prompt: Input prompt (recorded but not processed)
-            system_prompt: System prompt (recorded)
-            temperature: Temperature setting (recorded)
-            max_tokens: Max tokens (recorded)
-            **kwargs: Additional parameters (recorded)
-        Returns:
-            Next response from response list, or default_response
-        """
-        self.call_history.append(
-            {
-                "method": "generate",
-                "prompt": prompt,
-                "system_prompt": system_prompt,
-                "temperature": temperature,
-                "max_tokens": max_tokens,
-                "kwargs": kwargs,
-                "timestamp": time.time(),
-            }
-        )
-        if self.responses:
-            response = self.responses[self._response_index % len(self.responses)]
-            self._response_index += 1
-            return response
-        return self.default_response
-    def chat(
-        self,
-        messages: List[Dict[str, str]],
-        **kwargs,
-    ) -> str:
-        """
-        Mock chat completion (messages format).
-        Args:
-            messages: List of message dicts with 'role' and 'content'
-            **kwargs: Additional parameters
-        Returns:
-            Next response from response list
-        """
-        # Extract the last user message as the prompt
-        prompt = ""
-        for msg in reversed(messages):
-            if msg.get("role") == "user":
-                prompt = msg.get("content", "")
-                break
-        self.call_history.append(
-            {
-                "method": "chat",
-                "messages": messages,
-                "prompt": prompt,
-                "kwargs": kwargs,
-                "timestamp": time.time(),
-            }
-        )
-        if self.responses:
-            response = self.responses[self._response_index % len(self.responses)]
-            self._response_index += 1
-            return response
-        return self.default_response
-    def stream(
-        self,
-        prompt: str,
-        **kwargs,
-    ) -> Iterator[str]:
-        """
-        Mock streaming response.
-        Yields the full response as a single chunk for simplicity.
-        Args:
-            prompt: Input prompt
-            **kwargs: Additional parameters
-        Yields:
-            Response chunks (full response as single chunk)
-        """
-        response = self.generate(prompt, **kwargs)
-        # Update the last call to note it was streaming
-        if self.call_history:
-            self.call_history[-1]["method"] = "stream"
-        yield response
-    def complete(self, prompt: str, **kwargs) -> str:
-        """Alias for generate() for compatibility."""
-        return self.generate(prompt, **kwargs)
-    def get_tool_response(self, tool_name: str) -> Any:
-        """
-        Get mock response for a tool call.
-        Args:
-            tool_name: Name of the tool
-        Returns:
-            Configured mock result or default dict
-        """
-        return self.tool_responses.get(tool_name, {"status": "success"})
-    @property
-    def was_called(self) -> bool:
-        """Check if any method was called."""
-        return len(self.call_history) > 0
-    @property
-    def call_count(self) -> int:
-        """Number of times LLM was called."""
-        return len(self.call_history)
-    @property
-    def last_prompt(self) -> Optional[str]:
-        """Get the last prompt that was sent."""
-        if self.call_history:
-            return self.call_history[-1].get("prompt")
-        return None
-    def reset(self) -> None:
-        """Reset call history and response index."""
-        self.call_history = []
-        self._response_index = 0
-    def set_responses(self, responses: List[str]) -> None:
-        """
-        Set new responses and reset index.
-        Args:
-            responses: New list of responses
-        """
-        self.responses = responses
-        self._response_index = 0
-class MockVLMClient:
-    """
-    Mock VLM client for testing image processing without real API calls.
-    Returns pre-configured text instead of processing images.
-    Tracks all calls for test assertions.
-    Example:
-        from gaia.testing import MockVLMClient
-        mock_vlm = MockVLMClient(
-            extracted_text='{"name": "John", "dob": "1990-01-01"}'
-        )
-        # Inject into agent
-        agent = MyAgent()
-        agent.vlm = mock_vlm
-        # Test extraction
-        result = agent.extract_form("test.png")
-        # Verify VLM was called
-        assert mock_vlm.was_called
-        assert mock_vlm.call_count == 1
-    """
-    def __init__(
-        self,
-        extracted_text: str = "Mock extracted text",
-        extraction_results: Optional[List[str]] = None,
-        is_available: bool = True,
-    ):
-        """
-        Initialize mock VLM client.
-        Args:
-            extracted_text: Default text to return from extract_from_image()
-            extraction_results: List of results to return in sequence
-            is_available: Whether check_availability() returns True
-        """
-        self.extracted_text = extracted_text
-        self.extraction_results = extraction_results or []
-        self.is_available = is_available
-        self.call_history: List[Dict[str, Any]] = []
-        self._result_index = 0
-    def check_availability(self) -> bool:
-        """
-        Check if VLM is available.
-        Returns:
-            Configured is_available value
-        """
-        return self.is_available
-    def extract_from_image(
-        self,
-        image_bytes: bytes,
-        prompt: Optional[str] = None,
-        **kwargs,
-    ) -> str:
-        """
-        Mock image text extraction.
-        Args:
-            image_bytes: Image data (recorded but not processed)
-            prompt: Extraction prompt (recorded)
-            **kwargs: Additional parameters
-        Returns:
-            Pre-configured extracted text
-        """
-        self.call_history.append(
-            {
-                "method": "extract_from_image",
-                "image_size": len(image_bytes) if image_bytes else 0,
-                "prompt": prompt,
-                "kwargs": kwargs,
-                "timestamp": time.time(),
-            }
-        )
-        if self.extraction_results:
-            result = self.extraction_results[
-                self._result_index % len(self.extraction_results)
-            ]
-            self._result_index += 1
-            return result
-        return self.extracted_text
-    def extract_from_file(
-        self,
-        file_path: str,
-        prompt: Optional[str] = None,
-        **kwargs,
-    ) -> str:
-        """
-        Mock file-based extraction.
-        Args:
-            file_path: Path to image file
-            prompt: Extraction prompt
-        Returns:
-            Pre-configured extracted text
-        """
-        self.call_history.append(
-            {
-                "method": "extract_from_file",
-                "file_path": file_path,
-                "prompt": prompt,
-                "kwargs": kwargs,
-                "timestamp": time.time(),
-            }
-        )
-        if self.extraction_results:
-            result = self.extraction_results[
-                self._result_index % len(self.extraction_results)
-            ]
-            self._result_index += 1
-            return result
-        return self.extracted_text
-    def describe_image(
-        self,
-        image_bytes: bytes,
-        prompt: Optional[str] = None,
-        **kwargs,
-    ) -> str:
-        """
-        Mock image description.
-        Args:
-            image_bytes: Image data
-            prompt: Description prompt
-        Returns:
-            Pre-configured text
-        """
-        return self.extract_from_image(image_bytes, prompt, **kwargs)
-    @property
-    def was_called(self) -> bool:
-        """Check if any extraction method was called."""
-        return len(self.call_history) > 0
-    @property
-    def call_count(self) -> int:
-        """Number of times extraction was called."""
-        return len(self.call_history)
-    @property
-    def last_prompt(self) -> Optional[str]:
-        """Get the last prompt that was sent."""
-        if self.call_history:
-            return self.call_history[-1].get("prompt")
-        return None
-    def reset(self) -> None:
-        """Reset call history and result index."""
-        self.call_history = []
-        self._result_index = 0
-    def set_extracted_text(self, text: str) -> None:
-        """
-        Set new extracted text.
-        Args:
-            text: New text to return
-        """
-        self.extracted_text = text
-class MockToolExecutor:
-    """
-    Mock tool executor for testing tool calls.
-    Tracks tool calls and returns configurable results.
-    Example:
-        from gaia.testing import MockToolExecutor
-        executor = MockToolExecutor(
-            results={
-                "search": {"results": ["item1", "item2"]},
-                "create_record": {"id": 123, "status": "created"},
-            }
-        )
-        result = executor.execute("search", {"query": "test"})
-        assert result == {"results": ["item1", "item2"]}
-        assert executor.was_tool_called("search")
-        assert executor.get_tool_args("search") == {"query": "test"}
-    """
-    def __init__(
-        self,
-        results: Optional[Dict[str, Any]] = None,
-        default_result: Optional[Dict[str, Any]] = None,
-    ):
-        """
-        Initialize mock tool executor.
-        Args:
-            results: Dict mapping tool names to their results
-            default_result: Default result for unknown tools
-        """
-        self.results = results or {}
-        self.default_result = default_result or {"status": "success"}
-        self.call_history: List[Dict[str, Any]] = []
-    def execute(self, tool_name: str, args: Dict[str, Any]) -> Any:
-        """
-        Execute a mock tool.
-        Args:
-            tool_name: Name of the tool
-            args: Tool arguments
-        Returns:
-            Configured result for the tool
-        """
-        self.call_history.append(
-            {
-                "tool": tool_name,
-                "args": args,
-                "timestamp": time.time(),
-            }
-        )
-        return self.results.get(tool_name, self.default_result)
-    def was_tool_called(self, tool_name: str) -> bool:
-        """
-        Check if a specific tool was called.
-        Args:
-            tool_name: Name of the tool
-        Returns:
-            True if tool was called at least once
-        """
-        return any(call["tool"] == tool_name for call in self.call_history)
-    def get_tool_calls(self, tool_name: str) -> List[Dict[str, Any]]:
-        """
-        Get all calls to a specific tool.
-        Args:
-            tool_name: Name of the tool
-        Returns:
-            List of call records for that tool
-        """
-        return [call for call in self.call_history if call["tool"] == tool_name]
-    def get_tool_args(self, tool_name: str, call_index: int = 0) -> Optional[Dict]:
-        """
-        Get arguments from a specific tool call.
-        Args:
-            tool_name: Name of the tool
-            call_index: Which call to get (0 = first call)
-        Returns:
-            Arguments dict or None if not found
-        """
-        calls = self.get_tool_calls(tool_name)
-        if call_index < len(calls):
-            return calls[call_index]["args"]
-        return None
-    @property
-    def tool_names_called(self) -> List[str]:
-        """Get list of all tool names that were called."""
-        return list(set(call["tool"] for call in self.call_history))
-    def reset(self) -> None:
-        """Reset call history."""
-        self.call_history = []
+# Copyright(C) 2025-2026 Advanced Micro Devices, Inc. All rights reserved.
+# SPDX-License-Identifier: MIT
+"""Mock providers for testing GAIA agents without real LLM/VLM services."""
+import logging
+import time
+from typing import Any, Dict, Iterator, List, Optional
+logger = logging.getLogger(__name__)
+class MockLLMProvider:
+    """
+    Mock LLM provider for testing agents without real API calls.
+    Returns pre-configured responses instead of calling a real LLM.
+    Tracks all calls for test assertions.
+    Example:
+        from gaia.testing import MockLLMProvider
+        mock_llm = MockLLMProvider(responses=["First response", "Second response"])
+        # Use in tests
+        result = mock_llm.generate("Test prompt")
+        assert result == "First response"
+        result = mock_llm.generate("Another prompt")
+        assert result == "Second response"
+        # Check call history
+        assert len(mock_llm.call_history) == 2
+        assert mock_llm.call_history[0]["prompt"] == "Test prompt"
+    """
+    def __init__(
+        self,
+        responses: Optional[List[str]] = None,
+        tool_responses: Optional[Dict[str, Any]] = None,
+        default_response: str = "Mock LLM response",
+    ):
+        """
+        Initialize mock LLM provider.
+        Args:
+            responses: List of responses to return in sequence.
+                      Cycles back to first if more calls than responses.
+            tool_responses: Dict mapping tool names to their mock results.
+                           Used when simulating tool calls.
+            default_response: Response when responses list is exhausted or empty.
+        """
+        self.responses = responses or []
+        self.tool_responses = tool_responses or {}
+        self.default_response = default_response
+        self.call_history: List[Dict[str, Any]] = []
+        self._response_index = 0
+    def generate(
+        self,
+        prompt: str,
+        system_prompt: Optional[str] = None,
+        temperature: float = 0.7,
+        max_tokens: Optional[int] = None,
+        **kwargs,
+    ) -> str:
+        """
+        Generate mock response.
+        Args:
+            prompt: Input prompt (recorded but not processed)
+            system_prompt: System prompt (recorded)
+            temperature: Temperature setting (recorded)
+            max_tokens: Max tokens (recorded)
+            **kwargs: Additional parameters (recorded)
+        Returns:
+            Next response from response list, or default_response
+        """
+        self.call_history.append(
+            {
+                "method": "generate",
+                "prompt": prompt,
+                "system_prompt": system_prompt,
+                "temperature": temperature,
+                "max_tokens": max_tokens,
+                "kwargs": kwargs,
+                "timestamp": time.time(),
+            }
+        )
+        if self.responses:
+            response = self.responses[self._response_index % len(self.responses)]
+            self._response_index += 1
+            return response
+        return self.default_response
+    def chat(
+        self,
+        messages: List[Dict[str, str]],
+        **kwargs,
+    ) -> str:
+        """
+        Mock chat completion (messages format).
+        Args:
+            messages: List of message dicts with 'role' and 'content'
+            **kwargs: Additional parameters
+        Returns:
+            Next response from response list
+        """
+        # Extract the last user message as the prompt
+        prompt = ""
+        for msg in reversed(messages):
+            if msg.get("role") == "user":
+                prompt = msg.get("content", "")
+                break
+        self.call_history.append(
+            {
+                "method": "chat",
+                "messages": messages,
+                "prompt": prompt,
+                "kwargs": kwargs,
+                "timestamp": time.time(),
+            }
+        )
+        if self.responses:
+            response = self.responses[self._response_index % len(self.responses)]
+            self._response_index += 1
+            return response
+        return self.default_response
+    def stream(
+        self,
+        prompt: str,
+        **kwargs,
+    ) -> Iterator[str]:
+        """
+        Mock streaming response.
+        Yields the full response as a single chunk for simplicity.
+        Args:
+            prompt: Input prompt
+            **kwargs: Additional parameters
+        Yields:
+            Response chunks (full response as single chunk)
+        """
+        response = self.generate(prompt, **kwargs)
+        # Update the last call to note it was streaming
+        if self.call_history:
+            self.call_history[-1]["method"] = "stream"
+        yield response
+    def complete(self, prompt: str, **kwargs) -> str:
+        """Alias for generate() for compatibility."""
+        return self.generate(prompt, **kwargs)
+    def get_tool_response(self, tool_name: str) -> Any:
+        """
+        Get mock response for a tool call.
+        Args:
+            tool_name: Name of the tool
+        Returns:
+            Configured mock result or default dict
+        """
+        return self.tool_responses.get(tool_name, {"status": "success"})
+    @property
+    def was_called(self) -> bool:
+        """Check if any method was called."""
+        return len(self.call_history) > 0
+    @property
+    def call_count(self) -> int:
+        """Number of times LLM was called."""
+        return len(self.call_history)
+    @property
+    def last_prompt(self) -> Optional[str]:
+        """Get the last prompt that was sent."""
+        if self.call_history:
+            return self.call_history[-1].get("prompt")
+        return None
+    def reset(self) -> None:
+        """Reset call history and response index."""
+        self.call_history = []
+        self._response_index = 0
+    def set_responses(self, responses: List[str]) -> None:
+        """
+        Set new responses and reset index.
+        Args:
+            responses: New list of responses
+        """
+        self.responses = responses
+        self._response_index = 0
+class MockVLMClient:
+    """
+    Mock VLM client for testing image processing without real API calls.
+    Returns pre-configured text instead of processing images.
+    Tracks all calls for test assertions.
+    Example:
+        from gaia.testing import MockVLMClient
+        mock_vlm = MockVLMClient(
+            extracted_text='{"name": "John", "dob": "1990-01-01"}'
+        )
+        # Inject into agent
+        agent = MyAgent()
+        agent.vlm = mock_vlm
+        # Test extraction
+        result = agent.extract_form("test.png")
+        # Verify VLM was called
+        assert mock_vlm.was_called
+        assert mock_vlm.call_count == 1
+    """
+    def __init__(
+        self,
+        extracted_text: str = "Mock extracted text",
+        extraction_results: Optional[List[str]] = None,
+        is_available: bool = True,
+    ):
+        """
+        Initialize mock VLM client.
+        Args:
+            extracted_text: Default text to return from extract_from_image()
+            extraction_results: List of results to return in sequence
+            is_available: Whether check_availability() returns True
+        """
+        self.extracted_text = extracted_text
+        self.extraction_results = extraction_results or []
+        self.is_available = is_available
+        self.call_history: List[Dict[str, Any]] = []
+        self._result_index = 0
+    def check_availability(self) -> bool:
+        """
+        Check if VLM is available.
+        Returns:
+            Configured is_available value
+        """
+        return self.is_available
+    def extract_from_image(
+        self,
+        image_bytes: bytes,
+        prompt: Optional[str] = None,
+        **kwargs,
+    ) -> str:
+        """
+        Mock image text extraction.
+        Args:
+            image_bytes: Image data (recorded but not processed)
+            prompt: Extraction prompt (recorded)
+            **kwargs: Additional parameters
+        Returns:
+            Pre-configured extracted text
+        """
+        self.call_history.append(
+            {
+                "method": "extract_from_image",
+                "image_size": len(image_bytes) if image_bytes else 0,
+                "prompt": prompt,
+                "kwargs": kwargs,
+                "timestamp": time.time(),
+            }
+        )
+        if self.extraction_results:
+            result = self.extraction_results[
+                self._result_index % len(self.extraction_results)
+            ]
+            self._result_index += 1
+            return result
+        return self.extracted_text
+    def extract_from_file(
+        self,
+        file_path: str,
+        prompt: Optional[str] = None,
+        **kwargs,
+    ) -> str:
+        """
+        Mock file-based extraction.
+        Args:
+            file_path: Path to image file
+            prompt: Extraction prompt
+        Returns:
+            Pre-configured extracted text
+        """
+        self.call_history.append(
+            {
+                "method": "extract_from_file",
+                "file_path": file_path,
+                "prompt": prompt,
+                "kwargs": kwargs,
+                "timestamp": time.time(),
+            }
+        )
+        if self.extraction_results:
+            result = self.extraction_results[
+                self._result_index % len(self.extraction_results)
+            ]
+            self._result_index += 1
+            return result
+        return self.extracted_text
+    def describe_image(
+        self,
+        image_bytes: bytes,
+        prompt: Optional[str] = None,
+        **kwargs,
+    ) -> str:
+        """
+        Mock image description.
+        Args:
+            image_bytes: Image data
+            prompt: Description prompt
+        Returns:
+            Pre-configured text
+        """
+        return self.extract_from_image(image_bytes, prompt, **kwargs)
+    @property
+    def was_called(self) -> bool:
+        """Check if any extraction method was called."""
+        return len(self.call_history) > 0
+    @property
+    def call_count(self) -> int:
+        """Number of times extraction was called."""
+        return len(self.call_history)
+    @property
+    def last_prompt(self) -> Optional[str]:
+        """Get the last prompt that was sent."""
+        if self.call_history:
+            return self.call_history[-1].get("prompt")
+        return None
+    def reset(self) -> None:
+        """Reset call history and result index."""
+        self.call_history = []
+        self._result_index = 0
+    def set_extracted_text(self, text: str) -> None:
+        """
+        Set new extracted text.
+        Args:
+            text: New text to return
+        """
+        self.extracted_text = text
+class MockToolExecutor:
+    """
+    Mock tool executor for testing tool calls.
+    Tracks tool calls and returns configurable results.
+    Example:
+        from gaia.testing import MockToolExecutor
+        executor = MockToolExecutor(
+            results={
+                "search": {"results": ["item1", "item2"]},
+                "create_record": {"id": 123, "status": "created"},
+            }
+        )
+        result = executor.execute("search", {"query": "test"})
+        assert result == {"results": ["item1", "item2"]}
+        assert executor.was_tool_called("search")
+        assert executor.get_tool_args("search") == {"query": "test"}
+    """
+    def __init__(
+        self,
+        results: Optional[Dict[str, Any]] = None,
+        default_result: Optional[Dict[str, Any]] = None,
+    ):
+        """
+        Initialize mock tool executor.
+        Args:
+            results: Dict mapping tool names to their results
+            default_result: Default result for unknown tools
+        """
+        self.results = results or {}
+        self.default_result = default_result or {"status": "success"}
+        self.call_history: List[Dict[str, Any]] = []
+    def execute(self, tool_name: str, args: Dict[str, Any]) -> Any:
+        """
+        Execute a mock tool.
+        Args:
+            tool_name: Name of the tool
+            args: Tool arguments
+        Returns:
+            Configured result for the tool
+        """
+        self.call_history.append(
+            {
+                "tool": tool_name,
+                "args": args,
+                "timestamp": time.time(),
+            }
+        )
+        return self.results.get(tool_name, self.default_result)
+    def was_tool_called(self, tool_name: str) -> bool:
+        """
+        Check if a specific tool was called.
+        Args:
+            tool_name: Name of the tool
+        Returns:
+            True if tool was called at least once
+        """
+        return any(call["tool"] == tool_name for call in self.call_history)
+    def get_tool_calls(self, tool_name: str) -> List[Dict[str, Any]]:
+        """
+        Get all calls to a specific tool.
+        Args:
+            tool_name: Name of the tool
+        Returns:
+            List of call records for that tool
+        """
+        return [call for call in self.call_history if call["tool"] == tool_name]
+    def get_tool_args(self, tool_name: str, call_index: int = 0) -> Optional[Dict]:
+        """
+        Get arguments from a specific tool call.
+        Args:
+            tool_name: Name of the tool
+            call_index: Which call to get (0 = first call)
+        Returns:
+            Arguments dict or None if not found
+        """
+        calls = self.get_tool_calls(tool_name)
+        if call_index < len(calls):
+            return calls[call_index]["args"]
+        return None
+    @property
+    def tool_names_called(self) -> List[str]:
+        """Get list of all tool names that were called."""
+        return list(set(call["tool"] for call in self.call_history))
+    def reset(self) -> None:
+        """Reset call history."""
+        self.call_history = []

amd-gaia 0.15.0__py3-none-any.whl → 0.15.2__py3-none-any.whl

amd-gaia 0.15.0__py3-none-any.whl → 0.15.2__py3-none-any.whl