PyPI - amd-gaia - Versions diffs - 0.15.0__py3-none-any.whl → 0.15.1__py3-none-any.whl - Mend

amd-gaia 0.15.0 (py3-none-any.whl) → 0.15.1 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (181)

{amd_gaia-0.15.0.dist-info → amd_gaia-0.15.1.dist-info}/METADATA +223 -223
amd_gaia-0.15.1.dist-info/RECORD +178 -0
{amd_gaia-0.15.0.dist-info → amd_gaia-0.15.1.dist-info}/entry_points.txt +1 -0
{amd_gaia-0.15.0.dist-info → amd_gaia-0.15.1.dist-info}/licenses/LICENSE.md +20 -20
gaia/__init__.py +29 -29
gaia/agents/__init__.py +19 -19
gaia/agents/base/__init__.py +9 -9
gaia/agents/base/agent.py +2177 -2177
gaia/agents/base/api_agent.py +120 -120
gaia/agents/base/console.py +1841 -1841
gaia/agents/base/errors.py +237 -237
gaia/agents/base/mcp_agent.py +86 -86
gaia/agents/base/tools.py +83 -83
gaia/agents/blender/agent.py +556 -556
gaia/agents/blender/agent_simple.py +133 -135
gaia/agents/blender/app.py +211 -211
gaia/agents/blender/app_simple.py +41 -41
gaia/agents/blender/core/__init__.py +16 -16
gaia/agents/blender/core/materials.py +506 -506
gaia/agents/blender/core/objects.py +316 -316
gaia/agents/blender/core/rendering.py +225 -225
gaia/agents/blender/core/scene.py +220 -220
gaia/agents/blender/core/view.py +146 -146
gaia/agents/chat/__init__.py +9 -9
gaia/agents/chat/agent.py +835 -835
gaia/agents/chat/app.py +1058 -1058
gaia/agents/chat/session.py +508 -508
gaia/agents/chat/tools/__init__.py +15 -15
gaia/agents/chat/tools/file_tools.py +96 -96
gaia/agents/chat/tools/rag_tools.py +1729 -1729
gaia/agents/chat/tools/shell_tools.py +436 -436
gaia/agents/code/__init__.py +7 -7
gaia/agents/code/agent.py +549 -549
gaia/agents/code/cli.py +377 -0
gaia/agents/code/models.py +135 -135
gaia/agents/code/orchestration/__init__.py +24 -24
gaia/agents/code/orchestration/checklist_executor.py +1763 -1763
gaia/agents/code/orchestration/checklist_generator.py +713 -713
gaia/agents/code/orchestration/factories/__init__.py +9 -9
gaia/agents/code/orchestration/factories/base.py +63 -63
gaia/agents/code/orchestration/factories/nextjs_factory.py +118 -118
gaia/agents/code/orchestration/factories/python_factory.py +106 -106
gaia/agents/code/orchestration/orchestrator.py +841 -841
gaia/agents/code/orchestration/project_analyzer.py +391 -391
gaia/agents/code/orchestration/steps/__init__.py +67 -67
gaia/agents/code/orchestration/steps/base.py +188 -188
gaia/agents/code/orchestration/steps/error_handler.py +314 -314
gaia/agents/code/orchestration/steps/nextjs.py +828 -828
gaia/agents/code/orchestration/steps/python.py +307 -307
gaia/agents/code/orchestration/template_catalog.py +469 -469
gaia/agents/code/orchestration/workflows/__init__.py +14 -14
gaia/agents/code/orchestration/workflows/base.py +80 -80
gaia/agents/code/orchestration/workflows/nextjs.py +186 -186
gaia/agents/code/orchestration/workflows/python.py +94 -94
gaia/agents/code/prompts/__init__.py +11 -11
gaia/agents/code/prompts/base_prompt.py +77 -77
gaia/agents/code/prompts/code_patterns.py +2036 -2036
gaia/agents/code/prompts/nextjs_prompt.py +40 -40
gaia/agents/code/prompts/python_prompt.py +109 -109
gaia/agents/code/schema_inference.py +365 -365
gaia/agents/code/system_prompt.py +41 -41
gaia/agents/code/tools/__init__.py +42 -42
gaia/agents/code/tools/cli_tools.py +1138 -1138
gaia/agents/code/tools/code_formatting.py +319 -319
gaia/agents/code/tools/code_tools.py +769 -769
gaia/agents/code/tools/error_fixing.py +1347 -1347
gaia/agents/code/tools/external_tools.py +180 -180
gaia/agents/code/tools/file_io.py +845 -845
gaia/agents/code/tools/prisma_tools.py +190 -190
gaia/agents/code/tools/project_management.py +1016 -1016
gaia/agents/code/tools/testing.py +321 -321
gaia/agents/code/tools/typescript_tools.py +122 -122
gaia/agents/code/tools/validation_parsing.py +461 -461
gaia/agents/code/tools/validation_tools.py +806 -806
gaia/agents/code/tools/web_dev_tools.py +1758 -1758
gaia/agents/code/validators/__init__.py +16 -16
gaia/agents/code/validators/antipattern_checker.py +241 -241
gaia/agents/code/validators/ast_analyzer.py +197 -197
gaia/agents/code/validators/requirements_validator.py +145 -145
gaia/agents/code/validators/syntax_validator.py +171 -171
gaia/agents/docker/__init__.py +7 -7
gaia/agents/docker/agent.py +642 -642
gaia/agents/emr/__init__.py +8 -8
gaia/agents/emr/agent.py +1506 -1506
gaia/agents/emr/cli.py +1322 -1322
gaia/agents/emr/constants.py +475 -475
gaia/agents/emr/dashboard/__init__.py +4 -4
gaia/agents/emr/dashboard/server.py +1974 -1974
gaia/agents/jira/__init__.py +11 -11
gaia/agents/jira/agent.py +894 -894
gaia/agents/jira/jql_templates.py +299 -299
gaia/agents/routing/__init__.py +7 -7
gaia/agents/routing/agent.py +567 -570
gaia/agents/routing/system_prompt.py +75 -75
gaia/agents/summarize/__init__.py +11 -0
gaia/agents/summarize/agent.py +885 -0
gaia/agents/summarize/prompts.py +129 -0
gaia/api/__init__.py +23 -23
gaia/api/agent_registry.py +238 -238
gaia/api/app.py +305 -305
gaia/api/openai_server.py +575 -575
gaia/api/schemas.py +186 -186
gaia/api/sse_handler.py +373 -373
gaia/apps/__init__.py +4 -4
gaia/apps/llm/__init__.py +6 -6
gaia/apps/llm/app.py +173 -169
gaia/apps/summarize/app.py +116 -633
gaia/apps/summarize/html_viewer.py +133 -133
gaia/apps/summarize/pdf_formatter.py +284 -284
gaia/audio/__init__.py +2 -2
gaia/audio/audio_client.py +439 -439
gaia/audio/audio_recorder.py +269 -269
gaia/audio/kokoro_tts.py +599 -599
gaia/audio/whisper_asr.py +432 -432
gaia/chat/__init__.py +16 -16
gaia/chat/app.py +430 -430
gaia/chat/prompts.py +522 -522
gaia/chat/sdk.py +1228 -1225
gaia/cli.py +5481 -5632
gaia/database/__init__.py +10 -10
gaia/database/agent.py +176 -176
gaia/database/mixin.py +290 -290
gaia/database/testing.py +64 -64
gaia/eval/batch_experiment.py +2332 -2332
gaia/eval/claude.py +542 -542
gaia/eval/config.py +37 -37
gaia/eval/email_generator.py +512 -512
gaia/eval/eval.py +3179 -3179
gaia/eval/groundtruth.py +1130 -1130
gaia/eval/transcript_generator.py +582 -582
gaia/eval/webapp/README.md +167 -167
gaia/eval/webapp/package-lock.json +875 -875
gaia/eval/webapp/package.json +20 -20
gaia/eval/webapp/public/app.js +3402 -3402
gaia/eval/webapp/public/index.html +87 -87
gaia/eval/webapp/public/styles.css +3661 -3661
gaia/eval/webapp/server.js +415 -415
gaia/eval/webapp/test-setup.js +72 -72
gaia/llm/__init__.py +9 -2
gaia/llm/base_client.py +60 -0
gaia/llm/exceptions.py +12 -0
gaia/llm/factory.py +70 -0
gaia/llm/lemonade_client.py +3236 -3221
gaia/llm/lemonade_manager.py +294 -294
gaia/llm/providers/__init__.py +9 -0
gaia/llm/providers/claude.py +108 -0
gaia/llm/providers/lemonade.py +120 -0
gaia/llm/providers/openai_provider.py +79 -0
gaia/llm/vlm_client.py +382 -382
gaia/logger.py +189 -189
gaia/mcp/agent_mcp_server.py +245 -245
gaia/mcp/blender_mcp_client.py +138 -138
gaia/mcp/blender_mcp_server.py +648 -648
gaia/mcp/context7_cache.py +332 -332
gaia/mcp/external_services.py +518 -518
gaia/mcp/mcp_bridge.py +811 -550
gaia/mcp/servers/__init__.py +6 -6
gaia/mcp/servers/docker_mcp.py +83 -83
gaia/perf_analysis.py +361 -0
gaia/rag/__init__.py +10 -10
gaia/rag/app.py +293 -293
gaia/rag/demo.py +304 -304
gaia/rag/pdf_utils.py +235 -235
gaia/rag/sdk.py +2194 -2194
gaia/security.py +163 -163
gaia/talk/app.py +289 -289
gaia/talk/sdk.py +538 -538
gaia/testing/__init__.py +87 -87
gaia/testing/assertions.py +330 -330
gaia/testing/fixtures.py +333 -333
gaia/testing/mocks.py +493 -493
gaia/util.py +46 -46
gaia/utils/__init__.py +33 -33
gaia/utils/file_watcher.py +675 -675
gaia/utils/parsing.py +223 -223
gaia/version.py +100 -100
amd_gaia-0.15.0.dist-info/RECORD +0 -168
gaia/agents/code/app.py +0 -266
gaia/llm/llm_client.py +0 -723
{amd_gaia-0.15.0.dist-info → amd_gaia-0.15.1.dist-info}/WHEEL +0 -0
{amd_gaia-0.15.0.dist-info → amd_gaia-0.15.1.dist-info}/top_level.txt +0 -0

gaia/eval/claude.py (changed)

@@ -1,542 +1,542 @@
-# Copyright(C) 2025-2026 Advanced Micro Devices, Inc. All rights reserved.
-# SPDX-License-Identifier: MIT
-import base64
-import json
-import os
-from pathlib import Path
-try:
-    import anthropic
-except ImportError:
-    anthropic = None
-try:
-    from bs4 import BeautifulSoup
-except ImportError:
-    BeautifulSoup = None
-from dotenv import load_dotenv
-from gaia.eval.config import DEFAULT_CLAUDE_MODEL, MODEL_PRICING
-from gaia.logger import get_logger
-load_dotenv()
-class ClaudeClient:
-    log = get_logger(__name__)
-    def __init__(self, model=None, max_tokens=1024, max_retries=3):
-        """
-        Initialize Claude client with retry support.
-        Args:
-            model: Claude model to use (defaults to DEFAULT_CLAUDE_MODEL)
-            max_tokens: Maximum tokens in response (default: 1024)
-            max_retries: Maximum number of retry attempts for API calls with exponential backoff (default: 3)
-        """
-        # Check for required dependencies
-        if anthropic is None:
-            error_msg = (
-                "\n❌ Error: Missing required package 'anthropic'\n\n"
-                "Please install the eval dependencies:\n"
-                '  uv pip install -e ".[eval]"\n\n'
-                "Or install anthropic directly:\n"
-                "  uv pip install anthropic\n"
-            )
-            raise ImportError(error_msg)
-        if BeautifulSoup is None:
-            error_msg = (
-                "\n❌ Error: Missing required package 'bs4' (BeautifulSoup4)\n\n"
-                "Please install the eval dependencies:\n"
-                '  uv pip install -e ".[eval]"\n\n'
-                "Or install beautifulsoup4 directly:\n"
-                "  uv pip install beautifulsoup4\n"
-            )
-            raise ImportError(error_msg)
-        if model is None:
-            model = DEFAULT_CLAUDE_MODEL
-        self.log = self.__class__.log  # Use the class-level logger for instances
-        self.api_key = os.getenv("ANTHROPIC_API_KEY")
-        if not self.api_key:
-            error_msg = (
-                "ANTHROPIC_API_KEY not found in environment.\n"
-                "Please add your Anthropic API key to the .env file:\n"
-                "  ANTHROPIC_API_KEY=your_api_key_here\n"
-                "Alternatively, export it as an environment variable:\n"
-                "  export ANTHROPIC_API_KEY=your_api_key_here\n"
-            )
-            self.log.error(error_msg)
-            raise ValueError(error_msg)
-        # Initialize Anthropic client with retry support
-        # The SDK handles exponential backoff automatically
-        self.client = anthropic.Anthropic(
-            api_key=self.api_key,
-            max_retries=max_retries,
-            timeout=300.0,  # 5 minute timeout for large documents
-        )
-        self.model = model
-        self.max_tokens = max_tokens
-        self.max_retries = max_retries
-        self.log.info(
-            f"Initialized ClaudeClient with model: {model}, max_retries: {max_retries}"
-        )
-    def calculate_cost(self, input_tokens, output_tokens):
-        """
-        Calculate the cost of an API call based on token usage.
-        Args:
-            input_tokens (int): Number of input tokens
-            output_tokens (int): Number of output tokens
-        Returns:
-            dict: Cost breakdown with input_cost, output_cost, and total_cost
-        """
-        # Get pricing for the current model, fallback to default if not found
-        pricing = MODEL_PRICING.get(self.model, MODEL_PRICING["default"])
-        # Calculate costs (convert tokens to millions)
-        input_cost = (input_tokens / 1_000_000) * pricing["input_per_mtok"]
-        output_cost = (output_tokens / 1_000_000) * pricing["output_per_mtok"]
-        total_cost = input_cost + output_cost
-        return {
-            "input_cost": round(input_cost, 6),
-            "output_cost": round(output_cost, 6),
-            "total_cost": round(total_cost, 6),
-        }
-    def get_completion(self, prompt):
-        self.log.debug("Getting completion from Claude")
-        self.log.debug(f"Prompt token count: {self.count_tokens(prompt)}")
-        try:
-            message = self.client.messages.create(
-                model=self.model,
-                max_tokens=self.max_tokens,
-                messages=[{"role": "user", "content": prompt}],
-            )
-            return message.content
-        except Exception as e:
-            self.log.error(f"Error getting completion: {e}")
-            raise
-    def get_completion_with_usage(self, prompt):
-        """
-        Get completion from Claude and return both content and usage/cost information.
-        Args:
-            prompt (str): The prompt to send to Claude
-        Returns:
-            dict: Contains 'content', 'usage', and 'cost' keys
-        """
-        self.log.info("Getting completion with usage tracking from Claude")
-        try:
-            message = self.client.messages.create(
-                model=self.model,
-                max_tokens=self.max_tokens,
-                messages=[{"role": "user", "content": prompt}],
-            )
-            # Extract usage information
-            usage = {
-                "input_tokens": message.usage.input_tokens,
-                "output_tokens": message.usage.output_tokens,
-                "total_tokens": message.usage.input_tokens
-                + message.usage.output_tokens,
-            }
-            # Calculate cost
-            cost = self.calculate_cost(usage["input_tokens"], usage["output_tokens"])
-            self.log.info(
-                f"Usage: {usage['input_tokens']} input + {usage['output_tokens']} output = {usage['total_tokens']} total tokens"
-            )
-            self.log.info(
-                f"Cost: ${cost['input_cost']:.4f} input + ${cost['output_cost']:.4f} output = ${cost['total_cost']:.4f} total"
-            )
-            return {"content": message.content, "usage": usage, "cost": cost}
-        except Exception as e:
-            self.log.error(f"Error getting completion with usage: {e}")
-            raise
-    def list_models(self):
-        self.log.info("Retrieving available models")
-        try:
-            models = self.client.models.list(limit=20)
-            self.log.info(f"Successfully retrieved {len(models)} models")
-            return models
-        except Exception as e:
-            self.log.error(f"Error listing models: {e}")
-            raise
-    def count_tokens(self, prompt):
-        return self.client.messages.count_tokens(
-            model=self.model, messages=[{"role": "user", "content": prompt}]
-        )
-    def _convert_html_to_text(
-        self, file_path, save_text=False, output_dir="./output/claude"
-    ):
-        """
-        Convert HTML file content to plain text.
-        Args:
-            file_path (str): Path to the HTML file
-            save_text (bool): If True, saves extracted text to a file
-        Returns:
-            str: Extracted text content
-        """
-        self.log.info("Converting HTML to text")
-        with open(file_path, "r", encoding="utf-8") as f:
-            soup = BeautifulSoup(f.read(), "html.parser")
-            text_content = soup.get_text(separator="\n", strip=True)
-            self.log.debug(f"Extracted {len(text_content)} characters of text")
-            if save_text:
-                # Create output directory if it doesn't exist
-                os.makedirs(output_dir, exist_ok=True)
-                filename = Path(file_path).stem
-                output_path = f"{output_dir}/{filename}.soup.txt"
-                with open(output_path, "w", encoding="utf-8") as f:
-                    f.write(text_content)
-                self.log.info(f"Saved extracted text to: {output_path}")
-            return text_content
-    def analyze_file(
-        self,
-        file_path,
-        prompt,
-        media_type=None,
-        save_text=False,
-        output_dir="./output/claude",
-    ):
-        """
-        Analyze a file using Claude's file understanding capabilities.
-        Args:
-            file_path (str): Path to the file to analyze
-            prompt (str): The analysis prompt/question
-            media_type (str, optional): The MIME type of the file. If None, will try to infer from extension
-            save_text (bool, optional): If True, saves extracted text content to a file (for HTML files only)
-            output_dir (str, optional): The directory to save the output file
-        """
-        self.log.info(f"Analyzing file: {file_path}")
-        ext = os.path.splitext(file_path)[1].lower()
-        try:
-            # For HTML files, extract text using BeautifulSoup
-            if ext in [".html", ".htm"]:
-                text_content = self._convert_html_to_text(
-                    file_path, save_text, output_dir
-                )
-                message = self.client.messages.create(
-                    model=self.model,
-                    max_tokens=self.max_tokens,
-                    messages=[
-                        {
-                            "role": "user",
-                            "content": f"Document content:\n\n{text_content}\n\n{prompt}",
-                        }
-                    ],
-                )
-                self.log.info("Successfully analyzed HTML content")
-                return message.content[0].text
-            # For other file types, use the original base64 encoding method
-            mime_types = {
-                ".txt": "text/plain",
-                ".pdf": "application/pdf",
-                ".md": "text/markdown",
-                ".csv": "text/csv",
-                ".json": "application/json",
-            }
-            if media_type is None:
-                media_type = mime_types.get(ext, "application/octet-stream")
-                self.log.debug(f"Using media type: {media_type}")
-            with open(file_path, "rb") as f:
-                file_content = base64.b64encode(f.read()).decode("utf-8")
-                self.log.debug(f"File encoded, size: {len(file_content)} bytes")
-            self.log.info("Sending file for analysis")
-            message = self.client.messages.create(
-                model=self.model,
-                max_tokens=self.max_tokens,
-                messages=[
-                    {
-                        "role": "user",
-                        "content": [
-                            {
-                                "type": "document",
-                                "source": {
-                                    "type": "base64",
-                                    "media_type": media_type,
-                                    "data": file_content,
-                                },
-                            },
-                            {"type": "text", "text": prompt},
-                        ],
-                    }
-                ],
-            )
-            self.log.info("Successfully analyzed file")
-            return message.content[0].text
-        except Exception as e:
-            self.log.error(f"Error analyzing file: {e}")
-            raise
-    def analyze_file_with_usage(
-        self,
-        file_path,
-        prompt,
-        media_type=None,
-        save_text=False,
-        output_dir="./output/claude",
-    ):
-        """
-        Analyze a file using Claude's file understanding capabilities with usage tracking.
-        Args:
-            file_path (str): Path to the file to analyze
-            prompt (str): The analysis prompt/question
-            media_type (str, optional): The MIME type of the file. If None, will try to infer from extension
-            save_text (bool, optional): If True, saves extracted text content to a file (for HTML files only)
-            output_dir (str, optional): The directory to save the output file
-        Returns:
-            dict: Contains 'content', 'usage', and 'cost' keys
-        """
-        self.log.info(f"Analyzing file with usage tracking: {file_path}")
-        ext = os.path.splitext(file_path)[1].lower()
-        try:
-            # For text-based files, read content directly as text
-            if ext in [".html", ".htm", ".txt", ".md", ".csv", ".json"]:
-                if ext in [".html", ".htm"]:
-                    text_content = self._convert_html_to_text(
-                        file_path, save_text, output_dir
-                    )
-                else:
-                    # For other text files, read directly
-                    with open(file_path, "r", encoding="utf-8") as f:
-                        text_content = f.read()
-                    self.log.debug(
-                        f"Read text file, length: {len(text_content)} characters"
-                    )
-                message = self.client.messages.create(
-                    model=self.model,
-                    max_tokens=self.max_tokens,
-                    messages=[
-                        {
-                            "role": "user",
-                            "content": f"Document content:\n\n{text_content}\n\n{prompt}",
-                        }
-                    ],
-                )
-                self.log.info(f"Successfully analyzed text content ({ext} file)")
-                # Extract usage and calculate cost
-                usage = {
-                    "input_tokens": message.usage.input_tokens,
-                    "output_tokens": message.usage.output_tokens,
-                    "total_tokens": message.usage.input_tokens
-                    + message.usage.output_tokens,
-                }
-                cost = self.calculate_cost(
-                    usage["input_tokens"], usage["output_tokens"]
-                )
-                return {
-                    "content": message.content[0].text,
-                    "usage": usage,
-                    "cost": cost,
-                }
-            # For binary file types (primarily PDFs), use base64 encoding with document format
-            mime_types = {
-                ".pdf": "application/pdf",
-            }
-            if media_type is None:
-                media_type = mime_types.get(ext)
-                if media_type is None:
-                    raise ValueError(
-                        f"Unsupported file type: {ext}. Supported types: {list(mime_types.keys())}"
-                    )
-                self.log.debug(f"Using media type: {media_type}")
-            with open(file_path, "rb") as f:
-                file_content = base64.b64encode(f.read()).decode("utf-8")
-                self.log.debug(f"File encoded, size: {len(file_content)} bytes")
-            self.log.info("Sending file for analysis")
-            message = self.client.messages.create(
-                model=self.model,
-                max_tokens=self.max_tokens,
-                messages=[
-                    {
-                        "role": "user",
-                        "content": [
-                            {
-                                "type": "document",
-                                "source": {
-                                    "type": "base64",
-                                    "media_type": media_type,
-                                    "data": file_content,
-                                },
-                            },
-                            {"type": "text", "text": prompt},
-                        ],
-                    }
-                ],
-            )
-            self.log.info("Successfully analyzed file")
-            # Extract usage and calculate cost
-            usage = {
-                "input_tokens": message.usage.input_tokens,
-                "output_tokens": message.usage.output_tokens,
-                "total_tokens": message.usage.input_tokens
-                + message.usage.output_tokens,
-            }
-            cost = self.calculate_cost(usage["input_tokens"], usage["output_tokens"])
-            return {"content": message.content[0].text, "usage": usage, "cost": cost}
-        except Exception as e:
-            self.log.error(f"Error analyzing file: {e}")
-            raise
-    def count_file_tokens(
-        self, file_path, prompt="", media_type=None, output_dir="./output/claude"
-    ):
-        """
-        Count tokens for a file and optional prompt combination.
-        Args:
-            file_path (str): Path to the file to analyze
-            prompt (str, optional): Additional prompt text to include in token count
-            media_type (str, optional): The MIME type of the file. If None, will try to infer from extension
-        Returns:
-            int: Total token count
-        """
-        self.log.info(f"Counting tokens for file: {file_path}")
-        ext = os.path.splitext(file_path)[1].lower()
-        try:
-            # For text-based files, count tokens of extracted text
-            if ext in [".html", ".htm", ".txt", ".md", ".csv", ".json"]:
-                if ext in [".html", ".htm"]:
-                    text_content = self._convert_html_to_text(
-                        file_path, save_text=False, output_dir=output_dir
-                    )
-                else:
-                    # For other text files, read directly
-                    with open(file_path, "r", encoding="utf-8") as f:
-                        text_content = f.read()
-                content = f"Document content:\n\n{text_content}\n\n{prompt}"
-                token_count = self.count_tokens(content)
-                self.log.info(
-                    f"Text file ({ext}) token count: {token_count.input_tokens}"
-                )
-                return token_count.input_tokens
-            # For binary file types (primarily PDFs), encode and count
-            mime_types = {
-                ".pdf": "application/pdf",
-            }
-            if media_type is None:
-                media_type = mime_types.get(ext)
-                if media_type is None:
-                    raise ValueError(
-                        f"Unsupported file type: {ext}. Supported types: {list(mime_types.keys())}"
-                    )
-                self.log.debug(f"Using media type: {media_type}")
-            with open(file_path, "rb") as f:
-                file_content = base64.b64encode(f.read()).decode("utf-8")
-            message_content = [
-                {
-                    "type": "document",
-                    "source": {
-                        "type": "base64",
-                        "media_type": media_type,
-                        "data": file_content,
-                    },
-                }
-            ]
-            if prompt:
-                message_content.append({"type": "text", "text": prompt})
-            token_count = self.client.messages.count_tokens(
-                model=self.model,
-                messages=[{"role": "user", "content": message_content}],
-            )
-            self.log.info(f"File token count: {token_count.input_tokens}")
-            return token_count.input_tokens
-        except Exception as e:
-            self.log.error(f"Error counting tokens: {e}")
-            raise
-# Example usage
-if __name__ == "__main__":
-    client = ClaudeClient()
-    # Test file analysis with Blender introduction document
-    file_path = "./data/html/blender/introduction.html"
-    prompt = (
-        "Given this document, generate a set of short queries a user "
-        "may ask about the document and produce a set of ground truth "
-        "answers to be used in validating a RAG system. Include a "
-        "summary of the document in the queries. Return a json "
-        "formatted list of query-response pairs formatted as follows:"
-        "{'source': 'path/to/document', 'summary': 'summarized document', "
-        "'qa_pairs': [{'query': 'query1', 'response': 'response1'}, "
-        "{'query': 'query2', 'response': 'response2'}, ...]}"
-    )
-    analysis = client.analyze_file(
-        file_path, prompt, save_text=True, output_dir="./output/claude"
-    )
-    print(client.count_file_tokens(file_path, prompt))
-    # Prepare enhanced output with metadata
-    from datetime import datetime
-    output_data = {
-        "metadata": {
-            "timestamp": datetime.now().strftime("%Y-%m-%d %H:%M:%S"),
-            "model": client.model,
-            "source_file": file_path,
-            "prompt": prompt,
-            "token_count": client.count_file_tokens(file_path, prompt),
-        },
-        "analysis": json.loads(analysis),  # Parse JSON string into dictionary
-    }
-    # Save analysis to JSON file
-    output_dir = "./output/claude"
-    os.makedirs(output_dir, exist_ok=True)
-    output_path = f"{output_dir}/{Path(file_path).stem}.out.json"
-    with open(output_path, "w", encoding="utf-8") as f:
-        json.dump(output_data, f, indent=2)
-    print(f"Analysis saved to: {output_path}")
+# Copyright(C) 2025-2026 Advanced Micro Devices, Inc. All rights reserved.
+# SPDX-License-Identifier: MIT
+import base64
+import json
+import os
+from pathlib import Path
+try:
+    import anthropic
+except ImportError:
+    anthropic = None
+try:
+    from bs4 import BeautifulSoup
+except ImportError:
+    BeautifulSoup = None
+from dotenv import load_dotenv
+from gaia.eval.config import DEFAULT_CLAUDE_MODEL, MODEL_PRICING
+from gaia.logger import get_logger
+load_dotenv()
+class ClaudeClient:
+    log = get_logger(__name__)
+    def __init__(self, model=None, max_tokens=1024, max_retries=3):
+        """
+        Initialize Claude client with retry support.
+        Args:
+            model: Claude model to use (defaults to DEFAULT_CLAUDE_MODEL)
+            max_tokens: Maximum tokens in response (default: 1024)
+            max_retries: Maximum number of retry attempts for API calls with exponential backoff (default: 3)
+        """
+        # Check for required dependencies
+        if anthropic is None:
+            error_msg = (
+                "\n❌ Error: Missing required package 'anthropic'\n\n"
+                "Please install the eval dependencies:\n"
+                '  uv pip install -e ".[eval]"\n\n'
+                "Or install anthropic directly:\n"
+                "  uv pip install anthropic\n"
+            )
+            raise ImportError(error_msg)
+        if BeautifulSoup is None:
+            error_msg = (
+                "\n❌ Error: Missing required package 'bs4' (BeautifulSoup4)\n\n"
+                "Please install the eval dependencies:\n"
+                '  uv pip install -e ".[eval]"\n\n'
+                "Or install beautifulsoup4 directly:\n"
+                "  uv pip install beautifulsoup4\n"
+            )
+            raise ImportError(error_msg)
+        if model is None:
+            model = DEFAULT_CLAUDE_MODEL
+        self.log = self.__class__.log  # Use the class-level logger for instances
+        self.api_key = os.getenv("ANTHROPIC_API_KEY")
+        if not self.api_key:
+            error_msg = (
+                "ANTHROPIC_API_KEY not found in environment.\n"
+                "Please add your Anthropic API key to the .env file:\n"
+                "  ANTHROPIC_API_KEY=your_api_key_here\n"
+                "Alternatively, export it as an environment variable:\n"
+                "  export ANTHROPIC_API_KEY=your_api_key_here\n"
+            )
+            self.log.error(error_msg)
+            raise ValueError(error_msg)
+        # Initialize Anthropic client with retry support
+        # The SDK handles exponential backoff automatically
+        self.client = anthropic.Anthropic(
+            api_key=self.api_key,
+            max_retries=max_retries,
+            timeout=300.0,  # 5 minute timeout for large documents
+        )
+        self.model = model
+        self.max_tokens = max_tokens
+        self.max_retries = max_retries
+        self.log.info(
+            f"Initialized ClaudeClient with model: {model}, max_retries: {max_retries}"
+        )
+    def calculate_cost(self, input_tokens, output_tokens):
+        """
+        Work out what an API call cost from its input and output token counts.
+        Args:
+            input_tokens (int): Number of input tokens
+            output_tokens (int): Number of output tokens
+        Returns:
+            dict: 'input_cost', 'output_cost' and 'total_cost', each rounded to 6 decimal places
+        """
+        # Models without their own entry in MODEL_PRICING use the "default" rates
+        rates = MODEL_PRICING.get(self.model, MODEL_PRICING["default"])
+        # Rates are quoted per million tokens
+        tokens_per_mtok = 1_000_000
+        cost_in = (input_tokens / tokens_per_mtok) * rates["input_per_mtok"]
+        cost_out = (output_tokens / tokens_per_mtok) * rates["output_per_mtok"]
+        breakdown = {
+            "input_cost": cost_in,
+            "output_cost": cost_out,
+            "total_cost": cost_in + cost_out,
+        }
+        # Round only at the end so the total is computed from unrounded parts
+        return {label: round(amount, 6) for label, amount in breakdown.items()}
+    def get_completion(self, prompt):
+        """
+        Send a single user prompt to Claude and return the reply content.
+        Args:
+            prompt (str): The prompt to send to Claude
+        Returns:
+            The `content` attribute of the message returned by the client
+        Raises:
+            Exception: Any error raised while counting tokens or requesting the completion is logged and re-raised
+        """
+        import logging
+        self.log.debug("Getting completion from Claude")
+        try:
+            # count_tokens() is a separate client call, so only make it when the
+            # debug line will actually be emitted (assumes self.log is a standard
+            # logging.Logger - TODO confirm).
+            if self.log.isEnabledFor(logging.DEBUG):
+                token_count = self.count_tokens(prompt)
+                self.log.debug(f"Prompt token count: {token_count.input_tokens}")
+            message = self.client.messages.create(
+                model=self.model,
+                max_tokens=self.max_tokens,
+                messages=[{"role": "user", "content": prompt}],
+            )
+            return message.content
+        except Exception as e:
+            self.log.error(f"Error getting completion: {e}")
+            raise
+    def get_completion_with_usage(self, prompt):
+        """
+        Request a completion from Claude and report token usage and cost with it.
+        Args:
+            prompt (str): The prompt to send to Claude
+        Returns:
+            dict: 'content' (the message content), 'usage' (input/output/total token counts)
+                and 'cost' (the breakdown from calculate_cost)
+        """
+        self.log.info("Getting completion with usage tracking from Claude")
+        try:
+            response = self.client.messages.create(
+                model=self.model,
+                max_tokens=self.max_tokens,
+                messages=[{"role": "user", "content": prompt}],
+            )
+            # Token counts as reported on the response
+            tokens_in = response.usage.input_tokens
+            tokens_out = response.usage.output_tokens
+            usage = {
+                "input_tokens": tokens_in,
+                "output_tokens": tokens_out,
+                "total_tokens": tokens_in + tokens_out,
+            }
+            cost = self.calculate_cost(tokens_in, tokens_out)
+            self.log.info(
+                f"Usage: {usage['input_tokens']} input + {usage['output_tokens']} output = {usage['total_tokens']} total tokens"
+            )
+            self.log.info(
+                f"Cost: ${cost['input_cost']:.4f} input + ${cost['output_cost']:.4f} output = ${cost['total_cost']:.4f} total"
+            )
+            return {"content": response.content, "usage": usage, "cost": cost}
+        except Exception as exc:
+            # Log for diagnostics, then let the caller handle the failure
+            self.log.error(f"Error getting completion with usage: {exc}")
+            raise
+    def list_models(self):
+        """
+        Retrieve up to 20 models available to this client.
+        Returns:
+            The object returned by `client.models.list(limit=20)`, unchanged
+        Raises:
+            Exception: Any error raised by the client call is logged and re-raised
+        """
+        self.log.info("Retrieving available models")
+        try:
+            models = self.client.models.list(limit=20)
+            # The client returns a page object whose entries live in `.data`;
+            # calling len() on the page itself is not supported. Fall back to the
+            # object itself in case a plain sequence is returned.
+            entries = getattr(models, "data", models)
+            self.log.info(f"Successfully retrieved {len(entries)} models")
+            return models
+        except Exception as e:
+            self.log.error(f"Error listing models: {e}")
+            raise
+    def count_tokens(self, prompt):
+        """
+        Ask the client to count the tokens of a single user message.
+        Args:
+            prompt: Content of the user message to count
+        Returns:
+            The result of `client.messages.count_tokens`; other methods of this
+            class read its `input_tokens` attribute
+        """
+        user_turn = {"role": "user", "content": prompt}
+        return self.client.messages.count_tokens(
+            model=self.model, messages=[user_turn]
+        )
+    def _convert_html_to_text(
+        self, file_path, save_text=False, output_dir="./output/claude"
+    ):
+        """
+        Strip the markup from an HTML file and return its text.
+        Args:
+            file_path (str): Path to the HTML file
+            save_text (bool): If True, also writes the text to `<output_dir>/<file stem>.soup.txt`
+            output_dir (str): Directory for the saved text; created when missing
+        Returns:
+            str: Extracted text, with stripped text fragments joined by newlines
+        """
+        self.log.info("Converting HTML to text")
+        with open(file_path, "r", encoding="utf-8") as html_file:
+            markup = html_file.read()
+        extracted = BeautifulSoup(markup, "html.parser").get_text(
+            separator="\n", strip=True
+        )
+        self.log.debug(f"Extracted {len(extracted)} characters of text")
+        if not save_text:
+            return extracted
+        # Persist a copy of the extracted text next to the other outputs
+        os.makedirs(output_dir, exist_ok=True)
+        stem = Path(file_path).stem
+        output_path = f"{output_dir}/{stem}.soup.txt"
+        with open(output_path, "w", encoding="utf-8") as text_file:
+            text_file.write(extracted)
+        self.log.info(f"Saved extracted text to: {output_path}")
+        return extracted
+    def analyze_file(
+        self,
+        file_path,
+        prompt,
+        media_type=None,
+        save_text=False,
+        output_dir="./output/claude",
+    ):
+        """
+        Analyze a file using Claude's file understanding capabilities.
+        HTML files are reduced to plain text first. Plain-text formats (.txt, .md,
+        .csv, .json) are sent inline as text when no media_type is given, the same
+        way analyze_file_with_usage handles them. Every other case is base64-encoded
+        and sent as a document block.
+        Args:
+            file_path (str): Path to the file to analyze
+            prompt (str): The analysis prompt/question
+            media_type (str, optional): The MIME type of the file. If None, will try to infer from extension
+            save_text (bool, optional): If True, saves extracted text content to a file (for HTML files only)
+            output_dir (str, optional): The directory to save the output file
+        Returns:
+            str: Text of the first content block of the reply
+        Raises:
+            Exception: Any error while reading the file or calling the client is logged and re-raised
+        """
+        self.log.info(f"Analyzing file: {file_path}")
+        ext = os.path.splitext(file_path)[1].lower()
+        is_html = ext in (".html", ".htm")
+        try:
+            text_content = None
+            if is_html:
+                # For HTML files, extract text using BeautifulSoup
+                text_content = self._convert_html_to_text(
+                    file_path, save_text, output_dir
+                )
+            elif media_type is None and ext in (".txt", ".md", ".csv", ".json"):
+                # Text formats go inline rather than as a base64 document block.
+                # An explicit media_type still selects the document path below,
+                # so existing callers that pass one keep their behavior.
+                with open(file_path, "r", encoding="utf-8") as f:
+                    text_content = f.read()
+                self.log.debug(
+                    f"Read text file, length: {len(text_content)} characters"
+                )
+            if text_content is not None:
+                message = self.client.messages.create(
+                    model=self.model,
+                    max_tokens=self.max_tokens,
+                    messages=[
+                        {
+                            "role": "user",
+                            "content": f"Document content:\n\n{text_content}\n\n{prompt}",
+                        }
+                    ],
+                )
+                if is_html:
+                    self.log.info("Successfully analyzed HTML content")
+                else:
+                    self.log.info(f"Successfully analyzed text content ({ext} file)")
+                return message.content[0].text
+            # Remaining file types use base64 encoding with the document format
+            mime_types = {
+                ".pdf": "application/pdf",
+            }
+            if media_type is None:
+                # Unknown extensions keep the original generic fallback
+                media_type = mime_types.get(ext, "application/octet-stream")
+                self.log.debug(f"Using media type: {media_type}")
+            with open(file_path, "rb") as f:
+                file_content = base64.b64encode(f.read()).decode("utf-8")
+            self.log.debug(f"File encoded, size: {len(file_content)} bytes")
+            self.log.info("Sending file for analysis")
+            message = self.client.messages.create(
+                model=self.model,
+                max_tokens=self.max_tokens,
+                messages=[
+                    {
+                        "role": "user",
+                        "content": [
+                            {
+                                "type": "document",
+                                "source": {
+                                    "type": "base64",
+                                    "media_type": media_type,
+                                    "data": file_content,
+                                },
+                            },
+                            {"type": "text", "text": prompt},
+                        ],
+                    }
+                ],
+            )
+            self.log.info("Successfully analyzed file")
+            return message.content[0].text
+        except Exception as e:
+            self.log.error(f"Error analyzing file: {e}")
+            raise
+    def analyze_file_with_usage(
+        self,
+        file_path,
+        prompt,
+        media_type=None,
+        save_text=False,
+        output_dir="./output/claude",
+    ):
+        """
+        Analyze a file with Claude and return the answer with usage and cost data.
+        Text-like files (.html, .htm, .txt, .md, .csv, .json) are sent inline as
+        text, with HTML reduced to plain text first. Any other file is
+        base64-encoded and sent as a document block.
+        Args:
+            file_path (str): Path to the file to analyze
+            prompt (str): The analysis prompt/question
+            media_type (str, optional): MIME type for the document path. If None, inferred from the extension (only .pdf is known)
+            save_text (bool, optional): If True, saves extracted text content to a file (for HTML files only)
+            output_dir (str, optional): The directory to save the output file
+        Returns:
+            dict: Contains 'content', 'usage', and 'cost' keys
+        Raises:
+            ValueError: If media_type is None and the extension is not a supported type
+        """
+        self.log.info(f"Analyzing file with usage tracking: {file_path}")
+        ext = os.path.splitext(file_path)[1].lower()
+        html_exts = (".html", ".htm")
+        plain_exts = (".txt", ".md", ".csv", ".json")
+        try:
+            if ext in html_exts or ext in plain_exts:
+                # Text-based files: the document travels inline in the prompt
+                if ext in html_exts:
+                    document_text = self._convert_html_to_text(
+                        file_path, save_text, output_dir
+                    )
+                else:
+                    with open(file_path, "r", encoding="utf-8") as text_file:
+                        document_text = text_file.read()
+                    self.log.debug(
+                        f"Read text file, length: {len(document_text)} characters"
+                    )
+                user_content = f"Document content:\n\n{document_text}\n\n{prompt}"
+                success_note = f"Successfully analyzed text content ({ext} file)"
+            else:
+                # Binary files (primarily PDFs): base64 document block plus prompt
+                known_media_types = {".pdf": "application/pdf"}
+                if media_type is None:
+                    media_type = known_media_types.get(ext)
+                    if media_type is None:
+                        raise ValueError(
+                            f"Unsupported file type: {ext}. Supported types: {list(known_media_types)}"
+                        )
+                    self.log.debug(f"Using media type: {media_type}")
+                with open(file_path, "rb") as binary_file:
+                    encoded = base64.b64encode(binary_file.read()).decode("utf-8")
+                self.log.debug(f"File encoded, size: {len(encoded)} bytes")
+                self.log.info("Sending file for analysis")
+                document_block = {
+                    "type": "document",
+                    "source": {
+                        "type": "base64",
+                        "media_type": media_type,
+                        "data": encoded,
+                    },
+                }
+                user_content = [document_block, {"type": "text", "text": prompt}]
+                success_note = "Successfully analyzed file"
+            response = self.client.messages.create(
+                model=self.model,
+                max_tokens=self.max_tokens,
+                messages=[{"role": "user", "content": user_content}],
+            )
+            self.log.info(success_note)
+            # Extract usage and calculate cost
+            tokens_in = response.usage.input_tokens
+            tokens_out = response.usage.output_tokens
+            usage = {
+                "input_tokens": tokens_in,
+                "output_tokens": tokens_out,
+                "total_tokens": tokens_in + tokens_out,
+            }
+            cost = self.calculate_cost(tokens_in, tokens_out)
+            return {
+                "content": response.content[0].text,
+                "usage": usage,
+                "cost": cost,
+            }
+        except Exception as exc:
+            self.log.error(f"Error analyzing file: {exc}")
+            raise
+    def count_file_tokens(
+        self, file_path, prompt="", media_type=None, output_dir="./output/claude"
+    ):
+        """
+        Count the input tokens of a file combined with an optional prompt.
+        Args:
+            file_path (str): Path to the file to analyze
+            prompt (str, optional): Additional prompt text to include in token count
+            media_type (str, optional): The MIME type of the file. If None, will try to infer from extension
+            output_dir (str, optional): Passed to the HTML conversion helper; nothing is saved because save_text is False
+        Returns:
+            int: Total token count
+        Raises:
+            ValueError: If media_type is None and the extension is not a supported type
+        """
+        self.log.info(f"Counting tokens for file: {file_path}")
+        ext = os.path.splitext(file_path)[1].lower()
+        html_exts = (".html", ".htm")
+        plain_exts = (".txt", ".md", ".csv", ".json")
+        try:
+            if ext in html_exts or ext in plain_exts:
+                # Text-based files are counted in the same inline layout used for analysis
+                if ext in html_exts:
+                    document_text = self._convert_html_to_text(
+                        file_path, save_text=False, output_dir=output_dir
+                    )
+                else:
+                    with open(file_path, "r", encoding="utf-8") as text_file:
+                        document_text = text_file.read()
+                counted = self.count_tokens(
+                    f"Document content:\n\n{document_text}\n\n{prompt}"
+                )
+                self.log.info(
+                    f"Text file ({ext}) token count: {counted.input_tokens}"
+                )
+                return counted.input_tokens
+            # Binary file types (primarily PDFs) are encoded and counted as a document block
+            known_media_types = {".pdf": "application/pdf"}
+            if media_type is None:
+                media_type = known_media_types.get(ext)
+                if media_type is None:
+                    raise ValueError(
+                        f"Unsupported file type: {ext}. Supported types: {list(known_media_types)}"
+                    )
+                self.log.debug(f"Using media type: {media_type}")
+            with open(file_path, "rb") as binary_file:
+                encoded = base64.b64encode(binary_file.read()).decode("utf-8")
+            blocks = [
+                {
+                    "type": "document",
+                    "source": {
+                        "type": "base64",
+                        "media_type": media_type,
+                        "data": encoded,
+                    },
+                }
+            ]
+            # The prompt block is only added when there is prompt text to count
+            if prompt:
+                blocks.append({"type": "text", "text": prompt})
+            counted = self.client.messages.count_tokens(
+                model=self.model,
+                messages=[{"role": "user", "content": blocks}],
+            )
+            self.log.info(f"File token count: {counted.input_tokens}")
+            return counted.input_tokens
+        except Exception as exc:
+            self.log.error(f"Error counting tokens: {exc}")
+            raise
+# Example usage: analyze a sample HTML document and save the result with metadata
+if __name__ == "__main__":
+    from datetime import datetime
+    client = ClaudeClient()
+    # Test file analysis with Blender introduction document
+    file_path = "./data/html/blender/introduction.html"
+    output_dir = "./output/claude"
+    prompt = (
+        "Given this document, generate a set of short queries a user "
+        "may ask about the document and produce a set of ground truth "
+        "answers to be used in validating a RAG system. Include a "
+        "summary of the document in the queries. Return a json "
+        "formatted list of query-response pairs formatted as follows:"
+        "{'source': 'path/to/document', 'summary': 'summarized document', "
+        "'qa_pairs': [{'query': 'query1', 'response': 'response1'}, "
+        "{'query': 'query2', 'response': 'response2'}, ...]}"
+    )
+    analysis = client.analyze_file(
+        file_path, prompt, save_text=True, output_dir=output_dir
+    )
+    # Count once and reuse the value: every count is a separate client call
+    token_count = client.count_file_tokens(file_path, prompt)
+    print(token_count)
+    try:
+        # Parse JSON string into dictionary
+        parsed_analysis = json.loads(analysis)
+    except json.JSONDecodeError:
+        # The reply is not guaranteed to be valid JSON; keep the raw text
+        # instead of discarding the response.
+        parsed_analysis = analysis
+    # Prepare enhanced output with metadata
+    output_data = {
+        "metadata": {
+            "timestamp": datetime.now().strftime("%Y-%m-%d %H:%M:%S"),
+            "model": client.model,
+            "source_file": file_path,
+            "prompt": prompt,
+            "token_count": token_count,
+        },
+        "analysis": parsed_analysis,
+    }
+    # Save analysis to JSON file
+    os.makedirs(output_dir, exist_ok=True)
+    output_path = f"{output_dir}/{Path(file_path).stem}.out.json"
+    with open(output_path, "w", encoding="utf-8") as f:
+        json.dump(output_data, f, indent=2)
+    print(f"Analysis saved to: {output_path}")

amd-gaia 0.15.0__py3-none-any.whl → 0.15.1__py3-none-any.whl

amd-gaia 0.15.0py3-none-any.whl → 0.15.1py3-none-any.whl