amd-gaia 0.14.3__py3-none-any.whl → 0.15.1__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
- {amd_gaia-0.14.3.dist-info → amd_gaia-0.15.1.dist-info}/METADATA +223 -223
- amd_gaia-0.15.1.dist-info/RECORD +178 -0
- {amd_gaia-0.14.3.dist-info → amd_gaia-0.15.1.dist-info}/entry_points.txt +1 -0
- {amd_gaia-0.14.3.dist-info → amd_gaia-0.15.1.dist-info}/licenses/LICENSE.md +20 -20
- gaia/__init__.py +29 -29
- gaia/agents/__init__.py +19 -19
- gaia/agents/base/__init__.py +9 -9
- gaia/agents/base/agent.py +2177 -2177
- gaia/agents/base/api_agent.py +120 -120
- gaia/agents/base/console.py +1841 -1841
- gaia/agents/base/errors.py +237 -237
- gaia/agents/base/mcp_agent.py +86 -86
- gaia/agents/base/tools.py +83 -83
- gaia/agents/blender/agent.py +556 -556
- gaia/agents/blender/agent_simple.py +133 -135
- gaia/agents/blender/app.py +211 -211
- gaia/agents/blender/app_simple.py +41 -41
- gaia/agents/blender/core/__init__.py +16 -16
- gaia/agents/blender/core/materials.py +506 -506
- gaia/agents/blender/core/objects.py +316 -316
- gaia/agents/blender/core/rendering.py +225 -225
- gaia/agents/blender/core/scene.py +220 -220
- gaia/agents/blender/core/view.py +146 -146
- gaia/agents/chat/__init__.py +9 -9
- gaia/agents/chat/agent.py +835 -835
- gaia/agents/chat/app.py +1058 -1058
- gaia/agents/chat/session.py +508 -508
- gaia/agents/chat/tools/__init__.py +15 -15
- gaia/agents/chat/tools/file_tools.py +96 -96
- gaia/agents/chat/tools/rag_tools.py +1729 -1729
- gaia/agents/chat/tools/shell_tools.py +436 -436
- gaia/agents/code/__init__.py +7 -7
- gaia/agents/code/agent.py +549 -549
- gaia/agents/code/cli.py +377 -0
- gaia/agents/code/models.py +135 -135
- gaia/agents/code/orchestration/__init__.py +24 -24
- gaia/agents/code/orchestration/checklist_executor.py +1763 -1763
- gaia/agents/code/orchestration/checklist_generator.py +713 -713
- gaia/agents/code/orchestration/factories/__init__.py +9 -9
- gaia/agents/code/orchestration/factories/base.py +63 -63
- gaia/agents/code/orchestration/factories/nextjs_factory.py +118 -118
- gaia/agents/code/orchestration/factories/python_factory.py +106 -106
- gaia/agents/code/orchestration/orchestrator.py +841 -841
- gaia/agents/code/orchestration/project_analyzer.py +391 -391
- gaia/agents/code/orchestration/steps/__init__.py +67 -67
- gaia/agents/code/orchestration/steps/base.py +188 -188
- gaia/agents/code/orchestration/steps/error_handler.py +314 -314
- gaia/agents/code/orchestration/steps/nextjs.py +828 -828
- gaia/agents/code/orchestration/steps/python.py +307 -307
- gaia/agents/code/orchestration/template_catalog.py +469 -469
- gaia/agents/code/orchestration/workflows/__init__.py +14 -14
- gaia/agents/code/orchestration/workflows/base.py +80 -80
- gaia/agents/code/orchestration/workflows/nextjs.py +186 -186
- gaia/agents/code/orchestration/workflows/python.py +94 -94
- gaia/agents/code/prompts/__init__.py +11 -11
- gaia/agents/code/prompts/base_prompt.py +77 -77
- gaia/agents/code/prompts/code_patterns.py +2036 -2036
- gaia/agents/code/prompts/nextjs_prompt.py +40 -40
- gaia/agents/code/prompts/python_prompt.py +109 -109
- gaia/agents/code/schema_inference.py +365 -365
- gaia/agents/code/system_prompt.py +41 -41
- gaia/agents/code/tools/__init__.py +42 -42
- gaia/agents/code/tools/cli_tools.py +1138 -1138
- gaia/agents/code/tools/code_formatting.py +319 -319
- gaia/agents/code/tools/code_tools.py +769 -769
- gaia/agents/code/tools/error_fixing.py +1347 -1347
- gaia/agents/code/tools/external_tools.py +180 -180
- gaia/agents/code/tools/file_io.py +845 -845
- gaia/agents/code/tools/prisma_tools.py +190 -190
- gaia/agents/code/tools/project_management.py +1016 -1016
- gaia/agents/code/tools/testing.py +321 -321
- gaia/agents/code/tools/typescript_tools.py +122 -122
- gaia/agents/code/tools/validation_parsing.py +461 -461
- gaia/agents/code/tools/validation_tools.py +806 -806
- gaia/agents/code/tools/web_dev_tools.py +1758 -1758
- gaia/agents/code/validators/__init__.py +16 -16
- gaia/agents/code/validators/antipattern_checker.py +241 -241
- gaia/agents/code/validators/ast_analyzer.py +197 -197
- gaia/agents/code/validators/requirements_validator.py +145 -145
- gaia/agents/code/validators/syntax_validator.py +171 -171
- gaia/agents/docker/__init__.py +7 -7
- gaia/agents/docker/agent.py +642 -642
- gaia/agents/emr/__init__.py +8 -8
- gaia/agents/emr/agent.py +1506 -1506
- gaia/agents/emr/cli.py +1322 -1322
- gaia/agents/emr/constants.py +475 -475
- gaia/agents/emr/dashboard/__init__.py +4 -4
- gaia/agents/emr/dashboard/server.py +1974 -1974
- gaia/agents/jira/__init__.py +11 -11
- gaia/agents/jira/agent.py +894 -894
- gaia/agents/jira/jql_templates.py +299 -299
- gaia/agents/routing/__init__.py +7 -7
- gaia/agents/routing/agent.py +567 -570
- gaia/agents/routing/system_prompt.py +75 -75
- gaia/agents/summarize/__init__.py +11 -0
- gaia/agents/summarize/agent.py +885 -0
- gaia/agents/summarize/prompts.py +129 -0
- gaia/api/__init__.py +23 -23
- gaia/api/agent_registry.py +238 -238
- gaia/api/app.py +305 -305
- gaia/api/openai_server.py +575 -575
- gaia/api/schemas.py +186 -186
- gaia/api/sse_handler.py +373 -373
- gaia/apps/__init__.py +4 -4
- gaia/apps/llm/__init__.py +6 -6
- gaia/apps/llm/app.py +173 -169
- gaia/apps/summarize/app.py +116 -633
- gaia/apps/summarize/html_viewer.py +133 -133
- gaia/apps/summarize/pdf_formatter.py +284 -284
- gaia/audio/__init__.py +2 -2
- gaia/audio/audio_client.py +439 -439
- gaia/audio/audio_recorder.py +269 -269
- gaia/audio/kokoro_tts.py +599 -599
- gaia/audio/whisper_asr.py +432 -432
- gaia/chat/__init__.py +16 -16
- gaia/chat/app.py +430 -430
- gaia/chat/prompts.py +522 -522
- gaia/chat/sdk.py +1228 -1225
- gaia/cli.py +5481 -5621
- gaia/database/__init__.py +10 -10
- gaia/database/agent.py +176 -176
- gaia/database/mixin.py +290 -290
- gaia/database/testing.py +64 -64
- gaia/eval/batch_experiment.py +2332 -2332
- gaia/eval/claude.py +542 -542
- gaia/eval/config.py +37 -37
- gaia/eval/email_generator.py +512 -512
- gaia/eval/eval.py +3179 -3179
- gaia/eval/groundtruth.py +1130 -1130
- gaia/eval/transcript_generator.py +582 -582
- gaia/eval/webapp/README.md +167 -167
- gaia/eval/webapp/package-lock.json +875 -875
- gaia/eval/webapp/package.json +20 -20
- gaia/eval/webapp/public/app.js +3402 -3402
- gaia/eval/webapp/public/index.html +87 -87
- gaia/eval/webapp/public/styles.css +3661 -3661
- gaia/eval/webapp/server.js +415 -415
- gaia/eval/webapp/test-setup.js +72 -72
- gaia/llm/__init__.py +9 -2
- gaia/llm/base_client.py +60 -0
- gaia/llm/exceptions.py +12 -0
- gaia/llm/factory.py +70 -0
- gaia/llm/lemonade_client.py +3236 -3221
- gaia/llm/lemonade_manager.py +294 -294
- gaia/llm/providers/__init__.py +9 -0
- gaia/llm/providers/claude.py +108 -0
- gaia/llm/providers/lemonade.py +120 -0
- gaia/llm/providers/openai_provider.py +79 -0
- gaia/llm/vlm_client.py +382 -382
- gaia/logger.py +189 -189
- gaia/mcp/agent_mcp_server.py +245 -245
- gaia/mcp/blender_mcp_client.py +138 -138
- gaia/mcp/blender_mcp_server.py +648 -648
- gaia/mcp/context7_cache.py +332 -332
- gaia/mcp/external_services.py +518 -518
- gaia/mcp/mcp_bridge.py +811 -550
- gaia/mcp/servers/__init__.py +6 -6
- gaia/mcp/servers/docker_mcp.py +83 -83
- gaia/perf_analysis.py +361 -0
- gaia/rag/__init__.py +10 -10
- gaia/rag/app.py +293 -293
- gaia/rag/demo.py +304 -304
- gaia/rag/pdf_utils.py +235 -235
- gaia/rag/sdk.py +2194 -2194
- gaia/security.py +163 -163
- gaia/talk/app.py +289 -289
- gaia/talk/sdk.py +538 -538
- gaia/testing/__init__.py +87 -87
- gaia/testing/assertions.py +330 -330
- gaia/testing/fixtures.py +333 -333
- gaia/testing/mocks.py +493 -493
- gaia/util.py +46 -46
- gaia/utils/__init__.py +33 -33
- gaia/utils/file_watcher.py +675 -675
- gaia/utils/parsing.py +223 -223
- gaia/version.py +100 -100
- amd_gaia-0.14.3.dist-info/RECORD +0 -168
- gaia/agents/code/app.py +0 -266
- gaia/llm/llm_client.py +0 -729
- {amd_gaia-0.14.3.dist-info → amd_gaia-0.15.1.dist-info}/WHEEL +0 -0
- {amd_gaia-0.14.3.dist-info → amd_gaia-0.15.1.dist-info}/top_level.txt +0 -0
gaia/api/openai_server.py
CHANGED
@@ -1,575 +1,575 @@
(the -/+ sides of this hunk render line-for-line identical; the content is shown once)
# Copyright(C) 2025-2026 Advanced Micro Devices, Inc. All rights reserved.
# SPDX-License-Identifier: MIT
"""
OpenAI-compatible API server for GAIA

This module provides a FastAPI server that exposes GAIA agents via
OpenAI-compatible endpoints, allowing VSCode and other tools to use
GAIA agents as if they were OpenAI models.

Endpoints:
    POST /v1/chat/completions - Create chat completion (streaming and non-streaming)
    GET /v1/models - List available models (GAIA agents)
    GET /health - Health check
"""

import asyncio
import json
import logging
import os
import time
import uuid
from typing import AsyncGenerator

from fastapi import FastAPI, HTTPException, Request
from fastapi.middleware.cors import CORSMiddleware
from fastapi.responses import StreamingResponse

from gaia.agents.base.api_agent import ApiAgent

from .agent_registry import registry
from .schemas import (
    ChatCompletionChoice,
    ChatCompletionRequest,
    ChatCompletionResponse,
    ChatCompletionResponseMessage,
    ModelListResponse,
    UsageInfo,
)

# Configure logging
logger = logging.getLogger(__name__)

# Set logger level based on debug flag
if os.environ.get("GAIA_API_DEBUG") == "1":
    logger.setLevel(logging.DEBUG)
    logger.info("Debug logging enabled for API server")


def extract_workspace_root(messages):
    """
    Extract workspace root path from GitHub Copilot messages.

    GitHub Copilot includes workspace info in messages like:
    <workspace_info>
    I am working in a workspace with the following folders:
    - /Users/username/path/to/workspace
    </workspace_info>

    Args:
        messages: List of ChatMessage objects

    Returns:
        str: Workspace root path, or None if not found
    """
    import re

    for msg in messages:
        if msg.role == "user" and msg.content:
            # Look for workspace_info section
            workspace_match = re.search(
                r"<workspace_info>.*?following folders:\s*\n\s*-\s*([^\s\n]+)",
                msg.content,
                re.DOTALL,
            )
            if workspace_match:
                return workspace_match.group(1).strip()

    return None


# Initialize FastAPI app
app = FastAPI(
    title="GAIA OpenAI-Compatible API",
    description="OpenAI-compatible API for GAIA agents",
    version="1.0.0",
)

# CORS middleware - allow all origins for development
app.add_middleware(
    CORSMiddleware,
    allow_origins=["*"],
    allow_credentials=True,
    allow_methods=["*"],
    allow_headers=["*"],
)


# Raw request logging middleware (debug mode only)
@app.middleware("http")
async def log_raw_requests(request: Request, call_next):
    """
    Middleware to log raw HTTP requests when debug mode is enabled.
    For streaming endpoints, only log headers to avoid breaking SSE.
    """
    if os.environ.get("GAIA_API_DEBUG") == "1":
        logger.debug("=" * 80)
        logger.debug("📥 RAW HTTP REQUEST")
        logger.debug("=" * 80)
        logger.debug(f"Path: {request.url.path}")
        logger.debug(f"Method: {request.method}")
        logger.debug("Headers:")
        for name, value in request.headers.items():
            logger.debug(f" {name}: {value}")

        # DON'T read body for streaming endpoints - it breaks ASGI message flow
        # Per FastAPI docs: "Never read the request body in middleware for streaming responses"
        if request.url.path == "/v1/chat/completions" and request.method == "POST":
            logger.debug(
                "Body: [Skipped for streaming endpoint - prevents ASGI message flow disruption]"
            )
        else:
            # Safe to read body for non-streaming endpoints
            body_bytes = await request.body()
            logger.debug(f"Body (raw bytes length): {len(body_bytes)}")
            if body_bytes:
                try:
                    body_str = body_bytes.decode("utf-8")
                    logger.debug("Body (decoded UTF-8):")
                    logger.debug(body_str)
                    # Try to pretty-print JSON
                    try:
                        body_json = json.loads(body_str)
                        logger.debug("Body (parsed JSON):")
                        logger.debug(json.dumps(body_json, indent=2))
                    except json.JSONDecodeError:
                        pass
                except UnicodeDecodeError:
                    logger.debug("Body contains non-UTF-8 data")

        logger.debug("=" * 80)

    response = await call_next(request)
    return response


@app.post("/v1/chat/completions")
async def create_chat_completion(request: ChatCompletionRequest):
    """
    Create chat completion (OpenAI-compatible endpoint).

    Supports both streaming (SSE) and non-streaming responses.

    Args:
        request: Chat completion request with model, messages, and options

    Returns:
        For non-streaming: ChatCompletionResponse
        For streaming: StreamingResponse with SSE chunks

    Raises:
        HTTPException 404: Model not found
        HTTPException 400: No user message in request

    Example:
        Non-streaming:
        ```
        POST /v1/chat/completions
        {
            "model": "gaia-code",
            "messages": [{"role": "user", "content": "Write hello world"}],
            "stream": false
        }
        ```

        Streaming:
        ```
        POST /v1/chat/completions
        {
            "model": "gaia-code",
            "messages": [{"role": "user", "content": "Write hello world"}],
            "stream": true
        }
        ```
    """
    # Debug logging: trace incoming request
    if os.environ.get("GAIA_API_DEBUG") == "1":
        logger.debug("=" * 80)
        logger.debug("📥 INCOMING CHAT COMPLETION REQUEST")
        logger.debug("=" * 80)
        logger.debug(f"Model: {request.model}")
        logger.debug(f"Stream: {request.stream}")
        logger.debug(f"Message count: {len(request.messages)}")
        logger.debug("-" * 80)

        for i, msg in enumerate(request.messages):
            logger.debug(f"Message {i}:")
            logger.debug(f" Role: {msg.role}")
            # Preview content (truncate if too long)
            content_preview = (
                msg.content[:500] if len(msg.content) > 500 else msg.content
            )
            if len(msg.content) > 500:
                content_preview += (
                    f"\n ... (truncated, total length: {len(msg.content)} chars)"
                )
            logger.debug(f" Content:\n{content_preview}")
            logger.debug("-" * 40)

        # Log additional request parameters
        logger.debug("Request parameters:")
        logger.debug(f" temperature: {getattr(request, 'temperature', 'not set')}")
        logger.debug(f" max_tokens: {getattr(request, 'max_tokens', 'not set')}")
        logger.debug(f" top_p: {getattr(request, 'top_p', 'not set')}")
        logger.debug("=" * 80)

    # Validate model exists
    if not registry.model_exists(request.model):
        raise HTTPException(
            status_code=404, detail=f"Model '{request.model}' not found"
        )

    # Extract workspace root from messages (for converting relative paths to absolute)
    workspace_root = extract_workspace_root(request.messages)
    if os.environ.get("GAIA_API_DEBUG") == "1" and workspace_root:
        logger.debug(f"📁 Extracted workspace root: {workspace_root}")

    # Extract user query from messages (get last user message)
    user_message = next(
        (m.content for m in reversed(request.messages) if m.role == "user"), None
    )

    if not user_message:
        raise HTTPException(
            status_code=400, detail="No user message found in messages array"
        )

    # Debug logging: show what we're passing to the agent
    if os.environ.get("GAIA_API_DEBUG") == "1":
        logger.debug("🔄 EXTRACTED FOR AGENT:")
        logger.debug(f"Passing to agent: {user_message[:500]}...")
        if len(user_message) > 500:
            logger.debug(f"(Total length: {len(user_message)} chars)")
        logger.debug("=" * 80)

    # Get agent instance for this model
    try:
        agent = registry.get_agent(request.model)
    except ValueError as e:
        raise HTTPException(status_code=404, detail=str(e))

    # Handle streaming vs non-streaming
    if request.stream:
        # Debug logging for streaming mode
        if os.environ.get("GAIA_API_DEBUG") == "1":
            logger.debug("🌊 Using STREAMING mode")

        return StreamingResponse(
            create_sse_stream(
                agent, user_message, request.model, workspace_root=workspace_root
            ),
            media_type="text/event-stream",
            headers={
                "Cache-Control": "no-cache",
                "Connection": "keep-alive",
                "X-Accel-Buffering": "no",  # Disable proxy buffering
            },
        )
    else:
        # Debug logging for non-streaming mode
        if os.environ.get("GAIA_API_DEBUG") == "1":
            logger.debug("📦 Using NON-STREAMING mode")

        # Process query synchronously with workspace root
        result = agent.process_query(user_message, workspace_root=workspace_root)

        # Debug logging: show what agent returned
        if os.environ.get("GAIA_API_DEBUG") == "1":
            logger.debug("=" * 80)
            logger.debug("📤 AGENT RESPONSE (NON-STREAMING)")
            logger.debug("=" * 80)
            logger.debug(f"Result type: {type(result)}")
            logger.debug(
                f"Result keys: {list(result.keys()) if isinstance(result, dict) else 'N/A'}"
            )
            logger.debug(
                f"Status: {result.get('status') if isinstance(result, dict) else 'N/A'}"
            )
            logger.debug(
                f"Steps taken: {result.get('steps_taken') if isinstance(result, dict) else 'N/A'}"
            )
            result_preview = (
                str(result.get("result", ""))[:200]
                if isinstance(result, dict)
                else str(result)[:200]
            )
            logger.debug(f"Result preview: {result_preview}...")
            logger.debug("=" * 80)

        # Extract content from result
        content = result.get("result", str(result))

        # Estimate tokens
        if isinstance(agent, ApiAgent):
            prompt_tokens = agent.estimate_tokens(user_message)
            completion_tokens = agent.estimate_tokens(content)
        else:
            prompt_tokens = len(user_message) // 4
            completion_tokens = len(content) // 4

        return ChatCompletionResponse(
            id=f"chatcmpl-{uuid.uuid4().hex[:24]}",
            object="chat.completion",
            created=int(time.time()),
            model=request.model,
            choices=[
                ChatCompletionChoice(
                    index=0,
                    message=ChatCompletionResponseMessage(
                        role="assistant",
                        content=content,
                    ),
                    finish_reason="stop",
                )
            ],
            usage=UsageInfo(
                prompt_tokens=prompt_tokens,
                completion_tokens=completion_tokens,
                total_tokens=prompt_tokens + completion_tokens,
            ),
        )


async def create_sse_stream(
    agent, query: str, model: str, workspace_root: str = None
) -> AsyncGenerator[str, None]:
    """
    Create Server-Sent Events stream for chat completion.

    This function processes the agent query in a thread pool (to avoid blocking)
    and streams agent progress events in real-time via the SSEOutputHandler.

    Args:
        agent: Agent instance (with SSEOutputHandler)
        query: User query string
        model: Model ID
        workspace_root: Optional workspace root path for absolute file paths

    Yields:
        SSE-formatted chunks with "data: " prefix

    Example output:
        data: {"id":"chatcmpl-123","object":"chat.completion.chunk",...}
        data: {"id":"chatcmpl-123","object":"chat.completion.chunk",...}
        data: [DONE]
    """
    # Debug logging - FIRST LINE to confirm generator starts
    if os.environ.get("GAIA_API_DEBUG") == "1":
        logger.debug("🎬 Generator started! Client is consuming the stream.")

    completion_id = f"chatcmpl-{uuid.uuid4().hex[:24]}"
    created = int(time.time())

    # First chunk with role
    first_chunk = {
        "id": completion_id,
        "object": "chat.completion.chunk",
        "created": created,
        "model": model,
        "choices": [
            {
                "index": 0,
                "delta": {"role": "assistant", "content": ""},
                "finish_reason": None,
            }
        ],
    }
    if os.environ.get("GAIA_API_DEBUG") == "1":
        logger.debug(f"📤 Sending first chunk: {json.dumps(first_chunk)}")
    yield f"data: {json.dumps(first_chunk)}\n\n"

    # Debug logging
    if os.environ.get("GAIA_API_DEBUG") == "1":
        logger.debug("🔄 Starting agent query processing in thread pool...")

    # Process query in thread pool to avoid blocking event loop
    loop = asyncio.get_event_loop()

    # Get the SSEOutputHandler from the agent (try output_handler first, fall back to console)
    output_handler = getattr(agent, "output_handler", None) or getattr(
        agent, "console", None
    )

    try:
        # Start processing in background
        task = loop.run_in_executor(
            None, lambda: agent.process_query(query, workspace_root=workspace_root)
        )

        # Stream events as they are generated
        while not task.done():
            # Check for new events from the output handler
            if hasattr(output_handler, "has_events") and output_handler.has_events():
                events = output_handler.get_events()

                for event in events:
                    event_type = event.get("type", "message")

                    # Check if this event should be streamed to client
                    if not output_handler.should_stream_as_content(event_type):
                        # Still log it in debug mode
                        if os.environ.get("GAIA_API_DEBUG") == "1":
                            logger.debug(f"📝 Skipping event: {event_type}")
                        continue

                    # Format event as clean content
                    content_text = output_handler.format_event_as_content(event)

                    # Skip empty content (filtered events)
                    if not content_text:
                        continue

                    content_chunk = {
                        "id": completion_id,
                        "object": "chat.completion.chunk",
                        "created": created,
                        "model": model,
                        "choices": [
                            {
                                "index": 0,
                                "delta": {"content": content_text},
                                "finish_reason": None,
                            }
                        ],
                    }

                    if os.environ.get("GAIA_API_DEBUG") == "1":
                        logger.debug(
                            f"📤 Streaming event: {event_type} -> {content_text[:100]}"
                        )

                    yield f"data: {json.dumps(content_chunk)}\n\n"

            # Small delay to avoid busy waiting
            await asyncio.sleep(0.1)

        # Get the final result
        result = await task

        # Get any remaining events
        if hasattr(output_handler, "has_events") and output_handler.has_events():
            events = output_handler.get_events()
            for event in events:
                event_type = event.get("type", "message")

                # Check if this event should be streamed
                if not output_handler.should_stream_as_content(event_type):
                    continue

                # Format event as clean content
                content_text = output_handler.format_event_as_content(event)

                # Skip empty content
                if not content_text:
                    continue

                content_chunk = {
                    "id": completion_id,
                    "object": "chat.completion.chunk",
                    "created": created,
                    "model": model,
                    "choices": [
                        {
                            "index": 0,
                            "delta": {"content": content_text},
                            "finish_reason": None,
                        }
                    ],
                }
                yield f"data: {json.dumps(content_chunk)}\n\n"

        # Debug logging: show what agent returned
        if os.environ.get("GAIA_API_DEBUG") == "1":
            logger.debug("=" * 80)
            logger.debug("📤 AGENT RESPONSE (STREAMING)")
            logger.debug("=" * 80)
            logger.debug(f"Result type: {type(result)}")
            logger.debug(
                f"Result keys: {list(result.keys()) if isinstance(result, dict) else 'N/A'}"
            )
            logger.debug(
                f"Status: {result.get('status') if isinstance(result, dict) else 'N/A'}"
            )
            logger.debug(
                f"Steps taken: {result.get('steps_taken') if isinstance(result, dict) else 'N/A'}"
            )
            result_preview = (
                str(result.get("result", ""))[:200]
                if isinstance(result, dict)
                else str(result)[:200]
            )
            logger.debug(f"Result preview: {result_preview}...")
            logger.debug("=" * 80)

    except Exception as e:
        # Log and re-raise errors
        logger.error(f"❌ Agent query processing failed: {e}", exc_info=True)
        raise

    # Final chunk with finish_reason
    final_chunk = {
        "id": completion_id,
        "object": "chat.completion.chunk",
        "created": created,
        "model": model,
        "choices": [{"index": 0, "delta": {}, "finish_reason": "stop"}],
    }
    if os.environ.get("GAIA_API_DEBUG") == "1":
        logger.debug("📤 Sending final chunk with finish_reason=stop")
    yield f"data: {json.dumps(final_chunk)}\n\n"

    # Done marker
    if os.environ.get("GAIA_API_DEBUG") == "1":
        logger.debug("✅ SSE stream complete. Sending [DONE] marker.")
    yield "data: [DONE]\n\n"


@app.get("/v1/models")
async def list_models() -> ModelListResponse:
    """
    List available models (OpenAI-compatible endpoint).

    Note: These are GAIA agents exposed as "models", not LLM models.
    Lemonade manages the actual LLM models underneath.

    Returns:
        ModelListResponse with list of available agent "models"

    Example:
        ```
        GET /v1/models
        {
            "object": "list",
            "data": [
                {
                    "id": "gaia-code",
                    "object": "model",
                    "created": 1234567890,
                    "owned_by": "amd-gaia"
                },
                ...
            ]
        }
        ```
    """
    return ModelListResponse(object="list", data=registry.list_models())


@app.get("/health")
async def health_check():
    """
    Health check endpoint.

    Returns:
        Status and service name

    Example:
        ```
        GET /health
        {
            "status": "ok",
            "service": "gaia-api"
        }
        ```
    """
    return {"status": "ok", "service": "gaia-api"}
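Because the endpoints above follow the OpenAI wire format, the stock `openai` Python client can talk to this server directly. The sketch below is a minimal illustration, not part of the package: the base URL, port, and the `gaia-code` model name are assumptions taken from the docstring examples, so substitute whatever host, port, and agent names your GAIA deployment actually exposes.

```
from openai import OpenAI

# Assumed local deployment; adjust base_url to wherever the GAIA API server runs.
# The server does not check the API key, but the client requires one to be set.
client = OpenAI(base_url="http://localhost:8000/v1", api_key="unused")

# GET /v1/models - each "model" is a GAIA agent, not an LLM
for model in client.models.list():
    print(model.id)

# POST /v1/chat/completions with stream=True - the server emits SSE chunks:
# a role chunk, content deltas, a finish_reason chunk, then "data: [DONE]"
stream = client.chat.completions.create(
    model="gaia-code",  # assumed agent name, from the docstring examples
    messages=[{"role": "user", "content": "Write hello world"}],
    stream=True,
)
for chunk in stream:
    delta = chunk.choices[0].delta
    if delta.content:
        print(delta.content, end="", flush=True)
```

With `stream=False`, the same call returns a single `chat.completion` object whose `usage` field carries the token estimates computed in `create_chat_completion` above.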