amd-gaia 0.15.0__py3-none-any.whl → 0.15.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (185) hide show
  1. {amd_gaia-0.15.0.dist-info → amd_gaia-0.15.2.dist-info}/METADATA +222 -223
  2. amd_gaia-0.15.2.dist-info/RECORD +182 -0
  3. {amd_gaia-0.15.0.dist-info → amd_gaia-0.15.2.dist-info}/WHEEL +1 -1
  4. {amd_gaia-0.15.0.dist-info → amd_gaia-0.15.2.dist-info}/entry_points.txt +1 -0
  5. {amd_gaia-0.15.0.dist-info → amd_gaia-0.15.2.dist-info}/licenses/LICENSE.md +20 -20
  6. gaia/__init__.py +29 -29
  7. gaia/agents/__init__.py +19 -19
  8. gaia/agents/base/__init__.py +9 -9
  9. gaia/agents/base/agent.py +2132 -2177
  10. gaia/agents/base/api_agent.py +119 -120
  11. gaia/agents/base/console.py +1967 -1841
  12. gaia/agents/base/errors.py +237 -237
  13. gaia/agents/base/mcp_agent.py +86 -86
  14. gaia/agents/base/tools.py +88 -83
  15. gaia/agents/blender/__init__.py +7 -0
  16. gaia/agents/blender/agent.py +553 -556
  17. gaia/agents/blender/agent_simple.py +133 -135
  18. gaia/agents/blender/app.py +211 -211
  19. gaia/agents/blender/app_simple.py +41 -41
  20. gaia/agents/blender/core/__init__.py +16 -16
  21. gaia/agents/blender/core/materials.py +506 -506
  22. gaia/agents/blender/core/objects.py +316 -316
  23. gaia/agents/blender/core/rendering.py +225 -225
  24. gaia/agents/blender/core/scene.py +220 -220
  25. gaia/agents/blender/core/view.py +146 -146
  26. gaia/agents/chat/__init__.py +9 -9
  27. gaia/agents/chat/agent.py +809 -835
  28. gaia/agents/chat/app.py +1065 -1058
  29. gaia/agents/chat/session.py +508 -508
  30. gaia/agents/chat/tools/__init__.py +15 -15
  31. gaia/agents/chat/tools/file_tools.py +96 -96
  32. gaia/agents/chat/tools/rag_tools.py +1744 -1729
  33. gaia/agents/chat/tools/shell_tools.py +437 -436
  34. gaia/agents/code/__init__.py +7 -7
  35. gaia/agents/code/agent.py +549 -549
  36. gaia/agents/code/cli.py +377 -0
  37. gaia/agents/code/models.py +135 -135
  38. gaia/agents/code/orchestration/__init__.py +24 -24
  39. gaia/agents/code/orchestration/checklist_executor.py +1763 -1763
  40. gaia/agents/code/orchestration/checklist_generator.py +713 -713
  41. gaia/agents/code/orchestration/factories/__init__.py +9 -9
  42. gaia/agents/code/orchestration/factories/base.py +63 -63
  43. gaia/agents/code/orchestration/factories/nextjs_factory.py +118 -118
  44. gaia/agents/code/orchestration/factories/python_factory.py +106 -106
  45. gaia/agents/code/orchestration/orchestrator.py +841 -841
  46. gaia/agents/code/orchestration/project_analyzer.py +391 -391
  47. gaia/agents/code/orchestration/steps/__init__.py +67 -67
  48. gaia/agents/code/orchestration/steps/base.py +188 -188
  49. gaia/agents/code/orchestration/steps/error_handler.py +314 -314
  50. gaia/agents/code/orchestration/steps/nextjs.py +828 -828
  51. gaia/agents/code/orchestration/steps/python.py +307 -307
  52. gaia/agents/code/orchestration/template_catalog.py +469 -469
  53. gaia/agents/code/orchestration/workflows/__init__.py +14 -14
  54. gaia/agents/code/orchestration/workflows/base.py +80 -80
  55. gaia/agents/code/orchestration/workflows/nextjs.py +186 -186
  56. gaia/agents/code/orchestration/workflows/python.py +94 -94
  57. gaia/agents/code/prompts/__init__.py +11 -11
  58. gaia/agents/code/prompts/base_prompt.py +77 -77
  59. gaia/agents/code/prompts/code_patterns.py +2034 -2036
  60. gaia/agents/code/prompts/nextjs_prompt.py +40 -40
  61. gaia/agents/code/prompts/python_prompt.py +109 -109
  62. gaia/agents/code/schema_inference.py +365 -365
  63. gaia/agents/code/system_prompt.py +41 -41
  64. gaia/agents/code/tools/__init__.py +42 -42
  65. gaia/agents/code/tools/cli_tools.py +1138 -1138
  66. gaia/agents/code/tools/code_formatting.py +319 -319
  67. gaia/agents/code/tools/code_tools.py +769 -769
  68. gaia/agents/code/tools/error_fixing.py +1347 -1347
  69. gaia/agents/code/tools/external_tools.py +180 -180
  70. gaia/agents/code/tools/file_io.py +845 -845
  71. gaia/agents/code/tools/prisma_tools.py +190 -190
  72. gaia/agents/code/tools/project_management.py +1016 -1016
  73. gaia/agents/code/tools/testing.py +321 -321
  74. gaia/agents/code/tools/typescript_tools.py +122 -122
  75. gaia/agents/code/tools/validation_parsing.py +461 -461
  76. gaia/agents/code/tools/validation_tools.py +806 -806
  77. gaia/agents/code/tools/web_dev_tools.py +1758 -1758
  78. gaia/agents/code/validators/__init__.py +16 -16
  79. gaia/agents/code/validators/antipattern_checker.py +241 -241
  80. gaia/agents/code/validators/ast_analyzer.py +197 -197
  81. gaia/agents/code/validators/requirements_validator.py +145 -145
  82. gaia/agents/code/validators/syntax_validator.py +171 -171
  83. gaia/agents/docker/__init__.py +7 -7
  84. gaia/agents/docker/agent.py +643 -642
  85. gaia/agents/emr/__init__.py +8 -8
  86. gaia/agents/emr/agent.py +1504 -1506
  87. gaia/agents/emr/cli.py +1322 -1322
  88. gaia/agents/emr/constants.py +475 -475
  89. gaia/agents/emr/dashboard/__init__.py +4 -4
  90. gaia/agents/emr/dashboard/server.py +1972 -1974
  91. gaia/agents/jira/__init__.py +11 -11
  92. gaia/agents/jira/agent.py +894 -894
  93. gaia/agents/jira/jql_templates.py +299 -299
  94. gaia/agents/routing/__init__.py +7 -7
  95. gaia/agents/routing/agent.py +567 -570
  96. gaia/agents/routing/system_prompt.py +75 -75
  97. gaia/agents/summarize/__init__.py +11 -0
  98. gaia/agents/summarize/agent.py +885 -0
  99. gaia/agents/summarize/prompts.py +129 -0
  100. gaia/api/__init__.py +23 -23
  101. gaia/api/agent_registry.py +238 -238
  102. gaia/api/app.py +305 -305
  103. gaia/api/openai_server.py +575 -575
  104. gaia/api/schemas.py +186 -186
  105. gaia/api/sse_handler.py +373 -373
  106. gaia/apps/__init__.py +4 -4
  107. gaia/apps/llm/__init__.py +6 -6
  108. gaia/apps/llm/app.py +184 -169
  109. gaia/apps/summarize/app.py +116 -633
  110. gaia/apps/summarize/html_viewer.py +133 -133
  111. gaia/apps/summarize/pdf_formatter.py +284 -284
  112. gaia/audio/__init__.py +2 -2
  113. gaia/audio/audio_client.py +439 -439
  114. gaia/audio/audio_recorder.py +269 -269
  115. gaia/audio/kokoro_tts.py +599 -599
  116. gaia/audio/whisper_asr.py +432 -432
  117. gaia/chat/__init__.py +16 -16
  118. gaia/chat/app.py +428 -430
  119. gaia/chat/prompts.py +522 -522
  120. gaia/chat/sdk.py +1228 -1225
  121. gaia/cli.py +5659 -5632
  122. gaia/database/__init__.py +10 -10
  123. gaia/database/agent.py +176 -176
  124. gaia/database/mixin.py +290 -290
  125. gaia/database/testing.py +64 -64
  126. gaia/eval/batch_experiment.py +2332 -2332
  127. gaia/eval/claude.py +542 -542
  128. gaia/eval/config.py +37 -37
  129. gaia/eval/email_generator.py +512 -512
  130. gaia/eval/eval.py +3179 -3179
  131. gaia/eval/groundtruth.py +1130 -1130
  132. gaia/eval/transcript_generator.py +582 -582
  133. gaia/eval/webapp/README.md +167 -167
  134. gaia/eval/webapp/package-lock.json +875 -875
  135. gaia/eval/webapp/package.json +20 -20
  136. gaia/eval/webapp/public/app.js +3402 -3402
  137. gaia/eval/webapp/public/index.html +87 -87
  138. gaia/eval/webapp/public/styles.css +3661 -3661
  139. gaia/eval/webapp/server.js +415 -415
  140. gaia/eval/webapp/test-setup.js +72 -72
  141. gaia/installer/__init__.py +23 -0
  142. gaia/installer/init_command.py +1275 -0
  143. gaia/installer/lemonade_installer.py +619 -0
  144. gaia/llm/__init__.py +10 -2
  145. gaia/llm/base_client.py +60 -0
  146. gaia/llm/exceptions.py +12 -0
  147. gaia/llm/factory.py +70 -0
  148. gaia/llm/lemonade_client.py +3421 -3221
  149. gaia/llm/lemonade_manager.py +294 -294
  150. gaia/llm/providers/__init__.py +9 -0
  151. gaia/llm/providers/claude.py +108 -0
  152. gaia/llm/providers/lemonade.py +118 -0
  153. gaia/llm/providers/openai_provider.py +79 -0
  154. gaia/llm/vlm_client.py +382 -382
  155. gaia/logger.py +189 -189
  156. gaia/mcp/agent_mcp_server.py +245 -245
  157. gaia/mcp/blender_mcp_client.py +138 -138
  158. gaia/mcp/blender_mcp_server.py +648 -648
  159. gaia/mcp/context7_cache.py +332 -332
  160. gaia/mcp/external_services.py +518 -518
  161. gaia/mcp/mcp_bridge.py +811 -550
  162. gaia/mcp/servers/__init__.py +6 -6
  163. gaia/mcp/servers/docker_mcp.py +83 -83
  164. gaia/perf_analysis.py +361 -0
  165. gaia/rag/__init__.py +10 -10
  166. gaia/rag/app.py +293 -293
  167. gaia/rag/demo.py +304 -304
  168. gaia/rag/pdf_utils.py +235 -235
  169. gaia/rag/sdk.py +2194 -2194
  170. gaia/security.py +183 -163
  171. gaia/talk/app.py +287 -289
  172. gaia/talk/sdk.py +538 -538
  173. gaia/testing/__init__.py +87 -87
  174. gaia/testing/assertions.py +330 -330
  175. gaia/testing/fixtures.py +333 -333
  176. gaia/testing/mocks.py +493 -493
  177. gaia/util.py +46 -46
  178. gaia/utils/__init__.py +33 -33
  179. gaia/utils/file_watcher.py +675 -675
  180. gaia/utils/parsing.py +223 -223
  181. gaia/version.py +100 -100
  182. amd_gaia-0.15.0.dist-info/RECORD +0 -168
  183. gaia/agents/code/app.py +0 -266
  184. gaia/llm/llm_client.py +0 -723
  185. {amd_gaia-0.15.0.dist-info → amd_gaia-0.15.2.dist-info}/top_level.txt +0 -0
gaia/talk/sdk.py CHANGED
@@ -1,538 +1,538 @@
1
- #!/usr/bin/env python3
2
- # Copyright(C) 2024-2025 Advanced Micro Devices, Inc. All rights reserved.
3
- # SPDX-License-Identifier: MIT
4
-
5
- """
6
- Gaia Talk SDK - Unified voice and text chat integration
7
- """
8
-
9
- import logging
10
- from dataclasses import dataclass
11
- from enum import Enum
12
- from typing import Any, AsyncGenerator, Callable, Dict, Optional
13
-
14
- from gaia.audio.audio_client import AudioClient
15
- from gaia.chat.sdk import ChatConfig, ChatSDK
16
- from gaia.llm.lemonade_client import DEFAULT_MODEL_NAME
17
- from gaia.logger import get_logger
18
-
19
-
20
- class TalkMode(Enum):
21
- """Talk mode options."""
22
-
23
- TEXT_ONLY = "text_only"
24
- VOICE_ONLY = "voice_only"
25
- VOICE_AND_TEXT = "voice_and_text"
26
-
27
-
28
- @dataclass
29
- class TalkConfig:
30
- """Configuration for TalkSDK."""
31
-
32
- # Voice-specific settings
33
- whisper_model_size: str = "base"
34
- audio_device_index: Optional[int] = None # Use default input device
35
- silence_threshold: float = 0.5
36
- enable_tts: bool = True
37
- mode: TalkMode = TalkMode.VOICE_AND_TEXT
38
-
39
- # Chat settings (from ChatConfig)
40
- model: str = DEFAULT_MODEL_NAME
41
- max_tokens: int = 512
42
- system_prompt: Optional[str] = None
43
- max_history_length: int = 4 # Number of conversation pairs to keep
44
- assistant_name: str = "gaia"
45
-
46
- # General settings
47
- use_claude: bool = False # Use Claude API
48
- use_chatgpt: bool = False # Use ChatGPT/OpenAI API
49
- show_stats: bool = False
50
- logging_level: str = "INFO"
51
-
52
- # RAG settings (optional - for document Q&A)
53
- rag_documents: Optional[list] = None # PDF documents to index
54
-
55
-
56
- @dataclass
57
- class TalkResponse:
58
- """Response from talk operations."""
59
-
60
- text: str
61
- stats: Optional[Dict[str, Any]] = None
62
- is_complete: bool = True
63
-
64
-
65
- class TalkSDK:
66
- """
67
- Gaia Talk SDK - Unified voice and text chat integration.
68
-
69
- This SDK provides a simple interface for integrating Gaia's voice and text
70
- chat capabilities into applications.
71
-
72
- Example usage:
73
- ```python
74
- from gaia.talk.sdk import TalkSDK, TalkConfig
75
-
76
- # Create SDK instance
77
- config = TalkConfig(enable_tts=True, show_stats=True)
78
- talk = TalkSDK(config)
79
-
80
- # Text chat
81
- response = await talk.chat("Hello, how are you?")
82
- print(response.text)
83
-
84
- # Streaming chat
85
- async for chunk in talk.chat_stream("Tell me a story"):
86
- print(chunk.text, end="", flush=True)
87
-
88
- # Voice chat with document Q&A
89
- talk_rag = TalkSDK(TalkConfig(enable_tts=True))
90
- talk_rag.enable_rag(documents=["manual.pdf", "guide.pdf"])
91
- await talk_rag.start_voice_session()
92
-
93
- # Voice chat with callback
94
- def on_voice_input(text):
95
- print(f"User said: {text}")
96
-
97
- await talk.start_voice_session(on_voice_input)
98
- ```
99
- """
100
-
101
- def __init__(self, config: Optional[TalkConfig] = None):
102
- """
103
- Initialize the TalkSDK.
104
-
105
- Args:
106
- config: Configuration options. If None, uses defaults.
107
- """
108
- self.config = config or TalkConfig()
109
- self.log = get_logger(__name__)
110
- self.log.setLevel(getattr(logging, self.config.logging_level))
111
-
112
- # Initialize ChatSDK for text generation with conversation history
113
- chat_config = ChatConfig(
114
- model=self.config.model,
115
- max_tokens=self.config.max_tokens,
116
- system_prompt=self.config.system_prompt,
117
- max_history_length=self.config.max_history_length,
118
- assistant_name=self.config.assistant_name,
119
- show_stats=self.config.show_stats,
120
- logging_level=self.config.logging_level,
121
- use_claude=self.config.use_claude,
122
- use_chatgpt=self.config.use_chatgpt,
123
- )
124
- self.chat_sdk = ChatSDK(chat_config)
125
-
126
- # Initialize AudioClient with configuration (for voice features)
127
- self.audio_client = AudioClient(
128
- whisper_model_size=self.config.whisper_model_size,
129
- audio_device_index=self.config.audio_device_index,
130
- silence_threshold=self.config.silence_threshold,
131
- enable_tts=self.config.enable_tts,
132
- logging_level=self.config.logging_level,
133
- use_claude=self.config.use_claude,
134
- use_chatgpt=self.config.use_chatgpt,
135
- system_prompt=self.config.system_prompt,
136
- )
137
-
138
- self.show_stats = self.config.show_stats
139
- self._voice_session_active = False
140
-
141
- # Enable RAG if documents are provided
142
- if self.config.rag_documents:
143
- self.enable_rag(documents=self.config.rag_documents)
144
-
145
- self.log.info("TalkSDK initialized with ChatSDK integration")
146
-
147
- async def chat(self, message: str) -> TalkResponse:
148
- """
149
- Send a text message and get a complete response.
150
-
151
- Args:
152
- message: The message to send
153
-
154
- Returns:
155
- TalkResponse with the complete response
156
- """
157
- try:
158
- # Use ChatSDK for text generation (with conversation history)
159
- chat_response = self.chat_sdk.send(message)
160
-
161
- stats = None
162
- if self.show_stats:
163
- stats = chat_response.stats or self.get_stats()
164
-
165
- return TalkResponse(text=chat_response.text, stats=stats, is_complete=True)
166
-
167
- except Exception as e:
168
- self.log.error(f"Error in chat: {e}")
169
- raise
170
-
171
- async def chat_stream(self, message: str) -> AsyncGenerator[TalkResponse, None]:
172
- """
173
- Send a text message and get a streaming response.
174
-
175
- Args:
176
- message: The message to send
177
-
178
- Yields:
179
- TalkResponse chunks as they arrive
180
- """
181
- try:
182
- # Use ChatSDK for streaming text generation (with conversation history)
183
- for chat_chunk in self.chat_sdk.send_stream(message):
184
- if not chat_chunk.is_complete:
185
- yield TalkResponse(text=chat_chunk.text, is_complete=False)
186
- else:
187
- # Final chunk with stats
188
- stats = chat_chunk.stats if self.show_stats else None
189
- yield TalkResponse(text="", stats=stats, is_complete=True)
190
-
191
- except Exception as e:
192
- self.log.error(f"Error in chat_stream: {e}")
193
- raise
194
-
195
- async def process_voice_input(self, text: str) -> TalkResponse:
196
- """
197
- Process voice input text through the complete voice pipeline.
198
-
199
- This includes TTS output if enabled.
200
-
201
- Args:
202
- text: The transcribed voice input
203
-
204
- Returns:
205
- TalkResponse with the processed response
206
- """
207
- try:
208
- # Use ChatSDK to generate response (with conversation history)
209
- chat_response = self.chat_sdk.send(text)
210
-
211
- # If TTS is enabled, speak the response
212
- if self.config.enable_tts and getattr(self.audio_client, "tts", None):
213
- await self.audio_client.speak_text(chat_response.text)
214
-
215
- stats = None
216
- if self.show_stats:
217
- stats = chat_response.stats or self.get_stats()
218
-
219
- return TalkResponse(text=chat_response.text, stats=stats, is_complete=True)
220
-
221
- except Exception as e:
222
- self.log.error(f"Error processing voice input: {e}")
223
- raise
224
-
225
- async def start_voice_session(
226
- self,
227
- on_voice_input: Optional[Callable[[str], None]] = None,
228
- ) -> None:
229
- """
230
- Start an interactive voice session.
231
-
232
- Args:
233
- on_voice_input: Optional callback called when voice input is detected
234
- """
235
- try:
236
- self._voice_session_active = True
237
-
238
- # Initialize TTS if enabled
239
- self.audio_client.initialize_tts()
240
-
241
- # Create voice processor that uses ChatSDK for responses
242
- async def voice_processor(text: str):
243
- # Call user callback if provided
244
- if on_voice_input:
245
- on_voice_input(text)
246
-
247
- # Use ChatSDK to generate response (with conversation history)
248
- chat_response = self.chat_sdk.send(text)
249
-
250
- # If TTS is enabled, speak the response
251
- if self.config.enable_tts and getattr(self.audio_client, "tts", None):
252
- await self.audio_client.speak_text(chat_response.text)
253
-
254
- # Print the response for user feedback
255
- print(f"{self.config.assistant_name.title()}: {chat_response.text}")
256
-
257
- # Show stats if enabled
258
- if self.show_stats and chat_response.stats:
259
- print(f"Stats: {chat_response.stats}")
260
-
261
- # Start voice chat session with our processor
262
- await self.audio_client.start_voice_chat(voice_processor)
263
-
264
- except KeyboardInterrupt:
265
- self.log.info("Voice session interrupted by user")
266
- except Exception as e:
267
- self.log.error(f"Error in voice session: {e}")
268
- raise
269
- finally:
270
- self._voice_session_active = False
271
- self.log.info("Voice chat session ended")
272
-
273
- async def halt_generation(self) -> None:
274
- """Halt the current LLM generation."""
275
- try:
276
- await self.audio_client.halt_generation()
277
- except Exception as e:
278
- self.log.error(f"Error halting generation: {e}")
279
- raise
280
-
281
- def get_stats(self) -> Dict[str, Any]:
282
- """
283
- Get performance statistics.
284
-
285
- Returns:
286
- Dictionary of performance stats
287
- """
288
- try:
289
- # Get stats from ChatSDK instead of directly from LLMClient
290
- return self.chat_sdk.get_stats()
291
- except Exception as e:
292
- self.log.warning(f"Failed to get stats: {e}")
293
- return {}
294
-
295
- def update_config(self, **kwargs) -> None:
296
- """
297
- Update configuration dynamically.
298
-
299
- Args:
300
- **kwargs: Configuration parameters to update
301
- """
302
- # Update our config
303
- for key, value in kwargs.items():
304
- if hasattr(self.config, key):
305
- setattr(self.config, key, value)
306
-
307
- # Update show_stats
308
- if "show_stats" in kwargs:
309
- self.show_stats = kwargs["show_stats"]
310
-
311
- # Update AudioClient configuration
312
- if "silence_threshold" in kwargs:
313
- self.audio_client.silence_threshold = kwargs["silence_threshold"]
314
-
315
- # Update ChatSDK configuration
316
- chat_updates = {}
317
- if "system_prompt" in kwargs:
318
- chat_updates["system_prompt"] = kwargs["system_prompt"]
319
- # Also update AudioClient's system prompt for consistency
320
- self.audio_client.llm_client.system_prompt = kwargs["system_prompt"]
321
- if "max_tokens" in kwargs:
322
- chat_updates["max_tokens"] = kwargs["max_tokens"]
323
- if "max_history_length" in kwargs:
324
- chat_updates["max_history_length"] = kwargs["max_history_length"]
325
- if "assistant_name" in kwargs:
326
- chat_updates["assistant_name"] = kwargs["assistant_name"]
327
-
328
- if chat_updates:
329
- self.chat_sdk.update_config(**chat_updates)
330
-
331
- def clear_history(self) -> None:
332
- """Clear the conversation history."""
333
- self.chat_sdk.clear_history()
334
- self.log.debug("Conversation history cleared")
335
-
336
- def get_history(self) -> list:
337
- """Get the current conversation history."""
338
- return self.chat_sdk.get_history()
339
-
340
- def get_formatted_history(self) -> list:
341
- """Get the conversation history in structured format."""
342
- return self.chat_sdk.get_formatted_history()
343
-
344
- def enable_rag(self, documents: Optional[list] = None, **rag_kwargs) -> bool:
345
- """
346
- Enable RAG (Retrieval-Augmented Generation) for document-based voice/text chat.
347
-
348
- Args:
349
- documents: List of PDF file paths to index
350
- **rag_kwargs: Additional RAG configuration options
351
-
352
- Returns:
353
- True if RAG was successfully enabled
354
- """
355
- try:
356
- self.chat_sdk.enable_rag(documents=documents, **rag_kwargs)
357
- self.log.info(
358
- f"RAG enabled with {len(documents) if documents else 0} documents"
359
- )
360
- return True
361
- except ImportError:
362
- self.log.warning(
363
- 'RAG dependencies not available. Install with: uv pip install -e ".[rag]"'
364
- )
365
- return False
366
- except Exception as e:
367
- self.log.error(f"Failed to enable RAG: {e}")
368
- return False
369
-
370
- def disable_rag(self) -> None:
371
- """Disable RAG functionality."""
372
- self.chat_sdk.disable_rag()
373
- self.log.info("RAG disabled")
374
-
375
- def add_document(self, document_path: str) -> bool:
376
- """
377
- Add a document to the RAG index.
378
-
379
- Args:
380
- document_path: Path to PDF file to index
381
-
382
- Returns:
383
- True if document was successfully added
384
- """
385
- if not self.chat_sdk.rag_enabled:
386
- self.log.warning("RAG not enabled. Call enable_rag() first.")
387
- return False
388
-
389
- try:
390
- return self.chat_sdk.add_document(document_path)
391
- except Exception as e:
392
- self.log.error(f"Failed to add document {document_path}: {e}")
393
- return False
394
-
395
- @property
396
- def is_voice_session_active(self) -> bool:
397
- """Check if a voice session is currently active."""
398
- return self._voice_session_active
399
-
400
- @property
401
- def audio_devices(self) -> list:
402
- """Get list of available audio input devices."""
403
- try:
404
- from gaia.audio.audio_recorder import AudioRecorder
405
-
406
- recorder = AudioRecorder()
407
- return recorder.list_audio_devices()
408
- except Exception as e:
409
- self.log.error(f"Error listing audio devices: {e}")
410
- return []
411
-
412
-
413
- class SimpleTalk:
414
- """
415
- Ultra-simple interface for quick integration.
416
-
417
- Example usage:
418
- ```python
419
- from gaia.talk.sdk import SimpleTalk
420
-
421
- talk = SimpleTalk()
422
-
423
- # Simple text chat
424
- response = await talk.ask("What's the weather like?")
425
- print(response)
426
-
427
- # Simple voice chat
428
- await talk.voice_chat() # Starts interactive session
429
- ```
430
- """
431
-
432
- def __init__(
433
- self,
434
- system_prompt: Optional[str] = None,
435
- enable_tts: bool = True,
436
- assistant_name: str = "gaia",
437
- ):
438
- """
439
- Initialize SimpleTalk with minimal configuration.
440
-
441
- Args:
442
- system_prompt: Optional system prompt for the AI
443
- enable_tts: Whether to enable text-to-speech
444
- assistant_name: Name to use for the assistant
445
- """
446
- config = TalkConfig(
447
- system_prompt=system_prompt,
448
- enable_tts=enable_tts,
449
- assistant_name=assistant_name,
450
- show_stats=False,
451
- logging_level="WARNING", # Minimal logging
452
- )
453
- self._sdk = TalkSDK(config)
454
-
455
- async def ask(self, question: str) -> str:
456
- """
457
- Ask a question and get a text response.
458
-
459
- Args:
460
- question: The question to ask
461
-
462
- Returns:
463
- The AI's response as a string
464
- """
465
- response = await self._sdk.chat(question)
466
- return response.text
467
-
468
- async def ask_stream(self, question: str):
469
- """
470
- Ask a question and get a streaming response.
471
-
472
- Args:
473
- question: The question to ask
474
-
475
- Yields:
476
- Response chunks as they arrive
477
- """
478
- async for chunk in self._sdk.chat_stream(question):
479
- if not chunk.is_complete:
480
- yield chunk.text
481
-
482
- async def voice_chat(self) -> None:
483
- """Start an interactive voice chat session."""
484
- print("Starting voice chat... Say 'stop' to quit or press Ctrl+C")
485
-
486
- def on_voice_input(text: str):
487
- print(f"You: {text}")
488
-
489
- await self._sdk.start_voice_session(on_voice_input)
490
-
491
- def clear_memory(self) -> None:
492
- """Clear the conversation memory."""
493
- self._sdk.clear_history()
494
-
495
- def get_conversation(self) -> list:
496
- """Get the conversation history in a readable format."""
497
- return self._sdk.get_formatted_history()
498
-
499
-
500
- # Convenience functions for one-off usage
501
- async def quick_chat(
502
- message: str, system_prompt: Optional[str] = None, assistant_name: str = "gaia"
503
- ) -> str:
504
- """
505
- Quick one-off text chat with conversation memory.
506
-
507
- Args:
508
- message: Message to send
509
- system_prompt: Optional system prompt
510
- assistant_name: Name to use for the assistant
511
-
512
- Returns:
513
- AI response
514
- """
515
- config = TalkConfig(
516
- system_prompt=system_prompt,
517
- assistant_name=assistant_name,
518
- enable_tts=False,
519
- logging_level="WARNING",
520
- max_history_length=2, # Small history for quick chat
521
- )
522
- sdk = TalkSDK(config)
523
- response = await sdk.chat(message)
524
- return response.text
525
-
526
-
527
- async def quick_voice_chat(
528
- system_prompt: Optional[str] = None, assistant_name: str = "gaia"
529
- ) -> None:
530
- """
531
- Quick one-off voice chat session with conversation memory.
532
-
533
- Args:
534
- system_prompt: Optional system prompt
535
- assistant_name: Name to use for the assistant
536
- """
537
- simple = SimpleTalk(system_prompt=system_prompt, assistant_name=assistant_name)
538
- await simple.voice_chat()
1
+ #!/usr/bin/env python3
2
+ # Copyright(C) 2024-2025 Advanced Micro Devices, Inc. All rights reserved.
3
+ # SPDX-License-Identifier: MIT
4
+
5
+ """
6
+ Gaia Talk SDK - Unified voice and text chat integration
7
+ """
8
+
9
+ import logging
10
+ from dataclasses import dataclass
11
+ from enum import Enum
12
+ from typing import Any, AsyncGenerator, Callable, Dict, Optional
13
+
14
+ from gaia.audio.audio_client import AudioClient
15
+ from gaia.chat.sdk import ChatConfig, ChatSDK
16
+ from gaia.llm.lemonade_client import DEFAULT_MODEL_NAME
17
+ from gaia.logger import get_logger
18
+
19
+
20
+ class TalkMode(Enum):
21
+ """Talk mode options."""
22
+
23
+ TEXT_ONLY = "text_only"
24
+ VOICE_ONLY = "voice_only"
25
+ VOICE_AND_TEXT = "voice_and_text"
26
+
27
+
28
+ @dataclass
29
+ class TalkConfig:
30
+ """Configuration for TalkSDK."""
31
+
32
+ # Voice-specific settings
33
+ whisper_model_size: str = "base"
34
+ audio_device_index: Optional[int] = None # Use default input device
35
+ silence_threshold: float = 0.5
36
+ enable_tts: bool = True
37
+ mode: TalkMode = TalkMode.VOICE_AND_TEXT
38
+
39
+ # Chat settings (from ChatConfig)
40
+ model: str = DEFAULT_MODEL_NAME
41
+ max_tokens: int = 512
42
+ system_prompt: Optional[str] = None
43
+ max_history_length: int = 4 # Number of conversation pairs to keep
44
+ assistant_name: str = "gaia"
45
+
46
+ # General settings
47
+ use_claude: bool = False # Use Claude API
48
+ use_chatgpt: bool = False # Use ChatGPT/OpenAI API
49
+ show_stats: bool = False
50
+ logging_level: str = "INFO"
51
+
52
+ # RAG settings (optional - for document Q&A)
53
+ rag_documents: Optional[list] = None # PDF documents to index
54
+
55
+
56
+ @dataclass
57
+ class TalkResponse:
58
+ """Response from talk operations."""
59
+
60
+ text: str
61
+ stats: Optional[Dict[str, Any]] = None
62
+ is_complete: bool = True
63
+
64
+
65
+ class TalkSDK:
66
+ """
67
+ Gaia Talk SDK - Unified voice and text chat integration.
68
+
69
+ This SDK provides a simple interface for integrating Gaia's voice and text
70
+ chat capabilities into applications.
71
+
72
+ Example usage:
73
+ ```python
74
+ from gaia.talk.sdk import TalkSDK, TalkConfig
75
+
76
+ # Create SDK instance
77
+ config = TalkConfig(enable_tts=True, show_stats=True)
78
+ talk = TalkSDK(config)
79
+
80
+ # Text chat
81
+ response = await talk.chat("Hello, how are you?")
82
+ print(response.text)
83
+
84
+ # Streaming chat
85
+ async for chunk in talk.chat_stream("Tell me a story"):
86
+ print(chunk.text, end="", flush=True)
87
+
88
+ # Voice chat with document Q&A
89
+ talk_rag = TalkSDK(TalkConfig(enable_tts=True))
90
+ talk_rag.enable_rag(documents=["manual.pdf", "guide.pdf"])
91
+ await talk_rag.start_voice_session()
92
+
93
+ # Voice chat with callback
94
+ def on_voice_input(text):
95
+ print(f"User said: {text}")
96
+
97
+ await talk.start_voice_session(on_voice_input)
98
+ ```
99
+ """
100
+
101
+ def __init__(self, config: Optional[TalkConfig] = None):
102
+ """
103
+ Initialize the TalkSDK.
104
+
105
+ Args:
106
+ config: Configuration options. If None, uses defaults.
107
+ """
108
+ self.config = config or TalkConfig()
109
+ self.log = get_logger(__name__)
110
+ self.log.setLevel(getattr(logging, self.config.logging_level))
111
+
112
+ # Initialize ChatSDK for text generation with conversation history
113
+ chat_config = ChatConfig(
114
+ model=self.config.model,
115
+ max_tokens=self.config.max_tokens,
116
+ system_prompt=self.config.system_prompt,
117
+ max_history_length=self.config.max_history_length,
118
+ assistant_name=self.config.assistant_name,
119
+ show_stats=self.config.show_stats,
120
+ logging_level=self.config.logging_level,
121
+ use_claude=self.config.use_claude,
122
+ use_chatgpt=self.config.use_chatgpt,
123
+ )
124
+ self.chat_sdk = ChatSDK(chat_config)
125
+
126
+ # Initialize AudioClient with configuration (for voice features)
127
+ self.audio_client = AudioClient(
128
+ whisper_model_size=self.config.whisper_model_size,
129
+ audio_device_index=self.config.audio_device_index,
130
+ silence_threshold=self.config.silence_threshold,
131
+ enable_tts=self.config.enable_tts,
132
+ logging_level=self.config.logging_level,
133
+ use_claude=self.config.use_claude,
134
+ use_chatgpt=self.config.use_chatgpt,
135
+ system_prompt=self.config.system_prompt,
136
+ )
137
+
138
+ self.show_stats = self.config.show_stats
139
+ self._voice_session_active = False
140
+
141
+ # Enable RAG if documents are provided
142
+ if self.config.rag_documents:
143
+ self.enable_rag(documents=self.config.rag_documents)
144
+
145
+ self.log.info("TalkSDK initialized with ChatSDK integration")
146
+
147
+ async def chat(self, message: str) -> TalkResponse:
148
+ """
149
+ Send a text message and get a complete response.
150
+
151
+ Args:
152
+ message: The message to send
153
+
154
+ Returns:
155
+ TalkResponse with the complete response
156
+ """
157
+ try:
158
+ # Use ChatSDK for text generation (with conversation history)
159
+ chat_response = self.chat_sdk.send(message)
160
+
161
+ stats = None
162
+ if self.show_stats:
163
+ stats = chat_response.stats or self.get_stats()
164
+
165
+ return TalkResponse(text=chat_response.text, stats=stats, is_complete=True)
166
+
167
+ except Exception as e:
168
+ self.log.error(f"Error in chat: {e}")
169
+ raise
170
+
171
+ async def chat_stream(self, message: str) -> AsyncGenerator[TalkResponse, None]:
172
+ """
173
+ Send a text message and get a streaming response.
174
+
175
+ Args:
176
+ message: The message to send
177
+
178
+ Yields:
179
+ TalkResponse chunks as they arrive
180
+ """
181
+ try:
182
+ # Use ChatSDK for streaming text generation (with conversation history)
183
+ for chat_chunk in self.chat_sdk.send_stream(message):
184
+ if not chat_chunk.is_complete:
185
+ yield TalkResponse(text=chat_chunk.text, is_complete=False)
186
+ else:
187
+ # Final chunk with stats
188
+ stats = chat_chunk.stats if self.show_stats else None
189
+ yield TalkResponse(text="", stats=stats, is_complete=True)
190
+
191
+ except Exception as e:
192
+ self.log.error(f"Error in chat_stream: {e}")
193
+ raise
194
+
195
+ async def process_voice_input(self, text: str) -> TalkResponse:
196
+ """
197
+ Process voice input text through the complete voice pipeline.
198
+
199
+ This includes TTS output if enabled.
200
+
201
+ Args:
202
+ text: The transcribed voice input
203
+
204
+ Returns:
205
+ TalkResponse with the processed response
206
+ """
207
+ try:
208
+ # Use ChatSDK to generate response (with conversation history)
209
+ chat_response = self.chat_sdk.send(text)
210
+
211
+ # If TTS is enabled, speak the response
212
+ if self.config.enable_tts and getattr(self.audio_client, "tts", None):
213
+ await self.audio_client.speak_text(chat_response.text)
214
+
215
+ stats = None
216
+ if self.show_stats:
217
+ stats = chat_response.stats or self.get_stats()
218
+
219
+ return TalkResponse(text=chat_response.text, stats=stats, is_complete=True)
220
+
221
+ except Exception as e:
222
+ self.log.error(f"Error processing voice input: {e}")
223
+ raise
224
+
225
+ async def start_voice_session(
226
+ self,
227
+ on_voice_input: Optional[Callable[[str], None]] = None,
228
+ ) -> None:
229
+ """
230
+ Start an interactive voice session.
231
+
232
+ Args:
233
+ on_voice_input: Optional callback called when voice input is detected
234
+ """
235
+ try:
236
+ self._voice_session_active = True
237
+
238
+ # Initialize TTS if enabled
239
+ self.audio_client.initialize_tts()
240
+
241
+ # Create voice processor that uses ChatSDK for responses
242
+ async def voice_processor(text: str):
243
+ # Call user callback if provided
244
+ if on_voice_input:
245
+ on_voice_input(text)
246
+
247
+ # Use ChatSDK to generate response (with conversation history)
248
+ chat_response = self.chat_sdk.send(text)
249
+
250
+ # If TTS is enabled, speak the response
251
+ if self.config.enable_tts and getattr(self.audio_client, "tts", None):
252
+ await self.audio_client.speak_text(chat_response.text)
253
+
254
+ # Print the response for user feedback
255
+ print(f"{self.config.assistant_name.title()}: {chat_response.text}")
256
+
257
+ # Show stats if enabled
258
+ if self.show_stats and chat_response.stats:
259
+ print(f"Stats: {chat_response.stats}")
260
+
261
+ # Start voice chat session with our processor
262
+ await self.audio_client.start_voice_chat(voice_processor)
263
+
264
+ except KeyboardInterrupt:
265
+ self.log.info("Voice session interrupted by user")
266
+ except Exception as e:
267
+ self.log.error(f"Error in voice session: {e}")
268
+ raise
269
+ finally:
270
+ self._voice_session_active = False
271
+ self.log.info("Voice chat session ended")
272
+
273
+ async def halt_generation(self) -> None:
274
+ """Halt the current LLM generation."""
275
+ try:
276
+ await self.audio_client.halt_generation()
277
+ except Exception as e:
278
+ self.log.error(f"Error halting generation: {e}")
279
+ raise
280
+
281
+ def get_stats(self) -> Dict[str, Any]:
282
+ """
283
+ Get performance statistics.
284
+
285
+ Returns:
286
+ Dictionary of performance stats
287
+ """
288
+ try:
289
+ # Get stats from ChatSDK instead of directly from LLMClient
290
+ return self.chat_sdk.get_stats()
291
+ except Exception as e:
292
+ self.log.warning(f"Failed to get stats: {e}")
293
+ return {}
294
+
295
+ def update_config(self, **kwargs) -> None:
296
+ """
297
+ Update configuration dynamically.
298
+
299
+ Args:
300
+ **kwargs: Configuration parameters to update
301
+ """
302
+ # Update our config
303
+ for key, value in kwargs.items():
304
+ if hasattr(self.config, key):
305
+ setattr(self.config, key, value)
306
+
307
+ # Update show_stats
308
+ if "show_stats" in kwargs:
309
+ self.show_stats = kwargs["show_stats"]
310
+
311
+ # Update AudioClient configuration
312
+ if "silence_threshold" in kwargs:
313
+ self.audio_client.silence_threshold = kwargs["silence_threshold"]
314
+
315
+ # Update ChatSDK configuration
316
+ chat_updates = {}
317
+ if "system_prompt" in kwargs:
318
+ chat_updates["system_prompt"] = kwargs["system_prompt"]
319
+ # Also update AudioClient's system prompt for consistency
320
+ self.audio_client.llm_client.system_prompt = kwargs["system_prompt"]
321
+ if "max_tokens" in kwargs:
322
+ chat_updates["max_tokens"] = kwargs["max_tokens"]
323
+ if "max_history_length" in kwargs:
324
+ chat_updates["max_history_length"] = kwargs["max_history_length"]
325
+ if "assistant_name" in kwargs:
326
+ chat_updates["assistant_name"] = kwargs["assistant_name"]
327
+
328
+ if chat_updates:
329
+ self.chat_sdk.update_config(**chat_updates)
330
+
331
+ def clear_history(self) -> None:
332
+ """Clear the conversation history."""
333
+ self.chat_sdk.clear_history()
334
+ self.log.debug("Conversation history cleared")
335
+
336
+ def get_history(self) -> list:
337
+ """Get the current conversation history."""
338
+ return self.chat_sdk.get_history()
339
+
340
+ def get_formatted_history(self) -> list:
341
+ """Get the conversation history in structured format."""
342
+ return self.chat_sdk.get_formatted_history()
343
+
344
+ def enable_rag(self, documents: Optional[list] = None, **rag_kwargs) -> bool:
345
+ """
346
+ Enable RAG (Retrieval-Augmented Generation) for document-based voice/text chat.
347
+
348
+ Args:
349
+ documents: List of PDF file paths to index
350
+ **rag_kwargs: Additional RAG configuration options
351
+
352
+ Returns:
353
+ True if RAG was successfully enabled
354
+ """
355
+ try:
356
+ self.chat_sdk.enable_rag(documents=documents, **rag_kwargs)
357
+ self.log.info(
358
+ f"RAG enabled with {len(documents) if documents else 0} documents"
359
+ )
360
+ return True
361
+ except ImportError:
362
+ self.log.warning(
363
+ 'RAG dependencies not available. Install with: uv pip install -e ".[rag]"'
364
+ )
365
+ return False
366
+ except Exception as e:
367
+ self.log.error(f"Failed to enable RAG: {e}")
368
+ return False
369
+
370
+ def disable_rag(self) -> None:
371
+ """Disable RAG functionality."""
372
+ self.chat_sdk.disable_rag()
373
+ self.log.info("RAG disabled")
374
+
375
+ def add_document(self, document_path: str) -> bool:
376
+ """
377
+ Add a document to the RAG index.
378
+
379
+ Args:
380
+ document_path: Path to PDF file to index
381
+
382
+ Returns:
383
+ True if document was successfully added
384
+ """
385
+ if not self.chat_sdk.rag_enabled:
386
+ self.log.warning("RAG not enabled. Call enable_rag() first.")
387
+ return False
388
+
389
+ try:
390
+ return self.chat_sdk.add_document(document_path)
391
+ except Exception as e:
392
+ self.log.error(f"Failed to add document {document_path}: {e}")
393
+ return False
394
+
395
+ @property
396
+ def is_voice_session_active(self) -> bool:
397
+ """Check if a voice session is currently active."""
398
+ return self._voice_session_active
399
+
400
+ @property
401
+ def audio_devices(self) -> list:
402
+ """Get list of available audio input devices."""
403
+ try:
404
+ from gaia.audio.audio_recorder import AudioRecorder
405
+
406
+ recorder = AudioRecorder()
407
+ return recorder.list_audio_devices()
408
+ except Exception as e:
409
+ self.log.error(f"Error listing audio devices: {e}")
410
+ return []
411
+
412
+
413
class SimpleTalk:
    """
    Ultra-simple interface for quick integration.

    Example usage:
        ```python
        from gaia.talk.sdk import SimpleTalk

        talk = SimpleTalk()

        # Simple text chat
        response = await talk.ask("What's the weather like?")
        print(response)

        # Simple voice chat
        await talk.voice_chat()  # Starts interactive session
        ```
    """

    def __init__(
        self,
        system_prompt: Optional[str] = None,
        enable_tts: bool = True,
        assistant_name: str = "gaia",
    ):
        """Create a minimally configured talk interface.

        Args:
            system_prompt: Optional system prompt for the AI.
            enable_tts: Whether to enable text-to-speech.
            assistant_name: Name to use for the assistant.
        """
        self._sdk = TalkSDK(
            TalkConfig(
                system_prompt=system_prompt,
                enable_tts=enable_tts,
                assistant_name=assistant_name,
                show_stats=False,
                logging_level="WARNING",  # keep output quiet
            )
        )

    async def ask(self, question: str) -> str:
        """Ask a question and return the reply as plain text.

        Args:
            question: The question to ask.

        Returns:
            The AI's response as a string.
        """
        return (await self._sdk.chat(question)).text

    async def ask_stream(self, question: str):
        """Ask a question, yielding reply text chunks as they arrive.

        Args:
            question: The question to ask.

        Yields:
            Partial response text chunks (the terminal marker is skipped).
        """
        async for part in self._sdk.chat_stream(question):
            if part.is_complete:
                continue
            yield part.text

    async def voice_chat(self) -> None:
        """Start an interactive voice chat session."""
        print("Starting voice chat... Say 'stop' to quit or press Ctrl+C")

        def _echo_user(text: str):
            # Show the transcription back to the user.
            print(f"You: {text}")

        await self._sdk.start_voice_session(_echo_user)

    def clear_memory(self) -> None:
        """Forget the conversation so far."""
        self._sdk.clear_history()

    def get_conversation(self) -> list:
        """Return the conversation history in a readable format."""
        return self._sdk.get_formatted_history()
498
+
499
+
500
+ # Convenience functions for one-off usage
501
async def quick_chat(
    message: str, system_prompt: Optional[str] = None, assistant_name: str = "gaia"
) -> str:
    """One-off text chat helper (keeps a small conversation memory).

    Args:
        message: Message to send.
        system_prompt: Optional system prompt.
        assistant_name: Name to use for the assistant.

    Returns:
        The AI's reply text.
    """
    sdk = TalkSDK(
        TalkConfig(
            system_prompt=system_prompt,
            assistant_name=assistant_name,
            enable_tts=False,
            logging_level="WARNING",
            max_history_length=2,  # small history for a quick exchange
        )
    )
    return (await sdk.chat(message)).text
525
+
526
+
527
async def quick_voice_chat(
    system_prompt: Optional[str] = None, assistant_name: str = "gaia"
) -> None:
    """One-off interactive voice chat session with conversation memory.

    Args:
        system_prompt: Optional system prompt.
        assistant_name: Name to use for the assistant.
    """
    helper = SimpleTalk(system_prompt=system_prompt, assistant_name=assistant_name)
    await helper.voice_chat()