PyPI - camel-ai - Versions diffs - 0.2.23a0__py3-none-any.whl → 0.2.25__py3-none-any.whl - Mend

camel-ai 0.2.23a0__py3-none-any.whl → 0.2.25__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of camel-ai might be problematic. Click here for more details.

Files changed (31) hide show

camel/__init__.py +1 -1
camel/agents/chat_agent.py +16 -2
camel/configs/anthropic_config.py +45 -11
camel/configs/sglang_config.py +7 -5
camel/datagen/self_improving_cot.py +2 -2
camel/datagen/self_instruct/self_instruct.py +46 -2
camel/interpreters/subprocess_interpreter.py +187 -46
camel/models/__init__.py +2 -0
camel/models/anthropic_model.py +5 -1
camel/models/base_audio_model.py +92 -0
camel/models/fish_audio_model.py +18 -8
camel/models/model_manager.py +9 -0
camel/models/openai_audio_models.py +80 -1
camel/models/sglang_model.py +35 -5
camel/societies/role_playing.py +119 -0
camel/toolkits/__init__.py +17 -1
camel/toolkits/audio_analysis_toolkit.py +238 -0
camel/toolkits/excel_toolkit.py +172 -0
camel/toolkits/file_write_toolkit.py +371 -0
camel/toolkits/image_analysis_toolkit.py +202 -0
camel/toolkits/mcp_toolkit.py +251 -0
camel/toolkits/page_script.js +376 -0
camel/toolkits/terminal_toolkit.py +421 -0
camel/toolkits/video_analysis_toolkit.py +407 -0
camel/toolkits/{video_toolkit.py → video_download_toolkit.py} +19 -25
camel/toolkits/web_toolkit.py +1306 -0
camel/types/enums.py +3 -0
{camel_ai-0.2.23a0.dist-info → camel_ai-0.2.25.dist-info}/METADATA +241 -106
{camel_ai-0.2.23a0.dist-info → camel_ai-0.2.25.dist-info}/RECORD +60 -50
{camel_ai-0.2.23a0.dist-info → camel_ai-0.2.25.dist-info}/WHEEL +1 -1
{camel_ai-0.2.23a0.dist-info → camel_ai-0.2.25.dist-info/licenses}/LICENSE +0 -0

camel/toolkits/audio_analysis_toolkit.py ADDED Viewed

@@ -0,0 +1,238 @@
+# ========= Copyright 2023-2024 @ CAMEL-AI.org. All Rights Reserved. =========
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ========= Copyright 2023-2024 @ CAMEL-AI.org. All Rights Reserved. =========
+import os
+import uuid
+from typing import List, Optional
+from urllib.parse import urlparse
+import requests
+from camel.logger import get_logger
+from camel.messages import BaseMessage
+from camel.models import BaseAudioModel, BaseModelBackend, OpenAIAudioModels
+from camel.toolkits.base import BaseToolkit
+from camel.toolkits.function_tool import FunctionTool
+logger = get_logger(__name__)
+def download_file(url: str, cache_dir: str) -> str:
+    r"""Download a file from a URL to a local cache directory.
+    Args:
+        url (str): The URL of the file to download.
+        cache_dir (str): The directory to save the downloaded file.
+    Returns:
+        str: The path to the downloaded file.
+    Raises:
+        Exception: If the download fails.
+    """
+    # Create cache directory if it doesn't exist
+    os.makedirs(cache_dir, exist_ok=True)
+    # Extract filename from URL or generate a unique one
+    parsed_url = urlparse(url)
+    filename = os.path.basename(parsed_url.path)
+    if not filename:
+        # Generate a unique filename if none is provided in the URL
+        file_ext = ".mp3"  # Default extension
+        content_type = None
+        # Try to get the file extension from the content type
+        try:
+            response = requests.head(url)
+            content_type = response.headers.get('Content-Type', '')
+            if 'audio/wav' in content_type:
+                file_ext = '.wav'
+            elif 'audio/mpeg' in content_type:
+                file_ext = '.mp3'
+            elif 'audio/ogg' in content_type:
+                file_ext = '.ogg'
+        except Exception:
+            pass
+        filename = f"{uuid.uuid4()}{file_ext}"
+    local_path = os.path.join(cache_dir, filename)
+    # Download the file
+    response = requests.get(url, stream=True)
+    response.raise_for_status()
+    with open(local_path, 'wb') as f:
+        for chunk in response.iter_content(chunk_size=8192):
+            f.write(chunk)
+    logger.debug(f"Downloaded file from {url} to {local_path}")
+    return local_path
+class AudioAnalysisToolkit(BaseToolkit):
+    r"""A toolkit for audio processing and analysis.
+    This class provides methods for processing, transcribing, and extracting
+    information from audio data, including direct question answering about
+    audio content.
+    Args:
+        cache_dir (Optional[str]): Directory path for caching downloaded audio
+            files. If not provided, 'tmp/' will be used. (default: :obj:`None`)
+        transcribe_model (Optional[BaseAudioModel]): Model used for audio
+            transcription. If not provided, OpenAIAudioModels will be used.
+            (default: :obj:`None`)
+        audio_reasoning_model (Optional[BaseModelBackend]): Model used for
+            audio reasoning and question answering. If not provided, uses the
+            default model from ChatAgent. (default: :obj:`None`)
+    """
+    def __init__(
+        self,
+        cache_dir: Optional[str] = None,
+        transcribe_model: Optional[BaseAudioModel] = None,
+        audio_reasoning_model: Optional[BaseModelBackend] = None,
+    ):
+        self.cache_dir = 'tmp/'
+        if cache_dir:
+            self.cache_dir = cache_dir
+        if transcribe_model:
+            self.transcribe_model = transcribe_model
+        else:
+            self.transcribe_model = OpenAIAudioModels()
+            logger.warning(
+                "No audio transcription model provided. "
+                "Using OpenAIAudioModels."
+            )
+        from camel.agents import ChatAgent
+        if audio_reasoning_model:
+            self.audio_agent = ChatAgent(model=audio_reasoning_model)
+        else:
+            self.audio_agent = ChatAgent()
+            logger.warning(
+                "No audio reasoning model provided. Using default model in"
+                " ChatAgent."
+            )
+    def audio2text(self, audio_path: str) -> str:
+        r"""Transcribe audio to text.
+        Args:
+            audio_path (str): The path to the audio file or URL.
+        Returns:
+            str: The transcribed text.
+        """
+        logger.debug(
+            f"Calling transcribe_audio method for audio file `{audio_path}`."
+        )
+        try:
+            audio_transcript = self.transcribe_model.speech_to_text(audio_path)
+            if not audio_transcript:
+                logger.warning("Audio transcription returned empty result")
+                return "No audio transcription available."
+            return audio_transcript
+        except Exception as e:
+            logger.error(f"Audio transcription failed: {e}")
+            return "Audio transcription failed."
+    def ask_question_about_audio(self, audio_path: str, question: str) -> str:
+        r"""Ask any question about the audio and get the answer using
+        multimodal model.
+        Args:
+            audio_path (str): The path to the audio file.
+            question (str): The question to ask about the audio.
+        Returns:
+            str: The answer to the question.
+        """
+        logger.debug(
+            f"Calling ask_question_about_audio method for audio file \
+            `{audio_path}` and question `{question}`."
+        )
+        parsed_url = urlparse(audio_path)
+        is_url = all([parsed_url.scheme, parsed_url.netloc])
+        local_audio_path = audio_path
+        # If the audio is a URL, download it first
+        if is_url:
+            try:
+                local_audio_path = download_file(audio_path, self.cache_dir)
+            except Exception as e:
+                logger.error(f"Failed to download audio file: {e}")
+                return f"Failed to download audio file: {e!s}"
+        # Try direct audio question answering first
+        try:
+            # Check if the transcribe_model supports audio_question_answering
+            if hasattr(self.transcribe_model, 'audio_question_answering'):
+                logger.debug("Using direct audio question answering")
+                response = self.transcribe_model.audio_question_answering(
+                    local_audio_path, question
+                )
+                return response
+        except Exception as e:
+            logger.warning(
+                f"Direct audio question answering failed: {e}. "
+                "Falling back to transcription-based approach."
+            )
+        # Fallback to transcription-based approach
+        try:
+            transcript = self.audio2text(local_audio_path)
+            reasoning_prompt = f"""
+            <speech_transcription_result>{transcript}</
+            speech_transcription_result>
+            Please answer the following question based on the speech
+            transcription result above:
+            <question>{question}</question>
+            """
+            msg = BaseMessage.make_user_message(
+                role_name="User", content=reasoning_prompt
+            )
+            response = self.audio_agent.step(msg)
+            if not response or not response.msgs:
+                logger.error("Model returned empty response")
+                return (
+                    "Failed to generate an answer. "
+                    "The model returned an empty response."
+                )
+            answer = response.msgs[0].content
+            return answer
+        except Exception as e:
+            logger.error(f"Audio question answering failed: {e}")
+            return f"Failed to answer question about audio: {e!s}"
+    def get_tools(self) -> List[FunctionTool]:
+        r"""Returns a list of FunctionTool objects representing the functions
+            in the toolkit.
+        Returns:
+            List[FunctionTool]: A list of FunctionTool objects representing the
+                functions in the toolkit.
+        """
+        return [
+            FunctionTool(self.ask_question_about_audio),
+            FunctionTool(self.audio2text),
+        ]

camel/toolkits/excel_toolkit.py ADDED Viewed

@@ -0,0 +1,172 @@
+# ========= Copyright 2023-2024 @ CAMEL-AI.org. All Rights Reserved. =========
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ========= Copyright 2023-2024 @ CAMEL-AI.org. All Rights Reserved. =========
+from typing import List
+import pandas as pd
+from camel.logger import get_logger
+from camel.toolkits.base import BaseToolkit
+from camel.toolkits.function_tool import FunctionTool
+logger = get_logger(__name__)
+class ExcelToolkit(BaseToolkit):
+    r"""A class representing a toolkit for extract detailed cell information
+    from an Excel file.
+    This class provides method for processing docx, pdf, pptx, etc. It cannot
+    process excel files.
+    """
+    def _convert_to_markdown(self, df: pd.DataFrame) -> str:
+        r"""Convert DataFrame to Markdown format table.
+        Args:
+            df (pd.DataFrame): DataFrame containing the Excel data.
+        Returns:
+            str: Markdown formatted table.
+        """
+        from tabulate import tabulate
+        md_table = tabulate(df, headers='keys', tablefmt='pipe')
+        return str(md_table)
+    def extract_excel_content(self, document_path: str) -> str:
+        r"""Extract detailed cell information from an Excel file, including
+        multiple sheets.
+        Args:
+            document_path (str): The path of the Excel file.
+        Returns:
+            str: Extracted excel information, including details of each sheet.
+        """
+        from openpyxl import load_workbook
+        from xls2xlsx import XLS2XLSX
+        logger.debug(
+            f"Calling extract_excel_content with document_path"
+            f": {document_path}"
+        )
+        if not (
+            document_path.endswith("xls")
+            or document_path.endswith("xlsx")
+            or document_path.endswith("csv")
+        ):
+            logger.error("Only xls, xlsx, csv files are supported.")
+            return (
+                f"Failed to process file {document_path}: "
+                f"It is not excel format. Please try other ways."
+            )
+        if document_path.endswith("csv"):
+            try:
+                df = pd.read_csv(document_path)
+                md_table = self._convert_to_markdown(df)
+                return f"CSV File Processed:\n{md_table}"
+            except Exception as e:
+                logger.error(f"Failed to process file {document_path}: {e}")
+                return f"Failed to process file {document_path}: {e}"
+        if document_path.endswith("xls"):
+            output_path = document_path.replace(".xls", ".xlsx")
+            x2x = XLS2XLSX(document_path)
+            x2x.to_xlsx(output_path)
+            document_path = output_path
+        # Load the Excel workbook
+        wb = load_workbook(document_path, data_only=True)
+        sheet_info_list = []
+        # Iterate through all sheets
+        for sheet in wb.sheetnames:
+            ws = wb[sheet]
+            cell_info_list = []
+            for row in ws.iter_rows():
+                for cell in row:
+                    row_num = cell.row
+                    col_letter = cell.column_letter
+                    cell_value = cell.value
+                    font_color = None
+                    if (
+                        cell.font
+                        and cell.font.color
+                        and "rgb=None" not in str(cell.font.color)
+                    ):  # Handle font color
+                        font_color = cell.font.color.rgb
+                    fill_color = None
+                    if (
+                        cell.fill
+                        and cell.fill.fgColor
+                        and "rgb=None" not in str(cell.fill.fgColor)
+                    ):  # Handle fill color
+                        fill_color = cell.fill.fgColor.rgb
+                    cell_info_list.append(
+                        {
+                            "index": f"{row_num}{col_letter}",
+                            "value": cell_value,
+                            "font_color": font_color,
+                            "fill_color": fill_color,
+                        }
+                    )
+            # Convert the sheet to a DataFrame and then to markdown
+            sheet_df = pd.read_excel(
+                document_path, sheet_name=sheet, engine='openpyxl'
+            )
+            markdown_content = self._convert_to_markdown(sheet_df)
+            # Collect all information for the sheet
+            sheet_info = {
+                "sheet_name": sheet,
+                "cell_info_list": cell_info_list,
+                "markdown_content": markdown_content,
+            }
+            sheet_info_list.append(sheet_info)
+        result_str = ""
+        for sheet_info in sheet_info_list:
+            result_str += f"""
+            Sheet Name: {sheet_info['sheet_name']}
+            Cell information list:
+            {sheet_info['cell_info_list']}
+            Markdown View of the content:
+            {sheet_info['markdown_content']}
+            {'-'*40}
+            """
+        return result_str
+    def get_tools(self) -> List[FunctionTool]:
+        r"""Returns a list of FunctionTool objects representing the functions
+        in the toolkit.
+        Returns:
+            List[FunctionTool]: A list of FunctionTool objects representing
+                the functions in the toolkit.
+        """
+        return [
+            FunctionTool(self.extract_excel_content),
+        ]

camel-ai 0.2.23a0__py3-none-any.whl → 0.2.25__py3-none-any.whl

Potentially problematic release.

camel-ai 0.2.23a0__py3-none-any.whl → 0.2.25__py3-none-any.whl