PyPI - camel-ai - Versions diffs - 0.2.36__py3-none-any.whl → 0.2.38__py3-none-any.whl - Mend

camel-ai 0.2.36__py3-none-any.whl → 0.2.38__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of camel-ai might be problematic. Click here for more details.

Files changed (84)

camel/__init__.py +1 -1
camel/agents/__init__.py +2 -0
camel/agents/repo_agent.py +579 -0
camel/configs/aiml_config.py +20 -19
camel/configs/anthropic_config.py +25 -27
camel/configs/cohere_config.py +11 -10
camel/configs/deepseek_config.py +16 -16
camel/configs/gemini_config.py +8 -8
camel/configs/groq_config.py +18 -19
camel/configs/internlm_config.py +8 -8
camel/configs/litellm_config.py +26 -24
camel/configs/mistral_config.py +8 -8
camel/configs/moonshot_config.py +11 -11
camel/configs/nvidia_config.py +13 -13
camel/configs/ollama_config.py +14 -15
camel/configs/openai_config.py +3 -3
camel/configs/openrouter_config.py +9 -9
camel/configs/qwen_config.py +8 -8
camel/configs/reka_config.py +12 -11
camel/configs/samba_config.py +14 -14
camel/configs/sglang_config.py +15 -16
camel/configs/siliconflow_config.py +18 -17
camel/configs/togetherai_config.py +18 -19
camel/configs/vllm_config.py +18 -19
camel/configs/yi_config.py +7 -8
camel/configs/zhipuai_config.py +8 -9
camel/datagen/evol_instruct/__init__.py +20 -0
camel/datagen/evol_instruct/evol_instruct.py +424 -0
camel/datagen/evol_instruct/scorer.py +166 -0
camel/datagen/evol_instruct/templates.py +268 -0
camel/datasets/static_dataset.py +25 -23
camel/environments/models.py +10 -1
camel/environments/single_step.py +296 -136
camel/extractors/__init__.py +16 -1
camel/interpreters/docker_interpreter.py +1 -1
camel/interpreters/e2b_interpreter.py +1 -1
camel/interpreters/subprocess_interpreter.py +1 -1
camel/loaders/__init__.py +2 -2
camel/loaders/{panda_reader.py → pandas_reader.py} +61 -30
camel/memories/context_creators/score_based.py +198 -67
camel/models/aiml_model.py +9 -3
camel/models/anthropic_model.py +11 -3
camel/models/azure_openai_model.py +9 -3
camel/models/base_audio_model.py +6 -0
camel/models/base_model.py +4 -0
camel/models/deepseek_model.py +9 -3
camel/models/gemini_model.py +9 -3
camel/models/groq_model.py +9 -3
camel/models/internlm_model.py +8 -2
camel/models/model_factory.py +4 -0
camel/models/moonshot_model.py +8 -2
camel/models/nemotron_model.py +9 -3
camel/models/nvidia_model.py +9 -3
camel/models/ollama_model.py +9 -3
camel/models/openai_audio_models.py +5 -3
camel/models/openai_compatible_model.py +9 -3
camel/models/openai_model.py +9 -3
camel/models/openrouter_model.py +9 -3
camel/models/qwen_model.py +9 -3
camel/models/samba_model.py +9 -3
camel/models/sglang_model.py +11 -4
camel/models/siliconflow_model.py +8 -2
camel/models/stub_model.py +2 -1
camel/models/togetherai_model.py +9 -3
camel/models/vllm_model.py +9 -3
camel/models/yi_model.py +9 -3
camel/models/zhipuai_model.py +9 -3
camel/retrievers/auto_retriever.py +14 -0
camel/storages/__init__.py +2 -0
camel/storages/vectordb_storages/__init__.py +2 -0
camel/storages/vectordb_storages/tidb.py +332 -0
camel/toolkits/__init__.py +7 -0
camel/toolkits/browser_toolkit.py +84 -61
camel/toolkits/openai_agent_toolkit.py +131 -0
camel/toolkits/searxng_toolkit.py +207 -0
camel/toolkits/thinking_toolkit.py +230 -0
camel/types/enums.py +4 -0
camel/utils/chunker/code_chunker.py +9 -15
camel/verifiers/base.py +28 -5
camel/verifiers/python_verifier.py +321 -68
{camel_ai-0.2.36.dist-info → camel_ai-0.2.38.dist-info}/METADATA +103 -8
{camel_ai-0.2.36.dist-info → camel_ai-0.2.38.dist-info}/RECORD +84 -75
{camel_ai-0.2.36.dist-info → camel_ai-0.2.38.dist-info}/WHEEL +0 -0
{camel_ai-0.2.36.dist-info → camel_ai-0.2.38.dist-info}/licenses/LICENSE +0 -0

camel/verifiers/python_verifier.py CHANGED Viewed

@@ -12,15 +12,17 @@
 # limitations under the License.
 # ========= Copyright 2023-2024 @ CAMEL-AI.org. All Rights Reserved. =========
+import ast
 import asyncio
 import os
 import shutil
 import subprocess
+import sys
 import tempfile
 import venv
-from typing import List, Optional
+from typing import List, Optional, Tuple
-from camel.extractors import BaseExtractor
+from camel.extractors.base import BaseExtractor
 from camel.logger import get_logger
 from camel.verifiers import BaseVerifier
@@ -46,13 +48,16 @@ class PythonVerifier(BaseVerifier):
     def __init__(
         self,
+        extractor: Optional[BaseExtractor] = None,
         timeout: Optional[float] = 30.0,
         required_packages: Optional[List[str]] = None,
-        extractor: Optional[BaseExtractor] = None,
+        **kwargs,
     ):
         r"""Initializes the PythonVerifier.
         Args:
+            extractor (Optional[BaseExtractor], optional): The extractor to use
+                for extracting code from the solution. (default: :obj:`None`)
             timeout (Optional[float], optional): The execution timeout in
                 seconds. (default: :obj:`30.0`)
             required_packages (Optional[List[str]], optional): A list of
@@ -60,7 +65,7 @@ class PythonVerifier(BaseVerifier):
                 (default: :obj:`None`)
         """
         # TODO: Use CAMEL's Interpreter to execute the code
-        super().__init__(timeout=timeout)
+        super().__init__(extractor=extractor, timeout=timeout, **kwargs)
         self.venv_path: Optional[str] = None
         self.required_packages = required_packages or []
@@ -69,25 +74,39 @@ class PythonVerifier(BaseVerifier):
         else:  # Unix-like systems
             self.bin_dir = 'bin'
-    async def _setup(self) -> None:
-        r"""Set up a virtual environment for execution
-        and install required packages.
-        """
+    async def _setup(self, **kwargs) -> None:
+        r"""Set up a virtual environment and install required packages."""
+        uv = kwargs.get('uv', True)
+        if uv and self._is_uv_environment():
+            logger.info("[UV] Detected uv environment. Using uv for setup.")
+            self._setup_with_uv()
+            return
         self.venv_path = tempfile.mkdtemp()
-        venv.create(self.venv_path, with_pip=True)
-        logger.info(f"Virtual environment created at {self.venv_path}")
+        try:
+            venv.create(self.venv_path, with_pip=True)
+            logger.info(f"Virtual environment created at {self.venv_path}")
+        except Exception as e:
+            logger.error(f"Failed to create virtual environment: {e}")
+            # Clean up resources before re-raising
+            if self.venv_path and os.path.exists(self.venv_path):
+                shutil.rmtree(self.venv_path)
+                self.venv_path = None
+            raise
         venv_pip = os.path.join(self.venv_path, self.bin_dir, "pip")
         if self.required_packages:
             try:
+                # Add timeout to subprocess call
                 subprocess.run(
                     [venv_pip, "install", *self.required_packages],
                     check=True,
                     capture_output=True,
+                    timeout=self._timeout,
                 )
                 logger.info(
-                    "Installed required packages:"
+                    "Installed required packages: "
                     f"{', '.join(self.required_packages)}"
                 )
             except subprocess.CalledProcessError as e:
@@ -95,6 +114,101 @@ class PythonVerifier(BaseVerifier):
                     "Failed to install required packages: "
                     f"{e.stderr.decode().strip()}"
                 )
+                # Clean up resources before re-raising
+                if self.venv_path and os.path.exists(self.venv_path):
+                    shutil.rmtree(self.venv_path)
+                    self.venv_path = None
+                raise
+            except subprocess.TimeoutExpired:
+                logger.error(
+                    f"Package installation timed out "
+                    f"after {self._timeout} seconds"
+                )
+                if self.venv_path and os.path.exists(self.venv_path):
+                    shutil.rmtree(self.venv_path)
+                    self.venv_path = None
+                raise
+    def _is_uv_environment(self) -> bool:
+        r"""Detect whether the current Python runtime is managed by uv."""
+        return "UV_CACHE_DIR" in os.environ or "uv" in sys.executable
+    def _setup_with_uv(self) -> None:
+        r"""Create virtual environment and install packages using uv."""
+        self.venv_path = tempfile.mkdtemp()
+        try:
+            subprocess.run(
+                ["uv", "venv", self.venv_path],
+                check=True,
+                capture_output=True,
+                timeout=self._timeout,
+            )
+            logger.info(
+                f"[UV] Virtual environment created at {self.venv_path}"
+            )
+        except subprocess.CalledProcessError as e:
+            logger.error(
+                "[UV] Failed to create virtual environment:\n"
+                f"{e.stderr.decode().strip()}"
+            )
+            # Clean up resources before re-raising
+            if self.venv_path and os.path.exists(self.venv_path):
+                shutil.rmtree(self.venv_path)
+                self.venv_path = None
+            raise
+        except subprocess.TimeoutExpired:
+            logger.error(
+                f"[UV] Virtual environment creation timed "
+                f"out after {self._timeout} seconds"
+            )
+            if self.venv_path and os.path.exists(self.venv_path):
+                shutil.rmtree(self.venv_path)
+                self.venv_path = None
+            raise
+        if self.required_packages:
+            venv_python = os.path.join(
+                self.venv_path,
+                self.bin_dir,
+                "python.exe" if os.name == 'nt' else "python",
+            )
+            try:
+                subprocess.run(
+                    [
+                        "uv",
+                        "pip",
+                        "install",
+                        "--python",
+                        venv_python,
+                        *self.required_packages,
+                    ],
+                    check=True,
+                    capture_output=True,
+                    timeout=self._timeout,
+                )
+                logger.info(
+                    "[UV] Installed required packages via uv: "
+                    f"{', '.join(self.required_packages)}"
+                )
+            except subprocess.CalledProcessError as e:
+                logger.error(
+                    "[UV] Failed to install required packages via uv:\n"
+                    f"{e.stderr.decode().strip()}"
+                )
+                # Clean up resources before re-raising
+                if self.venv_path and os.path.exists(self.venv_path):
+                    shutil.rmtree(self.venv_path)
+                    self.venv_path = None
+                raise
+            except subprocess.TimeoutExpired:
+                logger.error(
+                    f"[UV] Package installation timed "
+                    f"out after {self._timeout} seconds"
+                )
+                if self.venv_path and os.path.exists(self.venv_path):
+                    shutil.rmtree(self.venv_path)
+                    self.venv_path = None
+                raise
     async def _cleanup(self) -> None:
         r"""Clean up the virtual environment."""
@@ -106,32 +220,27 @@ class PythonVerifier(BaseVerifier):
     async def _verify_implementation(
         self, solution: str, ground_truth: Optional[str]
     ) -> VerificationResult:
-        r"""Executes and verifies the LLM-generated Python solution in an
-        isolated virtual environment.
+        r"""Executes the provided Python solution in an isolated environment
+        and verifies its output against an expected ground truth expression.
+        This method runs the solution in a subprocess inside a virtual
+        environment. The ground truth is assumed to be a pure Python
+        expression and is evaluated directly in the verifier process.
-        This method runs the given Python solution inside a controlled virtual
-        environment, captures its execution output, and optionally compares it
-        against a provided ground truth. Handles timeouts and execution errors.
+        If both executions are successful, the actual output is compared
+        against the evaluated ground truth using semantic equality. If
+        evaluation fails, string comparison is used as a fallback.
         Args:
-            solution (str): The Python code to execute and verify.
-            ground_truth (Optional[str]): The expected output for comparison.
-                If None, verification is based only on execution success.
+            solution (str): The Python code or expression to execute and
+                verify.
+            ground_truth (Optional[str]): The expected value as a Python
+             expression. If None, only execution success is verified.
         Returns:
-            VerificationResult: A structured object containing:
-                - status (VerificationOutcome): SUCCESS, FAILURE, ERROR,
-                or TIMEOUT.
-                - result (str): The execution output of the solution.
-                - error_message (Optional[str]): Captured error message,
-                if any.
-                - duration (float, optional): Execution time (set externally).
-        Raises:
-            asyncio.TimeoutError: If execution exceeds the configured timeout.
-            Exception: Any unexpected errors are caught and converted to an
-                ERROR verification result.
+            VerificationResult: Result of the verification process.
         """
+        # Check for virtual environment setup
         if not self.venv_path:
             return VerificationResult(
                 status=VerificationOutcome.ERROR,
@@ -139,9 +248,51 @@ class PythonVerifier(BaseVerifier):
                 error_message="Virtual environment is not set up.",
             )
-        script = solution.strip()
-        venv_python = os.path.join(self.venv_path, self.bin_dir, "python")
+        # If the solution is an expression, evaluate it directly
+        if self._is_expression(solution):
+            try:
+                sol_val = ast.literal_eval(solution)
+            except Exception as e:
+                return VerificationResult(
+                    status=VerificationOutcome.ERROR,
+                    result="",
+                    error_message=f"Expression evaluation error: {e}",
+                )
+            if ground_truth is not None:
+                try:
+                    gt_val = ast.literal_eval(ground_truth)
+                except Exception as e:
+                    return VerificationResult(
+                        status=VerificationOutcome.ERROR,
+                        result="",
+                        error_message=f"Ground truth evaluation error: {e}",
+                    )
+                if sol_val == gt_val:
+                    return VerificationResult(
+                        status=VerificationOutcome.SUCCESS,
+                        result=str(sol_val),
+                    )
+                else:
+                    return VerificationResult(
+                        status=VerificationOutcome.FAILURE,
+                        result=str(sol_val),
+                        error_message="Output mismatch: "
+                        f"{sol_val} != {gt_val}",
+                    )
+            else:
+                return VerificationResult(
+                    status=VerificationOutcome.SUCCESS,
+                    result=str(sol_val),
+                )
+        # Otherwise, run the code block,
+        # which should already include a print(...) in the end
+        venv_python = os.path.join(
+            self.venv_path,
+            self.bin_dir,
+            "python.exe" if os.name == 'nt' else "python",
+        )
         if not os.path.exists(venv_python):
             return VerificationResult(
                 status=VerificationOutcome.ERROR,
@@ -150,64 +301,166 @@ class PythonVerifier(BaseVerifier):
             )
         try:
-            process = await asyncio.create_subprocess_exec(
-                venv_python,
-                "-c",
-                script,
-                stdout=asyncio.subprocess.PIPE,
-                stderr=asyncio.subprocess.PIPE,
-            )
-            stdout, stderr = await asyncio.wait_for(
-                process.communicate(), timeout=self._timeout
+            sol_out, sol_err, sol_code = await self._run_code_block(
+                solution, venv_python
             )
+            if sol_code != 0:
+                return VerificationResult(
+                    status=VerificationOutcome.ERROR,
+                    result=sol_out,
+                    error_message=f"Solution code error:\n{sol_err}",
+                )
-            output_result = stdout.decode().strip()
-            error_output = stderr.decode().strip()
-            if process.returncode == 0:
-                # If ground truth is provided, compare it with the result
-                if ground_truth is not None:
-                    # Normalize both strings by removing extra whitespace
-                    normalized_output = ' '.join(output_result.strip().split())
-                    normalized_truth = ' '.join(
-                        str(ground_truth).strip().split()
+            if ground_truth is not None:
+                try:
+                    # First, try to evaluate the output as-is.
+                    sol_val = ast.literal_eval(sol_out)
+                except Exception as e:
+                    logger.warning(
+                        f"Direct eval failed: {e}. Trying repr on output."
                     )
+                    try:
+                        # Try to convert sol_out to a literal
+                        # by wrapping it with repr.
+                        # FIXME: may be unnecessary
+                        sol_val = ast.literal_eval(repr(sol_out))
+                    except Exception as e2:
+                        logger.warning(
+                            f"repr eval also failed: {e2}."
+                            "Falling back to string comparison."
+                        )
+                        sol_val = None
-                    if normalized_output == normalized_truth:
+                if sol_val is not None:
+                    try:
+                        gt_val = ast.literal_eval(ground_truth)
+                    except Exception as e:
+                        return VerificationResult(
+                            status=VerificationOutcome.ERROR,
+                            result="",
+                            error_message="Ground truth evaluation error:"
+                            f"{e}",
+                        )
+                    if sol_val == gt_val:
                         return VerificationResult(
                             status=VerificationOutcome.SUCCESS,
-                            result=output_result,
+                            result=sol_out,
                         )
                     else:
                         return VerificationResult(
                             status=VerificationOutcome.FAILURE,
-                            error_message="Output doesn't match ground truth",
-                            result=output_result,
+                            result=sol_out,
+                            error_message="Output mismatch: "
+                            f"{sol_val} != {gt_val}",
                         )
                 else:
-                    return VerificationResult(
-                        status=VerificationOutcome.SUCCESS,
-                        result=output_result,
-                    )
+                    # Fallback: string comparison
+                    if sol_out.strip() == ground_truth.strip():
+                        return VerificationResult(
+                            status=VerificationOutcome.SUCCESS,
+                            result=sol_out,
+                        )
+                    else:
+                        return VerificationResult(
+                            status=VerificationOutcome.FAILURE,
+                            result=sol_out,
+                            error_message="Fallback string mismatch: "
+                            f"'{sol_out}' != '{ground_truth}'",
+                        )
             else:
                 return VerificationResult(
-                    status=VerificationOutcome.ERROR,
-                    error_message=error_output,
-                    result=output_result,
+                    status=VerificationOutcome.SUCCESS,
+                    result=sol_out,
                 )
         except asyncio.TimeoutError:
             return VerificationResult(
                 status=VerificationOutcome.TIMEOUT,
                 result="",
                 error_message="Execution timed out.",
             )
         except Exception as e:
             return VerificationResult(
                 status=VerificationOutcome.ERROR,
                 result="",
-                error_message=f"Execution error: {e}",
+                error_message=f"Unexpected error: {e}",
             )
+    async def _run_code_block(
+        self, code: str, venv_path: str
+    ) -> Tuple[str, str, int]:
+        r"""Executes a block of Python code in the virtual environment.
+        The code is written to a temporary file, executed using the Python
+        interpreter from the specified virtual environment, and
+        its output and error streams are captured.
+        Args:
+            code (str): The Python code to execute.
+            venv_path (str): The path to the virtual environment's Python
+                binary.
+        Returns:
+            Tuple[str, str, int]: A tuple containing the stdout output,
+            stderr output, and return code from the executed script.
+        """
+        # No longer checking for expressions since they're handled separately
+        with tempfile.NamedTemporaryFile(
+            "w+", suffix=".py", delete=False
+        ) as tmp:
+            tmp.write(code)
+            tmp_path = tmp.name
+        proc = await asyncio.create_subprocess_exec(
+            venv_path,
+            tmp_path,
+            stdout=asyncio.subprocess.PIPE,
+            stderr=asyncio.subprocess.PIPE,
+        )
+        stdout, stderr = await asyncio.wait_for(
+            proc.communicate(), timeout=self._timeout
+        )
+        os.remove(tmp_path)
+        return (
+            stdout.decode().strip(),
+            stderr.decode().strip(),
+            proc.returncode if proc.returncode is not None else -1,
+        )
+    def _is_expression(self, code: str) -> bool:
+        r"""Determines whether a given string of code is a single expression.
+        This utility uses Python's AST module to parse the code and checks if
+        it consists of a single expression node.
+        Args:
+            code (str): The Python code to analyze.
+        Returns:
+            bool: True if the code is a single expression, False otherwise.
+        """
+        # Skip empty or whitespace-only strings
+        if not code or code.isspace():
+            return False
+        try:
+            # First try parsing as an expression - this is more reliable than
+            # starting with literal_eval
+            tree = ast.parse(code.strip(), mode='eval')
+            # Check if it's a function call (like print()) - these should not
+            # be treated as expressions
+            if isinstance(tree.body, ast.Call):
+                return False
+            # If parsing succeeds in 'eval' mode and it's not a function call,
+            # it's a valid expression
+            return True
+        except SyntaxError:
+            # If parsing as expression fails, it's not a valid expression
+            return False
+        except Exception:
+            # For any other parsing errors, try literal_eval as fallback for
+            # simple literals
+            try:
+                ast.literal_eval(code)
+                return True
+            except Exception:
+                return False

camel-ai 0.2.36__py3-none-any.whl → 0.2.38__py3-none-any.whl

Potentially problematic release.

camel-ai 0.2.36__py3-none-any.whl → 0.2.38__py3-none-any.whl