camel-ai 0.2.76a9__py3-none-any.whl → 0.2.76a12__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release: this version of camel-ai might be problematic.

camel/__init__.py CHANGED
@@ -14,7 +14,7 @@
 
 from camel.logger import disable_logging, enable_logging, set_log_level
 
-__version__ = '0.2.76a9'
+__version__ = '0.2.76a12'
 
 __all__ = [
     '__version__',
@@ -34,6 +34,12 @@ class ChunkrReaderConfig:
         high_resolution (bool, optional): Whether to use high resolution OCR.
             (default: :obj:`True`)
         ocr_strategy (str, optional): The OCR strategy. Defaults to 'Auto'.
+        **kwargs: Additional keyword arguments to pass to the Chunkr
+            Configuration. This accepts all other Configuration parameters
+            such as expires_in, pipeline, segment_processing,
+            segmentation_strategy, etc.
+            See: https://github.com/lumina-ai-inc/chunkr/blob/main/core/src/
+            models/task.rs#L749
     """
 
     def __init__(
@@ -41,10 +47,12 @@ class ChunkrReaderConfig:
         chunk_processing: int = 512,
         high_resolution: bool = True,
         ocr_strategy: str = "Auto",
+        **kwargs,
    ):
         self.chunk_processing = chunk_processing
         self.high_resolution = high_resolution
         self.ocr_strategy = ocr_strategy
+        self.kwargs = kwargs
 
 
 class ChunkrReader:
@@ -190,4 +198,5 @@ class ChunkrReader:
                 "Auto": OcrStrategy.AUTO,
                 "All": OcrStrategy.ALL,
             }.get(chunkr_config.ocr_strategy, OcrStrategy.ALL),
+            **chunkr_config.kwargs,
         )
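With the new **kwargs passthrough, extra Chunkr Configuration options can be set on the reader config and are splatted into the Configuration call shown above. A minimal usage sketch, assuming ChunkrReaderConfig is exported from camel.loaders and that expires_in/pipeline are valid Chunkr Configuration fields (the values are illustrative):

    from camel.loaders import ChunkrReaderConfig  # assumed export location

    config = ChunkrReaderConfig(
        chunk_processing=512,
        high_resolution=True,
        ocr_strategy="Auto",
        # Anything else is kept in config.kwargs and forwarded to the Chunkr
        # Configuration via **chunkr_config.kwargs, as the hunk above shows.
        expires_in=3600,   # assumed Chunkr Configuration field
        pipeline="Azure",  # assumed value; see the linked task.rs model
    )

    print(config.kwargs)  # {'expires_in': 3600, 'pipeline': 'Azure'}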
camel/memories/records.py CHANGED
@@ -94,6 +94,42 @@ class MemoryRecord(BaseModel):
         if "role_type" in data and isinstance(data["role_type"], str):
             data["role_type"] = RoleType(data["role_type"])
 
+        # Deserialize image_list from base64 strings/URLs back to PIL Images/
+        # URLs
+        if "image_list" in data and data["image_list"] is not None:
+            import base64
+            from io import BytesIO
+
+            from PIL import Image
+
+            image_objects = []
+            for img_item in data["image_list"]:
+                if isinstance(img_item, dict):
+                    # New format with type indicator
+                    if img_item["type"] == "url":
+                        # URL string, keep as-is
+                        image_objects.append(img_item["data"])
+                    else:  # type == "base64"
+                        # Base64 encoded image, convert to PIL Image
+                        img_bytes = base64.b64decode(img_item["data"])
+                        img = Image.open(BytesIO(img_bytes))
+                        # Restore the format attribute if it was saved
+                        if "format" in img_item:
+                            img.format = img_item["format"]
+                        image_objects.append(img)
+                else:
+                    # Legacy format: assume it's a base64 string
+                    img_bytes = base64.b64decode(img_item)
+                    img = Image.open(BytesIO(img_bytes))
+                    image_objects.append(img)
+            data["image_list"] = image_objects
+
+        # Deserialize video_bytes from base64 string
+        if "video_bytes" in data and data["video_bytes"] is not None:
+            import base64
+
+            data["video_bytes"] = base64.b64decode(data["video_bytes"])
+
         # Get valid constructor parameters (cached)
         valid_params = cls._get_constructor_params(message_cls)
 
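The decode path above mirrors the serialized layout written by BaseMessage.to_dict further down in this diff: each image entry is either {"type": "url", "data": ...} or {"type": "base64", "data": ..., "format": ...}. A standalone round-trip sketch for one base64 entry (plain PIL and base64, no camel classes):

    import base64
    from io import BytesIO

    from PIL import Image

    # Encode: a PIL image becomes {"type": "base64", "data": ..., "format": ...}
    original = Image.new("RGB", (4, 4), color="red")
    buffer = BytesIO()
    original.save(buffer, format="PNG")
    entry = {
        "type": "base64",
        "data": base64.b64encode(buffer.getvalue()).decode(),
        "format": "PNG",
    }

    # Decode: the same steps the block above uses to rebuild the PIL image
    restored = Image.open(BytesIO(base64.b64decode(entry["data"])))
    restored.format = entry.get("format", restored.format)
    assert restored.size == (4, 4)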
camel/messages/base.py CHANGED
@@ -64,8 +64,9 @@ class BaseMessage:
         content (str): The content of the message.
         video_bytes (Optional[bytes]): Optional bytes of a video associated
             with the message. (default: :obj:`None`)
-        image_list (Optional[List[Image.Image]]): Optional list of PIL Image
-            objects associated with the message. (default: :obj:`None`)
+        image_list (Optional[List[Union[Image.Image, str]]]): Optional list of
+            PIL Image objects or image URLs (strings) associated with the
+            message. (default: :obj:`None`)
         image_detail (Literal["auto", "low", "high"]): Detail level of the
             images associated with the message. (default: :obj:`auto`)
         video_detail (Literal["auto", "low", "high"]): Detail level of the
@@ -80,7 +81,7 @@ class BaseMessage:
     content: str
 
     video_bytes: Optional[bytes] = None
-    image_list: Optional[List[Image.Image]] = None
+    image_list: Optional[List[Union[Image.Image, str]]] = None
     image_detail: Literal["auto", "low", "high"] = "auto"
     video_detail: Literal["auto", "low", "high"] = "auto"
     parsed: Optional[Union[BaseModel, dict]] = None
@@ -92,7 +93,7 @@ class BaseMessage:
         content: str,
         meta_dict: Optional[Dict[str, str]] = None,
         video_bytes: Optional[bytes] = None,
-        image_list: Optional[List[Image.Image]] = None,
+        image_list: Optional[List[Union[Image.Image, str]]] = None,
         image_detail: Union[
             OpenAIVisionDetailType, str
         ] = OpenAIVisionDetailType.AUTO,
@@ -109,8 +110,9 @@ class BaseMessage:
                 dictionary for the message.
             video_bytes (Optional[bytes]): Optional bytes of a video
                 associated with the message.
-            image_list (Optional[List[Image.Image]]): Optional list of PIL
-                Image objects associated with the message.
+            image_list (Optional[List[Union[Image.Image, str]]]): Optional list
+                of PIL Image objects or image URLs (strings) associated with
+                the message.
             image_detail (Union[OpenAIVisionDetailType, str]): Detail level of
                 the images associated with the message.
             video_detail (Union[OpenAIVisionDetailType, str]): Detail level of
@@ -137,7 +139,7 @@ class BaseMessage:
         content: str,
         meta_dict: Optional[Dict[str, str]] = None,
         video_bytes: Optional[bytes] = None,
-        image_list: Optional[List[Image.Image]] = None,
+        image_list: Optional[List[Union[Image.Image, str]]] = None,
         image_detail: Union[
             OpenAIVisionDetailType, str
         ] = OpenAIVisionDetailType.AUTO,
@@ -154,8 +156,9 @@ class BaseMessage:
                 dictionary for the message.
             video_bytes (Optional[bytes]): Optional bytes of a video
                 associated with the message.
-            image_list (Optional[List[Image.Image]]): Optional list of PIL
-                Image objects associated with the message.
+            image_list (Optional[List[Union[Image.Image, str]]]): Optional list
+                of PIL Image objects or image URLs (strings) associated with
+                the message.
             image_detail (Union[OpenAIVisionDetailType, str]): Detail level of
                 the images associated with the message.
             video_detail (Union[OpenAIVisionDetailType, str]): Detail level of
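Since image_list now accepts plain URL strings alongside PIL images, a single message can mix both. A hedged construction sketch, assuming the usual BaseMessage.make_user_message factory (the local path and URL are illustrative):

    from PIL import Image

    from camel.messages import BaseMessage

    local_img = Image.open("figure.png")  # illustrative local file
    msg = BaseMessage.make_user_message(
        role_name="user",
        content="Compare these two charts.",
        image_list=[
            "https://example.com/chart.png",  # URL string, passed through as-is
            local_img,                        # PIL image, base64-encoded on send
        ],
        image_detail="high",
    )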
@@ -436,31 +439,64 @@ class BaseMessage:
             )
         if self.image_list and len(self.image_list) > 0:
             for image in self.image_list:
-                if image.format is None:
-                    # Set default format to PNG as fallback
-                    image.format = 'PNG'
-
-                image_type: str = image.format.lower()
-                if image_type not in OpenAIImageType:
-                    raise ValueError(
-                        f"Image type {image.format} "
-                        f"is not supported by OpenAI vision model"
+                # Check if image is a URL string or PIL Image
+                if isinstance(image, str):
+                    # Image is a URL string
+                    hybrid_content.append(
+                        {
+                            "type": "image_url",
+                            "image_url": {
+                                "url": image,
+                                "detail": self.image_detail,
+                            },
+                        }
                     )
-                with io.BytesIO() as buffer:
-                    image.save(fp=buffer, format=image.format)
-                    encoded_image = base64.b64encode(buffer.getvalue()).decode(
-                        "utf-8"
+                else:
+                    # Image is a PIL Image object
+                    if image.format is None:
+                        # Set default format to PNG as fallback
+                        image.format = 'PNG'
+
+                    image_type: str = image.format.lower()
+                    if image_type not in OpenAIImageType:
+                        raise ValueError(
+                            f"Image type {image.format} "
+                            f"is not supported by OpenAI vision model"
+                        )
+
+                    # Convert RGBA to RGB for formats that don't support
+                    # transparency or when the image has transparency channel
+                    img_to_save = image
+                    if image.mode in ('RGBA', 'LA', 'P') and image_type in (
+                        'jpeg',
+                        'jpg',
+                    ):
+                        # JPEG doesn't support transparency, convert to RGB
+                        img_to_save = image.convert('RGB')
+                    elif (
+                        image.mode in ('RGBA', 'LA', 'P')
+                        and image_type == 'png'
+                    ):
+                        # For PNG with transparency, convert to RGBA if needed
+                        if image.mode in ('LA', 'P'):
+                            img_to_save = image.convert('RGBA')
+                        # else: RGBA mode, keep as-is
+
+                    with io.BytesIO() as buffer:
+                        img_to_save.save(fp=buffer, format=image.format)
+                        encoded_image = base64.b64encode(
+                            buffer.getvalue()
+                        ).decode("utf-8")
+                    image_prefix = f"data:image/{image_type};base64,"
+                    hybrid_content.append(
+                        {
+                            "type": "image_url",
+                            "image_url": {
+                                "url": f"{image_prefix}{encoded_image}",
+                                "detail": self.image_detail,
+                            },
+                        }
                     )
-                image_prefix = f"data:image/{image_type};base64,"
-                hybrid_content.append(
-                    {
-                        "type": "image_url",
-                        "image_url": {
-                            "url": f"{image_prefix}{encoded_image}",
-                            "detail": self.image_detail,
-                        },
-                    }
-                )
 
         if self.video_bytes:
             import imageio.v3 as iio
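The branch above means a URL entry passes straight through while a PIL image becomes a base64 data URI. A standalone sketch of the two resulting OpenAI-style content items (the helper is illustrative, not part of camel):

    import base64
    import io

    from PIL import Image

    def to_image_content(image, detail="auto"):
        # URLs pass through unchanged; PIL images are serialized to a
        # base64 data URI, mirroring the hunk above.
        if isinstance(image, str):
            url = image
        else:
            fmt = (image.format or "PNG").lower()
            buffer = io.BytesIO()
            image.save(buffer, format=image.format or "PNG")
            encoded = base64.b64encode(buffer.getvalue()).decode("utf-8")
            url = f"data:image/{fmt};base64,{encoded}"
        return {"type": "image_url", "image_url": {"url": url, "detail": detail}}

    print(to_image_content("https://example.com/chart.png"))
    print(to_image_content(Image.new("RGB", (2, 2)))["image_url"]["url"][:30])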
@@ -552,9 +588,66 @@ class BaseMessage:
         Returns:
             dict: The converted dictionary.
         """
-        return {
+        result = {
             "role_name": self.role_name,
             "role_type": self.role_type.value,
             **(self.meta_dict or {}),
             "content": self.content,
         }
+
+        # Include image/video fields if present
+        if self.image_list is not None:
+            # Handle both PIL Images and URL strings
+            import base64
+            from io import BytesIO
+
+            image_data_list = []
+            for img in self.image_list:
+                if isinstance(img, str):
+                    # Image is a URL string, store as-is
+                    image_data_list.append({"type": "url", "data": img})
+                else:
+                    # Image is a PIL Image, convert to base64
+                    # Preserve format, default to PNG if not set
+                    img_format = img.format if img.format else "PNG"
+
+                    # Handle transparency for different formats
+                    img_to_save = img
+                    if img.mode in (
+                        'RGBA',
+                        'LA',
+                        'P',
+                    ) and img_format.upper() in ('JPEG', 'JPG'):
+                        # JPEG doesn't support transparency, convert to RGB
+                        img_to_save = img.convert('RGB')
+                    elif (
+                        img.mode in ('LA', 'P') and img_format.upper() == 'PNG'
+                    ):
+                        # For PNG with transparency, convert to RGBA if needed
+                        img_to_save = img.convert('RGBA')
+                    # else: keep as-is for other combinations
+
+                    buffered = BytesIO()
+                    img_to_save.save(buffered, format=img_format)
+                    img_str = base64.b64encode(buffered.getvalue()).decode()
+                    image_data_list.append(
+                        {
+                            "type": "base64",
+                            "data": img_str,
+                            "format": img_format,  # Preserve format
+                        }
+                    )
+            result["image_list"] = image_data_list
+
+        if self.video_bytes is not None:
+            import base64
+
+            result["video_bytes"] = base64.b64encode(self.video_bytes).decode()
+
+        if self.image_detail is not None:
+            result["image_detail"] = self.image_detail
+
+        if self.video_detail is not None:
+            result["video_detail"] = self.video_detail
+
+        return result
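Putting the two previous hunks together, a message carrying one URL and one PIL image would serialize roughly like this (construction as in the earlier sketch; the keys are the ones introduced above):

    from PIL import Image

    from camel.messages import BaseMessage

    msg = BaseMessage.make_user_message(
        role_name="user",
        content="hello",
        image_list=["https://example.com/a.png", Image.new("RGB", (2, 2))],
    )

    d = msg.to_dict()
    # Expected shape based on the hunk above (base64 payload abbreviated):
    # d["image_list"] == [
    #     {"type": "url", "data": "https://example.com/a.png"},
    #     {"type": "base64", "data": "<...>", "format": "PNG"},
    # ]
    print(d["role_name"], d["image_detail"], len(d["image_list"]))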
@@ -16,8 +16,11 @@ from collections import defaultdict, deque
 from enum import Enum
 from typing import Dict, List, Optional, Set
 
+from camel.logger import get_logger
 from camel.tasks import Task
 
+logger = get_logger(__name__)
+
 
 class PacketStatus(Enum):
     r"""The status of a packet. The packet can be in one of the following
@@ -269,6 +272,46 @@ class TaskChannel:
         async with self._condition:
             return list(self._task_by_status[PacketStatus.ARCHIVED])
 
+    async def get_in_flight_tasks(self, publisher_id: str) -> List[Task]:
+        r"""Get all tasks that are currently in-flight (SENT, RETURNED
+        or PROCESSING) published by the given publisher.
+
+        Args:
+            publisher_id (str): The ID of the publisher whose
+                in-flight tasks to retrieve.
+
+        Returns:
+            List[Task]: List of tasks that are currently in-flight.
+        """
+        async with self._condition:
+            in_flight_tasks = []
+            seen_task_ids = set()  # Track seen IDs for duplicate detection
+
+            # Get tasks with SENT, RETURNED or PROCESSING
+            # status published by this publisher
+            for status in [
+                PacketStatus.SENT,
+                PacketStatus.PROCESSING,
+                PacketStatus.RETURNED,
+            ]:
+                for task_id in self._task_by_status[status]:
+                    if task_id in self._task_dict:
+                        packet = self._task_dict[task_id]
+                        if packet.publisher_id == publisher_id:
+                            # Defensive check: detect if task appears in
+                            # multiple status sets (should never happen)
+                            if task_id in seen_task_ids:
+                                logger.warning(
+                                    f"Task {task_id} found in multiple "
+                                    f"status sets. This indicates a bug in "
+                                    f"status management."
+                                )
+                                continue
+                            in_flight_tasks.append(packet.task)
+                            seen_task_ids.add(task_id)
+
+            return in_flight_tasks
+
     async def get_task_by_id(self, task_id: str) -> Task:
         r"""Get a task from the channel by its ID."""
         async with self._condition:
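A hedged usage sketch of the new query; only the get_in_flight_tasks signature comes from this diff, while the module path and channel setup are assumptions:

    from camel.societies.workforce.task_channel import TaskChannel  # assumed path

    async def report_in_flight(channel: TaskChannel, publisher_id: str) -> None:
        # Tasks still SENT, PROCESSING, or RETURNED for this publisher.
        tasks = await channel.get_in_flight_tasks(publisher_id)
        for task in tasks:
            print(task.id, task.content)

    # Typically the workforce owns the channel, e.g.:
    # await report_in_flight(channel, publisher_id="coordinator-1")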