PyPI - camel-ai - Versions diffs - 0.2.15a0__py3-none-any.whl → 0.2.17__py3-none-any.whl - Mend

camel-ai 0.2.15a0__py3-none-any.whl → 0.2.17__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of camel-ai might be problematic. Click here for more details.

Files changed (95) hide show

camel/__init__.py +1 -1
camel/agents/chat_agent.py +18 -4
camel/agents/multi_hop_generator_agent.py +85 -0
camel/agents/programmed_agent_instruction.py +148 -0
camel/benchmarks/__init__.py +13 -1
camel/benchmarks/apibank.py +565 -0
camel/benchmarks/apibench.py +500 -0
camel/benchmarks/gaia.py +4 -4
camel/benchmarks/nexus.py +518 -0
camel/benchmarks/ragbench.py +333 -0
camel/bots/__init__.py +1 -1
camel/bots/discord/__init__.py +26 -0
camel/bots/discord/discord_app.py +384 -0
camel/bots/discord/discord_installation.py +64 -0
camel/bots/discord/discord_store.py +160 -0
camel/configs/__init__.py +3 -0
camel/configs/anthropic_config.py +17 -15
camel/configs/internlm_config.py +60 -0
camel/data_collector/base.py +5 -5
camel/data_collector/sharegpt_collector.py +2 -2
camel/datagen/__init__.py +6 -2
camel/datagen/{o1datagen.py → cotdatagen.py} +19 -6
camel/datagen/self_instruct/__init__.py +36 -0
camel/datagen/self_instruct/filter/__init__.py +34 -0
camel/datagen/self_instruct/filter/filter_function.py +216 -0
camel/datagen/self_instruct/filter/filter_registry.py +56 -0
camel/datagen/self_instruct/filter/instruction_filter.py +81 -0
camel/datagen/self_instruct/self_instruct.py +393 -0
camel/datagen/self_instruct/templates.py +382 -0
camel/datahubs/huggingface.py +12 -2
camel/datahubs/models.py +2 -3
camel/embeddings/mistral_embedding.py +5 -1
camel/embeddings/openai_compatible_embedding.py +6 -1
camel/embeddings/openai_embedding.py +5 -1
camel/interpreters/e2b_interpreter.py +5 -1
camel/loaders/__init__.py +2 -0
camel/loaders/apify_reader.py +5 -1
camel/loaders/chunkr_reader.py +5 -1
camel/loaders/firecrawl_reader.py +0 -30
camel/loaders/panda_reader.py +337 -0
camel/logger.py +11 -5
camel/messages/__init__.py +10 -4
camel/messages/conversion/conversation_models.py +5 -0
camel/messages/func_message.py +30 -22
camel/models/__init__.py +2 -0
camel/models/anthropic_model.py +6 -23
camel/models/azure_openai_model.py +1 -2
camel/models/cohere_model.py +13 -1
camel/models/deepseek_model.py +5 -1
camel/models/gemini_model.py +15 -2
camel/models/groq_model.py +5 -1
camel/models/internlm_model.py +143 -0
camel/models/mistral_model.py +19 -8
camel/models/model_factory.py +3 -0
camel/models/nemotron_model.py +5 -1
camel/models/nvidia_model.py +5 -1
camel/models/openai_model.py +5 -1
camel/models/qwen_model.py +5 -1
camel/models/reka_model.py +5 -1
camel/models/reward/__init__.py +2 -0
camel/models/reward/nemotron_model.py +5 -1
camel/models/reward/skywork_model.py +88 -0
camel/models/samba_model.py +5 -1
camel/models/togetherai_model.py +5 -1
camel/models/yi_model.py +5 -1
camel/models/zhipuai_model.py +5 -1
camel/schemas/openai_converter.py +5 -1
camel/storages/graph_storages/nebula_graph.py +89 -20
camel/storages/graph_storages/neo4j_graph.py +138 -0
camel/synthetic_datagen/source2synth/data_processor.py +373 -0
camel/synthetic_datagen/source2synth/models.py +68 -0
camel/synthetic_datagen/source2synth/user_data_processor_config.py +73 -0
camel/toolkits/__init__.py +4 -0
camel/toolkits/arxiv_toolkit.py +20 -3
camel/toolkits/dappier_toolkit.py +196 -0
camel/toolkits/function_tool.py +61 -61
camel/toolkits/google_scholar_toolkit.py +9 -0
camel/toolkits/meshy_toolkit.py +5 -1
camel/toolkits/notion_toolkit.py +1 -1
camel/toolkits/openbb_toolkit.py +869 -0
camel/toolkits/search_toolkit.py +91 -5
camel/toolkits/stripe_toolkit.py +5 -1
camel/toolkits/twitter_toolkit.py +24 -16
camel/types/__init__.py +4 -2
camel/types/enums.py +34 -1
camel/types/openai_types.py +6 -4
camel/types/unified_model_type.py +5 -0
camel/utils/__init__.py +2 -0
camel/utils/commons.py +104 -19
camel/utils/token_counting.py +3 -3
{camel_ai-0.2.15a0.dist-info → camel_ai-0.2.17.dist-info}/METADATA +160 -177
{camel_ai-0.2.15a0.dist-info → camel_ai-0.2.17.dist-info}/RECORD +94 -69
{camel_ai-0.2.15a0.dist-info → camel_ai-0.2.17.dist-info}/WHEEL +1 -1
camel/bots/discord_app.py +0 -138
{camel_ai-0.2.15a0.dist-info → camel_ai-0.2.17.dist-info}/LICENSE +0 -0

camel/configs/internlm_config.py ADDED Viewed

@@ -0,0 +1,60 @@
+# ========= Copyright 2023-2024 @ CAMEL-AI.org. All Rights Reserved. =========
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ========= Copyright 2023-2024 @ CAMEL-AI.org. All Rights Reserved. =========
+from typing import Optional, Union
+from camel.configs.base_config import BaseConfig
+class InternLMConfig(BaseConfig):
+    r"""Defines the parameters for generating chat completions using the
+    InternLM API. You can refer to the following link for more details:
+    https://internlm.intern-ai.org.cn/api/document
+    Args:
+        stream (bool, optional): Whether to stream the response.
+            (default: :obj:`False`)
+        temperature (float, optional): Controls the diversity and focus of
+            the generated results. Lower values make the output more focused,
+            while higher values make it more diverse. (default: :obj:`0.8`)
+        top_p (float, optional): Controls the diversity and focus of the
+            generated results. Higher values make the output more diverse,
+            while lower values make it more focused. (default: :obj:`0.9`)
+        max_tokens (int, optional): The maximum number of tokens the model
+            is allowed to generate. (default: :obj:`None`)
+        tools (list, optional): Specifies an array of tools that the model can
+            call. It can contain one or more tool objects. During a function
+            call process, the model will select one tool from the array.
+            (default: :obj:`None`)
+        tool_choice (Union[dict[str, str], str], optional): Controls which (if
+            any) tool is called by the model. :obj:`"none"` means the model
+            will not call any tool and instead generates a message.
+            :obj:`"auto"` means the model can pick between generating a
+            message or calling one or more tools.  :obj:`"required"` means the
+            model must call one or more tools. Specifying a particular tool
+            via {"type": "function", "function": {"name": "my_function"}}
+            forces the model to call that tool. :obj:`"none"` is the default
+            when no tools are present. :obj:`"auto"` is the default if tools
+            are present. The field itself defaults to :obj:`None`.
+    """
+    # NOTE(review): ``tools`` is documented above but is not declared in this
+    # class; presumably it is inherited from ``BaseConfig`` -- confirm.
+    stream: bool = False
+    temperature: float = 0.8
+    top_p: float = 0.9
+    max_tokens: Optional[int] = None
+    tool_choice: Optional[Union[dict[str, str], str]] = None
+# Set of every field name declared on InternLMConfig (keys of model_fields).
+INTERNLM_API_PARAMS = set(InternLMConfig.model_fields)

camel/data_collector/base.py CHANGED Viewed

@@ -27,7 +27,7 @@ class CollectorData:
         self,
         id: UUID,
         name: str,
-        role: Literal["user", "assistant", "system", "function"],
+        role: Literal["user", "assistant", "system", "tool"],
         message: Optional[str] = None,
         function_call: Optional[Dict[str, Any]] = None,
     ) -> None:
@@ -52,7 +52,7 @@ class CollectorData:
             ValueError: If neither message nor function call is provided.
         """
-        if role not in ["user", "assistant", "system", "function"]:
+        if role not in ["user", "assistant", "system", "tool"]:
             raise ValueError(f"Role {role} not supported")
         if role == "system" and function_call:
             raise ValueError("System role cannot have function call")
@@ -82,7 +82,7 @@ class CollectorData:
             name=name,
             role=context["role"],
             message=context["content"],
-            function_call=context.get("function_call", None),
+            function_call=context.get("tool_calls", None),
         )
@@ -98,7 +98,7 @@ class BaseDataCollector(ABC):
     def step(
         self,
-        role: Literal["user", "assistant", "system", "function"],
+        role: Literal["user", "assistant", "system", "tool"],
         name: Optional[str] = None,
         message: Optional[str] = None,
         function_call: Optional[Dict[str, Any]] = None,
@@ -106,7 +106,7 @@ class BaseDataCollector(ABC):
         r"""Record a message.
         Args:
-            role (Literal["user", "assistant", "system", "function"]):
+            role (Literal["user", "assistant", "system", "tool"]):
                 The role of the message.
             name (Optional[str], optional): The name of the agent.
                 (default: :obj:`None`)

camel/data_collector/sharegpt_collector.py CHANGED Viewed

@@ -131,7 +131,7 @@ class ShareGPTDataCollector(BaseDataCollector):
                     conversations.append(
                         {"from": "gpt", "value": message.message}
                     )
-            elif role == "function":
+            elif role == "function" or role == "tool":
                 conversations.append(
                     {
                         "from": "observation",
@@ -182,7 +182,7 @@ class ShareGPTDataCollector(BaseDataCollector):
             if message.function_call:
                 context.append(prefix + json.dumps(message.function_call))
-            elif role == "function":
+            elif role == "function" or role == "tool":
                 context.append(prefix + json.dumps(message.message))  # type: ignore[attr-defined]
             else:
                 context.append(prefix + str(message.message))

camel/datagen/__init__.py CHANGED Viewed

@@ -12,6 +12,10 @@
 # limitations under the License.
 # ========= Copyright 2023-2024 @ CAMEL-AI.org. All Rights Reserved. =========
-from .o1datagen import O1DataGenerator
+from .cotdatagen import CoTDataGenerator
+from .self_instruct import SelfInstructPipeline
-__all__ = ['O1DataGenerator']
+__all__ = [
+    "CoTDataGenerator",
+    "SelfInstructPipeline",
+]

camel/datagen/{o1datagen.py → cotdatagen.py} RENAMED Viewed

@@ -22,7 +22,7 @@ from camel.agents import ChatAgent
 from camel.logger import get_logger
 # Get a logger for this module
-logger = get_logger('o1datagenerator')
+logger = get_logger('CoTDataGenerator')
 class AgentResponse(BaseModel):
@@ -60,11 +60,17 @@ class VerificationResponse(BaseModel):
     )
-class O1DataGenerator:
+class CoTDataGenerator:
     r"""Class for generating and managing data through chat agent interactions.
-    handling the generation of data by  a chat agent, managing golden answers,
-    and maintaining a solution tree for correct solution steps.
+    This module implements a sophisticated Chain of Thought data generation
+    system that combines several key algorithms to produce high-quality
+    reasoning paths. Methods implemented:
+    1. Monte Carlo Tree Search (MCTS)
+    2. Binary Search Error Detection
+    3. Dual-Agent Verification System
+    4. Solution Tree Management
     Args:
         chat_agent (Optional[ChatAgent]): Optional single agent
@@ -89,7 +95,7 @@ class O1DataGenerator:
         golden_answers: Dict[str, str],
         search_limit: int = 100,
     ):
-        r"""Initialize the O1DataGenerator.
+        r"""Initialize the CoTDataGenerator.
         This constructor supports both single-agent and dual-agent modes:
         1. Single-agent mode (legacy): Pass a single chat_agent that will be
@@ -131,7 +137,7 @@ class O1DataGenerator:
         self.search_limit = search_limit
         self.solution_tree: Dict[str, Dict[str, Union[str, int]]] = {}
         logger.info(
-            "O1DataGenerator initialized with search_limit=%d", search_limit
+            "CoTDataGenerator initialized with search_limit=%d", search_limit
         )
     def get_answer(self, question: str, context: str = "") -> str:
@@ -203,6 +209,13 @@ class O1DataGenerator:
     ) -> float:
         r"""Perform Monte Carlo Tree Search to find the best solution.
+        Process:
+        a. Selection: Choose promising partial solutions based on previous
+        scores
+        b. Expansion: Generate new solution steps using the generator agent
+        c. Simulation: Evaluate solution quality using similarity scores
+        d. Backpropagation: Update solution tree with new findings
         Args:
             question (str): The question to solve.
             partial_solution (str): The current partial solution.

camel/datagen/self_instruct/__init__.py ADDED Viewed

@@ -0,0 +1,36 @@
+# ========= Copyright 2023-2024 @ CAMEL-AI.org. All Rights Reserved. =========
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ========= Copyright 2023-2024 @ CAMEL-AI.org. All Rights Reserved. =========
+from .filter import (
+    FILTER_REGISTRY,
+    FilterFunction,
+    InstructionFilter,
+    KeywordFilter,
+    LengthFilter,
+    NonEnglishFilter,
+    PunctuationFilter,
+    RougeSimilarityFilter,
+)
+from .self_instruct import SelfInstructPipeline
+__all__ = [
+    'SelfInstructPipeline',
+    'InstructionFilter',
+    'NonEnglishFilter',
+    'PunctuationFilter',
+    'RougeSimilarityFilter',
+    'FilterFunction',
+    'KeywordFilter',
+    'LengthFilter',
+    'FILTER_REGISTRY',
+]

camel/datagen/self_instruct/filter/__init__.py ADDED Viewed

@@ -0,0 +1,34 @@
+# ========= Copyright 2023-2024 @ CAMEL-AI.org. All Rights Reserved. =========
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ========= Copyright 2023-2024 @ CAMEL-AI.org. All Rights Reserved. =========
+from .filter_function import (
+    FilterFunction,
+    KeywordFilter,
+    LengthFilter,
+    NonEnglishFilter,
+    PunctuationFilter,
+    RougeSimilarityFilter,
+)
+from .filter_registry import FILTER_REGISTRY
+from .instruction_filter import InstructionFilter
+__all__ = [
+    "LengthFilter",
+    "NonEnglishFilter",
+    "PunctuationFilter",
+    "RougeSimilarityFilter",
+    "FilterFunction",
+    "KeywordFilter",
+    "InstructionFilter",
+    "FILTER_REGISTRY",
+]

camel/datagen/self_instruct/filter/filter_function.py ADDED Viewed

@@ -0,0 +1,216 @@
+# ========= Copyright 2023-2024 @ CAMEL-AI.org. All Rights Reserved. =========
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ========= Copyright 2023-2024 @ CAMEL-AI.org. All Rights Reserved. =========
+import re
+from abc import ABC, abstractmethod
+from typing import List
+from rouge import Rouge
+from camel.models.reward import BaseRewardModel
+class FilterFunction(ABC):
+    r"""Abstract interface shared by all instruction filters.
+    A concrete filter overrides :meth:`apply` to decide whether a single
+    instruction is kept.
+    """
+    @abstractmethod
+    def apply(self, instruction: str) -> bool:
+        r"""Decide whether ``instruction`` satisfies this filter.
+        Args:
+            instruction (str): The instruction to evaluate.
+        Returns:
+            bool: True if the instruction passes the filter, False otherwise.
+        """
+        ...
+class LengthFilter(FilterFunction):
+    r"""Keeps instructions whose whitespace-separated word count lies within
+    a closed range.
+    Args:
+        min_len (int): The smallest accepted word count.
+            (default: :obj:`5`)
+        max_len (int): The largest accepted word count.
+            (default: :obj:`200`)
+    """
+    def __init__(self, min_len: int = 5, max_len: int = 200):
+        self.min_len, self.max_len = min_len, max_len
+    def apply(self, instruction: str) -> bool:
+        r"""Check the word count of an instruction against the bounds.
+        Args:
+            instruction (str): The instruction to be filtered.
+        Returns:
+            bool: True if the number of words is within
+                [min_len, max_len], both ends inclusive.
+        """
+        # str.split() with no argument splits on runs of whitespace, so an
+        # empty or blank instruction counts as zero words.
+        return self.min_len <= len(instruction.split()) <= self.max_len
+class KeywordFilter(FilterFunction):
+    r"""Rejects instructions that contain any of a list of unwanted keywords.
+    Matching is case-insensitive and substring-based.
+    Args:
+        keywords (List[str]): Keywords whose presence fails the filter.
+    """
+    def __init__(self, keywords: List[str]):
+        # Lower-case once here so apply() only has to normalise its input.
+        self.keywords = [kw.lower() for kw in keywords]
+    def apply(self, instruction: str) -> bool:
+        r"""Check an instruction for unwanted keywords.
+        Args:
+            instruction (str): The instruction to be filtered.
+        Returns:
+            bool: True if the instruction contains none of the keywords,
+                False as soon as one keyword is found.
+        """
+        haystack = instruction.lower()
+        for banned in self.keywords:
+            if banned in haystack:
+                return False
+        return True
+class PunctuationFilter(FilterFunction):
+    r"""Rejects instructions whose first character is neither a word
+    character nor whitespace (i.e. leading punctuation or symbols)."""
+    def apply(self, instruction: str) -> bool:
+        r"""Check the first character of an instruction.
+        Args:
+            instruction (str): The instruction to be filtered.
+        Returns:
+            bool: True if the instruction does not start with punctuation.
+                An empty instruction also passes, because there is no
+                leading character to match.
+        """
+        leading_symbol = re.match(r'^[^\w\s]', instruction)
+        return leading_symbol is None
+class NonEnglishFilter(FilterFunction):
+    r"""Rejects instructions whose first character is not an ASCII letter
+    (A-Z or a-z)."""
+    def apply(self, instruction: str) -> bool:
+        r"""Check that an instruction opens with an English letter.
+        Args:
+            instruction (str): The instruction to be filtered.
+        Returns:
+            bool: True if the instruction starts with an English letter,
+                False otherwise (including for an empty instruction).
+        """
+        starts_with_letter = re.match(r'^[A-Za-z]', instruction)
+        return starts_with_letter is not None
+class RougeSimilarityFilter(FilterFunction):
+    r"""Rejects instructions that are too similar to already known
+    instructions, measured by the ROUGE-L F-score.
+    Args:
+        existing_instructions (List[str]): Instructions to compare against.
+        threshold (float): Similarity above which an instruction is
+            rejected. (default: :obj:`0.7`)
+    """
+    def __init__(
+        self, existing_instructions: List[str], threshold: float = 0.7
+    ):
+        self.rouge = Rouge()
+        self.threshold = threshold
+        self.existing_instructions = existing_instructions
+    def apply(self, instruction: str) -> bool:
+        r"""Compare an instruction with every existing instruction.
+        Args:
+            instruction (str): The instruction to be filtered.
+        Returns:
+            bool: True if there is nothing to compare against, or if the
+                ROUGE-L F-score against every existing instruction is at
+                most the threshold; False as soon as one score exceeds it.
+        """
+        priors = self.existing_instructions
+        if not priors:
+            return True
+        # any() stops at the first instruction that is too similar, so no
+        # further ROUGE scores are computed after a rejection.
+        return not any(
+            self.rouge.get_scores(instruction, prior)[0]['rouge-l']['f']
+            > self.threshold
+            for prior in priors
+        )
+class RewardModelFilter(FilterFunction):
+    r"""Keeps instructions whose reward-model score reaches a threshold.
+    Args:
+        reward_model (BaseRewardModel): The reward model used to evaluate
+            the instructions.
+        threshold (float): The minimum score required for an instruction
+            to pass the filter. (default: :obj:`0.5`)
+    """
+    def __init__(
+        self,
+        reward_model: BaseRewardModel,
+        threshold: float = 0.5,
+    ):
+        self.threshold = threshold
+        self.reward_model = reward_model
+        # Starts empty; apply() sends whatever value this attribute holds as
+        # the user turn, so callers set it before filtering.
+        self.prompt = ""
+    def apply(self, instruction: str) -> bool:
+        r"""Score an instruction with the reward model.
+        Args:
+            instruction (str): The instruction to be filtered.
+        Returns:
+            bool: True if the instruction's score is greater than or equal
+                to the threshold.
+        Raises:
+            ValueError: If the reward model reports no score types, or if
+                the first score type is missing from the evaluation scores.
+        """
+        conversation = [
+            {"role": "user", "content": self.prompt},
+            {"role": "assistant", "content": instruction},
+        ]
+        scores = self.reward_model.evaluate(conversation)
+        available_types = self.reward_model.get_scores_types()
+        if not available_types:
+            raise ValueError("No score types available from the reward model.")
+        # Only the first score type reported by the model is used.
+        primary_type = available_types[0]
+        score = scores.get(primary_type)
+        if score is None:
+            raise ValueError(
+                f"Score type '{primary_type}' is not found in the "
+                "evaluation scores."
+            )
+        return score >= self.threshold

camel/datagen/self_instruct/filter/filter_registry.py ADDED Viewed

@@ -0,0 +1,56 @@
+# ========= Copyright 2023-2024 @ CAMEL-AI.org. All Rights Reserved. =========
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ========= Copyright 2023-2024 @ CAMEL-AI.org. All Rights Reserved. =========
+from typing import Any, Callable, Dict
+from .filter_function import (
+    FilterFunction,
+    KeywordFilter,
+    LengthFilter,
+    NonEnglishFilter,
+    PunctuationFilter,
+    RewardModelFilter,
+    RougeSimilarityFilter,
+)
+def _build_length(kwargs: Dict[str, Any]) -> FilterFunction:
+    r"""Create a LengthFilter from ``min_len`` / ``max_len`` parameters."""
+    return LengthFilter(
+        min_len=kwargs.get("min_len", 5), max_len=kwargs.get("max_len", 200)
+    )
+def _build_keyword(kwargs: Dict[str, Any]) -> FilterFunction:
+    r"""Create a KeywordFilter from the ``keywords`` parameter."""
+    return KeywordFilter(keywords=kwargs.get("keywords", ["image", "data"]))
+def _build_punctuation(kwargs: Dict[str, Any]) -> FilterFunction:
+    r"""Create a PunctuationFilter; the parameters are ignored."""
+    return PunctuationFilter()
+def _build_non_english(kwargs: Dict[str, Any]) -> FilterFunction:
+    r"""Create a NonEnglishFilter; the parameters are ignored."""
+    return NonEnglishFilter()
+def _build_rouge_similarity(kwargs: Dict[str, Any]) -> FilterFunction:
+    r"""Create a RougeSimilarityFilter from ``existing_instructions`` and
+    ``threshold`` parameters."""
+    return RougeSimilarityFilter(
+        existing_instructions=kwargs.get("existing_instructions", []),
+        threshold=kwargs.get("threshold", 0.7),
+    )
+def _build_reward(kwargs: Dict[str, Any]) -> FilterFunction:
+    r"""Create a RewardModelFilter from ``reward_model`` and ``threshold``
+    parameters."""
+    # NOTE(review): a missing "reward_model" is passed through as None and is
+    # not checked here. The fallback threshold of 0.7 also differs from
+    # RewardModelFilter's own default of 0.5 -- confirm both are intended.
+    return RewardModelFilter(
+        reward_model=kwargs.get("reward_model"),  # type:ignore[arg-type]
+        threshold=kwargs.get("threshold", 0.7),
+    )
+# Maps a filter name to a constructor taking that filter's parameter dict.
+FILTER_REGISTRY: Dict[str, Callable[[Dict[str, Any]], FilterFunction]] = {
+    "length": _build_length,
+    "keyword": _build_keyword,
+    "punctuation": _build_punctuation,
+    "non_english": _build_non_english,
+    "rouge_similarity": _build_rouge_similarity,
+    "reward": _build_reward,
+}
+def register_filter(
+    name: str, constructor: Callable[[Dict[str, Any]], FilterFunction]
+) -> None:
+    r"""Registers a new filter constructor in FILTER_REGISTRY.
+    The entry is stored by plain dictionary assignment, so registering a
+    name that already exists replaces the previous constructor without
+    warning.
+    Args:
+        name (str): Unique name of the filter.
+        constructor (Callable[[Dict[str, Any]], FilterFunction]): Function to
+            create the filter using a dictionary of parameters.
+    """
+    FILTER_REGISTRY[name] = constructor

camel/datagen/self_instruct/filter/instruction_filter.py ADDED Viewed

@@ -0,0 +1,81 @@
+# ========= Copyright 2023-2024 @ CAMEL-AI.org. All Rights Reserved. =========
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ========= Copyright 2023-2024 @ CAMEL-AI.org. All Rights Reserved. =========
+from typing import Any, Dict, List
+from .filter_function import FilterFunction, RewardModelFilter
+from .filter_registry import FILTER_REGISTRY
+class InstructionFilter:
+    r"""Runs an instruction through a chain of filter functions and reports
+    whether it passes all of them.
+    """
+    def __init__(self, filters_config: Dict[str, Dict[str, Any]]):
+        r"""Build the filter chain described by ``filters_config``.
+        Args:
+            filters_config(Dict[str, Dict[str, Any]]):
+                Example filters_config:
+                {
+                    "length": {"min_len": 5, "max_len": 100},
+                    "keyword": {"keywords": ["image", "video"]},
+                    "non_english": {},
+                    "rouge_similarity": {
+                        "existing_instructions": ["Some existing text"],
+                        "threshold": 0.6
+                    }
+                }
+                Each key in filters_config corresponds to a filter name
+                    (registered in FILTER_REGISTRY).
+                Each value is a dict of parameters for that filter.
+        Raises:
+            ValueError: If a filter name is not present in FILTER_REGISTRY.
+        """
+        self.filters: List[FilterFunction] = []
+        for filter_name, params in filters_config.items():
+            if filter_name not in FILTER_REGISTRY:
+                raise ValueError(f"Unknown filter function: {filter_name}")
+            build = FILTER_REGISTRY[filter_name]
+            self.filters.append(build(params))
+    def add_filter(self, filter_function: FilterFunction):
+        r"""Append a ready-made filter to the end of the chain.
+        This allows using filters that are not in the registry.
+        Args:
+            filter_function (FilterFunction): The filter function to be added
+        """
+        self.filters.append(filter_function)
+    def filter(
+        self, prompt: str, instruction: str, return_details: bool = False
+    ):
+        r"""Check if the given instruction passes all filter functions.
+        Every filter is applied, even after one has failed, so the details
+        list names all failing filters.
+        Args:
+            prompt (str): The prompt of generating the instruction.
+            instruction (str): The instruction to evaluate.
+            return_details (bool): If True, returns a tuple (bool, List[str])
+                where the list contains the class names of filters that
+                failed. (default: :obj:`False`)
+        Returns:
+            bool: True if the instruction passes all filters, False otherwise.
+                OR (bool, List[str]) if return_details is True.
+        """
+        rejected_by = []
+        for candidate in self.filters:
+            if isinstance(candidate, RewardModelFilter):
+                # Reward-model filters read the prompt from their own
+                # attribute, so hand it over before applying them.
+                candidate.prompt = prompt
+            if candidate.apply(instruction):
+                continue
+            rejected_by.append(type(candidate).__name__)
+        passed = not rejected_by
+        if return_details:
+            return passed, rejected_by
+        return passed

camel-ai 0.2.15a0__py3-none-any.whl → 0.2.17__py3-none-any.whl

Potentially problematic release.

camel-ai 0.2.15a0__py3-none-any.whl → 0.2.17__py3-none-any.whl