PyPI - flock-core - Versions diffs - 0.4.505__py3-none-any.whl → 0.4.508__py3-none-any.whl - Mend

flock-core 0.4.505__py3-none-any.whl → 0.4.508__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of flock-core might be problematic. Click here for more details.

Files changed (17) hide show

flock/core/evaluation/utils.py +85 -2
flock/core/flock.py +102 -56
flock/core/flock_agent.py +2 -2
flock/core/flock_evaluator.py +8 -1
flock/core/flock_factory.py +4 -0
flock/core/mixin/dspy_integration.py +7 -6
flock/evaluators/declarative/declarative_evaluator.py +112 -88
flock/webapp/templates/chat.html +1 -0
flock/webapp/templates/partials/_chat_messages.html +3 -2
{flock_core-0.4.505.dist-info → flock_core-0.4.508.dist-info}/METADATA +28 -10
{flock_core-0.4.505.dist-info → flock_core-0.4.508.dist-info}/RECORD +14 -17
flock/core/api/ui/__init__.py +0 -0
flock/core/api/ui/routes.py +0 -271
flock/core/api/ui/utils.py +0 -119
{flock_core-0.4.505.dist-info → flock_core-0.4.508.dist-info}/WHEEL +0 -0
{flock_core-0.4.505.dist-info → flock_core-0.4.508.dist-info}/entry_points.txt +0 -0
{flock_core-0.4.505.dist-info → flock_core-0.4.508.dist-info}/licenses/LICENSE +0 -0

flock/core/evaluation/utils.py CHANGED Viewed

@@ -7,8 +7,15 @@ from typing import Any, Union
 import pandas as pd
 from box import Box
-from datasets import get_dataset_config_names, load_dataset
+from datasets import (
+    Dataset as HFDataset,
+    get_dataset_config_names,
+    load_dataset,
+)
+from opik import Opik
+from opik.evaluation import evaluate
+from flock.core.flock import Flock
 from flock.core.flock_agent import FlockAgent
 from flock.core.flock_evaluator import FlockEvaluator
 from flock.core.logging.logging import get_logger
@@ -18,6 +25,64 @@ from flock.core.logging.logging import get_logger
 logger_helpers = get_logger("util.evaluation")
+def evaluate_with_opik(
+    dataset: str | Path | list[dict[str, Any]] | pd.DataFrame | HFDataset,
+    dataset_name: str,
+    experiment_name: str,
+    start_agent: FlockAgent | str,
+    input_mapping: dict[str, str],
+    answer_mapping: dict[str, str],
+    metrics: list[
+        str
+        | Callable[[Any, Any], bool | float | dict[str, Any]]
+        | FlockAgent
+        | FlockEvaluator
+    ],
+    model: str = "azure/gpt-4.1",
+) -> Any:
+    """Upload a dataset to Opik and run an Opik experiment against a Flock agent.
+
+    The dataset is normalized to a DataFrame, inserted into the Opik dataset
+    named ``dataset_name`` (the "source" key is ignored on insert), and every
+    dataset item is run through one shared Flock instance.
+
+    Args:
+        dataset: Any input accepted by ``normalize_dataset``.
+        dataset_name: Name of the Opik dataset to fetch or create.
+        experiment_name: Experiment name forwarded to Opik's ``evaluate``.
+        start_agent: Agent added to the shared Flock and used as the start
+            agent for every dataset item.
+        input_mapping: Maps dataset column name -> agent input field name.
+        answer_mapping: Maps the dataset column holding the reference answer
+            -> agent output field name. Only the first entry is used.
+        metrics: Forwarded to Opik's ``evaluate`` as ``scoring_metrics``.
+        model: Model name for the shared Flock instance. The default keeps
+            the value that used to be hard-coded.
+
+    Returns:
+        Whatever Opik's ``evaluate`` returns (this used to be discarded).
+
+    Raises:
+        ValueError: If ``answer_mapping`` is empty.
+    """
+    # Fail fast, before anything is uploaded, instead of hitting a bare
+    # StopIteration inside the per-item task.
+    if not answer_mapping:
+        raise ValueError("answer_mapping must contain at least one entry.")
+    # Only the first mapping entry is evaluated; resolve it once, not per item.
+    reference_column = next(iter(answer_mapping))
+    answer_field = answer_mapping[reference_column]
+    df = normalize_dataset(dataset)
+    client = Opik()
+    # Use a separate name so the ``dataset`` argument is not shadowed.
+    opik_dataset = client.get_or_create_dataset(name=dataset_name)
+    opik_dataset.insert_from_pandas(dataframe=df, ignore_keys=["source"])
+    # Create a single Flock instance outside the task function
+    shared_flock = Flock(name="opik_eval", model=model, show_flock_banner=False)
+    shared_flock.add_agent(start_agent)
+    def evaluation_task(dataset_item):
+        """Run the agent on one dataset item and shape the result for scoring."""
+        agent_input = {
+            agent_field: dataset_item[dataset_column]
+            for dataset_column, agent_field in input_mapping.items()
+        }
+        # Use the shared Flock instance instead of creating a new one
+        result_flock = shared_flock.run(
+            start_agent=start_agent, input=agent_input, box_result=False
+        )
+        return {
+            "input": agent_input,
+            "output": result_flock.get(answer_field, "No answer found"),
+            "reference": dataset_item[reference_column],
+        }
+    return evaluate(
+        experiment_name=experiment_name,
+        dataset=opik_dataset,
+        task=evaluation_task,
+        scoring_metrics=metrics,
+    )
 def load_and_merge_all_configs(dataset_name: str) -> pd.DataFrame:
     all_configs = get_dataset_config_names(dataset_name)
     all_dfs = []
@@ -31,9 +96,27 @@ def load_and_merge_all_configs(dataset_name: str) -> pd.DataFrame:
             all_dfs.append(df)
     merged_df = pd.concat(all_dfs, ignore_index=True)
+    logger_helpers.info(f"merged_df.head(): {merged_df.head()}")
     return merged_df
+def import_hf_dataset_to_opik(dataset_name: str) -> pd.DataFrame:
+    """Merge all configs of a Hugging Face dataset and push them to Opik.
+
+    The merged DataFrame comes from ``load_and_merge_all_configs``. Its type,
+    shape, per-split row counts and distinct configs are logged, so the frame
+    is expected to carry "split" and "config" columns. The rows are then
+    inserted into the Opik dataset named ``dataset_name`` (the "source" key
+    is ignored on insert).
+
+    Args:
+        dataset_name: Hugging Face dataset name; also used as the Opik
+            dataset name.
+
+    Returns:
+        The merged DataFrame that was uploaded.
+    """
+    merged = load_and_merge_all_configs(dataset_name)
+    log = logger_helpers.info
+    # Summary logging, in the same order as before.
+    frame_type = type(merged)
+    log(f"type(df): {frame_type}")
+    log(f"df.shape: {merged.shape}")
+    split_counts = merged["split"].value_counts()
+    log(f"df['split'].value_counts(): {split_counts}")
+    configs = merged["config"].unique()
+    log(f"df['config'].unique(): {configs}")
+    # Fetch (or create) the target Opik dataset and upload the rows.
+    Opik().get_or_create_dataset(name=dataset_name).insert_from_pandas(
+        dataframe=merged, ignore_keys=["source"]
+    )
+    return merged
 def normalize_dataset(dataset: Any) -> pd.DataFrame:
     """Converts various dataset formats into a pandas DataFrame."""
     if isinstance(dataset, pd.DataFrame):

flock/core/flock.py CHANGED Viewed

@@ -17,7 +17,6 @@ from typing import (
     TypeVar,
 )
-_R = TypeVar("_R")
 # Third-party imports
 from box import Box
 from temporalio import workflow
@@ -32,8 +31,11 @@ with workflow.unsafe.imports_passed_through():
     from flock.core.execution.local_executor import (
         run_local_workflow,
     )
+import opik
 from opentelemetry import trace
 from opentelemetry.baggage import get_baggage, set_baggage
+from opik.integrations.dspy.callback import OpikCallback
 from pandas import DataFrame  # type: ignore
 from pydantic import BaseModel, Field
@@ -67,7 +69,7 @@ try:
     PANDAS_AVAILABLE = True
 except ImportError:
-    pd = None # type: ignore
+    pd = None  # type: ignore
     PANDAS_AVAILABLE = False
 logger = get_logger("flock.api")
@@ -77,6 +79,7 @@ FlockRegistry = get_registry()  # Get the registry instance
 # Define TypeVar for generic class methods like from_dict
 T = TypeVar("T", bound="Flock")
+_R = TypeVar("_R")
 class Flock(BaseModel, Serializable):
@@ -103,6 +106,10 @@ class Flock(BaseModel, Serializable):
         default=False,
         description="If True, execute workflows via Temporal; otherwise, run locally.",
     )
+    enable_opik: bool = Field(
+        default=False,
+        description="If True, enable Opik for cost tracking and model management.",
+    )
     show_flock_banner: bool = Field(
         default=True,
         description="If True, show the Flock banner on console interactions.",
@@ -159,11 +166,11 @@ class Flock(BaseModel, Serializable):
         """
         try:
             asyncio.get_running_loop()
-        except RuntimeError:                       # no loop → simple
+        except RuntimeError:  # no loop → simple
             return asyncio.run(coro)
         # A loop is already running – Jupyter / ASGI / etc.
-        ctx = contextvars.copy_context()           # propagate baggage
+        ctx = contextvars.copy_context()  # propagate baggage
         with ThreadPoolExecutor(max_workers=1) as pool:
             future = pool.submit(ctx.run, asyncio.run, coro)
             try:
@@ -179,6 +186,7 @@ class Flock(BaseModel, Serializable):
         description: str | None = None,
         show_flock_banner: bool = True,
         enable_temporal: bool = False,
+        enable_opik: bool = False,
         agents: list[FlockAgent] | None = None,
         servers: list[FlockMCPServerBase] | None = None,
         temporal_config: TemporalWorkflowConfig | None = None,
@@ -195,6 +203,7 @@ class Flock(BaseModel, Serializable):
             model=model,
             description=description,
             enable_temporal=enable_temporal,
+            enable_opik=enable_opik,
             show_flock_banner=show_flock_banner,
             temporal_config=temporal_config,
             temporal_start_in_process_worker=temporal_start_in_process_worker,
@@ -208,7 +217,6 @@ class Flock(BaseModel, Serializable):
         self._start_input = {}
         self._mgr = FlockServerManager()
         # Register passed servers
         # (need to be registered first so that agents can retrieve them from the registry)
         # This will also add them to the managed list of self._mgr
@@ -225,7 +233,6 @@ class Flock(BaseModel, Serializable):
                         f"Item provided in 'servers' list is not a FlockMCPServer: {type(server)}"
                     )
         # Register passed agents
         if agents:
             from flock.core.flock_agent import (
@@ -241,7 +248,7 @@ class Flock(BaseModel, Serializable):
                     )
         # Initialize console if needed for banner
-        if self.show_flock_banner: # Check instance attribute
+        if self.show_flock_banner:  # Check instance attribute
             init_console(clear_screen=True, show_banner=self.show_flock_banner)
         # Set Temporal debug environment variable
@@ -252,6 +259,15 @@ class Flock(BaseModel, Serializable):
         FlockRegistry.discover_and_register_components()
+        if self.enable_opik:
+            import dspy
+            opik.configure(use_local=True, automatic_approvals=True)
+            opik_callback = OpikCallback(project_name=self.name, log_graph=True)
+            dspy.settings.configure(
+                callbacks=[opik_callback],
+            )
         logger.info(
             "Flock instance initialized",
             name=self.name,
@@ -259,39 +275,54 @@ class Flock(BaseModel, Serializable):
             enable_temporal=self.enable_temporal,
         )
-    def prepare_benchmark(self, agent: FlockAgent | str | None = None, input_field: str | None = None, eval_field: str | None = None):
+    def prepare_benchmark(
+        self,
+        agent: FlockAgent | str | None = None,
+        input_field: str | None = None,
+        eval_field: str | None = None,
+    ):
         """Prepare a benchmark for the Flock instance."""
         from flock.core.flock_agent import FlockAgent as ConcreteFlockAgent
-        logger.info(f"Preparing benchmark for Flock instance '{self.name}' with agent '{agent}'.")
+        logger.info(
+            f"Preparing benchmark for Flock instance '{self.name}' with agent '{agent}'."
+        )
         name = agent.name if isinstance(agent, ConcreteFlockAgent) else agent
         if self._agents.get(name) is None:
-            raise ValueError(f"Agent '{name}' not found in Flock instance '{self.name}'.")
+            raise ValueError(
+                f"Agent '{name}' not found in Flock instance '{self.name}'."
+            )
         self.benchmark_agent_name = name
         self.benchmark_eval_field = eval_field
         self.benchmark_input_field = input_field
     def inspect(self):
         """Inspect the Flock instance."""
-        logger.info(f"Inspecting Flock instance '{self.name}' with start agent '{self.benchmark_agent_name}' and input '{input}'.")
+        logger.info(
+            f"Inspecting Flock instance '{self.name}' with start agent '{self.benchmark_agent_name}' and input '{input}'."
+        )
-        async def run(input: dict[str, Any])-> dict[str, Any]:
+        async def run(input: dict[str, Any]) -> dict[str, Any]:
             """Inspect the Flock instance."""
-            logger.info(f"Inspecting Flock instance '{self.name}' with start agent '{self.benchmark_agent_name}' and input '{input}'.")
+            logger.info(
+                f"Inspecting Flock instance '{self.name}' with start agent '{self.benchmark_agent_name}' and input '{input}'."
+            )
             msg_content = input.get("messages")[0].get("content")
-            agent_input = {
-                self.benchmark_input_field: msg_content
-            }
+            agent_input = {self.benchmark_input_field: msg_content}
-            result = await self.run_async(start_agent=self.benchmark_agent_name, input=agent_input, box_result=False)
+            result = await self.run_async(
+                start_agent=self.benchmark_agent_name,
+                input=agent_input,
+                box_result=False,
+            )
-            agent_output = result.get(self.benchmark_eval_field, "No answer found")
+            agent_output = result.get(
+                self.benchmark_eval_field, "No answer found"
+            )
             return {
                 "output": agent_output,
@@ -299,8 +330,6 @@ class Flock(BaseModel, Serializable):
         return run
     def _set_temporal_debug_flag(self):
         """Set or remove LOCAL_DEBUG env var based on enable_temporal."""
         if not self.enable_temporal:
@@ -373,10 +402,14 @@ class Flock(BaseModel, Serializable):
         if agent.name in self._agents:
             # Allow re-adding the same instance, but raise error for different instance with same name
             if self._agents[agent.name] is not agent:
-                raise ValueError(f"Agent with name '{agent.name}' already exists with a different instance.")
+                raise ValueError(
+                    f"Agent with name '{agent.name}' already exists with a different instance."
+                )
             else:
-                logger.debug(f"Agent '{agent.name}' is already added. Skipping.")
-                return agent # Return existing agent
+                logger.debug(
+                    f"Agent '{agent.name}' is already added. Skipping."
+                )
+                return agent  # Return existing agent
         self._agents[agent.name] = agent
         FlockRegistry.register_agent(agent)  # Register globally
@@ -415,7 +448,7 @@ class Flock(BaseModel, Serializable):
         box_result: bool = True,
         agents: list[FlockAgent] | None = None,
         servers: list[FlockMCPServerBase] | None = None,
-        memo: dict[str, Any] | None = None
+        memo: dict[str, Any] | None = None,
     ) -> Box | dict:
         return self._run_sync(
             self.run_async(
@@ -430,7 +463,6 @@ class Flock(BaseModel, Serializable):
             )
         )
     async def run_async(
         self,
         start_agent: FlockAgent | str | None = None,
@@ -474,11 +506,13 @@ class Flock(BaseModel, Serializable):
             start_agent_name: str | None = None
             if isinstance(start_agent, ConcreteFlockAgent):
                 start_agent_name = start_agent.name
-                if start_agent_name not in self._agents: # Add if not already present
+                if (
+                    start_agent_name not in self._agents
+                ):  # Add if not already present
                     self.add_agent(start_agent)
             elif isinstance(start_agent, str):
                 start_agent_name = start_agent
-            else: # start_agent is None
+            else:  # start_agent is None
                 start_agent_name = self._start_agent_name
             # Default to first agent if only one exists and none specified
@@ -516,23 +550,27 @@ class Flock(BaseModel, Serializable):
             try:
                 resolved_start_agent = self._agents.get(start_agent_name)
-                if not resolved_start_agent: # Should have been handled by now
-                    raise ValueError(f"Start agent '{start_agent_name}' not found after checks.")
+                if not resolved_start_agent:  # Should have been handled by now
+                    raise ValueError(
+                        f"Start agent '{start_agent_name}' not found after checks."
+                    )
                 run_context = context if context else FlockContext()
-                set_baggage("run_id", effective_run_id) # Set for OpenTelemetry
+                set_baggage("run_id", effective_run_id)  # Set for OpenTelemetry
                 initialize_context(
                     run_context,
                     start_agent_name,
                     run_input,
                     effective_run_id,
-                    not self.enable_temporal, # local_debug is inverse of enable_temporal
+                    not self.enable_temporal,  # local_debug is inverse of enable_temporal
                     self.model or resolved_start_agent.model or DEFAULT_MODEL,
                 )
                 # Add agent definitions to context for routing/serialization within workflow
                 for agent_name_iter, agent_instance_iter in self.agents.items():
-                    agent_dict_repr = agent_instance_iter.to_dict() # Agents handle their own serialization
+                    agent_dict_repr = (
+                        agent_instance_iter.to_dict()
+                    )  # Agents handle their own serialization
                     run_context.add_agent_definition(
                         agent_type=type(agent_instance_iter),
                         agent_name=agent_name_iter,
@@ -568,13 +606,14 @@ class Flock(BaseModel, Serializable):
                     # Execute workflow
                     if not self.enable_temporal:
                         result = await run_local_workflow(
-                            run_context, box_result=False # Boxing handled below
+                            run_context,
+                            box_result=False,  # Boxing handled below
                         )
                     else:
                         result = await run_temporal_workflow(
-                            self, # Pass the Flock instance
+                            self,  # Pass the Flock instance
                             run_context,
-                            box_result=False, # Boxing handled below
+                            box_result=False,  # Boxing handled below
                             memo=memo,
                         )
@@ -616,7 +655,6 @@ class Flock(BaseModel, Serializable):
                 }
                 return Box(error_output) if box_result else error_output
     # --- Batch Processing (Delegation) ---
     async def run_batch_async(
         self,
@@ -689,19 +727,18 @@ class Flock(BaseModel, Serializable):
             )
         )
     # --- Evaluation (Delegation) ---
     async def evaluate_async(
         self,
-        dataset: str | Path | list[dict[str, Any]] | DataFrame | Dataset, # type: ignore
+        dataset: str | Path | list[dict[str, Any]] | DataFrame | Dataset,  # type: ignore
         start_agent: FlockAgent | str,
         input_mapping: dict[str, str],
         answer_mapping: dict[str, str],
         metrics: list[
             str
             | Callable[[Any, Any], bool | float | dict[str, Any]]
-            | FlockAgent # Type hint only
-            | FlockEvaluator # Type hint only
+            | FlockAgent  # Type hint only
+            | FlockEvaluator  # Type hint only
         ],
         metric_configs: dict[str, dict[str, Any]] | None = None,
         static_inputs: dict[str, Any] | None = None,
@@ -713,7 +750,7 @@ class Flock(BaseModel, Serializable):
         return_dataframe: bool = True,
         silent_mode: bool = False,
         metadata_columns: list[str] | None = None,
-    ) -> DataFrame | list[dict[str, Any]]: # type: ignore
+    ) -> DataFrame | list[dict[str, Any]]:  # type: ignore
         """Evaluates the Flock's performance against a dataset (delegated)."""
         # Import processor locally
         from flock.core.execution.evaluation_executor import (
@@ -741,15 +778,15 @@ class Flock(BaseModel, Serializable):
     def evaluate(
         self,
-        dataset: str | Path | list[dict[str, Any]] | DataFrame | Dataset, # type: ignore
+        dataset: str | Path | list[dict[str, Any]] | DataFrame | Dataset,  # type: ignore
         start_agent: FlockAgent | str,
         input_mapping: dict[str, str],
         answer_mapping: dict[str, str],
         metrics: list[
             str
             | Callable[[Any, Any], bool | float | dict[str, Any]]
-            | FlockAgent # Type hint only
-            | FlockEvaluator # Type hint only
+            | FlockAgent  # Type hint only
+            | FlockEvaluator  # Type hint only
         ],
         metric_configs: dict[str, dict[str, Any]] | None = None,
         static_inputs: dict[str, Any] | None = None,
@@ -761,7 +798,7 @@ class Flock(BaseModel, Serializable):
         return_dataframe: bool = True,
         silent_mode: bool = False,
         metadata_columns: list[str] | None = None,
-    ) -> DataFrame | list[dict[str, Any]]: # type: ignore
+    ) -> DataFrame | list[dict[str, Any]]:  # type: ignore
         return self._run_sync(
             self.evaluate_async(
                 dataset=dataset,
@@ -781,18 +818,22 @@ class Flock(BaseModel, Serializable):
                 metadata_columns=metadata_columns,
             )
         )
     # --- Server & CLI Starters (Delegation) ---
     def start_api(
         self,
         host: str = "127.0.0.1",
         port: int = 8344,
         server_name: str = "Flock Server",
-        create_ui: bool = True, # Default to True for the integrated experience
+        create_ui: bool = True,  # Default to True for the integrated experience
         ui_theme: str | None = None,
-        custom_endpoints: Sequence[FlockEndpoint] | dict[tuple[str, list[str] | None], Callable[..., Any]] | None = None,
+        custom_endpoints: Sequence[FlockEndpoint]
+        | dict[tuple[str, list[str] | None], Callable[..., Any]]
+        | None = None,
     ) -> None:
         """Starts a unified REST API server and/or Web UI for this Flock instance."""
         import warnings
         warnings.warn(
             "start_api() is deprecated and will be removed in a future release. "
             "Use serve() instead.",
@@ -825,7 +866,9 @@ class Flock(BaseModel, Serializable):
         chat_history_key: str = "history",
         chat_response_key: str = "response",
         ui_theme: str | None = None,
-        custom_endpoints: Sequence[FlockEndpoint] | dict[tuple[str, list[str] | None], Callable[..., Any]] | None = None,
+        custom_endpoints: Sequence[FlockEndpoint]
+        | dict[tuple[str, list[str] | None], Callable[..., Any]]
+        | None = None,
     ) -> None:
         """Launch an HTTP server that exposes the core REST API and, optionally, the
         browser-based UI.
@@ -871,7 +914,9 @@ class Flock(BaseModel, Serializable):
     def start_cli(
         self,
-        start_agent: FlockAgent | str | None = None, # Added start_agent to match method signature in file_26
+        start_agent: FlockAgent
+        | str
+        | None = None,  # Added start_agent to match method signature in file_26
         server_name: str = "Flock CLI",
         show_results: bool = False,
         edit_mode: bool = False,
@@ -893,14 +938,13 @@ class Flock(BaseModel, Serializable):
         # If start_agent is crucial here, start_flock_cli needs to handle it.
         logger.info(f"Starting CLI for Flock '{self.name}'...")
         start_flock_cli(
-            flock=self, # Pass the Flock instance
+            flock=self,  # Pass the Flock instance
             # start_agent=start_agent, # This argument is not in the definition of start_flock_cli in file_50
             server_name=server_name,
             show_results=show_results,
-            edit_mode=edit_mode
+            edit_mode=edit_mode,
         )
     # --- Serialization Delegation Methods ---
     def to_dict(self, path_type: str = "relative") -> dict[str, Any]:
         """Serialize Flock instance to dictionary using FlockSerializer."""
@@ -917,12 +961,14 @@ class Flock(BaseModel, Serializable):
     # --- Static Method Loader (Delegates to loader module) ---
     @staticmethod
-    def load_from_file(file_path: str) -> Flock: # Ensure return type is Flock
+    def load_from_file(file_path: str) -> Flock:  # Ensure return type is Flock
         """Load a Flock instance from various file formats (delegates to loader)."""
         from flock.core.util.loader import load_flock_from_file
         loaded_flock = load_flock_from_file(file_path)
         # Ensure the loaded object is indeed a Flock instance
         if not isinstance(loaded_flock, Flock):
-            raise TypeError(f"Loaded object from {file_path} is not a Flock instance, but {type(loaded_flock)}")
+            raise TypeError(
+                f"Loaded object from {file_path} is not a Flock instance, but {type(loaded_flock)}"
+            )
         return loaded_flock

flock/core/flock_agent.py CHANGED Viewed

@@ -691,8 +691,8 @@ class FlockAgent(BaseModel, Serializable, DSPyIntegrationMixin, ABC):
         timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
         filename = f"{agent_name}_output_{timestamp}.json"
-        filepath = os.path.join("output/", filename)
-        os.makedirs("output/", exist_ok=True)
+        filepath = os.path.join(".flock/output/", filename)
+        os.makedirs(".flock/output/", exist_ok=True)
         output_data = {
             "agent": agent_name,

flock/core/flock_evaluator.py CHANGED Viewed

@@ -45,9 +45,16 @@ class FlockEvaluator(ABC, BaseModel):
         description="Evaluator configuration",
     )
+    def __init__(self, **data):
+        """Initialize the evaluator by forwarding all keyword arguments to the parent initializer."""
+        super().__init__(**data)
     @abstractmethod
     async def evaluate(
-        self, agent: Any, inputs: dict[str, Any], tools: list[Any], mcp_tools: list[Any] | None = None
+        self,
+        agent: Any,
+        inputs: dict[str, Any],
+        tools: list[Any],
+        mcp_tools: list[Any] | None = None,
     ) -> dict[str, Any]:
         """Evaluate inputs to produce outputs."""
         pass

flock/core/flock_factory.py CHANGED Viewed

@@ -321,6 +321,8 @@ class FlockFactory:
         wait_for_input: bool = False,
         temperature: float = 0.0,
         max_tokens: int = 8192,
+        max_tool_calls: int = 10,
+        max_retries: int = 3,
         alert_latency_threshold_ms: int = 30000,
         no_output: bool = False,
         print_context: bool = False,
@@ -343,6 +345,8 @@ class FlockFactory:
             use_cache=use_cache,
             max_tokens=max_tokens,
             temperature=temperature,
+            max_tool_calls=max_tool_calls,
+            max_retries=max_retries,
             stream=stream,
             include_thought_process=include_thought_process,
         )

flock/core/mixin/dspy_integration.py CHANGED Viewed

@@ -75,7 +75,9 @@ def _resolve_type_string(type_str: str) -> type:
                     try:
                         return tuple(ast.literal_eval(f"[{args_str}]"))
                     except (SyntaxError, ValueError) as exc:
-                        raise ValueError(f"Cannot parse {args_str!r} as literals") from exc
+                        raise ValueError(
+                            f"Cannot parse {args_str!r} as literals"
+                        ) from exc
                 literal_args = parse_literal_args(args_str)
                 logger.debug(
@@ -250,8 +252,7 @@ class DSPyIntegrationMixin:
                 f"Failed to create dynamic type 'dspy_{agent_name}': {e}",
                 exc_info=True,
             )
-            raise TypeError(
-                f"Could not create DSPy signature type: {e}") from e
+            raise TypeError(f"Could not create DSPy signature type: {e}") from e
     def _configure_language_model(
         self,
@@ -308,6 +309,7 @@ class DSPyIntegrationMixin:
         self,
         signature: Any,
         override_evaluator_type: AgentType,
+        max_tool_calls: int = 10,
         tools: list[Any] | None = None,
         mcp_tools: list[Any] | None = None,
         kwargs: dict[str, Any] = {},
@@ -370,7 +372,7 @@ class DSPyIntegrationMixin:
                 dspy_program = dspy.ChainOfThought(signature, **kwargs)
             elif selected_type == "ReAct":
                 if not kwargs:
-                    kwargs = {"max_iters": 10}
+                    kwargs = {"max_iters": max_tool_calls}
                 dspy_program = dspy.ReAct(
                     signature, tools=merged_tools or [], **kwargs
                 )
@@ -427,8 +429,7 @@ class DSPyIntegrationMixin:
             final_result = {**inputs, **output_dict}
             lm = dspy.settings.get("lm")
-            cost = sum([x["cost"]
-                       for x in lm.history if x["cost"] is not None])
+            cost = sum([x["cost"] for x in lm.history if x["cost"] is not None])
             lm_history = lm.history
             return final_result, cost, lm_history

flock-core 0.4.505__py3-none-any.whl → 0.4.508__py3-none-any.whl

Potentially problematic release.

flock-core 0.4.505__py3-none-any.whl → 0.4.508__py3-none-any.whl