PyPI - eval-protocol - Versions diffs - 0.2.30__tar.gz → 0.2.32__tar.gz - Mend

eval-protocol 0.2.30__tar.gz → 0.2.32__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (397) hide show

{eval_protocol-0.2.30/eval_protocol.egg-info → eval_protocol-0.2.32}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: eval-protocol
-Version: 0.2.30
+Version: 0.2.32
 Summary: The official Python SDK for Eval Protocol (EP.) EP is an open protocol that standardizes how developers author evals for large language model (LLM) applications.
 Author-email: Fireworks AI <info@fireworks.ai>
 License-Expression: MIT

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/_version.py RENAMED Viewed

@@ -8,11 +8,11 @@ import json
 version_json = '''
 {
- "date": "2025-09-26T14:10:14-0700",
+ "date": "2025-09-29T16:40:31-0700",
  "dirty": false,
  "error": null,
- "full-revisionid": "626a125899fb42ed135a1f223b3e827f37e44ae0",
- "version": "0.2.30"
+ "full-revisionid": "1744b558ceb39f3a910a898ed6dd3df6a4576691",
+ "version": "0.2.32"
 }
 '''  # END VERSION_JSON

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/pytest/evaluation_test.py RENAMED Viewed

@@ -79,6 +79,7 @@ def evaluation_test(
     aggregation_method: AggregationMethod = "mean",
     passed_threshold: EvaluationThreshold | float | EvaluationThresholdDict | None = None,
     num_runs: int = 1,
+    filtered_row_ids: Sequence[str] | None = None,
     max_dataset_rows: int | None = None,
     mcp_config_path: str | None = None,
     max_concurrent_rollouts: int = 8,
@@ -146,6 +147,7 @@ def evaluation_test(
             Success rate must be above success, and if set, standard error must be below standard_error.
             Success rate +/- one standard_error is equivalent to 68% confidence interval.
         num_runs: Number of times to repeat the rollout and evaluations.
+        filtered_row_ids: List of row_ids to filter for the evaluation. If provided, only the rows with the given row_ids will be evaluated.
         max_dataset_rows: Limit dataset to the first N rows.
         mcp_config_path: Path to MCP config file that follows MCPMultiClientConfiguration schema
         max_concurrent_rollouts: Maximum number of concurrent rollouts to run in parallel.
@@ -262,6 +264,9 @@ def evaluation_test(
                             results = data_loader.load()
                             for result in results:
                                 data.extend(result.rows)
+                        # Apply max_dataset_rows limit to data from data loaders
+                        if max_dataset_rows is not None:
+                            data = data[:max_dataset_rows]
                     elif "dataset_path" in kwargs and kwargs["dataset_path"] is not None:
                         ds_arg: list[str] = kwargs["dataset_path"]
                         # Support either a single path or a list of paths; if a list is provided,
@@ -283,6 +288,9 @@ def evaluation_test(
                     else:
                         raise ValueError("No input dataset, input messages, or input rows provided")
+                    if filtered_row_ids is not None:
+                        data = [row for row in data if row.input_metadata.row_id in filtered_row_ids]
                     """
                     data_loaders handles preprocess_fn internally so we want
                     to specially handle data_loaders here so we don't double

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/pytest/parameterize.py RENAMED Viewed

@@ -73,6 +73,9 @@ def _is_pytest_parametrize_with_completion_params(decorator: ast.expr) -> bool:
                 and decorator.func.value.attr == "mark"
                 and decorator.func.attr == "parametrize"
             ):
+                # Validate argvalues if present
+                _validate_parametrize_argvalues(decorator)
                 # Check positional arguments first (argnames is typically the first positional arg)
                 if len(decorator.args) > 0:
                     argnames_arg = decorator.args[0]
@@ -88,6 +91,90 @@ def _is_pytest_parametrize_with_completion_params(decorator: ast.expr) -> bool:
     return False
+def _ast_dict_to_string(dict_node: ast.Dict) -> str:
+    """
+    Convert an AST Dict node to its string representation.
+    Args:
+        dict_node: AST node representing a dictionary
+    Returns:
+        String representation of the dictionary
+    """
+    if not dict_node.keys:
+        return "{}"
+    pairs = []
+    for key, value in zip(dict_node.keys, dict_node.values):
+        if key is not None:
+            key_str = _ast_node_to_string(key)
+            value_str = _ast_node_to_string(value)
+            pairs.append(f"{key_str}: {value_str}")
+    return "{" + ", ".join(pairs) + "}"
+def _ast_node_to_string(node: ast.expr) -> str:
+    """
+    Convert an AST node to its string representation.
+    Args:
+        node: AST node to convert
+    Returns:
+        String representation of the node
+    """
+    if isinstance(node, ast.Constant):
+        if isinstance(node.value, str):
+            return repr(node.value)
+        else:
+            return str(node.value)
+    elif isinstance(node, ast.Name):
+        return node.id
+    elif isinstance(node, ast.Dict):
+        return _ast_dict_to_string(node)
+    elif isinstance(node, ast.List):
+        elements = [_ast_node_to_string(elt) for elt in node.elts]
+        return "[" + ", ".join(elements) + "]"
+    elif isinstance(node, ast.Tuple):
+        elements = [_ast_node_to_string(elt) for elt in node.elts]
+        return "(" + ", ".join(elements) + ")"
+    else:
+        # For complex expressions, return a simplified representation
+        return "<complex expression>"
+def _validate_parametrize_argvalues(decorator: ast.Call) -> None:
+    """
+    Validate that pytest.mark.parametrize argvalues is a list/tuple, not a dict.
+    Args:
+        decorator: AST node representing the pytest.mark.parametrize decorator call
+    Raises:
+        ValueError: If argvalues is a dict instead of a list/tuple
+    """
+    # Check positional arguments (argvalues is typically the second positional arg)
+    if len(decorator.args) > 1:
+        argvalues_arg = decorator.args[1]
+        if isinstance(argvalues_arg, ast.Dict):
+            dict_repr = _ast_dict_to_string(argvalues_arg)
+            raise ValueError(
+                f"For evaluation_test with completion_params, pytest.mark.parametrize argvalues must be a list or tuple, not a dict. "
+                f"Use [{dict_repr}] instead of {dict_repr}."
+            )
+    # Check keyword arguments for argvalues
+    for keyword in decorator.keywords:
+        if keyword.arg == "argvalues":
+            if isinstance(keyword.value, ast.Dict):
+                dict_repr = _ast_dict_to_string(keyword.value)
+                raise ValueError(
+                    f"For evaluation_test with completion_params, pytest.mark.parametrize argvalues must be a list or tuple, not a dict. "
+                    f"Use [{dict_repr}] instead of {dict_repr}."
+                )
 def _check_argnames_for_completion_params(argnames_node: ast.expr) -> bool:
     """
     Check if an argnames AST node contains "completion_params".

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/pytest/remote_rollout_processor.py RENAMED Viewed

@@ -22,6 +22,7 @@ class RemoteRolloutProcessor(RolloutProcessor):
         self,
         *,
         remote_base_url: Optional[str] = None,
+        model_base_url: Optional[str] = None,
         poll_interval: float = 1.0,
         timeout_seconds: float = 120.0,
         output_data_loader: Callable[[str], DynamicDataLoader],
@@ -29,6 +30,7 @@ class RemoteRolloutProcessor(RolloutProcessor):
         # Prefer constructor-provided configuration. These can be overridden via
         # config.kwargs at call time for backward compatibility.
         self._remote_base_url = remote_base_url
+        self._model_base_url = model_base_url
         self._poll_interval = poll_interval
         self._timeout_seconds = timeout_seconds
         self._output_data_loader = output_data_loader
@@ -38,6 +40,7 @@ class RemoteRolloutProcessor(RolloutProcessor):
         # Start with constructor values
         remote_base_url: Optional[str] = self._remote_base_url
+        model_base_url: Optional[str] = self._model_base_url
         poll_interval: float = self._poll_interval
         timeout_seconds: float = self._timeout_seconds
@@ -112,14 +115,25 @@ class RemoteRolloutProcessor(RolloutProcessor):
                 messages=clean_messages,
                 tools=row.tools,
                 metadata=meta,
-                model_base_url=config.kwargs.get("model_base_url", None),
+                model_base_url=model_base_url,
             )
             # Fire-and-poll
             def _post_init() -> None:
                 url = f"{remote_base_url}/init"
-                r = requests.post(url, json=init_payload.model_dump(), timeout=30)
-                r.raise_for_status()
+                try:
+                    r = requests.post(url, json=init_payload.model_dump(), timeout=30)
+                    r.raise_for_status()
+                except requests.exceptions.Timeout:
+                    raise TimeoutError(
+                        "The /init endpoint timed out after 30 seconds. "
+                        "CRITICAL: The /init endpoint must return immediately (within 30s) and NOT block on rollout execution. "
+                        "Your remote server should:\n"
+                        "1. Accept the /init request and return a 200 response immediately\n"
+                        "2. Process the actual rollout asynchronously in the background\n"
+                        "3. Use the /status endpoint to report progress\n"
+                        "For Python/Node.js: Start a separate process per rollout to avoid blocking the /init response."
+                    )
             await asyncio.to_thread(_post_init)
@@ -141,7 +155,13 @@ class RemoteRolloutProcessor(RolloutProcessor):
                 except Exception:
                     # transient errors; continue polling
                     pass
                 await asyncio.sleep(poll_interval)
+            else:
+                # Loop completed without breaking, which means we timed out
+                row.rollout_status = Status.rollout_error(
+                    f"Rollout {row.execution_metadata.rollout_id} timed out after {timeout_seconds} seconds"
+                )
             # Update duration, regardless of termination
             row.execution_metadata.duration_seconds = time.perf_counter() - start_time
@@ -164,14 +184,28 @@ class RemoteRolloutProcessor(RolloutProcessor):
             elif len(output_rows) == 1:  # Return the Langfuse row
                 langfuse_row = output_rows[0]
                 langfuse_row.input_metadata.completion_params = row.input_metadata.completion_params
+                # merge dataset_info dicts on input_metadata
+                if langfuse_row.input_metadata.dataset_info and row.input_metadata.dataset_info:
+                    langfuse_row.input_metadata.dataset_info = {
+                        **row.input_metadata.dataset_info,
+                        **langfuse_row.input_metadata.dataset_info,
+                    }
+                elif row.input_metadata.dataset_info:
+                    langfuse_row.input_metadata.dataset_info = row.input_metadata.dataset_info
                 langfuse_row.eval_metadata = row.eval_metadata
+                langfuse_row.ground_truth = row.ground_truth
                 return langfuse_row
             else:
                 raise ValueError("RemoteRolloutProcessor's output_data_loader should return exactly one row.")
-        for r in rows:
-            tasks.append(asyncio.create_task(_process_row(r)))
+        semaphore = config.semaphore
+        async def _sem_wrapper(r: EvaluationRow) -> EvaluationRow:
+            async with semaphore:
+                result = await _process_row(r)
+                return result
+        tasks = [asyncio.create_task(_sem_wrapper(row)) for row in rows]
         return tasks
     def cleanup(self) -> None:

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/types/remote_rollout_processor.py RENAMED Viewed

@@ -4,7 +4,7 @@ Request and response models for remote rollout processor servers.
 from typing import Any, Dict, List, Optional
 from pydantic import BaseModel, Field
-from eval_protocol.models import Message
+from eval_protocol.models import Message, Status
 class RolloutMetadata(BaseModel):
@@ -21,7 +21,7 @@ class InitRequest(BaseModel):
     """Request model for POST /init endpoint."""
     model: str
-    messages: List[Message] = Field(min_length=1)
+    messages: Optional[List[Message]] = None
     tools: Optional[List[Dict[str, Any]]] = None
     model_base_url: Optional[str] = None
@@ -40,6 +40,12 @@ class StatusResponse(BaseModel):
     terminated: bool
     info: Optional[Dict[str, Any]] = None
+    status: Optional[Status] = None
+    """
+    Optional status indicator for the rollout to be used by eval-protocol. This
+    is useful to distinguish between successful and failed rollouts.
+    """
 def create_langfuse_config_tags(init_request: InitRequest) -> List[str]:
     """Create Langfuse tags from InitRequest metadata."""

{eval_protocol-0.2.30 → eval_protocol-0.2.32/eval_protocol.egg-info}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: eval-protocol
-Version: 0.2.30
+Version: 0.2.32
 Summary: The official Python SDK for Eval Protocol (EP.) EP is an open protocol that standardizes how developers author evals for large language model (LLM) applications.
 Author-email: Fireworks AI <info@fireworks.ai>
 License-Expression: MIT

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/LICENSE RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/README.md RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/development/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/development/normalize_sandbox_fusion.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/development/utils/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/development/utils/generate_api_key.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/development/utils/subprocess_manager.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/__main__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/adapters/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/adapters/base.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/adapters/bigquery.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/adapters/braintrust.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/adapters/huggingface.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/adapters/langchain.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/adapters/langfuse.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/adapters/langsmith.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/adapters/openai_responses.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/adapters/trl.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/adapters/utils.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/agent/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/agent/models.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/agent/orchestrator.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/agent/resource_abc.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/agent/resource_pool.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/agent/resources/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/agent/resources/bfcl_envs/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/agent/resources/bfcl_envs/gorilla_file_system.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/agent/resources/bfcl_envs/math_api.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/agent/resources/bfcl_envs/posting_api.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/agent/resources/bfcl_sim_api_resource.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/agent/resources/docker_resource.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/agent/resources/filesystem_resource.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/agent/resources/python_state_resource.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/agent/resources/sql_resource.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/agent/task_manager.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/agent/tool_registry.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/auth.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/benchmarks/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/benchmarks/data/airline_dataset.jsonl RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/benchmarks/data/retail_dataset.jsonl RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/benchmarks/test_aime25.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/benchmarks/test_gpqa.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/benchmarks/test_livebench_data_analysis.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/benchmarks/test_tau_bench_airline.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/benchmarks/test_tau_bench_retail.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/cli.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/cli_commands/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/cli_commands/agent_eval_cmd.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/cli_commands/common.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/cli_commands/deploy.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/cli_commands/deploy_mcp.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/cli_commands/logs.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/cli_commands/preview.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/cli_commands/run_eval_cmd.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/common_utils.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/config.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/data_loader/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/data_loader/dynamic_data_loader.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/data_loader/factory_data_loader.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/data_loader/inline_data_loader.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/data_loader/models.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/dataset_logger/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/dataset_logger/dataset_logger.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/dataset_logger/local_fs_dataset_logger_adapter.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/dataset_logger/sqlite_dataset_logger_adapter.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/dataset_logger/sqlite_evaluation_row_store.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/datasets/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/datasets/loader.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/directory_utils.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/evaluation.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/event_bus/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/event_bus/event_bus.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/event_bus/logger.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/event_bus/sqlite_event_bus.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/event_bus/sqlite_event_bus_database.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/execution/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/execution/pipeline.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/gcp_tools.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/generation/cache.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/generation/clients/base.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/generation/clients.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/generic_server.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/get_pep440_version.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/human_id/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/human_id/dictionary.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/integrations/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/integrations/deepeval.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/integrations/openeval.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/integrations/trl.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/logging_utils.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp/adapter.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp/client/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp/client/connection.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp/clients.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp/execution/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp/execution/base_policy.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp/execution/manager.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp/execution/policy.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp/grid_renderer.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp/mcp_multi_client.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp/mcpgym.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp/process_manager.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp/session/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp/session/manager.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp/simple_process_manager.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp/simulation_server.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp_agent/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp_agent/config.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp_agent/main.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp_agent/orchestration/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp_agent/orchestration/base_client.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp_agent/orchestration/local_docker_client.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp_agent/orchestration/stdio_mcp_client_helper.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp_env.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp_servers/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp_servers/tau2/README.md RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp_servers/tau2/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp_servers/tau2/airplane_environment/airline_environment.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp_servers/tau2/mock_environment/mock_environment.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp_servers/tau2/retail_environment/retail_environment.py RENAMED Viewed

File without changes

{eval_protocol-0.2.30 → eval_protocol-0.2.32}/eval_protocol/mcp_servers/tau2/server.py RENAMED Viewed

File without changes

eval-protocol 0.2.30__tar.gz → 0.2.32__tar.gz

eval-protocol 0.2.30__tar.gz → 0.2.32__tar.gz