PyPI - eval-protocol - Versions diffs - 0.2.32__tar.gz → 0.2.34__tar.gz - Mend

eval-protocol 0.2.32.tar.gz → 0.2.34.tar.gz

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (397)

{eval_protocol-0.2.32/eval_protocol.egg-info → eval_protocol-0.2.34}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: eval-protocol
-Version: 0.2.32
+Version: 0.2.34
 Summary: The official Python SDK for Eval Protocol (EP.) EP is an open protocol that standardizes how developers author evals for large language model (LLM) applications.
 Author-email: Fireworks AI <info@fireworks.ai>
 License-Expression: MIT

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/_version.py RENAMED Viewed

@@ -8,11 +8,11 @@ import json
 version_json = '''
 {
- "date": "2025-09-29T16:40:31-0700",
+ "date": "2025-09-30T15:39:15-0700",
  "dirty": false,
  "error": null,
- "full-revisionid": "1744b558ceb39f3a910a898ed6dd3df6a4576691",
- "version": "0.2.32"
+ "full-revisionid": "c09755b30386c03c95bd79d7b142ed614419c7c4",
+ "version": "0.2.34"
 }
 '''  # END VERSION_JSON

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/pytest/evaluation_test.py RENAMED Viewed

@@ -52,10 +52,12 @@ from eval_protocol.pytest.utils import (
     add_cost_metrics,
     log_eval_status_and_rows,
     parse_ep_completion_params,
+    parse_ep_completion_params_overwrite,
     parse_ep_max_concurrent_rollouts,
     parse_ep_max_rows,
     parse_ep_num_runs,
     parse_ep_passed_threshold,
+    parse_ep_dataloaders,
     rollout_processor_with_retry,
     run_tasks_with_eval_progress,
     run_tasks_with_run_progress,
@@ -189,10 +191,18 @@ def evaluation_test(
     max_concurrent_rollouts = parse_ep_max_concurrent_rollouts(max_concurrent_rollouts)
     max_dataset_rows = parse_ep_max_rows(max_dataset_rows)
     completion_params = parse_ep_completion_params(completion_params)
+    completion_params = parse_ep_completion_params_overwrite(completion_params)
     original_completion_params = completion_params
     passed_threshold = parse_ep_passed_threshold(passed_threshold)
+    data_loaders = parse_ep_dataloaders(data_loaders)
     custom_invocation_id = os.environ.get("EP_INVOCATION_ID", None)
+    # ignore other data input params when dataloader is provided
+    if data_loaders:
+        input_dataset = None
+        input_messages = None
+        input_rows = None
     def decorator(
         test_func: TestFunction,
     ) -> TestFunction:

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/pytest/handle_persist_flow.py RENAMED Viewed

@@ -16,9 +16,10 @@ import requests
 def handle_persist_flow(all_results: list[list[EvaluationRow]], test_func_name: str):
     try:
         # Default is to save and upload experiment JSONL files, unless explicitly disabled
-        should_save_and_upload = os.getenv("EP_NO_UPLOAD") != "1"
+        custom_output_dir = os.getenv("EP_OUTPUT_DIR")
+        should_save = os.getenv("EP_NO_UPLOAD") != "1" or custom_output_dir is not None
-        if should_save_and_upload:
+        if should_save:
             current_run_rows = [item for sublist in all_results for item in sublist]
             if current_run_rows:
                 experiments: dict[str, list[EvaluationRow]] = defaultdict(list)
@@ -27,6 +28,8 @@ def handle_persist_flow(all_results: list[list[EvaluationRow]], test_func_name:
                         experiments[row.execution_metadata.experiment_id].append(row)
                 eval_protocol_dir = find_eval_protocol_dir()
+                if custom_output_dir:
+                    eval_protocol_dir = custom_output_dir
                 exp_dir = pathlib.Path(eval_protocol_dir) / "experiment_results"
                 exp_dir.mkdir(parents=True, exist_ok=True)
@@ -81,6 +84,10 @@ def handle_persist_flow(all_results: list[list[EvaluationRow]], test_func_name:
                             json.dump(row_data, f, ensure_ascii=False)
                             f.write("\n")
+                    should_upload = os.getenv("EP_NO_UPLOAD") != "1"
+                    if not should_upload:
+                        continue
                     def get_auth_value(key: str) -> str | None:
                         """Get auth value from config file or environment."""
                         try:

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/pytest/plugin.py RENAMED Viewed

@@ -19,6 +19,7 @@ import json
 import pathlib
 import sys
 from pytest import StashKey
+import pytest
 def pytest_addoption(parser) -> None:
@@ -56,6 +57,7 @@ def pytest_addoption(parser) -> None:
         default=None,
         help=("Write a JSON summary artifact at the given path (e.g., ./outputs/aime_low.json)."),
     )
+    # deprecate this later
     group.addoption(
         "--ep-input-param",
         action="append",
@@ -115,6 +117,27 @@ def pytest_addoption(parser) -> None:
             "Default: false (experiment JSONs are saved and uploaded by default)."
         ),
     )
+    group.addoption(
+        "--ep-jsonl-path",
+        default=None,
+        help=("Load input from a jsonl file that is already in EvaluationRow or openai CHAT format"),
+    )
+    group.addoption(
+        "--ep-completion-params",
+        default=[],
+        action="append",
+        help=("Overwrite completion params with json. Can be used multiple times. "),
+    )
+    group.addoption(
+        "--ep-remote-rollout-processor-base-url",
+        default=None,
+        help=("If set, use this base URL for remote rollout processing. Example: http://localhost:8000"),
+    )
+    group.addoption(
+        "--ep-output-dir",
+        default=None,
+        help=("If set, save evaluation results to this directory in jsonl format."),
+    )
 def _normalize_max_rows(val: Optional[str]) -> Optional[str]:
@@ -240,9 +263,22 @@ def pytest_configure(config) -> None:
     if threshold_env is not None:
         os.environ["EP_PASSED_THRESHOLD"] = threshold_env
+    if config.getoption("--ep-output-dir"):
+        # set this to save eval results to the target dir in jsonl format
+        os.environ["EP_OUTPUT_DIR"] = config.getoption("--ep-output-dir")
     if config.getoption("--ep-no-upload"):
         os.environ["EP_NO_UPLOAD"] = "1"
+    if config.getoption("--ep-jsonl-path"):
+        os.environ["EP_JSONL_PATH"] = config.getoption("--ep-jsonl-path")
+    if config.getoption("--ep-completion-params"):
+        # redump to json to make sure they are legit
+        os.environ["EP_COMPLETION_PARAMS"] = json.dumps(
+            [json.loads(s) for s in config.getoption("--ep-completion-params") or []]
+        )
     # Allow ad-hoc overrides of input params via CLI flags
     try:
         merged: dict = {}

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/pytest/remote_rollout_processor.py RENAMED Viewed

@@ -9,6 +9,7 @@ from eval_protocol.data_loader.dynamic_data_loader import DynamicDataLoader
 from eval_protocol.types.remote_rollout_processor import InitRequest, RolloutMetadata
 from .rollout_processor import RolloutProcessor
 from .types import RolloutProcessorConfig
+import os
 class RemoteRolloutProcessor(RolloutProcessor):
@@ -31,6 +32,8 @@ class RemoteRolloutProcessor(RolloutProcessor):
         # config.kwargs at call time for backward compatibility.
         self._remote_base_url = remote_base_url
         self._model_base_url = model_base_url
+        if os.getenv("EP_REMOTE_ROLLOUT_PROCESSOR_BASE_URL"):
+            self._remote_base_url = os.getenv("EP_REMOTE_ROLLOUT_PROCESSOR_BASE_URL")
         self._poll_interval = poll_interval
         self._timeout_seconds = timeout_seconds
         self._output_data_loader = output_data_loader

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/pytest/utils.py RENAMED Viewed

@@ -19,6 +19,8 @@ from eval_protocol.models import (
     EvaluationThresholdDict,
     Status,
 )
+from eval_protocol.data_loader import DynamicDataLoader
+from eval_protocol.data_loader.models import EvaluationDataLoader
 from eval_protocol.pytest.rollout_processor import RolloutProcessor
 from eval_protocol.pytest.types import (
     RolloutProcessorConfig,
@@ -239,6 +241,45 @@ def parse_ep_completion_params(
     return completion_params
+def parse_ep_completion_params_overwrite(
+    completion_params: Sequence[CompletionParams | None] | None,
+) -> Sequence[CompletionParams | None]:
+    new_completion_params = os.getenv("EP_COMPLETION_PARAMS")
+    if new_completion_params:
+        try:
+            new_completion_params_list = json.loads(new_completion_params)
+            if isinstance(new_completion_params_list, list):
+                return new_completion_params_list
+        except Exception:
+            pass
+    return completion_params or []
+def _rows_from_jsonl(path: str) -> list[EvaluationRow]:
+    rows = []
+    try:
+        with open(path, "r", encoding="utf-8") as f:
+            for line in f:
+                rows.append(EvaluationRow(**json.loads(line)))
+    except Exception as e:
+        print(f"❌ Failed to load rows from JSONL at {path}: {e}")
+        return []
+    return rows
+def parse_ep_dataloaders(
+    dataloaders: Sequence[EvaluationDataLoader] | EvaluationDataLoader | None,
+) -> Sequence[EvaluationDataLoader] | EvaluationDataLoader | None:
+    try:
+        load_from_jsonl_path = os.getenv("EP_JSONL_PATH")
+        if load_from_jsonl_path:
+            return DynamicDataLoader(generators=[lambda path=load_from_jsonl_path: _rows_from_jsonl(path)])
+    except Exception:
+        pass
+    return dataloaders or None
 def parse_ep_passed_threshold(
     default_value: float | EvaluationThresholdDict | EvaluationThreshold | None,
 ) -> EvaluationThreshold | None:

{eval_protocol-0.2.32 → eval_protocol-0.2.34/eval_protocol.egg-info}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: eval-protocol
-Version: 0.2.32
+Version: 0.2.34
 Summary: The official Python SDK for Eval Protocol (EP.) EP is an open protocol that standardizes how developers author evals for large language model (LLM) applications.
 Author-email: Fireworks AI <info@fireworks.ai>
 License-Expression: MIT

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/LICENSE RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/README.md RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/development/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/development/normalize_sandbox_fusion.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/development/utils/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/development/utils/generate_api_key.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/development/utils/subprocess_manager.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/__main__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/adapters/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/adapters/base.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/adapters/bigquery.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/adapters/braintrust.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/adapters/huggingface.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/adapters/langchain.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/adapters/langfuse.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/adapters/langsmith.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/adapters/openai_responses.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/adapters/trl.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/adapters/utils.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/agent/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/agent/models.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/agent/orchestrator.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/agent/resource_abc.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/agent/resource_pool.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/agent/resources/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/agent/resources/bfcl_envs/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/agent/resources/bfcl_envs/gorilla_file_system.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/agent/resources/bfcl_envs/math_api.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/agent/resources/bfcl_envs/posting_api.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/agent/resources/bfcl_sim_api_resource.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/agent/resources/docker_resource.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/agent/resources/filesystem_resource.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/agent/resources/python_state_resource.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/agent/resources/sql_resource.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/agent/task_manager.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/agent/tool_registry.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/auth.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/benchmarks/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/benchmarks/data/airline_dataset.jsonl RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/benchmarks/data/retail_dataset.jsonl RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/benchmarks/test_aime25.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/benchmarks/test_gpqa.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/benchmarks/test_livebench_data_analysis.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/benchmarks/test_tau_bench_airline.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/benchmarks/test_tau_bench_retail.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/cli.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/cli_commands/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/cli_commands/agent_eval_cmd.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/cli_commands/common.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/cli_commands/deploy.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/cli_commands/deploy_mcp.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/cli_commands/logs.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/cli_commands/preview.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/cli_commands/run_eval_cmd.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/common_utils.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/config.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/data_loader/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/data_loader/dynamic_data_loader.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/data_loader/factory_data_loader.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/data_loader/inline_data_loader.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/data_loader/models.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/dataset_logger/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/dataset_logger/dataset_logger.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/dataset_logger/local_fs_dataset_logger_adapter.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/dataset_logger/sqlite_dataset_logger_adapter.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/dataset_logger/sqlite_evaluation_row_store.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/datasets/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/datasets/loader.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/directory_utils.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/evaluation.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/event_bus/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/event_bus/event_bus.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/event_bus/logger.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/event_bus/sqlite_event_bus.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/event_bus/sqlite_event_bus_database.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/execution/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/execution/pipeline.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/gcp_tools.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/generation/cache.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/generation/clients/base.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/generation/clients.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/generic_server.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/get_pep440_version.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/human_id/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/human_id/dictionary.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/integrations/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/integrations/deepeval.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/integrations/openeval.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/integrations/trl.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/logging_utils.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp/adapter.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp/client/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp/client/connection.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp/clients.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp/execution/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp/execution/base_policy.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp/execution/manager.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp/execution/policy.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp/grid_renderer.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp/mcp_multi_client.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp/mcpgym.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp/process_manager.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp/session/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp/session/manager.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp/simple_process_manager.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp/simulation_server.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp_agent/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp_agent/config.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp_agent/main.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp_agent/orchestration/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp_agent/orchestration/base_client.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp_agent/orchestration/local_docker_client.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp_agent/orchestration/stdio_mcp_client_helper.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp_env.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp_servers/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp_servers/tau2/README.md RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp_servers/tau2/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp_servers/tau2/airplane_environment/airline_environment.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp_servers/tau2/mock_environment/mock_environment.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp_servers/tau2/retail_environment/retail_environment.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp_servers/tau2/server.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp_servers/tau2/tau2_mcp.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp_servers/tau2/tests/system_prompts/airline_agent_system_prompt.md RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp_servers/tau2/tests/system_prompts/mock_agent_system_prompt.md RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp_servers/tau2/tests/system_prompts/retail_agent_system_prompt.md RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/mcp_servers/tau2/tests/test_tau2_e2e.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/models.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/packaging.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/platform_api.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/playback_policy.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/pytest/__init__.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/pytest/default_agent_rollout_processor.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/pytest/default_dataset_adapter.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/pytest/default_langchain_rollout_processor.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/pytest/default_mcp_gym_rollout_processor.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/pytest/default_no_op_rollout_processor.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/pytest/default_pydantic_ai_rollout_processor.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/pytest/default_single_turn_rollout_process.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/pytest/dual_mode_wrapper.py RENAMED Viewed

File without changes

{eval_protocol-0.2.32 → eval_protocol-0.2.34}/eval_protocol/pytest/evaluation_test_postprocess.py RENAMED Viewed

File without changes

eval-protocol 0.2.32__tar.gz → 0.2.34__tar.gz

eval-protocol 0.2.32.tar.gz → 0.2.34.tar.gz