PyPI - eval-protocol - Versions diffs - 0.3.23__tar.gz → 0.3.25__tar.gz - Mend

eval-protocol 0.3.23.tar.gz → 0.3.25.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (474) hide show

{eval_protocol-0.3.23/eval_protocol.egg-info → eval_protocol-0.3.25}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: eval-protocol
-Version: 0.3.23
+Version: 0.3.25
 Summary: The official Python SDK for Eval Protocol (EP.) EP is an open protocol that standardizes how developers author evals for large language model (LLM) applications.
 Author-email: Fireworks AI <info@fireworks.ai>
 License-Expression: MIT
@@ -24,7 +24,7 @@ Requires-Dist: hydra-core>=1.3.2
 Requires-Dist: omegaconf>=2.3.0
 Requires-Dist: httpx>=0.24.0
 Requires-Dist: anthropic>=0.59.0
-Requires-Dist: litellm<1.82.0,>=1.81.0
+Requires-Dist: litellm<1.75.0
 Requires-Dist: pytest>=6.0.0
 Requires-Dist: pytest-asyncio>=0.21.0
 Requires-Dist: peewee>=3.18.2
@@ -111,14 +111,11 @@ Requires-Dist: langchain-core>=0.3.75; extra == "langgraph"
 Provides-Extra: langgraph-tools
 Requires-Dist: langgraph>=0.6.7; extra == "langgraph-tools"
 Requires-Dist: langchain>=0.3.0; extra == "langgraph-tools"
+Requires-Dist: langchain-fireworks>=0.3.0; extra == "langgraph-tools"
 Provides-Extra: proxy
 Requires-Dist: redis>=5.0.0; extra == "proxy"
 Requires-Dist: langfuse>=2.0.0; extra == "proxy"
 Requires-Dist: uuid6>=2025.0.0; extra == "proxy"
-Requires-Dist: litellm<1.82.0,>=1.81.0; extra == "proxy"
-Requires-Dist: opentelemetry-api>=1.29.0; extra == "proxy"
-Requires-Dist: opentelemetry-sdk>=1.29.0; extra == "proxy"
-Requires-Dist: opentelemetry-exporter-otlp>=1.29.0; extra == "proxy"
 Dynamic: license-file
 # Eval Protocol

{eval_protocol-0.3.23 → eval_protocol-0.3.25}/eval_protocol/_version.py RENAMED Viewed

@@ -8,11 +8,11 @@ import json
 version_json = '''
 {
- "date": "2026-03-06T17:59:19-0800",
+ "date": "2026-03-13T16:09:44-0700",
  "dirty": false,
  "error": null,
- "full-revisionid": "5ac0bb46b02200b500ae535dcc5a86c4179c8408",
- "version": "0.3.23"
+ "full-revisionid": "3c8d8f23f7b301697f246c64e57d08fa1c7af50b",
+ "version": "0.3.25"
 }
 '''  # END VERSION_JSON

{eval_protocol-0.3.23 → eval_protocol-0.3.25}/eval_protocol/adapters/fireworks_tracing.py RENAMED Viewed

@@ -8,10 +8,8 @@ from __future__ import annotations
 import logging
 import requests
 from datetime import datetime
-import ast
-import json
-import os
 from typing import Any, Dict, List, Optional, Protocol
+import os
 from eval_protocol.models import EvaluationRow, InputMetadata, ExecutionMetadata, Message
 from .base import BaseAdapter
@@ -46,43 +44,6 @@ class TraceDictConverter(Protocol):
         ...
-def extract_otel_attributes(observations: List[Dict[str, Any]]) -> Optional[Dict[str, Any]]:
-    """Attempt to extract and parse attributes from raw_gen_ai_request observation. This only works when stored in OTEL format.
-    Args:
-        observations: List of observation dictionaries from the trace
-    Returns:
-        Dict with all attributes parsed. Or None if not found.
-    """
-    for obs in observations:
-        if obs.get("name") == "raw_gen_ai_request" and obs.get("type") == "SPAN":
-            metadata = obs.get("metadata") or {}
-            attributes = metadata.get("attributes") or {}
-            result: Dict[str, Any] = {}
-            for key, value in attributes.items():
-                # Try to parse stringified objects (could be Python repr or JSON)
-                if isinstance(value, str) and value.startswith(("[", "{")):
-                    try:
-                        result[key] = ast.literal_eval(value)
-                    except Exception as e:
-                        logger.debug("Failed to parse %s with ast.literal_eval: %s", key, e)
-                        try:
-                            result[key] = json.loads(value)
-                        except Exception as e:
-                            logger.debug("Failed to parse %s with json.loads: %s", key, e)
-                            result[key] = value
-                else:
-                    result[key] = value
-            if result:
-                return result
-    return None
 def convert_trace_dict_to_evaluation_row(
     trace: Dict[str, Any], include_tool_calls: bool = True, span_name: Optional[str] = None
 ) -> Optional[EvaluationRow]:
@@ -135,19 +96,6 @@ def convert_trace_dict_to_evaluation_row(
                 ):
                     break  # Break early if we've found all the metadata we need
-        observations = trace.get("observations") or []
-        # We can only extract when stored in OTEL format.
-        otel_attributes = extract_otel_attributes(observations)
-        if otel_attributes:
-            # Find choices from any provider (llm.*.choices pattern)
-            choices = None
-            for key, value in otel_attributes.items():
-                if key.endswith(".choices") and isinstance(value, list):
-                    choices = value
-                    break
-            if choices and len(choices) > 0:
-                execution_metadata.finish_reason = choices[0].get("finish_reason")
         return EvaluationRow(
             messages=messages,
             tools=tools,
@@ -212,7 +160,7 @@ def extract_messages_from_trace_dict(
         # Fallback: use the last GENERATION observation which typically contains full chat history
         if not messages:
             try:
-                all_observations = trace.get("observations") or []
+                all_observations = trace.get("observations", [])
                 gens = [obs for obs in all_observations if obs.get("type") == "GENERATION"]
                 if gens:
                     gens.sort(key=lambda x: x.get("start_time", ""))
@@ -238,7 +186,7 @@ def get_final_generation_in_span_dict(trace: Dict[str, Any], span_name: str) ->
         The final generation dictionary, or None if not found
     """
     # Get all observations from the trace
-    all_observations = trace.get("observations") or []
+    all_observations = trace.get("observations", [])
     # Find a span with the given name that has generation children
     parent_span = None

{eval_protocol-0.3.23 → eval_protocol-0.3.25}/eval_protocol/proxy/proxy_core/app.py RENAMED Viewed

@@ -15,7 +15,7 @@ from contextlib import asynccontextmanager
 from .models import ProxyConfig, LangfuseTracesResponse, TracesParams, ChatParams, ChatRequestHook, TracesRequestHook
 from .auth import AuthProvider, NoAuthProvider
-from .litellm import handle_chat_completion
+from .litellm import handle_chat_completion, proxy_to_litellm
 from .langfuse import fetch_langfuse_traces, pointwise_fetch_langfuse_trace
 # Configure logging before any other imports (so all modules inherit this config)
@@ -35,6 +35,10 @@ def build_proxy_config(
     preprocess_traces_request: Optional[TracesRequestHook] = None,
 ) -> ProxyConfig:
     """Load environment and secrets, and build ProxyConfig"""
+    # Env
+    litellm_url = os.getenv("LITELLM_URL")
+    if not litellm_url:
+        raise ValueError("LITELLM_URL environment variable must be set")
     request_timeout = float(os.getenv("REQUEST_TIMEOUT", "300.0"))
     langfuse_host = os.getenv("LANGFUSE_HOST", "https://cloud.langfuse.com")
@@ -62,6 +66,7 @@ def build_proxy_config(
         raise ValueError(f"Invalid format in secrets file {secrets_path.name}: {e}")
     return ProxyConfig(
+        litellm_url=litellm_url,
         request_timeout=request_timeout,
         langfuse_host=langfuse_host,
         langfuse_keys=langfuse_keys,
@@ -108,16 +113,6 @@ def create_app(
         app.state.config = build_proxy_config(preprocess_chat_request, preprocess_traces_request)
         app.state.redis = init_redis()
-        config = app.state.config
-        default_keys = config.langfuse_keys[config.default_project_id]
-        os.environ["LANGFUSE_PUBLIC_KEY"] = default_keys["public_key"]
-        os.environ["LANGFUSE_SECRET_KEY"] = default_keys["secret_key"]
-        os.environ.setdefault("LANGFUSE_HOST", config.langfuse_host)
-        import litellm
-        litellm.callbacks = ["langfuse_otel"]
         try:
             yield
         finally:
@@ -302,4 +297,13 @@ def create_app(
     async def health():
         return {"status": "healthy", "service": "metadata-proxy"}
+    # Catch-all
+    @app.api_route("/{path:path}", methods=["GET", "POST", "PUT", "DELETE", "PATCH"])
+    async def catch_all_proxy(
+        path: str,
+        request: Request,
+        config: ProxyConfig = Depends(get_config),
+    ):
+        return await proxy_to_litellm(config, path, request)
     return app

{eval_protocol-0.3.23 → eval_protocol-0.3.25}/eval_protocol/proxy/proxy_core/langfuse.py RENAMED Viewed

@@ -50,7 +50,6 @@ def _serialize_trace_to_dict(trace_full: Any) -> Dict[str, Any]:
                 "input": getattr(obs, "input", None),
                 "output": getattr(obs, "output", None),
                 "parent_observation_id": getattr(obs, "parent_observation_id", None),
-                "metadata": getattr(obs, "metadata", None),
             }
             for obs in getattr(trace_full, "observations", [])
         ]

eval_protocol-0.3.25/eval_protocol/proxy/proxy_core/litellm.py ADDED Viewed

@@ -0,0 +1,173 @@
+"""
+LiteLLM client - handles all communication with LiteLLM service.
+"""
+import json
+import base64
+import httpx
+import logging
+from uuid6 import uuid7
+from fastapi import Request, Response, HTTPException
+import redis
+from .redis_utils import register_insertion_id
+from .models import ProxyConfig, ChatParams
+logger = logging.getLogger(__name__)
+async def handle_chat_completion(
+    config: ProxyConfig,
+    redis_client: redis.Redis,
+    request: Request,
+    params: ChatParams,
+) -> Response:
+    """
+    Handle chat completion requests and forward to LiteLLM.
+    If metadata IDs (rollout_id, etc.) are provided, they'll be added as tags
+    and the assistant message count will be tracked in Redis.
+    If encoded_base_url is provided, it will be decoded and added to the request.
+    """
+    body = await request.body()
+    data = json.loads(body) if body else {}
+    if config.preprocess_chat_request:
+        data, params = config.preprocess_chat_request(data, request, params)
+    project_id = params.project_id
+    rollout_id = params.rollout_id
+    invocation_id = params.invocation_id
+    experiment_id = params.experiment_id
+    run_id = params.run_id
+    row_id = params.row_id
+    encoded_base_url = params.encoded_base_url
+    # Use default project if not specified
+    if project_id is None:
+        project_id = config.default_project_id
+    # Decode and add base_url if provided
+    if encoded_base_url:
+        try:
+            # Decode from URL-safe base64
+            decoded_bytes = base64.urlsafe_b64decode(encoded_base_url)
+            base_url = decoded_bytes.decode("utf-8")
+            data["base_url"] = base_url
+            logger.debug(f"Decoded base_url: {base_url}")
+        except Exception as e:
+            logger.error(f"Failed to decode base_url: {e}")
+            raise HTTPException(status_code=400, detail=f"Invalid encoded_base_url: {str(e)}")
+    # Extract API key from Authorization header and inject into request body
+    auth_header = request.headers.get("authorization", "")
+    if auth_header.startswith("Bearer "):
+        api_key = auth_header.replace("Bearer ", "").strip()
+        # Only inject API key if model is a Fireworks model
+        model = data.get("model")
+        if model and isinstance(model, str) and model.startswith("fireworks_ai"):
+            data["api_key"] = api_key
+    # If metadata IDs are provided, add them as tags
+    insertion_id = None
+    if rollout_id is not None:
+        insertion_id = str(uuid7())
+        if "metadata" not in data:
+            data["metadata"] = {}
+        if "tags" not in data["metadata"]:
+            data["metadata"]["tags"] = []
+        # Add extracted IDs as tags
+        data["metadata"]["tags"].extend(
+            [
+                f"rollout_id:{rollout_id}",
+                f"insertion_id:{insertion_id}",
+                f"invocation_id:{invocation_id}",
+                f"experiment_id:{experiment_id}",
+                f"run_id:{run_id}",
+                f"row_id:{row_id}",
+            ]
+        )
+    # Add Langfuse configuration
+    data["langfuse_public_key"] = config.langfuse_keys[project_id]["public_key"]
+    data["langfuse_secret_key"] = config.langfuse_keys[project_id]["secret_key"]
+    data["langfuse_host"] = config.langfuse_host
+    # Forward to LiteLLM's standard /chat/completions endpoint
+    # Set longer timeout for LLM API calls (LLMs can be slow)
+    timeout = httpx.Timeout(config.request_timeout)
+    async with httpx.AsyncClient(timeout=timeout) as client:
+        # Copy headers from original request but exclude content-length (httpx will set it correctly)
+        headers = dict(request.headers)
+        headers.pop("host", None)
+        headers.pop("content-length", None)  # Let httpx calculate the correct length
+        headers["content-type"] = "application/json"
+        # Forward to LiteLLM
+        litellm_url = f"{config.litellm_url}/chat/completions"
+        response = await client.post(
+            litellm_url,
+            json=data,  # httpx will serialize and set correct Content-Length
+            headers=headers,
+        )
+        # Register insertion_id in Redis only on successful response
+        if response.status_code == 200 and insertion_id is not None and rollout_id is not None:
+            register_insertion_id(redis_client, rollout_id, insertion_id)
+        # Return the response
+        return Response(
+            content=response.content,
+            status_code=response.status_code,
+            headers=dict(response.headers),
+        )
+async def proxy_to_litellm(config: ProxyConfig, path: str, request: Request) -> Response:
+    """
+    Catch-all proxy: Forward any request to LiteLLM, extracting API key from Authorization header.
+    """
+    # Set longer timeout for LLM API calls (LLMs can be slow)
+    timeout = httpx.Timeout(config.request_timeout)
+    async with httpx.AsyncClient(timeout=timeout) as client:
+        # Copy headers
+        headers = dict(request.headers)
+        headers.pop("host", None)
+        headers.pop("content-length", None)
+        # Get body
+        body = await request.body()
+        # Pass through API key from Authorization header
+        if request.method in ["POST", "PUT", "PATCH"] and body:
+            try:
+                data = json.loads(body)
+                auth_header = request.headers.get("authorization", "")
+                if auth_header.startswith("Bearer "):
+                    api_key = auth_header.replace("Bearer ", "").strip()
+                    data["api_key"] = api_key
+                # Re-serialize
+                body = json.dumps(data).encode()
+            except json.JSONDecodeError:
+                pass
+        # Forward to LiteLLM
+        litellm_url = f"{config.litellm_url}/{path}"
+        response = await client.request(
+            method=request.method,
+            url=litellm_url,
+            headers=headers,
+            content=body,
+        )
+        return Response(
+            content=response.content,
+            status_code=response.status_code,
+            headers=dict(response.headers),
+        )

{eval_protocol-0.3.23 → eval_protocol-0.3.25}/eval_protocol/proxy/proxy_core/models.py RENAMED Viewed

@@ -53,6 +53,7 @@ class TracesParams(BaseModel):
 class ProxyConfig(BaseModel):
     """Configuration model for the LiteLLM Metadata Proxy"""
+    litellm_url: str
     request_timeout: float = 300.0
     langfuse_host: str
     langfuse_keys: Dict[str, Dict[str, str]]
@@ -72,7 +73,6 @@ class ObservationResponse(BaseModel):
     input: Optional[Any] = None
     output: Optional[Any] = None
     parent_observation_id: Optional[str] = None
-    metadata: Optional[Dict[str, Any]] = None
 class TraceResponse(BaseModel):

{eval_protocol-0.3.23 → eval_protocol-0.3.25}/eval_protocol/pytest/evaluation_test.py RENAMED Viewed

@@ -449,6 +449,8 @@ def evaluation_test(
                         finally:
                             if output_buffer:
                                 await output_buffer.close()
+                            await rollout_processor.acleanup()
+                            rollout_processor.cleanup()
                         for res in priority_results:
                             run_idx = (res.execution_metadata.extra or {}).get("run_index", 0)
@@ -697,15 +699,19 @@ def evaluation_test(
                         # Lazy import (cached after first import above)
                         from eval_protocol.pytest.default_mcp_gym_rollout_processor import MCPGymRolloutProcessor
-                        if isinstance(rollout_processor, MCPGymRolloutProcessor):
-                            # For MCPGymRolloutProcessor, create and execute tasks one at a time to avoid port conflicts
-                            for run_idx in range(num_runs):
-                                task = asyncio.create_task(execute_run(run_idx, config))
-                                await task
-                        else:
-                            # For other processors, create all tasks at once and run in parallel
-                            # Concurrency is now controlled by the shared semaphore in each rollout processor
-                            await run_tasks_with_run_progress(execute_run, num_runs, config)
+                        try:
+                            if isinstance(rollout_processor, MCPGymRolloutProcessor):
+                                # For MCPGymRolloutProcessor, create and execute tasks one at a time to avoid port conflicts
+                                for run_idx in range(num_runs):
+                                    task = asyncio.create_task(execute_run(run_idx, config))
+                                    await task
+                            else:
+                                # For other processors, create all tasks at once and run in parallel
+                                # Concurrency is now controlled by the shared semaphore in each rollout processor
+                                await run_tasks_with_run_progress(execute_run, num_runs, config)
+                        finally:
+                            await rollout_processor.acleanup()
+                            rollout_processor.cleanup()
                         experiment_duration_seconds = time.perf_counter() - experiment_start_time

{eval_protocol-0.3.23 → eval_protocol-0.3.25}/eval_protocol/pytest/evaluation_test_utils.py RENAMED Viewed

@@ -476,8 +476,12 @@ async def rollout_processor_with_retry(
                 yield result
     finally:
-        await rollout_processor.acleanup()
-        rollout_processor.cleanup()
+        # Cleanup is intentionally NOT called here. rollout_processor_with_retry
+        # is invoked per-run, but the processor (and its session) is shared
+        # across parallel runs.  Closing per-run would kill in-flight requests
+        # in other runs.  Cleanup is called once after all runs complete in
+        # evaluation_test.py.
+        pass
 def sanitize_filename(text: str) -> str:

{eval_protocol-0.3.23 → eval_protocol-0.3.25}/eval_protocol/pytest/exception_config.py RENAMED Viewed

@@ -23,6 +23,7 @@ def get_default_retryable_exceptions() -> Set[Type[Exception]]:
         return _default_retryable_exceptions
     # Lazy imports (these are expensive)
+    import aiohttp
     import httpx
     import litellm
     import requests
@@ -32,6 +33,9 @@ def get_default_retryable_exceptions() -> Set[Type[Exception]]:
         ConnectionError,  # type: ignore[assignment]
         TimeoutError,  # type: ignore[assignment]
         OSError,  # type: ignore[assignment]  # Covers network-related OS errors
+        # aiohttp library exceptions
+        aiohttp.ClientConnectionError,
+        aiohttp.ServerDisconnectedError,
         # Requests library exceptions
         requests.exceptions.ConnectionError,
         requests.exceptions.Timeout,

{eval_protocol-0.3.23 → eval_protocol-0.3.25}/eval_protocol/pytest/remote_rollout_processor.py RENAMED Viewed

@@ -104,6 +104,9 @@ class RemoteRolloutProcessor(RolloutProcessor):
             try:
                 session = self._get_or_create_session()
                 async with session.post(init_url, json=init_payload.model_dump(), timeout=timeout_init) as resp:
+                    if resp.status >= 500:
+                        body = await resp.text()
+                        raise ConnectionError(f"Remote /init returned server error (HTTP {resp.status}): {body}")
                     if resp.status >= 400:
                         body = await resp.text()
                         raise RuntimeError(f"Remote /init failed (HTTP {resp.status}): {body}")
@@ -215,8 +218,6 @@ class RemoteRolloutProcessor(RolloutProcessor):
                 loop = asyncio.get_running_loop()
                 loop.create_task(self._session.close())
             except RuntimeError:
-                # No running event loop - can't safely close the session.
-                # The session will be garbage collected eventually, but warn about it.
                 logger.warning(
                     "RemoteRolloutProcessor.cleanup() called outside of async context. "
                     "Session may not be properly closed. Use `await processor.acleanup()` when possible."

{eval_protocol-0.3.23 → eval_protocol-0.3.25}/eval_protocol/reward_function.py RENAMED Viewed

@@ -12,6 +12,7 @@ import requests
 from .models import EvaluateResult, MetricResult
 from .typed_interface import reward_function
+logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
 T = TypeVar("T", bound=Callable[..., EvaluateResult])

{eval_protocol-0.3.23 → eval_protocol-0.3.25/eval_protocol.egg-info}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: eval-protocol
-Version: 0.3.23
+Version: 0.3.25
 Summary: The official Python SDK for Eval Protocol (EP.) EP is an open protocol that standardizes how developers author evals for large language model (LLM) applications.
 Author-email: Fireworks AI <info@fireworks.ai>
 License-Expression: MIT
@@ -24,7 +24,7 @@ Requires-Dist: hydra-core>=1.3.2
 Requires-Dist: omegaconf>=2.3.0
 Requires-Dist: httpx>=0.24.0
 Requires-Dist: anthropic>=0.59.0
-Requires-Dist: litellm<1.82.0,>=1.81.0
+Requires-Dist: litellm<1.75.0
 Requires-Dist: pytest>=6.0.0
 Requires-Dist: pytest-asyncio>=0.21.0
 Requires-Dist: peewee>=3.18.2
@@ -111,14 +111,11 @@ Requires-Dist: langchain-core>=0.3.75; extra == "langgraph"
 Provides-Extra: langgraph-tools
 Requires-Dist: langgraph>=0.6.7; extra == "langgraph-tools"
 Requires-Dist: langchain>=0.3.0; extra == "langgraph-tools"
+Requires-Dist: langchain-fireworks>=0.3.0; extra == "langgraph-tools"
 Provides-Extra: proxy
 Requires-Dist: redis>=5.0.0; extra == "proxy"
 Requires-Dist: langfuse>=2.0.0; extra == "proxy"
 Requires-Dist: uuid6>=2025.0.0; extra == "proxy"
-Requires-Dist: litellm<1.82.0,>=1.81.0; extra == "proxy"
-Requires-Dist: opentelemetry-api>=1.29.0; extra == "proxy"
-Requires-Dist: opentelemetry-sdk>=1.29.0; extra == "proxy"
-Requires-Dist: opentelemetry-exporter-otlp>=1.29.0; extra == "proxy"
 Dynamic: license-file
 # Eval Protocol

{eval_protocol-0.3.23 → eval_protocol-0.3.25}/eval_protocol.egg-info/requires.txt RENAMED Viewed

@@ -12,7 +12,7 @@ hydra-core>=1.3.2
 omegaconf>=2.3.0
 httpx>=0.24.0
 anthropic>=0.59.0
-litellm<1.82.0,>=1.81.0
+litellm<1.75.0
 pytest>=6.0.0
 pytest-asyncio>=0.21.0
 peewee>=3.18.2
@@ -93,6 +93,7 @@ langchain-core>=0.3.75
 [langgraph_tools]
 langgraph>=0.6.7
 langchain>=0.3.0
+langchain-fireworks>=0.3.0
 [langsmith]
 langsmith>=0.1.86
@@ -107,10 +108,6 @@ openevals>=0.1.0
 redis>=5.0.0
 langfuse>=2.0.0
 uuid6>=2025.0.0
-litellm<1.82.0,>=1.81.0
-opentelemetry-api>=1.29.0
-opentelemetry-sdk>=1.29.0
-opentelemetry-exporter-otlp>=1.29.0
 [pydantic]
 pydantic-ai>=1.0.2

{eval_protocol-0.3.23 → eval_protocol-0.3.25}/pyproject.toml RENAMED Viewed

@@ -31,7 +31,7 @@ dependencies = [
     "omegaconf>=2.3.0",
     "httpx>=0.24.0",
     "anthropic>=0.59.0",
-    "litellm>=1.81.0,<1.82.0",
+    "litellm<1.75.0",
     "pytest>=6.0.0",
     "pytest-asyncio>=0.21.0",
     "peewee>=3.18.2",
@@ -146,17 +146,13 @@ langgraph = [
 langgraph_tools = [
     "langgraph>=0.6.7",
     "langchain>=0.3.0",
-    # langchain-fireworks removed: incompatible with fireworks-ai>=1.0.0
+    "langchain-fireworks>=0.3.0",
 ]
 proxy = [
     "redis>=5.0.0",
     "langfuse>=2.0.0",
     "uuid6>=2025.0.0",
-    "litellm>=1.81.0,<1.82.0",
-    "opentelemetry-api>=1.29.0",
-    "opentelemetry-sdk>=1.29.0",
-    "opentelemetry-exporter-otlp>=1.29.0",
 ]
 [project.scripts]

eval-protocol 0.3.23__tar.gz → 0.3.25__tar.gz

eval-protocol 0.3.23.tar.gz → 0.3.25.tar.gz