PyPI - eval-protocol - Versions diffs - 0.3.22__tar.gz → 0.3.24__tar.gz - Mend

eval-protocol 0.3.22__tar.gz → 0.3.24__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (474) hide show

{eval_protocol-0.3.22/eval_protocol.egg-info → eval_protocol-0.3.24}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: eval-protocol
-Version: 0.3.22
+Version: 0.3.24
 Summary: The official Python SDK for Eval Protocol (EP.) EP is an open protocol that standardizes how developers author evals for large language model (LLM) applications.
 Author-email: Fireworks AI <info@fireworks.ai>
 License-Expression: MIT
@@ -24,12 +24,12 @@ Requires-Dist: hydra-core>=1.3.2
 Requires-Dist: omegaconf>=2.3.0
 Requires-Dist: httpx>=0.24.0
 Requires-Dist: anthropic>=0.59.0
-Requires-Dist: litellm<1.82.0,>=1.81.0
+Requires-Dist: litellm<1.75.0
 Requires-Dist: pytest>=6.0.0
 Requires-Dist: pytest-asyncio>=0.21.0
 Requires-Dist: peewee>=3.18.2
 Requires-Dist: backoff>=2.2.0
-Requires-Dist: fireworks-ai==1.0.0a20
+Requires-Dist: fireworks-ai<2,>=1.0.0a20
 Requires-Dist: questionary>=2.0.0
 Requires-Dist: toml>=0.10.0
 Requires-Dist: loguru>=0.6.0
@@ -111,14 +111,11 @@ Requires-Dist: langchain-core>=0.3.75; extra == "langgraph"
 Provides-Extra: langgraph-tools
 Requires-Dist: langgraph>=0.6.7; extra == "langgraph-tools"
 Requires-Dist: langchain>=0.3.0; extra == "langgraph-tools"
+Requires-Dist: langchain-fireworks>=0.3.0; extra == "langgraph-tools"
 Provides-Extra: proxy
 Requires-Dist: redis>=5.0.0; extra == "proxy"
 Requires-Dist: langfuse>=2.0.0; extra == "proxy"
 Requires-Dist: uuid6>=2025.0.0; extra == "proxy"
-Requires-Dist: litellm<1.82.0,>=1.81.0; extra == "proxy"
-Requires-Dist: opentelemetry-api>=1.29.0; extra == "proxy"
-Requires-Dist: opentelemetry-sdk>=1.29.0; extra == "proxy"
-Requires-Dist: opentelemetry-exporter-otlp>=1.29.0; extra == "proxy"
 Dynamic: license-file
 # Eval Protocol

{eval_protocol-0.3.22 → eval_protocol-0.3.24}/eval_protocol/_version.py RENAMED Viewed

@@ -8,11 +8,11 @@ import json
 version_json = '''
 {
- "date": "2026-03-06T17:12:43-0800",
+ "date": "2026-03-10T03:58:26-0700",
  "dirty": false,
  "error": null,
- "full-revisionid": "9f0f5e4d564aa8bdbf2868848f91bb7e325183d4",
- "version": "0.3.22"
+ "full-revisionid": "0f3c47172cc248d6a9ebbec809ee870f59b03698",
+ "version": "0.3.24"
 }
 '''  # END VERSION_JSON

{eval_protocol-0.3.22 → eval_protocol-0.3.24}/eval_protocol/adapters/fireworks_tracing.py RENAMED Viewed

@@ -8,10 +8,8 @@ from __future__ import annotations
 import logging
 import requests
 from datetime import datetime
-import ast
-import json
-import os
 from typing import Any, Dict, List, Optional, Protocol
+import os
 from eval_protocol.models import EvaluationRow, InputMetadata, ExecutionMetadata, Message
 from .base import BaseAdapter
@@ -46,43 +44,6 @@ class TraceDictConverter(Protocol):
         ...
-def extract_otel_attributes(observations: List[Dict[str, Any]]) -> Optional[Dict[str, Any]]:
-    """Attempt to extract and parse attributes from raw_gen_ai_request observation. This only works when stored in OTEL format.
-    Args:
-        observations: List of observation dictionaries from the trace
-    Returns:
-        Dict with all attributes parsed. Or None if not found.
-    """
-    for obs in observations:
-        if obs.get("name") == "raw_gen_ai_request" and obs.get("type") == "SPAN":
-            metadata = obs.get("metadata") or {}
-            attributes = metadata.get("attributes") or {}
-            result: Dict[str, Any] = {}
-            for key, value in attributes.items():
-                # Try to parse stringified objects (could be Python repr or JSON)
-                if isinstance(value, str) and value.startswith(("[", "{")):
-                    try:
-                        result[key] = ast.literal_eval(value)
-                    except Exception as e:
-                        logger.debug("Failed to parse %s with ast.literal_eval: %s", key, e)
-                        try:
-                            result[key] = json.loads(value)
-                        except Exception as e:
-                            logger.debug("Failed to parse %s with json.loads: %s", key, e)
-                            result[key] = value
-                else:
-                    result[key] = value
-            if result:
-                return result
-    return None
 def convert_trace_dict_to_evaluation_row(
     trace: Dict[str, Any], include_tool_calls: bool = True, span_name: Optional[str] = None
 ) -> Optional[EvaluationRow]:
@@ -135,19 +96,6 @@ def convert_trace_dict_to_evaluation_row(
                 ):
                     break  # Break early if we've found all the metadata we need
-        observations = trace.get("observations") or []
-        # We can only extract when stored in OTEL format.
-        otel_attributes = extract_otel_attributes(observations)
-        if otel_attributes:
-            # Find choices from any provider (llm.*.choices pattern)
-            choices = None
-            for key, value in otel_attributes.items():
-                if key.endswith(".choices") and isinstance(value, list):
-                    choices = value
-                    break
-            if choices and len(choices) > 0:
-                execution_metadata.finish_reason = choices[0].get("finish_reason")
         return EvaluationRow(
             messages=messages,
             tools=tools,
@@ -212,7 +160,7 @@ def extract_messages_from_trace_dict(
         # Fallback: use the last GENERATION observation which typically contains full chat history
         if not messages:
             try:
-                all_observations = trace.get("observations") or []
+                all_observations = trace.get("observations", [])
                 gens = [obs for obs in all_observations if obs.get("type") == "GENERATION"]
                 if gens:
                     gens.sort(key=lambda x: x.get("start_time", ""))
@@ -238,7 +186,7 @@ def get_final_generation_in_span_dict(trace: Dict[str, Any], span_name: str) ->
         The final generation dictionary, or None if not found
     """
     # Get all observations from the trace
-    all_observations = trace.get("observations") or []
+    all_observations = trace.get("observations", [])
     # Find a span with the given name that has generation children
     parent_span = None

{eval_protocol-0.3.22 → eval_protocol-0.3.24}/eval_protocol/proxy/proxy_core/app.py RENAMED Viewed

@@ -15,7 +15,7 @@ from contextlib import asynccontextmanager
 from .models import ProxyConfig, LangfuseTracesResponse, TracesParams, ChatParams, ChatRequestHook, TracesRequestHook
 from .auth import AuthProvider, NoAuthProvider
-from .litellm import handle_chat_completion
+from .litellm import handle_chat_completion, proxy_to_litellm
 from .langfuse import fetch_langfuse_traces, pointwise_fetch_langfuse_trace
 # Configure logging before any other imports (so all modules inherit this config)
@@ -35,6 +35,10 @@ def build_proxy_config(
     preprocess_traces_request: Optional[TracesRequestHook] = None,
 ) -> ProxyConfig:
     """Load environment and secrets, and build ProxyConfig"""
+    # Env
+    litellm_url = os.getenv("LITELLM_URL")
+    if not litellm_url:
+        raise ValueError("LITELLM_URL environment variable must be set")
     request_timeout = float(os.getenv("REQUEST_TIMEOUT", "300.0"))
     langfuse_host = os.getenv("LANGFUSE_HOST", "https://cloud.langfuse.com")
@@ -62,6 +66,7 @@ def build_proxy_config(
         raise ValueError(f"Invalid format in secrets file {secrets_path.name}: {e}")
     return ProxyConfig(
+        litellm_url=litellm_url,
         request_timeout=request_timeout,
         langfuse_host=langfuse_host,
         langfuse_keys=langfuse_keys,
@@ -108,16 +113,6 @@ def create_app(
         app.state.config = build_proxy_config(preprocess_chat_request, preprocess_traces_request)
         app.state.redis = init_redis()
-        config = app.state.config
-        default_keys = config.langfuse_keys[config.default_project_id]
-        os.environ["LANGFUSE_PUBLIC_KEY"] = default_keys["public_key"]
-        os.environ["LANGFUSE_SECRET_KEY"] = default_keys["secret_key"]
-        os.environ.setdefault("LANGFUSE_HOST", config.langfuse_host)
-        import litellm
-        litellm.callbacks = ["langfuse_otel"]
         try:
             yield
         finally:
@@ -302,4 +297,13 @@ def create_app(
     async def health():
         return {"status": "healthy", "service": "metadata-proxy"}
+    # Catch-all
+    @app.api_route("/{path:path}", methods=["GET", "POST", "PUT", "DELETE", "PATCH"])
+    async def catch_all_proxy(
+        path: str,
+        request: Request,
+        config: ProxyConfig = Depends(get_config),
+    ):
+        return await proxy_to_litellm(config, path, request)
     return app

{eval_protocol-0.3.22 → eval_protocol-0.3.24}/eval_protocol/proxy/proxy_core/langfuse.py RENAMED Viewed

@@ -50,7 +50,6 @@ def _serialize_trace_to_dict(trace_full: Any) -> Dict[str, Any]:
                 "input": getattr(obs, "input", None),
                 "output": getattr(obs, "output", None),
                 "parent_observation_id": getattr(obs, "parent_observation_id", None),
-                "metadata": getattr(obs, "metadata", None),
             }
             for obs in getattr(trace_full, "observations", [])
         ]

eval_protocol-0.3.24/eval_protocol/proxy/proxy_core/litellm.py ADDED Viewed

@@ -0,0 +1,173 @@
+"""
+LiteLLM client - handles all communication with LiteLLM service.
+"""
+import json
+import base64
+import httpx
+import logging
+from uuid6 import uuid7
+from fastapi import Request, Response, HTTPException
+import redis
+from .redis_utils import register_insertion_id
+from .models import ProxyConfig, ChatParams
+logger = logging.getLogger(__name__)
+async def handle_chat_completion(
+    config: ProxyConfig,
+    redis_client: redis.Redis,
+    request: Request,
+    params: ChatParams,
+) -> Response:
+    """
+    Handle chat completion requests and forward to LiteLLM.
+    If metadata IDs (rollout_id, etc.) are provided, they'll be added as tags
+    and the assistant message count will be tracked in Redis.
+    If encoded_base_url is provided, it will be decoded and added to the request.
+    """
+    body = await request.body()
+    data = json.loads(body) if body else {}
+    if config.preprocess_chat_request:
+        data, params = config.preprocess_chat_request(data, request, params)
+    project_id = params.project_id
+    rollout_id = params.rollout_id
+    invocation_id = params.invocation_id
+    experiment_id = params.experiment_id
+    run_id = params.run_id
+    row_id = params.row_id
+    encoded_base_url = params.encoded_base_url
+    # Use default project if not specified
+    if project_id is None:
+        project_id = config.default_project_id
+    # Decode and add base_url if provided
+    if encoded_base_url:
+        try:
+            # Decode from URL-safe base64
+            decoded_bytes = base64.urlsafe_b64decode(encoded_base_url)
+            base_url = decoded_bytes.decode("utf-8")
+            data["base_url"] = base_url
+            logger.debug(f"Decoded base_url: {base_url}")
+        except Exception as e:
+            logger.error(f"Failed to decode base_url: {e}")
+            raise HTTPException(status_code=400, detail=f"Invalid encoded_base_url: {str(e)}")
+    # Extract API key from Authorization header and inject into request body
+    auth_header = request.headers.get("authorization", "")
+    if auth_header.startswith("Bearer "):
+        api_key = auth_header.replace("Bearer ", "").strip()
+        # Only inject API key if model is a Fireworks model
+        model = data.get("model")
+        if model and isinstance(model, str) and model.startswith("fireworks_ai"):
+            data["api_key"] = api_key
+    # If metadata IDs are provided, add them as tags
+    insertion_id = None
+    if rollout_id is not None:
+        insertion_id = str(uuid7())
+        if "metadata" not in data:
+            data["metadata"] = {}
+        if "tags" not in data["metadata"]:
+            data["metadata"]["tags"] = []
+        # Add extracted IDs as tags
+        data["metadata"]["tags"].extend(
+            [
+                f"rollout_id:{rollout_id}",
+                f"insertion_id:{insertion_id}",
+                f"invocation_id:{invocation_id}",
+                f"experiment_id:{experiment_id}",
+                f"run_id:{run_id}",
+                f"row_id:{row_id}",
+            ]
+        )
+    # Add Langfuse configuration
+    data["langfuse_public_key"] = config.langfuse_keys[project_id]["public_key"]
+    data["langfuse_secret_key"] = config.langfuse_keys[project_id]["secret_key"]
+    data["langfuse_host"] = config.langfuse_host
+    # Forward to LiteLLM's standard /chat/completions endpoint
+    # Set longer timeout for LLM API calls (LLMs can be slow)
+    timeout = httpx.Timeout(config.request_timeout)
+    async with httpx.AsyncClient(timeout=timeout) as client:
+        # Copy headers from original request but exclude content-length (httpx will set it correctly)
+        headers = dict(request.headers)
+        headers.pop("host", None)
+        headers.pop("content-length", None)  # Let httpx calculate the correct length
+        headers["content-type"] = "application/json"
+        # Forward to LiteLLM
+        litellm_url = f"{config.litellm_url}/chat/completions"
+        response = await client.post(
+            litellm_url,
+            json=data,  # httpx will serialize and set correct Content-Length
+            headers=headers,
+        )
+        # Register insertion_id in Redis only on successful response
+        if response.status_code == 200 and insertion_id is not None and rollout_id is not None:
+            register_insertion_id(redis_client, rollout_id, insertion_id)
+        # Return the response
+        return Response(
+            content=response.content,
+            status_code=response.status_code,
+            headers=dict(response.headers),
+        )
+async def proxy_to_litellm(config: ProxyConfig, path: str, request: Request) -> Response:
+    """
+    Catch-all proxy: Forward any request to LiteLLM, extracting API key from Authorization header.
+    """
+    # Set longer timeout for LLM API calls (LLMs can be slow)
+    timeout = httpx.Timeout(config.request_timeout)
+    async with httpx.AsyncClient(timeout=timeout) as client:
+        # Copy headers
+        headers = dict(request.headers)
+        headers.pop("host", None)
+        headers.pop("content-length", None)
+        # Get body
+        body = await request.body()
+        # Pass through API key from Authorization header
+        if request.method in ["POST", "PUT", "PATCH"] and body:
+            try:
+                data = json.loads(body)
+                auth_header = request.headers.get("authorization", "")
+                if auth_header.startswith("Bearer "):
+                    api_key = auth_header.replace("Bearer ", "").strip()
+                    data["api_key"] = api_key
+                # Re-serialize
+                body = json.dumps(data).encode()
+            except json.JSONDecodeError:
+                pass
+        # Forward to LiteLLM
+        litellm_url = f"{config.litellm_url}/{path}"
+        response = await client.request(
+            method=request.method,
+            url=litellm_url,
+            headers=headers,
+            content=body,
+        )
+        return Response(
+            content=response.content,
+            status_code=response.status_code,
+            headers=dict(response.headers),
+        )

{eval_protocol-0.3.22 → eval_protocol-0.3.24}/eval_protocol/proxy/proxy_core/models.py RENAMED Viewed

@@ -53,6 +53,7 @@ class TracesParams(BaseModel):
 class ProxyConfig(BaseModel):
     """Configuration model for the LiteLLM Metadata Proxy"""
+    litellm_url: str
     request_timeout: float = 300.0
     langfuse_host: str
     langfuse_keys: Dict[str, Dict[str, str]]
@@ -72,7 +73,6 @@ class ObservationResponse(BaseModel):
     input: Optional[Any] = None
     output: Optional[Any] = None
     parent_observation_id: Optional[str] = None
-    metadata: Optional[Dict[str, Any]] = None
 class TraceResponse(BaseModel):

{eval_protocol-0.3.22 → eval_protocol-0.3.24}/eval_protocol/reward_function.py RENAMED Viewed

@@ -12,6 +12,7 @@ import requests
 from .models import EvaluateResult, MetricResult
 from .typed_interface import reward_function
+logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
 T = TypeVar("T", bound=Callable[..., EvaluateResult])

{eval_protocol-0.3.22 → eval_protocol-0.3.24/eval_protocol.egg-info}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: eval-protocol
-Version: 0.3.22
+Version: 0.3.24
 Summary: The official Python SDK for Eval Protocol (EP.) EP is an open protocol that standardizes how developers author evals for large language model (LLM) applications.
 Author-email: Fireworks AI <info@fireworks.ai>
 License-Expression: MIT
@@ -24,12 +24,12 @@ Requires-Dist: hydra-core>=1.3.2
 Requires-Dist: omegaconf>=2.3.0
 Requires-Dist: httpx>=0.24.0
 Requires-Dist: anthropic>=0.59.0
-Requires-Dist: litellm<1.82.0,>=1.81.0
+Requires-Dist: litellm<1.75.0
 Requires-Dist: pytest>=6.0.0
 Requires-Dist: pytest-asyncio>=0.21.0
 Requires-Dist: peewee>=3.18.2
 Requires-Dist: backoff>=2.2.0
-Requires-Dist: fireworks-ai==1.0.0a20
+Requires-Dist: fireworks-ai<2,>=1.0.0a20
 Requires-Dist: questionary>=2.0.0
 Requires-Dist: toml>=0.10.0
 Requires-Dist: loguru>=0.6.0
@@ -111,14 +111,11 @@ Requires-Dist: langchain-core>=0.3.75; extra == "langgraph"
 Provides-Extra: langgraph-tools
 Requires-Dist: langgraph>=0.6.7; extra == "langgraph-tools"
 Requires-Dist: langchain>=0.3.0; extra == "langgraph-tools"
+Requires-Dist: langchain-fireworks>=0.3.0; extra == "langgraph-tools"
 Provides-Extra: proxy
 Requires-Dist: redis>=5.0.0; extra == "proxy"
 Requires-Dist: langfuse>=2.0.0; extra == "proxy"
 Requires-Dist: uuid6>=2025.0.0; extra == "proxy"
-Requires-Dist: litellm<1.82.0,>=1.81.0; extra == "proxy"
-Requires-Dist: opentelemetry-api>=1.29.0; extra == "proxy"
-Requires-Dist: opentelemetry-sdk>=1.29.0; extra == "proxy"
-Requires-Dist: opentelemetry-exporter-otlp>=1.29.0; extra == "proxy"
 Dynamic: license-file
 # Eval Protocol

{eval_protocol-0.3.22 → eval_protocol-0.3.24}/eval_protocol.egg-info/requires.txt RENAMED Viewed

@@ -12,12 +12,12 @@ hydra-core>=1.3.2
 omegaconf>=2.3.0
 httpx>=0.24.0
 anthropic>=0.59.0
-litellm<1.82.0,>=1.81.0
+litellm<1.75.0
 pytest>=6.0.0
 pytest-asyncio>=0.21.0
 peewee>=3.18.2
 backoff>=2.2.0
-fireworks-ai==1.0.0a20
+fireworks-ai<2,>=1.0.0a20
 questionary>=2.0.0
 toml>=0.10.0
 loguru>=0.6.0
@@ -93,6 +93,7 @@ langchain-core>=0.3.75
 [langgraph_tools]
 langgraph>=0.6.7
 langchain>=0.3.0
+langchain-fireworks>=0.3.0
 [langsmith]
 langsmith>=0.1.86
@@ -107,10 +108,6 @@ openevals>=0.1.0
 redis>=5.0.0
 langfuse>=2.0.0
 uuid6>=2025.0.0
-litellm<1.82.0,>=1.81.0
-opentelemetry-api>=1.29.0
-opentelemetry-sdk>=1.29.0
-opentelemetry-exporter-otlp>=1.29.0
 [pydantic]
 pydantic-ai>=1.0.2

{eval_protocol-0.3.22 → eval_protocol-0.3.24}/pyproject.toml RENAMED Viewed

@@ -31,12 +31,12 @@ dependencies = [
     "omegaconf>=2.3.0",
     "httpx>=0.24.0",
     "anthropic>=0.59.0",
-    "litellm>=1.81.0,<1.82.0",
+    "litellm<1.75.0",
     "pytest>=6.0.0",
     "pytest-asyncio>=0.21.0",
     "peewee>=3.18.2",
     "backoff>=2.2.0",
-    "fireworks-ai==1.0.0a20",
+    "fireworks-ai>=1.0.0a20,<2",
     "questionary>=2.0.0",
     # Dependencies for vendored tau2 package
     "toml>=0.10.0",
@@ -146,17 +146,13 @@ langgraph = [
 langgraph_tools = [
     "langgraph>=0.6.7",
     "langchain>=0.3.0",
-    # langchain-fireworks removed: incompatible with fireworks-ai>=1.0.0
+    "langchain-fireworks>=0.3.0",
 ]
 proxy = [
     "redis>=5.0.0",
     "langfuse>=2.0.0",
     "uuid6>=2025.0.0",
-    "litellm>=1.81.0,<1.82.0",
-    "opentelemetry-api>=1.29.0",
-    "opentelemetry-sdk>=1.29.0",
-    "opentelemetry-exporter-otlp>=1.29.0",
 ]
 [project.scripts]

eval_protocol-0.3.22/eval_protocol/proxy/proxy_core/litellm.py DELETED Viewed

@@ -1,154 +0,0 @@
-"""
-LiteLLM client - handles all LLM calls directly via LiteLLM SDK with Langfuse OTEL integration.
-"""
-import json
-import base64
-import logging
-from uuid6 import uuid7
-from fastapi import Request, Response, HTTPException
-from fastapi.responses import StreamingResponse
-import redis
-import openai
-from litellm import acompletion
-from .redis_utils import register_insertion_id
-from .models import ProxyConfig, ChatParams
-logger = logging.getLogger(__name__)
-async def handle_chat_completion(
-    config: ProxyConfig,
-    redis_client: redis.Redis,
-    request: Request,
-    params: ChatParams,
-) -> Response:
-    """
-    Handle chat completion requests using LiteLLM SDK directly with Langfuse OTEL.
-    If metadata IDs (rollout_id, etc.) are provided, they'll be added as tags
-    and the assistant message count will be tracked in Redis.
-    If encoded_base_url is provided, it will be decoded and used as api_base.
-    """
-    body = await request.body()
-    data = json.loads(body) if body else {}
-    if config.preprocess_chat_request:
-        data, params = config.preprocess_chat_request(data, request, params)
-    project_id = params.project_id
-    rollout_id = params.rollout_id
-    invocation_id = params.invocation_id
-    experiment_id = params.experiment_id
-    run_id = params.run_id
-    row_id = params.row_id
-    encoded_base_url = params.encoded_base_url
-    # Use default project if not specified
-    if project_id is None:
-        project_id = config.default_project_id
-    # Decode and add base_url if provided
-    if encoded_base_url:
-        try:
-            decoded_bytes = base64.urlsafe_b64decode(encoded_base_url)
-            data["base_url"] = decoded_bytes.decode("utf-8")
-            logger.debug(f"Decoded base_url: {data['base_url']}")
-        except Exception as e:
-            logger.error(f"Failed to decode base_url: {e}")
-            raise HTTPException(status_code=400, detail=f"Invalid encoded_base_url: {str(e)}")
-    # Extract API key from Authorization header and add to data
-    auth_header = request.headers.get("authorization", "")
-    if auth_header.startswith("Bearer "):
-        data["api_key"] = auth_header.replace("Bearer ", "").strip()
-    # Build metadata with tags for Langfuse
-    insertion_id = None
-    metadata = data.pop("metadata", {}) or {}
-    tags = list(metadata.pop("tags", []) or [])
-    if rollout_id is not None:
-        insertion_id = str(uuid7())
-        tags.extend(
-            [
-                f"rollout_id:{rollout_id}",
-                f"insertion_id:{insertion_id}",
-                f"invocation_id:{invocation_id}",
-                f"experiment_id:{experiment_id}",
-                f"run_id:{run_id}",
-                f"row_id:{row_id}",
-            ]
-        )
-    # Build Langfuse metadata (tags + user if present)
-    # Convert user_id (from preprocess hook) to trace_user_id for Langfuse
-    user_id = metadata.pop("user_id", None) or data.get("user")
-    litellm_metadata = {"tags": tags, **metadata}
-    if user_id:
-        litellm_metadata["trace_user_id"] = user_id
-    langfuse_keys = config.langfuse_keys[project_id]
-    # Check if streaming is requested
-    is_streaming = data.get("stream", False)
-    # Pop fields that we pass explicitly to avoid duplicate kwarg errors
-    request_timeout = data.pop("timeout", None) or config.request_timeout
-    data.pop("langfuse_public_key", None)
-    data.pop("langfuse_secret_key", None)
-    try:
-        # Make the completion call - pass all params through
-        # Note: langfuse_host is set via LANGFUSE_HOST env var at startup; OTEL doesn't support per-request host override
-        response = await acompletion(
-            **data,
-            metadata=litellm_metadata,
-            timeout=request_timeout,
-            langfuse_public_key=langfuse_keys["public_key"],
-            langfuse_secret_key=langfuse_keys["secret_key"],
-        )
-        if is_streaming:
-            # For streaming, return a StreamingResponse with SSE format
-            # Register insertion_id only after stream completes successfully
-            async def stream_generator():
-                async for chunk in response:  # type: ignore[union-attr]
-                    yield f"data: {chunk.model_dump_json()}\n\n"
-                yield "data: [DONE]\n\n"
-                # Stream completed successfully - now register
-                if insertion_id is not None and rollout_id is not None:
-                    register_insertion_id(redis_client, rollout_id, insertion_id)
-            return StreamingResponse(
-                stream_generator(),
-                media_type="text/event-stream",
-                headers={
-                    "Cache-Control": "no-cache",
-                    "Connection": "keep-alive",
-                },
-            )
-        else:
-            # Non-streaming: register insertion_id on success
-            if insertion_id is not None and rollout_id is not None:
-                register_insertion_id(redis_client, rollout_id, insertion_id)
-            return Response(
-                content=response.model_dump_json(),
-                status_code=200,
-                media_type="application/json",
-            )
-    except HTTPException:
-        raise
-    except openai.APIError as e:
-        # Convert to HTTPException and let FastAPI handle it
-        raise HTTPException(
-            status_code=getattr(e, "status_code", 500),
-            detail=str(e),
-        )
-    except Exception as e:
-        logger.error(f"Unexpected error: {e}", exc_info=True)
-        raise HTTPException(status_code=500, detail=str(e))

{eval_protocol-0.3.22 → eval_protocol-0.3.24}/LICENSE RENAMED Viewed

File without changes

{eval_protocol-0.3.22 → eval_protocol-0.3.24}/README.md RENAMED Viewed

File without changes

{eval_protocol-0.3.22 → eval_protocol-0.3.24}/development/__init__.py RENAMED Viewed

File without changes

eval-protocol 0.3.22__tar.gz → 0.3.24__tar.gz

eval-protocol 0.3.22__tar.gz → 0.3.24__tar.gz