PyPI - deepeval - Versions diffs - 3.7.8__py3-none-any.whl → 3.8.0__py3-none-any.whl - Mend

deepeval 3.7.8__py3-none-any.whl → 3.8.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (31) hide show

deepeval/_version.py +1 -1
deepeval/benchmarks/drop/drop.py +5 -2
deepeval/benchmarks/mmlu/mmlu.py +6 -4
deepeval/cli/main.py +168 -0
deepeval/cli/utils.py +2 -2
deepeval/confident/api.py +2 -0
deepeval/config/settings.py +10 -0
deepeval/constants.py +1 -0
deepeval/integrations/langchain/callback.py +330 -158
deepeval/integrations/langchain/utils.py +31 -8
deepeval/key_handler.py +8 -1
deepeval/metrics/conversational_g_eval/conversational_g_eval.py +35 -0
deepeval/metrics/g_eval/g_eval.py +35 -1
deepeval/metrics/g_eval/utils.py +65 -0
deepeval/models/__init__.py +2 -0
deepeval/models/llms/__init__.py +2 -0
deepeval/models/llms/constants.py +23 -0
deepeval/models/llms/gemini_model.py +27 -29
deepeval/models/llms/openai_model.py +5 -4
deepeval/models/llms/openrouter_model.py +398 -0
deepeval/models/retry_policy.py +3 -0
deepeval/prompt/api.py +1 -0
deepeval/synthesizer/synthesizer.py +190 -82
deepeval/tracing/tracing.py +6 -1
deepeval/tracing/types.py +1 -1
deepeval/utils.py +21 -6
{deepeval-3.7.8.dist-info → deepeval-3.8.0.dist-info}/METADATA +7 -7
{deepeval-3.7.8.dist-info → deepeval-3.8.0.dist-info}/RECORD +31 -30
{deepeval-3.7.8.dist-info → deepeval-3.8.0.dist-info}/LICENSE.md +0 -0
{deepeval-3.7.8.dist-info → deepeval-3.8.0.dist-info}/WHEEL +0 -0
{deepeval-3.7.8.dist-info → deepeval-3.8.0.dist-info}/entry_points.txt +0 -0

deepeval/_version.py CHANGED Viewed

	@@ -1 +1 @@
1	- __version__: str = "3.7.8"
1	+ __version__: str = "3.8.0"

deepeval/benchmarks/drop/drop.py CHANGED Viewed

@@ -279,8 +279,11 @@ class DROP(DeepEvalBaseBenchmark):
             prediction = predictions[i]
             golden = goldens[i]
             # Define Metric
-            score = self.scorer.quasi_exact_match_score(
-                golden.expected_output, prediction
+            expected_output = DROPTemplate.parse_str_to_list(
+                golden.expected_output, DELIMITER
+            )
+            score = self.scorer.quasi_contains_score(
+                expected_output, prediction
             )
             res.append({"prediction": prediction, "score": score})

deepeval/benchmarks/mmlu/mmlu.py CHANGED Viewed

@@ -224,10 +224,12 @@ class MMLU(DeepEvalBaseBenchmark):
             responses: List[MultipleChoiceSchema] = model.batch_generate(
                 prompts=prompts, schemas=[MultipleChoiceSchema for i in prompts]
             )
-            if isinstance(responses, (tuple, list)):
-                predictions = [res[0].answer for res in responses]
-            else:
-                predictions = [res.answer for res in responses]
+            if not isinstance(responses, list):
+                raise TypeError(
+                    "batch_generate must return List[MultipleChoiceSchema]"
+                )
+            predictions = [res.answer for res in responses]
         except TypeError:
             prompts = [
                 prompt

deepeval/cli/main.py CHANGED Viewed

@@ -2937,5 +2937,173 @@ def unset_portkey_model_env(
             )
+#############################################
+# OpenRouter Integration ####################
+#############################################
+@app.command(name="set-openrouter")
+def set_openrouter_model_env(
+    model: Optional[str] = typer.Option(
+        None,
+        "-m",
+        "--model",
+        help="Model identifier to use for this provider (e.g., `openai/gpt-4.1`).",
+    ),
+    prompt_api_key: bool = typer.Option(
+        False,
+        "-k",
+        "--prompt-api-key",
+        help=(
+            "Prompt for OPENROUTER_API_KEY (input hidden). Not suitable for CI. "
+            "If --save (or DEEPEVAL_DEFAULT_SAVE) is used, the key is written to dotenv in plaintext."
+        ),
+    ),
+    base_url: Optional[str] = typer.Option(
+        None,
+        "-u",
+        "--base-url",
+        help="Override the API endpoint/base URL used by this provider (default: https://openrouter.ai/api/v1).",
+    ),
+    temperature: Optional[float] = typer.Option(
+        None,
+        "-t",
+        "--temperature",
+        help="Override the global TEMPERATURE used by LLM providers (e.g., 0.0 for deterministic behavior).",
+    ),
+    cost_per_input_token: Optional[float] = typer.Option(
+        None,
+        "-i",
+        "--cost-per-input-token",
+        help=(
+            "USD per input token used for cost tracking. "
+            "If unset and OpenRouter does not return pricing metadata, "
+            "costs will not be calculated."
+        ),
+    ),
+    cost_per_output_token: Optional[float] = typer.Option(
+        None,
+        "-o",
+        "--cost-per-output-token",
+        help=(
+            "USD per output token used for cost tracking. "
+            "If unset and OpenRouter does not return pricing metadata, "
+            "costs will not be calculated."
+        ),
+    ),
+    save: Optional[str] = typer.Option(
+        None,
+        "-s",
+        "--save",
+        help="Persist CLI parameters as environment variables in a dotenv file. "
+        "Usage: --save=dotenv[:path] (default: .env.local)",
+    ),
+    quiet: bool = typer.Option(
+        False,
+        "-q",
+        "--quiet",
+        help="Suppress printing to the terminal (useful for CI).",
+    ),
+):
+    api_key = None
+    if prompt_api_key:
+        api_key = coerce_blank_to_none(
+            typer.prompt("OpenRouter API key", hide_input=True)
+        )
+    model = coerce_blank_to_none(model)
+    base_url = coerce_blank_to_none(base_url)
+    settings = get_settings()
+    with settings.edit(save=save) as edit_ctx:
+        edit_ctx.switch_model_provider(ModelKeyValues.USE_OPENROUTER_MODEL)
+        if model is not None:
+            settings.OPENROUTER_MODEL_NAME = model
+        if api_key is not None:
+            settings.OPENROUTER_API_KEY = api_key
+        if base_url is not None:
+            settings.OPENROUTER_BASE_URL = base_url
+        if temperature is not None:
+            settings.TEMPERATURE = temperature
+        if cost_per_input_token is not None:
+            settings.OPENROUTER_COST_PER_INPUT_TOKEN = cost_per_input_token
+        if cost_per_output_token is not None:
+            settings.OPENROUTER_COST_PER_OUTPUT_TOKEN = cost_per_output_token
+    handled, path, updates = edit_ctx.result
+    effective_model = settings.OPENROUTER_MODEL_NAME
+    if not effective_model:
+        raise typer.BadParameter(
+            "OpenRouter model name is not set. Pass --model (or set OPENROUTER_MODEL_NAME).",
+            param_hint="--model",
+        )
+    _handle_save_result(
+        handled=handled,
+        path=path,
+        updates=updates,
+        save=save,
+        quiet=quiet,
+        success_msg=(
+            f":raising_hands: Congratulations! You're now using OpenRouter `{escape(effective_model)}` for all evals that require an LLM."
+        ),
+    )
+@app.command(name="unset-openrouter")
+def unset_openrouter_model_env(
+    save: Optional[str] = typer.Option(
+        None,
+        "-s",
+        "--save",
+        help="Remove only the OpenRouter model related environment variables from a dotenv file. "
+        "Usage: --save=dotenv[:path] (default: .env.local)",
+    ),
+    clear_secrets: bool = typer.Option(
+        False,
+        "-x",
+        "--clear-secrets",
+        help="Also remove OPENROUTER_API_KEY from the dotenv store.",
+    ),
+    quiet: bool = typer.Option(
+        False,
+        "-q",
+        "--quiet",
+        help="Suppress printing to the terminal (useful for CI).",
+    ),
+):
+    settings = get_settings()
+    with settings.edit(save=save) as edit_ctx:
+        settings.USE_OPENROUTER_MODEL = None
+        settings.OPENROUTER_MODEL_NAME = None
+        settings.OPENROUTER_BASE_URL = None
+        settings.OPENROUTER_COST_PER_INPUT_TOKEN = None
+        settings.OPENROUTER_COST_PER_OUTPUT_TOKEN = None
+        # Intentionally do NOT touch TEMPERATURE here; it's a global dial.
+        if clear_secrets:
+            settings.OPENROUTER_API_KEY = None
+    handled, path, updates = edit_ctx.result
+    if _handle_save_result(
+        handled=handled,
+        path=path,
+        updates=updates,
+        save=save,
+        quiet=quiet,
+        updated_msg="Removed OpenRouter model environment variables from {path}.",
+        tip_msg=None,
+    ):
+        if is_openai_configured():
+            print(
+                ":raised_hands: OpenAI will still be used by default because OPENAI_API_KEY is set."
+            )
+        else:
+            print(
+                "The OpenRouter model configuration has been removed. No model is currently configured, but you can set one with the CLI or add credentials to .env[.local]."
+            )
 if __name__ == "__main__":
     app()

deepeval/cli/utils.py CHANGED Viewed

@@ -52,10 +52,10 @@ USE_EMBED_KEYS = [
 def render_login_message():
     print(
-        "🥳 Welcome to [rgb(106,0,255)]Confident AI[/rgb(106,0,255)], the DeepEval cloud platform 🏡❤️"
+        "🥳 Welcome to [rgb(106,0,255)]Confident AI[/rgb(106,0,255)], the evals cloud platform 🏡❤️"
     )
     print("")
-    print(pyfiglet.Figlet(font="big_money-ne").renderText("DeepEval Cloud"))
+    print(pyfiglet.Figlet(font="big_money-ne").renderText("Confident AI"))
 def upload_and_open_link(_span: Span):

deepeval/confident/api.py CHANGED Viewed

@@ -106,6 +106,8 @@ class Endpoints(Enum):
     EVALUATE_TRACE_ENDPOINT = "/v1/evaluate/traces/:traceUuid"
     EVALUATE_SPAN_ENDPOINT = "/v1/evaluate/spans/:spanUuid"
+    METRICS_ENDPOINT = "/v1/metrics"
 class Api:
     def __init__(self, api_key: Optional[str] = None):

deepeval/config/settings.py CHANGED Viewed

@@ -627,6 +627,16 @@ class Settings(BaseSettings):
     PORTKEY_PROVIDER_NAME: Optional[str] = Field(
         None, description="Provider name/routing hint for Portkey."
     )
+    # OpenRouter
+    USE_OPENROUTER_MODEL: Optional[bool] = None
+    OPENROUTER_API_KEY: Optional[SecretStr] = None
+    OPENROUTER_MODEL_NAME: Optional[str] = None
+    OPENROUTER_COST_PER_INPUT_TOKEN: Optional[float] = None
+    OPENROUTER_COST_PER_OUTPUT_TOKEN: Optional[float] = None
+    OPENROUTER_BASE_URL: Optional[AnyUrl] = Field(
+        None, description="OpenRouter base URL (if using a custom endpoint)."
+    )
     # Vertex AI
     VERTEX_AI_MODEL_NAME: Optional[str] = Field(
         None,

deepeval/constants.py CHANGED Viewed

@@ -35,6 +35,7 @@ class ProviderSlug(str, Enum):
     LITELLM = "litellm"
     LOCAL = "local"
     OLLAMA = "ollama"
+    OPENROUTER = "openrouter"
 def slugify(value: Union[str, ProviderSlug]) -> str:

deepeval 3.7.8__py3-none-any.whl → 3.8.0__py3-none-any.whl

deepeval 3.7.8__py3-none-any.whl → 3.8.0__py3-none-any.whl