vllm-judge 0.1.4__py3-none-any.whl → 0.1.6__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
vllm_judge/__init__.py CHANGED
@@ -5,7 +5,7 @@ A lightweight library for evaluating text responses using self-hosted language m
 via vLLM's OpenAI-compatible API.
 """
 
-__version__ = "0.1.4"
+__version__ = "0.1.6"
 
 from vllm_judge.judge import Judge
 from vllm_judge.models import (
@@ -17,17 +17,18 @@ from vllm_judge.models import (
     ModelSpecificMetric
 )
 from vllm_judge.templating import TemplateProcessor
-from vllm_judge.metrics import (
+from vllm_judge.builtin_metrics import (
     # General metrics
     HELPFULNESS,
     ACCURACY,
     CLARITY,
     CONCISENESS,
     RELEVANCE,
-
+    COHERENCE,
     # Safety metrics
     SAFETY,
     TOXICITY,
+    BIAS_DETECTION,
     LLAMA_GUARD_3_SAFETY,
 
     # Code metrics
@@ -61,6 +62,12 @@ from vllm_judge.metrics import (
     PRODUCT_REVIEW_TEMPLATE,
     MEDICAL_INFO_TEMPLATE,
     API_DOCS_TEMPLATE,
+    RAG_EVALUATION_TEMPLATE,
+    AGENT_PERFORMANCE_TEMPLATE,
+
+    # NLP metrics
+    TRANSLATION_QUALITY,
+    SUMMARIZATION_QUALITY,
 
 )
 from vllm_judge.exceptions import (
@@ -91,8 +98,10 @@ __all__ = [
     "CLARITY",
     "CONCISENESS",
     "RELEVANCE",
+    "COHERENCE",
     "SAFETY",
     "TOXICITY",
+    "BIAS_DETECTION",
     "LLAMA_GUARD_3_SAFETY",
     "CODE_QUALITY",
     "CODE_SECURITY",
@@ -112,6 +121,11 @@ __all__ = [
     "PRODUCT_REVIEW_TEMPLATE",
     "MEDICAL_INFO_TEMPLATE",
     "API_DOCS_TEMPLATE",
+    "RAG_EVALUATION_TEMPLATE",
+    "AGENT_PERFORMANCE_TEMPLATE",
+    "TRANSLATION_QUALITY",
+    "SUMMARIZATION_QUALITY",
+
     # Exceptions
     "VLLMJudgeError",
     "ConfigurationError",
vllm_judge/api/__init__.py CHANGED
@@ -1,6 +1,3 @@
-"""
-API module for vLLM Judge.
-"""
 from vllm_judge.api.server import app, create_app, start_server
 from vllm_judge.api.client import JudgeClient
 from vllm_judge.api.models import (
vllm_judge/api/client.py CHANGED
@@ -1,6 +1,3 @@
-"""
-HTTP client for vLLM Judge API.
-"""
 import asyncio
 from typing import Union, Dict, List, Optional, Tuple, Any, AsyncIterator
 import httpx
vllm_judge/api/server.py CHANGED
@@ -1,7 +1,3 @@
-"""
-FastAPI server for vLLM Judge API.
-"""
-import asyncio
 import time
 import uuid
 from datetime import datetime
@@ -14,7 +10,7 @@ import uvicorn
 
 from vllm_judge.judge import Judge
 from vllm_judge.models import EvaluationResult, JudgeConfig
-from vllm_judge.metrics import BUILTIN_METRICS
+from vllm_judge.builtin_metrics import BUILTIN_METRICS
 from vllm_judge.exceptions import VLLMJudgeError
 from vllm_judge.api.models import (
     EvaluateRequest,
vllm_judge/batch.py CHANGED
@@ -17,7 +17,8 @@ class BatchProcessor:
             max_concurrent: Maximum concurrent requests
         """
         self.judge = judge
-        self.semaphore = asyncio.Semaphore(max_concurrent)
+        self.max_concurrent = max_concurrent
+        self.semaphore = asyncio.Semaphore(self.max_concurrent)
         self.progress_lock = asyncio.Lock()
         self.completed = 0
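
The batch.py change is behavior-preserving: 0.1.6 stores max_concurrent on the instance before building the semaphore from it, so the configured limit stays inspectable after construction. For context, here is a minimal self-contained sketch of the semaphore-bounded concurrency pattern BatchProcessor uses; the class and method names are hypothetical stand-ins for illustration, not the library's actual API:

    import asyncio

    class BoundedRunner:
        def __init__(self, max_concurrent: int = 10):
            # As in 0.1.6, keep the limit as an attribute, then size the
            # semaphore from it.
            self.max_concurrent = max_concurrent
            self.semaphore = asyncio.Semaphore(self.max_concurrent)
            self.progress_lock = asyncio.Lock()
            self.completed = 0

        async def process_one(self, item: str) -> str:
            async with self.semaphore:        # at most max_concurrent in flight
                await asyncio.sleep(0.01)     # stand-in for one judge request
            async with self.progress_lock:    # serialize progress updates
                self.completed += 1
            return item.upper()

    async def main() -> None:
        runner = BoundedRunner(max_concurrent=4)
        items = ["a", "b", "c"]
        results = await asyncio.gather(*(runner.process_one(i) for i in items))
        print(results, runner.completed)      # ['A', 'B', 'C'] 3

    asyncio.run(main())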