judgeval 0.12.0__py3-none-any.whl → 0.13.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- judgeval/__init__.py +2 -2
- judgeval/api/api_types.py +81 -12
- judgeval/cli.py +2 -1
- judgeval/constants.py +0 -6
- judgeval/data/evaluation_run.py +2 -5
- judgeval/data/judgment_types.py +97 -12
- judgeval/data/trace.py +108 -1
- judgeval/dataset/__init__.py +72 -23
- judgeval/env.py +5 -20
- judgeval/integrations/langgraph/__init__.py +9 -785
- judgeval/scorers/api_scorer.py +7 -12
- judgeval/scorers/judgeval_scorers/api_scorers/answer_correctness.py +0 -8
- judgeval/scorers/judgeval_scorers/api_scorers/faithfulness.py +0 -8
- judgeval/scorers/judgeval_scorers/api_scorers/instruction_adherence.py +0 -12
- judgeval/scorers/judgeval_scorers/api_scorers/prompt_scorer.py +22 -33
- judgeval/scorers/score.py +1 -1
- judgeval/scorers/utils.py +1 -4
- judgeval/tracer/__init__.py +175 -156
- judgeval/tracer/exporters/__init__.py +4 -1
- judgeval/tracer/keys.py +15 -25
- judgeval/tracer/llm/__init__.py +0 -1
- judgeval/tracer/llm/anthropic/__init__.py +20 -0
- judgeval/tracer/llm/google/__init__.py +21 -0
- judgeval/tracer/llm/groq/__init__.py +20 -0
- judgeval/tracer/llm/openai/__init__.py +32 -0
- judgeval/tracer/llm/providers.py +28 -79
- judgeval/tracer/llm/together/__init__.py +20 -0
- judgeval/tracer/managers.py +23 -48
- judgeval/tracer/processors/__init__.py +36 -75
- judgeval/tracer/utils.py +1 -2
- judgeval/utils/file_utils.py +0 -2
- judgeval/utils/meta.py +18 -5
- judgeval/utils/testing.py +0 -14
- judgeval/utils/version_check.py +2 -0
- judgeval/version.py +1 -1
- {judgeval-0.12.0.dist-info → judgeval-0.13.0.dist-info}/METADATA +1 -7
- {judgeval-0.12.0.dist-info → judgeval-0.13.0.dist-info}/RECORD +40 -35
- {judgeval-0.12.0.dist-info → judgeval-0.13.0.dist-info}/WHEEL +0 -0
- {judgeval-0.12.0.dist-info → judgeval-0.13.0.dist-info}/entry_points.txt +0 -0
- {judgeval-0.12.0.dist-info → judgeval-0.13.0.dist-info}/licenses/LICENSE.md +0 -0
judgeval/env.py
CHANGED
@@ -32,7 +32,7 @@ JUDGMENT_API_KEY = required_env_var("JUDGMENT_API_KEY")
|
|
32
32
|
JUDGMENT_ORG_ID = required_env_var("JUDGMENT_ORG_ID")
|
33
33
|
JUDGMENT_API_URL = optional_env_var("JUDGMENT_API_URL", "https://api.judgmentlabs.ai")
|
34
34
|
|
35
|
-
JUDGMENT_DEFAULT_GPT_MODEL = optional_env_var("JUDGMENT_DEFAULT_GPT_MODEL", "gpt-
|
35
|
+
JUDGMENT_DEFAULT_GPT_MODEL = optional_env_var("JUDGMENT_DEFAULT_GPT_MODEL", "gpt-5")
|
36
36
|
JUDGMENT_DEFAULT_TOGETHER_MODEL = optional_env_var(
|
37
37
|
"JUDGMENT_DEFAULT_TOGETHER_MODEL", "meta-llama/Meta-Llama-3-8B-Instruct-Lite"
|
38
38
|
)
|
@@ -40,6 +40,10 @@ JUDGMENT_MAX_CONCURRENT_EVALUATIONS = int(
|
|
40
40
|
optional_env_var("JUDGMENT_MAX_CONCURRENT_EVALUATIONS", "10")
|
41
41
|
)
|
42
42
|
|
43
|
+
|
44
|
+
JUDGMENT_ENABLE_MONITORING = optional_env_var("JUDGMENT_ENABLE_MONITORING", "true")
|
45
|
+
JUDGMENT_ENABLE_EVALUATIONS = optional_env_var("JUDGMENT_ENABLE_EVALUATIONS", "true")
|
46
|
+
|
43
47
|
JUDGMENT_S3_ACCESS_KEY_ID = optional_env_var("JUDGMENT_S3_ACCESS_KEY_ID")
|
44
48
|
JUDGMENT_S3_SECRET_ACCESS_KEY = optional_env_var("JUDGMENT_S3_SECRET_ACCESS_KEY")
|
45
49
|
JUDGMENT_S3_REGION_NAME = optional_env_var("JUDGMENT_S3_REGION_NAME")
|
@@ -55,22 +59,3 @@ JUDGMENT_NO_COLOR = optional_env_var("JUDGMENT_NO_COLOR")
|
|
55
59
|
|
56
60
|
TOGETHERAI_API_KEY = optional_env_var("TOGETHERAI_API_KEY")
|
57
61
|
TOGETHER_API_KEY = optional_env_var("TOGETHER_API_KEY")
|
58
|
-
|
59
|
-
__all__ = (
|
60
|
-
"JUDGMENT_API_KEY",
|
61
|
-
"JUDGMENT_ORG_ID",
|
62
|
-
"JUDGMENT_API_URL",
|
63
|
-
"JUDGMENT_DEFAULT_GPT_MODEL",
|
64
|
-
"JUDGMENT_DEFAULT_TOGETHER_MODEL",
|
65
|
-
"JUDGMENT_MAX_CONCURRENT_EVALUATIONS",
|
66
|
-
"JUDGMENT_S3_ACCESS_KEY_ID",
|
67
|
-
"JUDGMENT_S3_SECRET_ACCESS_KEY",
|
68
|
-
"JUDGMENT_S3_REGION_NAME",
|
69
|
-
"JUDGMENT_S3_BUCKET_NAME",
|
70
|
-
"JUDGMENT_S3_PREFIX",
|
71
|
-
"JUDGMENT_S3_ENDPOINT_URL",
|
72
|
-
"JUDGMENT_S3_ADDRESSING_STYLE",
|
73
|
-
"JUDGMENT_NO_COLOR",
|
74
|
-
"TOGETHERAI_API_KEY",
|
75
|
-
"TOGETHER_API_KEY",
|
76
|
-
)
|