judgeval-0.12.0-py3-none-any.whl → judgeval-0.13.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (40)
  1. judgeval/__init__.py +2 -2
  2. judgeval/api/api_types.py +81 -12
  3. judgeval/cli.py +2 -1
  4. judgeval/constants.py +0 -6
  5. judgeval/data/evaluation_run.py +2 -5
  6. judgeval/data/judgment_types.py +97 -12
  7. judgeval/data/trace.py +108 -1
  8. judgeval/dataset/__init__.py +72 -23
  9. judgeval/env.py +5 -20
  10. judgeval/integrations/langgraph/__init__.py +9 -785
  11. judgeval/scorers/api_scorer.py +7 -12
  12. judgeval/scorers/judgeval_scorers/api_scorers/answer_correctness.py +0 -8
  13. judgeval/scorers/judgeval_scorers/api_scorers/faithfulness.py +0 -8
  14. judgeval/scorers/judgeval_scorers/api_scorers/instruction_adherence.py +0 -12
  15. judgeval/scorers/judgeval_scorers/api_scorers/prompt_scorer.py +22 -33
  16. judgeval/scorers/score.py +1 -1
  17. judgeval/scorers/utils.py +1 -4
  18. judgeval/tracer/__init__.py +175 -156
  19. judgeval/tracer/exporters/__init__.py +4 -1
  20. judgeval/tracer/keys.py +15 -25
  21. judgeval/tracer/llm/__init__.py +0 -1
  22. judgeval/tracer/llm/anthropic/__init__.py +20 -0
  23. judgeval/tracer/llm/google/__init__.py +21 -0
  24. judgeval/tracer/llm/groq/__init__.py +20 -0
  25. judgeval/tracer/llm/openai/__init__.py +32 -0
  26. judgeval/tracer/llm/providers.py +28 -79
  27. judgeval/tracer/llm/together/__init__.py +20 -0
  28. judgeval/tracer/managers.py +23 -48
  29. judgeval/tracer/processors/__init__.py +36 -75
  30. judgeval/tracer/utils.py +1 -2
  31. judgeval/utils/file_utils.py +0 -2
  32. judgeval/utils/meta.py +18 -5
  33. judgeval/utils/testing.py +0 -14
  34. judgeval/utils/version_check.py +2 -0
  35. judgeval/version.py +1 -1
  36. {judgeval-0.12.0.dist-info → judgeval-0.13.0.dist-info}/METADATA +1 -7
  37. {judgeval-0.12.0.dist-info → judgeval-0.13.0.dist-info}/RECORD +40 -35
  38. {judgeval-0.12.0.dist-info → judgeval-0.13.0.dist-info}/WHEEL +0 -0
  39. {judgeval-0.12.0.dist-info → judgeval-0.13.0.dist-info}/entry_points.txt +0 -0
  40. {judgeval-0.12.0.dist-info → judgeval-0.13.0.dist-info}/licenses/LICENSE.md +0 -0
judgeval/env.py CHANGED
@@ -32,7 +32,7 @@ JUDGMENT_API_KEY = required_env_var("JUDGMENT_API_KEY")
32
32
  JUDGMENT_ORG_ID = required_env_var("JUDGMENT_ORG_ID")
33
33
  JUDGMENT_API_URL = optional_env_var("JUDGMENT_API_URL", "https://api.judgmentlabs.ai")
34
34
 
35
- JUDGMENT_DEFAULT_GPT_MODEL = optional_env_var("JUDGMENT_DEFAULT_GPT_MODEL", "gpt-4.1")
35
+ JUDGMENT_DEFAULT_GPT_MODEL = optional_env_var("JUDGMENT_DEFAULT_GPT_MODEL", "gpt-5")
36
36
  JUDGMENT_DEFAULT_TOGETHER_MODEL = optional_env_var(
37
37
  "JUDGMENT_DEFAULT_TOGETHER_MODEL", "meta-llama/Meta-Llama-3-8B-Instruct-Lite"
38
38
  )
@@ -40,6 +40,10 @@ JUDGMENT_MAX_CONCURRENT_EVALUATIONS = int(
40
40
  optional_env_var("JUDGMENT_MAX_CONCURRENT_EVALUATIONS", "10")
41
41
  )
42
42
 
43
+
44
+ JUDGMENT_ENABLE_MONITORING = optional_env_var("JUDGMENT_ENABLE_MONITORING", "true")
45
+ JUDGMENT_ENABLE_EVALUATIONS = optional_env_var("JUDGMENT_ENABLE_EVALUATIONS", "true")
46
+
43
47
  JUDGMENT_S3_ACCESS_KEY_ID = optional_env_var("JUDGMENT_S3_ACCESS_KEY_ID")
44
48
  JUDGMENT_S3_SECRET_ACCESS_KEY = optional_env_var("JUDGMENT_S3_SECRET_ACCESS_KEY")
45
49
  JUDGMENT_S3_REGION_NAME = optional_env_var("JUDGMENT_S3_REGION_NAME")
@@ -55,22 +59,3 @@ JUDGMENT_NO_COLOR = optional_env_var("JUDGMENT_NO_COLOR")
55
59
 
56
60
  TOGETHERAI_API_KEY = optional_env_var("TOGETHERAI_API_KEY")
57
61
  TOGETHER_API_KEY = optional_env_var("TOGETHER_API_KEY")
58
-
59
- __all__ = (
60
- "JUDGMENT_API_KEY",
61
- "JUDGMENT_ORG_ID",
62
- "JUDGMENT_API_URL",
63
- "JUDGMENT_DEFAULT_GPT_MODEL",
64
- "JUDGMENT_DEFAULT_TOGETHER_MODEL",
65
- "JUDGMENT_MAX_CONCURRENT_EVALUATIONS",
66
- "JUDGMENT_S3_ACCESS_KEY_ID",
67
- "JUDGMENT_S3_SECRET_ACCESS_KEY",
68
- "JUDGMENT_S3_REGION_NAME",
69
- "JUDGMENT_S3_BUCKET_NAME",
70
- "JUDGMENT_S3_PREFIX",
71
- "JUDGMENT_S3_ENDPOINT_URL",
72
- "JUDGMENT_S3_ADDRESSING_STYLE",
73
- "JUDGMENT_NO_COLOR",
74
- "TOGETHERAI_API_KEY",
75
- "TOGETHER_API_KEY",
76
- )