judgeval 0.10.0__tar.gz → 0.10.1__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (122) hide show
  1. {judgeval-0.10.0 → judgeval-0.10.1}/PKG-INFO +1 -1
  2. {judgeval-0.10.0 → judgeval-0.10.1}/pyproject.toml +1 -1
  3. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/api/__init__.py +6 -0
  4. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/api/api_types.py +11 -0
  5. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/dataset/__init__.py +25 -2
  6. {judgeval-0.10.0 → judgeval-0.10.1}/.github/ISSUE_TEMPLATE/bug_report.md +0 -0
  7. {judgeval-0.10.0 → judgeval-0.10.1}/.github/ISSUE_TEMPLATE/config.yml +0 -0
  8. {judgeval-0.10.0 → judgeval-0.10.1}/.github/ISSUE_TEMPLATE/feature_request.md +0 -0
  9. {judgeval-0.10.0 → judgeval-0.10.1}/.github/pull_request_template.md +0 -0
  10. {judgeval-0.10.0 → judgeval-0.10.1}/.github/workflows/blocked-pr.yaml +0 -0
  11. {judgeval-0.10.0 → judgeval-0.10.1}/.github/workflows/ci.yaml +0 -0
  12. {judgeval-0.10.0 → judgeval-0.10.1}/.github/workflows/claude-code-review.yml +0 -0
  13. {judgeval-0.10.0 → judgeval-0.10.1}/.github/workflows/claude.yml +0 -0
  14. {judgeval-0.10.0 → judgeval-0.10.1}/.github/workflows/lint.yaml +0 -0
  15. {judgeval-0.10.0 → judgeval-0.10.1}/.github/workflows/merge-branch-check.yaml +0 -0
  16. {judgeval-0.10.0 → judgeval-0.10.1}/.github/workflows/mypy.yaml +0 -0
  17. {judgeval-0.10.0 → judgeval-0.10.1}/.github/workflows/pre-commit-autoupdate.yaml +0 -0
  18. {judgeval-0.10.0 → judgeval-0.10.1}/.github/workflows/release.yaml +0 -0
  19. {judgeval-0.10.0 → judgeval-0.10.1}/.github/workflows/validate-branch.yaml +0 -0
  20. {judgeval-0.10.0 → judgeval-0.10.1}/.gitignore +0 -0
  21. {judgeval-0.10.0 → judgeval-0.10.1}/.pre-commit-config.yaml +0 -0
  22. {judgeval-0.10.0 → judgeval-0.10.1}/LICENSE.md +0 -0
  23. {judgeval-0.10.0 → judgeval-0.10.1}/README.md +0 -0
  24. {judgeval-0.10.0 → judgeval-0.10.1}/assets/Screenshot 2025-05-17 at 8.14.27 PM.png +0 -0
  25. {judgeval-0.10.0 → judgeval-0.10.1}/assets/agent.gif +0 -0
  26. {judgeval-0.10.0 → judgeval-0.10.1}/assets/agent_trace_example.png +0 -0
  27. {judgeval-0.10.0 → judgeval-0.10.1}/assets/data.gif +0 -0
  28. {judgeval-0.10.0 → judgeval-0.10.1}/assets/dataset_clustering_screenshot.png +0 -0
  29. {judgeval-0.10.0 → judgeval-0.10.1}/assets/dataset_clustering_screenshot_dm.png +0 -0
  30. {judgeval-0.10.0 → judgeval-0.10.1}/assets/datasets_preview_screenshot.png +0 -0
  31. {judgeval-0.10.0 → judgeval-0.10.1}/assets/document.gif +0 -0
  32. {judgeval-0.10.0 → judgeval-0.10.1}/assets/error_analysis_dashboard.png +0 -0
  33. {judgeval-0.10.0 → judgeval-0.10.1}/assets/errors.png +0 -0
  34. {judgeval-0.10.0 → judgeval-0.10.1}/assets/experiments_dashboard_screenshot.png +0 -0
  35. {judgeval-0.10.0 → judgeval-0.10.1}/assets/experiments_page.png +0 -0
  36. {judgeval-0.10.0 → judgeval-0.10.1}/assets/experiments_pagev2.png +0 -0
  37. {judgeval-0.10.0 → judgeval-0.10.1}/assets/logo-dark.svg +0 -0
  38. {judgeval-0.10.0 → judgeval-0.10.1}/assets/logo-light.svg +0 -0
  39. {judgeval-0.10.0 → judgeval-0.10.1}/assets/monitoring_screenshot.png +0 -0
  40. {judgeval-0.10.0 → judgeval-0.10.1}/assets/new_darkmode.svg +0 -0
  41. {judgeval-0.10.0 → judgeval-0.10.1}/assets/new_lightmode.svg +0 -0
  42. {judgeval-0.10.0 → judgeval-0.10.1}/assets/online_eval.png +0 -0
  43. {judgeval-0.10.0 → judgeval-0.10.1}/assets/product_shot.png +0 -0
  44. {judgeval-0.10.0 → judgeval-0.10.1}/assets/test.png +0 -0
  45. {judgeval-0.10.0 → judgeval-0.10.1}/assets/tests.png +0 -0
  46. {judgeval-0.10.0 → judgeval-0.10.1}/assets/trace.gif +0 -0
  47. {judgeval-0.10.0 → judgeval-0.10.1}/assets/trace_demo.png +0 -0
  48. {judgeval-0.10.0 → judgeval-0.10.1}/assets/trace_screenshot.png +0 -0
  49. {judgeval-0.10.0 → judgeval-0.10.1}/assets/trace_screenshot_old.png +0 -0
  50. {judgeval-0.10.0 → judgeval-0.10.1}/pytest.ini +0 -0
  51. {judgeval-0.10.0 → judgeval-0.10.1}/scripts/api_generator.py +0 -0
  52. {judgeval-0.10.0 → judgeval-0.10.1}/scripts/openapi_transform.py +0 -0
  53. {judgeval-0.10.0 → judgeval-0.10.1}/scripts/update_types.sh +0 -0
  54. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/__init__.py +0 -0
  55. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/cli.py +0 -0
  56. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/constants.py +0 -0
  57. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/data/__init__.py +0 -0
  58. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/data/evaluation_run.py +0 -0
  59. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/data/example.py +0 -0
  60. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/data/judgment_types.py +0 -0
  61. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/data/result.py +0 -0
  62. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/data/scorer_data.py +0 -0
  63. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/data/scripts/fix_default_factory.py +0 -0
  64. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/data/scripts/openapi_transform.py +0 -0
  65. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/data/tool.py +0 -0
  66. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/data/trace.py +0 -0
  67. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/env.py +0 -0
  68. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/evaluation/__init__.py +0 -0
  69. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/exceptions.py +0 -0
  70. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/integrations/langgraph/__init__.py +0 -0
  71. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/judges/__init__.py +0 -0
  72. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/judges/base_judge.py +0 -0
  73. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/judges/litellm_judge.py +0 -0
  74. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/judges/together_judge.py +0 -0
  75. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/judges/utils.py +0 -0
  76. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/logger.py +0 -0
  77. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/scorers/__init__.py +0 -0
  78. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/scorers/agent_scorer.py +0 -0
  79. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/scorers/api_scorer.py +0 -0
  80. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/scorers/base_scorer.py +0 -0
  81. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/scorers/example_scorer.py +0 -0
  82. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/scorers/exceptions.py +0 -0
  83. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/scorers/judgeval_scorers/__init__.py +0 -0
  84. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/scorers/judgeval_scorers/api_scorers/__init__.py +0 -0
  85. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/scorers/judgeval_scorers/api_scorers/answer_correctness.py +0 -0
  86. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/scorers/judgeval_scorers/api_scorers/answer_relevancy.py +0 -0
  87. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/scorers/judgeval_scorers/api_scorers/faithfulness.py +0 -0
  88. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/scorers/judgeval_scorers/api_scorers/instruction_adherence.py +0 -0
  89. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/scorers/judgeval_scorers/api_scorers/prompt_scorer.py +0 -0
  90. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/scorers/score.py +0 -0
  91. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/scorers/utils.py +0 -0
  92. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/tracer/__init__.py +0 -0
  93. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/tracer/constants.py +0 -0
  94. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/tracer/exporters/__init__.py +0 -0
  95. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/tracer/exporters/s3.py +0 -0
  96. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/tracer/exporters/store.py +0 -0
  97. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/tracer/exporters/utils.py +0 -0
  98. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/tracer/keys.py +0 -0
  99. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/tracer/llm/__init__.py +0 -0
  100. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/tracer/llm/providers.py +0 -0
  101. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/tracer/local_eval_queue.py +0 -0
  102. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/tracer/managers.py +0 -0
  103. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/tracer/processors/__init__.py +0 -0
  104. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/tracer/utils.py +0 -0
  105. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/trainer/__init__.py +0 -0
  106. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/trainer/config.py +0 -0
  107. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/trainer/console.py +0 -0
  108. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/trainer/trainable_model.py +0 -0
  109. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/trainer/trainer.py +0 -0
  110. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/utils/async_utils.py +0 -0
  111. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/utils/decorators.py +0 -0
  112. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/utils/file_utils.py +0 -0
  113. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/utils/guards.py +0 -0
  114. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/utils/meta.py +0 -0
  115. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/utils/serialize.py +0 -0
  116. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/utils/testing.py +0 -0
  117. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/utils/url.py +0 -0
  118. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/utils/version_check.py +0 -0
  119. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/version.py +0 -0
  120. {judgeval-0.10.0 → judgeval-0.10.1}/src/judgeval/warnings.py +0 -0
  121. {judgeval-0.10.0 → judgeval-0.10.1}/update_version.py +0 -0
  122. {judgeval-0.10.0 → judgeval-0.10.1}/uv.lock +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: judgeval
3
- Version: 0.10.0
3
+ Version: 0.10.1
4
4
  Summary: Judgeval Package
5
5
  Project-URL: Homepage, https://github.com/JudgmentLabs/judgeval
6
6
  Project-URL: Issues, https://github.com/JudgmentLabs/judgeval/issues
@@ -1,6 +1,6 @@
1
1
  [project]
2
2
  name = "judgeval"
3
- version = "0.10.0"
3
+ version = "0.10.1"
4
4
  authors = [
5
5
  { name = "Andrew Li", email = "andrew@judgmentlabs.ai" },
6
6
  { name = "Alex Shan", email = "alex@judgmentlabs.ai" },
@@ -137,6 +137,12 @@ class JudgmentSyncClient:
137
137
  payload,
138
138
  )
139
139
 
140
+ def datasets_pull_all_for_judgeval(self, payload: DatasetsFetch) -> List[DatasetInfo]:
141
+ return self._request(
142
+ "POST",
143
+ url_for("/datasets/pull_all_for_judgeval/"),
144
+ payload,
145
+ )
140
146
  def datasets_create_for_judgeval(self, payload: DatasetCreate) -> Any:
141
147
  return self._request(
142
148
  "POST",
@@ -19,6 +19,9 @@ class DatasetFetch(TypedDict):
19
19
  dataset_name: str
20
20
  project_name: str
21
21
 
22
+ class DatasetsFetch(TypedDict):
23
+ project_name: str
24
+
22
25
 
23
26
  class ProjectAdd(TypedDict):
24
27
  project_name: str
@@ -225,6 +228,14 @@ class DatasetReturn(TypedDict):
225
228
  project_name: str
226
229
  examples: NotRequired[Optional[List[Example]]]
227
230
 
231
+ class DatasetInfo(TypedDict):
232
+ dataset_id: str
233
+ name: str
234
+ created_at: str
235
+ dataset_kind: DatasetKind
236
+ entries: int
237
+ creator: str
238
+
228
239
 
229
240
  class DatasetCreate(TypedDict):
230
241
  name: str
@@ -11,6 +11,16 @@ from judgeval.api import JudgmentSyncClient
11
11
  from judgeval.logger import judgeval_logger
12
12
  from judgeval.env import JUDGMENT_API_KEY, JUDGMENT_ORG_ID
13
13
 
14
+ from judgeval.api.api_types import DatasetKind
15
+
16
+ @dataclass
17
+ class DatasetInfo:
18
+ dataset_id: str
19
+ name: str
20
+ created_at: str
21
+ dataset_kind: DatasetKind
22
+ entries: int
23
+ creator: str
14
24
 
15
25
  @dataclass
16
26
  class Dataset:
@@ -42,7 +52,7 @@ class Dataset:
42
52
  e.pop(
43
53
  "example_id"
44
54
  ) # TODO: remove once scorer data migraiton is complete
45
- judgeval_logger.info(f"Succesfully retrieved dataset {name}!")
55
+ judgeval_logger.info(f"Successfully retrieved dataset {name}!")
46
56
  return cls(
47
57
  name=name,
48
58
  project_name=project_name,
@@ -71,12 +81,25 @@ class Dataset:
71
81
  }
72
82
  )
73
83
 
74
- judgeval_logger.info(f"Succesfull created dataset {name}!")
84
+ judgeval_logger.info(f"Successfully created dataset {name}!")
75
85
  return cls(
76
86
  name=name,
77
87
  project_name=project_name,
78
88
  examples=examples,
79
89
  )
90
+ @classmethod
91
+ def list(
92
+ cls,
93
+ project_name: str
94
+ ):
95
+ client = JudgmentSyncClient(cls.judgment_api_key, cls.organization_id)
96
+ datasets = client.datasets_pull_all_for_judgeval(
97
+ {"project_name": project_name}
98
+ )
99
+
100
+ judgeval_logger.info(f"Fetched all datasets for project {project_name}!")
101
+
102
+ return [DatasetInfo(**dataset_info) for dataset_info in datasets]
80
103
 
81
104
  def add_from_json(self, file_path: str) -> None:
82
105
  """
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes