pydantic-evals 1.2.0__tar.gz → 1.3.0__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of pydantic-evals might be problematic. Click here for more details.
- {pydantic_evals-1.2.0 → pydantic_evals-1.3.0}/PKG-INFO +2 -2
- {pydantic_evals-1.2.0 → pydantic_evals-1.3.0}/pydantic_evals/dataset.py +2 -0
- {pydantic_evals-1.2.0 → pydantic_evals-1.3.0}/.gitignore +0 -0
- {pydantic_evals-1.2.0 → pydantic_evals-1.3.0}/LICENSE +0 -0
- {pydantic_evals-1.2.0 → pydantic_evals-1.3.0}/README.md +0 -0
- {pydantic_evals-1.2.0 → pydantic_evals-1.3.0}/pydantic_evals/__init__.py +0 -0
- {pydantic_evals-1.2.0 → pydantic_evals-1.3.0}/pydantic_evals/_utils.py +0 -0
- {pydantic_evals-1.2.0 → pydantic_evals-1.3.0}/pydantic_evals/evaluators/__init__.py +0 -0
- {pydantic_evals-1.2.0 → pydantic_evals-1.3.0}/pydantic_evals/evaluators/_run_evaluator.py +0 -0
- {pydantic_evals-1.2.0 → pydantic_evals-1.3.0}/pydantic_evals/evaluators/common.py +0 -0
- {pydantic_evals-1.2.0 → pydantic_evals-1.3.0}/pydantic_evals/evaluators/context.py +0 -0
- {pydantic_evals-1.2.0 → pydantic_evals-1.3.0}/pydantic_evals/evaluators/evaluator.py +0 -0
- {pydantic_evals-1.2.0 → pydantic_evals-1.3.0}/pydantic_evals/evaluators/llm_as_a_judge.py +0 -0
- {pydantic_evals-1.2.0 → pydantic_evals-1.3.0}/pydantic_evals/evaluators/spec.py +0 -0
- {pydantic_evals-1.2.0 → pydantic_evals-1.3.0}/pydantic_evals/generation.py +0 -0
- {pydantic_evals-1.2.0 → pydantic_evals-1.3.0}/pydantic_evals/otel/__init__.py +0 -0
- {pydantic_evals-1.2.0 → pydantic_evals-1.3.0}/pydantic_evals/otel/_context_in_memory_span_exporter.py +0 -0
- {pydantic_evals-1.2.0 → pydantic_evals-1.3.0}/pydantic_evals/otel/_context_subtree.py +0 -0
- {pydantic_evals-1.2.0 → pydantic_evals-1.3.0}/pydantic_evals/otel/_errors.py +0 -0
- {pydantic_evals-1.2.0 → pydantic_evals-1.3.0}/pydantic_evals/otel/span_tree.py +0 -0
- {pydantic_evals-1.2.0 → pydantic_evals-1.3.0}/pydantic_evals/py.typed +0 -0
- {pydantic_evals-1.2.0 → pydantic_evals-1.3.0}/pydantic_evals/reporting/__init__.py +0 -0
- {pydantic_evals-1.2.0 → pydantic_evals-1.3.0}/pydantic_evals/reporting/render_numbers.py +0 -0
- {pydantic_evals-1.2.0 → pydantic_evals-1.3.0}/pyproject.toml +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: pydantic-evals
|
|
3
|
-
Version: 1.2.0
|
|
3
|
+
Version: 1.3.0
|
|
4
4
|
Summary: Framework for evaluating stochastic code execution, especially code making use of LLMs
|
|
5
5
|
Project-URL: Homepage, https://ai.pydantic.dev/evals
|
|
6
6
|
Project-URL: Source, https://github.com/pydantic/pydantic-ai
|
|
@@ -30,7 +30,7 @@ Classifier: Topic :: Software Development :: Libraries :: Python Modules
|
|
|
30
30
|
Requires-Python: >=3.10
|
|
31
31
|
Requires-Dist: anyio>=0
|
|
32
32
|
Requires-Dist: logfire-api>=3.14.1
|
|
33
|
-
Requires-Dist: pydantic-ai-slim==1.2.0
|
|
33
|
+
Requires-Dist: pydantic-ai-slim==1.3.0
|
|
34
34
|
Requires-Dist: pydantic>=2.10
|
|
35
35
|
Requires-Dist: pyyaml>=6.0.2
|
|
36
36
|
Requires-Dist: rich>=13.9.4
|
|
@@ -343,6 +343,8 @@ class Dataset(BaseModel, Generic[InputsT, OutputT, MetadataT], extra='forbid', a
|
|
|
343
343
|
trace_id=trace_id,
|
|
344
344
|
)
|
|
345
345
|
if (averages := report.averages()) is not None and averages.assertions is not None:
|
|
346
|
+
experiment_metadata = {'n_cases': len(self.cases), 'averages': averages}
|
|
347
|
+
eval_span.set_attribute('logfire.experiment.metadata', experiment_metadata)
|
|
346
348
|
eval_span.set_attribute('assertion_pass_rate', averages.assertions)
|
|
347
349
|
return report
|
|
348
350
|
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|