fiddler-evals 0.1.1.dev12__tar.gz → 0.1.1.dev13__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (96)
  1. {fiddler_evals-0.1.1.dev12/fiddler_evals.egg-info → fiddler_evals-0.1.1.dev13}/PKG-INFO +1 -1
  2. fiddler_evals-0.1.1.dev13/fiddler_evals/VERSION +1 -0
  3. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/entities/dataset.py +4 -1
  4. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/runner/experiment_result_publisher.py +1 -1
  5. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/runner/experiment_runner.py +5 -0
  6. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/runner/tests/test_evaluate.py +18 -1
  7. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13/fiddler_evals.egg-info}/PKG-INFO +1 -1
  8. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/pyproject.toml +1 -1
  9. fiddler_evals-0.1.1.dev12/fiddler_evals/VERSION +0 -1
  10. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/MANIFEST.in +0 -0
  11. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/PUBLIC.md +0 -0
  12. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/README.md +0 -0
  13. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/__init__.py +0 -0
  14. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/configs.py +0 -0
  15. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/conftest.py +0 -0
  16. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/connection.py +0 -0
  17. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/constants.py +0 -0
  18. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/decorators.py +0 -0
  19. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/entities/__init__.py +0 -0
  20. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/entities/application.py +0 -0
  21. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/entities/base.py +0 -0
  22. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/entities/experiment.py +0 -0
  23. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/entities/project.py +0 -0
  24. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/entities/tests/__init__.py +0 -0
  25. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/entities/tests/test_application.py +0 -0
  26. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/entities/tests/test_dataset.py +0 -0
  27. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/entities/tests/test_dataset_items.py +0 -0
  28. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/entities/tests/test_experiment.py +0 -0
  29. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/entities/tests/test_experiment_items.py +0 -0
  30. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/entities/tests/test_experiment_results.py +0 -0
  31. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/entities/tests/test_project.py +0 -0
  32. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/evaluators/__init__.py +0 -0
  33. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/evaluators/answer_relevance.py +0 -0
  34. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/evaluators/base.py +0 -0
  35. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/evaluators/coherence.py +0 -0
  36. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/evaluators/conciseness.py +0 -0
  37. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/evaluators/eval_fn.py +0 -0
  38. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/evaluators/ftl_prompt_safety.py +0 -0
  39. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/evaluators/ftl_response_faithfulness.py +0 -0
  40. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/evaluators/regex.py +0 -0
  41. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/evaluators/sentiment.py +0 -0
  42. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/evaluators/tests/__init__.py +0 -0
  43. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/evaluators/tests/test_answer_relevance.py +0 -0
  44. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/evaluators/tests/test_coherence.py +0 -0
  45. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/evaluators/tests/test_conciseness.py +0 -0
  46. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/evaluators/tests/test_eval_fn.py +0 -0
  47. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/evaluators/tests/test_ftl_prompt_safety.py +0 -0
  48. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/evaluators/tests/test_ftl_response_faithfulness.py +0 -0
  49. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/evaluators/tests/test_regex.py +0 -0
  50. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/evaluators/tests/test_sentiment.py +0 -0
  51. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/evaluators/tests/test_topic_classification.py +0 -0
  52. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/evaluators/tests/test_toxicity.py +0 -0
  53. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/evaluators/topic.py +0 -0
  54. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/evaluators/toxicity.py +0 -0
  55. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/exceptions.py +0 -0
  56. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/libs/__init__.py +0 -0
  57. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/libs/http_client.py +0 -0
  58. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/libs/json_encoder.py +0 -0
  59. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/libs/semver.py +0 -0
  60. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/libs/tests/__init__.py +0 -0
  61. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/libs/tests/test_json_encoder.py +0 -0
  62. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/libs/tests/test_request_client.py +0 -0
  63. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/pydantic_models/__init__.py +0 -0
  64. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/pydantic_models/application.py +0 -0
  65. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/pydantic_models/base.py +0 -0
  66. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/pydantic_models/compact.py +0 -0
  67. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/pydantic_models/dataset.py +0 -0
  68. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/pydantic_models/error.py +0 -0
  69. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/pydantic_models/evaluator.py +0 -0
  70. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/pydantic_models/experiment.py +0 -0
  71. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/pydantic_models/filter_query.py +0 -0
  72. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/pydantic_models/project.py +0 -0
  73. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/pydantic_models/response.py +0 -0
  74. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/pydantic_models/score.py +0 -0
  75. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/pydantic_models/server_info.py +0 -0
  76. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/runner/__init__.py +0 -0
  77. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/runner/evaluation.py +0 -0
  78. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/runner/executor.py +0 -0
  79. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/runner/tests/__init__.py +0 -0
  80. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/runner/tests/test_experiment_result_publisher.py +0 -0
  81. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/tests/__init__.py +0 -0
  82. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/tests/constants.py +0 -0
  83. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/tests/test_connection.py +0 -0
  84. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/tests/test_decorators.py +0 -0
  85. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/utils/__init__.py +0 -0
  86. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/utils/environment.py +0 -0
  87. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/utils/pd.py +0 -0
  88. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/utils/tests/__init__.py +0 -0
  89. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/utils/tests/test_environment.py +0 -0
  90. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/utils/tqdm.py +0 -0
  91. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals/version.py +0 -0
  92. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals.egg-info/SOURCES.txt +0 -0
  93. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals.egg-info/dependency_links.txt +0 -0
  94. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals.egg-info/requires.txt +0 -0
  95. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/fiddler_evals.egg-info/top_level.txt +0 -0
  96. {fiddler_evals-0.1.1.dev12 → fiddler_evals-0.1.1.dev13}/setup.cfg +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: fiddler-evals
3
- Version: 0.1.1.dev12
3
+ Version: 0.1.1.dev13
4
4
  Summary: Python SDK for evaluating LLM Applications
5
5
  Author-email: Fiddler AI <support@fiddler.ai>
6
6
  Maintainer-email: Fiddler AI <support@fiddler.ai>
@@ -0,0 +1 @@
1
+ 0.1.1.dev13
@@ -732,7 +732,10 @@ class Dataset(BaseEntity):
732
732
  with list(dataset.get_items()) if you need to iterate multiple times or get
733
733
  the total count. The iterator fetches items lazily from the API.
734
734
  """
735
- for item in self._paginate(url=f"{self._get_url(self.id)}/items"):
735
+ # Read up to 1K dataset items in a call to reduce network calls and latency
736
+ for item in self._paginate(
737
+ url=f"{self._get_url(self.id)}/items", page_size=1000
738
+ ):
736
739
  yield DatasetItem(**item)
737
740
 
738
741
  @handle_api_error
@@ -61,7 +61,7 @@ class ExperimentResultPublisher:
61
61
 
62
62
  # Auto-flush when batch size is reached
63
63
  if len(self._buffer) >= self._batch_size:
64
- logger.info(
64
+ logger.debug(
65
65
  "Flushing experiment result buffer of size %d", len(self._buffer)
66
66
  )
67
67
  self._flush_internal()
@@ -656,6 +656,11 @@ class ExperimentRunner:
656
656
  self._dataset.name,
657
657
  )
658
658
 
659
+ # Mark the experiment as in progress
660
+ self._experiment.update(
661
+ status=ExperimentStatus.IN_PROGRESS,
662
+ )
663
+
659
664
  # Use a thread pool to process the dataset items when max_workers > 1
660
665
  if self._max_workers > 1:
661
666
  results = thread_map(
@@ -1,3 +1,4 @@
1
+ import json
1
2
  from datetime import datetime
2
3
  from typing import Any
3
4
  from unittest import mock
@@ -147,7 +148,23 @@ def test_evaluate_with_regex_with_kwargs_mapping() -> None:
147
148
  json=EXPERIMENT_API_RESPONSE,
148
149
  )
149
150
 
150
- # Mock experiment updation
151
+ # Mock experiment status update to IN_PROGRESS with request body verification
152
+ in_progress_response = EXPERIMENT_API_RESPONSE.copy()
153
+ in_progress_response["data"]["status"] = ExperimentStatus.IN_PROGRESS
154
+
155
+ def in_progress_callback(request):
156
+ # Verify that the request body contains the correct status
157
+ request_body = json.loads(request.body)
158
+ assert request_body["status"] == ExperimentStatus.IN_PROGRESS
159
+ return (200, {}, json.dumps(in_progress_response))
160
+
161
+ responses.add_callback(
162
+ responses.PATCH,
163
+ url=f"{URL}/v3/evals/experiments/{EXPERIMENT_ID}",
164
+ callback=in_progress_callback,
165
+ )
166
+
167
+ # Mock experiment update to COMPLETED
151
168
  updated_response = EXPERIMENT_API_RESPONSE.copy()
152
169
  updated_response["data"]["status"] = ExperimentStatus.COMPLETED
153
170
  responses.patch(
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: fiddler-evals
3
- Version: 0.1.1.dev12
3
+ Version: 0.1.1.dev13
4
4
  Summary: Python SDK for evaluating LLM Applications
5
5
  Author-email: Fiddler AI <support@fiddler.ai>
6
6
  Maintainer-email: Fiddler AI <support@fiddler.ai>
@@ -1,6 +1,6 @@
1
1
  [project]
2
2
  name = "fiddler-evals"
3
- version = "0.1.1.dev12"
3
+ version = "0.1.1.dev13"
4
4
  authors = [
5
5
  { name = "Fiddler AI", email = "support@fiddler.ai" },
6
6
  ]
@@ -1 +0,0 @@
1
- 0.1.1.dev12