scale-gp-beta 0.1.0a11__tar.gz → 0.1.0a12__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (144)
  1. scale_gp_beta-0.1.0a12/.release-please-manifest.json +3 -0
  2. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/CHANGELOG.md +8 -0
  3. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/PKG-INFO +1 -1
  4. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/pyproject.toml +1 -1
  5. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/_version.py +1 -1
  6. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/evaluation_task.py +94 -1
  7. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/evaluation_task_param.py +89 -1
  8. scale_gp_beta-0.1.0a11/.release-please-manifest.json +0 -3
  9. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/.gitignore +0 -0
  10. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/CONTRIBUTING.md +0 -0
  11. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/LICENSE +0 -0
  12. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/README.md +0 -0
  13. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/SECURITY.md +0 -0
  14. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/api.md +0 -0
  15. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/bin/check-release-environment +0 -0
  16. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/bin/publish-pypi +0 -0
  17. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/examples/.keep +0 -0
  18. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/mypy.ini +0 -0
  19. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/noxfile.py +0 -0
  20. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/release-please-config.json +0 -0
  21. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/requirements-dev.lock +0 -0
  22. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/requirements.lock +0 -0
  23. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp/lib/.keep +0 -0
  24. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/__init__.py +0 -0
  25. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/_base_client.py +0 -0
  26. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/_client.py +0 -0
  27. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/_compat.py +0 -0
  28. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/_constants.py +0 -0
  29. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/_exceptions.py +0 -0
  30. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/_files.py +0 -0
  31. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/_models.py +0 -0
  32. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/_qs.py +0 -0
  33. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/_resource.py +0 -0
  34. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/_response.py +0 -0
  35. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/_streaming.py +0 -0
  36. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/_types.py +0 -0
  37. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/_utils/__init__.py +0 -0
  38. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/_utils/_logs.py +0 -0
  39. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/_utils/_proxy.py +0 -0
  40. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/_utils/_reflection.py +0 -0
  41. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/_utils/_streams.py +0 -0
  42. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/_utils/_sync.py +0 -0
  43. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/_utils/_transform.py +0 -0
  44. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/_utils/_typing.py +0 -0
  45. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/_utils/_utils.py +0 -0
  46. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/lib/.keep +0 -0
  47. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/pagination.py +0 -0
  48. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/py.typed +0 -0
  49. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/resources/__init__.py +0 -0
  50. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/resources/chat/__init__.py +0 -0
  51. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/resources/chat/chat.py +0 -0
  52. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/resources/chat/completions.py +0 -0
  53. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/resources/completions.py +0 -0
  54. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/resources/dataset_items.py +0 -0
  55. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/resources/datasets.py +0 -0
  56. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/resources/evaluation_items.py +0 -0
  57. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/resources/evaluations.py +0 -0
  58. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/resources/files/__init__.py +0 -0
  59. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/resources/files/content.py +0 -0
  60. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/resources/files/files.py +0 -0
  61. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/resources/inference.py +0 -0
  62. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/resources/models.py +0 -0
  63. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/resources/spans.py +0 -0
  64. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/__init__.py +0 -0
  65. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/chat/__init__.py +0 -0
  66. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/chat/chat_completion.py +0 -0
  67. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/chat/chat_completion_chunk.py +0 -0
  68. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/chat/completion_create_params.py +0 -0
  69. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/chat/completion_create_response.py +0 -0
  70. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/completion.py +0 -0
  71. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/completion_create_params.py +0 -0
  72. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/dataset.py +0 -0
  73. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/dataset_create_params.py +0 -0
  74. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/dataset_delete_response.py +0 -0
  75. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/dataset_item.py +0 -0
  76. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/dataset_item_batch_create_params.py +0 -0
  77. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/dataset_item_batch_create_response.py +0 -0
  78. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/dataset_item_delete_response.py +0 -0
  79. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/dataset_item_list_params.py +0 -0
  80. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/dataset_item_retrieve_params.py +0 -0
  81. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/dataset_item_update_params.py +0 -0
  82. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/dataset_list_params.py +0 -0
  83. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/dataset_retrieve_params.py +0 -0
  84. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/dataset_update_params.py +0 -0
  85. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/evaluation.py +0 -0
  86. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/evaluation_archive_response.py +0 -0
  87. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/evaluation_create_params.py +0 -0
  88. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/evaluation_item.py +0 -0
  89. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/evaluation_item_list_params.py +0 -0
  90. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/evaluation_item_retrieve_params.py +0 -0
  91. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/evaluation_list_params.py +0 -0
  92. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/evaluation_retrieve_params.py +0 -0
  93. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/file.py +0 -0
  94. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/file_create_params.py +0 -0
  95. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/file_delete_response.py +0 -0
  96. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/file_list.py +0 -0
  97. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/file_list_params.py +0 -0
  98. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/file_update_params.py +0 -0
  99. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/files/__init__.py +0 -0
  100. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/inference_create_params.py +0 -0
  101. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/inference_create_response.py +0 -0
  102. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/inference_model.py +0 -0
  103. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/inference_model_list.py +0 -0
  104. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/inference_response.py +0 -0
  105. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/inference_response_chunk.py +0 -0
  106. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/model_create_params.py +0 -0
  107. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/model_delete_response.py +0 -0
  108. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/model_list_params.py +0 -0
  109. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/model_update_params.py +0 -0
  110. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/span.py +0 -0
  111. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/span_create_params.py +0 -0
  112. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/span_list_params.py +0 -0
  113. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/scale_gp_beta/types/span_update_params.py +0 -0
  114. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/src/sgp_dev/lib/.keep +0 -0
  115. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/__init__.py +0 -0
  116. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/api_resources/__init__.py +0 -0
  117. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/api_resources/chat/__init__.py +0 -0
  118. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/api_resources/chat/test_completions.py +0 -0
  119. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/api_resources/files/__init__.py +0 -0
  120. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/api_resources/files/test_content.py +0 -0
  121. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/api_resources/test_completions.py +0 -0
  122. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/api_resources/test_dataset_items.py +0 -0
  123. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/api_resources/test_datasets.py +0 -0
  124. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/api_resources/test_evaluation_items.py +0 -0
  125. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/api_resources/test_evaluations.py +0 -0
  126. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/api_resources/test_files.py +0 -0
  127. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/api_resources/test_inference.py +0 -0
  128. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/api_resources/test_models.py +0 -0
  129. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/api_resources/test_spans.py +0 -0
  130. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/conftest.py +0 -0
  131. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/sample_file.txt +0 -0
  132. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/test_client.py +0 -0
  133. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/test_deepcopy.py +0 -0
  134. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/test_extract_files.py +0 -0
  135. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/test_files.py +0 -0
  136. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/test_models.py +0 -0
  137. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/test_qs.py +0 -0
  138. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/test_required_args.py +0 -0
  139. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/test_response.py +0 -0
  140. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/test_streaming.py +0 -0
  141. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/test_transform.py +0 -0
  142. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/test_utils/test_proxy.py +0 -0
  143. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/test_utils/test_typing.py +0 -0
  144. {scale_gp_beta-0.1.0a11 → scale_gp_beta-0.1.0a12}/tests/utils.py +0 -0
@@ -0,0 +1,3 @@
1
+ {
2
+ ".": "0.1.0-alpha.12"
3
+ }
@@ -1,5 +1,13 @@
1
1
  # Changelog
2
2
 
3
+ ## 0.1.0-alpha.12 (2025-04-25)
4
+
5
+ Full Changelog: [v0.1.0-alpha.11...v0.1.0-alpha.12](https://github.com/scaleapi/sgp-python-beta/compare/v0.1.0-alpha.11...v0.1.0-alpha.12)
6
+
7
+ ### Features
8
+
9
+ * **api:** api update ([3cfce67](https://github.com/scaleapi/sgp-python-beta/commit/3cfce670301591436df98a53e816e806f2fd952e))
10
+
3
11
  ## 0.1.0-alpha.11 (2025-04-23)
4
12
 
5
13
  Full Changelog: [v0.1.0-alpha.10...v0.1.0-alpha.11](https://github.com/scaleapi/sgp-python-beta/compare/v0.1.0-alpha.10...v0.1.0-alpha.11)
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: scale-gp-beta
3
- Version: 0.1.0a11
3
+ Version: 0.1.0a12
4
4
  Summary: The official Python library for the Scale GP API
5
5
  Project-URL: Homepage, https://github.com/scaleapi/sgp-python-beta
6
6
  Project-URL: Repository, https://github.com/scaleapi/sgp-python-beta
@@ -1,6 +1,6 @@
1
1
  [project]
2
2
  name = "scale-gp-beta"
3
- version = "0.1.0-alpha.11"
3
+ version = "0.1.0-alpha.12"
4
4
  description = "The official Python library for the Scale GP API"
5
5
  dynamic = ["readme"]
6
6
  license = "Apache-2.0"
@@ -1,4 +1,4 @@
1
1
  # File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
2
2
 
3
3
  __title__ = "scale_gp_beta"
4
- __version__ = "0.1.0-alpha.11" # x-release-please-version
4
+ __version__ = "0.1.0-alpha.12" # x-release-please-version
@@ -21,6 +21,15 @@ __all__ = [
21
21
  "ApplicationVariantV1EvaluationTaskConfigurationOverridesAgenticApplicationOverrides",
22
22
  "ApplicationVariantV1EvaluationTaskConfigurationOverridesAgenticApplicationOverridesInitialState",
23
23
  "ApplicationVariantV1EvaluationTaskConfigurationOverridesAgenticApplicationOverridesPartialTrace",
24
+ "MetricEvaluationTask",
25
+ "MetricEvaluationTaskConfiguration",
26
+ "MetricEvaluationTaskConfigurationBleuScorerConfigWithItemLocator",
27
+ "MetricEvaluationTaskConfigurationMeteorScorerConfigWithItemLocator",
28
+ "MetricEvaluationTaskConfigurationCosineSimilarityScorerConfigWithItemLocator",
29
+ "MetricEvaluationTaskConfigurationF1ScorerConfigWithItemLocator",
30
+ "MetricEvaluationTaskConfigurationRougeScorer1ConfigWithItemLocator",
31
+ "MetricEvaluationTaskConfigurationRougeScorer2ConfigWithItemLocator",
32
+ "MetricEvaluationTaskConfigurationRougeScorerLConfigWithItemLocator",
24
33
  ]
25
34
 
26
35
 
@@ -199,7 +208,91 @@ class ApplicationVariantV1EvaluationTask(BaseModel):
199
208
  task_type: Optional[Literal["application_variant"]] = None
200
209
 
201
210
 
211
+ class MetricEvaluationTaskConfigurationBleuScorerConfigWithItemLocator(BaseModel):
212
+ candidate: str
213
+
214
+ reference: str
215
+
216
+ type: Literal["bleu"]
217
+
218
+
219
+ class MetricEvaluationTaskConfigurationMeteorScorerConfigWithItemLocator(BaseModel):
220
+ candidate: str
221
+
222
+ reference: str
223
+
224
+ type: Literal["meteor"]
225
+
226
+
227
+ class MetricEvaluationTaskConfigurationCosineSimilarityScorerConfigWithItemLocator(BaseModel):
228
+ candidate: str
229
+
230
+ reference: str
231
+
232
+ type: Literal["cosine_similarity"]
233
+
234
+
235
+ class MetricEvaluationTaskConfigurationF1ScorerConfigWithItemLocator(BaseModel):
236
+ candidate: str
237
+
238
+ reference: str
239
+
240
+ type: Literal["f1"]
241
+
242
+
243
+ class MetricEvaluationTaskConfigurationRougeScorer1ConfigWithItemLocator(BaseModel):
244
+ candidate: str
245
+
246
+ reference: str
247
+
248
+ type: Literal["rouge1"]
249
+
250
+
251
+ class MetricEvaluationTaskConfigurationRougeScorer2ConfigWithItemLocator(BaseModel):
252
+ candidate: str
253
+
254
+ reference: str
255
+
256
+ type: Literal["rouge2"]
257
+
258
+
259
+ class MetricEvaluationTaskConfigurationRougeScorerLConfigWithItemLocator(BaseModel):
260
+ candidate: str
261
+
262
+ reference: str
263
+
264
+ type: Literal["rougeL"]
265
+
266
+
267
+ MetricEvaluationTaskConfiguration: TypeAlias = Annotated[
268
+ Union[
269
+ MetricEvaluationTaskConfigurationBleuScorerConfigWithItemLocator,
270
+ MetricEvaluationTaskConfigurationMeteorScorerConfigWithItemLocator,
271
+ MetricEvaluationTaskConfigurationCosineSimilarityScorerConfigWithItemLocator,
272
+ MetricEvaluationTaskConfigurationF1ScorerConfigWithItemLocator,
273
+ MetricEvaluationTaskConfigurationRougeScorer1ConfigWithItemLocator,
274
+ MetricEvaluationTaskConfigurationRougeScorer2ConfigWithItemLocator,
275
+ MetricEvaluationTaskConfigurationRougeScorerLConfigWithItemLocator,
276
+ ],
277
+ PropertyInfo(discriminator="type"),
278
+ ]
279
+
280
+
281
+ class MetricEvaluationTask(BaseModel):
282
+ configuration: MetricEvaluationTaskConfiguration
283
+
284
+ alias: Optional[str] = None
285
+ """Alias to title the results column. Defaults to the `task_type`"""
286
+
287
+ task_type: Optional[Literal["metric"]] = None
288
+
289
+
202
290
  EvaluationTask: TypeAlias = Annotated[
203
- Union[ChatCompletionEvaluationTask, GenericInferenceEvaluationTask, ApplicationVariantV1EvaluationTask],
291
+ Union[
292
+ ChatCompletionEvaluationTask,
293
+ GenericInferenceEvaluationTask,
294
+ ApplicationVariantV1EvaluationTask,
295
+ MetricEvaluationTask,
296
+ ],
204
297
  PropertyInfo(discriminator="task_type"),
205
298
  ]
@@ -20,6 +20,15 @@ __all__ = [
20
20
  "ApplicationVariantV1EvaluationTaskConfigurationOverridesAgenticApplicationOverrides",
21
21
  "ApplicationVariantV1EvaluationTaskConfigurationOverridesAgenticApplicationOverridesInitialState",
22
22
  "ApplicationVariantV1EvaluationTaskConfigurationOverridesAgenticApplicationOverridesPartialTrace",
23
+ "MetricEvaluationTask",
24
+ "MetricEvaluationTaskConfiguration",
25
+ "MetricEvaluationTaskConfigurationBleuScorerConfigWithItemLocator",
26
+ "MetricEvaluationTaskConfigurationMeteorScorerConfigWithItemLocator",
27
+ "MetricEvaluationTaskConfigurationCosineSimilarityScorerConfigWithItemLocator",
28
+ "MetricEvaluationTaskConfigurationF1ScorerConfigWithItemLocator",
29
+ "MetricEvaluationTaskConfigurationRougeScorer1ConfigWithItemLocator",
30
+ "MetricEvaluationTaskConfigurationRougeScorer2ConfigWithItemLocator",
31
+ "MetricEvaluationTaskConfigurationRougeScorerLConfigWithItemLocator",
23
32
  ]
24
33
 
25
34
 
@@ -201,6 +210,85 @@ class ApplicationVariantV1EvaluationTask(TypedDict, total=False):
201
210
  task_type: Literal["application_variant"]
202
211
 
203
212
 
213
+ class MetricEvaluationTaskConfigurationBleuScorerConfigWithItemLocator(TypedDict, total=False):
214
+ candidate: Required[str]
215
+
216
+ reference: Required[str]
217
+
218
+ type: Required[Literal["bleu"]]
219
+
220
+
221
+ class MetricEvaluationTaskConfigurationMeteorScorerConfigWithItemLocator(TypedDict, total=False):
222
+ candidate: Required[str]
223
+
224
+ reference: Required[str]
225
+
226
+ type: Required[Literal["meteor"]]
227
+
228
+
229
+ class MetricEvaluationTaskConfigurationCosineSimilarityScorerConfigWithItemLocator(TypedDict, total=False):
230
+ candidate: Required[str]
231
+
232
+ reference: Required[str]
233
+
234
+ type: Required[Literal["cosine_similarity"]]
235
+
236
+
237
+ class MetricEvaluationTaskConfigurationF1ScorerConfigWithItemLocator(TypedDict, total=False):
238
+ candidate: Required[str]
239
+
240
+ reference: Required[str]
241
+
242
+ type: Required[Literal["f1"]]
243
+
244
+
245
+ class MetricEvaluationTaskConfigurationRougeScorer1ConfigWithItemLocator(TypedDict, total=False):
246
+ candidate: Required[str]
247
+
248
+ reference: Required[str]
249
+
250
+ type: Required[Literal["rouge1"]]
251
+
252
+
253
+ class MetricEvaluationTaskConfigurationRougeScorer2ConfigWithItemLocator(TypedDict, total=False):
254
+ candidate: Required[str]
255
+
256
+ reference: Required[str]
257
+
258
+ type: Required[Literal["rouge2"]]
259
+
260
+
261
+ class MetricEvaluationTaskConfigurationRougeScorerLConfigWithItemLocator(TypedDict, total=False):
262
+ candidate: Required[str]
263
+
264
+ reference: Required[str]
265
+
266
+ type: Required[Literal["rougeL"]]
267
+
268
+
269
+ MetricEvaluationTaskConfiguration: TypeAlias = Union[
270
+ MetricEvaluationTaskConfigurationBleuScorerConfigWithItemLocator,
271
+ MetricEvaluationTaskConfigurationMeteorScorerConfigWithItemLocator,
272
+ MetricEvaluationTaskConfigurationCosineSimilarityScorerConfigWithItemLocator,
273
+ MetricEvaluationTaskConfigurationF1ScorerConfigWithItemLocator,
274
+ MetricEvaluationTaskConfigurationRougeScorer1ConfigWithItemLocator,
275
+ MetricEvaluationTaskConfigurationRougeScorer2ConfigWithItemLocator,
276
+ MetricEvaluationTaskConfigurationRougeScorerLConfigWithItemLocator,
277
+ ]
278
+
279
+
280
+ class MetricEvaluationTask(TypedDict, total=False):
281
+ configuration: Required[MetricEvaluationTaskConfiguration]
282
+
283
+ alias: str
284
+ """Alias to title the results column. Defaults to the `task_type`"""
285
+
286
+ task_type: Literal["metric"]
287
+
288
+
204
289
  EvaluationTaskParam: TypeAlias = Union[
205
- ChatCompletionEvaluationTask, GenericInferenceEvaluationTask, ApplicationVariantV1EvaluationTask
290
+ ChatCompletionEvaluationTask,
291
+ GenericInferenceEvaluationTask,
292
+ ApplicationVariantV1EvaluationTask,
293
+ MetricEvaluationTask,
206
294
  ]
@@ -1,3 +0,0 @@
1
- {
2
- ".": "0.1.0-alpha.11"
3
- }