azure-ai-evaluation 1.7.0__py3-none-any.whl → 1.9.0__py3-none-any.whl

This diff shows the changes between two publicly available versions of a package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents exactly as they appear in their respective public registries.
Files changed (136)
  1. azure/ai/evaluation/__init__.py +13 -2
  2. azure/ai/evaluation/_aoai/__init__.py +1 -1
  3. azure/ai/evaluation/_aoai/aoai_grader.py +21 -11
  4. azure/ai/evaluation/_aoai/label_grader.py +3 -2
  5. azure/ai/evaluation/_aoai/score_model_grader.py +90 -0
  6. azure/ai/evaluation/_aoai/string_check_grader.py +3 -2
  7. azure/ai/evaluation/_aoai/text_similarity_grader.py +3 -2
  8. azure/ai/evaluation/_azure/_envs.py +9 -10
  9. azure/ai/evaluation/_azure/_token_manager.py +7 -1
  10. azure/ai/evaluation/_common/constants.py +11 -2
  11. azure/ai/evaluation/_common/evaluation_onedp_client.py +32 -26
  12. azure/ai/evaluation/_common/onedp/__init__.py +32 -32
  13. azure/ai/evaluation/_common/onedp/_client.py +136 -139
  14. azure/ai/evaluation/_common/onedp/_configuration.py +70 -73
  15. azure/ai/evaluation/_common/onedp/_patch.py +21 -21
  16. azure/ai/evaluation/_common/onedp/_utils/__init__.py +6 -0
  17. azure/ai/evaluation/_common/onedp/_utils/model_base.py +1232 -0
  18. azure/ai/evaluation/_common/onedp/_utils/serialization.py +2032 -0
  19. azure/ai/evaluation/_common/onedp/_validation.py +50 -50
  20. azure/ai/evaluation/_common/onedp/_version.py +9 -9
  21. azure/ai/evaluation/_common/onedp/aio/__init__.py +29 -29
  22. azure/ai/evaluation/_common/onedp/aio/_client.py +138 -143
  23. azure/ai/evaluation/_common/onedp/aio/_configuration.py +70 -75
  24. azure/ai/evaluation/_common/onedp/aio/_patch.py +21 -21
  25. azure/ai/evaluation/_common/onedp/aio/operations/__init__.py +37 -39
  26. azure/ai/evaluation/_common/onedp/aio/operations/_operations.py +4832 -4494
  27. azure/ai/evaluation/_common/onedp/aio/operations/_patch.py +21 -21
  28. azure/ai/evaluation/_common/onedp/models/__init__.py +168 -142
  29. azure/ai/evaluation/_common/onedp/models/_enums.py +230 -162
  30. azure/ai/evaluation/_common/onedp/models/_models.py +2685 -2228
  31. azure/ai/evaluation/_common/onedp/models/_patch.py +21 -21
  32. azure/ai/evaluation/_common/onedp/operations/__init__.py +37 -39
  33. azure/ai/evaluation/_common/onedp/operations/_operations.py +6106 -5655
  34. azure/ai/evaluation/_common/onedp/operations/_patch.py +21 -21
  35. azure/ai/evaluation/_common/rai_service.py +86 -50
  36. azure/ai/evaluation/_common/raiclient/__init__.py +1 -1
  37. azure/ai/evaluation/_common/raiclient/operations/_operations.py +14 -1
  38. azure/ai/evaluation/_common/utils.py +124 -3
  39. azure/ai/evaluation/_constants.py +2 -1
  40. azure/ai/evaluation/_converters/__init__.py +1 -1
  41. azure/ai/evaluation/_converters/_ai_services.py +9 -8
  42. azure/ai/evaluation/_converters/_models.py +46 -0
  43. azure/ai/evaluation/_converters/_sk_services.py +495 -0
  44. azure/ai/evaluation/_eval_mapping.py +2 -2
  45. azure/ai/evaluation/_evaluate/_batch_run/_run_submitter_client.py +4 -4
  46. azure/ai/evaluation/_evaluate/_batch_run/eval_run_context.py +2 -2
  47. azure/ai/evaluation/_evaluate/_evaluate.py +64 -58
  48. azure/ai/evaluation/_evaluate/_evaluate_aoai.py +130 -89
  49. azure/ai/evaluation/_evaluate/_telemetry/__init__.py +0 -1
  50. azure/ai/evaluation/_evaluate/_utils.py +24 -15
  51. azure/ai/evaluation/_evaluators/_bleu/_bleu.py +3 -3
  52. azure/ai/evaluation/_evaluators/_code_vulnerability/_code_vulnerability.py +12 -11
  53. azure/ai/evaluation/_evaluators/_coherence/_coherence.py +5 -5
  54. azure/ai/evaluation/_evaluators/_common/_base_eval.py +15 -5
  55. azure/ai/evaluation/_evaluators/_common/_base_prompty_eval.py +24 -9
  56. azure/ai/evaluation/_evaluators/_common/_base_rai_svc_eval.py +6 -1
  57. azure/ai/evaluation/_evaluators/_content_safety/_content_safety.py +13 -13
  58. azure/ai/evaluation/_evaluators/_content_safety/_hate_unfairness.py +7 -7
  59. azure/ai/evaluation/_evaluators/_content_safety/_self_harm.py +7 -7
  60. azure/ai/evaluation/_evaluators/_content_safety/_sexual.py +7 -7
  61. azure/ai/evaluation/_evaluators/_content_safety/_violence.py +6 -6
  62. azure/ai/evaluation/_evaluators/_document_retrieval/__init__.py +1 -5
  63. azure/ai/evaluation/_evaluators/_document_retrieval/_document_retrieval.py +34 -64
  64. azure/ai/evaluation/_evaluators/_eci/_eci.py +3 -3
  65. azure/ai/evaluation/_evaluators/_f1_score/_f1_score.py +4 -4
  66. azure/ai/evaluation/_evaluators/_fluency/_fluency.py +2 -2
  67. azure/ai/evaluation/_evaluators/_gleu/_gleu.py +3 -3
  68. azure/ai/evaluation/_evaluators/_groundedness/_groundedness.py +11 -7
  69. azure/ai/evaluation/_evaluators/_intent_resolution/_intent_resolution.py +30 -25
  70. azure/ai/evaluation/_evaluators/_intent_resolution/intent_resolution.prompty +210 -96
  71. azure/ai/evaluation/_evaluators/_meteor/_meteor.py +2 -3
  72. azure/ai/evaluation/_evaluators/_protected_material/_protected_material.py +6 -6
  73. azure/ai/evaluation/_evaluators/_qa/_qa.py +4 -4
  74. azure/ai/evaluation/_evaluators/_relevance/_relevance.py +8 -13
  75. azure/ai/evaluation/_evaluators/_response_completeness/_response_completeness.py +20 -25
  76. azure/ai/evaluation/_evaluators/_retrieval/_retrieval.py +4 -4
  77. azure/ai/evaluation/_evaluators/_rouge/_rouge.py +25 -25
  78. azure/ai/evaluation/_evaluators/_service_groundedness/_service_groundedness.py +5 -5
  79. azure/ai/evaluation/_evaluators/_similarity/_similarity.py +3 -3
  80. azure/ai/evaluation/_evaluators/_task_adherence/_task_adherence.py +11 -14
  81. azure/ai/evaluation/_evaluators/_tool_call_accuracy/_tool_call_accuracy.py +43 -34
  82. azure/ai/evaluation/_evaluators/_tool_call_accuracy/tool_call_accuracy.prompty +3 -3
  83. azure/ai/evaluation/_evaluators/_ungrounded_attributes/_ungrounded_attributes.py +12 -11
  84. azure/ai/evaluation/_evaluators/_xpia/xpia.py +6 -6
  85. azure/ai/evaluation/_exceptions.py +10 -0
  86. azure/ai/evaluation/_http_utils.py +3 -3
  87. azure/ai/evaluation/_legacy/_batch_engine/_engine.py +3 -3
  88. azure/ai/evaluation/_legacy/_batch_engine/_openai_injector.py +5 -2
  89. azure/ai/evaluation/_legacy/_batch_engine/_run_submitter.py +5 -10
  90. azure/ai/evaluation/_legacy/_batch_engine/_utils.py +1 -4
  91. azure/ai/evaluation/_legacy/_common/_async_token_provider.py +12 -19
  92. azure/ai/evaluation/_legacy/_common/_thread_pool_executor_with_context.py +2 -0
  93. azure/ai/evaluation/_legacy/prompty/_prompty.py +11 -5
  94. azure/ai/evaluation/_safety_evaluation/__init__.py +1 -1
  95. azure/ai/evaluation/_safety_evaluation/_safety_evaluation.py +193 -111
  96. azure/ai/evaluation/_user_agent.py +32 -1
  97. azure/ai/evaluation/_version.py +1 -1
  98. azure/ai/evaluation/red_team/__init__.py +3 -1
  99. azure/ai/evaluation/red_team/_agent/__init__.py +3 -0
  100. azure/ai/evaluation/red_team/_agent/_agent_functions.py +261 -0
  101. azure/ai/evaluation/red_team/_agent/_agent_tools.py +461 -0
  102. azure/ai/evaluation/red_team/_agent/_agent_utils.py +89 -0
  103. azure/ai/evaluation/red_team/_agent/_semantic_kernel_plugin.py +228 -0
  104. azure/ai/evaluation/red_team/_attack_objective_generator.py +94 -52
  105. azure/ai/evaluation/red_team/_attack_strategy.py +4 -1
  106. azure/ai/evaluation/red_team/_callback_chat_target.py +4 -9
  107. azure/ai/evaluation/red_team/_default_converter.py +1 -1
  108. azure/ai/evaluation/red_team/_red_team.py +1622 -765
  109. azure/ai/evaluation/red_team/_red_team_result.py +43 -38
  110. azure/ai/evaluation/red_team/_utils/__init__.py +1 -1
  111. azure/ai/evaluation/red_team/_utils/_rai_service_eval_chat_target.py +121 -0
  112. azure/ai/evaluation/red_team/_utils/_rai_service_target.py +595 -0
  113. azure/ai/evaluation/red_team/_utils/_rai_service_true_false_scorer.py +108 -0
  114. azure/ai/evaluation/red_team/_utils/constants.py +6 -12
  115. azure/ai/evaluation/red_team/_utils/formatting_utils.py +41 -44
  116. azure/ai/evaluation/red_team/_utils/logging_utils.py +17 -17
  117. azure/ai/evaluation/red_team/_utils/metric_mapping.py +33 -6
  118. azure/ai/evaluation/red_team/_utils/strategy_utils.py +35 -25
  119. azure/ai/evaluation/simulator/_adversarial_scenario.py +2 -0
  120. azure/ai/evaluation/simulator/_adversarial_simulator.py +34 -16
  121. azure/ai/evaluation/simulator/_conversation/__init__.py +2 -2
  122. azure/ai/evaluation/simulator/_direct_attack_simulator.py +8 -8
  123. azure/ai/evaluation/simulator/_indirect_attack_simulator.py +5 -5
  124. azure/ai/evaluation/simulator/_model_tools/_generated_rai_client.py +54 -23
  125. azure/ai/evaluation/simulator/_model_tools/_identity_manager.py +7 -1
  126. azure/ai/evaluation/simulator/_model_tools/_proxy_completion_model.py +25 -15
  127. azure/ai/evaluation/simulator/_model_tools/_rai_client.py +19 -31
  128. azure/ai/evaluation/simulator/_model_tools/_template_handler.py +20 -6
  129. azure/ai/evaluation/simulator/_model_tools/models.py +1 -1
  130. azure/ai/evaluation/simulator/_simulator.py +9 -8
  131. {azure_ai_evaluation-1.7.0.dist-info → azure_ai_evaluation-1.9.0.dist-info}/METADATA +24 -1
  132. {azure_ai_evaluation-1.7.0.dist-info → azure_ai_evaluation-1.9.0.dist-info}/RECORD +135 -123
  133. azure/ai/evaluation/_common/onedp/aio/_vendor.py +0 -40
  134. {azure_ai_evaluation-1.7.0.dist-info → azure_ai_evaluation-1.9.0.dist-info}/NOTICE.txt +0 -0
  135. {azure_ai_evaluation-1.7.0.dist-info → azure_ai_evaluation-1.9.0.dist-info}/WHEEL +0 -0
  136. {azure_ai_evaluation-1.7.0.dist-info → azure_ai_evaluation-1.9.0.dist-info}/top_level.txt +0 -0
@@ -1,21 +1,21 @@
1
- # coding=utf-8
2
- # --------------------------------------------------------------------------
3
- # Copyright (c) Microsoft Corporation. All rights reserved.
4
- # Licensed under the MIT License. See License.txt in the project root for license information.
5
- # --------------------------------------------------------------------------
6
- """Customize generated code here.
7
-
8
- Follow our quickstart for examples: https://aka.ms/azsdk/python/dpcodegen/python/customize
9
- """
10
- from typing import List
11
-
12
- __all__: List[str] = [] # Add all objects you want publicly available to users at this package level
13
-
14
-
15
- def patch_sdk():
16
- """Do not remove from this file.
17
-
18
- `patch_sdk` is a last resort escape hatch that allows you to do customizations
19
- you can't accomplish using the techniques described in
20
- https://aka.ms/azsdk/python/dpcodegen/python/customize
21
- """
1
+ # coding=utf-8
2
+ # --------------------------------------------------------------------------
3
+ # Copyright (c) Microsoft Corporation. All rights reserved.
4
+ # Licensed under the MIT License. See License.txt in the project root for license information.
5
+ # --------------------------------------------------------------------------
6
+ """Customize generated code here.
7
+
8
+ Follow our quickstart for examples: https://aka.ms/azsdk/python/dpcodegen/python/customize
9
+ """
10
+ from typing import List
11
+
12
+ __all__: List[str] = [] # Add all objects you want publicly available to users at this package level
13
+
14
+
15
+ def patch_sdk():
16
+ """Do not remove from this file.
17
+
18
+ `patch_sdk` is a last resort escape hatch that allows you to do customizations
19
+ you can't accomplish using the techniques described in
20
+ https://aka.ms/azsdk/python/dpcodegen/python/customize
21
+ """
@@ -1,142 +1,168 @@
1
- # coding=utf-8
2
- # --------------------------------------------------------------------------
3
- # Copyright (c) Microsoft Corporation. All rights reserved.
4
- # Licensed under the MIT License. See License.txt in the project root for license information.
5
- # Code generated by Microsoft (R) Python Code Generator.
6
- # Changes may cause incorrect behavior and will be lost if the code is regenerated.
7
- # --------------------------------------------------------------------------
8
- # pylint: disable=wrong-import-position
9
-
10
- from typing import TYPE_CHECKING
11
-
12
- if TYPE_CHECKING:
13
- from ._patch import * # pylint: disable=unused-wildcard-import
14
-
15
-
16
- from ._models import ( # type: ignore
17
- AOAIModelConfig,
18
- AnnotationDTO,
19
- ApiKeyCredentials,
20
- AssetCredentialRequest,
21
- AssetCredentialResponse,
22
- AttackObjective,
23
- AzureAISearchIndex,
24
- BaseCredentials,
25
- BlobReferenceForConsumption,
26
- Connection,
27
- Content,
28
- CosmosDBIndex,
29
- CustomCredential,
30
- CustomizationParameters,
31
- DatasetVersion,
32
- Deployment,
33
- EmbeddingConfiguration,
34
- EntraIDCredentials,
35
- Evaluation,
36
- EvaluationResult,
37
- EvaluationTarget,
38
- EvaluationUpload,
39
- EvaluatorConfiguration,
40
- FileDatasetVersion,
41
- FolderDatasetVersion,
42
- Index,
43
- InputData,
44
- InputDataset,
45
- LongRunningResponse,
46
- MAASModelConfig,
47
- ManagedAzureAISearchIndex,
48
- Message,
49
- Metadata,
50
- ModelDeployment,
51
- NoAuthenticationCredentials,
52
- PendingUploadRequest,
53
- PendingUploadResponse,
54
- RedTeam,
55
- RedTeamUpload,
56
- SASCredentials,
57
- SasCredential,
58
- SimulationDTO,
59
- Sku,
60
- SystemData,
61
- TargetHarm,
62
- TargetModelConfig,
63
- )
64
-
65
- from ._enums import ( # type: ignore
66
- AttackStrategy,
67
- ConnectionType,
68
- CredentialType,
69
- DatasetType,
70
- DeploymentType,
71
- IndexType,
72
- ListViewType,
73
- PendingUploadType,
74
- ResultType,
75
- RiskCategory,
76
- SimulationType,
77
- )
78
- from ._patch import __all__ as _patch_all
79
- from ._patch import *
80
- from ._patch import patch_sdk as _patch_sdk
81
-
82
- __all__ = [
83
- "AOAIModelConfig",
84
- "AnnotationDTO",
85
- "ApiKeyCredentials",
86
- "AssetCredentialRequest",
87
- "AssetCredentialResponse",
88
- "AttackObjective",
89
- "AzureAISearchIndex",
90
- "BaseCredentials",
91
- "BlobReferenceForConsumption",
92
- "Connection",
93
- "Content",
94
- "CosmosDBIndex",
95
- "CustomCredential",
96
- "CustomizationParameters",
97
- "DatasetVersion",
98
- "Deployment",
99
- "EmbeddingConfiguration",
100
- "EntraIDCredentials",
101
- "Evaluation",
102
- "EvaluationResult",
103
- "EvaluationTarget",
104
- "EvaluationUpload",
105
- "EvaluatorConfiguration",
106
- "FileDatasetVersion",
107
- "FolderDatasetVersion",
108
- "Index",
109
- "InputData",
110
- "InputDataset",
111
- "LongRunningResponse",
112
- "MAASModelConfig",
113
- "ManagedAzureAISearchIndex",
114
- "Message",
115
- "Metadata",
116
- "ModelDeployment",
117
- "NoAuthenticationCredentials",
118
- "PendingUploadRequest",
119
- "PendingUploadResponse",
120
- "RedTeam",
121
- "RedTeamUpload",
122
- "SASCredentials",
123
- "SasCredential",
124
- "SimulationDTO",
125
- "Sku",
126
- "SystemData",
127
- "TargetHarm",
128
- "TargetModelConfig",
129
- "AttackStrategy",
130
- "ConnectionType",
131
- "CredentialType",
132
- "DatasetType",
133
- "DeploymentType",
134
- "IndexType",
135
- "ListViewType",
136
- "PendingUploadType",
137
- "ResultType",
138
- "RiskCategory",
139
- "SimulationType",
140
- ]
141
- __all__.extend([p for p in _patch_all if p not in __all__]) # pyright: ignore
142
- _patch_sdk()
1
+ # coding=utf-8
2
+ # --------------------------------------------------------------------------
3
+ # Copyright (c) Microsoft Corporation. All rights reserved.
4
+ # Licensed under the MIT License. See License.txt in the project root for license information.
5
+ # Code generated by Microsoft (R) Python Code Generator.
6
+ # Changes may cause incorrect behavior and will be lost if the code is regenerated.
7
+ # --------------------------------------------------------------------------
8
+ # pylint: disable=wrong-import-position
9
+
10
+ from typing import TYPE_CHECKING
11
+
12
+ if TYPE_CHECKING:
13
+ from ._patch import * # pylint: disable=unused-wildcard-import
14
+
15
+
16
+ from ._models import ( # type: ignore
17
+ AOAIModelConfig,
18
+ AgentEvaluation,
19
+ AgentEvaluationRedactionConfiguration,
20
+ AgentEvaluationRequest,
21
+ AgentEvaluationResult,
22
+ AgentEvaluationSamplingConfiguration,
23
+ AnnotationDTO,
24
+ ApiKeyCredentials,
25
+ AssetCredentialRequest,
26
+ AssetCredentialResponse,
27
+ AttackObjective,
28
+ AzureAISearchIndex,
29
+ BaseCredentials,
30
+ BlobReferenceForConsumption,
31
+ ChatChoice,
32
+ ChatCompletions,
33
+ ChatResponseMessage,
34
+ CompletionsUsage,
35
+ CompletionsUsageDetails,
36
+ Connection,
37
+ Content,
38
+ CosmosDBIndex,
39
+ CustomCredential,
40
+ CustomizationParameters,
41
+ DatasetVersion,
42
+ Deployment,
43
+ EmbeddingConfiguration,
44
+ EntraIDCredentials,
45
+ Evaluation,
46
+ EvaluationResult,
47
+ EvaluationTarget,
48
+ EvaluationUpload,
49
+ EvaluatorConfiguration,
50
+ FileDatasetVersion,
51
+ FolderDatasetVersion,
52
+ Index,
53
+ InputData,
54
+ InputDataset,
55
+ LongRunningResponse,
56
+ MAASModelConfig,
57
+ ManagedAzureAISearchIndex,
58
+ Message,
59
+ Metadata,
60
+ ModelDeployment,
61
+ NoAuthenticationCredentials,
62
+ PendingUploadRequest,
63
+ PendingUploadResponse,
64
+ PromptUsageDetails,
65
+ RedTeam,
66
+ RedTeamUpload,
67
+ SASCredentials,
68
+ SasCredential,
69
+ SimulationDTO,
70
+ Sku,
71
+ SystemData,
72
+ TargetHarm,
73
+ TargetModelConfig,
74
+ )
75
+
76
+ from ._enums import ( # type: ignore
77
+ AttackStrategy,
78
+ ChatRole,
79
+ CompletionsFinishReason,
80
+ ConnectionType,
81
+ CredentialType,
82
+ DatasetType,
83
+ DeploymentType,
84
+ IndexType,
85
+ ListViewType,
86
+ PendingUploadType,
87
+ ResultType,
88
+ RiskCategory,
89
+ SimulationType,
90
+ )
91
+ from ._patch import __all__ as _patch_all
92
+ from ._patch import *
93
+ from ._patch import patch_sdk as _patch_sdk
94
+
95
+ __all__ = [
96
+ "AOAIModelConfig",
97
+ "AgentEvaluation",
98
+ "AgentEvaluationRedactionConfiguration",
99
+ "AgentEvaluationRequest",
100
+ "AgentEvaluationResult",
101
+ "AgentEvaluationSamplingConfiguration",
102
+ "AnnotationDTO",
103
+ "ApiKeyCredentials",
104
+ "AssetCredentialRequest",
105
+ "AssetCredentialResponse",
106
+ "AttackObjective",
107
+ "AzureAISearchIndex",
108
+ "BaseCredentials",
109
+ "BlobReferenceForConsumption",
110
+ "ChatChoice",
111
+ "ChatCompletions",
112
+ "ChatResponseMessage",
113
+ "CompletionsUsage",
114
+ "CompletionsUsageDetails",
115
+ "Connection",
116
+ "Content",
117
+ "CosmosDBIndex",
118
+ "CustomCredential",
119
+ "CustomizationParameters",
120
+ "DatasetVersion",
121
+ "Deployment",
122
+ "EmbeddingConfiguration",
123
+ "EntraIDCredentials",
124
+ "Evaluation",
125
+ "EvaluationResult",
126
+ "EvaluationTarget",
127
+ "EvaluationUpload",
128
+ "EvaluatorConfiguration",
129
+ "FileDatasetVersion",
130
+ "FolderDatasetVersion",
131
+ "Index",
132
+ "InputData",
133
+ "InputDataset",
134
+ "LongRunningResponse",
135
+ "MAASModelConfig",
136
+ "ManagedAzureAISearchIndex",
137
+ "Message",
138
+ "Metadata",
139
+ "ModelDeployment",
140
+ "NoAuthenticationCredentials",
141
+ "PendingUploadRequest",
142
+ "PendingUploadResponse",
143
+ "PromptUsageDetails",
144
+ "RedTeam",
145
+ "RedTeamUpload",
146
+ "SASCredentials",
147
+ "SasCredential",
148
+ "SimulationDTO",
149
+ "Sku",
150
+ "SystemData",
151
+ "TargetHarm",
152
+ "TargetModelConfig",
153
+ "AttackStrategy",
154
+ "ChatRole",
155
+ "CompletionsFinishReason",
156
+ "ConnectionType",
157
+ "CredentialType",
158
+ "DatasetType",
159
+ "DeploymentType",
160
+ "IndexType",
161
+ "ListViewType",
162
+ "PendingUploadType",
163
+ "ResultType",
164
+ "RiskCategory",
165
+ "SimulationType",
166
+ ]
167
+ __all__.extend([p for p in _patch_all if p not in __all__]) # pyright: ignore
168
+ _patch_sdk()