azure-ai-evaluation 1.9.0__py3-none-any.whl → 1.10.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of azure-ai-evaluation might be problematic. Click here for more details.
- azure/ai/evaluation/__init__.py +46 -12
- azure/ai/evaluation/_aoai/python_grader.py +84 -0
- azure/ai/evaluation/_aoai/score_model_grader.py +1 -0
- azure/ai/evaluation/_common/rai_service.py +3 -3
- azure/ai/evaluation/_common/utils.py +74 -17
- azure/ai/evaluation/_evaluate/_batch_run/_run_submitter_client.py +70 -22
- azure/ai/evaluation/_evaluate/_evaluate.py +150 -40
- azure/ai/evaluation/_evaluate/_evaluate_aoai.py +2 -0
- azure/ai/evaluation/_evaluate/_utils.py +1 -2
- azure/ai/evaluation/_evaluators/_bleu/_bleu.py +1 -1
- azure/ai/evaluation/_evaluators/_code_vulnerability/_code_vulnerability.py +8 -1
- azure/ai/evaluation/_evaluators/_coherence/_coherence.py +1 -1
- azure/ai/evaluation/_evaluators/_common/_base_eval.py +30 -6
- azure/ai/evaluation/_evaluators/_common/_base_rai_svc_eval.py +18 -8
- azure/ai/evaluation/_evaluators/_content_safety/_content_safety.py +15 -5
- azure/ai/evaluation/_evaluators/_content_safety/_hate_unfairness.py +4 -1
- azure/ai/evaluation/_evaluators/_content_safety/_self_harm.py +4 -1
- azure/ai/evaluation/_evaluators/_content_safety/_sexual.py +5 -2
- azure/ai/evaluation/_evaluators/_content_safety/_violence.py +4 -1
- azure/ai/evaluation/_evaluators/_document_retrieval/_document_retrieval.py +3 -0
- azure/ai/evaluation/_evaluators/_eci/_eci.py +3 -0
- azure/ai/evaluation/_evaluators/_f1_score/_f1_score.py +1 -1
- azure/ai/evaluation/_evaluators/_fluency/_fluency.py +1 -1
- azure/ai/evaluation/_evaluators/_gleu/_gleu.py +1 -1
- azure/ai/evaluation/_evaluators/_groundedness/_groundedness.py +1 -1
- azure/ai/evaluation/_evaluators/_intent_resolution/_intent_resolution.py +1 -1
- azure/ai/evaluation/_evaluators/_meteor/_meteor.py +1 -1
- azure/ai/evaluation/_evaluators/_protected_material/_protected_material.py +8 -1
- azure/ai/evaluation/_evaluators/_qa/_qa.py +1 -1
- azure/ai/evaluation/_evaluators/_relevance/_relevance.py +54 -2
- azure/ai/evaluation/_evaluators/_relevance/relevance.prompty +140 -59
- azure/ai/evaluation/_evaluators/_response_completeness/_response_completeness.py +1 -1
- azure/ai/evaluation/_evaluators/_retrieval/_retrieval.py +1 -1
- azure/ai/evaluation/_evaluators/_rouge/_rouge.py +1 -1
- azure/ai/evaluation/_evaluators/_service_groundedness/_service_groundedness.py +2 -1
- azure/ai/evaluation/_evaluators/_similarity/_similarity.py +1 -1
- azure/ai/evaluation/_evaluators/_task_adherence/_task_adherence.py +16 -10
- azure/ai/evaluation/_evaluators/_task_adherence/task_adherence.prompty +354 -66
- azure/ai/evaluation/_evaluators/_tool_call_accuracy/_tool_call_accuracy.py +169 -186
- azure/ai/evaluation/_evaluators/_tool_call_accuracy/tool_call_accuracy.prompty +101 -23
- azure/ai/evaluation/_evaluators/_ungrounded_attributes/_ungrounded_attributes.py +8 -1
- azure/ai/evaluation/_evaluators/_xpia/xpia.py +4 -1
- azure/ai/evaluation/_legacy/_batch_engine/_config.py +6 -3
- azure/ai/evaluation/_legacy/_batch_engine/_engine.py +115 -30
- azure/ai/evaluation/_legacy/_batch_engine/_result.py +2 -0
- azure/ai/evaluation/_legacy/_batch_engine/_run.py +2 -2
- azure/ai/evaluation/_legacy/_batch_engine/_run_submitter.py +28 -31
- azure/ai/evaluation/_safety_evaluation/_safety_evaluation.py +2 -0
- azure/ai/evaluation/_version.py +1 -1
- azure/ai/evaluation/red_team/__init__.py +2 -2
- azure/ai/evaluation/red_team/_red_team.py +838 -478
- azure/ai/evaluation/red_team/_red_team_result.py +6 -0
- azure/ai/evaluation/red_team/_utils/_rai_service_eval_chat_target.py +8 -3
- azure/ai/evaluation/red_team/_utils/constants.py +0 -2
- azure/ai/evaluation/simulator/_adversarial_simulator.py +5 -2
- azure/ai/evaluation/simulator/_indirect_attack_simulator.py +13 -1
- azure/ai/evaluation/simulator/_model_tools/_generated_rai_client.py +2 -2
- azure/ai/evaluation/simulator/_model_tools/_proxy_completion_model.py +20 -2
- azure/ai/evaluation/simulator/_simulator.py +12 -0
- {azure_ai_evaluation-1.9.0.dist-info → azure_ai_evaluation-1.10.0.dist-info}/METADATA +32 -3
- {azure_ai_evaluation-1.9.0.dist-info → azure_ai_evaluation-1.10.0.dist-info}/RECORD +64 -63
- {azure_ai_evaluation-1.9.0.dist-info → azure_ai_evaluation-1.10.0.dist-info}/NOTICE.txt +0 -0
- {azure_ai_evaluation-1.9.0.dist-info → azure_ai_evaluation-1.10.0.dist-info}/WHEEL +0 -0
- {azure_ai_evaluation-1.9.0.dist-info → azure_ai_evaluation-1.10.0.dist-info}/top_level.txt +0 -0
|
@@ -185,11 +185,14 @@ class RedTeamingParameters(TypedDict):
|
|
|
185
185
|
:type attack_complexity: List[str]
|
|
186
186
|
:param techniques_used: Dictionary mapping complexity levels to lists of converter techniques used
|
|
187
187
|
:type techniques_used: Dict[str, List[str]]
|
|
188
|
+
:param attack_success_thresholds: Thresholds used for determining attack success per risk category
|
|
189
|
+
:type attack_success_thresholds: Dict[str, Dict[str, int]]
|
|
188
190
|
"""
|
|
189
191
|
|
|
190
192
|
attack_objective_generated_from: AttackObjectiveSource
|
|
191
193
|
attack_complexity: List[str]
|
|
192
194
|
techniques_used: Dict[str, List[str]]
|
|
195
|
+
attack_success_thresholds: Dict[str, Dict[str, int]]
|
|
193
196
|
|
|
194
197
|
|
|
195
198
|
@experimental
|
|
@@ -228,6 +231,8 @@ class AttackDetails(TypedDict):
|
|
|
228
231
|
:type conversation: List[Dict[str, str]]
|
|
229
232
|
:param risk_assessment: Dictionary containing content safety assessment for the conversation
|
|
230
233
|
:type risk_assessment: Optional[RiskAssessment]
|
|
234
|
+
:param attack_success_threshold: The threshold value used to determine attack success
|
|
235
|
+
:type attack_success_threshold: Optional[int]
|
|
231
236
|
"""
|
|
232
237
|
|
|
233
238
|
attack_success: Optional[bool]
|
|
@@ -236,6 +241,7 @@ class AttackDetails(TypedDict):
|
|
|
236
241
|
risk_category: str
|
|
237
242
|
conversation: List[Dict[str, str]]
|
|
238
243
|
risk_assessment: Optional[RiskAssessment]
|
|
244
|
+
attack_success_threshold: Optional[int]
|
|
239
245
|
|
|
240
246
|
|
|
241
247
|
@experimental
|
|
@@ -11,11 +11,16 @@ import asyncio
|
|
|
11
11
|
import re
|
|
12
12
|
from typing import Dict, Optional, Any, Tuple, List
|
|
13
13
|
from azure.ai.evaluation._common.rai_service import evaluate_with_rai_service
|
|
14
|
-
from azure.ai.evaluation.simulator._model_tools._generated_rai_client import
|
|
14
|
+
from azure.ai.evaluation.simulator._model_tools._generated_rai_client import (
|
|
15
|
+
GeneratedRAIClient,
|
|
16
|
+
)
|
|
15
17
|
from pyrit.models import PromptRequestResponse, construct_response_from_request
|
|
16
18
|
from pyrit.prompt_target import PromptChatTarget
|
|
17
|
-
|
|
18
|
-
from .metric_mapping import
|
|
19
|
+
|
|
20
|
+
from .metric_mapping import (
|
|
21
|
+
get_metric_from_risk_category,
|
|
22
|
+
get_annotation_task_from_risk_category,
|
|
23
|
+
)
|
|
19
24
|
from .._attack_objective_generator import RiskCategory
|
|
20
25
|
|
|
21
26
|
|
|
@@ -239,8 +239,11 @@ class AdversarialSimulator:
|
|
|
239
239
|
# So randomize the selection instead of the parameter list directly,
|
|
240
240
|
# or a potentially large deep copy.
|
|
241
241
|
if randomization_seed is not None:
|
|
242
|
-
random
|
|
243
|
-
|
|
242
|
+
# Create a local random instance to avoid polluting global state
|
|
243
|
+
local_random = random.Random(randomization_seed)
|
|
244
|
+
local_random.shuffle(templates)
|
|
245
|
+
else:
|
|
246
|
+
random.shuffle(templates)
|
|
244
247
|
|
|
245
248
|
# Prepare task parameters based on scenario - but use a single append call for all scenarios
|
|
246
249
|
tasks = []
|
|
@@ -5,7 +5,8 @@
|
|
|
5
5
|
# noqa: E501
|
|
6
6
|
import asyncio
|
|
7
7
|
import logging
|
|
8
|
-
|
|
8
|
+
import random
|
|
9
|
+
from typing import Callable, cast, Union, Optional
|
|
9
10
|
|
|
10
11
|
from tqdm import tqdm
|
|
11
12
|
|
|
@@ -105,6 +106,7 @@ class IndirectAttackSimulator(AdversarialSimulator):
|
|
|
105
106
|
api_call_retry_sleep_sec: int = 1,
|
|
106
107
|
api_call_delay_sec: int = 0,
|
|
107
108
|
concurrent_async_task: int = 3,
|
|
109
|
+
randomization_seed: Optional[int] = None,
|
|
108
110
|
**kwargs,
|
|
109
111
|
):
|
|
110
112
|
"""
|
|
@@ -130,6 +132,9 @@ class IndirectAttackSimulator(AdversarialSimulator):
|
|
|
130
132
|
:keyword concurrent_async_task: The number of asynchronous tasks to run concurrently during the simulation.
|
|
131
133
|
Defaults to 3.
|
|
132
134
|
:paramtype concurrent_async_task: int
|
|
135
|
+
:keyword randomization_seed: The seed used to randomize prompt selection. If unset, the system's
|
|
136
|
+
default seed is used. Defaults to None.
|
|
137
|
+
:paramtype randomization_seed: Optional[int]
|
|
133
138
|
:return: A list of dictionaries, each representing a simulated conversation. Each dictionary contains:
|
|
134
139
|
|
|
135
140
|
- 'template_parameters': A dictionary with parameters used in the conversation template,
|
|
@@ -190,6 +195,13 @@ class IndirectAttackSimulator(AdversarialSimulator):
|
|
|
190
195
|
ncols=100,
|
|
191
196
|
unit="simulations",
|
|
192
197
|
)
|
|
198
|
+
|
|
199
|
+
# Apply randomization to templates if seed is provided
|
|
200
|
+
if randomization_seed is not None:
|
|
201
|
+
# Create a local random instance to avoid polluting global state
|
|
202
|
+
local_random = random.Random(randomization_seed)
|
|
203
|
+
local_random.shuffle(templates)
|
|
204
|
+
|
|
193
205
|
for template in templates:
|
|
194
206
|
for parameter in template.template_parameters:
|
|
195
207
|
tasks.append(
|
|
@@ -124,7 +124,7 @@ class GeneratedRAIClient:
|
|
|
124
124
|
risk_category=risk_category,
|
|
125
125
|
lang="en",
|
|
126
126
|
strategy=strategy,
|
|
127
|
-
headers={"
|
|
127
|
+
headers={"x-ms-client-request-id": scan_session_id},
|
|
128
128
|
)
|
|
129
129
|
return response
|
|
130
130
|
|
|
@@ -146,7 +146,7 @@ class GeneratedRAIClient:
|
|
|
146
146
|
try:
|
|
147
147
|
# Send the request using the autogenerated client
|
|
148
148
|
response = self._client.get_jail_break_dataset_with_type(
|
|
149
|
-
type="upia", headers={"
|
|
149
|
+
type="upia", headers={"x-ms-client-request-id": scan_session_id}
|
|
150
150
|
)
|
|
151
151
|
if isinstance(response, list):
|
|
152
152
|
return response
|
|
@@ -10,7 +10,7 @@ from typing import Any, Dict, List, Optional, cast, Union
|
|
|
10
10
|
|
|
11
11
|
from azure.ai.evaluation._http_utils import AsyncHttpPipeline, get_async_http_client
|
|
12
12
|
from azure.ai.evaluation._user_agent import UserAgentSingleton
|
|
13
|
-
from azure.core.exceptions import HttpResponseError
|
|
13
|
+
from azure.core.exceptions import HttpResponseError, ServiceResponseError
|
|
14
14
|
from azure.core.pipeline.policies import AsyncRetryPolicy, RetryMode
|
|
15
15
|
from azure.ai.evaluation._common.onedp._client import AIProjectClient
|
|
16
16
|
from azure.ai.evaluation._common.onedp.models import SimulationDTO
|
|
@@ -225,7 +225,25 @@ class ProxyChatCompletionsModel(OpenAIChatCompletionsModel):
|
|
|
225
225
|
sleep_time = RAIService.SLEEP_TIME**request_count
|
|
226
226
|
await asyncio.sleep(sleep_time)
|
|
227
227
|
else:
|
|
228
|
-
|
|
228
|
+
# Retry policy for POST request to RAI service
|
|
229
|
+
service_call_retry_policy = AsyncRetryPolicy(
|
|
230
|
+
retry_on_exceptions=[ServiceResponseError],
|
|
231
|
+
retry_total=7,
|
|
232
|
+
retry_backoff_factor=10.0,
|
|
233
|
+
retry_backoff_max=180,
|
|
234
|
+
retry_mode=RetryMode.Exponential,
|
|
235
|
+
)
|
|
236
|
+
|
|
237
|
+
response = None
|
|
238
|
+
async with get_async_http_client().with_policies(retry_policy=service_call_retry_policy) as retry_client:
|
|
239
|
+
try:
|
|
240
|
+
response = await retry_client.post(
|
|
241
|
+
url=self.endpoint_url, headers=proxy_headers, json=sim_request_dto.to_dict()
|
|
242
|
+
)
|
|
243
|
+
except ServiceResponseError as e:
|
|
244
|
+
self.logger.error("ServiceResponseError during POST request to rai svc after retries: %s", str(e))
|
|
245
|
+
raise
|
|
246
|
+
|
|
229
247
|
# response.raise_for_status()
|
|
230
248
|
if response.status_code != 202:
|
|
231
249
|
raise HttpResponseError(
|
|
@@ -7,6 +7,7 @@ import asyncio
|
|
|
7
7
|
import importlib.resources as pkg_resources
|
|
8
8
|
import json
|
|
9
9
|
import os
|
|
10
|
+
import random
|
|
10
11
|
import re
|
|
11
12
|
import warnings
|
|
12
13
|
from typing import Any, Callable, Dict, List, Optional, Union, Tuple
|
|
@@ -104,6 +105,7 @@ class Simulator:
|
|
|
104
105
|
user_simulator_prompty_options: Dict[str, Any] = {},
|
|
105
106
|
conversation_turns: List[List[Union[str, Dict[str, Any]]]] = [],
|
|
106
107
|
concurrent_async_tasks: int = 5,
|
|
108
|
+
randomization_seed: Optional[int] = None,
|
|
107
109
|
**kwargs,
|
|
108
110
|
) -> List[JsonLineChatProtocol]:
|
|
109
111
|
"""
|
|
@@ -134,6 +136,9 @@ class Simulator:
|
|
|
134
136
|
:keyword concurrent_async_tasks: The number of asynchronous tasks to run concurrently during the simulation.
|
|
135
137
|
Defaults to 5.
|
|
136
138
|
:paramtype concurrent_async_tasks: int
|
|
139
|
+
:keyword randomization_seed: The seed used to randomize task/query order. If unset, the system's
|
|
140
|
+
default seed is used. Defaults to None.
|
|
141
|
+
:paramtype randomization_seed: Optional[int]
|
|
137
142
|
:return: A list of simulated conversations represented as JsonLineChatProtocol objects.
|
|
138
143
|
:rtype: List[JsonLineChatProtocol]
|
|
139
144
|
|
|
@@ -159,6 +164,13 @@ class Simulator:
|
|
|
159
164
|
f"Only the first {num_queries} lines of the specified tasks will be simulated."
|
|
160
165
|
)
|
|
161
166
|
|
|
167
|
+
# Apply randomization to tasks if seed is provided
|
|
168
|
+
if randomization_seed is not None and tasks:
|
|
169
|
+
# Create a local random instance to avoid polluting global state
|
|
170
|
+
local_random = random.Random(randomization_seed)
|
|
171
|
+
tasks = tasks.copy() # Don't modify the original list
|
|
172
|
+
local_random.shuffle(tasks)
|
|
173
|
+
|
|
162
174
|
max_conversation_turns *= 2 # account for both user and assistant turns
|
|
163
175
|
|
|
164
176
|
prompty_model_config = self.model_config
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.1
|
|
2
2
|
Name: azure-ai-evaluation
|
|
3
|
-
Version: 1.
|
|
3
|
+
Version: 1.10.0
|
|
4
4
|
Summary: Microsoft Azure Evaluation Library for Python
|
|
5
5
|
Home-page: https://github.com/Azure/azure-sdk-for-python
|
|
6
6
|
Author: Microsoft Corporation
|
|
@@ -21,8 +21,6 @@ Classifier: Operating System :: OS Independent
|
|
|
21
21
|
Requires-Python: >=3.9
|
|
22
22
|
Description-Content-Type: text/markdown
|
|
23
23
|
License-File: NOTICE.txt
|
|
24
|
-
Requires-Dist: promptflow-devkit>=1.17.1
|
|
25
|
-
Requires-Dist: promptflow-core>=1.17.1
|
|
26
24
|
Requires-Dist: pyjwt>=2.8.0
|
|
27
25
|
Requires-Dist: azure-identity>=1.16.0
|
|
28
26
|
Requires-Dist: azure-core>=1.30.2
|
|
@@ -400,6 +398,34 @@ This project has adopted the [Microsoft Open Source Code of Conduct][code_of_con
|
|
|
400
398
|
|
|
401
399
|
# Release History
|
|
402
400
|
|
|
401
|
+
## 1.10.0 (2025-07-31)
|
|
402
|
+
|
|
403
|
+
### Breaking Changes
|
|
404
|
+
|
|
405
|
+
- Added `evaluate_query` parameter to all RAI service evaluators that can be passed as a keyword argument. This parameter controls whether queries are included in evaluation data when evaluating query-response pairs. Previously, queries were always included in evaluations. When set to `True`, both query and response will be evaluated; when set to `False` (default), only the response will be evaluated. This parameter is available across all RAI service evaluators including `ContentSafetyEvaluator`, `ViolenceEvaluator`, `SexualEvaluator`, `SelfHarmEvaluator`, `HateUnfairnessEvaluator`, `ProtectedMaterialEvaluator`, `IndirectAttackEvaluator`, `CodeVulnerabilityEvaluator`, `UngroundedAttributesEvaluator`, `GroundednessProEvaluator`, and `EciEvaluator`. Existing code that relies on queries being evaluated will need to explicitly set `evaluate_query=True` to maintain the previous behavior.
|
|
406
|
+
|
|
407
|
+
### Features Added
|
|
408
|
+
|
|
409
|
+
- Added support for Azure OpenAI Python grader via `AzureOpenAIPythonGrader` class, which serves as a wrapper around Azure OpenAI Python grader configurations. This new grader object can be supplied to the main `evaluate` method as if it were a normal callable evaluator.
|
|
410
|
+
- Added `attack_success_thresholds` parameter to `RedTeam` class for configuring custom thresholds that determine attack success. This allows users to set specific threshold values for each risk category, with scores greater than the threshold considered successful attacks (i.e. higher threshold means higher
|
|
411
|
+
tolerance for harmful responses).
|
|
412
|
+
- Enhanced threshold reporting in RedTeam results to include default threshold values when custom thresholds aren't specified, providing better transparency about the evaluation criteria used.
|
|
413
|
+
|
|
414
|
+
|
|
415
|
+
### Bugs Fixed
|
|
416
|
+
|
|
417
|
+
- Fixed red team scan `output_path` issue where individual evaluation results were overwriting each other instead of being preserved as separate files. Individual evaluations now create unique files while the user's `output_path` is reserved for final aggregated results.
|
|
418
|
+
- Significant improvements to TaskAdherence evaluator. New version has less variance, is much faster and consumes fewer tokens.
|
|
419
|
+
- Significant improvements to Relevance evaluator. New version has more concrete rubrics and has less variance, is much faster and consumes fewer tokens.
|
|
420
|
+
|
|
421
|
+
|
|
422
|
+
### Other Changes
|
|
423
|
+
|
|
424
|
+
- The default engine for evaluation was changed from `promptflow` (PFClient) to an in-SDK batch client (RunSubmitterClient)
|
|
425
|
+
- Note: We've temporarily kept an escape hatch to fall back to the legacy `promptflow` implementation by setting `_use_pf_client=True` when invoking `evaluate()`.
|
|
426
|
+
This is due to be removed in a future release.
|
|
427
|
+
|
|
428
|
+
|
|
403
429
|
## 1.9.0 (2025-07-02)
|
|
404
430
|
|
|
405
431
|
### Features Added
|
|
@@ -411,8 +437,11 @@ This project has adopted the [Microsoft Open Source Code of Conduct][code_of_con
|
|
|
411
437
|
### Bugs Fixed
|
|
412
438
|
|
|
413
439
|
- Significant improvements to IntentResolution evaluator. New version has less variance, is nearly 2x faster and consumes fewer tokens.
|
|
440
|
+
|
|
441
|
+
- Fixes and improvements to ToolCallAccuracy evaluator. New version has less variance and now works on all tool calls that happen in a turn at once. Previously, it worked on each tool call independently without having context on the other tool calls that happen in the same turn, and then aggregated the results to a score in the range [0-1]. The score range is now [1-5].
|
|
414
442
|
- Fixed MeteorScoreEvaluator and other threshold-based evaluators returning incorrect binary results due to integer conversion of decimal scores. Previously, decimal scores like 0.9375 were incorrectly converted to integers (0) before threshold comparison, causing them to fail even when above the threshold. [#41415](https://github.com/Azure/azure-sdk-for-python/issues/41415)
|
|
415
443
|
- Added a new enum `ADVERSARIAL_QA_DOCUMENTS` which moves all the "file_content" type prompts away from `ADVERSARIAL_QA` to the new enum
|
|
444
|
+
- `AzureOpenAIScoreModelGrader` evaluator now supports `pass_threshold` parameter to set the minimum score required for a response to be considered passing. This allows users to define custom thresholds for evaluation results, enhancing flexibility in grading AI model responses.
|
|
416
445
|
|
|
417
446
|
## 1.8.0 (2025-05-29)
|
|
418
447
|
|
|
@@ -1,16 +1,17 @@
|
|
|
1
|
-
azure/ai/evaluation/__init__.py,sha256=
|
|
1
|
+
azure/ai/evaluation/__init__.py,sha256=hrP2gqioHoUe5QBvpkmNpQ45zu6g-ErReY-fqzWeOf8,5298
|
|
2
2
|
azure/ai/evaluation/_constants.py,sha256=FNVxCt3_0MwZHtDsjRYPH5h6mT_48KCbJTBWBDTNujE,3729
|
|
3
3
|
azure/ai/evaluation/_eval_mapping.py,sha256=CHabrfaRlWbrAYUZV5YXYH0GX_zk9tG9y1og6RtUAnU,2584
|
|
4
4
|
azure/ai/evaluation/_exceptions.py,sha256=y5zVwhyoNuqjaE8P6E65j0-NRDE2Nx0iMq8F7_0kO-4,5848
|
|
5
5
|
azure/ai/evaluation/_http_utils.py,sha256=d1McnMRT5lnaoR8x4r3pkfH2ic4T3JArclOK4kAaUmg,17261
|
|
6
6
|
azure/ai/evaluation/_model_configurations.py,sha256=MNN6cQlz7P9vNfHmfEKsUcly3j1FEOEFsA8WV7GPuKQ,4043
|
|
7
7
|
azure/ai/evaluation/_user_agent.py,sha256=SgUm6acnwyoENu8KroyaWRrJroJNqLZBccpQoeKyrHw,1144
|
|
8
|
-
azure/ai/evaluation/_version.py,sha256=
|
|
8
|
+
azure/ai/evaluation/_version.py,sha256=6wd-PDI7lXxIj0JWkLpHM3nxqs22YSfHFt4rjZRC69E,230
|
|
9
9
|
azure/ai/evaluation/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
10
10
|
azure/ai/evaluation/_aoai/__init__.py,sha256=0Ji05ShlsJaytvexXUpCe69t0jSNd3PpNbhr0zCkr6A,265
|
|
11
11
|
azure/ai/evaluation/_aoai/aoai_grader.py,sha256=8mp_dwMK-MdKkoiTud9ra6ExKyYV1SAPXr1m46j4lm4,4434
|
|
12
12
|
azure/ai/evaluation/_aoai/label_grader.py,sha256=5HOLLkiqCOQS5LPJ5Nm0PE5I1uGEhvoi-6DRgG-H1KM,2696
|
|
13
|
-
azure/ai/evaluation/_aoai/
|
|
13
|
+
azure/ai/evaluation/_aoai/python_grader.py,sha256=Ef3Rkr2dTi751RbCb9XpqHZgHmN1ueen_w3IUxuek00,3120
|
|
14
|
+
azure/ai/evaluation/_aoai/score_model_grader.py,sha256=jJPZIARbZj6PTd7h072tZf5eFaTfQ-DO-2YmnBwNGRM,3737
|
|
14
15
|
azure/ai/evaluation/_aoai/string_check_grader.py,sha256=5aRMEMoM0FUvxx_ftwySV-KN_Daw3R4-brFaND_NR_E,2321
|
|
15
16
|
azure/ai/evaluation/_aoai/text_similarity_grader.py,sha256=BxJ5Z6npKPkfuVzy84IZXHZVlg4EJrkq2NA8XixBxm4,2889
|
|
16
17
|
azure/ai/evaluation/_azure/__init__.py,sha256=Yx1Iq2GNKQ5lYxTotvPwkPL4u0cm6YVxUe-iVbu1clI,180
|
|
@@ -23,8 +24,8 @@ azure/ai/evaluation/_common/_experimental.py,sha256=GVtSn9r1CeR_yEa578dJVNDJ3P24
|
|
|
23
24
|
azure/ai/evaluation/_common/constants.py,sha256=lkdGK6xrMhVogqBudU4B8-6Ko2aSxKl3HzzVTh1D9Ho,2286
|
|
24
25
|
azure/ai/evaluation/_common/evaluation_onedp_client.py,sha256=3HMiG37Cl46q9-kE6zxIEoQbgK96YelX1AFWldfk7Ok,7485
|
|
25
26
|
azure/ai/evaluation/_common/math.py,sha256=d4bwWe35_RWDIZNcbV1BTBbHNx2QHQ4-I3EofDyyNE0,2863
|
|
26
|
-
azure/ai/evaluation/_common/rai_service.py,sha256=
|
|
27
|
-
azure/ai/evaluation/_common/utils.py,sha256=
|
|
27
|
+
azure/ai/evaluation/_common/rai_service.py,sha256=jyBLRWpaQY2qGumP3JyTrRb3bAIqu5d6CPRtMYaJi5w,35491
|
|
28
|
+
azure/ai/evaluation/_common/utils.py,sha256=GWeNGUdEup2qzmn0N-D1Os_xlpIKFdTe6Y7Qn0AF0uQ,30120
|
|
28
29
|
azure/ai/evaluation/_common/onedp/__init__.py,sha256=C7Ddtjy__BxKkRCydRS7BhtQnM7TFZo179UUVC5krVY,1026
|
|
29
30
|
azure/ai/evaluation/_common/onedp/_client.py,sha256=cE37dQkl6aFfPZD-jyDa1QKUYKe5UQuC3SJX6XndFFY,6667
|
|
30
31
|
azure/ai/evaluation/_common/onedp/_configuration.py,sha256=F_KmJnzEgtmPTZViFS2nTMtKYHxi_YOn81BDx24L3gI,3629
|
|
@@ -97,11 +98,11 @@ azure/ai/evaluation/_converters/_models.py,sha256=WjAJntMPlc_CpnHZ2pFqW5yezlvfGJ
|
|
|
97
98
|
azure/ai/evaluation/_converters/_sk_services.py,sha256=NfjflVgeJUF0MrvAiUd_uF2magn38Q_MKmHzaY41vOA,18239
|
|
98
99
|
azure/ai/evaluation/_evaluate/__init__.py,sha256=Yx1Iq2GNKQ5lYxTotvPwkPL4u0cm6YVxUe-iVbu1clI,180
|
|
99
100
|
azure/ai/evaluation/_evaluate/_eval_run.py,sha256=ZlDvTNDiMSZ2VfzVicPmEGx65LL3LmcKcPWft6XjWcA,21991
|
|
100
|
-
azure/ai/evaluation/_evaluate/_evaluate.py,sha256=
|
|
101
|
-
azure/ai/evaluation/_evaluate/_evaluate_aoai.py,sha256
|
|
102
|
-
azure/ai/evaluation/_evaluate/_utils.py,sha256=
|
|
101
|
+
azure/ai/evaluation/_evaluate/_evaluate.py,sha256=XlJT0VWuNDIRSee7z63p5AP3dRNwZ7vJbSYOUGJfD_E,56540
|
|
102
|
+
azure/ai/evaluation/_evaluate/_evaluate_aoai.py,sha256=-5oR9rPzXns6DQMiwJAp0iBHdK74JtlpTlx-xoGDhmo,26222
|
|
103
|
+
azure/ai/evaluation/_evaluate/_utils.py,sha256=e9Jha5zAkDaidZjFf1-FnNSmT02BjYWkleV9P1E0Iq8,19095
|
|
103
104
|
azure/ai/evaluation/_evaluate/_batch_run/__init__.py,sha256=cPLi_MJ_pCp8eKBxJbiSoxgTnN3nDLuaP57dMkKuyhg,552
|
|
104
|
-
azure/ai/evaluation/_evaluate/_batch_run/_run_submitter_client.py,sha256=
|
|
105
|
+
azure/ai/evaluation/_evaluate/_batch_run/_run_submitter_client.py,sha256=2Rl4j_f4qK6_J-Gl_qUV-4elpWbegWzIkJuQOdPP-ig,7046
|
|
105
106
|
azure/ai/evaluation/_evaluate/_batch_run/batch_clients.py,sha256=dTZYdQGweGzEN6OHtn1jOmGG767AJ7RJwfHoCCeRddg,2761
|
|
106
107
|
azure/ai/evaluation/_evaluate/_batch_run/code_client.py,sha256=n4JxDAFNnetfpAj4FyhtZms3kuGmDWXCBOogqeO4F98,8607
|
|
107
108
|
azure/ai/evaluation/_evaluate/_batch_run/eval_run_context.py,sha256=Z0m6nDNF7TiIIW1woC7TCeuh7XIBAwTNFfPKXJhE7_k,4076
|
|
@@ -110,74 +111,74 @@ azure/ai/evaluation/_evaluate/_batch_run/target_run_context.py,sha256=TrZ_IkbU8D
|
|
|
110
111
|
azure/ai/evaluation/_evaluate/_telemetry/__init__.py,sha256=KARq4sFLAh72Rhr8nefbOLXFnKqdO6i6zAYRqr4SWJ4,3475
|
|
111
112
|
azure/ai/evaluation/_evaluators/__init__.py,sha256=Yx1Iq2GNKQ5lYxTotvPwkPL4u0cm6YVxUe-iVbu1clI,180
|
|
112
113
|
azure/ai/evaluation/_evaluators/_bleu/__init__.py,sha256=quKKO0kvOSkky5hcoNBvgBuMeeVRFCE9GSv70mAdGP4,260
|
|
113
|
-
azure/ai/evaluation/_evaluators/_bleu/_bleu.py,sha256=
|
|
114
|
+
azure/ai/evaluation/_evaluators/_bleu/_bleu.py,sha256=CJOmTL_5vC477Q4dAKTArApj2d4UZVHuz_KB8Aw7ZMk,4935
|
|
114
115
|
azure/ai/evaluation/_evaluators/_code_vulnerability/__init__.py,sha256=zRHHxYA6CI72iqZaZz9eSbDHwhhjp5hjicEK_RWXlL0,109
|
|
115
|
-
azure/ai/evaluation/_evaluators/_code_vulnerability/_code_vulnerability.py,sha256=
|
|
116
|
+
azure/ai/evaluation/_evaluators/_code_vulnerability/_code_vulnerability.py,sha256=KrOtAxtipZf2FDQ9uiHQ4pTAzD-aev14EPgaQUdFVNA,4890
|
|
116
117
|
azure/ai/evaluation/_evaluators/_coherence/__init__.py,sha256=GRqcSCQse02Spyki0UsRNWMIXiea2lLtPPXNGvkJzQ0,258
|
|
117
|
-
azure/ai/evaluation/_evaluators/_coherence/_coherence.py,sha256=
|
|
118
|
+
azure/ai/evaluation/_evaluators/_coherence/_coherence.py,sha256=MqifhqPRbvMH1AsvAO8D7sbN1xSZ7VtkiWQIFFrR0_8,5844
|
|
118
119
|
azure/ai/evaluation/_evaluators/_coherence/coherence.prompty,sha256=ANvh9mDFW7KMejrgdWqBLjj4SIqEO5WW9gg5pE0RLJk,6798
|
|
119
120
|
azure/ai/evaluation/_evaluators/_common/__init__.py,sha256=xAymP_CZy4aPzWplMdXgQUQVDIUEMI-0nbgdm_umFYY,498
|
|
120
|
-
azure/ai/evaluation/_evaluators/_common/_base_eval.py,sha256=
|
|
121
|
+
azure/ai/evaluation/_evaluators/_common/_base_eval.py,sha256=qv1W6gQR5-SLq6hTvDBqSusaPzOX6I6mH8feI2JFSOk,26050
|
|
121
122
|
azure/ai/evaluation/_evaluators/_common/_base_multi_eval.py,sha256=yYFpoCDe2wMFQck0ykbX8IJBBidk6NT1wUTkVFlVSy8,2728
|
|
122
123
|
azure/ai/evaluation/_evaluators/_common/_base_prompty_eval.py,sha256=11ZMNPLF50O7om7UOq8BzeWiarVpU9qnC1exotnw1Lo,6866
|
|
123
|
-
azure/ai/evaluation/_evaluators/_common/_base_rai_svc_eval.py,sha256=
|
|
124
|
+
azure/ai/evaluation/_evaluators/_common/_base_rai_svc_eval.py,sha256=mW8jErfouw1rVST2YO5nWEdMwIaXWCaw46-s8-Avilc,9068
|
|
124
125
|
azure/ai/evaluation/_evaluators/_common/_conversation_aggregators.py,sha256=gjDBjRxJKwaHbshWH0j2idjlzfzNMnT9a9RL0fQiKeM,2129
|
|
125
126
|
azure/ai/evaluation/_evaluators/_content_safety/__init__.py,sha256=PEYMIybfP64f7byhuTaiq4RiqsYbjqejpW1JsJIG1jA,556
|
|
126
|
-
azure/ai/evaluation/_evaluators/_content_safety/_content_safety.py,sha256=
|
|
127
|
-
azure/ai/evaluation/_evaluators/_content_safety/_hate_unfairness.py,sha256=
|
|
128
|
-
azure/ai/evaluation/_evaluators/_content_safety/_self_harm.py,sha256=
|
|
129
|
-
azure/ai/evaluation/_evaluators/_content_safety/_sexual.py,sha256=
|
|
130
|
-
azure/ai/evaluation/_evaluators/_content_safety/_violence.py,sha256=
|
|
127
|
+
azure/ai/evaluation/_evaluators/_content_safety/_content_safety.py,sha256=0JVsptT5koRCXOhcd5_NIvQPQxMRHhlCfisc_KRKE6k,7502
|
|
128
|
+
azure/ai/evaluation/_evaluators/_content_safety/_hate_unfairness.py,sha256=j2WNVtDuacrNMO5NbKjwxtugvOlG0Mroo_RIxfeZhFA,7365
|
|
129
|
+
azure/ai/evaluation/_evaluators/_content_safety/_self_harm.py,sha256=Qof3CIDOY3X71Jy55ZT4Pv5hrk27DLmYBJqo9NKA6ZY,6149
|
|
130
|
+
azure/ai/evaluation/_evaluators/_content_safety/_sexual.py,sha256=ssBNqH7lSJ6Ifw87lT6z3vo1v9oepjWXECmRs5vznKE,6707
|
|
131
|
+
azure/ai/evaluation/_evaluators/_content_safety/_violence.py,sha256=MDHnSbefslrlarkh5rcjJVIwpkMl9oZJBJLra5XylDg,6779
|
|
131
132
|
azure/ai/evaluation/_evaluators/_document_retrieval/__init__.py,sha256=wEAbjkMQTlwmRsa7_XeOP0EAT1g7AJyaYlvPdZElAb4,385
|
|
132
|
-
azure/ai/evaluation/_evaluators/_document_retrieval/_document_retrieval.py,sha256=
|
|
133
|
+
azure/ai/evaluation/_evaluators/_document_retrieval/_document_retrieval.py,sha256=fEkwnuvOCLUiyNMf1c_BmdLwR0ECgieRtAri_CPE9PI,20338
|
|
133
134
|
azure/ai/evaluation/_evaluators/_eci/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
134
|
-
azure/ai/evaluation/_evaluators/_eci/_eci.py,sha256=
|
|
135
|
+
azure/ai/evaluation/_evaluators/_eci/_eci.py,sha256=3Zrf6xxaw7e2adQLb0TM_KFWf-4RSTnjI4uYfHev2tQ,3103
|
|
135
136
|
azure/ai/evaluation/_evaluators/_f1_score/__init__.py,sha256=aEVbO7iMoF20obdpLQKcKm69Yyu3mYnblKELLqu8OGI,260
|
|
136
|
-
azure/ai/evaluation/_evaluators/_f1_score/_f1_score.py,sha256=
|
|
137
|
+
azure/ai/evaluation/_evaluators/_f1_score/_f1_score.py,sha256=8xKB0SDqseQ2Vnhf3CNftXVMjV6co8h-gfKOTcmNJJw,6940
|
|
137
138
|
azure/ai/evaluation/_evaluators/_fluency/__init__.py,sha256=EEJw39xRa0bOAA1rELTTKXQu2s60n_7CZQRD0Gu2QVw,259
|
|
138
|
-
azure/ai/evaluation/_evaluators/_fluency/_fluency.py,sha256=
|
|
139
|
+
azure/ai/evaluation/_evaluators/_fluency/_fluency.py,sha256=iIgN2DQDvAoZldeCYRv8Z-kzNvEPsS4KEuDQBhXiQog,5552
|
|
139
140
|
azure/ai/evaluation/_evaluators/_fluency/fluency.prompty,sha256=n9v0W9eYwgIO-JSsLTSKEM_ApJuxxuKWQpNblrTEkFY,4861
|
|
140
141
|
azure/ai/evaluation/_evaluators/_gleu/__init__.py,sha256=Ae2EvQ7gqiYAoNO3LwGIhdAAjJPJDfT85rQGKrRrmbA,260
|
|
141
|
-
azure/ai/evaluation/_evaluators/_gleu/_gleu.py,sha256=
|
|
142
|
+
azure/ai/evaluation/_evaluators/_gleu/_gleu.py,sha256=bm46V_t4NpIEaAAZMtMAxMMe_u3SgOY0201RihpFxEc,4884
|
|
142
143
|
azure/ai/evaluation/_evaluators/_groundedness/__init__.py,sha256=UYNJUeRvBwcSVFyZpdsf29un5eyaDzYoo3QvC1gvlLg,274
|
|
143
|
-
azure/ai/evaluation/_evaluators/_groundedness/_groundedness.py,sha256=
|
|
144
|
+
azure/ai/evaluation/_evaluators/_groundedness/_groundedness.py,sha256=DF1rEC1AZp8yXGVQc4i_0Nn4joKVCas2cBKyVOgJnPg,8208
|
|
144
145
|
azure/ai/evaluation/_evaluators/_groundedness/groundedness_with_query.prompty,sha256=v7TOm75DyW_1gOU6gSiZoPcRnHcJ65DrzR2cL_ucWDY,5814
|
|
145
146
|
azure/ai/evaluation/_evaluators/_groundedness/groundedness_without_query.prompty,sha256=8kNShdfxQvkII7GnqjmdqQ5TNelA2B6cjnqWZk8FFe4,5296
|
|
146
147
|
azure/ai/evaluation/_evaluators/_intent_resolution/__init__.py,sha256=Lr8krXt2yfShFTAuwjTFgrUbO75boLLrRSnF1mriN_Q,280
|
|
147
|
-
azure/ai/evaluation/_evaluators/_intent_resolution/_intent_resolution.py,sha256=
|
|
148
|
+
azure/ai/evaluation/_evaluators/_intent_resolution/_intent_resolution.py,sha256=3cWMeUSUGJmFtIFLHNH0rHX4KNUfVeermeTJpIRHh4M,11431
|
|
148
149
|
azure/ai/evaluation/_evaluators/_intent_resolution/intent_resolution.prompty,sha256=5xLdYQ9FUfJVNtkbFMjiFhFH17eyRYF4WFIE6_3zvxc,8449
|
|
149
150
|
azure/ai/evaluation/_evaluators/_meteor/__init__.py,sha256=209na3pPsdmcuYpYHUYtqQybCpc3yZkc93HnRdicSlI,266
|
|
150
|
-
azure/ai/evaluation/_evaluators/_meteor/_meteor.py,sha256=
|
|
151
|
+
azure/ai/evaluation/_evaluators/_meteor/_meteor.py,sha256=6OkRH78wfn61lkR-1MuDw2J980SCm7LU-B567cS_8ho,5926
|
|
151
152
|
azure/ai/evaluation/_evaluators/_protected_material/__init__.py,sha256=eRAQIU9diVXfO5bp6aLWxZoYUvOsrDIfy1gnDOeNTiI,109
|
|
152
|
-
azure/ai/evaluation/_evaluators/_protected_material/_protected_material.py,sha256=
|
|
153
|
+
azure/ai/evaluation/_evaluators/_protected_material/_protected_material.py,sha256=95vJ55K3ONCmF4MP_q4FiuJhe8iejLHOA1k1o7DtWKo,5407
|
|
153
154
|
azure/ai/evaluation/_evaluators/_qa/__init__.py,sha256=bcXfT--C0hjym2haqd1B2-u9bDciyM0ThOFtU1Q69sk,244
|
|
154
|
-
azure/ai/evaluation/_evaluators/_qa/_qa.py,sha256=
|
|
155
|
+
azure/ai/evaluation/_evaluators/_qa/_qa.py,sha256=y8Magyzb2DESoN6vFllJkf8bLZ28UFFYyKVHCv1ah3o,6270
|
|
155
156
|
azure/ai/evaluation/_evaluators/_relevance/__init__.py,sha256=JlxytW32Nl8pbE-fI3GRpfgVuY9EG6zxIAn5VZGSwyc,265
|
|
156
|
-
azure/ai/evaluation/_evaluators/_relevance/_relevance.py,sha256=
|
|
157
|
-
azure/ai/evaluation/_evaluators/_relevance/relevance.prompty,sha256=
|
|
157
|
+
azure/ai/evaluation/_evaluators/_relevance/_relevance.py,sha256=TwApL9yRB47O_n8OOGhg7E2WLpNAWWX6Pqiku3PIR2Q,8944
|
|
158
|
+
azure/ai/evaluation/_evaluators/_relevance/relevance.prompty,sha256=1F45mS6phDhUCjWD7AVAeCJE8UJHytCgRwHrndcH99E,6462
|
|
158
159
|
azure/ai/evaluation/_evaluators/_response_completeness/__init__.py,sha256=U3eqkQQAgRif46B6UGdq3yWefgbkZGJ3ZE2sKoZQDlU,292
|
|
159
|
-
azure/ai/evaluation/_evaluators/_response_completeness/_response_completeness.py,sha256=
|
|
160
|
+
azure/ai/evaluation/_evaluators/_response_completeness/_response_completeness.py,sha256=gNZHxw-sk99DDvwhLGh3Az4RVfauPv9QMRt6d2lyNoY,7922
|
|
160
161
|
azure/ai/evaluation/_evaluators/_response_completeness/response_completeness.prompty,sha256=25PqzWWtpwvsKNnBGDNfqsKKo2RpyeiIFzvK8sauPDg,7520
|
|
161
162
|
azure/ai/evaluation/_evaluators/_retrieval/__init__.py,sha256=kMu47ZyTZ7f-4Yh6H3KHxswmxitmPJ8FPSk90qgR0XI,265
|
|
162
|
-
azure/ai/evaluation/_evaluators/_retrieval/_retrieval.py,sha256=
|
|
163
|
+
azure/ai/evaluation/_evaluators/_retrieval/_retrieval.py,sha256=hiCVZOg_dn7q87OPdizhdYqK3SkK46evpEUBphNfIBY,6254
|
|
163
164
|
azure/ai/evaluation/_evaluators/_retrieval/retrieval.prompty,sha256=_YVoO4Gt_WD42bUcj5n6BDW0dMUqNf0yF3Nj5XMOX2c,16490
|
|
164
165
|
azure/ai/evaluation/_evaluators/_rouge/__init__.py,sha256=kusCDaYcXogDugGefRP8MQSn9xv107oDbrMCqZ6K4GA,291
|
|
165
|
-
azure/ai/evaluation/_evaluators/_rouge/_rouge.py,sha256=
|
|
166
|
+
azure/ai/evaluation/_evaluators/_rouge/_rouge.py,sha256=6xfAc18Cqa2bq_GtGTKUEIZdWFqdjAYPjsqNl1ok10E,10033
|
|
166
167
|
azure/ai/evaluation/_evaluators/_service_groundedness/__init__.py,sha256=0DODUGTOgaYyFbO9_zxuwifixDL3SIm3EkwP1sdwn6M,288
|
|
167
|
-
azure/ai/evaluation/_evaluators/_service_groundedness/_service_groundedness.py,sha256=
|
|
168
|
+
azure/ai/evaluation/_evaluators/_service_groundedness/_service_groundedness.py,sha256=qdwVlgoPB870mcwDzDfsfmWlSocpyQJPvQxROGaiTXg,8158
|
|
168
169
|
azure/ai/evaluation/_evaluators/_similarity/__init__.py,sha256=V2Mspog99_WBltxTkRHG5NpN5s9XoiTSN4I8POWEkLA,268
|
|
169
|
-
azure/ai/evaluation/_evaluators/_similarity/_similarity.py,sha256=
|
|
170
|
+
azure/ai/evaluation/_evaluators/_similarity/_similarity.py,sha256=W86KDcAjf6_tXUVEYM80mmWNHVJ2O_WQD1AT6yRQ6r8,5460
|
|
170
171
|
azure/ai/evaluation/_evaluators/_similarity/similarity.prompty,sha256=eoludASychZoGL625bFCaZai-OY7DIAg90ZLax_o4XE,4594
|
|
171
172
|
azure/ai/evaluation/_evaluators/_task_adherence/__init__.py,sha256=9HtNrG7yYX0Ygq3cZoS_0obAvGgmy5HWcsBcPKoB15c,271
|
|
172
|
-
azure/ai/evaluation/_evaluators/_task_adherence/_task_adherence.py,sha256=
|
|
173
|
-
azure/ai/evaluation/_evaluators/_task_adherence/task_adherence.prompty,sha256=
|
|
173
|
+
azure/ai/evaluation/_evaluators/_task_adherence/_task_adherence.py,sha256=DjlgI9LWhVZEJAnLhh4X2rH76ON4ORVfWpoVreSsOfE,11054
|
|
174
|
+
azure/ai/evaluation/_evaluators/_task_adherence/task_adherence.prompty,sha256=b1beQUEBPFLkcJUhiVvH7s07RArcPRVtHvXKKZKHbPg,12795
|
|
174
175
|
azure/ai/evaluation/_evaluators/_tool_call_accuracy/__init__.py,sha256=vYB4Y_3n1LqTiEeZB1O1A0b14wpURBwtW0wPEN2FG9Q,288
|
|
175
|
-
azure/ai/evaluation/_evaluators/_tool_call_accuracy/_tool_call_accuracy.py,sha256=
|
|
176
|
-
azure/ai/evaluation/_evaluators/_tool_call_accuracy/tool_call_accuracy.prompty,sha256=
|
|
176
|
+
azure/ai/evaluation/_evaluators/_tool_call_accuracy/_tool_call_accuracy.py,sha256=lyqy4Gm1n0_6ixrYLb39wSA6a0B-sH8GspbdZL2QiTY,17399
|
|
177
|
+
azure/ai/evaluation/_evaluators/_tool_call_accuracy/tool_call_accuracy.prompty,sha256=mJ8fILFrJ8AjJ-kNwDk_zrOUxWxYBBJVHeL5_6MX48M,10488
|
|
177
178
|
azure/ai/evaluation/_evaluators/_ungrounded_attributes/__init__.py,sha256=wGZBd_cRDgkuS-0HV9qm81dHK7ScYdKd98xLPtk6EwQ,118
|
|
178
|
-
azure/ai/evaluation/_evaluators/_ungrounded_attributes/_ungrounded_attributes.py,sha256=
|
|
179
|
+
azure/ai/evaluation/_evaluators/_ungrounded_attributes/_ungrounded_attributes.py,sha256=5Y4JMUGRkGiMyBg95OgMVf2AFLEtKnP_GbpeDqwxIGE,4656
|
|
179
180
|
azure/ai/evaluation/_evaluators/_xpia/__init__.py,sha256=VMEL8WrpJQeh4sQiOLzP7hRFPnjzsvwfvTzaGCVJPCM,88
|
|
180
|
-
azure/ai/evaluation/_evaluators/_xpia/xpia.py,sha256=
|
|
181
|
+
azure/ai/evaluation/_evaluators/_xpia/xpia.py,sha256=YJqcl86-IJWxKVKNyq5lTdDyoeRRyv632JUxGkBV1e8,6610
|
|
181
182
|
azure/ai/evaluation/_legacy/__init__.py,sha256=Yx1Iq2GNKQ5lYxTotvPwkPL4u0cm6YVxUe-iVbu1clI,180
|
|
182
183
|
azure/ai/evaluation/_legacy/_adapters/__init__.py,sha256=LGQk1gGjDTCtd-vEQj6ObYyK7Mff9zL1jFOq7iTrOSU,450
|
|
183
184
|
azure/ai/evaluation/_legacy/_adapters/_check.py,sha256=ojKjHEtjzfg9QA4o4vH4cLVpdw1F-7snxCQ-sdjRFig,426
|
|
@@ -192,14 +193,14 @@ azure/ai/evaluation/_legacy/_adapters/tracing.py,sha256=jm-lkzLA-agRY1meIzs9mFrz
|
|
|
192
193
|
azure/ai/evaluation/_legacy/_adapters/types.py,sha256=q7n0TtpFxd1WttbUR_Q8ODd8bTcMaJjIrxLXx1onirc,447
|
|
193
194
|
azure/ai/evaluation/_legacy/_adapters/utils.py,sha256=2KdYqfeuHLcfqk1qJRviNoqqsghxBZNmyoGcUTNphl0,1306
|
|
194
195
|
azure/ai/evaluation/_legacy/_batch_engine/__init__.py,sha256=NNX2DhtPVzJCX8kR_QzZ6EkUsdGifvwip2LHEcRwy1Y,594
|
|
195
|
-
azure/ai/evaluation/_legacy/_batch_engine/_config.py,sha256
|
|
196
|
-
azure/ai/evaluation/_legacy/_batch_engine/_engine.py,sha256=
|
|
196
|
+
azure/ai/evaluation/_legacy/_batch_engine/_config.py,sha256=9fdRz5YVdf_95mCOugiJuna2pYMEmWKcsWaZCT4IwXM,1820
|
|
197
|
+
azure/ai/evaluation/_legacy/_batch_engine/_engine.py,sha256=MY7nHt36ABwPaj47agPJXF2bn3GHGGHBKNkOS4qAznw,19580
|
|
197
198
|
azure/ai/evaluation/_legacy/_batch_engine/_exceptions.py,sha256=_QQLowht6ww4wBJbShQBo00Y8HFdaWh-dWd44sGvJBc,2870
|
|
198
199
|
azure/ai/evaluation/_legacy/_batch_engine/_openai_injector.py,sha256=jP_ZHre2REdQh2l2JJNuP6arW9pHxOlc-WHG5jLnX6g,5059
|
|
199
|
-
azure/ai/evaluation/_legacy/_batch_engine/_result.py,sha256=
|
|
200
|
-
azure/ai/evaluation/_legacy/_batch_engine/_run.py,sha256
|
|
200
|
+
azure/ai/evaluation/_legacy/_batch_engine/_result.py,sha256=mqwCNATvH2Tavpnk_u1000HfXLauNMgcPT9dpqKh4L4,3516
|
|
201
|
+
azure/ai/evaluation/_legacy/_batch_engine/_run.py,sha256=-fXq3s6_anZ3Qf0i16D_HNGzgjPKCiNwXaUz3qUG3EQ,4537
|
|
201
202
|
azure/ai/evaluation/_legacy/_batch_engine/_run_storage.py,sha256=KjiKaSjT16L_wLYrZpIeBANtin3fa4Gqd3L-Xjw-59I,3418
|
|
202
|
-
azure/ai/evaluation/_legacy/_batch_engine/_run_submitter.py,sha256=
|
|
203
|
+
azure/ai/evaluation/_legacy/_batch_engine/_run_submitter.py,sha256=wtRQ7COg3fstHqcjhCf-M-Au3G6OVE0sDlCM-ELNOjs,11064
|
|
203
204
|
azure/ai/evaluation/_legacy/_batch_engine/_status.py,sha256=xSpJaMmBroGOL8U_iTpAr_PgyNKaxfawqak6TpuUrkk,780
|
|
204
205
|
azure/ai/evaluation/_legacy/_batch_engine/_trace.py,sha256=xh52vKgs8TKYj1WlqcenlOXiPmcfgdPei2P8BLAIO5g,4430
|
|
205
206
|
azure/ai/evaluation/_legacy/_batch_engine/_utils.py,sha256=pBOw5WTt64POR1c6yxGH5D5MhUxvXcMKJ2Rzzqth0XQ,2957
|
|
@@ -216,41 +217,41 @@ azure/ai/evaluation/_legacy/prompty/_utils.py,sha256=NCuZYuAZSguDtFsLAcgVwwPyAPM
|
|
|
216
217
|
azure/ai/evaluation/_legacy/prompty/_yaml_utils.py,sha256=pVL6xgTHC3AKKD5plJ4d6hiBuComaOlUww1uqqDQlB4,3350
|
|
217
218
|
azure/ai/evaluation/_safety_evaluation/__init__.py,sha256=Yx1Iq2GNKQ5lYxTotvPwkPL4u0cm6YVxUe-iVbu1clI,180
|
|
218
219
|
azure/ai/evaluation/_safety_evaluation/_generated_rai_client.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
219
|
-
azure/ai/evaluation/_safety_evaluation/_safety_evaluation.py,sha256=
|
|
220
|
+
azure/ai/evaluation/_safety_evaluation/_safety_evaluation.py,sha256=OlylVGIM8aI7cX8qsUzFEZuylS5mhWThhvJ6qS7_FfI,45047
|
|
220
221
|
azure/ai/evaluation/_vendor/__init__.py,sha256=Yx1Iq2GNKQ5lYxTotvPwkPL4u0cm6YVxUe-iVbu1clI,180
|
|
221
222
|
azure/ai/evaluation/_vendor/rouge_score/__init__.py,sha256=03OkyfS_UmzRnHv6-z9juTaJ6OXJoEJM989hgifIZbc,607
|
|
222
223
|
azure/ai/evaluation/_vendor/rouge_score/rouge_scorer.py,sha256=DtNSeshHipzc6vFnvx7kbs5viXe4LNq-ZrgllFvfR4U,11299
|
|
223
224
|
azure/ai/evaluation/_vendor/rouge_score/scoring.py,sha256=0sqdiNE-4R_EmTTqyWL9_DAOgl54250H5004tZDGxEE,1878
|
|
224
225
|
azure/ai/evaluation/_vendor/rouge_score/tokenize.py,sha256=IyHVsWY6IFFZdB23cLiJs8iBZ0DXk1mQlWE1xtdjuuk,1826
|
|
225
226
|
azure/ai/evaluation/_vendor/rouge_score/tokenizers.py,sha256=3_-y1TyvyluHuERhSJ5CdXSwnpcMA7aAKU6PCz9wH_Q,1745
|
|
226
|
-
azure/ai/evaluation/red_team/__init__.py,sha256=
|
|
227
|
+
azure/ai/evaluation/red_team/__init__.py,sha256=goB0RudQS4_BFvhvb634RXGR2FoZ49Q-fDfQfHDtucQ,632
|
|
227
228
|
azure/ai/evaluation/red_team/_attack_objective_generator.py,sha256=3l5cOfWCfX9-fdFkBdJ0yONv7kL7w6TyghzPVErYN_w,11070
|
|
228
229
|
azure/ai/evaluation/red_team/_attack_strategy.py,sha256=5VEES4AdiHc057Bt8STAKpKvpJ7gKPGxjkh6kjlQ2og,1488
|
|
229
230
|
azure/ai/evaluation/red_team/_callback_chat_target.py,sha256=-kd5voHTnWtTwQVXr3fl_OaxKXLic-GnwELN_e9SG_g,3016
|
|
230
231
|
azure/ai/evaluation/red_team/_default_converter.py,sha256=tewcQgYNqQA8EJ0IIDOA3HhZOR7vpCn8E1hP787gg9k,776
|
|
231
|
-
azure/ai/evaluation/red_team/_red_team.py,sha256=
|
|
232
|
-
azure/ai/evaluation/red_team/_red_team_result.py,sha256=
|
|
232
|
+
azure/ai/evaluation/red_team/_red_team.py,sha256=Hn1jbyd2ywZQ4XYirTVJxIHee9xfauUMzeu3-Jov6ZA,177525
|
|
233
|
+
azure/ai/evaluation/red_team/_red_team_result.py,sha256=9DM8vDQWDhQ1TBj2KsQCCd5fGAh2gZBeT4evJnsq0Vk,17410
|
|
233
234
|
azure/ai/evaluation/red_team/_agent/__init__.py,sha256=Yx1Iq2GNKQ5lYxTotvPwkPL4u0cm6YVxUe-iVbu1clI,180
|
|
234
235
|
azure/ai/evaluation/red_team/_agent/_agent_functions.py,sha256=kLV2lQ5PHMucGK9IsrnZsmSvlhL2fhgzxa1G0NPF6eM,10482
|
|
235
236
|
azure/ai/evaluation/red_team/_agent/_agent_tools.py,sha256=-ClGcNexUYa6_SxBPERAl2u4LgR0UP5Dk0TeYfUcBW8,20653
|
|
236
237
|
azure/ai/evaluation/red_team/_agent/_agent_utils.py,sha256=3wtUg0BUp68l5Vm01K3zjzd1CKKt_N2Xd295yY1itdo,3224
|
|
237
238
|
azure/ai/evaluation/red_team/_agent/_semantic_kernel_plugin.py,sha256=Q-9uVkIM9Hq63pXhnxg6vwmIf9gTVXmmnC3c3ikbO0w,10601
|
|
238
239
|
azure/ai/evaluation/red_team/_utils/__init__.py,sha256=Yx1Iq2GNKQ5lYxTotvPwkPL4u0cm6YVxUe-iVbu1clI,180
|
|
239
|
-
azure/ai/evaluation/red_team/_utils/_rai_service_eval_chat_target.py,sha256=
|
|
240
|
+
azure/ai/evaluation/red_team/_utils/_rai_service_eval_chat_target.py,sha256=mC3MmSyfTvyKzZ0p4_bQ2lDh7Sk_v4vLLRcJ0iHh3mw,4940
|
|
240
241
|
azure/ai/evaluation/red_team/_utils/_rai_service_target.py,sha256=BsSffRght1caZh9EsUpRcb8fh5W78ORmTUE7X9XvWd0,29811
|
|
241
242
|
azure/ai/evaluation/red_team/_utils/_rai_service_true_false_scorer.py,sha256=_NZ1OGgXPtKPaOqRjOr-59JguHT_EOfeFuZUQ5FmwAE,4119
|
|
242
|
-
azure/ai/evaluation/red_team/_utils/constants.py,sha256=
|
|
243
|
+
azure/ai/evaluation/red_team/_utils/constants.py,sha256=Lujaa8X72lieAiYK0TLn59fErb1v9hWAI8JlMpmM92w,1948
|
|
243
244
|
azure/ai/evaluation/red_team/_utils/formatting_utils.py,sha256=zoTywXnslhQBUz2NLowny6Q0FclijDxiahsuoON-GQs,6263
|
|
244
245
|
azure/ai/evaluation/red_team/_utils/logging_utils.py,sha256=1EK7xRO0eA0nKJmqz7WhMwjP8M3i1je1KxHdGfH9HVI,4775
|
|
245
246
|
azure/ai/evaluation/red_team/_utils/metric_mapping.py,sha256=TU9Z9umtjwmJy3SQNqbc2Fj-oJUX_7rFlg1NEGXaSK4,2130
|
|
246
247
|
azure/ai/evaluation/red_team/_utils/strategy_utils.py,sha256=gW0cfsB8alXTIV02RHNVsz7vmQLjq7SXNf8ZHY0_OHs,8088
|
|
247
248
|
azure/ai/evaluation/simulator/__init__.py,sha256=JbrPZ8pvTBalyX94SvZ9btHNoovX8rbZV03KmzxxWys,552
|
|
248
249
|
azure/ai/evaluation/simulator/_adversarial_scenario.py,sha256=ISMjXfcmquvuBhM8l2u_X3jbEbNa7F7dR-AwgKNaJw0,1884
|
|
249
|
-
azure/ai/evaluation/simulator/_adversarial_simulator.py,sha256=
|
|
250
|
+
azure/ai/evaluation/simulator/_adversarial_simulator.py,sha256=NuUhI-wzFylCwpQxaQYJ-Q67bQ4dn0Jp70TGHNnsCq0,25711
|
|
250
251
|
azure/ai/evaluation/simulator/_constants.py,sha256=jtsj-XzbseurEAxWmB-iSPmXu7B6ZHrM3bl07j-zruM,875
|
|
251
252
|
azure/ai/evaluation/simulator/_direct_attack_simulator.py,sha256=g3170PdieqzN_98PHVbpmoFKUapLN_Yns_JBF71UNog,11025
|
|
252
|
-
azure/ai/evaluation/simulator/_indirect_attack_simulator.py,sha256=
|
|
253
|
-
azure/ai/evaluation/simulator/_simulator.py,sha256=
|
|
253
|
+
azure/ai/evaluation/simulator/_indirect_attack_simulator.py,sha256=VPTq33pRiXbiGrUo4UPPvYLSuCK0uR39Ylm0WQ2k0Yc,11810
|
|
254
|
+
azure/ai/evaluation/simulator/_simulator.py,sha256=T1w_mF40KLoYQJNUTVO34D_Vuv1I_O43Ii_9L_4u_ps,37267
|
|
254
255
|
azure/ai/evaluation/simulator/_utils.py,sha256=16NltlywpbMtoFtULwTKqeURguIS1kSKSo3g8uKV8TA,5181
|
|
255
256
|
azure/ai/evaluation/simulator/_conversation/__init__.py,sha256=x8bDZIVm10DynqpfrURbeoidAjYv_EFxWr7G7sFShZA,18236
|
|
256
257
|
azure/ai/evaluation/simulator/_conversation/_conversation.py,sha256=aWiodVvzA9yy1itkoVtW88B4qhEpxpnztx0G1-w7U_Y,7729
|
|
@@ -261,17 +262,17 @@ azure/ai/evaluation/simulator/_helpers/__init__.py,sha256=FQwgrJvzq_nv3wF9DBr2py
|
|
|
261
262
|
azure/ai/evaluation/simulator/_helpers/_language_suffix_mapping.py,sha256=sbKc3O5qsg77LEaSEQfWDfzqEFXVDw612BaDcBo3E7A,1095
|
|
262
263
|
azure/ai/evaluation/simulator/_helpers/_simulator_data_classes.py,sha256=BOttMTec3muMiA4OzwD_iW08GTrhja7PL9XVjRCN3jM,3029
|
|
263
264
|
azure/ai/evaluation/simulator/_model_tools/__init__.py,sha256=soaUHfmd_IK1FINPRKgKens7qKOVw9BZwc7ms7N6zrk,860
|
|
264
|
-
azure/ai/evaluation/simulator/_model_tools/_generated_rai_client.py,sha256=
|
|
265
|
+
azure/ai/evaluation/simulator/_model_tools/_generated_rai_client.py,sha256=m8VSBeFYyj1OKgOKHEoDKvmYSYlIg6RZkPyqbTWw7y0,7945
|
|
265
266
|
azure/ai/evaluation/simulator/_model_tools/_identity_manager.py,sha256=kRmKm8etMq6fM2PjVKL0P7TtXfhDESNME3PenGTryjU,6475
|
|
266
|
-
azure/ai/evaluation/simulator/_model_tools/_proxy_completion_model.py,sha256=
|
|
267
|
+
azure/ai/evaluation/simulator/_model_tools/_proxy_completion_model.py,sha256=GJkxtEHp1lv0kQ1gnK-D04Ci18KFkMQ8MZK_2OgJgWo,11827
|
|
267
268
|
azure/ai/evaluation/simulator/_model_tools/_rai_client.py,sha256=fC38IptUtoumxu2CWLmErNoGxMdVlNr60XbpJeKdQ18,11379
|
|
268
269
|
azure/ai/evaluation/simulator/_model_tools/_template_handler.py,sha256=ghQNP8ur19BfbLilEnIio85RbYwQ8APAm45-iNcimYY,8375
|
|
269
270
|
azure/ai/evaluation/simulator/_model_tools/models.py,sha256=H7tjmj9wzLT-6bI542eAfecOKl1sHBZhcd-YNF522Sg,22372
|
|
270
271
|
azure/ai/evaluation/simulator/_prompty/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
271
272
|
azure/ai/evaluation/simulator/_prompty/task_query_response.prompty,sha256=2BzSqDDYilDushvR56vMRDmqFIaIYAewdUlUZg_elMg,2182
|
|
272
273
|
azure/ai/evaluation/simulator/_prompty/task_simulate.prompty,sha256=NE6lH4bfmibgMn4NgJtm9_l3PMoHSFrfjjosDJEKM0g,939
|
|
273
|
-
azure_ai_evaluation-1.
|
|
274
|
-
azure_ai_evaluation-1.
|
|
275
|
-
azure_ai_evaluation-1.
|
|
276
|
-
azure_ai_evaluation-1.
|
|
277
|
-
azure_ai_evaluation-1.
|
|
274
|
+
azure_ai_evaluation-1.10.0.dist-info/METADATA,sha256=jPRl1bvOIg6J2b2pCfoLPp4esbKesiUEFy1bbomwpyQ,42772
|
|
275
|
+
azure_ai_evaluation-1.10.0.dist-info/NOTICE.txt,sha256=4tzi_Yq4-eBGhBvveobWHCgUIVF-ZeouGN0m7hVq5Mk,3592
|
|
276
|
+
azure_ai_evaluation-1.10.0.dist-info/WHEEL,sha256=iAkIy5fosb7FzIOwONchHf19Qu7_1wCWyFNR5gu9nU0,91
|
|
277
|
+
azure_ai_evaluation-1.10.0.dist-info/top_level.txt,sha256=S7DhWV9m80TBzAhOFjxDUiNbKszzoThbnrSz5MpbHSQ,6
|
|
278
|
+
azure_ai_evaluation-1.10.0.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|
|
File without changes
|