azure-ai-evaluation 1.4.0__py3-none-any.whl → 1.6.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of azure-ai-evaluation might be problematic. Click here for more details.
- azure/ai/evaluation/__init__.py +9 -16
- azure/ai/evaluation/_aoai/__init__.py +10 -0
- azure/ai/evaluation/_aoai/aoai_grader.py +89 -0
- azure/ai/evaluation/_aoai/label_grader.py +66 -0
- azure/ai/evaluation/_aoai/string_check_grader.py +65 -0
- azure/ai/evaluation/_aoai/text_similarity_grader.py +88 -0
- azure/ai/evaluation/_azure/_clients.py +4 -4
- azure/ai/evaluation/_azure/_envs.py +208 -0
- azure/ai/evaluation/_azure/_token_manager.py +12 -7
- azure/ai/evaluation/_common/__init__.py +5 -0
- azure/ai/evaluation/_common/evaluation_onedp_client.py +118 -0
- azure/ai/evaluation/_common/onedp/__init__.py +32 -0
- azure/ai/evaluation/_common/onedp/_client.py +139 -0
- azure/ai/evaluation/_common/onedp/_configuration.py +73 -0
- azure/ai/evaluation/_common/onedp/_model_base.py +1232 -0
- azure/ai/evaluation/_common/onedp/_patch.py +21 -0
- azure/ai/evaluation/_common/onedp/_serialization.py +2032 -0
- azure/ai/evaluation/_common/onedp/_types.py +21 -0
- azure/ai/evaluation/_common/onedp/_validation.py +50 -0
- azure/ai/evaluation/_common/onedp/_vendor.py +50 -0
- azure/ai/evaluation/_common/onedp/_version.py +9 -0
- azure/ai/evaluation/_common/onedp/aio/__init__.py +29 -0
- azure/ai/evaluation/_common/onedp/aio/_client.py +143 -0
- azure/ai/evaluation/_common/onedp/aio/_configuration.py +75 -0
- azure/ai/evaluation/_common/onedp/aio/_patch.py +21 -0
- azure/ai/evaluation/_common/onedp/aio/_vendor.py +40 -0
- azure/ai/evaluation/_common/onedp/aio/operations/__init__.py +39 -0
- azure/ai/evaluation/_common/onedp/aio/operations/_operations.py +4494 -0
- azure/ai/evaluation/_common/onedp/aio/operations/_patch.py +21 -0
- azure/ai/evaluation/_common/onedp/models/__init__.py +142 -0
- azure/ai/evaluation/_common/onedp/models/_enums.py +162 -0
- azure/ai/evaluation/_common/onedp/models/_models.py +2228 -0
- azure/ai/evaluation/_common/onedp/models/_patch.py +21 -0
- azure/ai/evaluation/_common/onedp/operations/__init__.py +39 -0
- azure/ai/evaluation/_common/onedp/operations/_operations.py +5655 -0
- azure/ai/evaluation/_common/onedp/operations/_patch.py +21 -0
- azure/ai/evaluation/_common/onedp/py.typed +1 -0
- azure/ai/evaluation/_common/onedp/servicepatterns/__init__.py +1 -0
- azure/ai/evaluation/_common/onedp/servicepatterns/aio/__init__.py +1 -0
- azure/ai/evaluation/_common/onedp/servicepatterns/aio/operations/__init__.py +25 -0
- azure/ai/evaluation/_common/onedp/servicepatterns/aio/operations/_operations.py +34 -0
- azure/ai/evaluation/_common/onedp/servicepatterns/aio/operations/_patch.py +20 -0
- azure/ai/evaluation/_common/onedp/servicepatterns/buildingblocks/__init__.py +1 -0
- azure/ai/evaluation/_common/onedp/servicepatterns/buildingblocks/aio/__init__.py +1 -0
- azure/ai/evaluation/_common/onedp/servicepatterns/buildingblocks/aio/operations/__init__.py +22 -0
- azure/ai/evaluation/_common/onedp/servicepatterns/buildingblocks/aio/operations/_operations.py +29 -0
- azure/ai/evaluation/_common/onedp/servicepatterns/buildingblocks/aio/operations/_patch.py +20 -0
- azure/ai/evaluation/_common/onedp/servicepatterns/buildingblocks/operations/__init__.py +22 -0
- azure/ai/evaluation/_common/onedp/servicepatterns/buildingblocks/operations/_operations.py +29 -0
- azure/ai/evaluation/_common/onedp/servicepatterns/buildingblocks/operations/_patch.py +20 -0
- azure/ai/evaluation/_common/onedp/servicepatterns/operations/__init__.py +25 -0
- azure/ai/evaluation/_common/onedp/servicepatterns/operations/_operations.py +34 -0
- azure/ai/evaluation/_common/onedp/servicepatterns/operations/_patch.py +20 -0
- azure/ai/evaluation/_common/rai_service.py +159 -29
- azure/ai/evaluation/_common/raiclient/_version.py +1 -1
- azure/ai/evaluation/_common/utils.py +80 -2
- azure/ai/evaluation/_constants.py +16 -0
- azure/ai/evaluation/_converters/__init__.py +1 -1
- azure/ai/evaluation/_converters/_ai_services.py +4 -4
- azure/ai/evaluation/_eval_mapping.py +71 -0
- azure/ai/evaluation/_evaluate/_batch_run/_run_submitter_client.py +30 -16
- azure/ai/evaluation/_evaluate/_batch_run/code_client.py +18 -12
- azure/ai/evaluation/_evaluate/_batch_run/eval_run_context.py +17 -4
- azure/ai/evaluation/_evaluate/_batch_run/proxy_client.py +47 -22
- azure/ai/evaluation/_evaluate/_batch_run/target_run_context.py +18 -2
- azure/ai/evaluation/_evaluate/_eval_run.py +2 -2
- azure/ai/evaluation/_evaluate/_evaluate.py +372 -105
- azure/ai/evaluation/_evaluate/_evaluate_aoai.py +534 -0
- azure/ai/evaluation/_evaluate/_telemetry/__init__.py +5 -89
- azure/ai/evaluation/_evaluate/_utils.py +120 -7
- azure/ai/evaluation/_evaluators/_common/_base_eval.py +9 -4
- azure/ai/evaluation/_evaluators/_common/_base_multi_eval.py +1 -1
- azure/ai/evaluation/_evaluators/_common/_base_prompty_eval.py +12 -3
- azure/ai/evaluation/_evaluators/_common/_base_rai_svc_eval.py +2 -2
- azure/ai/evaluation/_evaluators/_document_retrieval/__init__.py +11 -0
- azure/ai/evaluation/_evaluators/_document_retrieval/_document_retrieval.py +467 -0
- azure/ai/evaluation/_evaluators/_fluency/_fluency.py +1 -1
- azure/ai/evaluation/_evaluators/_groundedness/_groundedness.py +2 -2
- azure/ai/evaluation/_evaluators/_intent_resolution/_intent_resolution.py +6 -2
- azure/ai/evaluation/_evaluators/_relevance/_relevance.py +1 -1
- azure/ai/evaluation/_evaluators/_response_completeness/_response_completeness.py +8 -2
- azure/ai/evaluation/_evaluators/_response_completeness/response_completeness.prompty +31 -46
- azure/ai/evaluation/_evaluators/_similarity/_similarity.py +1 -1
- azure/ai/evaluation/_evaluators/_task_adherence/_task_adherence.py +5 -2
- azure/ai/evaluation/_evaluators/_tool_call_accuracy/_tool_call_accuracy.py +6 -2
- azure/ai/evaluation/_exceptions.py +2 -0
- azure/ai/evaluation/_legacy/_adapters/__init__.py +7 -0
- azure/ai/evaluation/_legacy/_adapters/_check.py +17 -0
- azure/ai/evaluation/_legacy/_adapters/_configuration.py +45 -0
- azure/ai/evaluation/_legacy/_adapters/_constants.py +10 -0
- azure/ai/evaluation/_legacy/_adapters/_errors.py +29 -0
- azure/ai/evaluation/_legacy/_adapters/_flows.py +28 -0
- azure/ai/evaluation/_legacy/_adapters/_service.py +16 -0
- azure/ai/evaluation/_legacy/_adapters/client.py +51 -0
- azure/ai/evaluation/_legacy/_adapters/entities.py +26 -0
- azure/ai/evaluation/_legacy/_adapters/tracing.py +28 -0
- azure/ai/evaluation/_legacy/_adapters/types.py +15 -0
- azure/ai/evaluation/_legacy/_adapters/utils.py +31 -0
- azure/ai/evaluation/_legacy/_batch_engine/_engine.py +51 -32
- azure/ai/evaluation/_legacy/_batch_engine/_openai_injector.py +114 -8
- azure/ai/evaluation/_legacy/_batch_engine/_result.py +7 -1
- azure/ai/evaluation/_legacy/_batch_engine/_run.py +6 -0
- azure/ai/evaluation/_legacy/_batch_engine/_run_submitter.py +69 -29
- azure/ai/evaluation/_legacy/_batch_engine/_status.py +1 -1
- azure/ai/evaluation/_legacy/_batch_engine/_trace.py +54 -62
- azure/ai/evaluation/_legacy/_batch_engine/_utils.py +19 -1
- azure/ai/evaluation/{_red_team/_utils → _legacy/_common}/__init__.py +1 -1
- azure/ai/evaluation/_legacy/_common/_async_token_provider.py +124 -0
- azure/ai/evaluation/_legacy/_common/_thread_pool_executor_with_context.py +15 -0
- azure/ai/evaluation/_legacy/prompty/_connection.py +11 -74
- azure/ai/evaluation/_legacy/prompty/_exceptions.py +80 -0
- azure/ai/evaluation/_legacy/prompty/_prompty.py +119 -9
- azure/ai/evaluation/_legacy/prompty/_utils.py +72 -2
- azure/ai/evaluation/_safety_evaluation/_safety_evaluation.py +90 -17
- azure/ai/evaluation/_version.py +1 -1
- azure/ai/evaluation/red_team/__init__.py +19 -0
- azure/ai/evaluation/{_red_team → red_team}/_attack_objective_generator.py +3 -0
- azure/ai/evaluation/{_red_team → red_team}/_attack_strategy.py +4 -1
- azure/ai/evaluation/{_red_team → red_team}/_red_team.py +885 -481
- azure/ai/evaluation/red_team/_red_team_result.py +382 -0
- azure/ai/evaluation/{_red_team → red_team}/_utils/constants.py +2 -1
- azure/ai/evaluation/{_red_team → red_team}/_utils/formatting_utils.py +23 -22
- azure/ai/evaluation/{_red_team → red_team}/_utils/logging_utils.py +1 -1
- azure/ai/evaluation/red_team/_utils/metric_mapping.py +23 -0
- azure/ai/evaluation/{_red_team → red_team}/_utils/strategy_utils.py +9 -5
- azure/ai/evaluation/simulator/_adversarial_simulator.py +63 -39
- azure/ai/evaluation/simulator/_constants.py +1 -0
- azure/ai/evaluation/simulator/_conversation/__init__.py +13 -6
- azure/ai/evaluation/simulator/_conversation/_conversation.py +2 -1
- azure/ai/evaluation/simulator/_direct_attack_simulator.py +35 -22
- azure/ai/evaluation/simulator/_helpers/_language_suffix_mapping.py +1 -0
- azure/ai/evaluation/simulator/_indirect_attack_simulator.py +40 -25
- azure/ai/evaluation/simulator/_model_tools/__init__.py +2 -1
- azure/ai/evaluation/simulator/_model_tools/_generated_rai_client.py +24 -18
- azure/ai/evaluation/simulator/_model_tools/_identity_manager.py +5 -10
- azure/ai/evaluation/simulator/_model_tools/_proxy_completion_model.py +65 -41
- azure/ai/evaluation/simulator/_model_tools/_template_handler.py +9 -5
- azure/ai/evaluation/simulator/_model_tools/models.py +20 -17
- azure/ai/evaluation/simulator/_simulator.py +1 -1
- {azure_ai_evaluation-1.4.0.dist-info → azure_ai_evaluation-1.6.0.dist-info}/METADATA +36 -2
- {azure_ai_evaluation-1.4.0.dist-info → azure_ai_evaluation-1.6.0.dist-info}/RECORD +148 -80
- azure/ai/evaluation/_red_team/_red_team_result.py +0 -246
- azure/ai/evaluation/simulator/_tracing.py +0 -89
- /azure/ai/evaluation/_legacy/{_batch_engine → _common}/_logging.py +0 -0
- /azure/ai/evaluation/{_red_team → red_team}/_callback_chat_target.py +0 -0
- /azure/ai/evaluation/{_red_team → red_team}/_default_converter.py +0 -0
- /azure/ai/evaluation/{_red_team → red_team/_utils}/__init__.py +0 -0
- {azure_ai_evaluation-1.4.0.dist-info → azure_ai_evaluation-1.6.0.dist-info}/NOTICE.txt +0 -0
- {azure_ai_evaluation-1.4.0.dist-info → azure_ai_evaluation-1.6.0.dist-info}/WHEEL +0 -0
- {azure_ai_evaluation-1.4.0.dist-info → azure_ai_evaluation-1.6.0.dist-info}/top_level.txt +0 -0
|
@@ -1,28 +1,78 @@
|
|
|
1
|
-
azure/ai/evaluation/__init__.py,sha256=
|
|
2
|
-
azure/ai/evaluation/_constants.py,sha256=
|
|
3
|
-
azure/ai/evaluation/
|
|
1
|
+
azure/ai/evaluation/__init__.py,sha256=hMKlEJjyULlBUt6ansPS1_2cLdz8iR715fikuMUZbyE,3794
|
|
2
|
+
azure/ai/evaluation/_constants.py,sha256=kptry2VQRoInON1SpCZ6yJSVNvdgYC0wfkxsV4K8u1w,3727
|
|
3
|
+
azure/ai/evaluation/_eval_mapping.py,sha256=skdfUfV1jG6jTdWTLVfOh0eeS60Gt0kvr-PJlDcvkzQ,2496
|
|
4
|
+
azure/ai/evaluation/_exceptions.py,sha256=XVliA6hj3C9Pz1ryBn0aC2izpno953VZwarTEfRumi0,5409
|
|
4
5
|
azure/ai/evaluation/_http_utils.py,sha256=1bGce6pKAL-vmaUGRPxVX7DVO05XVQ8YPIwIQ3q7mfA,17221
|
|
5
6
|
azure/ai/evaluation/_model_configurations.py,sha256=MNN6cQlz7P9vNfHmfEKsUcly3j1FEOEFsA8WV7GPuKQ,4043
|
|
6
7
|
azure/ai/evaluation/_user_agent.py,sha256=O2y-QPBAcw7w7qQ6M2aRPC3Vy3TKd789u5lcs2yuFaI,290
|
|
7
|
-
azure/ai/evaluation/_version.py,sha256=
|
|
8
|
+
azure/ai/evaluation/_version.py,sha256=cr6NakZmKvQuqv3P6cLeR8lJWiSwLUCWVqlMj_ZkEmA,229
|
|
8
9
|
azure/ai/evaluation/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
10
|
+
azure/ai/evaluation/_aoai/__init__.py,sha256=DE9av37bnDMCbYjgXAY9pcmCol7URCMkJCTIbRn1xHo,264
|
|
11
|
+
azure/ai/evaluation/_aoai/aoai_grader.py,sha256=PmpawSTWGGh6dwvwQYWvL19BDNbS77mVDSivuftQh_0,4128
|
|
12
|
+
azure/ai/evaluation/_aoai/label_grader.py,sha256=jTWIBOhF9qWlZl7kKH__Ynq6-YqKNgw91nHZfL2vnhw,2690
|
|
13
|
+
azure/ai/evaluation/_aoai/string_check_grader.py,sha256=sc5-D_aXYQGBeqX1U_rGKdO5hhSN7_u60Lesc3V9SsA,2303
|
|
14
|
+
azure/ai/evaluation/_aoai/text_similarity_grader.py,sha256=Hq2qIF4htGddW87gGFvBQTXCMOpjifZTpJtTTRQNg2Q,2874
|
|
9
15
|
azure/ai/evaluation/_azure/__init__.py,sha256=Yx1Iq2GNKQ5lYxTotvPwkPL4u0cm6YVxUe-iVbu1clI,180
|
|
10
|
-
azure/ai/evaluation/_azure/_clients.py,sha256=
|
|
16
|
+
azure/ai/evaluation/_azure/_clients.py,sha256=YugjJQKqbilvU2gorgtUiKFi3AQZLlsqPPQeWee4WbE,9116
|
|
17
|
+
azure/ai/evaluation/_azure/_envs.py,sha256=SBJL7wHOCzJ59nuHiOXK5fkoqe8CHMMKCLoPUWm6qRM,9393
|
|
11
18
|
azure/ai/evaluation/_azure/_models.py,sha256=Vxcg7WfpAyxLQ-EesZzLGqopguV9Oohfjf-vWKTOA-8,12527
|
|
12
|
-
azure/ai/evaluation/_azure/_token_manager.py,sha256=
|
|
13
|
-
azure/ai/evaluation/_common/__init__.py,sha256=
|
|
19
|
+
azure/ai/evaluation/_azure/_token_manager.py,sha256=_CGub9uIA-N6-9M6mm7gyk9m-B8kr4i1bw9GkqDKLQs,5450
|
|
20
|
+
azure/ai/evaluation/_common/__init__.py,sha256=vqpCpekamv-Cc75OuoGI06tywmX419hqYVztVMZYaLo,797
|
|
14
21
|
azure/ai/evaluation/_common/_experimental.py,sha256=GVtSn9r1CeR_yEa578dJVNDJ3P24eqe8WYdH7llbiQY,5694
|
|
15
22
|
azure/ai/evaluation/_common/constants.py,sha256=7gwcSbcJr-KHA-7Llmpuo4kap_l3X5-emAn2LMb_wk4,2281
|
|
23
|
+
azure/ai/evaluation/_common/evaluation_onedp_client.py,sha256=SU6udOg8lVJ6qZZeMm_GEhAYfbEBYOgjMAAjEbbyCjw,5537
|
|
16
24
|
azure/ai/evaluation/_common/math.py,sha256=d4bwWe35_RWDIZNcbV1BTBbHNx2QHQ4-I3EofDyyNE0,2863
|
|
17
|
-
azure/ai/evaluation/_common/rai_service.py,sha256=
|
|
18
|
-
azure/ai/evaluation/_common/utils.py,sha256=
|
|
25
|
+
azure/ai/evaluation/_common/rai_service.py,sha256=_V7nw27GPle94orsbxJtlGetATY8RvKEzf7SKgPMM9M,34454
|
|
26
|
+
azure/ai/evaluation/_common/utils.py,sha256=mbmPSjOxQHir6QfUDMZXFP85qBc_SQhZ8G1mFKd601M,21531
|
|
27
|
+
azure/ai/evaluation/_common/onedp/__init__.py,sha256=7bv0pblNvJFyhZArS85JZ1KLyVQ6Cly8z2q30wvEq2M,1058
|
|
28
|
+
azure/ai/evaluation/_common/onedp/_client.py,sha256=Gc_mtATKUHML5znufEDlfTx8F08UYBLASSNC3Gb2tZ8,7045
|
|
29
|
+
azure/ai/evaluation/_common/onedp/_configuration.py,sha256=tPyQO1oE9BnPX23L65idp-BAIcOvfD2FP3S3ihiW4LY,3968
|
|
30
|
+
azure/ai/evaluation/_common/onedp/_model_base.py,sha256=tbXHyIgoCiU8Uh3SB5Jjz2TuPnyRP1_bCt6_BBb9r2c,46553
|
|
31
|
+
azure/ai/evaluation/_common/onedp/_patch.py,sha256=xrdxsiXieQiFZyh8B1lHWF80DiQWHmbyjZR5mb8coyM,868
|
|
32
|
+
azure/ai/evaluation/_common/onedp/_serialization.py,sha256=k_AMNNhSC5sPfO7dRCNJCofOjY7aN3V87RBVWJLEnrY,83996
|
|
33
|
+
azure/ai/evaluation/_common/onedp/_types.py,sha256=qau1w2QFg7SfL3E7kmzae7csROBC9ItzP1weVxen1Wg,1002
|
|
34
|
+
azure/ai/evaluation/_common/onedp/_validation.py,sha256=YJCAW5n9KBiqy4VhHiyi8RsPrZow6MEqLg5aJBSxCS4,2145
|
|
35
|
+
azure/ai/evaluation/_common/onedp/_vendor.py,sha256=CGcoyL5I2sHqUfQSqadr_wcuYGsgVCB2MABM-48nK9I,1974
|
|
36
|
+
azure/ai/evaluation/_common/onedp/_version.py,sha256=ZQEsxtJ7-eB_7Kd1H2WlD4WBVQa9O1w38FjpdWxfcZM,495
|
|
37
|
+
azure/ai/evaluation/_common/onedp/py.typed,sha256=dcrsqJrcYfTX-ckLFJMTaj6mD8aDe2u0tkQG-ZYxnEg,26
|
|
38
|
+
azure/ai/evaluation/_common/onedp/aio/__init__.py,sha256=oJCCFsFKTRCs199f2Ai_pIrSOuDyN31Oy1nU8Ix5MbY,1002
|
|
39
|
+
azure/ai/evaluation/_common/onedp/aio/_client.py,sha256=cAs4ZFBDR7LMnkljtjL3OyYh59jLoQ3LvXe1PPF6mKo,7240
|
|
40
|
+
azure/ai/evaluation/_common/onedp/aio/_configuration.py,sha256=Ej37oE15iQQvQWrBlFd41JIlQDTIOd3_uYd_s0e_oYY,4027
|
|
41
|
+
azure/ai/evaluation/_common/onedp/aio/_patch.py,sha256=xrdxsiXieQiFZyh8B1lHWF80DiQWHmbyjZR5mb8coyM,868
|
|
42
|
+
azure/ai/evaluation/_common/onedp/aio/_vendor.py,sha256=lBk0_C6_NYtQeLUL7uM-wFVQJiZAKIdzWct_FPqBKVc,1553
|
|
43
|
+
azure/ai/evaluation/_common/onedp/aio/operations/__init__.py,sha256=2rIhesutTPrcc8BUqSVkRpkQdxTI5lzucEOqj552P0E,1618
|
|
44
|
+
azure/ai/evaluation/_common/onedp/aio/operations/_operations.py,sha256=gMarwhuHtGir6Dms-IHeYZ95oRPnIskq7pHkI_ea7do,194836
|
|
45
|
+
azure/ai/evaluation/_common/onedp/aio/operations/_patch.py,sha256=xrdxsiXieQiFZyh8B1lHWF80DiQWHmbyjZR5mb8coyM,868
|
|
46
|
+
azure/ai/evaluation/_common/onedp/models/__init__.py,sha256=p79kpWIXyKU6pq2JdTzzqsel_LT_MmvOAxo2ja_4aF0,3545
|
|
47
|
+
azure/ai/evaluation/_common/onedp/models/_enums.py,sha256=xWkVAfjZGxnQsaGENmgpfKADv38Sb0mVliUW8i-dCeQ,5814
|
|
48
|
+
azure/ai/evaluation/_common/onedp/models/_models.py,sha256=VIP7RCP-48LSMfc4m0HPSgt40sCnciKNjlV_C-p5H0E,92197
|
|
49
|
+
azure/ai/evaluation/_common/onedp/models/_patch.py,sha256=xrdxsiXieQiFZyh8B1lHWF80DiQWHmbyjZR5mb8coyM,868
|
|
50
|
+
azure/ai/evaluation/_common/onedp/operations/__init__.py,sha256=2rIhesutTPrcc8BUqSVkRpkQdxTI5lzucEOqj552P0E,1618
|
|
51
|
+
azure/ai/evaluation/_common/onedp/operations/_operations.py,sha256=ctlV_BRhHimvHawGXCSCtdoC7BvnrRAUGDxBm8tmf5o,240792
|
|
52
|
+
azure/ai/evaluation/_common/onedp/operations/_patch.py,sha256=xrdxsiXieQiFZyh8B1lHWF80DiQWHmbyjZR5mb8coyM,868
|
|
53
|
+
azure/ai/evaluation/_common/onedp/servicepatterns/__init__.py,sha256=SXUyE9hmQeYBcmIxmXrAZAIeYfMHAA7cy2vPwgRceTo,82
|
|
54
|
+
azure/ai/evaluation/_common/onedp/servicepatterns/aio/__init__.py,sha256=SXUyE9hmQeYBcmIxmXrAZAIeYfMHAA7cy2vPwgRceTo,82
|
|
55
|
+
azure/ai/evaluation/_common/onedp/servicepatterns/aio/operations/__init__.py,sha256=EJcjNzeaFGEcGGDiRmhJKlwinPSKrnC75puUAuvgIxU,968
|
|
56
|
+
azure/ai/evaluation/_common/onedp/servicepatterns/aio/operations/_operations.py,sha256=CaLZlRTwEtb3zM4aOoNbvYpqfdVRub8UjoKyeD03JNc,1710
|
|
57
|
+
azure/ai/evaluation/_common/onedp/servicepatterns/aio/operations/_patch.py,sha256=YTV6yZ9bRfBBaw2z7v4MdzR-zeHkdtKkGb4SU8C25mE,694
|
|
58
|
+
azure/ai/evaluation/_common/onedp/servicepatterns/buildingblocks/__init__.py,sha256=SXUyE9hmQeYBcmIxmXrAZAIeYfMHAA7cy2vPwgRceTo,82
|
|
59
|
+
azure/ai/evaluation/_common/onedp/servicepatterns/buildingblocks/aio/__init__.py,sha256=SXUyE9hmQeYBcmIxmXrAZAIeYfMHAA7cy2vPwgRceTo,82
|
|
60
|
+
azure/ai/evaluation/_common/onedp/servicepatterns/buildingblocks/aio/operations/__init__.py,sha256=ExsXzY-HrLRduI0vvK8pgfQ-I1PRDJ0gIt-l3L-ykBc,864
|
|
61
|
+
azure/ai/evaluation/_common/onedp/servicepatterns/buildingblocks/aio/operations/_operations.py,sha256=vZQ_OM2Bbs_H_EHhoJklVtF5tzmI4O0cGEoytseqC5Y,1465
|
|
62
|
+
azure/ai/evaluation/_common/onedp/servicepatterns/buildingblocks/aio/operations/_patch.py,sha256=YTV6yZ9bRfBBaw2z7v4MdzR-zeHkdtKkGb4SU8C25mE,694
|
|
63
|
+
azure/ai/evaluation/_common/onedp/servicepatterns/buildingblocks/operations/__init__.py,sha256=ExsXzY-HrLRduI0vvK8pgfQ-I1PRDJ0gIt-l3L-ykBc,864
|
|
64
|
+
azure/ai/evaluation/_common/onedp/servicepatterns/buildingblocks/operations/_operations.py,sha256=VO7oD8sQVy5OvpY9oat7em_hDC9D_MCPna2pTj32FuQ,1437
|
|
65
|
+
azure/ai/evaluation/_common/onedp/servicepatterns/buildingblocks/operations/_patch.py,sha256=YTV6yZ9bRfBBaw2z7v4MdzR-zeHkdtKkGb4SU8C25mE,694
|
|
66
|
+
azure/ai/evaluation/_common/onedp/servicepatterns/operations/__init__.py,sha256=EJcjNzeaFGEcGGDiRmhJKlwinPSKrnC75puUAuvgIxU,968
|
|
67
|
+
azure/ai/evaluation/_common/onedp/servicepatterns/operations/_operations.py,sha256=sCKc8EBwTsb4n_R7XkN0lTKDgEn_Rpn-aTmZR4vf4AU,1677
|
|
68
|
+
azure/ai/evaluation/_common/onedp/servicepatterns/operations/_patch.py,sha256=YTV6yZ9bRfBBaw2z7v4MdzR-zeHkdtKkGb4SU8C25mE,694
|
|
19
69
|
azure/ai/evaluation/_common/raiclient/__init__.py,sha256=SaoPfbEPhdoXpIKqOPmRVNyYky1mW5c7UobHt08ksAI,1153
|
|
20
70
|
azure/ai/evaluation/_common/raiclient/_client.py,sha256=ZnFRcpZ0UD3MeFWnJ44AbkbUqPHsvGM502ra28pm_No,5812
|
|
21
71
|
azure/ai/evaluation/_common/raiclient/_configuration.py,sha256=exABHzDcOl5295p5LnWxL82x21z6_ruyBbigW3WoQRA,4246
|
|
22
72
|
azure/ai/evaluation/_common/raiclient/_model_base.py,sha256=loH1BeKpp3UeO6hFvAzcNbT2hhotWQIDu3JRQgQZV_M,45135
|
|
23
73
|
azure/ai/evaluation/_common/raiclient/_patch.py,sha256=P7PMm3Gbjlk56lI6B_Ra43hSW5qGMEmN3cNYGH5uZ3s,674
|
|
24
74
|
azure/ai/evaluation/_common/raiclient/_serialization.py,sha256=vN_jYB0jHUw2hVIWB6M9n6_0AvFw9mFa3ndcz2y6gaQ,82802
|
|
25
|
-
azure/ai/evaluation/_common/raiclient/_version.py,sha256=
|
|
75
|
+
azure/ai/evaluation/_common/raiclient/_version.py,sha256=76LuocLOwOy3djE39t9CSJF4weFNBTrW_dLz8HaJpQo,484
|
|
26
76
|
azure/ai/evaluation/_common/raiclient/py.typed,sha256=dcrsqJrcYfTX-ckLFJMTaj6mD8aDe2u0tkQG-ZYxnEg,26
|
|
27
77
|
azure/ai/evaluation/_common/raiclient/aio/__init__.py,sha256=hq21DCvcidiGXghKHYHLNSfEMNjbj43jyVssEV6fF3M,1001
|
|
28
78
|
azure/ai/evaluation/_common/raiclient/aio/_client.py,sha256=D8Qx3tiOEgbnv1M8nU6_rJB8QG0JdY7rwwTcLLgv36w,5961
|
|
@@ -38,21 +88,22 @@ azure/ai/evaluation/_common/raiclient/models/_patch.py,sha256=P7PMm3Gbjlk56lI6B_
|
|
|
38
88
|
azure/ai/evaluation/_common/raiclient/operations/__init__.py,sha256=Ah41eszCE4ZDISukKSdOWQQcZGv0TbDduaT35Q8PQz8,925
|
|
39
89
|
azure/ai/evaluation/_common/raiclient/operations/_operations.py,sha256=_-B8zU6GQ4RciGvBcAoVNlfGdNXaqf2XsS3EP-kYu10,50944
|
|
40
90
|
azure/ai/evaluation/_common/raiclient/operations/_patch.py,sha256=P7PMm3Gbjlk56lI6B_Ra43hSW5qGMEmN3cNYGH5uZ3s,674
|
|
41
|
-
azure/ai/evaluation/_converters/__init__.py,sha256=
|
|
42
|
-
azure/ai/evaluation/_converters/_ai_services.py,sha256=
|
|
91
|
+
azure/ai/evaluation/_converters/__init__.py,sha256=UwArlb5cGLN4pRUm8nG7mXsmxhgdIving2OslYhQDAg,179
|
|
92
|
+
azure/ai/evaluation/_converters/_ai_services.py,sha256=U2s-KdCAv4ja-Xo0nGUhjIQEoyg9QmSj2Dqt73uufUo,37091
|
|
43
93
|
azure/ai/evaluation/_converters/_models.py,sha256=LlrB7Vj_uW3-Ng06b3EHahRXf690W4j2XfYihS7dejo,11029
|
|
44
94
|
azure/ai/evaluation/_evaluate/__init__.py,sha256=Yx1Iq2GNKQ5lYxTotvPwkPL4u0cm6YVxUe-iVbu1clI,180
|
|
45
|
-
azure/ai/evaluation/_evaluate/_eval_run.py,sha256=
|
|
46
|
-
azure/ai/evaluation/_evaluate/_evaluate.py,sha256=
|
|
47
|
-
azure/ai/evaluation/_evaluate/
|
|
95
|
+
azure/ai/evaluation/_evaluate/_eval_run.py,sha256=ZlDvTNDiMSZ2VfzVicPmEGx65LL3LmcKcPWft6XjWcA,21991
|
|
96
|
+
azure/ai/evaluation/_evaluate/_evaluate.py,sha256=Loh9IlLzrPnEdxm9dsfQhBT0PLmrOujbMhNe1G1zT10,50689
|
|
97
|
+
azure/ai/evaluation/_evaluate/_evaluate_aoai.py,sha256=lxBPDBTddEVAIwoXTEbwNmuaR10Wdcqz6NVmBSZxjio,23899
|
|
98
|
+
azure/ai/evaluation/_evaluate/_utils.py,sha256=w-71izKmbqaA4aOLCop6Jj39Z6bWGpB1INy70MpYxws,18899
|
|
48
99
|
azure/ai/evaluation/_evaluate/_batch_run/__init__.py,sha256=cPLi_MJ_pCp8eKBxJbiSoxgTnN3nDLuaP57dMkKuyhg,552
|
|
49
|
-
azure/ai/evaluation/_evaluate/_batch_run/_run_submitter_client.py,sha256=
|
|
100
|
+
azure/ai/evaluation/_evaluate/_batch_run/_run_submitter_client.py,sha256=UkqF7iJUY9lxxMKPuLSsOtLpp3rzq-PTbUnSLq-LQc0,4650
|
|
50
101
|
azure/ai/evaluation/_evaluate/_batch_run/batch_clients.py,sha256=dTZYdQGweGzEN6OHtn1jOmGG767AJ7RJwfHoCCeRddg,2761
|
|
51
|
-
azure/ai/evaluation/_evaluate/_batch_run/code_client.py,sha256=
|
|
52
|
-
azure/ai/evaluation/_evaluate/_batch_run/eval_run_context.py,sha256=
|
|
53
|
-
azure/ai/evaluation/_evaluate/_batch_run/proxy_client.py,sha256=
|
|
54
|
-
azure/ai/evaluation/_evaluate/_batch_run/target_run_context.py,sha256=
|
|
55
|
-
azure/ai/evaluation/_evaluate/_telemetry/__init__.py,sha256=
|
|
102
|
+
azure/ai/evaluation/_evaluate/_batch_run/code_client.py,sha256=n4JxDAFNnetfpAj4FyhtZms3kuGmDWXCBOogqeO4F98,8607
|
|
103
|
+
azure/ai/evaluation/_evaluate/_batch_run/eval_run_context.py,sha256=RlmmmKKIoosXW2lGXM3crYBYWHHYHQAXU9JO5ATOrIQ,4052
|
|
104
|
+
azure/ai/evaluation/_evaluate/_batch_run/proxy_client.py,sha256=jgHSi0ixvwla9q0EoMDHsN7fm8nezU0iuj4qyNLRHV8,4853
|
|
105
|
+
azure/ai/evaluation/_evaluate/_batch_run/target_run_context.py,sha256=TrZ_IkbU8DeJkZajw22F9DWWFVg0sCBY6bgC9QlHTQ0,2420
|
|
106
|
+
azure/ai/evaluation/_evaluate/_telemetry/__init__.py,sha256=tBZ98BC8sIuANCTZsgONQblR-Vrw2oIcRqjjyHxbZio,3513
|
|
56
107
|
azure/ai/evaluation/_evaluators/__init__.py,sha256=Yx1Iq2GNKQ5lYxTotvPwkPL4u0cm6YVxUe-iVbu1clI,180
|
|
57
108
|
azure/ai/evaluation/_evaluators/_bleu/__init__.py,sha256=quKKO0kvOSkky5hcoNBvgBuMeeVRFCE9GSv70mAdGP4,260
|
|
58
109
|
azure/ai/evaluation/_evaluators/_bleu/_bleu.py,sha256=ZX12bWcDop7HX5hXT2im2KLIJTWik9ok67zK2hZo1WY,4429
|
|
@@ -62,10 +113,10 @@ azure/ai/evaluation/_evaluators/_coherence/__init__.py,sha256=GRqcSCQse02Spyki0U
|
|
|
62
113
|
azure/ai/evaluation/_evaluators/_coherence/_coherence.py,sha256=IFk4RYa0h39i9GbtUYDph78ELx9GTJ6gzk4-oBtdL34,5378
|
|
63
114
|
azure/ai/evaluation/_evaluators/_coherence/coherence.prompty,sha256=ANvh9mDFW7KMejrgdWqBLjj4SIqEO5WW9gg5pE0RLJk,6798
|
|
64
115
|
azure/ai/evaluation/_evaluators/_common/__init__.py,sha256=xAymP_CZy4aPzWplMdXgQUQVDIUEMI-0nbgdm_umFYY,498
|
|
65
|
-
azure/ai/evaluation/_evaluators/_common/_base_eval.py,sha256
|
|
66
|
-
azure/ai/evaluation/_evaluators/_common/_base_multi_eval.py,sha256=
|
|
67
|
-
azure/ai/evaluation/_evaluators/_common/_base_prompty_eval.py,sha256=
|
|
68
|
-
azure/ai/evaluation/_evaluators/_common/_base_rai_svc_eval.py,sha256=
|
|
116
|
+
azure/ai/evaluation/_evaluators/_common/_base_eval.py,sha256=-ay2631R91F7qjTpqAGJLsPnNYB8rXAhyU0wkZQTExk,25744
|
|
117
|
+
azure/ai/evaluation/_evaluators/_common/_base_multi_eval.py,sha256=yYFpoCDe2wMFQck0ykbX8IJBBidk6NT1wUTkVFlVSy8,2728
|
|
118
|
+
azure/ai/evaluation/_evaluators/_common/_base_prompty_eval.py,sha256=p7i5WkRljrCtidd6oF_A6iWcwNFrZMVoaVjEyoBTXig,6715
|
|
119
|
+
azure/ai/evaluation/_evaluators/_common/_base_rai_svc_eval.py,sha256=pJHOMYS7vmVEk6PYvIu1VTi0WbNXTZhuh5q2p12ydgg,8569
|
|
69
120
|
azure/ai/evaluation/_evaluators/_common/_conversation_aggregators.py,sha256=gjDBjRxJKwaHbshWH0j2idjlzfzNMnT9a9RL0fQiKeM,2129
|
|
70
121
|
azure/ai/evaluation/_evaluators/_content_safety/__init__.py,sha256=PEYMIybfP64f7byhuTaiq4RiqsYbjqejpW1JsJIG1jA,556
|
|
71
122
|
azure/ai/evaluation/_evaluators/_content_safety/_content_safety.py,sha256=xZwQnmSqaKmLtZaDAoM4vZxOVeudGQaVxa5GLV03NwI,6309
|
|
@@ -73,21 +124,23 @@ azure/ai/evaluation/_evaluators/_content_safety/_hate_unfairness.py,sha256=uEnsy
|
|
|
73
124
|
azure/ai/evaluation/_evaluators/_content_safety/_self_harm.py,sha256=wNyUm2QT1_Jpm7a8uOy74rOMF3yGNupC10g_kbEwRBI,5854
|
|
74
125
|
azure/ai/evaluation/_evaluators/_content_safety/_sexual.py,sha256=-yuKdXd98wQazlQ8s1bB7yee-sAIm-vHlVzDW1sC1t0,6099
|
|
75
126
|
azure/ai/evaluation/_evaluators/_content_safety/_violence.py,sha256=8SwwogI7gBFep_KQKh0SjiNkbxreQToXtUDMr1L6jpA,6159
|
|
127
|
+
azure/ai/evaluation/_evaluators/_document_retrieval/__init__.py,sha256=nefQB4uzoFDrITcU3aYY1lou2pc4ASGvSeMoejS8jM8,399
|
|
128
|
+
azure/ai/evaluation/_evaluators/_document_retrieval/_document_retrieval.py,sha256=jqTENMQ6DvVfh04tqiEPbWyUETzcQ7CgV7Oo8j8tMec,19875
|
|
76
129
|
azure/ai/evaluation/_evaluators/_eci/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
77
130
|
azure/ai/evaluation/_evaluators/_eci/_eci.py,sha256=a36sLZPHKi3YAdl0JvpL6vboZMqgGjnmz0qZ-o8vcWY,2934
|
|
78
131
|
azure/ai/evaluation/_evaluators/_f1_score/__init__.py,sha256=aEVbO7iMoF20obdpLQKcKm69Yyu3mYnblKELLqu8OGI,260
|
|
79
132
|
azure/ai/evaluation/_evaluators/_f1_score/_f1_score.py,sha256=Nt4QgiJew6cuLyE3fsy9tizNsC8Rk2vCBiu1FA2doAY,6483
|
|
80
133
|
azure/ai/evaluation/_evaluators/_fluency/__init__.py,sha256=EEJw39xRa0bOAA1rELTTKXQu2s60n_7CZQRD0Gu2QVw,259
|
|
81
|
-
azure/ai/evaluation/_evaluators/_fluency/_fluency.py,sha256=
|
|
134
|
+
azure/ai/evaluation/_evaluators/_fluency/_fluency.py,sha256=BcIElBCXVAB0BOy-PO8Do3wbYW7kisnBOse1DAh1I34,5092
|
|
82
135
|
azure/ai/evaluation/_evaluators/_fluency/fluency.prompty,sha256=n9v0W9eYwgIO-JSsLTSKEM_ApJuxxuKWQpNblrTEkFY,4861
|
|
83
136
|
azure/ai/evaluation/_evaluators/_gleu/__init__.py,sha256=Ae2EvQ7gqiYAoNO3LwGIhdAAjJPJDfT85rQGKrRrmbA,260
|
|
84
137
|
azure/ai/evaluation/_evaluators/_gleu/_gleu.py,sha256=QnogGvw2JmmV4YZCOvoZMMvoB9JMAjnac2r5h806zmI,4421
|
|
85
138
|
azure/ai/evaluation/_evaluators/_groundedness/__init__.py,sha256=UYNJUeRvBwcSVFyZpdsf29un5eyaDzYoo3QvC1gvlLg,274
|
|
86
|
-
azure/ai/evaluation/_evaluators/_groundedness/_groundedness.py,sha256=
|
|
139
|
+
azure/ai/evaluation/_evaluators/_groundedness/_groundedness.py,sha256=f048eUv5z2vt_TULghxplAinhp8nqWkO5_AX4AgLWyM,7634
|
|
87
140
|
azure/ai/evaluation/_evaluators/_groundedness/groundedness_with_query.prompty,sha256=v7TOm75DyW_1gOU6gSiZoPcRnHcJ65DrzR2cL_ucWDY,5814
|
|
88
141
|
azure/ai/evaluation/_evaluators/_groundedness/groundedness_without_query.prompty,sha256=8kNShdfxQvkII7GnqjmdqQ5TNelA2B6cjnqWZk8FFe4,5296
|
|
89
142
|
azure/ai/evaluation/_evaluators/_intent_resolution/__init__.py,sha256=Lr8krXt2yfShFTAuwjTFgrUbO75boLLrRSnF1mriN_Q,280
|
|
90
|
-
azure/ai/evaluation/_evaluators/_intent_resolution/_intent_resolution.py,sha256=
|
|
143
|
+
azure/ai/evaluation/_evaluators/_intent_resolution/_intent_resolution.py,sha256=ybloJdawB6CyB23dEUo3yfKGNO7CxHk6gxWTJYA5ka8,10895
|
|
91
144
|
azure/ai/evaluation/_evaluators/_intent_resolution/intent_resolution.prompty,sha256=p8_V-bB3uOqqXWRsDNa4eIOoP8U-_D-5fZuCNSL8ZUU,7467
|
|
92
145
|
azure/ai/evaluation/_evaluators/_meteor/__init__.py,sha256=209na3pPsdmcuYpYHUYtqQybCpc3yZkc93HnRdicSlI,266
|
|
93
146
|
azure/ai/evaluation/_evaluators/_meteor/_meteor.py,sha256=DCWzH-wtWlWKkMUXK7nN-hpBYqEKT5cZSl6ikMNaNkw,5462
|
|
@@ -96,11 +149,11 @@ azure/ai/evaluation/_evaluators/_protected_material/_protected_material.py,sha25
|
|
|
96
149
|
azure/ai/evaluation/_evaluators/_qa/__init__.py,sha256=bcXfT--C0hjym2haqd1B2-u9bDciyM0ThOFtU1Q69sk,244
|
|
97
150
|
azure/ai/evaluation/_evaluators/_qa/_qa.py,sha256=A0amMuVRCgcHP567LkXnFXJAWCzdPQfSxisbKLycASw,5772
|
|
98
151
|
azure/ai/evaluation/_evaluators/_relevance/__init__.py,sha256=JlxytW32Nl8pbE-fI3GRpfgVuY9EG6zxIAn5VZGSwyc,265
|
|
99
|
-
azure/ai/evaluation/_evaluators/_relevance/_relevance.py,sha256=
|
|
152
|
+
azure/ai/evaluation/_evaluators/_relevance/_relevance.py,sha256=ArHNIBnoSLoedjenuZD4cq-p15I31BjIZDs-17OZpNk,6068
|
|
100
153
|
azure/ai/evaluation/_evaluators/_relevance/relevance.prompty,sha256=VHKzVlC2Cv1xuholgIGmerPspspAI0t6IgJ2cxOuYDE,4811
|
|
101
154
|
azure/ai/evaluation/_evaluators/_response_completeness/__init__.py,sha256=U3eqkQQAgRif46B6UGdq3yWefgbkZGJ3ZE2sKoZQDlU,292
|
|
102
|
-
azure/ai/evaluation/_evaluators/_response_completeness/_response_completeness.py,sha256=
|
|
103
|
-
azure/ai/evaluation/_evaluators/_response_completeness/response_completeness.prompty,sha256=
|
|
155
|
+
azure/ai/evaluation/_evaluators/_response_completeness/_response_completeness.py,sha256=oClDNyE42eI3K6qz5n8yIpFhtBqwmDhQU6tBMUQMZrs,7553
|
|
156
|
+
azure/ai/evaluation/_evaluators/_response_completeness/response_completeness.prompty,sha256=25PqzWWtpwvsKNnBGDNfqsKKo2RpyeiIFzvK8sauPDg,7520
|
|
104
157
|
azure/ai/evaluation/_evaluators/_retrieval/__init__.py,sha256=kMu47ZyTZ7f-4Yh6H3KHxswmxitmPJ8FPSk90qgR0XI,265
|
|
105
158
|
azure/ai/evaluation/_evaluators/_retrieval/_retrieval.py,sha256=eddgpihSjZwQH58lcfL0vYh-07H_TOVT8dt_MxRZfBk,5791
|
|
106
159
|
azure/ai/evaluation/_evaluators/_retrieval/retrieval.prompty,sha256=_YVoO4Gt_WD42bUcj5n6BDW0dMUqNf0yF3Nj5XMOX2c,16490
|
|
@@ -109,89 +162,104 @@ azure/ai/evaluation/_evaluators/_rouge/_rouge.py,sha256=BrOr7qj_jLDPSbOy4jupF6FW
|
|
|
109
162
|
azure/ai/evaluation/_evaluators/_service_groundedness/__init__.py,sha256=0DODUGTOgaYyFbO9_zxuwifixDL3SIm3EkwP1sdwn6M,288
|
|
110
163
|
azure/ai/evaluation/_evaluators/_service_groundedness/_service_groundedness.py,sha256=YkmGxWOIzuPaBoxY2rxlkOQzw-atyo9lKtGgv34wulw,7544
|
|
111
164
|
azure/ai/evaluation/_evaluators/_similarity/__init__.py,sha256=V2Mspog99_WBltxTkRHG5NpN5s9XoiTSN4I8POWEkLA,268
|
|
112
|
-
azure/ai/evaluation/_evaluators/_similarity/_similarity.py,sha256=
|
|
165
|
+
azure/ai/evaluation/_evaluators/_similarity/_similarity.py,sha256=AbvDy2Cj6XTFCWa4plnPfPt-ElObI-9Xp5bH3Lr40MI,4934
|
|
113
166
|
azure/ai/evaluation/_evaluators/_similarity/similarity.prompty,sha256=eoludASychZoGL625bFCaZai-OY7DIAg90ZLax_o4XE,4594
|
|
114
167
|
azure/ai/evaluation/_evaluators/_task_adherence/__init__.py,sha256=9HtNrG7yYX0Ygq3cZoS_0obAvGgmy5HWcsBcPKoB15c,271
|
|
115
|
-
azure/ai/evaluation/_evaluators/_task_adherence/_task_adherence.py,sha256=
|
|
168
|
+
azure/ai/evaluation/_evaluators/_task_adherence/_task_adherence.py,sha256=Cj1GbAV_VHvVcgelKcfbqxhb2HFIVazFLPIk32qC4I4,9788
|
|
116
169
|
azure/ai/evaluation/_evaluators/_task_adherence/task_adherence.prompty,sha256=tOgTrDO41jsFHloabSBCWcbwKB1MtGGxHH_pyFIn2Vk,5350
|
|
117
170
|
azure/ai/evaluation/_evaluators/_tool_call_accuracy/__init__.py,sha256=vYB4Y_3n1LqTiEeZB1O1A0b14wpURBwtW0wPEN2FG9Q,288
|
|
118
|
-
azure/ai/evaluation/_evaluators/_tool_call_accuracy/_tool_call_accuracy.py,sha256=
|
|
171
|
+
azure/ai/evaluation/_evaluators/_tool_call_accuracy/_tool_call_accuracy.py,sha256=t4muegaCS-NP1BW0a3ojST1Ws9ZVZYSnyFixZP_0Mtg,14706
|
|
119
172
|
azure/ai/evaluation/_evaluators/_tool_call_accuracy/tool_call_accuracy.prompty,sha256=0YgN5SwlWCdcqHAhRU5NEVlZL062tQMiFil0bvdppn4,3890
|
|
120
173
|
azure/ai/evaluation/_evaluators/_ungrounded_attributes/__init__.py,sha256=wGZBd_cRDgkuS-0HV9qm81dHK7ScYdKd98xLPtk6EwQ,118
|
|
121
174
|
azure/ai/evaluation/_evaluators/_ungrounded_attributes/_ungrounded_attributes.py,sha256=h534CBX_OfFcmb_QmGKl6MURvmvewbleqeg8iCBZq8c,3800
|
|
122
175
|
azure/ai/evaluation/_evaluators/_xpia/__init__.py,sha256=VMEL8WrpJQeh4sQiOLzP7hRFPnjzsvwfvTzaGCVJPCM,88
|
|
123
176
|
azure/ai/evaluation/_evaluators/_xpia/xpia.py,sha256=64ersTyBvmkl2lvuuh5YJqJ2Ow0RUzjlqxZCnhYhS0g,5958
|
|
124
177
|
azure/ai/evaluation/_legacy/__init__.py,sha256=Yx1Iq2GNKQ5lYxTotvPwkPL4u0cm6YVxUe-iVbu1clI,180
|
|
178
|
+
azure/ai/evaluation/_legacy/_adapters/__init__.py,sha256=LGQk1gGjDTCtd-vEQj6ObYyK7Mff9zL1jFOq7iTrOSU,450
|
|
179
|
+
azure/ai/evaluation/_legacy/_adapters/_check.py,sha256=ojKjHEtjzfg9QA4o4vH4cLVpdw1F-7snxCQ-sdjRFig,426
|
|
180
|
+
azure/ai/evaluation/_legacy/_adapters/_configuration.py,sha256=aDukrNbyXz9zPHYKpmXrLthnJoJQziP1WL793nIuC28,1677
|
|
181
|
+
azure/ai/evaluation/_legacy/_adapters/_constants.py,sha256=MmTUbPSCiM4eLtAA5LIsD6sN1B9IuFB-RTuUnxbwZSs,386
|
|
182
|
+
azure/ai/evaluation/_legacy/_adapters/_errors.py,sha256=SSyaGsqGzzrIeOKEGTtIzhKnAIg_oJw5ze5KMPIfw2Y,1175
|
|
183
|
+
azure/ai/evaluation/_legacy/_adapters/_flows.py,sha256=Mk9YXp3bIRCp_HQDFXcN5n2C8lrkAwWQAo6g9XZxf-Q,769
|
|
184
|
+
azure/ai/evaluation/_legacy/_adapters/_service.py,sha256=4xlpxSCrH0jWyKVazu-qhe42KgFksKWVPQqDqf7CFGY,423
|
|
185
|
+
azure/ai/evaluation/_legacy/_adapters/client.py,sha256=76XEJJ2GoKJsfHfMSvixU8oSI6ePtJQBG10x9PXVUxM,1770
|
|
186
|
+
azure/ai/evaluation/_legacy/_adapters/entities.py,sha256=4ZYXfawx5w7t0pyEdm7g49eAJwct2QtcZX0ZvB_6uHU,710
|
|
187
|
+
azure/ai/evaluation/_legacy/_adapters/tracing.py,sha256=jm-lkzLA-agRY1meIzs9mFrzJ1A3dBodi6HgjklIjD0,1162
|
|
188
|
+
azure/ai/evaluation/_legacy/_adapters/types.py,sha256=q7n0TtpFxd1WttbUR_Q8ODd8bTcMaJjIrxLXx1onirc,447
|
|
189
|
+
azure/ai/evaluation/_legacy/_adapters/utils.py,sha256=2KdYqfeuHLcfqk1qJRviNoqqsghxBZNmyoGcUTNphl0,1306
|
|
125
190
|
azure/ai/evaluation/_legacy/_batch_engine/__init__.py,sha256=NNX2DhtPVzJCX8kR_QzZ6EkUsdGifvwip2LHEcRwy1Y,594
|
|
126
191
|
azure/ai/evaluation/_legacy/_batch_engine/_config.py,sha256=-B37cIbWOWEB3kTaNjHGLfQNbLa-XAP1gWm0Kvyv82k,1724
|
|
127
|
-
azure/ai/evaluation/_legacy/_batch_engine/_engine.py,sha256=
|
|
192
|
+
azure/ai/evaluation/_legacy/_batch_engine/_engine.py,sha256=ZXTqKxUlhTfEoU3iyx6Y3Ru6akXVrgOD9ArkUMfs5VI,16659
|
|
128
193
|
azure/ai/evaluation/_legacy/_batch_engine/_exceptions.py,sha256=_QQLowht6ww4wBJbShQBo00Y8HFdaWh-dWd44sGvJBc,2870
|
|
129
|
-
azure/ai/evaluation/_legacy/_batch_engine/
|
|
130
|
-
azure/ai/evaluation/_legacy/_batch_engine/
|
|
131
|
-
azure/ai/evaluation/_legacy/_batch_engine/
|
|
132
|
-
azure/ai/evaluation/_legacy/_batch_engine/_run.py,sha256=b9eJOorEHcGJqE7cApvJpY3JpUdCv3ZVNFo4ZKlfWNA,4343
|
|
194
|
+
azure/ai/evaluation/_legacy/_batch_engine/_openai_injector.py,sha256=nmljSr5yGgiYRi6gD80IiTMSQNwDlAep9ILjZqRYJEI,5027
|
|
195
|
+
azure/ai/evaluation/_legacy/_batch_engine/_result.py,sha256=tPnI7Ab2t89ri4kvplJPvKBb0BOrMDQm3HAPXZuhp60,3471
|
|
196
|
+
azure/ai/evaluation/_legacy/_batch_engine/_run.py,sha256=iNLMtkjvsbgivB59xWuB77kyZKxU40YhwoaJ_djuAcc,4491
|
|
133
197
|
azure/ai/evaluation/_legacy/_batch_engine/_run_storage.py,sha256=KjiKaSjT16L_wLYrZpIeBANtin3fa4Gqd3L-Xjw-59I,3418
|
|
134
|
-
azure/ai/evaluation/_legacy/_batch_engine/_run_submitter.py,sha256=
|
|
135
|
-
azure/ai/evaluation/_legacy/_batch_engine/_status.py,sha256=
|
|
136
|
-
azure/ai/evaluation/_legacy/_batch_engine/_trace.py,sha256=
|
|
137
|
-
azure/ai/evaluation/_legacy/_batch_engine/_utils.py,sha256=
|
|
198
|
+
azure/ai/evaluation/_legacy/_batch_engine/_run_submitter.py,sha256=sGv91UgMZ2rK1Iq0J1CfQX824YSn6s-IR05NPWGCDmE,11208
|
|
199
|
+
azure/ai/evaluation/_legacy/_batch_engine/_status.py,sha256=xSpJaMmBroGOL8U_iTpAr_PgyNKaxfawqak6TpuUrkk,780
|
|
200
|
+
azure/ai/evaluation/_legacy/_batch_engine/_trace.py,sha256=xh52vKgs8TKYj1WlqcenlOXiPmcfgdPei2P8BLAIO5g,4430
|
|
201
|
+
azure/ai/evaluation/_legacy/_batch_engine/_utils.py,sha256=EQsRDLh9UA7KNC3L_g7jVGjwc9957EtiBQ8o5pgUSfo,2981
|
|
138
202
|
azure/ai/evaluation/_legacy/_batch_engine/_utils_deprecated.py,sha256=hBm4gh_m8BCWDAryKmqO4ZsypuGE1QSh3K_DxfoEKpc,5917
|
|
203
|
+
azure/ai/evaluation/_legacy/_common/__init__.py,sha256=Yx1Iq2GNKQ5lYxTotvPwkPL4u0cm6YVxUe-iVbu1clI,180
|
|
204
|
+
azure/ai/evaluation/_legacy/_common/_async_token_provider.py,sha256=VQrdiaH2j3DAMCO8OEhfXCgS18FGmi-JrGQFL7XxqqY,5527
|
|
205
|
+
azure/ai/evaluation/_legacy/_common/_logging.py,sha256=aEZsfS2wqbqVEA-vBsfg0-sCWyssGf2L1oWFmu9cego,11398
|
|
206
|
+
azure/ai/evaluation/_legacy/_common/_thread_pool_executor_with_context.py,sha256=PoMMrG9p_ryNgxpv7zBb362lS2md02qON1H0Xroa95w,630
|
|
139
207
|
azure/ai/evaluation/_legacy/prompty/__init__.py,sha256=nWpB3ApQWzlzgbhvNkjHq3sL5tnpwfwmSsTKBmhxmN8,1660
|
|
140
|
-
azure/ai/evaluation/_legacy/prompty/_connection.py,sha256=
|
|
141
|
-
azure/ai/evaluation/_legacy/prompty/_exceptions.py,sha256=
|
|
142
|
-
azure/ai/evaluation/_legacy/prompty/_prompty.py,sha256=
|
|
143
|
-
azure/ai/evaluation/_legacy/prompty/_utils.py,sha256=
|
|
208
|
+
azure/ai/evaluation/_legacy/prompty/_connection.py,sha256=ZaO-TkUsWglsEEwek58MsvKSxXU13Xrai-O5DCqCuT8,3891
|
|
209
|
+
azure/ai/evaluation/_legacy/prompty/_exceptions.py,sha256=BmYd5D3_ZnDRpbeWoMFO1GA6mjVOaNkFAksEGbHQwzM,7267
|
|
210
|
+
azure/ai/evaluation/_legacy/prompty/_prompty.py,sha256=apbuS-TkMFIqryWJLfD3IiDO4X-0LS3C8AnXjrRTljc,16457
|
|
211
|
+
azure/ai/evaluation/_legacy/prompty/_utils.py,sha256=NCuZYuAZSguDtFsLAcgVwwPyAPM_MvdJnonup_KoEfs,25650
|
|
144
212
|
azure/ai/evaluation/_legacy/prompty/_yaml_utils.py,sha256=pVL6xgTHC3AKKD5plJ4d6hiBuComaOlUww1uqqDQlB4,3350
|
|
145
|
-
azure/ai/evaluation/_red_team/__init__.py,sha256=UwArlb5cGLN4pRUm8nG7mXsmxhgdIving2OslYhQDAg,179
|
|
146
|
-
azure/ai/evaluation/_red_team/_attack_objective_generator.py,sha256=fkKrobdFSnOEsOOpsY6gpEiyIWhi5hV4TImbWj6fBeE,10683
|
|
147
|
-
azure/ai/evaluation/_red_team/_attack_strategy.py,sha256=8n2M-BM8TDRs8bAfZAgwDl0MzIXqf8eeKNsg5V83m_s,1348
|
|
148
|
-
azure/ai/evaluation/_red_team/_callback_chat_target.py,sha256=H58nU6IVEpeDuTZPsxIoYKXAvU3dAWnLRhA8wyaY11s,3071
|
|
149
|
-
azure/ai/evaluation/_red_team/_default_converter.py,sha256=K8G775VVdQLsAqff60BBNFrNRj8JijB7St9XOHmGQGA,775
|
|
150
|
-
azure/ai/evaluation/_red_team/_red_team.py,sha256=Khe5zRBPk5D6CMpc6I2pQZT2Mtl7a4wn6kuim6gYjwg,103691
|
|
151
|
-
azure/ai/evaluation/_red_team/_red_team_result.py,sha256=qPEazh6rhtcj8dEHozZVNxC5JuHRoBDmC-2RfdCOd2k,11312
|
|
152
|
-
azure/ai/evaluation/_red_team/_utils/__init__.py,sha256=UwArlb5cGLN4pRUm8nG7mXsmxhgdIving2OslYhQDAg,179
|
|
153
|
-
azure/ai/evaluation/_red_team/_utils/constants.py,sha256=ROM2jbmw3_VOiRoC2AwoUxVxFxVV5wmN-G-QGhmiH60,2256
|
|
154
|
-
azure/ai/evaluation/_red_team/_utils/formatting_utils.py,sha256=m7vZDv1gzFl1jnaegpSI6o6XQmTwy4fFh1j25w8dG_E,6352
|
|
155
|
-
azure/ai/evaluation/_red_team/_utils/logging_utils.py,sha256=Kviojc9PCyArVSRZ_9qJ00zwIsWobKdw7OlOzKjkFOw,4823
|
|
156
|
-
azure/ai/evaluation/_red_team/_utils/strategy_utils.py,sha256=AMi8PAB2UISXLXzRDNnuJHwPc50RZ7Y5WrkTaArJOCY,7809
|
|
157
213
|
azure/ai/evaluation/_safety_evaluation/__init__.py,sha256=UwArlb5cGLN4pRUm8nG7mXsmxhgdIving2OslYhQDAg,179
|
|
158
214
|
azure/ai/evaluation/_safety_evaluation/_generated_rai_client.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
159
|
-
azure/ai/evaluation/_safety_evaluation/_safety_evaluation.py,sha256=
|
|
215
|
+
azure/ai/evaluation/_safety_evaluation/_safety_evaluation.py,sha256=V_AZthT294sCdFVEuNum6mILerMqH-ANYd9B-S78NvA,40890
|
|
160
216
|
azure/ai/evaluation/_vendor/__init__.py,sha256=Yx1Iq2GNKQ5lYxTotvPwkPL4u0cm6YVxUe-iVbu1clI,180
|
|
161
217
|
azure/ai/evaluation/_vendor/rouge_score/__init__.py,sha256=03OkyfS_UmzRnHv6-z9juTaJ6OXJoEJM989hgifIZbc,607
|
|
162
218
|
azure/ai/evaluation/_vendor/rouge_score/rouge_scorer.py,sha256=DtNSeshHipzc6vFnvx7kbs5viXe4LNq-ZrgllFvfR4U,11299
|
|
163
219
|
azure/ai/evaluation/_vendor/rouge_score/scoring.py,sha256=0sqdiNE-4R_EmTTqyWL9_DAOgl54250H5004tZDGxEE,1878
|
|
164
220
|
azure/ai/evaluation/_vendor/rouge_score/tokenize.py,sha256=IyHVsWY6IFFZdB23cLiJs8iBZ0DXk1mQlWE1xtdjuuk,1826
|
|
165
221
|
azure/ai/evaluation/_vendor/rouge_score/tokenizers.py,sha256=3_-y1TyvyluHuERhSJ5CdXSwnpcMA7aAKU6PCz9wH_Q,1745
|
|
222
|
+
azure/ai/evaluation/red_team/__init__.py,sha256=wAjy_85gzdX0YyUlj6kHWrpo01zz2mgOJ1AbH5EkH8s,613
|
|
223
|
+
azure/ai/evaluation/red_team/_attack_objective_generator.py,sha256=yMK5z91_w6GIzbqTQtUXfABuGeH3nfVgF8feOMd37K4,10765
|
|
224
|
+
azure/ai/evaluation/red_team/_attack_strategy.py,sha256=CmMYhp9cm8xTr63LbrFnfFyTxXQ3Xn4PZ5tEfMRFVIQ,1431
|
|
225
|
+
azure/ai/evaluation/red_team/_callback_chat_target.py,sha256=H58nU6IVEpeDuTZPsxIoYKXAvU3dAWnLRhA8wyaY11s,3071
|
|
226
|
+
azure/ai/evaluation/red_team/_default_converter.py,sha256=K8G775VVdQLsAqff60BBNFrNRj8JijB7St9XOHmGQGA,775
|
|
227
|
+
azure/ai/evaluation/red_team/_red_team.py,sha256=Wy4dhMfTqaFjsU8MzrJ8NxeSt5UwZzTa2oSbTGEsxrY,129881
|
|
228
|
+
azure/ai/evaluation/red_team/_red_team_result.py,sha256=BwHf0KBGe9hqyWeTYDOOuoIxJ0rqkY9lHLUOZ02wPJI,17340
|
|
229
|
+
azure/ai/evaluation/red_team/_utils/__init__.py,sha256=UwArlb5cGLN4pRUm8nG7mXsmxhgdIving2OslYhQDAg,179
|
|
230
|
+
azure/ai/evaluation/red_team/_utils/constants.py,sha256=ctSsuWiavhaGApRgP6fL3OtNGphnCKuesTQOwR833nk,2289
|
|
231
|
+
azure/ai/evaluation/red_team/_utils/formatting_utils.py,sha256=jztERWOb1P3ClOKEr6-sMmLDQ8subjKUVBKVVxeSFcY,6416
|
|
232
|
+
azure/ai/evaluation/red_team/_utils/logging_utils.py,sha256=jjNq37zlJz0KPo9g8NuuhnDJo56T-06ElJ-7yyeD46M,4838
|
|
233
|
+
azure/ai/evaluation/red_team/_utils/metric_mapping.py,sha256=HhN3YWDNDs41jtGCUJ0HJ7fg-2AuQKIdUsOucOdw9TI,950
|
|
234
|
+
azure/ai/evaluation/red_team/_utils/strategy_utils.py,sha256=wImNcnKNNC-Z8L8TdLCSNfftK8pLTA2RLLoyMXPSRc8,8059
|
|
166
235
|
azure/ai/evaluation/simulator/__init__.py,sha256=JbrPZ8pvTBalyX94SvZ9btHNoovX8rbZV03KmzxxWys,552
|
|
167
236
|
azure/ai/evaluation/simulator/_adversarial_scenario.py,sha256=FQ9ZNruqPY4o06uu2uig2MZSbearwAJwieIB26GbPOU,1833
|
|
168
|
-
azure/ai/evaluation/simulator/_adversarial_simulator.py,sha256
|
|
169
|
-
azure/ai/evaluation/simulator/_constants.py,sha256=
|
|
170
|
-
azure/ai/evaluation/simulator/_direct_attack_simulator.py,sha256=
|
|
171
|
-
azure/ai/evaluation/simulator/_indirect_attack_simulator.py,sha256=
|
|
172
|
-
azure/ai/evaluation/simulator/_simulator.py,sha256=
|
|
173
|
-
azure/ai/evaluation/simulator/_tracing.py,sha256=frZ4-usrzINast9F4-ONRzEGGox71y8bYw0UHNufL1Y,3069
|
|
237
|
+
azure/ai/evaluation/simulator/_adversarial_simulator.py,sha256=-vkPNop_dJDG8skju4v3skCjdx2brl7OomoSP37q-GM,24791
|
|
238
|
+
azure/ai/evaluation/simulator/_constants.py,sha256=jtsj-XzbseurEAxWmB-iSPmXu7B6ZHrM3bl07j-zruM,875
|
|
239
|
+
azure/ai/evaluation/simulator/_direct_attack_simulator.py,sha256=_5m_WUMD2WimrCV1HWC-xrsdnHppaxwIY-y1hdaqwcI,10968
|
|
240
|
+
azure/ai/evaluation/simulator/_indirect_attack_simulator.py,sha256=qy1WHO4_37gnYGfSFj0eaQi_jg2ocSfL4FdJO_h09n0,11159
|
|
241
|
+
azure/ai/evaluation/simulator/_simulator.py,sha256=aVoPvTQsY7u4O0YYQm4pug368UelKefAxa38dJVZ4ps,36513
|
|
174
242
|
azure/ai/evaluation/simulator/_utils.py,sha256=16NltlywpbMtoFtULwTKqeURguIS1kSKSo3g8uKV8TA,5181
|
|
175
|
-
azure/ai/evaluation/simulator/_conversation/__init__.py,sha256=
|
|
176
|
-
azure/ai/evaluation/simulator/_conversation/_conversation.py,sha256=
|
|
243
|
+
azure/ai/evaluation/simulator/_conversation/__init__.py,sha256=bhAXScChUuJrBoUNEWeDLRoM8wntXEXosUhr7-1Amq4,18257
|
|
244
|
+
azure/ai/evaluation/simulator/_conversation/_conversation.py,sha256=aWiodVvzA9yy1itkoVtW88B4qhEpxpnztx0G1-w7U_Y,7729
|
|
177
245
|
azure/ai/evaluation/simulator/_conversation/constants.py,sha256=3v7zkjPwJAPbSpJYIK6VOZZy70bJXMo_QTVqSFGlq9A,984
|
|
178
246
|
azure/ai/evaluation/simulator/_data_sources/__init__.py,sha256=Yx1Iq2GNKQ5lYxTotvPwkPL4u0cm6YVxUe-iVbu1clI,180
|
|
179
247
|
azure/ai/evaluation/simulator/_data_sources/grounding.json,sha256=jqdqHrCgS7hN7K2kXSEcPCmzFjV4cv_qcCSR-Hutwx4,1257075
|
|
180
248
|
azure/ai/evaluation/simulator/_helpers/__init__.py,sha256=FQwgrJvzq_nv3wF9DBr2pyLn2V2hKGmtp0QN9nwpAww,203
|
|
181
|
-
azure/ai/evaluation/simulator/_helpers/_language_suffix_mapping.py,sha256=
|
|
249
|
+
azure/ai/evaluation/simulator/_helpers/_language_suffix_mapping.py,sha256=sbKc3O5qsg77LEaSEQfWDfzqEFXVDw612BaDcBo3E7A,1095
|
|
182
250
|
azure/ai/evaluation/simulator/_helpers/_simulator_data_classes.py,sha256=BOttMTec3muMiA4OzwD_iW08GTrhja7PL9XVjRCN3jM,3029
|
|
183
|
-
azure/ai/evaluation/simulator/_model_tools/__init__.py,sha256=
|
|
184
|
-
azure/ai/evaluation/simulator/_model_tools/_generated_rai_client.py,sha256=
|
|
185
|
-
azure/ai/evaluation/simulator/_model_tools/_identity_manager.py,sha256
|
|
186
|
-
azure/ai/evaluation/simulator/_model_tools/_proxy_completion_model.py,sha256=
|
|
251
|
+
azure/ai/evaluation/simulator/_model_tools/__init__.py,sha256=soaUHfmd_IK1FINPRKgKens7qKOVw9BZwc7ms7N6zrk,860
|
|
252
|
+
azure/ai/evaluation/simulator/_model_tools/_generated_rai_client.py,sha256=ssWbQ8RCsojwqkcqp9FLuFfTnzUCAca7ygJ_gOC-au4,6692
|
|
253
|
+
azure/ai/evaluation/simulator/_model_tools/_identity_manager.py,sha256=DO9vRSLsp974S1f8KdK3w2fTicdAcv3Y0gntwtXehm4,6433
|
|
254
|
+
azure/ai/evaluation/simulator/_model_tools/_proxy_completion_model.py,sha256=BCKOS3QY1iUn6gLB00fXzKervpzbeufJ8gx__Fb5-8U,10587
|
|
187
255
|
azure/ai/evaluation/simulator/_model_tools/_rai_client.py,sha256=nvDS33uaxLpuvZEC4aotu-P9-CHqLiyCInED6Xq9ZQ0,11643
|
|
188
|
-
azure/ai/evaluation/simulator/_model_tools/_template_handler.py,sha256=
|
|
189
|
-
azure/ai/evaluation/simulator/_model_tools/models.py,sha256=
|
|
256
|
+
azure/ai/evaluation/simulator/_model_tools/_template_handler.py,sha256=5XoM3H3_fk7SoxHoxEsBtkP_Y26Rx4KLpN__Z-u9BxU,7445
|
|
257
|
+
azure/ai/evaluation/simulator/_model_tools/models.py,sha256=V3Rs9htzt0XtLdLZRaHB_hxMRcJ-z_VR9eXwBOKpi_Y,22373
|
|
190
258
|
azure/ai/evaluation/simulator/_prompty/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
191
259
|
azure/ai/evaluation/simulator/_prompty/task_query_response.prompty,sha256=2BzSqDDYilDushvR56vMRDmqFIaIYAewdUlUZg_elMg,2182
|
|
192
260
|
azure/ai/evaluation/simulator/_prompty/task_simulate.prompty,sha256=NE6lH4bfmibgMn4NgJtm9_l3PMoHSFrfjjosDJEKM0g,939
|
|
193
|
-
azure_ai_evaluation-1.
|
|
194
|
-
azure_ai_evaluation-1.
|
|
195
|
-
azure_ai_evaluation-1.
|
|
196
|
-
azure_ai_evaluation-1.
|
|
197
|
-
azure_ai_evaluation-1.
|
|
261
|
+
azure_ai_evaluation-1.6.0.dist-info/METADATA,sha256=XwCqViFvDnLxvcp9ZWgA3qiLpevbcCL7w0D6xiavMvE,37287
|
|
262
|
+
azure_ai_evaluation-1.6.0.dist-info/NOTICE.txt,sha256=4tzi_Yq4-eBGhBvveobWHCgUIVF-ZeouGN0m7hVq5Mk,3592
|
|
263
|
+
azure_ai_evaluation-1.6.0.dist-info/WHEEL,sha256=iAkIy5fosb7FzIOwONchHf19Qu7_1wCWyFNR5gu9nU0,91
|
|
264
|
+
azure_ai_evaluation-1.6.0.dist-info/top_level.txt,sha256=S7DhWV9m80TBzAhOFjxDUiNbKszzoThbnrSz5MpbHSQ,6
|
|
265
|
+
azure_ai_evaluation-1.6.0.dist-info/RECORD,,
|
|
@@ -1,246 +0,0 @@
|
|
|
1
|
-
# ---------------------------------------------------------
|
|
2
|
-
# Copyright (c) Microsoft Corporation. All rights reserved.
|
|
3
|
-
# ---------------------------------------------------------
|
|
4
|
-
from typing import Dict, List, Optional, TypedDict
|
|
5
|
-
import json
|
|
6
|
-
|
|
7
|
-
class _RiskCategorySummary(TypedDict):
    """Summary of attack success rates across risk categories.

    Keys come in groups of three sharing a prefix (``overall``,
    ``hate_unfairness``, ``violence``, ``sexual``, ``self_harm``): an ``_asr``
    float plus ``_total`` and ``_successful_attacks`` integer counts.
    """

    # NOTE(review): whether *_asr values are 0-1 fractions or percentages is
    # not visible in this module -- confirm against the code that fills them.

    # Aggregate over every risk category.
    overall_asr: float
    overall_total: int
    overall_successful_attacks: int
    # Hate / unfairness.
    hate_unfairness_asr: float
    hate_unfairness_total: int
    hate_unfairness_successful_attacks: int
    # Violence.
    violence_asr: float
    violence_total: int
    violence_successful_attacks: int
    # Sexual content.
    sexual_asr: float
    sexual_total: int
    sexual_successful_attacks: int
    # Self-harm.
    self_harm_asr: float
    self_harm_total: int
    self_harm_successful_attacks: int
|
|
24
|
-
|
|
25
|
-
class _AttackTechniqueSummary(TypedDict):
    """Summary of attack success rates across complexity levels.

    Keys come in groups of three sharing a prefix (``overall``, ``baseline``,
    ``easy_complexity``, ``moderate_complexity``, ``difficult_complexity``):
    an ``_asr`` float plus ``_total`` and ``_successful_attacks`` integer
    counts.
    """

    # Aggregate over every complexity level.
    overall_asr: float
    overall_total: int
    overall_successful_attacks: int
    # Baseline bucket -- presumably attacks sent without any converter
    # technique applied; TODO confirm against the producer.
    baseline_asr: float
    baseline_total: int
    baseline_successful_attacks: int
    # Easy-complexity techniques.
    easy_complexity_asr: float
    easy_complexity_total: int
    easy_complexity_successful_attacks: int
    # Moderate-complexity techniques.
    moderate_complexity_asr: float
    moderate_complexity_total: int
    moderate_complexity_successful_attacks: int
    # Difficult-complexity techniques.
    difficult_complexity_asr: float
    difficult_complexity_total: int
    difficult_complexity_successful_attacks: int
|
|
42
|
-
|
|
43
|
-
class _JointRiskAttackSummaryItem(TypedDict):
    """Summary of attack success rates for a specific risk category across complexity levels.

    One item describes a single risk category; unlike the other summary
    types it carries only the ``_asr`` values, not the underlying counts.
    """

    # Name of the risk category this row describes.
    risk_category: str
    # Attack success rate per complexity bucket for that category.
    baseline_asr: float
    easy_complexity_asr: float
    moderate_complexity_asr: float
    difficult_complexity_asr: float
|
|
50
|
-
|
|
51
|
-
class _RedTeamingScorecard(TypedDict):
    """TypedDict representation of a Red Team Agent scorecard with the updated structure.

    The scorecard contains four main sections:
    - risk_category_summary: Overall metrics by risk category
    - attack_technique_summary: Overall metrics by attack technique complexity
    - joint_risk_attack_summary: Detailed metrics by risk category and complexity level
    - detailed_joint_risk_attack_asr: Detailed ASR information broken down by complexity level, risk category, and converter
    """

    # The three summaries are typed as lists of summary dicts.
    risk_category_summary: List[_RiskCategorySummary]
    attack_technique_summary: List[_AttackTechniqueSummary]
    joint_risk_attack_summary: List[_JointRiskAttackSummaryItem]
    # Three nested string-keyed levels ending in a float; per the docstring
    # the levels are complexity level -> risk category -> converter.
    detailed_joint_risk_attack_asr: Dict[str, Dict[str, Dict[str, float]]]
|
|
64
|
-
|
|
65
|
-
class _AttackObjectiveSource(TypedDict):
    """Information about how attack objectives were generated.

    All values are plain strings (or a list of strings for
    ``risk_categories``); this module does not constrain their contents.
    """

    application_scenario: str
    risk_categories: List[str]
    # NOTE(review): typed as a single string, not a list of prompts --
    # presumably a path or identifier for the seed prompts; confirm.
    custom_attack_seed_prompts: str
    policy_document: str
|
|
71
|
-
|
|
72
|
-
class _RedTeamingParameters(TypedDict):
    """TypedDict representation of parameters used in a red team evaluation with the updated structure.

    This class defines the structure for capturing metadata about an evaluation run, including:
    - attack_objective_generated_from: Information about the source of attack objectives
    - attack_complexity: List of complexity levels used in the attacks (e.g., "Easy", "Moderate", "Difficult")
    - techniques_used: Dictionary mapping complexity levels to lists of converter techniques used
    """

    attack_objective_generated_from: _AttackObjectiveSource
    attack_complexity: List[str]
    # Keyed by complexity level; each value lists the techniques used at that level.
    techniques_used: Dict[str, List[str]]
|
|
83
|
-
|
|
84
|
-
class _RiskAssessment(TypedDict):
    """Assessment of content safety risks in a conversation.

    Each key is a risk category mapped to a string-to-string dictionary.
    ``RedTeamOutput`` in this module reads the ``"severity_label"`` entry of
    each per-category dictionary; other entries are not used here.
    """

    violence: Dict[str, str]
    sexual: Dict[str, str]
    self_harm: Dict[str, str]
    # NOTE(review): this key is ``hate_unfair`` while _RiskCategorySummary
    # uses the ``hate_unfairness_`` prefix -- the two spellings are not
    # interchangeable, so check which one the producer emits.
    hate_unfair: Dict[str, str]
|
|
90
|
-
|
|
91
|
-
class _Conversation(TypedDict):
    """TypedDict representation of a simulated conversation in a red team evaluation.

    This class defines the structure for capturing information about a simulated conversation, including:
    - attack_success: Whether the attack was successful (``None`` when no verdict is available)
    - attack_technique: The attack technique used in the conversation
    - attack_complexity: The complexity level of the attack
    - risk_category: The risk category associated with the conversation
    - conversation: List of messages exchanged in the conversation
    - risk_assessment: Dictionary containing content safety assessment for the conversation
    """

    attack_success: Optional[bool]
    attack_technique: str
    attack_complexity: str
    risk_category: str
    # Each message is a string-to-string dict; RedTeamOutput reads its
    # "role" and "content" entries.
    conversation: List[Dict[str, str]]
    risk_assessment: Optional[_RiskAssessment]
|
|
107
|
-
|
|
108
|
-
class _RedTeamResult(TypedDict):
    """TypedDict representation of a Red Team Agent evaluation result with the updated structure.

    This class defines the structure for capturing the results of a red team evaluation, including:
    - redteaming_scorecard: Scorecard containing summary and detailed ASR information
    - redteaming_parameters: Parameters containing metadata about the evaluation run
    - redteaming_data: List of _Conversation objects representing the conversations in the evaluation
    - studio_url: Optional URL string for the run
    """

    redteaming_scorecard: _RedTeamingScorecard
    redteaming_parameters: _RedTeamingParameters
    redteaming_data: List[_Conversation]
    # NOTE(review): presumably a link to the run in a web UI; nothing in this
    # module reads or writes it -- confirm against the producer.
    studio_url: Optional[str]
|
|
120
|
-
|
|
121
|
-
class RedTeamOutput:
    """Holds the outcome of a red team evaluation and renders it in several formats.

    :param red_team_result: Full result payload (scorecard, parameters, data), or ``None``.
    :type red_team_result: Optional[_RedTeamResult]
    :param redteaming_data: Simulated conversations used by the per-conversation exports, or ``None``.
    :type redteaming_data: Optional[List[_Conversation]]
    """

    def __init__(
        self,
        red_team_result: Optional[_RedTeamResult] = None,
        redteaming_data: Optional[List[_Conversation]] = None,
    ):
        self.red_team_result = red_team_result
        self.redteaming_data = redteaming_data

    @staticmethod
    def _user_assistant_turns(messages: List[Dict[str, str]]):
        """Yield ``(user_msg, assistant_msg)`` for each consecutive message pair with those roles.

        Messages are paired as (0, 1), (2, 3), ...; a trailing unpaired message
        and pairs whose roles are not user-then-assistant are skipped.
        """
        for user_msg, assistant_msg in zip(messages[::2], messages[1::2]):
            if user_msg.get("role") == "user" and assistant_msg.get("role") == "assistant":
                yield user_msg, assistant_msg

    @staticmethod
    def _labelled_severities(risk_assessment):
        """Yield ``(category, severity_label)`` for every assessment with a non-empty label.

        Accepts ``None`` or an empty mapping and yields nothing in that case.
        """
        for category, assessment in (risk_assessment or {}).items():
            label = assessment.get("severity_label", None) if assessment else None
            if label:
                yield category, label

    def to_json(self) -> str:
        """
        Serializes the stored _RedTeamResult to a JSON string.

        :returns: The _RedTeamResult as a JSON string, or an empty string when no result is set.
        :rtype: str
        """
        return json.dumps(self.red_team_result) if self.red_team_result else ""

    def to_scorecard(self) -> Optional[_RedTeamingScorecard]:
        """Extracts the scorecard from the stored _RedTeamResult.

        :returns: The ``redteaming_scorecard`` entry, or ``None`` when no result is set or the key is absent.
        :rtype: Optional[_RedTeamingScorecard]
        """
        return self.red_team_result.get("redteaming_scorecard", None) if self.red_team_result else None

    def to_eval_qr_json_lines(self) -> List[str]:
        """
        Converts conversations in messages format to query-response format suitable for evaluation.

        Each returned string is one JSON object of the form:
        {
            "query": "user message content",
            "response": "assistant message content",
            "risk_category": "risk category",
            "attack_strategy": "strategy name",
            "attack_complexity": "complexity level",
            "attack_success": "true|false", (only when the conversation has a verdict)
            "category": "risk category", (only when a severity label is present)
            "severity_level": "lower-cased severity label" (only when a severity label is present)
        }

        When several risk categories carry a severity label, the last one wins.
        No ``threshold`` key is emitted at present.

        :returns: One JSON string per user/assistant turn; an empty list when there is no data.
        :rtype: List[str]
        """
        if not self.redteaming_data:
            # Same type as the populated case so callers can always iterate or join.
            return []

        result_lines = []

        for conversation in self.redteaming_data:
            messages = conversation.get("conversation", [])

            # Conversation-level fields are identical for every turn, so build them once.
            shared_fields = {
                "risk_category": conversation.get("risk_category", ""),
                "attack_strategy": conversation.get("attack_technique", ""),
                "attack_complexity": conversation.get("attack_complexity", ""),
            }

            attack_success = conversation.get("attack_success")
            if attack_success is not None:
                shared_fields["attack_success"] = str(attack_success).lower()

            for category, label in self._labelled_severities(conversation.get("risk_assessment", {})):
                shared_fields["category"] = category
                shared_fields["severity_level"] = label.lower()

            for user_msg, assistant_msg in self._user_assistant_turns(messages):
                qr_pair = {
                    "query": user_msg.get("content", ""),
                    "response": assistant_msg.get("content", ""),
                    **shared_fields,
                }
                result_lines.append(json.dumps(qr_pair))

        return result_lines

    def attack_simulation(self) -> str:
        """
        Returns the attack simulation data in a human-readable format.

        For each conversation this emits a header (technique, complexity, risk
        category), the user/assistant turns, the attack verdict when one is
        present, and every risk category that carries a severity label.

        :returns: A newline-joined, human-readable report; an empty string when there is no data.
        :rtype: str
        """
        if not self.redteaming_data:
            return ""

        result_lines = []

        for conversation in self.redteaming_data:
            messages = conversation.get("conversation", [])
            attack_success = conversation.get("attack_success")

            result_lines.append(f"Attack Technique: {conversation.get('attack_technique', '')}")
            result_lines.append(f"Attack Complexity: {conversation.get('attack_complexity', '')}")
            result_lines.append(f"Risk Category: {conversation.get('risk_category', '')}")
            result_lines.append("")

            for user_msg, assistant_msg in self._user_assistant_turns(messages):
                result_lines.append(f"User: {user_msg.get('content', '')}")
                result_lines.append(f"Assistant: {assistant_msg.get('content', '')}")
                result_lines.append("")

            if attack_success is not None:
                result_lines.append(f"Attack Success: {'Successful' if attack_success else 'Failed'}")
                result_lines.append("")

            for category, label in self._labelled_severities(conversation.get("risk_assessment", {})):
                result_lines.append(f"Category: {category}")
                result_lines.append(f"Severity Level: {label}")
                result_lines.append("")

        return "\n".join(result_lines)
|