azure-ai-evaluation 1.6.0__tar.gz → 1.7.0__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of azure-ai-evaluation might be problematic. Click here for more details.
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/CHANGELOG.md +5 -0
- {azure_ai_evaluation-1.6.0/azure_ai_evaluation.egg-info → azure_ai_evaluation-1.7.0}/PKG-INFO +26 -3
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/README.md +18 -1
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/__init__.py +1 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_aoai/aoai_grader.py +1 -1
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_aoai/label_grader.py +2 -2
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_aoai/string_check_grader.py +2 -2
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_aoai/text_similarity_grader.py +2 -2
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/__init__.py +3 -1
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/evaluation_onedp_client.py +50 -5
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/operations/_operations.py +1 -1
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/rai_service.py +7 -6
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_converters/_ai_services.py +162 -118
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_converters/_models.py +76 -6
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_eval_mapping.py +2 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluate/_evaluate.py +11 -13
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluate/_evaluate_aoai.py +24 -5
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_bleu/_bleu.py +11 -1
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_code_vulnerability/_code_vulnerability.py +9 -1
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_coherence/_coherence.py +12 -2
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_common/_base_eval.py +4 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_content_safety/_content_safety.py +12 -2
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_content_safety/_hate_unfairness.py +14 -4
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_content_safety/_self_harm.py +9 -8
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_content_safety/_sexual.py +10 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_content_safety/_violence.py +10 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_document_retrieval/_document_retrieval.py +31 -29
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_f1_score/_f1_score.py +10 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_fluency/_fluency.py +10 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_gleu/_gleu.py +10 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_groundedness/_groundedness.py +10 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_intent_resolution/_intent_resolution.py +10 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_meteor/_meteor.py +10 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_protected_material/_protected_material.py +11 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_qa/_qa.py +10 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_relevance/_relevance.py +10 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_response_completeness/_response_completeness.py +13 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_retrieval/_retrieval.py +10 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_rouge/_rouge.py +10 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_service_groundedness/_service_groundedness.py +10 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_similarity/_similarity.py +10 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_task_adherence/_task_adherence.py +11 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_tool_call_accuracy/_tool_call_accuracy.py +80 -10
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_ungrounded_attributes/_ungrounded_attributes.py +10 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_xpia/xpia.py +11 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_safety_evaluation/_safety_evaluation.py +26 -7
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_version.py +1 -1
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/red_team/_red_team.py +183 -128
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/simulator/_conversation/constants.py +1 -1
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/simulator/_direct_attack_simulator.py +3 -3
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/simulator/_indirect_attack_simulator.py +3 -3
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/simulator/_model_tools/_generated_rai_client.py +2 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/simulator/_model_tools/_template_handler.py +6 -5
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0/azure_ai_evaluation.egg-info}/PKG-INFO +26 -3
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure_ai_evaluation.egg-info/SOURCES.txt +3 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure_ai_evaluation.egg-info/requires.txt +2 -1
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/pyproject.toml +2 -1
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/samples/agent_evaluators/agent_evaluation.ipynb +154 -28
- azure_ai_evaluation-1.7.0/samples/evaluation_samples_evaluate_fdp.py +526 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/samples/evaluation_samples_threshold.py +2 -2
- azure_ai_evaluation-1.7.0/samples/red_team_skip_upload.py +95 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/setup.py +2 -1
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/conftest.py +23 -4
- azure_ai_evaluation-1.7.0/tests/converters/ai_agent_converter/serialization_helper.py +211 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/converters/ai_agent_converter/test_ai_agent_converter_internals.py +101 -9
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/e2etests/test_aoai_graders.py +2 -2
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/e2etests/test_mass_evaluate.py +26 -4
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_document_retrieval_evaluator.py +12 -13
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_safety_evaluation.py +22 -0
- azure_ai_evaluation-1.7.0/tests/unittests/test_tool_call_accuracy_evaluator.py +446 -0
- azure_ai_evaluation-1.6.0/tests/converters/ai_agent_converter/serialization_helper.py +0 -110
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/MANIFEST.in +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/NOTICE.txt +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/TROUBLESHOOTING.md +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_aoai/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_azure/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_azure/_clients.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_azure/_envs.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_azure/_models.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_azure/_token_manager.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/_experimental.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/constants.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/math.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/_client.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/_configuration.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/_model_base.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/_patch.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/_serialization.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/_types.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/_validation.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/_vendor.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/_version.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/aio/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/aio/_client.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/aio/_configuration.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/aio/_patch.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/aio/_vendor.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/aio/operations/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/aio/operations/_operations.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/aio/operations/_patch.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/models/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/models/_enums.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/models/_models.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/models/_patch.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/operations/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/operations/_patch.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/py.typed +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/servicepatterns/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/servicepatterns/aio/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/servicepatterns/aio/operations/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/servicepatterns/aio/operations/_operations.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/servicepatterns/aio/operations/_patch.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/servicepatterns/buildingblocks/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/servicepatterns/buildingblocks/aio/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/servicepatterns/buildingblocks/aio/operations/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/servicepatterns/buildingblocks/aio/operations/_operations.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/servicepatterns/buildingblocks/aio/operations/_patch.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/servicepatterns/buildingblocks/operations/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/servicepatterns/buildingblocks/operations/_operations.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/servicepatterns/buildingblocks/operations/_patch.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/servicepatterns/operations/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/servicepatterns/operations/_operations.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/onedp/servicepatterns/operations/_patch.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/raiclient/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/raiclient/_client.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/raiclient/_configuration.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/raiclient/_model_base.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/raiclient/_patch.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/raiclient/_serialization.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/raiclient/_version.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/raiclient/aio/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/raiclient/aio/_client.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/raiclient/aio/_configuration.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/raiclient/aio/_patch.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/raiclient/aio/operations/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/raiclient/aio/operations/_operations.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/raiclient/aio/operations/_patch.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/raiclient/models/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/raiclient/models/_enums.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/raiclient/models/_models.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/raiclient/models/_patch.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/raiclient/operations/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/raiclient/operations/_operations.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/raiclient/operations/_patch.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/raiclient/py.typed +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/utils.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_constants.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_converters/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluate/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluate/_batch_run/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluate/_batch_run/_run_submitter_client.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluate/_batch_run/batch_clients.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluate/_batch_run/code_client.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluate/_batch_run/eval_run_context.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluate/_batch_run/proxy_client.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluate/_batch_run/target_run_context.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluate/_eval_run.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluate/_telemetry/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluate/_utils.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_bleu/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_code_vulnerability/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_coherence/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_coherence/coherence.prompty +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_common/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_common/_base_multi_eval.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_common/_base_prompty_eval.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_common/_base_rai_svc_eval.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_common/_conversation_aggregators.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_content_safety/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_document_retrieval/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_eci/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_eci/_eci.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_f1_score/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_fluency/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_fluency/fluency.prompty +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_gleu/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_groundedness/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_groundedness/groundedness_with_query.prompty +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_groundedness/groundedness_without_query.prompty +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_intent_resolution/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_intent_resolution/intent_resolution.prompty +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_meteor/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_protected_material/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_qa/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_relevance/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_relevance/relevance.prompty +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_response_completeness/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_response_completeness/response_completeness.prompty +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_retrieval/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_retrieval/retrieval.prompty +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_rouge/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_service_groundedness/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_similarity/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_similarity/similarity.prompty +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_task_adherence/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_task_adherence/task_adherence.prompty +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_tool_call_accuracy/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_tool_call_accuracy/tool_call_accuracy.prompty +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_ungrounded_attributes/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_evaluators/_xpia/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_exceptions.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_http_utils.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_adapters/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_adapters/_check.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_adapters/_configuration.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_adapters/_constants.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_adapters/_errors.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_adapters/_flows.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_adapters/_service.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_adapters/client.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_adapters/entities.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_adapters/tracing.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_adapters/types.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_adapters/utils.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_batch_engine/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_batch_engine/_config.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_batch_engine/_engine.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_batch_engine/_exceptions.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_batch_engine/_openai_injector.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_batch_engine/_result.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_batch_engine/_run.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_batch_engine/_run_storage.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_batch_engine/_run_submitter.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_batch_engine/_status.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_batch_engine/_trace.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_batch_engine/_utils.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_batch_engine/_utils_deprecated.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_common/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_common/_async_token_provider.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_common/_logging.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/_common/_thread_pool_executor_with_context.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/prompty/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/prompty/_connection.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/prompty/_exceptions.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/prompty/_prompty.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/prompty/_utils.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_legacy/prompty/_yaml_utils.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_model_configurations.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_safety_evaluation/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_safety_evaluation/_generated_rai_client.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_user_agent.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_vendor/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_vendor/rouge_score/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_vendor/rouge_score/rouge_scorer.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_vendor/rouge_score/scoring.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_vendor/rouge_score/tokenize.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_vendor/rouge_score/tokenizers.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/py.typed +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/red_team/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/red_team/_attack_objective_generator.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/red_team/_attack_strategy.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/red_team/_callback_chat_target.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/red_team/_default_converter.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/red_team/_red_team_result.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/red_team/_utils/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/red_team/_utils/constants.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/red_team/_utils/formatting_utils.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/red_team/_utils/logging_utils.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/red_team/_utils/metric_mapping.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/red_team/_utils/strategy_utils.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/simulator/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/simulator/_adversarial_scenario.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/simulator/_adversarial_simulator.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/simulator/_constants.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/simulator/_conversation/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/simulator/_conversation/_conversation.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/simulator/_data_sources/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/simulator/_data_sources/grounding.json +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/simulator/_helpers/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/simulator/_helpers/_language_suffix_mapping.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/simulator/_helpers/_simulator_data_classes.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/simulator/_model_tools/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/simulator/_model_tools/_identity_manager.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/simulator/_model_tools/_proxy_completion_model.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/simulator/_model_tools/_rai_client.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/simulator/_model_tools/models.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/simulator/_prompty/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/simulator/_prompty/task_query_response.prompty +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/simulator/_prompty/task_simulate.prompty +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/simulator/_simulator.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/simulator/_utils.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure_ai_evaluation.egg-info/dependency_links.txt +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure_ai_evaluation.egg-info/not-zip-safe +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure_ai_evaluation.egg-info/top_level.txt +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/migration_guide.md +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/samples/README.md +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/samples/agent_evaluators/instructions.md +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/samples/agent_evaluators/intent_resolution.ipynb +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/samples/agent_evaluators/response_completeness.ipynb +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/samples/agent_evaluators/sample_synthetic_conversations.jsonl +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/samples/agent_evaluators/task_adherence.ipynb +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/samples/agent_evaluators/tool_call_accuracy.ipynb +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/samples/agent_evaluators/user_functions.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/samples/data/evaluate_test_data.jsonl +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/samples/evaluation_samples_common.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/samples/evaluation_samples_evaluate.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/samples/evaluation_samples_safety_evaluation.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/samples/evaluation_samples_simulate.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/samples/red_team_agent_tool_sample.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/samples/red_team_samples.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/samples/semantic_kernel_red_team_agent_sample.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/setup.cfg +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/__openai_patcher.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/converters/ai_agent_converter/test_run_ids_from_conversation.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/e2etests/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/e2etests/custom_evaluators/answer_length_with_aggregation.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/e2etests/target_fn.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/e2etests/test_adv_simulator.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/e2etests/test_builtin_evaluators.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/e2etests/test_evaluate.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/e2etests/test_lite_management_client.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/e2etests/test_metrics_upload.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/e2etests/test_prompty_async.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/e2etests/test_remote_evaluation.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/e2etests/test_sim_and_eval.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_agent_evaluators.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_aoai_integration_features.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_batch_run_context.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_built_in_evaluator.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_completeness_evaluator.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_content_safety_defect_rate.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_content_safety_rai_script.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_eval_run.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_evaluate.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_evaluate_performance.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_evaluators/slow_eval.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_evaluators/test_conversation_thresholds.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_evaluators/test_inputs_evaluators.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_evaluators/test_service_evaluator_thresholds.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_evaluators/test_threshold_behavior.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_jailbreak_simulator.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_non_adv_simulator.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_redteam/__init__.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_redteam/test_attack_objective_generator.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_redteam/test_attack_strategy.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_redteam/test_callback_chat_target.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_redteam/test_constants.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_redteam/test_formatting_utils.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_redteam/test_red_team.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_redteam/test_red_team_result.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_redteam/test_strategy_utils.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_remote_evaluation_features.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_save_eval.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_simulator.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_synthetic_callback_conv_bot.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_synthetic_conversation_bot.py +0 -0
- {azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/tests/unittests/test_utils.py +0 -0
{azure_ai_evaluation-1.6.0/azure_ai_evaluation.egg-info → azure_ai_evaluation-1.7.0}/PKG-INFO
RENAMED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.1
|
|
2
2
|
Name: azure-ai-evaluation
|
|
3
|
-
Version: 1.6.0
|
|
3
|
+
Version: 1.7.0
|
|
4
4
|
Summary: Microsoft Azure Evaluation Library for Python
|
|
5
5
|
Home-page: https://github.com/Azure/azure-sdk-for-python
|
|
6
6
|
Author: Microsoft Corporation
|
|
@@ -30,10 +30,11 @@ Requires-Dist: nltk>=3.9.1
|
|
|
30
30
|
Requires-Dist: azure-storage-blob>=12.10.0
|
|
31
31
|
Requires-Dist: httpx>=0.25.1
|
|
32
32
|
Requires-Dist: pandas<3.0.0,>=2.1.2
|
|
33
|
-
Requires-Dist: openai>=1.
|
|
33
|
+
Requires-Dist: openai>=1.78.0
|
|
34
34
|
Requires-Dist: ruamel.yaml<1.0.0,>=0.17.10
|
|
35
35
|
Requires-Dist: msrest>=0.6.21
|
|
36
36
|
Requires-Dist: Jinja2>=3.1.6
|
|
37
|
+
Requires-Dist: aiohttp>=3.0
|
|
37
38
|
Provides-Extra: redteam
|
|
38
39
|
Requires-Dist: pyrit==0.8.1; extra == "redteam"
|
|
39
40
|
|
|
@@ -115,13 +116,23 @@ result = relevance_evaluator(
|
|
|
115
116
|
response="The capital of Japan is Tokyo."
|
|
116
117
|
)
|
|
117
118
|
|
|
118
|
-
#
|
|
119
|
+
# There are two ways to provide Azure AI Project.
|
|
120
|
+
# Option #1 : Using Azure AI Project Details
|
|
119
121
|
azure_ai_project = {
|
|
120
122
|
"subscription_id": "<subscription_id>",
|
|
121
123
|
"resource_group_name": "<resource_group_name>",
|
|
122
124
|
"project_name": "<project_name>",
|
|
123
125
|
}
|
|
124
126
|
|
|
127
|
+
violence_evaluator = ViolenceEvaluator(azure_ai_project)
|
|
128
|
+
result = violence_evaluator(
|
|
129
|
+
query="What is the capital of France?",
|
|
130
|
+
response="Paris."
|
|
131
|
+
)
|
|
132
|
+
|
|
133
|
+
# Option # 2 : Using Azure AI Project Url
|
|
134
|
+
azure_ai_project = "https://{resource_name}.services.ai.azure.com/api/projects/{project_name}"
|
|
135
|
+
|
|
125
136
|
violence_evaluator = ViolenceEvaluator(azure_ai_project)
|
|
126
137
|
result = violence_evaluator(
|
|
127
138
|
query="What is the capital of France?",
|
|
@@ -272,11 +283,18 @@ with open("simulator_output.jsonl", "w") as f:
|
|
|
272
283
|
```python
|
|
273
284
|
from azure.ai.evaluation.simulator import AdversarialSimulator, AdversarialScenario
|
|
274
285
|
from azure.identity import DefaultAzureCredential
|
|
286
|
+
|
|
287
|
+
# There are two ways to provide Azure AI Project.
|
|
288
|
+
# Option #1 : Using Azure AI Project
|
|
275
289
|
azure_ai_project = {
|
|
276
290
|
"subscription_id": <subscription_id>,
|
|
277
291
|
"resource_group_name": <resource_group_name>,
|
|
278
292
|
"project_name": <project_name>
|
|
279
293
|
}
|
|
294
|
+
|
|
295
|
+
# Option #2 : Using Azure AI Project Url
|
|
296
|
+
azure_ai_project = "https://{resource_name}.services.ai.azure.com/api/projects/{project_name}"
|
|
297
|
+
|
|
280
298
|
scenario = AdversarialScenario.ADVERSARIAL_QA
|
|
281
299
|
simulator = AdversarialSimulator(azure_ai_project=azure_ai_project, credential=DefaultAzureCredential())
|
|
282
300
|
|
|
@@ -382,6 +400,11 @@ This project has adopted the [Microsoft Open Source Code of Conduct][code_of_con
|
|
|
382
400
|
|
|
383
401
|
# Release History
|
|
384
402
|
|
|
403
|
+
## 1.7.0 (2025-05-12)
|
|
404
|
+
|
|
405
|
+
### Bugs Fixed
|
|
406
|
+
- azure-ai-evaluation failed with module not found [#40992](https://github.com/Azure/azure-sdk-for-python/issues/40992)
|
|
407
|
+
|
|
385
408
|
## 1.6.0 (2025-05-07)
|
|
386
409
|
|
|
387
410
|
### Features Added
|
|
@@ -76,13 +76,23 @@ result = relevance_evaluator(
|
|
|
76
76
|
response="The capital of Japan is Tokyo."
|
|
77
77
|
)
|
|
78
78
|
|
|
79
|
-
#
|
|
79
|
+
# There are two ways to provide Azure AI Project.
|
|
80
|
+
# Option #1 : Using Azure AI Project Details
|
|
80
81
|
azure_ai_project = {
|
|
81
82
|
"subscription_id": "<subscription_id>",
|
|
82
83
|
"resource_group_name": "<resource_group_name>",
|
|
83
84
|
"project_name": "<project_name>",
|
|
84
85
|
}
|
|
85
86
|
|
|
87
|
+
violence_evaluator = ViolenceEvaluator(azure_ai_project)
|
|
88
|
+
result = violence_evaluator(
|
|
89
|
+
query="What is the capital of France?",
|
|
90
|
+
response="Paris."
|
|
91
|
+
)
|
|
92
|
+
|
|
93
|
+
# Option # 2 : Using Azure AI Project Url
|
|
94
|
+
azure_ai_project = "https://{resource_name}.services.ai.azure.com/api/projects/{project_name}"
|
|
95
|
+
|
|
86
96
|
violence_evaluator = ViolenceEvaluator(azure_ai_project)
|
|
87
97
|
result = violence_evaluator(
|
|
88
98
|
query="What is the capital of France?",
|
|
@@ -233,11 +243,18 @@ with open("simulator_output.jsonl", "w") as f:
|
|
|
233
243
|
```python
|
|
234
244
|
from azure.ai.evaluation.simulator import AdversarialSimulator, AdversarialScenario
|
|
235
245
|
from azure.identity import DefaultAzureCredential
|
|
246
|
+
|
|
247
|
+
# There are two ways to provide Azure AI Project.
|
|
248
|
+
# Option #1 : Using Azure AI Project
|
|
236
249
|
azure_ai_project = {
|
|
237
250
|
"subscription_id": <subscription_id>,
|
|
238
251
|
"resource_group_name": <resource_group_name>,
|
|
239
252
|
"project_name": <project_name>
|
|
240
253
|
}
|
|
254
|
+
|
|
255
|
+
# Option #2 : Using Azure AI Project Url
|
|
256
|
+
azure_ai_project = "https://{resource_name}.services.ai.azure.com/api/projects/{project_name}"
|
|
257
|
+
|
|
241
258
|
scenario = AdversarialScenario.ADVERSARIAL_QA
|
|
242
259
|
simulator = AdversarialSimulator(azure_ai_project=azure_ai_project, credential=DefaultAzureCredential())
|
|
243
260
|
|
|
@@ -31,6 +31,7 @@ from ._evaluators._xpia import IndirectAttackEvaluator
|
|
|
31
31
|
from ._evaluators._code_vulnerability import CodeVulnerabilityEvaluator
|
|
32
32
|
from ._evaluators._ungrounded_attributes import UngroundedAttributesEvaluator
|
|
33
33
|
from ._evaluators._tool_call_accuracy import ToolCallAccuracyEvaluator
|
|
34
|
+
from ._evaluators._document_retrieval import DocumentRetrievalEvaluator
|
|
34
35
|
from ._model_configurations import (
|
|
35
36
|
AzureAIProject,
|
|
36
37
|
AzureOpenAIModelConfiguration,
|
{azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_aoai/aoai_grader.py
RENAMED
|
@@ -77,7 +77,7 @@ class AzureOpenAIGrader():
|
|
|
77
77
|
return AzureOpenAI(
|
|
78
78
|
azure_endpoint=self._model_config["azure_endpoint"],
|
|
79
79
|
api_key=self._model_config.get("api_key", None), # Default-style access to appease linters.
|
|
80
|
-
api_version=
|
|
80
|
+
api_version=DEFAULT_AOAI_API_VERSION, # Force a known working version
|
|
81
81
|
azure_deployment=self._model_config.get("azure_deployment", ""),
|
|
82
82
|
)
|
|
83
83
|
from openai import OpenAI
|
{azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_aoai/label_grader.py
RENAMED
|
@@ -4,7 +4,7 @@
|
|
|
4
4
|
from typing import Any, Dict, Union, List
|
|
5
5
|
|
|
6
6
|
from azure.ai.evaluation._model_configurations import AzureOpenAIModelConfiguration, OpenAIModelConfiguration
|
|
7
|
-
from openai.types.
|
|
7
|
+
from openai.types.graders import LabelModelGrader
|
|
8
8
|
from azure.ai.evaluation._common._experimental import experimental
|
|
9
9
|
|
|
10
10
|
from .aoai_grader import AzureOpenAIGrader
|
|
@@ -55,7 +55,7 @@ class AzureOpenAILabelGrader(AzureOpenAIGrader):
|
|
|
55
55
|
passing_labels: List[str],
|
|
56
56
|
**kwargs: Any
|
|
57
57
|
):
|
|
58
|
-
grader =
|
|
58
|
+
grader = LabelModelGrader(
|
|
59
59
|
input=input,
|
|
60
60
|
labels=labels,
|
|
61
61
|
model=model,
|
|
@@ -5,7 +5,7 @@ from typing import Any, Dict, Union
|
|
|
5
5
|
from typing_extensions import Literal
|
|
6
6
|
|
|
7
7
|
from azure.ai.evaluation._model_configurations import AzureOpenAIModelConfiguration, OpenAIModelConfiguration
|
|
8
|
-
from openai.types.
|
|
8
|
+
from openai.types.graders import StringCheckGrader
|
|
9
9
|
from azure.ai.evaluation._common._experimental import experimental
|
|
10
10
|
|
|
11
11
|
from .aoai_grader import AzureOpenAIGrader
|
|
@@ -55,7 +55,7 @@ class AzureOpenAIStringCheckGrader(AzureOpenAIGrader):
|
|
|
55
55
|
reference: str,
|
|
56
56
|
**kwargs: Any
|
|
57
57
|
):
|
|
58
|
-
grader =
|
|
58
|
+
grader = StringCheckGrader(
|
|
59
59
|
input=input,
|
|
60
60
|
name=name,
|
|
61
61
|
operation=operation,
|
|
@@ -5,7 +5,7 @@ from typing import Any, Dict, Union
|
|
|
5
5
|
from typing_extensions import Literal
|
|
6
6
|
|
|
7
7
|
from azure.ai.evaluation._model_configurations import AzureOpenAIModelConfiguration, OpenAIModelConfiguration
|
|
8
|
-
from openai.types.
|
|
8
|
+
from openai.types.graders import TextSimilarityGrader
|
|
9
9
|
from azure.ai.evaluation._common._experimental import experimental
|
|
10
10
|
|
|
11
11
|
from .aoai_grader import AzureOpenAIGrader
|
|
@@ -77,7 +77,7 @@ class AzureOpenAITextSimilarityGrader(AzureOpenAIGrader):
|
|
|
77
77
|
name: str,
|
|
78
78
|
**kwargs: Any
|
|
79
79
|
):
|
|
80
|
-
grader =
|
|
80
|
+
grader = TextSimilarityGrader(
|
|
81
81
|
evaluation_metric=evaluation_metric,
|
|
82
82
|
input=input,
|
|
83
83
|
pass_threshold=pass_threshold,
|
{azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/__init__.py
RENAMED
|
@@ -9,7 +9,7 @@ from . import constants
|
|
|
9
9
|
from .rai_service import evaluate_with_rai_service
|
|
10
10
|
from .utils import get_harm_severity_level
|
|
11
11
|
from .evaluation_onedp_client import EvaluationServiceOneDPClient
|
|
12
|
-
from .onedp.models import EvaluationUpload, EvaluationResult
|
|
12
|
+
from .onedp.models import EvaluationUpload, EvaluationResult, RedTeamUpload, ResultType
|
|
13
13
|
|
|
14
14
|
__all__ = [
|
|
15
15
|
"get_harm_severity_level",
|
|
@@ -18,4 +18,6 @@ __all__ = [
|
|
|
18
18
|
"EvaluationServiceOneDPClient",
|
|
19
19
|
"EvaluationResult",
|
|
20
20
|
"EvaluationUpload",
|
|
21
|
+
"RedTeamUpload",
|
|
22
|
+
"ResultType",
|
|
21
23
|
]
|
|
@@ -7,7 +7,7 @@ from typing import Union, Any, Dict
|
|
|
7
7
|
from azure.core.credentials import AzureKeyCredential, TokenCredential
|
|
8
8
|
from azure.ai.evaluation._common.onedp import AIProjectClient as RestEvaluationServiceClient
|
|
9
9
|
from azure.ai.evaluation._common.onedp.models import (PendingUploadRequest, PendingUploadType, EvaluationResult,
|
|
10
|
-
ResultType, AssetCredentialRequest, EvaluationUpload, InputDataset)
|
|
10
|
+
ResultType, AssetCredentialRequest, EvaluationUpload, InputDataset, RedTeamUpload)
|
|
11
11
|
from azure.storage.blob import ContainerClient
|
|
12
12
|
from .utils import upload
|
|
13
13
|
|
|
@@ -22,7 +22,8 @@ class EvaluationServiceOneDPClient:
|
|
|
22
22
|
**kwargs,
|
|
23
23
|
)
|
|
24
24
|
|
|
25
|
-
def create_evaluation_result(
|
|
25
|
+
def create_evaluation_result(
|
|
26
|
+
self, *, name: str, path: str, version=1, metrics: Dict[str, int]=None, result_type: ResultType=ResultType.EVALUATION, **kwargs) -> EvaluationResult:
|
|
26
27
|
"""Create and upload evaluation results to Azure evaluation service.
|
|
27
28
|
|
|
28
29
|
This method uploads evaluation results from a local path to Azure Blob Storage
|
|
@@ -39,14 +40,16 @@ class EvaluationServiceOneDPClient:
|
|
|
39
40
|
:param version: The version number for the evaluation results, defaults to 1
|
|
40
41
|
:type version: int, optional
|
|
41
42
|
:param metrics: Metrics to be added to evaluation result
|
|
42
|
-
:type
|
|
43
|
+
:type metrics: Dict[str, int], optional
|
|
44
|
+
:param result_type: Evaluation Result Type to create
|
|
45
|
+
:type result_type: ResultType, optional
|
|
43
46
|
:param kwargs: Additional keyword arguments to pass to the underlying API calls
|
|
44
47
|
:return: The response from creating the evaluation result version
|
|
45
48
|
:rtype: EvaluationResult
|
|
46
49
|
:raises: Various exceptions from the underlying API calls or upload process
|
|
47
50
|
"""
|
|
48
51
|
|
|
49
|
-
LOGGER.debug(f"Creating evaluation result for {name} with version {version} from path {path}")
|
|
52
|
+
LOGGER.debug(f"Creating evaluation result for {name} with version {version} type {result_type} from path {path}")
|
|
50
53
|
start_pending_upload_response = self.rest_client.evaluation_results.start_pending_upload(
|
|
51
54
|
name=name,
|
|
52
55
|
version=version,
|
|
@@ -63,7 +66,7 @@ class EvaluationServiceOneDPClient:
|
|
|
63
66
|
create_version_response = self.rest_client.evaluation_results.create_or_update_version(
|
|
64
67
|
body=EvaluationResult(
|
|
65
68
|
blob_uri=start_pending_upload_response.blob_reference_for_consumption.blob_uri,
|
|
66
|
-
result_type=
|
|
69
|
+
result_type=result_type,
|
|
67
70
|
name=name,
|
|
68
71
|
version=version,
|
|
69
72
|
metrics=metrics,
|
|
@@ -115,4 +118,46 @@ class EvaluationServiceOneDPClient:
|
|
|
115
118
|
**kwargs
|
|
116
119
|
)
|
|
117
120
|
|
|
121
|
+
return update_run_response
|
|
122
|
+
|
|
123
|
+
def start_red_team_run(self, *, red_team: RedTeamUpload, **kwargs):
|
|
124
|
+
"""Start a new red team run in the Azure evaluation service.
|
|
125
|
+
|
|
126
|
+
This method creates a new red team run with the provided configuration details.
|
|
127
|
+
|
|
128
|
+
:param red_team: The red team configuration to upload
|
|
129
|
+
:type red_team: ~azure.ai.evaluation._common.onedp.models.RedTeamUpload
|
|
130
|
+
:param kwargs: Additional keyword arguments to pass to the underlying API calls
|
|
131
|
+
:return: The created red team run object
|
|
132
|
+
:rtype: ~azure.ai.evaluation._common.onedp.models.RedTeamUpload
|
|
133
|
+
:raises: Various exceptions from the underlying API calls
|
|
134
|
+
"""
|
|
135
|
+
upload_run_response = self.rest_client.red_teams.upload_run(
|
|
136
|
+
redteam=red_team,
|
|
137
|
+
**kwargs
|
|
138
|
+
)
|
|
139
|
+
|
|
140
|
+
return upload_run_response
|
|
141
|
+
|
|
142
|
+
def update_red_team_run(self, *, name: str, red_team: RedTeamUpload, **kwargs):
|
|
143
|
+
"""Update an existing red team run in the Azure evaluation service.
|
|
144
|
+
|
|
145
|
+
This method updates a red team run with new information such as status changes,
|
|
146
|
+
result references, or other metadata.
|
|
147
|
+
|
|
148
|
+
:param name: The identifier of the red team run to update
|
|
149
|
+
:type name: str
|
|
150
|
+
:param red_team: The updated red team configuration
|
|
151
|
+
:type red_team: ~azure.ai.evaluation._common.onedp.models.RedTeamUpload
|
|
152
|
+
:param kwargs: Additional keyword arguments to pass to the underlying API calls
|
|
153
|
+
:return: The updated red team run object
|
|
154
|
+
:rtype: ~azure.ai.evaluation._common.onedp.models.RedTeamUpload
|
|
155
|
+
:raises: Various exceptions from the underlying API calls
|
|
156
|
+
"""
|
|
157
|
+
update_run_response = self.rest_client.red_teams.upload_update_run(
|
|
158
|
+
name=name,
|
|
159
|
+
redteam=red_team,
|
|
160
|
+
**kwargs
|
|
161
|
+
)
|
|
162
|
+
|
|
118
163
|
return update_run_response
|
|
@@ -4267,7 +4267,7 @@ class RedTeamsOperations:
|
|
|
4267
4267
|
if isinstance(redteam, (IOBase, bytes)):
|
|
4268
4268
|
_content = redteam
|
|
4269
4269
|
else:
|
|
4270
|
-
_content = json.dumps(redteam, cls=SdkJSONEncoder, exclude_readonly=
|
|
4270
|
+
_content = json.dumps(redteam, cls=SdkJSONEncoder, exclude_readonly=False) # type: ignore
|
|
4271
4271
|
|
|
4272
4272
|
_request = build_red_teams_upload_update_run_request(
|
|
4273
4273
|
name=name,
|
{azure_ai_evaluation-1.6.0 → azure_ai_evaluation-1.7.0}/azure/ai/evaluation/_common/rai_service.py
RENAMED
|
@@ -629,8 +629,9 @@ async def evaluate_with_rai_service(
|
|
|
629
629
|
:type data: dict
|
|
630
630
|
:param metric_name: The evaluation metric to use.
|
|
631
631
|
:type metric_name: str
|
|
632
|
-
:param project_scope: The Azure AI project
|
|
633
|
-
|
|
632
|
+
:param project_scope: The Azure AI project, which can either be a string representing the project endpoint
|
|
633
|
+
or an instance of AzureAIProject. It contains subscription id, resource group, and project name.
|
|
634
|
+
:type project_scope: Union[str, AzureAIProject]
|
|
634
635
|
:param credential: The Azure authentication credential.
|
|
635
636
|
:type credential: ~azure.core.credentials.TokenCredential
|
|
636
637
|
:param annotation_task: The annotation task to use.
|
|
@@ -777,11 +778,11 @@ async def evaluate_with_rai_service_multimodal(
|
|
|
777
778
|
:type messages: str
|
|
778
779
|
:param metric_name: The evaluation metric to use.
|
|
779
780
|
:type metric_name: str
|
|
780
|
-
:param project_scope: The Azure AI project
|
|
781
|
-
|
|
781
|
+
:param project_scope: The Azure AI project, which can either be a string representing the project endpoint
|
|
782
|
+
or an instance of AzureAIProject. It contains subscription id, resource group, and project name.
|
|
783
|
+
:type project_scope: Union[str, AzureAIProject]
|
|
782
784
|
:param credential: The Azure authentication credential.
|
|
783
|
-
:type credential:
|
|
784
|
-
~azure.core.credentials.TokenCredential
|
|
785
|
+
:type credential: ~azure.core.credentials.TokenCredential
|
|
785
786
|
:return: The parsed annotation result.
|
|
786
787
|
:rtype: List[List[Dict]]
|
|
787
788
|
"""
|