eval-studio-client 0.8.0a2__py3-none-any.whl → 1.0.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- eval_studio_client/__init__.py +2 -1
- eval_studio_client/api/__init__.py +125 -120
- eval_studio_client/api/api/__init__.py +1 -0
- eval_studio_client/api/api/dashboard_service_api.py +71 -71
- eval_studio_client/api/api/document_service_api.py +64 -64
- eval_studio_client/api/api/evaluation_service_api.py +42 -42
- eval_studio_client/api/api/evaluator_service_api.py +50 -50
- eval_studio_client/api/api/info_service_api.py +8 -8
- eval_studio_client/api/api/leaderboard_service_api.py +126 -126
- eval_studio_client/api/api/model_service_api.py +92 -92
- eval_studio_client/api/api/operation_progress_service_api.py +8 -8
- eval_studio_client/api/api/operation_service_api.py +36 -36
- eval_studio_client/api/api/perturbation_service_api.py +8 -8
- eval_studio_client/api/api/perturbator_service_api.py +15 -15
- eval_studio_client/api/api/prompt_generation_service_api.py +321 -0
- eval_studio_client/api/api/test_case_service_api.py +57 -57
- eval_studio_client/api/api/test_class_service_api.py +15 -15
- eval_studio_client/api/api/test_lab_service_api.py +22 -22
- eval_studio_client/api/api/test_service_api.py +376 -92
- eval_studio_client/api/api/who_am_i_service_api.py +8 -8
- eval_studio_client/api/api_client.py +1 -1
- eval_studio_client/api/configuration.py +1 -1
- eval_studio_client/api/docs/DashboardServiceApi.md +38 -38
- eval_studio_client/api/docs/DocumentServiceApi.md +34 -34
- eval_studio_client/api/docs/EvaluationServiceApi.md +22 -22
- eval_studio_client/api/docs/EvaluatorServiceApi.md +26 -26
- eval_studio_client/api/docs/InfoServiceApi.md +4 -4
- eval_studio_client/api/docs/LeaderboardServiceApi.md +66 -66
- eval_studio_client/api/docs/ModelServiceApi.md +50 -50
- eval_studio_client/api/docs/OperationProgressServiceApi.md +4 -4
- eval_studio_client/api/docs/OperationServiceApi.md +20 -20
- eval_studio_client/api/docs/PerturbationServiceApi.md +4 -4
- eval_studio_client/api/docs/PerturbationServiceCreatePerturbationRequest.md +3 -3
- eval_studio_client/api/docs/PerturbatorServiceApi.md +8 -8
- eval_studio_client/api/docs/PromptGenerationServiceApi.md +78 -0
- eval_studio_client/api/docs/PromptGenerationServiceAutoGeneratePromptsRequest.md +35 -0
- eval_studio_client/api/docs/RequiredTheDashboardToUpdate.md +1 -1
- eval_studio_client/api/docs/RequiredTheLeaderboardToUpdate.md +4 -4
- eval_studio_client/api/docs/RequiredTheModelToUpdate.md +1 -1
- eval_studio_client/api/docs/TestCaseServiceApi.md +31 -31
- eval_studio_client/api/docs/TestClassServiceApi.md +8 -8
- eval_studio_client/api/docs/TestLabServiceApi.md +11 -11
- eval_studio_client/api/docs/TestServiceApi.md +119 -49
- eval_studio_client/api/docs/TestServiceGenerateTestCasesRequest.md +33 -0
- eval_studio_client/api/docs/TestServicePerturbTestRequest.md +1 -1
- eval_studio_client/api/docs/V1BatchCreateLeaderboardsRequest.md +31 -0
- eval_studio_client/api/docs/V1BatchCreateLeaderboardsResponse.md +29 -0
- eval_studio_client/api/docs/V1BatchDeleteDashboardsRequest.md +29 -0
- eval_studio_client/api/docs/V1BatchDeleteDashboardsResponse.md +29 -0
- eval_studio_client/api/docs/V1BatchDeleteDocumentsRequest.md +29 -0
- eval_studio_client/api/docs/V1BatchDeleteDocumentsResponse.md +29 -0
- eval_studio_client/api/docs/V1BatchDeleteEvaluatorsRequest.md +29 -0
- eval_studio_client/api/docs/V1BatchDeleteEvaluatorsResponse.md +29 -0
- eval_studio_client/api/docs/V1BatchDeleteLeaderboardsRequest.md +30 -0
- eval_studio_client/api/docs/V1BatchDeleteLeaderboardsResponse.md +29 -0
- eval_studio_client/api/docs/V1BatchDeleteModelsRequest.md +29 -0
- eval_studio_client/api/docs/V1BatchDeleteModelsResponse.md +29 -0
- eval_studio_client/api/docs/V1BatchDeleteTestCasesResponse.md +29 -0
- eval_studio_client/api/docs/{V1alphaBatchDeleteTestsRequest.md → V1BatchDeleteTestsRequest.md} +8 -8
- eval_studio_client/api/docs/V1BatchDeleteTestsResponse.md +29 -0
- eval_studio_client/api/docs/V1BatchGetDashboardsResponse.md +29 -0
- eval_studio_client/api/docs/V1BatchGetDocumentsResponse.md +29 -0
- eval_studio_client/api/docs/V1BatchGetLeaderboardsResponse.md +29 -0
- eval_studio_client/api/docs/V1BatchGetModelsResponse.md +29 -0
- eval_studio_client/api/docs/V1BatchGetOperationsResponse.md +29 -0
- eval_studio_client/api/docs/V1BatchGetTestsResponse.md +29 -0
- eval_studio_client/api/docs/{V1alphaBatchImportLeaderboardRequest.md → V1BatchImportLeaderboardRequest.md} +9 -9
- eval_studio_client/api/docs/V1BatchImportLeaderboardResponse.md +29 -0
- eval_studio_client/api/docs/{V1alphaBatchImportTestsRequest.md → V1BatchImportTestsRequest.md} +8 -8
- eval_studio_client/api/docs/V1BatchImportTestsResponse.md +29 -0
- eval_studio_client/api/docs/V1CheckBaseModelsResponse.md +30 -0
- eval_studio_client/api/docs/{V1alphaCollectionInfo.md → V1CollectionInfo.md} +8 -8
- eval_studio_client/api/docs/V1CreateDashboardResponse.md +29 -0
- eval_studio_client/api/docs/V1CreateDocumentResponse.md +29 -0
- eval_studio_client/api/docs/{V1alphaCreateEvaluationRequest.md → V1CreateEvaluationRequest.md} +10 -10
- eval_studio_client/api/docs/V1CreateEvaluatorResponse.md +29 -0
- eval_studio_client/api/docs/V1CreateLeaderboardRequest.md +29 -0
- eval_studio_client/api/docs/V1CreateLeaderboardResponse.md +29 -0
- eval_studio_client/api/docs/V1CreateLeaderboardWithoutCacheResponse.md +29 -0
- eval_studio_client/api/docs/V1CreateModelResponse.md +29 -0
- eval_studio_client/api/docs/V1CreatePerturbationResponse.md +29 -0
- eval_studio_client/api/docs/V1CreateTestCaseResponse.md +29 -0
- eval_studio_client/api/docs/V1CreateTestLabResponse.md +29 -0
- eval_studio_client/api/docs/V1CreateTestResponse.md +29 -0
- eval_studio_client/api/docs/{V1alphaDashboard.md → V1Dashboard.md} +9 -9
- eval_studio_client/api/docs/{V1alphaDashboardStatus.md → V1DashboardStatus.md} +1 -1
- eval_studio_client/api/docs/V1DeleteDashboardResponse.md +29 -0
- eval_studio_client/api/docs/V1DeleteDocumentResponse.md +29 -0
- eval_studio_client/api/docs/V1DeleteEvaluatorResponse.md +29 -0
- eval_studio_client/api/docs/V1DeleteLeaderboardResponse.md +29 -0
- eval_studio_client/api/docs/V1DeleteModelResponse.md +29 -0
- eval_studio_client/api/docs/V1DeleteTestCaseResponse.md +29 -0
- eval_studio_client/api/docs/V1DeleteTestResponse.md +29 -0
- eval_studio_client/api/docs/{V1alphaDocument.md → V1Document.md} +8 -8
- eval_studio_client/api/docs/V1EvaluationTest.md +32 -0
- eval_studio_client/api/docs/{V1alphaEvaluator.md → V1Evaluator.md} +10 -9
- eval_studio_client/api/docs/{V1alphaEvaluatorParamType.md → V1EvaluatorParamType.md} +1 -1
- eval_studio_client/api/docs/{V1alphaEvaluatorParameter.md → V1EvaluatorParameter.md} +9 -9
- eval_studio_client/api/docs/{V1alphaEvaluatorView.md → V1EvaluatorView.md} +1 -1
- eval_studio_client/api/docs/V1FinalizeOperationResponse.md +29 -0
- eval_studio_client/api/docs/V1FindAllTestCasesByIDResponse.md +29 -0
- eval_studio_client/api/docs/V1FindTestLabResponse.md +29 -0
- eval_studio_client/api/docs/V1GenerateTestCasesResponse.md +29 -0
- eval_studio_client/api/docs/V1GetDashboardResponse.md +29 -0
- eval_studio_client/api/docs/V1GetDocumentResponse.md +29 -0
- eval_studio_client/api/docs/V1GetEvaluatorResponse.md +29 -0
- eval_studio_client/api/docs/V1GetInfoResponse.md +29 -0
- eval_studio_client/api/docs/V1GetLeaderboardResponse.md +29 -0
- eval_studio_client/api/docs/V1GetModelResponse.md +29 -0
- eval_studio_client/api/docs/V1GetOperationProgressByParentResponse.md +29 -0
- eval_studio_client/api/docs/V1GetOperationResponse.md +29 -0
- eval_studio_client/api/docs/V1GetPerturbatorResponse.md +29 -0
- eval_studio_client/api/docs/V1GetTestCaseResponse.md +29 -0
- eval_studio_client/api/docs/V1GetTestClassResponse.md +29 -0
- eval_studio_client/api/docs/V1GetTestResponse.md +29 -0
- eval_studio_client/api/docs/{V1alphaImportEvaluationRequest.md → V1ImportEvaluationRequest.md} +9 -9
- eval_studio_client/api/docs/{V1alphaImportLeaderboardRequest.md → V1ImportLeaderboardRequest.md} +9 -9
- eval_studio_client/api/docs/V1ImportLeaderboardResponse.md +29 -0
- eval_studio_client/api/docs/{V1alphaInfo.md → V1Info.md} +8 -8
- eval_studio_client/api/docs/{V1alphaInsight.md → V1Insight.md} +8 -8
- eval_studio_client/api/docs/{V1alphaLeaderboard.md → V1Leaderboard.md} +12 -12
- eval_studio_client/api/docs/{V1alphaLeaderboardStatus.md → V1LeaderboardStatus.md} +1 -1
- eval_studio_client/api/docs/{V1alphaLeaderboardType.md → V1LeaderboardType.md} +1 -1
- eval_studio_client/api/docs/{V1alphaLeaderboardView.md → V1LeaderboardView.md} +1 -1
- eval_studio_client/api/docs/V1ListBaseModelsResponse.md +29 -0
- eval_studio_client/api/docs/V1ListDashboardsResponse.md +29 -0
- eval_studio_client/api/docs/V1ListDocumentsResponse.md +29 -0
- eval_studio_client/api/docs/V1ListEvaluatorsResponse.md +29 -0
- eval_studio_client/api/docs/V1ListLLMModelsResponse.md +29 -0
- eval_studio_client/api/docs/V1ListLeaderboardsResponse.md +30 -0
- eval_studio_client/api/docs/V1ListModelCollectionsResponse.md +29 -0
- eval_studio_client/api/docs/V1ListModelsResponse.md +29 -0
- eval_studio_client/api/docs/V1ListMostRecentDashboardsResponse.md +29 -0
- eval_studio_client/api/docs/V1ListMostRecentLeaderboardsResponse.md +29 -0
- eval_studio_client/api/docs/V1ListMostRecentModelsResponse.md +29 -0
- eval_studio_client/api/docs/V1ListMostRecentTestsResponse.md +29 -0
- eval_studio_client/api/docs/V1ListOperationsResponse.md +29 -0
- eval_studio_client/api/docs/V1ListPerturbatorsResponse.md +29 -0
- eval_studio_client/api/docs/V1ListRAGCollectionsResponse.md +29 -0
- eval_studio_client/api/docs/V1ListTestCasesResponse.md +29 -0
- eval_studio_client/api/docs/V1ListTestClassesResponse.md +29 -0
- eval_studio_client/api/docs/V1ListTestsResponse.md +29 -0
- eval_studio_client/api/docs/{V1alphaModel.md → V1Model.md} +9 -9
- eval_studio_client/api/docs/{V1alphaModelType.md → V1ModelType.md} +1 -1
- eval_studio_client/api/docs/{V1alphaOperation.md → V1Operation.md} +8 -8
- eval_studio_client/api/docs/{V1alphaOperationProgress.md → V1OperationProgress.md} +8 -8
- eval_studio_client/api/docs/V1PerturbTestResponse.md +29 -0
- eval_studio_client/api/docs/{V1alphaPerturbator.md → V1Perturbator.md} +8 -8
- eval_studio_client/api/docs/V1PerturbatorConfiguration.md +32 -0
- eval_studio_client/api/docs/{V1alphaPerturbatorIntensity.md → V1PerturbatorIntensity.md} +1 -1
- eval_studio_client/api/docs/{V1alphaProblemAndAction.md → V1ProblemAndAction.md} +8 -8
- eval_studio_client/api/docs/{V1alphaTest.md → V1Test.md} +8 -8
- eval_studio_client/api/docs/{V1alphaTestCase.md → V1TestCase.md} +8 -8
- eval_studio_client/api/docs/{V1alphaTestCaseRelationship.md → V1TestCaseRelationship.md} +8 -8
- eval_studio_client/api/docs/V1TestCasesGenerator.md +11 -0
- eval_studio_client/api/docs/{V1alphaTestClass.md → V1TestClass.md} +9 -9
- eval_studio_client/api/docs/{V1alphaTestClassType.md → V1TestClassType.md} +1 -1
- eval_studio_client/api/docs/{V1alphaTestLab.md → V1TestLab.md} +8 -8
- eval_studio_client/api/docs/V1UpdateDashboardResponse.md +29 -0
- eval_studio_client/api/docs/V1UpdateDocumentResponse.md +29 -0
- eval_studio_client/api/docs/V1UpdateLeaderboardResponse.md +29 -0
- eval_studio_client/api/docs/V1UpdateModelResponse.md +29 -0
- eval_studio_client/api/docs/V1UpdateOperationResponse.md +29 -0
- eval_studio_client/api/docs/V1UpdateTestCaseResponse.md +29 -0
- eval_studio_client/api/docs/V1UpdateTestResponse.md +29 -0
- eval_studio_client/api/docs/{V1alphaWhoAmIResponse.md → V1WhoAmIResponse.md} +8 -8
- eval_studio_client/api/docs/WhoAmIServiceApi.md +4 -4
- eval_studio_client/api/exceptions.py +1 -1
- eval_studio_client/api/models/__init__.py +124 -120
- eval_studio_client/api/models/perturbation_service_create_perturbation_request.py +10 -10
- eval_studio_client/api/models/prompt_generation_service_auto_generate_prompts_request.py +104 -0
- eval_studio_client/api/models/protobuf_any.py +1 -1
- eval_studio_client/api/models/required_the_dashboard_to_update.py +3 -3
- eval_studio_client/api/models/required_the_document_to_update.py +1 -1
- eval_studio_client/api/models/required_the_leaderboard_to_update.py +11 -11
- eval_studio_client/api/models/required_the_model_to_update.py +3 -3
- eval_studio_client/api/models/required_the_operation_to_finalize.py +1 -1
- eval_studio_client/api/models/required_the_operation_to_update.py +1 -1
- eval_studio_client/api/models/required_the_test_case_to_update.py +1 -1
- eval_studio_client/api/models/required_the_test_to_update.py +1 -1
- eval_studio_client/api/models/rpc_status.py +1 -1
- eval_studio_client/api/models/test_case_service_batch_delete_test_cases_request.py +1 -1
- eval_studio_client/api/models/test_service_generate_test_cases_request.py +96 -0
- eval_studio_client/api/models/test_service_perturb_test_request.py +4 -4
- eval_studio_client/api/models/{v1alpha_batch_create_leaderboards_request.py → v1_batch_create_leaderboards_request.py} +8 -8
- eval_studio_client/api/models/{v1alpha_update_operation_response.py → v1_batch_create_leaderboards_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_batch_delete_dashboards_request.py → v1_batch_delete_dashboards_request.py} +5 -5
- eval_studio_client/api/models/{v1alpha_list_dashboards_response.py → v1_batch_delete_dashboards_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_batch_delete_documents_request.py → v1_batch_delete_documents_request.py} +5 -5
- eval_studio_client/api/models/{v1alpha_list_documents_response.py → v1_batch_delete_documents_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_batch_delete_evaluators_request.py → v1_batch_delete_evaluators_request.py} +5 -5
- eval_studio_client/api/models/{v1alpha_list_evaluators_response.py → v1_batch_delete_evaluators_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_batch_delete_leaderboards_request.py → v1_batch_delete_leaderboards_request.py} +7 -7
- eval_studio_client/api/models/{v1alpha_batch_get_leaderboards_response.py → v1_batch_delete_leaderboards_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_batch_delete_models_request.py → v1_batch_delete_models_request.py} +5 -5
- eval_studio_client/api/models/{v1alpha_list_models_response.py → v1_batch_delete_models_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_list_test_cases_response.py → v1_batch_delete_test_cases_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_batch_delete_tests_request.py → v1_batch_delete_tests_request.py} +5 -5
- eval_studio_client/api/models/{v1alpha_list_tests_response.py → v1_batch_delete_tests_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_batch_get_dashboards_response.py → v1_batch_get_dashboards_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_batch_get_documents_response.py → v1_batch_get_documents_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_batch_delete_leaderboards_response.py → v1_batch_get_leaderboards_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_batch_get_models_response.py → v1_batch_get_models_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_list_operations_response.py → v1_batch_get_operations_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_batch_get_tests_response.py → v1_batch_get_tests_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_batch_import_leaderboard_request.py → v1_batch_import_leaderboard_request.py} +7 -7
- eval_studio_client/api/models/{v1alpha_import_leaderboard_response.py → v1_batch_import_leaderboard_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_batch_import_tests_request.py → v1_batch_import_tests_request.py} +5 -5
- eval_studio_client/api/models/{v1alpha_batch_delete_tests_response.py → v1_batch_import_tests_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_check_base_models_response.py → v1_check_base_models_response.py} +5 -5
- eval_studio_client/api/models/{v1alpha_collection_info.py → v1_collection_info.py} +4 -4
- eval_studio_client/api/models/{v1alpha_get_dashboard_response.py → v1_create_dashboard_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_get_document_response.py → v1_create_document_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_create_evaluation_request.py → v1_create_evaluation_request.py} +11 -11
- eval_studio_client/api/models/{v1alpha_get_evaluator_response.py → v1_create_evaluator_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_get_leaderboard_response.py → v1_create_leaderboard_request.py} +8 -8
- eval_studio_client/api/models/{v1alpha_get_operation_response.py → v1_create_leaderboard_response.py} +8 -8
- eval_studio_client/api/models/v1_create_leaderboard_without_cache_response.py +91 -0
- eval_studio_client/api/models/{v1alpha_get_model_response.py → v1_create_model_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_create_perturbation_response.py → v1_create_perturbation_response.py} +5 -5
- eval_studio_client/api/models/{v1alpha_get_test_case_response.py → v1_create_test_case_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_find_test_lab_response.py → v1_create_test_lab_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_get_test_response.py → v1_create_test_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_dashboard.py → v1_dashboard.py} +7 -7
- eval_studio_client/api/models/{v1alpha_dashboard_status.py → v1_dashboard_status.py} +3 -3
- eval_studio_client/api/models/{v1alpha_update_dashboard_response.py → v1_delete_dashboard_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_update_document_response.py → v1_delete_document_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_create_evaluator_response.py → v1_delete_evaluator_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_create_leaderboard_request.py → v1_delete_leaderboard_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_create_model_response.py → v1_delete_model_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_delete_test_case_response.py → v1_delete_test_case_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_create_test_response.py → v1_delete_test_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_document.py → v1_document.py} +5 -5
- eval_studio_client/api/models/{v1alpha_evaluation_test.py → v1_evaluation_test.py} +10 -10
- eval_studio_client/api/models/{v1alpha_evaluator.py → v1_evaluator.py} +14 -10
- eval_studio_client/api/models/{v1alpha_evaluator_param_type.py → v1_evaluator_param_type.py} +3 -3
- eval_studio_client/api/models/{v1alpha_evaluator_parameter.py → v1_evaluator_parameter.py} +7 -7
- eval_studio_client/api/models/{v1alpha_evaluator_view.py → v1_evaluator_view.py} +3 -3
- eval_studio_client/api/models/{v1alpha_create_leaderboard_response.py → v1_finalize_operation_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_find_all_test_cases_by_id_response.py → v1_find_all_test_cases_by_id_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_create_test_lab_response.py → v1_find_test_lab_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_finalize_operation_response.py → v1_generate_test_cases_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_create_dashboard_response.py → v1_get_dashboard_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_delete_document_response.py → v1_get_document_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_delete_evaluator_response.py → v1_get_evaluator_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_get_info_response.py → v1_get_info_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_update_leaderboard_response.py → v1_get_leaderboard_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_update_model_response.py → v1_get_model_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_get_operation_progress_by_parent_response.py → v1_get_operation_progress_by_parent_response.py} +8 -8
- eval_studio_client/api/models/v1_get_operation_response.py +91 -0
- eval_studio_client/api/models/{v1alpha_get_perturbator_response.py → v1_get_perturbator_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_create_test_case_response.py → v1_get_test_case_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_get_test_class_response.py → v1_get_test_class_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_update_test_response.py → v1_get_test_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_import_evaluation_request.py → v1_import_evaluation_request.py} +8 -8
- eval_studio_client/api/models/{v1alpha_import_leaderboard_request.py → v1_import_leaderboard_request.py} +7 -7
- eval_studio_client/api/models/v1_import_leaderboard_response.py +91 -0
- eval_studio_client/api/models/{v1alpha_info.py → v1_info.py} +5 -5
- eval_studio_client/api/models/{v1alpha_insight.py → v1_insight.py} +4 -4
- eval_studio_client/api/models/{v1alpha_leaderboard.py → v1_leaderboard.py} +15 -15
- eval_studio_client/api/models/{v1alpha_leaderboard_status.py → v1_leaderboard_status.py} +3 -3
- eval_studio_client/api/models/{v1alpha_leaderboard_type.py → v1_leaderboard_type.py} +3 -3
- eval_studio_client/api/models/{v1alpha_leaderboard_view.py → v1_leaderboard_view.py} +3 -3
- eval_studio_client/api/models/{v1alpha_list_base_models_response.py → v1_list_base_models_response.py} +5 -5
- eval_studio_client/api/models/{v1alpha_batch_delete_dashboards_response.py → v1_list_dashboards_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_batch_delete_documents_response.py → v1_list_documents_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_batch_delete_evaluators_response.py → v1_list_evaluators_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_list_leaderboards_response.py → v1_list_leaderboards_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_list_llm_models_response.py → v1_list_llm_models_response.py} +5 -5
- eval_studio_client/api/models/{v1alpha_list_model_collections_response.py → v1_list_model_collections_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_batch_delete_models_response.py → v1_list_models_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_list_most_recent_dashboards_response.py → v1_list_most_recent_dashboards_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_list_most_recent_leaderboards_response.py → v1_list_most_recent_leaderboards_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_list_most_recent_models_response.py → v1_list_most_recent_models_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_batch_import_tests_response.py → v1_list_most_recent_tests_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_batch_get_operations_response.py → v1_list_operations_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_list_perturbators_response.py → v1_list_perturbators_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_list_rag_collections_response.py → v1_list_rag_collections_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_batch_delete_test_cases_response.py → v1_list_test_cases_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_list_test_classes_response.py → v1_list_test_classes_response.py} +8 -8
- eval_studio_client/api/models/v1_list_tests_response.py +95 -0
- eval_studio_client/api/models/{v1alpha_model.py → v1_model.py} +7 -7
- eval_studio_client/api/models/{v1alpha_model_type.py → v1_model_type.py} +3 -3
- eval_studio_client/api/models/{v1alpha_operation.py → v1_operation.py} +4 -4
- eval_studio_client/api/models/{v1alpha_operation_progress.py → v1_operation_progress.py} +5 -5
- eval_studio_client/api/models/{v1alpha_delete_test_response.py → v1_perturb_test_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_perturbator.py → v1_perturbator.py} +5 -5
- eval_studio_client/api/models/{v1alpha_perturbator_configuration.py → v1_perturbator_configuration.py} +6 -6
- eval_studio_client/api/models/{v1alpha_perturbator_intensity.py → v1_perturbator_intensity.py} +4 -4
- eval_studio_client/api/models/{v1alpha_problem_and_action.py → v1_problem_and_action.py} +5 -5
- eval_studio_client/api/models/{v1alpha_test.py → v1_test.py} +5 -5
- eval_studio_client/api/models/{v1alpha_test_case.py → v1_test_case.py} +5 -5
- eval_studio_client/api/models/{v1alpha_test_case_relationship.py → v1_test_case_relationship.py} +5 -5
- eval_studio_client/api/models/v1_test_cases_generator.py +50 -0
- eval_studio_client/api/models/{v1alpha_test_class.py → v1_test_class.py} +7 -7
- eval_studio_client/api/models/{v1alpha_test_class_type.py → v1_test_class_type.py} +3 -3
- eval_studio_client/api/models/{v1alpha_test_lab.py → v1_test_lab.py} +5 -5
- eval_studio_client/api/models/{v1alpha_delete_dashboard_response.py → v1_update_dashboard_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_create_document_response.py → v1_update_document_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_delete_leaderboard_response.py → v1_update_leaderboard_response.py} +8 -8
- eval_studio_client/api/models/{v1alpha_delete_model_response.py → v1_update_model_response.py} +8 -8
- eval_studio_client/api/models/v1_update_operation_response.py +91 -0
- eval_studio_client/api/models/{v1alpha_update_test_case_response.py → v1_update_test_case_response.py} +8 -8
- eval_studio_client/api/models/v1_update_test_response.py +91 -0
- eval_studio_client/api/models/{v1alpha_who_am_i_response.py → v1_who_am_i_response.py} +5 -5
- eval_studio_client/api/rest.py +1 -1
- eval_studio_client/api/test/test_dashboard_service_api.py +1 -1
- eval_studio_client/api/test/test_document_service_api.py +1 -1
- eval_studio_client/api/test/test_evaluation_service_api.py +1 -1
- eval_studio_client/api/test/test_evaluator_service_api.py +1 -1
- eval_studio_client/api/test/test_info_service_api.py +1 -1
- eval_studio_client/api/test/test_leaderboard_service_api.py +1 -1
- eval_studio_client/api/test/test_model_service_api.py +1 -1
- eval_studio_client/api/test/test_operation_progress_service_api.py +1 -1
- eval_studio_client/api/test/test_operation_service_api.py +1 -1
- eval_studio_client/api/test/test_perturbation_service_api.py +1 -1
- eval_studio_client/api/test/test_perturbation_service_create_perturbation_request.py +4 -4
- eval_studio_client/api/test/test_perturbator_service_api.py +1 -1
- eval_studio_client/api/test/test_prompt_generation_service_api.py +37 -0
- eval_studio_client/api/test/test_prompt_generation_service_auto_generate_prompts_request.py +75 -0
- eval_studio_client/api/test/test_protobuf_any.py +1 -1
- eval_studio_client/api/test/test_required_the_dashboard_to_update.py +1 -1
- eval_studio_client/api/test/test_required_the_document_to_update.py +1 -1
- eval_studio_client/api/test/test_required_the_leaderboard_to_update.py +3 -3
- eval_studio_client/api/test/test_required_the_model_to_update.py +1 -1
- eval_studio_client/api/test/test_required_the_operation_to_finalize.py +1 -1
- eval_studio_client/api/test/test_required_the_operation_to_update.py +1 -1
- eval_studio_client/api/test/test_required_the_test_case_to_update.py +1 -1
- eval_studio_client/api/test/test_required_the_test_to_update.py +1 -1
- eval_studio_client/api/test/test_rpc_status.py +1 -1
- eval_studio_client/api/test/test_test_case_service_api.py +1 -1
- eval_studio_client/api/test/test_test_case_service_batch_delete_test_cases_request.py +1 -1
- eval_studio_client/api/test/test_test_class_service_api.py +1 -1
- eval_studio_client/api/test/test_test_lab_service_api.py +1 -1
- eval_studio_client/api/test/test_test_service_api.py +7 -1
- eval_studio_client/api/test/test_test_service_generate_test_cases_request.py +57 -0
- eval_studio_client/api/test/test_test_service_perturb_test_request.py +2 -2
- eval_studio_client/api/test/{test_v1alpha_batch_create_leaderboards_request.py → test_v1_batch_create_leaderboards_request.py} +16 -16
- eval_studio_client/api/test/{test_v1alpha_create_leaderboard_response.py → test_v1_batch_create_leaderboards_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_batch_delete_models_request.py → test_v1_batch_delete_dashboards_request.py} +12 -12
- eval_studio_client/api/test/{test_v1alpha_batch_get_dashboards_response.py → test_v1_batch_delete_dashboards_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_batch_delete_documents_request.py → test_v1_batch_delete_documents_request.py} +12 -12
- eval_studio_client/api/test/{test_v1alpha_batch_get_documents_response.py → test_v1_batch_delete_documents_response.py} +13 -13
- eval_studio_client/api/test/test_v1_batch_delete_evaluators_request.py +53 -0
- eval_studio_client/api/test/{test_v1alpha_batch_delete_evaluators_response.py → test_v1_batch_delete_evaluators_response.py} +15 -14
- eval_studio_client/api/test/{test_v1alpha_batch_delete_leaderboards_request.py → test_v1_batch_delete_leaderboards_request.py} +12 -12
- eval_studio_client/api/test/{test_v1alpha_batch_get_leaderboards_response.py → test_v1_batch_delete_leaderboards_response.py} +15 -15
- eval_studio_client/api/test/test_v1_batch_delete_models_request.py +53 -0
- eval_studio_client/api/test/{test_v1alpha_batch_get_models_response.py → test_v1_batch_delete_models_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_batch_delete_test_cases_response.py → test_v1_batch_delete_test_cases_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_batch_delete_tests_request.py → test_v1_batch_delete_tests_request.py} +12 -12
- eval_studio_client/api/test/{test_v1alpha_batch_get_tests_response.py → test_v1_batch_delete_tests_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_list_dashboards_response.py → test_v1_batch_get_dashboards_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_list_documents_response.py → test_v1_batch_get_documents_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_batch_delete_leaderboards_response.py → test_v1_batch_get_leaderboards_response.py} +15 -15
- eval_studio_client/api/test/{test_v1alpha_list_models_response.py → test_v1_batch_get_models_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_list_operations_response.py → test_v1_batch_get_operations_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_list_tests_response.py → test_v1_batch_get_tests_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_batch_import_leaderboard_request.py → test_v1_batch_import_leaderboard_request.py} +12 -12
- eval_studio_client/api/test/{test_v1alpha_import_leaderboard_response.py → test_v1_batch_import_leaderboard_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_batch_import_tests_request.py → test_v1_batch_import_tests_request.py} +12 -12
- eval_studio_client/api/test/{test_v1alpha_batch_import_tests_response.py → test_v1_batch_import_tests_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_check_base_models_response.py → test_v1_check_base_models_response.py} +12 -12
- eval_studio_client/api/test/{test_v1alpha_collection_info.py → test_v1_collection_info.py} +12 -12
- eval_studio_client/api/test/{test_v1alpha_get_dashboard_response.py → test_v1_create_dashboard_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_get_document_response.py → test_v1_create_document_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_create_evaluation_request.py → test_v1_create_evaluation_request.py} +16 -16
- eval_studio_client/api/test/{test_v1alpha_get_evaluator_response.py → test_v1_create_evaluator_response.py} +15 -14
- eval_studio_client/api/test/{test_v1alpha_get_leaderboard_response.py → test_v1_create_leaderboard_request.py} +15 -15
- eval_studio_client/api/test/{test_v1alpha_update_operation_response.py → test_v1_create_leaderboard_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_batch_import_leaderboard_response.py → test_v1_create_leaderboard_without_cache_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_get_model_response.py → test_v1_create_model_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_create_perturbation_response.py → test_v1_create_perturbation_response.py} +12 -12
- eval_studio_client/api/test/{test_v1alpha_get_test_case_response.py → test_v1_create_test_case_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_find_test_lab_response.py → test_v1_create_test_lab_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_get_test_response.py → test_v1_create_test_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_dashboard.py → test_v1_dashboard.py} +12 -12
- eval_studio_client/api/test/{test_v1alpha_evaluator_view.py → test_v1_dashboard_status.py} +7 -7
- eval_studio_client/api/test/{test_v1alpha_update_dashboard_response.py → test_v1_delete_dashboard_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_update_document_response.py → test_v1_delete_document_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_delete_evaluator_response.py → test_v1_delete_evaluator_response.py} +15 -14
- eval_studio_client/api/test/{test_v1alpha_create_leaderboard_request.py → test_v1_delete_leaderboard_response.py} +15 -15
- eval_studio_client/api/test/{test_v1alpha_delete_model_response.py → test_v1_delete_model_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_create_test_case_response.py → test_v1_delete_test_case_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_create_test_response.py → test_v1_delete_test_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_document.py → test_v1_document.py} +12 -12
- eval_studio_client/api/test/{test_v1alpha_evaluation_test.py → test_v1_evaluation_test.py} +14 -14
- eval_studio_client/api/test/{test_v1alpha_evaluator.py → test_v1_evaluator.py} +14 -13
- eval_studio_client/api/test/{test_v1alpha_test_class_type.py → test_v1_evaluator_param_type.py} +7 -7
- eval_studio_client/api/test/{test_v1alpha_evaluator_parameter.py → test_v1_evaluator_parameter.py} +12 -12
- eval_studio_client/api/test/{test_v1alpha_model_type.py → test_v1_evaluator_view.py} +7 -7
- eval_studio_client/api/test/{test_v1alpha_get_operation_response.py → test_v1_finalize_operation_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_find_all_test_cases_by_id_response.py → test_v1_find_all_test_cases_by_id_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_create_test_lab_response.py → test_v1_find_test_lab_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_finalize_operation_response.py → test_v1_generate_test_cases_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_create_dashboard_response.py → test_v1_get_dashboard_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_delete_document_response.py → test_v1_get_document_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_create_evaluator_response.py → test_v1_get_evaluator_response.py} +15 -14
- eval_studio_client/api/test/{test_v1alpha_get_info_response.py → test_v1_get_info_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_delete_leaderboard_response.py → test_v1_get_leaderboard_response.py} +15 -15
- eval_studio_client/api/test/{test_v1alpha_create_model_response.py → test_v1_get_model_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_get_operation_progress_by_parent_response.py → test_v1_get_operation_progress_by_parent_response.py} +13 -13
- eval_studio_client/api/test/test_v1_get_operation_response.py +71 -0
- eval_studio_client/api/test/{test_v1alpha_get_perturbator_response.py → test_v1_get_perturbator_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_delete_test_case_response.py → test_v1_get_test_case_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_get_test_class_response.py → test_v1_get_test_class_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_delete_test_response.py → test_v1_get_test_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_import_evaluation_request.py → test_v1_import_evaluation_request.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_import_leaderboard_request.py → test_v1_import_leaderboard_request.py} +12 -12
- eval_studio_client/api/test/test_v1_import_leaderboard_response.py +71 -0
- eval_studio_client/api/test/{test_v1alpha_info.py → test_v1_info.py} +12 -12
- eval_studio_client/api/test/{test_v1alpha_insight.py → test_v1_insight.py} +12 -12
- eval_studio_client/api/test/{test_v1alpha_leaderboard.py → test_v1_leaderboard.py} +14 -14
- eval_studio_client/api/test/{test_v1alpha_dashboard_status.py → test_v1_leaderboard_status.py} +7 -7
- eval_studio_client/api/test/test_v1_leaderboard_type.py +33 -0
- eval_studio_client/api/test/test_v1_leaderboard_view.py +33 -0
- eval_studio_client/api/test/{test_v1alpha_list_base_models_response.py → test_v1_list_base_models_response.py} +12 -12
- eval_studio_client/api/test/{test_v1alpha_batch_delete_dashboards_response.py → test_v1_list_dashboards_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_batch_delete_documents_response.py → test_v1_list_documents_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_list_evaluators_response.py → test_v1_list_evaluators_response.py} +15 -14
- eval_studio_client/api/test/{test_v1alpha_list_leaderboards_response.py → test_v1_list_leaderboards_response.py} +15 -15
- eval_studio_client/api/test/{test_v1alpha_list_llm_models_response.py → test_v1_list_llm_models_response.py} +12 -12
- eval_studio_client/api/test/{test_v1alpha_list_rag_collections_response.py → test_v1_list_model_collections_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_batch_delete_models_response.py → test_v1_list_models_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_list_most_recent_dashboards_response.py → test_v1_list_most_recent_dashboards_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_list_most_recent_leaderboards_response.py → test_v1_list_most_recent_leaderboards_response.py} +15 -15
- eval_studio_client/api/test/{test_v1alpha_list_most_recent_models_response.py → test_v1_list_most_recent_models_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_batch_delete_tests_response.py → test_v1_list_most_recent_tests_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_batch_get_operations_response.py → test_v1_list_operations_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_list_perturbators_response.py → test_v1_list_perturbators_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_list_model_collections_response.py → test_v1_list_rag_collections_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_list_test_cases_response.py → test_v1_list_test_cases_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_list_test_classes_response.py → test_v1_list_test_classes_response.py} +13 -13
- eval_studio_client/api/test/test_v1_list_tests_response.py +69 -0
- eval_studio_client/api/test/{test_v1alpha_model.py → test_v1_model.py} +12 -12
- eval_studio_client/api/test/{test_v1alpha_leaderboard_view.py → test_v1_model_type.py} +7 -7
- eval_studio_client/api/test/{test_v1alpha_operation.py → test_v1_operation.py} +12 -12
- eval_studio_client/api/test/{test_v1alpha_operation_progress.py → test_v1_operation_progress.py} +12 -12
- eval_studio_client/api/test/{test_v1alpha_update_test_response.py → test_v1_perturb_test_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_perturbator.py → test_v1_perturbator.py} +12 -12
- eval_studio_client/api/test/{test_v1alpha_perturbator_configuration.py → test_v1_perturbator_configuration.py} +12 -12
- eval_studio_client/api/test/{test_v1alpha_leaderboard_type.py → test_v1_perturbator_intensity.py} +7 -7
- eval_studio_client/api/test/{test_v1alpha_problem_and_action.py → test_v1_problem_and_action.py} +12 -12
- eval_studio_client/api/test/{test_v1alpha_test.py → test_v1_test.py} +12 -12
- eval_studio_client/api/test/{test_v1alpha_test_case.py → test_v1_test_case.py} +12 -12
- eval_studio_client/api/test/{test_v1alpha_test_case_relationship.py → test_v1_test_case_relationship.py} +12 -12
- eval_studio_client/api/test/test_v1_test_cases_generator.py +33 -0
- eval_studio_client/api/test/{test_v1alpha_test_class.py → test_v1_test_class.py} +12 -12
- eval_studio_client/api/test/test_v1_test_class_type.py +33 -0
- eval_studio_client/api/test/{test_v1alpha_test_lab.py → test_v1_test_lab.py} +12 -12
- eval_studio_client/api/test/{test_v1alpha_delete_dashboard_response.py → test_v1_update_dashboard_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_create_document_response.py → test_v1_update_document_response.py} +13 -13
- eval_studio_client/api/test/{test_v1alpha_update_leaderboard_response.py → test_v1_update_leaderboard_response.py} +15 -15
- eval_studio_client/api/test/{test_v1alpha_update_model_response.py → test_v1_update_model_response.py} +13 -13
- eval_studio_client/api/test/test_v1_update_operation_response.py +71 -0
- eval_studio_client/api/test/{test_v1alpha_update_test_case_response.py → test_v1_update_test_case_response.py} +13 -13
- eval_studio_client/api/test/test_v1_update_test_response.py +67 -0
- eval_studio_client/api/test/{test_v1alpha_who_am_i_response.py → test_v1_who_am_i_response.py} +12 -12
- eval_studio_client/api/test/test_who_am_i_service_api.py +1 -1
- eval_studio_client/dashboards.py +50 -9
- eval_studio_client/documents.py +3 -3
- eval_studio_client/evaluators.py +1 -1
- eval_studio_client/gen/openapiv2/eval_studio.swagger.json +568 -387
- eval_studio_client/insights.py +1 -1
- eval_studio_client/leaderboards.py +16 -13
- eval_studio_client/models.py +117 -29
- eval_studio_client/perturbators.py +5 -7
- eval_studio_client/problems.py +1 -1
- eval_studio_client/test_labs.py +2 -2
- eval_studio_client/tests.py +222 -8
- eval_studio_client/utils.py +26 -0
- {eval_studio_client-0.8.0a2.dist-info → eval_studio_client-1.0.0.dist-info}/METADATA +2 -2
- eval_studio_client-1.0.0.dist-info/RECORD +486 -0
- {eval_studio_client-0.8.0a2.dist-info → eval_studio_client-1.0.0.dist-info}/WHEEL +1 -1
- eval_studio_client/api/docs/V1alphaBatchCreateLeaderboardsRequest.md +0 -31
- eval_studio_client/api/docs/V1alphaBatchCreateLeaderboardsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaBatchDeleteDashboardsRequest.md +0 -29
- eval_studio_client/api/docs/V1alphaBatchDeleteDashboardsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaBatchDeleteDocumentsRequest.md +0 -29
- eval_studio_client/api/docs/V1alphaBatchDeleteDocumentsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaBatchDeleteEvaluatorsRequest.md +0 -29
- eval_studio_client/api/docs/V1alphaBatchDeleteEvaluatorsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaBatchDeleteLeaderboardsRequest.md +0 -30
- eval_studio_client/api/docs/V1alphaBatchDeleteLeaderboardsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaBatchDeleteModelsRequest.md +0 -29
- eval_studio_client/api/docs/V1alphaBatchDeleteModelsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaBatchDeleteTestCasesResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaBatchDeleteTestsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaBatchGetDashboardsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaBatchGetDocumentsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaBatchGetLeaderboardsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaBatchGetModelsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaBatchGetOperationsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaBatchGetTestsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaBatchImportLeaderboardResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaBatchImportTestsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaCheckBaseModelsResponse.md +0 -30
- eval_studio_client/api/docs/V1alphaCreateDashboardResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaCreateDocumentResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaCreateEvaluatorResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaCreateLeaderboardRequest.md +0 -29
- eval_studio_client/api/docs/V1alphaCreateLeaderboardResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaCreateLeaderboardWithoutCacheResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaCreateModelResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaCreatePerturbationResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaCreateTestCaseResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaCreateTestLabResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaCreateTestResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaDeleteDashboardResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaDeleteDocumentResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaDeleteEvaluatorResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaDeleteLeaderboardResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaDeleteModelResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaDeleteTestCaseResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaDeleteTestResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaEvaluationTest.md +0 -32
- eval_studio_client/api/docs/V1alphaFinalizeOperationResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaFindAllTestCasesByIDResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaFindTestLabResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaGetDashboardResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaGetDocumentResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaGetEvaluatorResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaGetInfoResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaGetLeaderboardResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaGetModelResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaGetOperationProgressByParentResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaGetOperationResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaGetPerturbatorResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaGetTestCaseResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaGetTestClassResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaGetTestResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaImportLeaderboardResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaListBaseModelsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaListDashboardsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaListDocumentsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaListEvaluatorsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaListLLMModelsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaListLeaderboardsResponse.md +0 -30
- eval_studio_client/api/docs/V1alphaListModelCollectionsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaListModelsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaListMostRecentDashboardsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaListMostRecentLeaderboardsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaListMostRecentModelsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaListMostRecentTestsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaListOperationsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaListPerturbatorsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaListRAGCollectionsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaListTestCasesResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaListTestClassesResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaListTestsResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaPerturbTestResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaPerturbatorConfiguration.md +0 -32
- eval_studio_client/api/docs/V1alphaUpdateDashboardResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaUpdateDocumentResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaUpdateLeaderboardResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaUpdateModelResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaUpdateOperationResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaUpdateTestCaseResponse.md +0 -29
- eval_studio_client/api/docs/V1alphaUpdateTestResponse.md +0 -29
- eval_studio_client/api/models/v1alpha_batch_create_leaderboards_response.py +0 -91
- eval_studio_client/api/models/v1alpha_batch_import_leaderboard_response.py +0 -91
- eval_studio_client/api/models/v1alpha_create_leaderboard_without_cache_response.py +0 -91
- eval_studio_client/api/models/v1alpha_list_most_recent_tests_response.py +0 -95
- eval_studio_client/api/models/v1alpha_perturb_test_response.py +0 -91
- eval_studio_client/api/test/test_v1alpha_batch_create_leaderboards_response.py +0 -71
- eval_studio_client/api/test/test_v1alpha_batch_delete_dashboards_request.py +0 -53
- eval_studio_client/api/test/test_v1alpha_batch_delete_evaluators_request.py +0 -53
- eval_studio_client/api/test/test_v1alpha_create_leaderboard_without_cache_response.py +0 -71
- eval_studio_client/api/test/test_v1alpha_evaluator_param_type.py +0 -33
- eval_studio_client/api/test/test_v1alpha_leaderboard_status.py +0 -33
- eval_studio_client/api/test/test_v1alpha_list_most_recent_tests_response.py +0 -69
- eval_studio_client/api/test/test_v1alpha_perturb_test_response.py +0 -67
- eval_studio_client/api/test/test_v1alpha_perturbator_intensity.py +0 -33
- eval_studio_client-0.8.0a2.dist-info/RECORD +0 -470
eval_studio_client/tests.py
CHANGED
|
@@ -1,6 +1,9 @@
|
|
|
1
1
|
import dataclasses
|
|
2
2
|
import datetime
|
|
3
|
+
import enum
|
|
3
4
|
import json
|
|
5
|
+
import time
|
|
6
|
+
from typing import Any
|
|
4
7
|
from typing import List
|
|
5
8
|
from typing import Optional
|
|
6
9
|
from typing import Union
|
|
@@ -8,9 +11,113 @@ from typing import Union
|
|
|
8
11
|
from eval_studio_client import api
|
|
9
12
|
from eval_studio_client import documents as d7s
|
|
10
13
|
from eval_studio_client import perturbators as p10s
|
|
14
|
+
from eval_studio_client import utils
|
|
11
15
|
from eval_studio_client.api import models
|
|
12
16
|
|
|
13
17
|
|
|
18
|
+
class TestCaseGenerator(enum.Enum):
    """Methods used for test case generation.

    Every member's value is the corresponding ``models.V1TestCasesGenerator``
    API enum member, so converting to the API representation is just a matter
    of unwrapping the value.
    """

    unspecified = models.V1TestCasesGenerator.TEST_CASES_GENERATOR_UNSPECIFIED
    simple_factual_questions = (
        models.V1TestCasesGenerator.TEST_CASES_GENERATOR_SIMPLE_FACTUAL_QUESTIONS
    )
    multi_hop_questions = (
        models.V1TestCasesGenerator.TEST_CASES_GENERATOR_MULTI_HOP_QUESTIONS
    )
    inference_questions = (
        models.V1TestCasesGenerator.TEST_CASES_GENERATOR_INFERENCE_QUESTIONS
    )
    numerical_reasoning_questions = (
        models.V1TestCasesGenerator.TEST_CASES_GENERATOR_NUMERICAL_REASONING_QUESTIONS
    )
    ambiguity_handling_questions = (
        models.V1TestCasesGenerator.TEST_CASES_GENERATOR_AMBIGUITY_HANDLING_QUESTIONS
    )
    negation_and_contradiction_questions = (
        models.V1TestCasesGenerator.TEST_CASES_GENERATOR_NEGATION_AND_CONTRADICTION_QUESTIONS
    )
    temporal_reasoning_questions = (
        models.V1TestCasesGenerator.TEST_CASES_GENERATOR_TEMPORAL_REASONING_QUESTIONS
    )
    out_of_scope_questions = (
        models.V1TestCasesGenerator.TEST_CASES_GENERATOR_OUT_OF_SCOPE_QUESTIONS
    )
    yes_or_no_questions = (
        models.V1TestCasesGenerator.TEST_CASES_GENERATOR_YES_OR_NO_QUESTIONS
    )
    multiple_choice_questions = (
        models.V1TestCasesGenerator.TEST_CASES_GENERATOR_MULTIPLE_CHOICE_QUESTIONS
    )
    demographic_representation_questions = (
        models.V1TestCasesGenerator.TEST_CASES_GENERATOR_DEMOGRAPHIC_REPRESENTATION_QUESTIONS
    )
    sentiment_variation_questions = (
        models.V1TestCasesGenerator.TEST_CASES_GENERATOR_SENTIMENT_VARIATION_QUESTIONS
    )
    irrelevant_information_questions = (
        models.V1TestCasesGenerator.TEST_CASES_GENERATOR_IRRELEVANT_INFORMATION_QUESTIONS
    )
    deliberately_misleading_questions = (
        models.V1TestCasesGenerator.TEST_CASES_GENERATOR_DELIBERATELY_MISLEADING_QUESTIONS
    )

    def to_api_proto(self) -> models.V1TestCasesGenerator:
        """Converts the client TestCaseGenerator to an API V1TestCasesGenerator.

        Returns:
            The ``models.V1TestCasesGenerator`` member this client member wraps.
        """
        # The member value already is the API enum member; returning it directly
        # avoids a second, hand-maintained mapping that could drift out of sync
        # with the member list above.
        return self.value
|
|
86
|
+
|
|
87
|
+
|
|
88
|
+
@dataclasses.dataclass
class _TestCaseGenerationHandle:
    """Snapshot of the state of a test case generation operation."""

    # Resource name of the underlying operation; None when the API response
    # carried no operation.
    name: Optional[str]
    # Value of the "progress" key in the operation metadata, if present.
    progress: Optional[float] = None
    # Value of the "progressMessage" key in the operation metadata, if present.
    progress_message: Optional[str] = None
    # Error reported on the operation, if any.
    error: Optional[models.RpcStatus] = None
    # The operation's ``done`` flag.
    done: Optional[bool] = None

    @staticmethod
    def _from_operation(
        res: Union[models.V1GenerateTestCasesResponse, models.V1GetOperationResponse],
    ) -> "_TestCaseGenerationHandle":
        """Converts an API operation response to a test case generation handle.

        Args:
            res: API response exposing the operation via its ``operation``
                attribute.

        Returns:
            A handle mirroring the operation's name, progress, error and done
            flag. If the response carries no operation, a handle with
            ``name=None`` and all other fields left at ``None``.
        """
        op = res.operation
        if not op:
            return _TestCaseGenerationHandle(name=None)

        # Progress details live in the (optional) operation metadata.
        metadata = getattr(op, "metadata", None)
        meta_dict = (metadata.to_dict() or {}) if metadata else {}

        return _TestCaseGenerationHandle(
            name=op.name,
            progress=meta_dict.get("progress"),
            progress_message=meta_dict.get("progressMessage"),
            error=op.error,
            done=op.done,
        )
|
|
119
|
+
|
|
120
|
+
|
|
14
121
|
@dataclasses.dataclass
|
|
15
122
|
class TestCase:
|
|
16
123
|
"""Represents a single test case, which contains tested prompt, expected answer
|
|
@@ -35,9 +142,9 @@ class TestCase:
|
|
|
35
142
|
create_time: Optional[datetime.datetime] = None
|
|
36
143
|
update_time: Optional[datetime.datetime] = None
|
|
37
144
|
|
|
38
|
-
def to_api_proto(self) -> models.
|
|
145
|
+
def to_api_proto(self) -> models.V1TestCase:
|
|
39
146
|
"""Converts the client TestCase to an API TestCase."""
|
|
40
|
-
return models.
|
|
147
|
+
return models.V1TestCase(
|
|
41
148
|
prompt=self.prompt,
|
|
42
149
|
answer=self.answer,
|
|
43
150
|
constraints=self.constraints,
|
|
@@ -45,7 +152,7 @@ class TestCase:
|
|
|
45
152
|
)
|
|
46
153
|
|
|
47
154
|
@staticmethod
|
|
48
|
-
def _from_api_test_case(api_test_case: models.
|
|
155
|
+
def _from_api_test_case(api_test_case: models.V1TestCase) -> "TestCase":
|
|
49
156
|
return TestCase(
|
|
50
157
|
key=api_test_case.name or "",
|
|
51
158
|
prompt=api_test_case.prompt or "",
|
|
@@ -75,12 +182,14 @@ class Test:
|
|
|
75
182
|
create_time: Optional[datetime.datetime] = None
|
|
76
183
|
update_time: Optional[datetime.datetime] = None
|
|
77
184
|
_client: Optional[api.ApiClient] = None
|
|
185
|
+
_gen_tc_op_name: Optional[str] = None
|
|
78
186
|
|
|
79
187
|
def __post_init__(self):
    """Creates the service API wrappers when an API client was supplied.

    Without a client no wrapper attributes are set on the instance.
    """
    client = self._client
    if not client:
        return

    self._test_api = api.TestServiceApi(client)
    self._test_case_api = api.TestCaseServiceApi(client)
    self._document_api = api.DocumentServiceApi(client)
    self._operation_api = api.OperationServiceApi(client)
|
|
84
193
|
|
|
85
194
|
@property
|
|
86
195
|
def test_cases(self) -> List[TestCase]:
|
|
@@ -146,6 +255,93 @@ class Test:
|
|
|
146
255
|
resp = self._test_api.test_service_perturb_test(self.key, req)
|
|
147
256
|
return Test._from_api_test(resp.test, self._client)
|
|
148
257
|
|
|
258
|
+
def generate_test_cases(
    self,
    count: int,
    model: Optional[str] = None,
    base_llm_model: Optional[str] = None,
    generators: Optional[List[TestCaseGenerator]] = None,
    existing_collection: Optional[str] = None,
) -> None:
    """Starts generation of test cases from the documents of the Test.

    The call only submits the request; the name of the resulting operation is
    remembered on the instance so that `wait_for_test_case_generation` can
    poll it afterwards.

    Args:
        count (int): Number of test cases to generate (generator may return fewer
            prompts).
        model (str): Model to use for generating the prompts.
        base_llm_model (str): Base LLM model to use for generating the prompts.
        generators (List[TestCaseGenerator]): Methods to use for generation.
        existing_collection (str): ID or the resource name of the existing
            collection, from which prompts will be generated.
            NOTE: This option works only for the H2OGPTe model host ATM.
    """
    # An empty or missing generator list is sent as "not set".
    api_generators = None
    if generators:
        api_generators = [generator.to_api_proto() for generator in generators]

    request = models.TestServiceGenerateTestCasesRequest(
        count=count,
        model=model or None,
        base_llm_model=base_llm_model or None,
        generators=api_generators,
        h2ogpte_collection_id=existing_collection or None,
    )
    response = self._test_api.test_service_generate_test_cases(self.key, request)

    operation = response.operation
    self._gen_tc_op_name = operation.name if operation else None
|
|
291
|
+
|
|
292
|
+
def wait_for_test_case_generation(
    self, timeout: Optional[float] = None, verbose: bool = False
) -> None:
    """Waits for the test case generation to finish.

    Polls the operation started by `generate_test_cases` with an exponential
    back-off (1.0 s growing by a factor of 1.6, capped at 8.0 s per wait).

    Args:
        timeout (float): The maximum time to wait in seconds. ``None`` (or any
            other falsy value such as ``0``) selects the default of 2 days.
        verbose (bool): If True, prints the status of the handle while waiting.

    Raises:
        ValueError: If no test case generation was started on this instance,
            or if the instance has no API client.
        RuntimeError: If the operation finished with an error.
        TimeoutError: If the operation did not finish within ``timeout``.
    """
    if not self._gen_tc_op_name:
        raise ValueError(
            "There is no ongoing test case generation - the operation name is not "
            "set."
        )

    if verbose:
        print(
            f"Waiting for test case generation to finish ({self._gen_tc_op_name}):"
        )

    if not self._client:
        raise ValueError(
            "Unable to establish a connection to the Eval Studio host."
        )

    # exponential backoff
    wait_time = 1.0
    wait_coef = 1.6
    wait_max = 8.0
    timeout = timeout or float(2 * 24 * 60 * 60)  # 2 days
    # Track elapsed time against a monotonic clock so the time spent in the
    # API calls counts towards the timeout, not only the time spent sleeping.
    deadline = time.monotonic() + timeout
    progress_bar = utils.ProgressBar()

    while True:
        handle = _TestCaseGenerationHandle._from_operation(
            self._operation_api.operation_service_get_operation(
                self._gen_tc_op_name
            )
        )

        if verbose:
            progress_bar.update(handle.progress or 0, handle.progress_message)

        if handle.done:
            if handle.error:
                raise RuntimeError(f"Test case generation failed: {handle.error}")
            return

        remaining = deadline - time.monotonic()
        if remaining <= 0:
            break

        # Never sleep past the deadline.
        time.sleep(min(wait_time, wait_max, remaining))
        wait_time *= wait_coef

    raise TimeoutError("Waiting timeout has been reached.")
|
|
344
|
+
|
|
149
345
|
def delete(self, force=False):
|
|
150
346
|
"""Deletes the test.
|
|
151
347
|
|
|
@@ -263,7 +459,7 @@ class Test:
|
|
|
263
459
|
raise RuntimeError("Failed to unlink the document from the test.") from err
|
|
264
460
|
|
|
265
461
|
@staticmethod
|
|
266
|
-
def _from_api_test(api_test: models.
|
|
462
|
+
def _from_api_test(api_test: models.V1Test, client: api.ApiClient) -> "Test":
|
|
267
463
|
return Test(
|
|
268
464
|
key=api_test.name or "",
|
|
269
465
|
name=api_test.display_name or "",
|
|
@@ -302,7 +498,7 @@ class _Tests:
|
|
|
302
498
|
documents (optional): List of `Document`s to be attached to the test.
|
|
303
499
|
"""
|
|
304
500
|
_documents = [d.key for d in documents] if documents else None
|
|
305
|
-
test = models.
|
|
501
|
+
test = models.V1Test(
|
|
306
502
|
display_name=name, description=description, documents=_documents
|
|
307
503
|
)
|
|
308
504
|
res = self._api.test_service_create_test(test)
|
|
@@ -319,6 +515,24 @@ class _Tests:
|
|
|
319
515
|
"""
|
|
320
516
|
self._api.test_service_delete_test(key)
|
|
321
517
|
|
|
518
|
+
def get(self, key: str) -> Test:
    """Retrieves the test with the given resource name.

    Args:
        key (str): Resource name of the test to retrieve.

    Returns:
        An instance of the retrieved `Test`.

    Raises:
        KeyError: If the API response is empty or carries no test.
    """
    response = self._api.test_service_get_test(key)
    found = response.test if response else None
    if not found:
        raise KeyError(f"Test with key '{key}' does not exist.")

    return Test._from_api_test(found, self._client)
|
|
535
|
+
|
|
322
536
|
def import_test_suite(
|
|
323
537
|
self, test_suite: str, name_prefix: Optional[str] = None
|
|
324
538
|
) -> List[Test]:
|
|
@@ -328,7 +542,7 @@ class _Tests:
|
|
|
328
542
|
test_suite (str): JSON string of the test suite.
|
|
329
543
|
name_prefix (str): Optional prefix to name the imported tests.
|
|
330
544
|
"""
|
|
331
|
-
req = models.
|
|
545
|
+
req = models.V1BatchImportTestsRequest(
|
|
332
546
|
testsJson=test_suite, testDisplayNamePrefix=name_prefix or None
|
|
333
547
|
)
|
|
334
548
|
res = self._api.test_service_batch_import_tests(req)
|
|
@@ -360,9 +574,9 @@ class _PerturbatorConfiguration:
|
|
|
360
574
|
perturbator.params if isinstance(perturbator, p10s.Perturbator) else None
|
|
361
575
|
)
|
|
362
576
|
|
|
363
|
-
def to_api_proto(self) -> models.
|
|
577
|
+
def to_api_proto(self) -> models.V1PerturbatorConfiguration:
|
|
364
578
|
"""Converts the client PerturbatorConfiguration to an API PerturbatorConfiguration."""
|
|
365
|
-
return models.
|
|
579
|
+
return models.V1PerturbatorConfiguration(
|
|
366
580
|
name=self.name,
|
|
367
581
|
intensity=self.intensity.to_api_proto(),
|
|
368
582
|
params=json.dumps(self.params) if self.params else None,
|
|
@@ -0,0 +1,26 @@
|
|
|
1
|
+
from typing import Optional
|
|
2
|
+
|
|
3
|
+
|
|
4
|
+
class ProgressBar:
|
|
5
|
+
def __init__(self):
|
|
6
|
+
self.progress = 0.0
|
|
7
|
+
self.progress_message = "Initializing"
|
|
8
|
+
self._progress_max = 1.0
|
|
9
|
+
|
|
10
|
+
def update(self, progress: float, message: Optional[str] = None):
|
|
11
|
+
try:
|
|
12
|
+
self.progress = float(str(progress))
|
|
13
|
+
except ValueError:
|
|
14
|
+
self.progress = 0.0
|
|
15
|
+
|
|
16
|
+
if message:
|
|
17
|
+
self.progress_message = message or ""
|
|
18
|
+
|
|
19
|
+
self.print()
|
|
20
|
+
|
|
21
|
+
def print(self):
|
|
22
|
+
print(" " * len(self.progress_message), end="\r")
|
|
23
|
+
p_progress = int(self.progress / self._progress_max * 100)
|
|
24
|
+
p_hashes = p_progress // 5
|
|
25
|
+
p_msg = f" {p_progress:>3}% |{'#' * p_hashes:<20}| {self.progress_message}"
|
|
26
|
+
print(p_msg, end="\r")
|
|
@@ -1,10 +1,10 @@
|
|
|
1
1
|
Metadata-Version: 2.3
|
|
2
2
|
Name: eval-studio-client
|
|
3
|
-
Version: 0.
|
|
3
|
+
Version: 1.0.0
|
|
4
4
|
Project-URL: Source, https://github.com/h2oai/eval-studio/tree/main/client-py/src/
|
|
5
5
|
Project-URL: Issues, https://github.com/h2oai/eval-studio/issues
|
|
6
6
|
Author-email: "H2O.ai" <support@h2o.ai>
|
|
7
|
-
License
|
|
7
|
+
License: MIT
|
|
8
8
|
Classifier: Development Status :: 4 - Beta
|
|
9
9
|
Classifier: Programming Language :: Python
|
|
10
10
|
Classifier: Programming Language :: Python :: 3.9
|