pydantic-ai 0.4.11__tar.gz → 0.5.1__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of pydantic-ai might be problematic. Click here for more details.
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/Makefile +2 -5
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/PKG-INFO +3 -3
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/pyproject.toml +5 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/conftest.py +5 -5
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/evals/test_dataset.py +165 -98
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/evals/test_evaluator_base.py +2 -2
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/evals/test_evaluator_spec.py +1 -1
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/evals/test_evaluators.py +18 -4
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/evals/test_reporting.py +61 -20
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/evals/test_reports.py +2 -2
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/test_fallback.py +11 -1
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/test_gemini.py +20 -17
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/test_gemini_vertex.py +2 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/test_google.py +5 -3
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/test_openai.py +234 -27
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/providers/test_google_vertex.py +6 -2
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/test_agent.py +52 -3
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/test_live.py +17 -11
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/test_messages.py +23 -5
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/test_tools.py +6 -6
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/.gitignore +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/LICENSE +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/README.md +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/__init__.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/assets/dummy.pdf +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/assets/kiwi.png +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/assets/marcelo.mp3 +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/assets/product_name.txt +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/assets/small_video.mp4 +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/cassettes/test_mcp/test_agent_with_server_not_running.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/cassettes/test_mcp/test_agent_with_stdio_server.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/cassettes/test_mcp/test_tool_returning_audio_resource.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/cassettes/test_mcp/test_tool_returning_audio_resource_link.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/cassettes/test_mcp/test_tool_returning_dict.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/cassettes/test_mcp/test_tool_returning_error.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/cassettes/test_mcp/test_tool_returning_image.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/cassettes/test_mcp/test_tool_returning_image_resource.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/cassettes/test_mcp/test_tool_returning_image_resource_link.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/cassettes/test_mcp/test_tool_returning_multiple_items.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/cassettes/test_mcp/test_tool_returning_none.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/cassettes/test_mcp/test_tool_returning_str.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/cassettes/test_mcp/test_tool_returning_text_resource.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/cassettes/test_mcp/test_tool_returning_text_resource_link.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/cassettes/test_settings/test_stop_settings[anthropic].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/cassettes/test_settings/test_stop_settings[bedrock].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/cassettes/test_settings/test_stop_settings[cohere].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/cassettes/test_settings/test_stop_settings[gemini].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/cassettes/test_settings/test_stop_settings[google].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/cassettes/test_settings/test_stop_settings[groq].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/cassettes/test_settings/test_stop_settings[mistral].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/cassettes/test_settings/test_stop_settings[openai].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/evals/__init__.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/evals/test_evaluator_common.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/evals/test_evaluator_context.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/evals/test_llm_as_a_judge.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/evals/test_otel.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/evals/test_render_numbers.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/evals/test_utils.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/evals/utils.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/example_modules/README.md +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/example_modules/bank_database.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/example_modules/fake_database.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/example_modules/mcp_server.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/example_modules/weather_service.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/ext/__init__.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/ext/test_langchain.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/graph/__init__.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/graph/test_file_persistence.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/graph/test_graph.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/graph/test_mermaid.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/graph/test_persistence.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/graph/test_state.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/graph/test_utils.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/import_examples.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/json_body_serializer.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/mcp_server.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/__init__.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_anthropic/test_anthropic_model_empty_message_on_history.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_anthropic/test_anthropic_model_instructions.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_anthropic/test_anthropic_model_thinking_part.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_anthropic/test_anthropic_model_thinking_part_stream.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_anthropic/test_anthropic_prompted_output.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_anthropic/test_anthropic_prompted_output_multiple.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_anthropic/test_anthropic_text_output_function.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_anthropic/test_anthropic_tool_output.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_anthropic/test_anthropic_tool_with_thinking.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_anthropic/test_document_binary_content_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_anthropic/test_document_url_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_anthropic/test_extra_headers.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_anthropic/test_image_as_binary_content_tool_response.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_anthropic/test_image_url_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_anthropic/test_image_url_input_invalid_mime_type.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_anthropic/test_multiple_parallel_tool_calls.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_anthropic/test_text_document_url_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_bedrock/test_bedrock_empty_system_prompt.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_bedrock/test_bedrock_model.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_bedrock/test_bedrock_model_anthropic_model_without_tools.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_bedrock/test_bedrock_model_guardrail_config.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_bedrock/test_bedrock_model_instructions.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_bedrock/test_bedrock_model_iter_stream.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_bedrock/test_bedrock_model_max_tokens.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_bedrock/test_bedrock_model_other_parameters.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_bedrock/test_bedrock_model_performance_config.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_bedrock/test_bedrock_model_retry.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_bedrock/test_bedrock_model_stream.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_bedrock/test_bedrock_model_structured_output.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_bedrock/test_bedrock_model_thinking_part.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_bedrock/test_bedrock_model_thinking_part_stream.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_bedrock/test_bedrock_model_top_p.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_bedrock/test_bedrock_multiple_documents_in_history.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_bedrock/test_document_url_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_bedrock/test_image_as_binary_content_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_bedrock/test_image_url_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_bedrock/test_text_as_binary_content_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_bedrock/test_text_document_url_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_bedrock/test_video_as_binary_content_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_bedrock/test_video_url_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_cohere/test_cohere_model_instructions.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_cohere/test_cohere_model_thinking_part.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_cohere/test_request_simple_success_with_vcr.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_deepseek/test_deepseek_model_thinking_part.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_deepseek/test_deepseek_model_thinking_stream.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_download_item/test_download_item_application_octet_stream.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_download_item/test_download_item_audio_mpeg.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_download_item/test_download_item_no_content_type.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini/test_document_url_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini/test_gemini_additional_properties_is_false.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini/test_gemini_additional_properties_is_true.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini/test_gemini_drop_exclusive_maximum.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini/test_gemini_exclusive_minimum_and_maximum.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini/test_gemini_model_instructions.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini/test_gemini_model_thinking_part.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini/test_gemini_native_output.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini/test_gemini_native_output_multiple.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini/test_gemini_prompted_output.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini/test_gemini_prompted_output_multiple.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini/test_gemini_prompted_output_with_tools.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini/test_gemini_text_output_function.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini/test_gemini_tool_config_any_with_tool_without_args.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini/test_gemini_tool_output.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini/test_gemini_youtube_video_url_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini/test_image_as_binary_content_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini/test_image_as_binary_content_tool_response.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini/test_image_url_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini/test_labels_are_ignored_with_gla_provider.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini/test_video_as_binary_content_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini/test_video_url_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini_vertex/test_labels.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini_vertex/test_url_input[AudioUrl (gs)].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini_vertex/test_url_input[AudioUrl].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini_vertex/test_url_input[DocumentUrl (gs)].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini_vertex/test_url_input[DocumentUrl].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini_vertex/test_url_input[ImageUrl (gs)].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini_vertex/test_url_input[ImageUrl].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini_vertex/test_url_input[VideoUrl (YouTube)].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini_vertex/test_url_input[VideoUrl (gs)].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini_vertex/test_url_input[VideoUrl].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_gemini_vertex/test_url_input_force_download.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_model.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_model_document_url_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_model_empty_assistant_response.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_model_empty_user_prompt.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_model_image_as_binary_content_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_model_image_url_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_model_instructions.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_model_iter_stream.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_model_max_tokens.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_model_multiple_documents_in_history.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_model_retry.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_model_safety_settings.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_model_stream.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_model_structured_output.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_model_text_as_binary_content_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_model_text_document_url_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_model_thinking_config.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_model_thinking_part.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_model_thinking_part_iter.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_model_top_p.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_model_vertex_labels.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_model_vertex_provider.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_model_video_as_binary_content_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_model_video_as_binary_content_input_with_vendor_metadata.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_model_video_url_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_model_youtube_video_url_input_with_vendor_metadata.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_native_output.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_native_output_multiple.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_prompted_output.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_prompted_output_multiple.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_prompted_output_with_tools.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_text_output_function.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_timeout.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_tool_config_any_with_tool_without_args.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_tool_output.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_url_input[AudioUrl (gs)].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_url_input[AudioUrl].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_url_input[DocumentUrl (gs)].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_url_input[DocumentUrl].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_url_input[ImageUrl (gs)].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_url_input[ImageUrl].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_url_input[VideoUrl (YouTube)].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_url_input[VideoUrl (gs)].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_url_input[VideoUrl].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_google/test_google_url_input_force_download.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_groq/test_extra_headers.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_groq/test_groq_model_instructions.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_groq/test_groq_model_thinking_part.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_groq/test_groq_model_thinking_part_iter.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_groq/test_image_as_binary_content_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_groq/test_image_as_binary_content_tool_response.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_groq/test_image_url_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_huggingface/test_hf_model_instructions.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_huggingface/test_hf_model_thinking_part.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_huggingface/test_hf_model_thinking_part_iter.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_huggingface/test_image_as_binary_content_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_huggingface/test_image_url_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_huggingface/test_max_completion_tokens[Qwen-Qwen2.5-72B-Instruct].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_huggingface/test_max_completion_tokens[deepseek-ai-DeepSeek-R1-0528].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_huggingface/test_max_completion_tokens[meta-llama-Llama-3.3-70B-Instruct].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_huggingface/test_request_simple_success_with_vcr.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_huggingface/test_request_simple_usage.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_huggingface/test_simple_completion.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_huggingface/test_stream_completion.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_mistral/test_image_as_binary_content_tool_response.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_mistral/test_mistral_model_instructions.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_mistral/test_mistral_model_thinking_part.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_model_names/test_known_model_names.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_audio_as_binary_content_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_compatible_api_with_tool_calls_without_id.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_document_as_binary_content_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_document_url_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_extra_headers.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_image_as_binary_content_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_image_as_binary_content_tool_response.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_image_url_tool_response.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_invalid_response.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_max_completion_tokens[gpt-4.5-preview].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_max_completion_tokens[gpt-4o-mini].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_max_completion_tokens[o3-mini].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_multiple_agent_tool_calls.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_openai_audio_url_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_openai_instructions.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_openai_instructions_with_tool_calls_keep_instructions.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_openai_model_thinking_part.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_openai_model_thinking_part_iter.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_openai_model_without_system_prompt.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_openai_native_output.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_openai_native_output_multiple.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_openai_o1_mini_system_role[developer].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_openai_o1_mini_system_role[system].yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_openai_prompted_output.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_openai_prompted_output_multiple.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_openai_responses_model_thinking_part.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_openai_text_output_function.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_openai_tool_output.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_reasoning_model_with_temperature.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_text_response.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_user_id.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai/test_valid_response.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai_responses/test_audio_as_binary_content_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai_responses/test_image_as_binary_content_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai_responses/test_image_as_binary_content_tool_response.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai_responses/test_native_output.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai_responses/test_native_output_multiple.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai_responses/test_openai_responses_document_as_binary_content_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai_responses/test_openai_responses_document_url_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai_responses/test_openai_responses_image_url_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai_responses/test_openai_responses_model_builtin_tools.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai_responses/test_openai_responses_model_http_error.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai_responses/test_openai_responses_model_instructions.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai_responses/test_openai_responses_model_retry.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai_responses/test_openai_responses_model_simple_response.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai_responses/test_openai_responses_model_simple_response_with_tool_call.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai_responses/test_openai_responses_output_type.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai_responses/test_openai_responses_reasoning_effort.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai_responses/test_openai_responses_reasoning_generate_summary.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai_responses/test_openai_responses_stream.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai_responses/test_openai_responses_system_prompt.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai_responses/test_openai_responses_text_document_url_input.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai_responses/test_prompted_output.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai_responses/test_prompted_output_multiple.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai_responses/test_reasoning_model_with_temperature.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai_responses/test_text_output_function.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/cassettes/test_openai_responses/test_tool_output.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/mock_async_stream.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/test_anthropic.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/test_bedrock.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/test_cohere.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/test_deepseek.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/test_download_item.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/test_groq.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/test_huggingface.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/test_instrumented.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/test_mcp_sampling.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/test_mistral.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/test_model.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/test_model_function.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/test_model_names.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/test_model_request_parameters.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/test_model_settings.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/test_model_test.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/models/test_openai_responses.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/providers/__init__.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/providers/cassettes/test_azure/test_azure_provider_call.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/providers/cassettes/test_google_vertex/test_vertexai_provider.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/providers/cassettes/test_heroku/test_heroku_model_provider_claude_3_7_sonnet.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/providers/cassettes/test_openrouter/test_openrouter_with_google_model.yaml +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/providers/test_anthropic.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/providers/test_azure.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/providers/test_bedrock.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/providers/test_cohere.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/providers/test_deepseek.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/providers/test_fireworks.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/providers/test_github.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/providers/test_google_gla.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/providers/test_grok.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/providers/test_groq.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/providers/test_heroku.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/providers/test_huggingface.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/providers/test_mistral.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/providers/test_moonshotai.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/providers/test_openai.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/providers/test_openrouter.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/providers/test_provider_names.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/providers/test_together.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/providers/test_vercel.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/test_a2a.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/test_ag_ui.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/test_cli.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/test_deps.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/test_direct.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/test_examples.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/test_format_as_xml.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/test_history_processor.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/test_json_body_serializer.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/test_logfire.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/test_mcp.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/test_parts_manager.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/test_settings.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/test_streaming.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/test_tenacity.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/test_thinking_part.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/test_toolsets.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/test_usage_limits.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/test_utils.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/typed_agent.py +0 -0
- {pydantic_ai-0.4.11 → pydantic_ai-0.5.1}/tests/typed_graph.py +0 -0
|
@@ -60,13 +60,10 @@ typecheck-both: typecheck-pyright typecheck-mypy
|
|
|
60
60
|
|
|
61
61
|
.PHONY: test
|
|
62
62
|
test: ## Run tests and collect coverage data
|
|
63
|
-
uv run coverage run -m pytest
|
|
63
|
+
COVERAGE_PROCESS_START=./pyproject.toml uv run coverage run -m pytest -n auto --dist=loadgroup
|
|
64
|
+
@uv run coverage combine
|
|
64
65
|
@uv run coverage report
|
|
65
66
|
|
|
66
|
-
.PHONY: test-fast
|
|
67
|
-
test-fast: ## Same as test except no coverage and 4x faster depending on hardware
|
|
68
|
-
uv run pytest -n auto --dist=loadgroup
|
|
69
|
-
|
|
70
67
|
.PHONY: test-all-python
|
|
71
68
|
test-all-python: ## Run tests on Python 3.9 to 3.13
|
|
72
69
|
UV_PROJECT_ENVIRONMENT=.venv39 uv run --python 3.9 --all-extras --all-packages coverage run -p -m pytest
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: pydantic-ai
|
|
3
|
-
Version: 0.4.11
|
|
3
|
+
Version: 0.5.1
|
|
4
4
|
Summary: Agent Framework / shim to use Pydantic with LLMs
|
|
5
5
|
Project-URL: Homepage, https://ai.pydantic.dev
|
|
6
6
|
Project-URL: Source, https://github.com/pydantic/pydantic-ai
|
|
@@ -28,11 +28,11 @@ Classifier: Topic :: Internet
|
|
|
28
28
|
Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
|
|
29
29
|
Classifier: Topic :: Software Development :: Libraries :: Python Modules
|
|
30
30
|
Requires-Python: >=3.9
|
|
31
|
-
Requires-Dist: pydantic-ai-slim[ag-ui,anthropic,bedrock,cli,cohere,evals,google,groq,huggingface,mcp,mistral,openai,retries,vertexai]==0.4.11
|
|
31
|
+
Requires-Dist: pydantic-ai-slim[ag-ui,anthropic,bedrock,cli,cohere,evals,google,groq,huggingface,mcp,mistral,openai,retries,vertexai]==0.5.1
|
|
32
32
|
Provides-Extra: a2a
|
|
33
33
|
Requires-Dist: fasta2a>=0.4.1; extra == 'a2a'
|
|
34
34
|
Provides-Extra: examples
|
|
35
|
-
Requires-Dist: pydantic-ai-examples==0.4.11; extra == 'examples'
|
|
35
|
+
Requires-Dist: pydantic-ai-examples==0.5.1; extra == 'examples'
|
|
36
36
|
Provides-Extra: logfire
|
|
37
37
|
Requires-Dist: logfire>=3.11.0; extra == 'logfire'
|
|
38
38
|
Description-Content-Type: text/markdown
|
|
@@ -215,6 +215,10 @@ filterwarnings = [
|
|
|
215
215
|
|
|
216
216
|
# https://coverage.readthedocs.io/en/latest/config.html#run
|
|
217
217
|
[tool.coverage.run]
|
|
218
|
+
parallel = true
|
|
219
|
+
concurrency = ["multiprocessing", "thread"]
|
|
220
|
+
# We use a subdirectory for coverage data to avoid noisy coverage data files.
|
|
221
|
+
data_file = ".coverage/.coverage"
|
|
218
222
|
# required to avoid warnings about files created by create_module fixture
|
|
219
223
|
include = [
|
|
220
224
|
"pydantic_ai_slim/**/*.py",
|
|
@@ -245,6 +249,7 @@ source = [
|
|
|
245
249
|
|
|
246
250
|
# https://coverage.readthedocs.io/en/latest/config.html#report
|
|
247
251
|
[tool.coverage.report]
|
|
252
|
+
fail_under = 100
|
|
248
253
|
skip_covered = true
|
|
249
254
|
show_missing = true
|
|
250
255
|
ignore_errors = true
|
|
@@ -251,7 +251,7 @@ def pytest_recording_configure(config: Any, vcr: VCR):
|
|
|
251
251
|
def mock_vcr_aiohttp_content(mocker: MockerFixture):
|
|
252
252
|
try:
|
|
253
253
|
from vcr.stubs import aiohttp_stubs
|
|
254
|
-
except ImportError:
|
|
254
|
+
except ImportError: # pragma: lax no cover
|
|
255
255
|
return
|
|
256
256
|
|
|
257
257
|
# google-genai calls `self.response_stream.content.readline()` where `self.response_stream` is a `MockClientResponse`,
|
|
@@ -416,9 +416,9 @@ def vertex_provider_auth(mocker: MockerFixture) -> None: # pragma: lax no cover
|
|
|
416
416
|
|
|
417
417
|
|
|
418
418
|
@pytest.fixture()
|
|
419
|
-
async def vertex_provider():
|
|
419
|
+
async def vertex_provider(): # pragma: lax no cover
|
|
420
420
|
# NOTE: You need to comment out this line to rewrite the cassettes locally.
|
|
421
|
-
if not os.getenv('CI', False):
|
|
421
|
+
if not os.getenv('CI', False):
|
|
422
422
|
pytest.skip('Requires properly configured local google vertex config to pass')
|
|
423
423
|
|
|
424
424
|
try:
|
|
@@ -478,10 +478,10 @@ def model(
|
|
|
478
478
|
|
|
479
479
|
return CohereModel('command-r-plus', provider=CohereProvider(api_key=co_api_key))
|
|
480
480
|
elif request.param == 'gemini':
|
|
481
|
-
from pydantic_ai.models.gemini import GeminiModel
|
|
481
|
+
from pydantic_ai.models.gemini import GeminiModel # type: ignore[reportDeprecated]
|
|
482
482
|
from pydantic_ai.providers.google_gla import GoogleGLAProvider
|
|
483
483
|
|
|
484
|
-
return GeminiModel('gemini-1.5-flash', provider=GoogleGLAProvider(api_key=gemini_api_key))
|
|
484
|
+
return GeminiModel('gemini-1.5-flash', provider=GoogleGLAProvider(api_key=gemini_api_key)) # type: ignore[reportDeprecated]
|
|
485
485
|
elif request.param == 'google':
|
|
486
486
|
from pydantic_ai.models.google import GoogleModel
|
|
487
487
|
from pydantic_ai.providers.google import GoogleProvider
|
|
@@ -7,11 +7,11 @@ from pathlib import Path
|
|
|
7
7
|
from typing import Any
|
|
8
8
|
|
|
9
9
|
import pytest
|
|
10
|
-
from dirty_equals import HasRepr, IsNumber
|
|
10
|
+
from dirty_equals import HasRepr, IsNumber, IsPartialDict
|
|
11
11
|
from inline_snapshot import snapshot
|
|
12
|
-
from pydantic import BaseModel
|
|
12
|
+
from pydantic import BaseModel, TypeAdapter
|
|
13
13
|
|
|
14
|
-
from ..conftest import
|
|
14
|
+
from ..conftest import try_import
|
|
15
15
|
from .utils import render_table
|
|
16
16
|
|
|
17
17
|
with try_import() as imports_successful:
|
|
@@ -20,7 +20,7 @@ with try_import() as imports_successful:
|
|
|
20
20
|
|
|
21
21
|
from pydantic_evals import Case, Dataset
|
|
22
22
|
from pydantic_evals.dataset import increment_eval_metric, set_eval_attribute
|
|
23
|
-
from pydantic_evals.evaluators import EvaluationResult, Evaluator, EvaluatorOutput, LLMJudge, Python
|
|
23
|
+
from pydantic_evals.evaluators import EvaluationResult, Evaluator, EvaluatorOutput, EvaluatorSpec, LLMJudge, Python
|
|
24
24
|
from pydantic_evals.evaluators.context import EvaluatorContext
|
|
25
25
|
|
|
26
26
|
@dataclass
|
|
@@ -32,7 +32,7 @@ with try_import() as imports_successful:
|
|
|
32
32
|
def evaluate(self, ctx: EvaluatorContext[object, object, object]) -> EvaluatorOutput:
|
|
33
33
|
return self.output
|
|
34
34
|
|
|
35
|
-
from pydantic_evals.reporting import ReportCase, ReportCaseAdapter
|
|
35
|
+
from pydantic_evals.reporting import EvaluationReport, ReportCase, ReportCaseAdapter
|
|
36
36
|
|
|
37
37
|
pytestmark = [pytest.mark.skipif(not imports_successful(), reason='pydantic-evals not installed'), pytest.mark.anyio]
|
|
38
38
|
|
|
@@ -456,13 +456,13 @@ async def test_repeated_name_outputs(example_dataset: Dataset[TaskInput, TaskOut
|
|
|
456
456
|
scores={},
|
|
457
457
|
labels={
|
|
458
458
|
'output': EvaluationResult(
|
|
459
|
-
name='output', value='a', reason=None, source=MockEvaluator(output={'output': 'a'})
|
|
459
|
+
name='output', value='a', reason=None, source=MockEvaluator(output={'output': 'a'}).as_spec()
|
|
460
460
|
),
|
|
461
461
|
'output_2': EvaluationResult(
|
|
462
|
-
name='output', value='b', reason=None, source=MockEvaluator(output={'output': 'b'})
|
|
462
|
+
name='output', value='b', reason=None, source=MockEvaluator(output={'output': 'b'}).as_spec()
|
|
463
463
|
),
|
|
464
464
|
'output_3': EvaluationResult(
|
|
465
|
-
name='output', value='c', reason=None, source=MockEvaluator(output={'output': 'c'})
|
|
465
|
+
name='output', value='c', reason=None, source=MockEvaluator(output={'output': 'c'}).as_spec()
|
|
466
466
|
),
|
|
467
467
|
},
|
|
468
468
|
assertions={},
|
|
@@ -482,13 +482,13 @@ async def test_repeated_name_outputs(example_dataset: Dataset[TaskInput, TaskOut
|
|
|
482
482
|
scores={},
|
|
483
483
|
labels={
|
|
484
484
|
'output': EvaluationResult(
|
|
485
|
-
name='output', value='a', reason=None, source=MockEvaluator(output={'output': 'a'})
|
|
485
|
+
name='output', value='a', reason=None, source=MockEvaluator(output={'output': 'a'}).as_spec()
|
|
486
486
|
),
|
|
487
487
|
'output_2': EvaluationResult(
|
|
488
|
-
name='output', value='b', reason=None, source=MockEvaluator(output={'output': 'b'})
|
|
488
|
+
name='output', value='b', reason=None, source=MockEvaluator(output={'output': 'b'}).as_spec()
|
|
489
489
|
),
|
|
490
490
|
'output_3': EvaluationResult(
|
|
491
|
-
name='output', value='c', reason=None, source=MockEvaluator(output={'output': 'c'})
|
|
491
|
+
name='output', value='c', reason=None, source=MockEvaluator(output={'output': 'c'}).as_spec()
|
|
492
492
|
),
|
|
493
493
|
},
|
|
494
494
|
assertions={},
|
|
@@ -501,6 +501,73 @@ async def test_repeated_name_outputs(example_dataset: Dataset[TaskInput, TaskOut
|
|
|
501
501
|
)
|
|
502
502
|
|
|
503
503
|
|
|
504
|
+
async def test_report_round_trip_serialization(example_dataset: Dataset[TaskInput, TaskOutput, TaskMetadata]):
|
|
505
|
+
"""Test the increment_eval_metric function."""
|
|
506
|
+
|
|
507
|
+
async def my_task(inputs: TaskInput) -> TaskOutput:
|
|
508
|
+
return TaskOutput(answer=f'answer to {inputs.query}')
|
|
509
|
+
|
|
510
|
+
example_dataset.add_evaluator(MockEvaluator({'output': 'a'}))
|
|
511
|
+
|
|
512
|
+
report = await example_dataset.evaluate(my_task)
|
|
513
|
+
assert report == snapshot(
|
|
514
|
+
EvaluationReport(
|
|
515
|
+
name='my_task',
|
|
516
|
+
cases=[
|
|
517
|
+
ReportCase(
|
|
518
|
+
name='case1',
|
|
519
|
+
inputs=TaskInput(query='What is 2+2?'),
|
|
520
|
+
metadata=TaskMetadata(difficulty='easy', category='general'),
|
|
521
|
+
expected_output=TaskOutput(answer='4', confidence=1.0),
|
|
522
|
+
output=TaskOutput(answer='answer to What is 2+2?', confidence=1.0),
|
|
523
|
+
metrics={},
|
|
524
|
+
attributes={},
|
|
525
|
+
scores={},
|
|
526
|
+
labels={
|
|
527
|
+
'output': EvaluationResult(
|
|
528
|
+
name='output',
|
|
529
|
+
value='a',
|
|
530
|
+
reason=None,
|
|
531
|
+
source=EvaluatorSpec(name='MockEvaluator', arguments=({'output': 'a'},)),
|
|
532
|
+
)
|
|
533
|
+
},
|
|
534
|
+
assertions={},
|
|
535
|
+
task_duration=1.0,
|
|
536
|
+
total_duration=6.0,
|
|
537
|
+
trace_id='00000000000000000000000000000001',
|
|
538
|
+
span_id='0000000000000003',
|
|
539
|
+
),
|
|
540
|
+
ReportCase(
|
|
541
|
+
name='case2',
|
|
542
|
+
inputs=TaskInput(query='What is the capital of France?'),
|
|
543
|
+
metadata=TaskMetadata(difficulty='medium', category='geography'),
|
|
544
|
+
expected_output=TaskOutput(answer='Paris', confidence=1.0),
|
|
545
|
+
output=TaskOutput(answer='answer to What is the capital of France?', confidence=1.0),
|
|
546
|
+
metrics={},
|
|
547
|
+
attributes={},
|
|
548
|
+
scores={},
|
|
549
|
+
labels={
|
|
550
|
+
'output': EvaluationResult(
|
|
551
|
+
name='output',
|
|
552
|
+
value='a',
|
|
553
|
+
reason=None,
|
|
554
|
+
source=EvaluatorSpec(name='MockEvaluator', arguments=({'output': 'a'},)),
|
|
555
|
+
)
|
|
556
|
+
},
|
|
557
|
+
assertions={},
|
|
558
|
+
task_duration=1.0,
|
|
559
|
+
total_duration=4.0,
|
|
560
|
+
trace_id='00000000000000000000000000000001',
|
|
561
|
+
span_id='0000000000000007',
|
|
562
|
+
),
|
|
563
|
+
],
|
|
564
|
+
)
|
|
565
|
+
)
|
|
566
|
+
|
|
567
|
+
report_adapter = TypeAdapter(EvaluationReport[TaskInput, TaskOutput, TaskMetadata])
|
|
568
|
+
assert report == report_adapter.validate_json(report_adapter.dump_json(report, indent=2))
|
|
569
|
+
|
|
570
|
+
|
|
504
571
|
async def test_genai_attribute_collection(example_dataset: Dataset[TaskInput, TaskOutput, TaskMetadata]):
|
|
505
572
|
async def my_task(inputs: TaskInput) -> TaskOutput:
|
|
506
573
|
with logfire.span(
|
|
@@ -1092,7 +1159,7 @@ async def test_evaluate_async_logfire(
|
|
|
1092
1159
|
example_dataset: Dataset[TaskInput, TaskOutput, TaskMetadata],
|
|
1093
1160
|
simple_evaluator: type[Evaluator[TaskInput, TaskOutput, TaskMetadata]],
|
|
1094
1161
|
capfire: CaptureLogfire,
|
|
1095
|
-
):
|
|
1162
|
+
): # pragma: lax no cover
|
|
1096
1163
|
"""Test evaluating a dataset."""
|
|
1097
1164
|
example_dataset.add_evaluator(simple_evaluator())
|
|
1098
1165
|
|
|
@@ -1130,90 +1197,90 @@ async def test_evaluate_async_logfire(
|
|
|
1130
1197
|
'parent': None,
|
|
1131
1198
|
'start_time': 1000000000,
|
|
1132
1199
|
},
|
|
1133
|
-
|
|
1134
|
-
|
|
1135
|
-
'
|
|
1136
|
-
|
|
1137
|
-
|
|
1138
|
-
|
|
1139
|
-
|
|
1140
|
-
|
|
1141
|
-
|
|
1142
|
-
|
|
1143
|
-
|
|
1144
|
-
|
|
1145
|
-
|
|
1146
|
-
|
|
1147
|
-
|
|
1148
|
-
|
|
1149
|
-
|
|
1150
|
-
|
|
1151
|
-
|
|
1152
|
-
|
|
1153
|
-
|
|
1154
|
-
|
|
1155
|
-
|
|
1156
|
-
|
|
1157
|
-
|
|
1158
|
-
|
|
1159
|
-
|
|
1160
|
-
|
|
1161
|
-
|
|
1162
|
-
'
|
|
1163
|
-
|
|
1164
|
-
|
|
1165
|
-
|
|
1166
|
-
|
|
1167
|
-
|
|
1168
|
-
|
|
1169
|
-
|
|
1170
|
-
|
|
1171
|
-
|
|
1172
|
-
|
|
1173
|
-
|
|
1174
|
-
|
|
1175
|
-
|
|
1176
|
-
|
|
1177
|
-
|
|
1178
|
-
'
|
|
1179
|
-
|
|
1180
|
-
|
|
1181
|
-
|
|
1182
|
-
|
|
1183
|
-
|
|
1184
|
-
|
|
1185
|
-
|
|
1186
|
-
|
|
1187
|
-
|
|
1188
|
-
|
|
1189
|
-
|
|
1190
|
-
|
|
1191
|
-
|
|
1192
|
-
|
|
1193
|
-
|
|
1194
|
-
|
|
1195
|
-
|
|
1196
|
-
|
|
1197
|
-
|
|
1198
|
-
|
|
1199
|
-
|
|
1200
|
-
|
|
1201
|
-
|
|
1202
|
-
|
|
1203
|
-
|
|
1204
|
-
|
|
1205
|
-
'
|
|
1206
|
-
|
|
1207
|
-
|
|
1208
|
-
|
|
1209
|
-
|
|
1210
|
-
|
|
1211
|
-
|
|
1212
|
-
|
|
1213
|
-
|
|
1214
|
-
|
|
1215
|
-
|
|
1216
|
-
|
|
1217
|
-
|
|
1218
|
-
|
|
1200
|
+
IsPartialDict(
|
|
1201
|
+
{
|
|
1202
|
+
'attributes': {
|
|
1203
|
+
'assertions': '{"correct":{"name":"correct","value":true,"reason":null,"source":{"name":"SimpleEvaluator","arguments":null}}}',
|
|
1204
|
+
'attributes': '{}',
|
|
1205
|
+
'case_name': 'case1',
|
|
1206
|
+
'expected_output': '{"answer":"4","confidence":1.0}',
|
|
1207
|
+
'inputs': '{"query":"What is 2+2?"}',
|
|
1208
|
+
'labels': '{}',
|
|
1209
|
+
'logfire.json_schema': '{"type":"object","properties":{"task_name":{},"case_name":{},"inputs":{"type":"object","title":"TaskInput","x-python-datatype":"PydanticModel"},"metadata":{"type":"object","title":"TaskMetadata","x-python-datatype":"PydanticModel"},"expected_output":{"type":"object","title":"TaskOutput","x-python-datatype":"PydanticModel"},"output":{"type":"object","title":"TaskOutput","x-python-datatype":"PydanticModel"},"task_duration":{},"metrics":{"type":"object"},"attributes":{"type":"object"},"assertions":{"type":"object"},"scores":{"type":"object"},"labels":{"type":"object"}}}',
|
|
1210
|
+
'logfire.msg': 'case: case1',
|
|
1211
|
+
'logfire.msg_template': 'case: {case_name}',
|
|
1212
|
+
'logfire.span_type': 'span',
|
|
1213
|
+
'metadata': '{"difficulty":"easy","category":"general"}',
|
|
1214
|
+
'metrics': '{}',
|
|
1215
|
+
'output': '{"answer":"4","confidence":1.0}',
|
|
1216
|
+
'scores': '{"confidence":{"name":"confidence","value":1.0,"reason":null,"source":{"name":"SimpleEvaluator","arguments":null}}}',
|
|
1217
|
+
'task_duration': 1.0,
|
|
1218
|
+
'task_name': 'mock_async_task',
|
|
1219
|
+
},
|
|
1220
|
+
'context': {'is_remote': False, 'span_id': 3, 'trace_id': 1},
|
|
1221
|
+
'end_time': 8000000000,
|
|
1222
|
+
'name': 'case: {case_name}',
|
|
1223
|
+
'parent': {'is_remote': False, 'span_id': 1, 'trace_id': 1},
|
|
1224
|
+
'start_time': 2000000000,
|
|
1225
|
+
}
|
|
1226
|
+
),
|
|
1227
|
+
IsPartialDict(
|
|
1228
|
+
{
|
|
1229
|
+
'attributes': {
|
|
1230
|
+
'logfire.json_schema': '{"type":"object","properties":{"task":{}}}',
|
|
1231
|
+
'logfire.msg': 'execute mock_async_task',
|
|
1232
|
+
'logfire.msg_template': 'execute {task}',
|
|
1233
|
+
'logfire.span_type': 'span',
|
|
1234
|
+
'task': 'mock_async_task',
|
|
1235
|
+
},
|
|
1236
|
+
'context': {'is_remote': False, 'span_id': 5, 'trace_id': 1},
|
|
1237
|
+
'end_time': 4000000000,
|
|
1238
|
+
'name': 'execute {task}',
|
|
1239
|
+
'parent': {'is_remote': False, 'span_id': 3, 'trace_id': 1},
|
|
1240
|
+
'start_time': 3000000000,
|
|
1241
|
+
}
|
|
1242
|
+
),
|
|
1243
|
+
IsPartialDict(
|
|
1244
|
+
{
|
|
1245
|
+
'attributes': {
|
|
1246
|
+
'assertions': '{"correct":{"name":"correct","value":true,"reason":null,"source":{"name":"SimpleEvaluator","arguments":null}}}',
|
|
1247
|
+
'attributes': '{}',
|
|
1248
|
+
'case_name': 'case2',
|
|
1249
|
+
'expected_output': '{"answer":"Paris","confidence":1.0}',
|
|
1250
|
+
'inputs': '{"query":"What is the capital of France?"}',
|
|
1251
|
+
'labels': '{}',
|
|
1252
|
+
'logfire.json_schema': '{"type":"object","properties":{"task_name":{},"case_name":{},"inputs":{"type":"object","title":"TaskInput","x-python-datatype":"PydanticModel"},"metadata":{"type":"object","title":"TaskMetadata","x-python-datatype":"PydanticModel"},"expected_output":{"type":"object","title":"TaskOutput","x-python-datatype":"PydanticModel"},"output":{"type":"object","title":"TaskOutput","x-python-datatype":"PydanticModel"},"task_duration":{},"metrics":{"type":"object"},"attributes":{"type":"object"},"assertions":{"type":"object"},"scores":{"type":"object"},"labels":{"type":"object"}}}',
|
|
1253
|
+
'logfire.msg': 'case: case2',
|
|
1254
|
+
'logfire.msg_template': 'case: {case_name}',
|
|
1255
|
+
'logfire.span_type': 'span',
|
|
1256
|
+
'metadata': '{"difficulty":"medium","category":"geography"}',
|
|
1257
|
+
'metrics': '{}',
|
|
1258
|
+
'output': '{"answer":"Paris","confidence":1.0}',
|
|
1259
|
+
'scores': '{"confidence":{"name":"confidence","value":1.0,"reason":null,"source":{"name":"SimpleEvaluator","arguments":null}}}',
|
|
1260
|
+
'task_duration': 1.0,
|
|
1261
|
+
'task_name': 'mock_async_task',
|
|
1262
|
+
},
|
|
1263
|
+
'context': {'is_remote': False, 'span_id': 7, 'trace_id': 1},
|
|
1264
|
+
'end_time': 9000000000,
|
|
1265
|
+
'name': 'case: {case_name}',
|
|
1266
|
+
'parent': {'is_remote': False, 'span_id': 1, 'trace_id': 1},
|
|
1267
|
+
'start_time': 5000000000,
|
|
1268
|
+
}
|
|
1269
|
+
),
|
|
1270
|
+
IsPartialDict(
|
|
1271
|
+
{
|
|
1272
|
+
'attributes': {
|
|
1273
|
+
'logfire.json_schema': '{"type":"object","properties":{"task":{}}}',
|
|
1274
|
+
'logfire.msg': 'execute mock_async_task',
|
|
1275
|
+
'logfire.msg_template': 'execute {task}',
|
|
1276
|
+
'logfire.span_type': 'span',
|
|
1277
|
+
'task': 'mock_async_task',
|
|
1278
|
+
},
|
|
1279
|
+
'context': {'is_remote': False, 'span_id': 9, 'trace_id': 1},
|
|
1280
|
+
'end_time': 7000000000,
|
|
1281
|
+
'name': 'execute {task}',
|
|
1282
|
+
'parent': {'is_remote': False, 'span_id': 7, 'trace_id': 1},
|
|
1283
|
+
'start_time': 6000000000,
|
|
1284
|
+
}
|
|
1285
|
+
),
|
|
1219
1286
|
]
|
|
@@ -52,11 +52,11 @@ def test_evaluation_result():
|
|
|
52
52
|
evaluator = DummyEvaluator()
|
|
53
53
|
|
|
54
54
|
# Test basic result
|
|
55
|
-
result = EvaluationResult(name='test', value=True, reason='Success', source=evaluator)
|
|
55
|
+
result = EvaluationResult(name='test', value=True, reason='Success', source=evaluator.as_spec())
|
|
56
56
|
assert result.name == 'test'
|
|
57
57
|
assert result.value is True
|
|
58
58
|
assert result.reason == 'Success'
|
|
59
|
-
assert result.source == evaluator
|
|
59
|
+
assert result.source == evaluator.as_spec()
|
|
60
60
|
|
|
61
61
|
# Test downcast with matching type
|
|
62
62
|
downcast = result.downcast(bool)
|
|
@@ -6,7 +6,7 @@ from pydantic import ValidationError
|
|
|
6
6
|
from ..conftest import try_import
|
|
7
7
|
|
|
8
8
|
with try_import() as imports_successful:
|
|
9
|
-
from pydantic_evals.evaluators._spec import (
|
|
9
|
+
from pydantic_evals.evaluators.spec import (
|
|
10
10
|
EvaluatorSpec,
|
|
11
11
|
_SerializedEvaluatorSpec, # pyright: ignore[reportPrivateUsage]
|
|
12
12
|
)
|
|
@@ -19,7 +19,6 @@ with try_import() as imports_successful:
|
|
|
19
19
|
from logfire.testing import CaptureLogfire
|
|
20
20
|
|
|
21
21
|
from pydantic_evals.evaluators._run_evaluator import run_evaluator
|
|
22
|
-
from pydantic_evals.evaluators._spec import EvaluatorSpec
|
|
23
22
|
from pydantic_evals.evaluators.common import (
|
|
24
23
|
Contains,
|
|
25
24
|
Equals,
|
|
@@ -36,6 +35,7 @@ with try_import() as imports_successful:
|
|
|
36
35
|
Evaluator,
|
|
37
36
|
EvaluatorOutput,
|
|
38
37
|
)
|
|
38
|
+
from pydantic_evals.evaluators.spec import EvaluatorSpec
|
|
39
39
|
from pydantic_evals.otel._context_in_memory_span_exporter import context_subtree
|
|
40
40
|
from pydantic_evals.otel.span_tree import SpanQuery, SpanTree
|
|
41
41
|
|
|
@@ -162,7 +162,7 @@ async def test_evaluator_call(test_context: EvaluatorContext[TaskInput, TaskOutp
|
|
|
162
162
|
assert results[0].name == 'result'
|
|
163
163
|
assert results[0].value == 'passed'
|
|
164
164
|
assert results[0].reason is None
|
|
165
|
-
assert results[0].source
|
|
165
|
+
assert results[0].source == EvaluatorSpec(name='ExampleEvaluator', arguments=None)
|
|
166
166
|
|
|
167
167
|
|
|
168
168
|
async def test_is_instance_evaluator():
|
|
@@ -242,7 +242,14 @@ async def test_custom_evaluator_name(test_context: EvaluatorContext[TaskInput, T
|
|
|
242
242
|
evaluator = CustomNameFieldEvaluator(result=123, evaluation_name='abc')
|
|
243
243
|
|
|
244
244
|
assert to_jsonable_python(await run_evaluator(evaluator, test_context)) == snapshot(
|
|
245
|
-
[
|
|
245
|
+
[
|
|
246
|
+
{
|
|
247
|
+
'name': 'abc',
|
|
248
|
+
'reason': None,
|
|
249
|
+
'source': {'arguments': {'evaluation_name': 'abc', 'result': 123}, 'name': 'CustomNameFieldEvaluator'},
|
|
250
|
+
'value': 123,
|
|
251
|
+
}
|
|
252
|
+
]
|
|
246
253
|
)
|
|
247
254
|
|
|
248
255
|
@dataclass
|
|
@@ -260,7 +267,14 @@ async def test_custom_evaluator_name(test_context: EvaluatorContext[TaskInput, T
|
|
|
260
267
|
evaluator = CustomNamePropertyEvaluator(result=123, my_name='marcelo')
|
|
261
268
|
|
|
262
269
|
assert to_jsonable_python(await run_evaluator(evaluator, test_context)) == snapshot(
|
|
263
|
-
[
|
|
270
|
+
[
|
|
271
|
+
{
|
|
272
|
+
'name': 'hello marcelo',
|
|
273
|
+
'reason': None,
|
|
274
|
+
'source': {'arguments': {'my_name': 'marcelo', 'result': 123}, 'name': 'CustomNamePropertyEvaluator'},
|
|
275
|
+
'value': 123,
|
|
276
|
+
}
|
|
277
|
+
]
|
|
264
278
|
)
|
|
265
279
|
|
|
266
280
|
|