PyPI - vellum-ai - Versions diffs - 0.7.3__py3-none-any.whl → 0.7.5__py3-none-any.whl - Mend

vellum-ai 0.7.3py3-none-any.whl → 0.7.5py3-none-any.whl

Files changed (483) hide show

vellum/__init__.py +142 -94
vellum/client.py +1051 -1097
vellum/core/__init__.py +4 -1
vellum/core/client_wrapper.py +7 -3
vellum/core/http_client.py +365 -20
vellum/core/jsonable_encoder.py +3 -0
vellum/core/pydantic_utilities.py +16 -0
vellum/core/query_encoder.py +33 -0
vellum/core/remove_none_from_dict.py +2 -2
vellum/core/request_options.py +2 -2
vellum/resources/__init__.py +2 -0
vellum/resources/deployments/client.py +349 -377
vellum/resources/document_indexes/client.py +542 -610
vellum/resources/documents/client.py +327 -399
vellum/resources/folder_entities/client.py +56 -72
vellum/{types/map_enum.py → resources/ml_models/__init__.py} +0 -3
vellum/resources/ml_models/client.py +837 -0
vellum/resources/sandboxes/client.py +204 -242
vellum/resources/test_suite_runs/client.py +183 -213
vellum/resources/test_suites/client.py +307 -311
vellum/resources/workflow_deployments/client.py +230 -268
vellum/resources/workflow_sandboxes/client.py +82 -96
vellum/terraform/_jsii/vellum-ai_vellum@0.0.0.jsii.tgz +0 -0
vellum/terraform/data_vellum_document_index/__init__.py +10 -10
vellum/terraform/document_index/__init__.py +17 -17
vellum/terraform/provider/__init__.py +57 -12
vellum/terraform/versions.json +1 -1
vellum/types/__init__.py +148 -96
vellum/types/api_node_result.py +7 -3
vellum/types/api_node_result_data.py +7 -3
vellum/types/array_chat_message_content.py +7 -3
vellum/types/array_chat_message_content_item.py +53 -12
vellum/types/array_chat_message_content_item_request.py +53 -12
vellum/types/array_chat_message_content_request.py +7 -3
vellum/types/array_parameter_config.py +50 -0
vellum/types/array_parameter_config_request.py +50 -0
vellum/types/array_variable_value_item.py +102 -24
vellum/types/array_vellum_value_item.py +102 -24
vellum/types/array_vellum_value_item_request.py +102 -24
vellum/types/basic_vectorizer_intfloat_multilingual_e_5_large.py +7 -3
vellum/types/basic_vectorizer_intfloat_multilingual_e_5_large_request.py +7 -3
vellum/types/basic_vectorizer_sentence_transformers_multi_qa_mpnet_base_cos_v_1.py +7 -3
vellum/types/basic_vectorizer_sentence_transformers_multi_qa_mpnet_base_cos_v_1_request.py +7 -3
vellum/types/basic_vectorizer_sentence_transformers_multi_qa_mpnet_base_dot_v_1.py +7 -3
vellum/types/basic_vectorizer_sentence_transformers_multi_qa_mpnet_base_dot_v_1_request.py +7 -3
vellum/types/boolean_parameter_config.py +35 -0
vellum/types/boolean_parameter_config_request.py +35 -0
vellum/types/chat_history_input_request.py +7 -3
vellum/types/chat_message.py +7 -3
vellum/types/chat_message_content.py +70 -16
vellum/types/chat_message_content_request.py +70 -16
vellum/types/chat_message_request.py +7 -3
vellum/types/code_execution_node_array_result.py +7 -3
vellum/types/code_execution_node_chat_history_result.py +7 -3
vellum/types/code_execution_node_error_result.py +7 -3
vellum/types/code_execution_node_function_call_result.py +7 -3
vellum/types/code_execution_node_json_result.py +7 -3
vellum/types/code_execution_node_number_result.py +7 -3
vellum/types/code_execution_node_result.py +7 -3
vellum/types/code_execution_node_result_data.py +7 -3
vellum/types/code_execution_node_result_output.py +144 -32
vellum/types/code_execution_node_search_results_result.py +7 -3
vellum/types/code_execution_node_string_result.py +7 -3
vellum/types/compile_prompt_deployment_expand_meta_request.py +7 -3
vellum/types/compile_prompt_meta.py +7 -3
vellum/types/conditional_node_result.py +7 -3
vellum/types/conditional_node_result_data.py +7 -3
vellum/types/const_parameter_config.py +35 -0
vellum/types/const_parameter_config_request.py +35 -0
vellum/types/create_test_suite_test_case_request.py +7 -3
vellum/types/deployment_provider_payload_response.py +7 -3
vellum/types/deployment_read.py +12 -3
vellum/types/deployment_release_tag_deployment_history_item.py +7 -3
vellum/types/deployment_release_tag_read.py +7 -3
vellum/types/document_document_to_document_index.py +7 -3
vellum/types/document_index_chunking.py +54 -12
vellum/types/document_index_chunking_request.py +54 -12
vellum/types/document_index_indexing_config.py +7 -3
vellum/types/document_index_indexing_config_request.py +7 -3
vellum/types/document_index_read.py +7 -3
vellum/types/document_read.py +7 -3
vellum/types/enriched_normalized_completion.py +7 -3
vellum/types/error_variable_value.py +7 -3
vellum/types/error_vellum_value.py +7 -3
vellum/types/error_vellum_value_request.py +7 -3
vellum/types/execute_prompt_event.py +82 -16
vellum/types/execute_prompt_response.py +44 -8
vellum/types/execute_workflow_response.py +7 -3
vellum/types/execute_workflow_workflow_result_event.py +41 -8
vellum/types/execution_array_vellum_value.py +7 -3
vellum/types/execution_chat_history_vellum_value.py +7 -3
vellum/types/execution_error_vellum_value.py +7 -3
vellum/types/execution_function_call_vellum_value.py +7 -3
vellum/types/execution_json_vellum_value.py +7 -3
vellum/types/execution_number_vellum_value.py +7 -3
vellum/types/execution_search_results_vellum_value.py +7 -3
vellum/types/execution_string_vellum_value.py +7 -3
vellum/types/execution_vellum_value.py +152 -32
vellum/types/external_test_case_execution.py +7 -3
vellum/types/external_test_case_execution_request.py +7 -3
vellum/types/fulfilled_execute_prompt_event.py +7 -3
vellum/types/fulfilled_execute_prompt_response.py +7 -3
vellum/types/fulfilled_execute_workflow_workflow_result_event.py +7 -3
vellum/types/fulfilled_prompt_execution_meta.py +7 -3
vellum/types/fulfilled_workflow_node_result_event.py +7 -3
vellum/types/function_call.py +7 -3
vellum/types/function_call_chat_message_content.py +7 -3
vellum/types/function_call_chat_message_content_request.py +7 -3
vellum/types/function_call_chat_message_content_value.py +7 -3
vellum/types/function_call_chat_message_content_value_request.py +7 -3
vellum/types/function_call_request.py +7 -3
vellum/types/function_call_variable_value.py +7 -3
vellum/types/function_call_vellum_value.py +7 -3
vellum/types/function_call_vellum_value_request.py +7 -3
vellum/types/generate_options_request.py +7 -3
vellum/types/generate_request.py +7 -3
vellum/types/generate_result.py +7 -3
vellum/types/generate_result_data.py +7 -3
vellum/types/generate_result_error.py +7 -3
vellum/types/generate_stream_response.py +7 -3
vellum/types/generate_stream_result.py +7 -3
vellum/types/generate_stream_result_data.py +7 -3
vellum/types/hkunlp_instructor_xl_vectorizer.py +7 -3
vellum/types/hkunlp_instructor_xl_vectorizer_request.py +7 -3
vellum/types/hosted_by_enum.py +26 -0
vellum/types/hugging_face_tokenizer_config.py +34 -0
vellum/types/hugging_face_tokenizer_config_request.py +34 -0
vellum/types/image_chat_message_content.py +7 -3
vellum/types/image_chat_message_content_request.py +7 -3
vellum/types/image_variable_value.py +7 -3
vellum/types/image_vellum_value.py +7 -3
vellum/types/image_vellum_value_request.py +7 -3
vellum/types/indexing_config_vectorizer.py +117 -36
vellum/types/indexing_config_vectorizer_request.py +117 -36
vellum/types/initiated_execute_prompt_event.py +7 -3
vellum/types/initiated_prompt_execution_meta.py +7 -3
vellum/types/initiated_workflow_node_result_event.py +7 -3
vellum/types/instructor_vectorizer_config.py +7 -3
vellum/types/instructor_vectorizer_config_request.py +7 -3
vellum/types/integer_parameter_config.py +39 -0
vellum/types/integer_parameter_config_request.py +39 -0
vellum/types/json_input_request.py +7 -3
vellum/types/json_variable_value.py +7 -3
vellum/types/json_vellum_value.py +7 -3
vellum/types/json_vellum_value_request.py +7 -3
vellum/types/map_node_result.py +7 -3
vellum/types/map_node_result_data.py +7 -3
vellum/types/merge_node_result.py +7 -3
vellum/types/merge_node_result_data.py +7 -3
vellum/types/metadata_filter_config_request.py +7 -3
vellum/types/metadata_filter_rule_request.py +7 -3
vellum/types/metric_node_result.py +7 -3
vellum/types/{execute_workflow_stream_error_response.py → ml_model_build_config.py} +9 -8
vellum/types/{execute_prompt_api_error_response.py → ml_model_build_config_request.py} +9 -8
vellum/types/ml_model_developer.py +27 -0
vellum/types/ml_model_developer_enum_value_label.py +31 -0
vellum/types/ml_model_display_config_labelled.py +33 -0
vellum/types/ml_model_display_config_request.py +33 -0
vellum/types/ml_model_display_tag.py +7 -0
vellum/types/ml_model_display_tag_enum_value_label.py +31 -0
vellum/types/ml_model_exec_config.py +40 -0
vellum/types/ml_model_exec_config_request.py +40 -0
vellum/types/ml_model_family.py +29 -0
vellum/types/ml_model_family_enum_value_label.py +31 -0
vellum/types/ml_model_feature.py +18 -0
vellum/types/ml_model_parameter_config.py +42 -0
vellum/types/ml_model_parameter_config_request.py +42 -0
vellum/types/ml_model_read.py +108 -0
vellum/types/ml_model_request_authorization_config.py +30 -0
vellum/types/ml_model_request_authorization_config_request.py +30 -0
vellum/types/ml_model_request_authorization_config_type_enum.py +5 -0
vellum/types/ml_model_request_config.py +32 -0
vellum/types/ml_model_request_config_request.py +32 -0
vellum/types/ml_model_response_config.py +31 -0
vellum/types/ml_model_response_config_request.py +31 -0
vellum/types/ml_model_tokenizer_config.py +59 -0
vellum/types/ml_model_tokenizer_config_request.py +61 -0
vellum/types/ml_model_usage.py +7 -3
vellum/types/named_scenario_input_chat_history_variable_value_request.py +7 -3
vellum/types/named_scenario_input_request.py +38 -8
vellum/types/named_scenario_input_string_variable_value_request.py +7 -3
vellum/types/named_test_case_array_variable_value.py +7 -3
vellum/types/named_test_case_array_variable_value_request.py +7 -3
vellum/types/named_test_case_chat_history_variable_value.py +7 -3
vellum/types/named_test_case_chat_history_variable_value_request.py +7 -3
vellum/types/named_test_case_error_variable_value.py +7 -3
vellum/types/named_test_case_error_variable_value_request.py +7 -3
vellum/types/named_test_case_function_call_variable_value.py +7 -3
vellum/types/named_test_case_function_call_variable_value_request.py +7 -3
vellum/types/named_test_case_json_variable_value.py +7 -3
vellum/types/named_test_case_json_variable_value_request.py +7 -3
vellum/types/named_test_case_number_variable_value.py +7 -3
vellum/types/named_test_case_number_variable_value_request.py +7 -3
vellum/types/named_test_case_search_results_variable_value.py +7 -3
vellum/types/named_test_case_search_results_variable_value_request.py +7 -3
vellum/types/named_test_case_string_variable_value.py +7 -3
vellum/types/named_test_case_string_variable_value_request.py +7 -3
vellum/types/named_test_case_variable_value.py +144 -32
vellum/types/named_test_case_variable_value_request.py +144 -32
vellum/types/node_input_compiled_array_value.py +7 -3
vellum/types/node_input_compiled_chat_history_value.py +7 -3
vellum/types/node_input_compiled_error_value.py +7 -3
vellum/types/node_input_compiled_function_call.py +7 -3
vellum/types/node_input_compiled_json_value.py +7 -3
vellum/types/node_input_compiled_number_value.py +7 -3
vellum/types/node_input_compiled_search_results_value.py +7 -3
vellum/types/node_input_compiled_string_value.py +7 -3
vellum/types/node_input_variable_compiled_value.py +152 -32
vellum/types/node_output_compiled_array_value.py +7 -3
vellum/types/node_output_compiled_chat_history_value.py +7 -3
vellum/types/node_output_compiled_error_value.py +7 -3
vellum/types/node_output_compiled_function_call_value.py +7 -3
vellum/types/node_output_compiled_json_value.py +7 -3
vellum/types/node_output_compiled_number_value.py +7 -3
vellum/types/node_output_compiled_search_results_value.py +7 -3
vellum/types/node_output_compiled_string_value.py +7 -3
vellum/types/node_output_compiled_value.py +153 -32
vellum/types/normalized_log_probs.py +7 -3
vellum/types/normalized_token_log_probs.py +7 -3
vellum/types/number_parameter_config.py +40 -0
vellum/types/number_parameter_config_request.py +40 -0
vellum/types/number_variable_value.py +7 -3
vellum/types/number_vellum_value.py +7 -3
vellum/types/number_vellum_value_request.py +7 -3
vellum/types/object_parameter_config.py +49 -0
vellum/types/object_parameter_config_request.py +49 -0
vellum/types/one_of_parameter_config.py +44 -0
vellum/types/one_of_parameter_config_request.py +44 -0
vellum/types/open_ai_vectorizer_config.py +7 -3
vellum/types/open_ai_vectorizer_config_request.py +7 -3
vellum/types/open_ai_vectorizer_text_embedding_3_large.py +7 -3
vellum/types/open_ai_vectorizer_text_embedding_3_large_request.py +7 -3
vellum/types/open_ai_vectorizer_text_embedding_3_small.py +7 -3
vellum/types/open_ai_vectorizer_text_embedding_3_small_request.py +7 -3
vellum/types/open_ai_vectorizer_text_embedding_ada_002.py +7 -3
vellum/types/open_ai_vectorizer_text_embedding_ada_002_request.py +7 -3
vellum/types/paginated_document_index_read_list.py +7 -3
vellum/types/paginated_ml_model_read_list.py +33 -0
vellum/types/paginated_slim_deployment_read_list.py +7 -3
vellum/types/paginated_slim_document_list.py +7 -3
vellum/types/paginated_slim_workflow_deployment_list.py +7 -3
vellum/types/paginated_test_suite_run_execution_list.py +7 -3
vellum/types/paginated_test_suite_test_case_list.py +7 -3
vellum/types/parameter_config.py +251 -0
vellum/types/parameter_config_request.py +251 -0
vellum/types/pdf_search_result_meta_source.py +7 -3
vellum/types/pdf_search_result_meta_source_request.py +7 -3
vellum/types/prompt_deployment_expand_meta_request_request.py +7 -3
vellum/types/prompt_deployment_input_request.py +55 -12
vellum/types/prompt_execution_meta.py +7 -3
vellum/types/prompt_node_execution_meta.py +7 -3
vellum/types/prompt_node_result.py +7 -3
vellum/types/prompt_node_result_data.py +7 -3
vellum/types/prompt_output.py +69 -16
vellum/types/raw_prompt_execution_overrides_request.py +7 -3
vellum/types/reducto_chunker_config.py +7 -3
vellum/types/reducto_chunker_config_request.py +7 -3
vellum/types/reducto_chunking.py +7 -3
vellum/types/reducto_chunking_request.py +7 -3
vellum/types/rejected_execute_prompt_event.py +7 -3
vellum/types/rejected_execute_prompt_response.py +7 -3
vellum/types/rejected_execute_workflow_workflow_result_event.py +7 -3
vellum/types/rejected_prompt_execution_meta.py +7 -3
vellum/types/rejected_workflow_node_result_event.py +7 -3
vellum/types/replace_test_suite_test_case_request.py +7 -3
vellum/types/sandbox_scenario.py +7 -3
vellum/types/scenario_input.py +38 -8
vellum/types/scenario_input_chat_history_variable_value.py +7 -3
vellum/types/scenario_input_string_variable_value.py +7 -3
vellum/types/search_filters_request.py +7 -3
vellum/types/search_node_result.py +7 -3
vellum/types/search_node_result_data.py +7 -3
vellum/types/search_request_options_request.py +7 -3
vellum/types/search_response.py +7 -3
vellum/types/search_result.py +7 -3
vellum/types/search_result_document.py +7 -3
vellum/types/search_result_document_request.py +7 -3
vellum/types/search_result_merging_request.py +7 -3
vellum/types/search_result_meta.py +7 -3
vellum/types/search_result_meta_request.py +7 -3
vellum/types/search_result_meta_source.py +21 -5
vellum/types/search_result_meta_source_request.py +21 -5
vellum/types/search_result_request.py +7 -3
vellum/types/search_weights_request.py +7 -3
vellum/types/sentence_chunker_config.py +7 -3
vellum/types/sentence_chunker_config_request.py +7 -3
vellum/types/sentence_chunking.py +7 -3
vellum/types/sentence_chunking_request.py +7 -3
vellum/types/slim_deployment_read.py +11 -3
vellum/types/slim_document.py +7 -3
vellum/types/slim_workflow_deployment.py +12 -3
vellum/types/streaming_execute_prompt_event.py +7 -3
vellum/types/streaming_prompt_execution_meta.py +7 -3
vellum/types/streaming_workflow_node_result_event.py +7 -3
vellum/types/string_chat_message_content.py +7 -3
vellum/types/string_chat_message_content_request.py +7 -3
vellum/types/string_input_request.py +7 -3
vellum/types/string_parameter_config.py +39 -0
vellum/types/string_parameter_config_request.py +39 -0
vellum/types/string_variable_value.py +7 -3
vellum/types/string_vellum_value.py +7 -3
vellum/types/string_vellum_value_request.py +7 -3
vellum/types/submit_completion_actual_request.py +7 -3
vellum/types/submit_workflow_execution_actual_request.py +67 -12
vellum/types/subworkflow_node_result.py +7 -3
vellum/types/subworkflow_node_result_data.py +7 -3
vellum/types/templating_node_array_result.py +7 -3
vellum/types/templating_node_chat_history_result.py +7 -3
vellum/types/templating_node_error_result.py +7 -3
vellum/types/templating_node_function_call_result.py +7 -3
vellum/types/templating_node_json_result.py +7 -3
vellum/types/templating_node_number_result.py +7 -3
vellum/types/templating_node_result.py +7 -3
vellum/types/templating_node_result_data.py +7 -3
vellum/types/templating_node_result_output.py +144 -32
vellum/types/templating_node_search_results_result.py +7 -3
vellum/types/templating_node_string_result.py +7 -3
vellum/types/terminal_node_array_result.py +7 -3
vellum/types/terminal_node_chat_history_result.py +7 -3
vellum/types/terminal_node_error_result.py +7 -3
vellum/types/terminal_node_function_call_result.py +7 -3
vellum/types/terminal_node_json_result.py +7 -3
vellum/types/terminal_node_number_result.py +7 -3
vellum/types/terminal_node_result.py +7 -3
vellum/types/terminal_node_result_data.py +7 -3
vellum/types/terminal_node_result_output.py +152 -32
vellum/types/terminal_node_search_results_result.py +7 -3
vellum/types/terminal_node_string_result.py +7 -3
vellum/types/test_case_array_variable_value.py +7 -3
vellum/types/test_case_chat_history_variable_value.py +7 -3
vellum/types/test_case_error_variable_value.py +7 -3
vellum/types/test_case_function_call_variable_value.py +7 -3
vellum/types/test_case_json_variable_value.py +8 -4
vellum/types/test_case_number_variable_value.py +7 -3
vellum/types/test_case_search_results_variable_value.py +7 -3
vellum/types/test_case_string_variable_value.py +7 -3
vellum/types/test_case_variable_value.py +152 -32
vellum/types/test_suite_run_deployment_release_tag_exec_config.py +7 -3
vellum/types/test_suite_run_deployment_release_tag_exec_config_data.py +7 -3
vellum/types/test_suite_run_deployment_release_tag_exec_config_data_request.py +7 -3
vellum/types/test_suite_run_deployment_release_tag_exec_config_request.py +7 -3
vellum/types/test_suite_run_exec_config.py +57 -12
vellum/types/test_suite_run_exec_config_request.py +61 -12
vellum/types/test_suite_run_execution.py +7 -3
vellum/types/test_suite_run_execution_array_output.py +7 -3
vellum/types/test_suite_run_execution_chat_history_output.py +7 -3
vellum/types/test_suite_run_execution_error_output.py +7 -3
vellum/types/test_suite_run_execution_function_call_output.py +7 -3
vellum/types/test_suite_run_execution_json_output.py +7 -3
vellum/types/test_suite_run_execution_metric_definition.py +7 -3
vellum/types/test_suite_run_execution_metric_result.py +7 -3
vellum/types/test_suite_run_execution_number_output.py +7 -3
vellum/types/test_suite_run_execution_output.py +152 -32
vellum/types/test_suite_run_execution_search_results_output.py +7 -3
vellum/types/test_suite_run_execution_string_output.py +7 -3
vellum/types/test_suite_run_external_exec_config.py +7 -3
vellum/types/test_suite_run_external_exec_config_data.py +7 -3
vellum/types/test_suite_run_external_exec_config_data_request.py +7 -3
vellum/types/test_suite_run_external_exec_config_request.py +7 -3
vellum/types/test_suite_run_metric_error_output.py +7 -3
vellum/types/test_suite_run_metric_number_output.py +7 -3
vellum/types/test_suite_run_metric_output.py +55 -12
vellum/types/test_suite_run_metric_string_output.py +7 -3
vellum/types/test_suite_run_read.py +7 -3
vellum/types/test_suite_run_test_suite.py +7 -3
vellum/types/test_suite_run_workflow_release_tag_exec_config.py +7 -3
vellum/types/test_suite_run_workflow_release_tag_exec_config_data.py +7 -3
vellum/types/test_suite_run_workflow_release_tag_exec_config_data_request.py +7 -3
vellum/types/test_suite_run_workflow_release_tag_exec_config_request.py +7 -3
vellum/types/test_suite_test_case.py +7 -3
vellum/types/test_suite_test_case_bulk_operation_request.py +75 -16
vellum/types/test_suite_test_case_bulk_result.py +74 -16
vellum/types/test_suite_test_case_create_bulk_operation_request.py +7 -3
vellum/types/test_suite_test_case_created_bulk_result.py +7 -3
vellum/types/test_suite_test_case_created_bulk_result_data.py +7 -3
vellum/types/test_suite_test_case_delete_bulk_operation_data_request.py +7 -3
vellum/types/test_suite_test_case_delete_bulk_operation_request.py +7 -3
vellum/types/test_suite_test_case_deleted_bulk_result.py +7 -3
vellum/types/test_suite_test_case_deleted_bulk_result_data.py +7 -3
vellum/types/test_suite_test_case_rejected_bulk_result.py +7 -3
vellum/types/test_suite_test_case_replace_bulk_operation_request.py +7 -3
vellum/types/test_suite_test_case_replaced_bulk_result.py +7 -3
vellum/types/test_suite_test_case_replaced_bulk_result_data.py +7 -3
vellum/types/test_suite_test_case_upsert_bulk_operation_request.py +7 -3
vellum/types/{execute_workflow_error_response.py → tik_token_tokenizer_config.py} +11 -6
vellum/types/{generate_error_response.py → tik_token_tokenizer_config_request.py} +11 -6
vellum/types/token_overlapping_window_chunker_config.py +7 -3
vellum/types/token_overlapping_window_chunker_config_request.py +7 -3
vellum/types/token_overlapping_window_chunking.py +7 -3
vellum/types/token_overlapping_window_chunking_request.py +7 -3
vellum/types/upload_document_response.py +7 -3
vellum/types/upsert_test_suite_test_case_request.py +7 -3
vellum/types/vellum_error.py +7 -3
vellum/types/vellum_error_request.py +7 -3
vellum/types/vellum_image.py +7 -3
vellum/types/vellum_image_request.py +7 -3
vellum/types/vellum_variable.py +7 -3
vellum/types/visibility_enum.py +5 -0
vellum/types/workflow_deployment_read.py +12 -3
vellum/types/workflow_event_error.py +7 -3
vellum/types/workflow_execution_actual_chat_history_request.py +7 -3
vellum/types/workflow_execution_actual_json_request.py +7 -3
vellum/types/workflow_execution_actual_string_request.py +7 -3
vellum/types/workflow_execution_node_result_event.py +7 -3
vellum/types/workflow_execution_workflow_result_event.py +7 -3
vellum/types/workflow_expand_meta_request.py +7 -3
vellum/types/workflow_node_result_data.py +189 -45
vellum/types/workflow_node_result_event.py +101 -20
vellum/types/workflow_output.py +171 -36
vellum/types/workflow_output_array.py +7 -3
vellum/types/workflow_output_chat_history.py +7 -3
vellum/types/workflow_output_error.py +7 -3
vellum/types/workflow_output_function_call.py +7 -3
vellum/types/workflow_output_image.py +7 -3
vellum/types/workflow_output_json.py +7 -3
vellum/types/workflow_output_number.py +7 -3
vellum/types/workflow_output_search_results.py +7 -3
vellum/types/workflow_output_string.py +7 -3
vellum/types/workflow_release_tag_read.py +7 -3
vellum/types/workflow_release_tag_workflow_deployment_history_item.py +7 -3
vellum/types/workflow_request_chat_history_input_request.py +7 -3
vellum/types/workflow_request_input_request.py +72 -16
vellum/types/workflow_request_json_input_request.py +7 -3
vellum/types/workflow_request_number_input_request.py +7 -3
vellum/types/workflow_request_string_input_request.py +7 -3
vellum/types/workflow_result_event.py +7 -3
vellum/types/workflow_result_event_output_data.py +178 -33
vellum/types/workflow_result_event_output_data_array.py +7 -3
vellum/types/workflow_result_event_output_data_chat_history.py +7 -3
vellum/types/workflow_result_event_output_data_error.py +7 -3
vellum/types/workflow_result_event_output_data_function_call.py +7 -3
vellum/types/workflow_result_event_output_data_json.py +7 -3
vellum/types/workflow_result_event_output_data_number.py +7 -3
vellum/types/workflow_result_event_output_data_search_results.py +7 -3
vellum/types/workflow_result_event_output_data_string.py +7 -3
vellum/types/workflow_stream_event.py +43 -8
{vellum_ai-0.7.3.dist-info → vellum_ai-0.7.5.dist-info}/METADATA +13 -1
vellum_ai-0.7.5.dist-info/RECORD +502 -0
vellum/types/array_enum.py +0 -5
vellum/types/chat_history_enum.py +0 -5
vellum/types/create_enum.py +0 -5
vellum/types/created_enum.py +0 -5
vellum/types/delete_enum.py +0 -5
vellum/types/deleted_enum.py +0 -5
vellum/types/error_enum.py +0 -5
vellum/types/function_call_enum.py +0 -5
vellum/types/hkunlp_instructor_xl_enum.py +0 -5
vellum/types/image_enum.py +0 -5
vellum/types/initiated_enum.py +0 -5
vellum/types/intfloat_multilingual_e_5_large_enum.py +0 -5
vellum/types/json_enum.py +0 -5
vellum/types/merge_enum.py +0 -5
vellum/types/metric_enum.py +0 -5
vellum/types/number_enum.py +0 -5
vellum/types/pdf_enum.py +0 -5
vellum/types/reducto_chunker_enum.py +0 -5
vellum/types/rejected_enum.py +0 -5
vellum/types/replace_enum.py +0 -5
vellum/types/replaced_enum.py +0 -5
vellum/types/search_error_response.py +0 -28
vellum/types/search_results_enum.py +0 -5
vellum/types/sentence_chunker_enum.py +0 -5
vellum/types/sentence_transformers_multi_qa_mpnet_base_cos_v_1_enum.py +0 -5
vellum/types/sentence_transformers_multi_qa_mpnet_base_dot_v_1_enum.py +0 -5
vellum/types/streaming_enum.py +0 -5
vellum/types/string_enum.py +0 -5
vellum/types/submit_completion_actuals_error_response.py +0 -25
vellum/types/subworkflow_enum.py +0 -5
vellum/types/test_suite_run_deployment_release_tag_exec_config_type_enum.py +0 -5
vellum/types/test_suite_run_external_exec_config_type_enum.py +0 -5
vellum/types/test_suite_run_metric_error_output_type_enum.py +0 -5
vellum/types/test_suite_run_metric_number_output_type_enum.py +0 -5
vellum/types/test_suite_run_metric_string_output_type_enum.py +0 -5
vellum/types/test_suite_run_workflow_release_tag_exec_config_type_enum.py +0 -5
vellum/types/text_embedding_3_large_enum.py +0 -5
vellum/types/text_embedding_3_small_enum.py +0 -5
vellum/types/text_embedding_ada_002_enum.py +0 -5
vellum/types/token_overlapping_window_chunker_enum.py +0 -5
vellum/types/upload_document_error_response.py +0 -25
vellum/types/upsert_enum.py +0 -5
vellum_ai-0.7.3.dist-info/RECORD +0 -496
{vellum_ai-0.7.3.dist-info → vellum_ai-0.7.5.dist-info}/LICENSE +0 -0
{vellum_ai-0.7.3.dist-info → vellum_ai-0.7.5.dist-info}/WHEEL +0 -0

vellum/resources/deployments/client.py CHANGED Viewed

@@ -1,14 +1,12 @@
 # This file was auto-generated by Fern from our API Definition.
 import typing
-import urllib.parse
 from json.decoder import JSONDecodeError
 from ...core.api_error import ApiError
 from ...core.client_wrapper import AsyncClientWrapper, SyncClientWrapper
 from ...core.jsonable_encoder import jsonable_encoder
 from ...core.pydantic_utilities import pydantic_v1
-from ...core.remove_none_from_dict import remove_none_from_dict
 from ...core.request_options import RequestOptions
 from ...errors.bad_request_error import BadRequestError
 from ...errors.forbidden_error import ForbiddenError
@@ -40,17 +38,32 @@ class DeploymentsClient:
         request_options: typing.Optional[RequestOptions] = None,
     ) -> PaginatedSlimDeploymentReadList:
         """
-        Parameters:
-            - limit: typing.Optional[int]. Number of results to return per page.
+        Used to list all Prompt Deployments.
-            - offset: typing.Optional[int]. The initial index from which to return the results.
+        Parameters
+        ----------
+        limit : typing.Optional[int]
+            Number of results to return per page.
-            - ordering: typing.Optional[str]. Which field to use when ordering the results.
+        offset : typing.Optional[int]
+            The initial index from which to return the results.
-            - status: typing.Optional[DeploymentsListRequestStatus]. status
+        ordering : typing.Optional[str]
+            Which field to use when ordering the results.
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
+        status : typing.Optional[DeploymentsListRequestStatus]
+            status
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
+        Returns
+        -------
+        PaginatedSlimDeploymentReadList
+        Examples
+        --------
         from vellum.client import Vellum
         client = Vellum(
@@ -59,40 +72,15 @@ class DeploymentsClient:
         client.deployments.list()
         """
         _response = self._client_wrapper.httpx_client.request(
+            "v1/deployments",
+            base_url=self._client_wrapper.get_environment().default,
             method="GET",
-            url=urllib.parse.urljoin(f"{self._client_wrapper.get_environment().default}/", "v1/deployments"),
-            params=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        "limit": limit,
-                        "offset": offset,
-                        "ordering": ordering,
-                        "status": status,
-                        **(
-                            request_options.get("additional_query_parameters", {})
-                            if request_options is not None
-                            else {}
-                        ),
-                    }
-                )
-            ),
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            params={"limit": limit, "offset": offset, "ordering": ordering, "status": status},
+            request_options=request_options,
         )
-        if 200 <= _response.status_code < 300:
-            return pydantic_v1.parse_obj_as(PaginatedSlimDeploymentReadList, _response.json())  # type: ignore
         try:
+            if 200 <= _response.status_code < 300:
+                return pydantic_v1.parse_obj_as(PaginatedSlimDeploymentReadList, _response.json())  # type: ignore
             _response_json = _response.json()
         except JSONDecodeError:
             raise ApiError(status_code=_response.status_code, body=_response.text)
@@ -100,13 +88,23 @@ class DeploymentsClient:
     def retrieve(self, id: str, *, request_options: typing.Optional[RequestOptions] = None) -> DeploymentRead:
         """
-        Used to retrieve a deployment given its ID or name.
+        Used to retrieve a Prompt Deployment given its ID or name.
+        Parameters
+        ----------
+        id : str
+            Either the Deployment's ID or its unique name
-        Parameters:
-            - id: str. Either the Deployment's ID or its unique name
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
+        Returns
+        -------
+        DeploymentRead
+        Examples
+        --------
         from vellum.client import Vellum
         client = Vellum(
@@ -117,30 +115,14 @@ class DeploymentsClient:
         )
         """
         _response = self._client_wrapper.httpx_client.request(
+            f"v1/deployments/{jsonable_encoder(id)}",
+            base_url=self._client_wrapper.get_environment().default,
             method="GET",
-            url=urllib.parse.urljoin(
-                f"{self._client_wrapper.get_environment().default}/", f"v1/deployments/{jsonable_encoder(id)}"
-            ),
-            params=jsonable_encoder(
-                request_options.get("additional_query_parameters") if request_options is not None else None
-            ),
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            request_options=request_options,
         )
-        if 200 <= _response.status_code < 300:
-            return pydantic_v1.parse_obj_as(DeploymentRead, _response.json())  # type: ignore
         try:
+            if 200 <= _response.status_code < 300:
+                return pydantic_v1.parse_obj_as(DeploymentRead, _response.json())  # type: ignore
             _response_json = _response.json()
         except JSONDecodeError:
             raise ApiError(status_code=_response.status_code, body=_response.text)
@@ -152,13 +134,24 @@ class DeploymentsClient:
         """
         Retrieve a Deployment Release Tag by tag name, associated with a specified Deployment.
-        Parameters:
-            - id: str. A UUID string identifying this deployment.
+        Parameters
+        ----------
+        id : str
+            A UUID string identifying this deployment.
+        name : str
+            The name of the Release Tag associated with this Deployment that you'd like to retrieve.
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
+        Returns
+        -------
+        DeploymentReleaseTagRead
-            - name: str. The name of the Release Tag associated with this Deployment that you'd like to retrieve.
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
+        Examples
+        --------
         from vellum.client import Vellum
         client = Vellum(
@@ -170,31 +163,14 @@ class DeploymentsClient:
         )
         """
         _response = self._client_wrapper.httpx_client.request(
+            f"v1/deployments/{jsonable_encoder(id)}/release-tags/{jsonable_encoder(name)}",
+            base_url=self._client_wrapper.get_environment().default,
             method="GET",
-            url=urllib.parse.urljoin(
-                f"{self._client_wrapper.get_environment().default}/",
-                f"v1/deployments/{jsonable_encoder(id)}/release-tags/{jsonable_encoder(name)}",
-            ),
-            params=jsonable_encoder(
-                request_options.get("additional_query_parameters") if request_options is not None else None
-            ),
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            request_options=request_options,
         )
-        if 200 <= _response.status_code < 300:
-            return pydantic_v1.parse_obj_as(DeploymentReleaseTagRead, _response.json())  # type: ignore
         try:
+            if 200 <= _response.status_code < 300:
+                return pydantic_v1.parse_obj_as(DeploymentReleaseTagRead, _response.json())  # type: ignore
             _response_json = _response.json()
         except JSONDecodeError:
             raise ApiError(status_code=_response.status_code, body=_response.text)
@@ -211,15 +187,27 @@ class DeploymentsClient:
         """
         Updates an existing Release Tag associated with the specified Deployment.
-        Parameters:
-            - id: str. A UUID string identifying this deployment.
+        Parameters
+        ----------
+        id : str
+            A UUID string identifying this deployment.
-            - name: str. The name of the Release Tag associated with this Deployment that you'd like to update.
+        name : str
+            The name of the Release Tag associated with this Deployment that you'd like to update.
-            - history_item_id: typing.Optional[str]. The ID of the Deployment History Item to tag
+        history_item_id : typing.Optional[str]
+            The ID of the Deployment History Item to tag
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
+        Returns
+        -------
+        DeploymentReleaseTagRead
+        Examples
+        --------
         from vellum.client import Vellum
         client = Vellum(
@@ -230,41 +218,17 @@ class DeploymentsClient:
             name="name",
         )
         """
-        _request: typing.Dict[str, typing.Any] = {}
-        if history_item_id is not OMIT:
-            _request["history_item_id"] = history_item_id
         _response = self._client_wrapper.httpx_client.request(
+            f"v1/deployments/{jsonable_encoder(id)}/release-tags/{jsonable_encoder(name)}",
+            base_url=self._client_wrapper.get_environment().default,
             method="PATCH",
-            url=urllib.parse.urljoin(
-                f"{self._client_wrapper.get_environment().default}/",
-                f"v1/deployments/{jsonable_encoder(id)}/release-tags/{jsonable_encoder(name)}",
-            ),
-            params=jsonable_encoder(
-                request_options.get("additional_query_parameters") if request_options is not None else None
-            ),
-            json=jsonable_encoder(_request)
-            if request_options is None or request_options.get("additional_body_parameters") is None
-            else {
-                **jsonable_encoder(_request),
-                **(jsonable_encoder(remove_none_from_dict(request_options.get("additional_body_parameters", {})))),
-            },
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            json={"history_item_id": history_item_id},
+            request_options=request_options,
+            omit=OMIT,
         )
-        if 200 <= _response.status_code < 300:
-            return pydantic_v1.parse_obj_as(DeploymentReleaseTagRead, _response.json())  # type: ignore
         try:
+            if 200 <= _response.status_code < 300:
+                return pydantic_v1.parse_obj_as(DeploymentReleaseTagRead, _response.json())  # type: ignore
             _response_json = _response.json()
         except JSONDecodeError:
             raise ApiError(status_code=_response.status_code, body=_response.text)
@@ -273,27 +237,51 @@ class DeploymentsClient:
     def retrieve_provider_payload(
         self,
         *,
+        inputs: typing.Sequence[PromptDeploymentInputRequest],
         deployment_id: typing.Optional[str] = OMIT,
         deployment_name: typing.Optional[str] = OMIT,
-        inputs: typing.Sequence[PromptDeploymentInputRequest],
         release_tag: typing.Optional[str] = OMIT,
         expand_meta: typing.Optional[CompilePromptDeploymentExpandMetaRequest] = OMIT,
         request_options: typing.Optional[RequestOptions] = None,
     ) -> DeploymentProviderPayloadResponse:
         """
-        Parameters:
-            - deployment_id: typing.Optional[str]. The ID of the deployment. Must provide either this or deployment_name.
+        Given a set of input variable values, compile the exact payload that Vellum would send to the configured model provider
+        for execution if the execute-prompt endpoint had been invoked. Note that this endpoint does not actually execute the
+        prompt or make an API call to the model provider.
+        This endpoint is useful if you don't want to proxy LLM provider requests through Vellum and prefer to send them directly
+        to the provider yourself. Note that no guarantees are made on the format of this API's response schema, other than
+        that it will be a valid payload for the configured model provider. It's not recommended that you try to parse or
+        derive meaning from the response body and instead, should simply pass it directly to the model provider as is.
+        We encourage you to seek advise from Vellum Support before integrating with this API for production use.
+        Parameters
+        ----------
+        inputs : typing.Sequence[PromptDeploymentInputRequest]
+            The list of inputs defined in the Prompt's deployment with their corresponding values.
+        deployment_id : typing.Optional[str]
+            The ID of the deployment. Must provide either this or deployment_name.
-            - deployment_name: typing.Optional[str]. The name of the deployment. Must provide either this or deployment_id.
+        deployment_name : typing.Optional[str]
+            The name of the deployment. Must provide either this or deployment_id.
-            - inputs: typing.Sequence[PromptDeploymentInputRequest]. The list of inputs defined in the Prompt's deployment with their corresponding values.
+        release_tag : typing.Optional[str]
+            Optionally specify a release tag if you want to pin to a specific release of the Workflow Deployment
-            - release_tag: typing.Optional[str]. Optionally specify a release tag if you want to pin to a specific release of the Workflow Deployment
+        expand_meta : typing.Optional[CompilePromptDeploymentExpandMetaRequest]
-            - expand_meta: typing.Optional[CompilePromptDeploymentExpandMetaRequest].
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
+        Returns
+        -------
+        DeploymentProviderPayloadResponse
+        Examples
+        --------
         from vellum.client import Vellum
         client = Vellum(
@@ -303,54 +291,31 @@ class DeploymentsClient:
             inputs=[],
         )
         """
-        _request: typing.Dict[str, typing.Any] = {"inputs": inputs}
-        if deployment_id is not OMIT:
-            _request["deployment_id"] = deployment_id
-        if deployment_name is not OMIT:
-            _request["deployment_name"] = deployment_name
-        if release_tag is not OMIT:
-            _request["release_tag"] = release_tag
-        if expand_meta is not OMIT:
-            _request["expand_meta"] = expand_meta
         _response = self._client_wrapper.httpx_client.request(
+            "v1/deployments/provider-payload",
+            base_url=self._client_wrapper.get_environment().default,
             method="POST",
-            url=urllib.parse.urljoin(
-                f"{self._client_wrapper.get_environment().default}/", "v1/deployments/provider-payload"
-            ),
-            params=jsonable_encoder(
-                request_options.get("additional_query_parameters") if request_options is not None else None
-            ),
-            json=jsonable_encoder(_request)
-            if request_options is None or request_options.get("additional_body_parameters") is None
-            else {
-                **jsonable_encoder(_request),
-                **(jsonable_encoder(remove_none_from_dict(request_options.get("additional_body_parameters", {})))),
+            json={
+                "deployment_id": deployment_id,
+                "deployment_name": deployment_name,
+                "inputs": inputs,
+                "release_tag": release_tag,
+                "expand_meta": expand_meta,
             },
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            request_options=request_options,
+            omit=OMIT,
         )
-        if 200 <= _response.status_code < 300:
-            return pydantic_v1.parse_obj_as(DeploymentProviderPayloadResponse, _response.json())  # type: ignore
-        if _response.status_code == 400:
-            raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 403:
-            raise ForbiddenError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 404:
-            raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 500:
-            raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
         try:
+            if 200 <= _response.status_code < 300:
+                return pydantic_v1.parse_obj_as(DeploymentProviderPayloadResponse, _response.json())  # type: ignore
+            if _response.status_code == 400:
+                raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 403:
+                raise ForbiddenError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 404:
+                raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 500:
+                raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
             _response_json = _response.json()
         except JSONDecodeError:
             raise ApiError(status_code=_response.status_code, body=_response.text)
@@ -371,59 +336,57 @@ class AsyncDeploymentsClient:
         request_options: typing.Optional[RequestOptions] = None,
     ) -> PaginatedSlimDeploymentReadList:
         """
-        Parameters:
-            - limit: typing.Optional[int]. Number of results to return per page.
+        Used to list all Prompt Deployments.
+        Parameters
+        ----------
+        limit : typing.Optional[int]
+            Number of results to return per page.
+        offset : typing.Optional[int]
+            The initial index from which to return the results.
+        ordering : typing.Optional[str]
+            Which field to use when ordering the results.
-            - offset: typing.Optional[int]. The initial index from which to return the results.
+        status : typing.Optional[DeploymentsListRequestStatus]
+            status
-            - ordering: typing.Optional[str]. Which field to use when ordering the results.
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
-            - status: typing.Optional[DeploymentsListRequestStatus]. status
+        Returns
+        -------
+        PaginatedSlimDeploymentReadList
+        Examples
+        --------
+        import asyncio
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
         from vellum.client import AsyncVellum
         client = AsyncVellum(
             api_key="YOUR_API_KEY",
         )
-        await client.deployments.list()
+        async def main() -> None:
+            await client.deployments.list()
+        asyncio.run(main())
         """
         _response = await self._client_wrapper.httpx_client.request(
+            "v1/deployments",
+            base_url=self._client_wrapper.get_environment().default,
             method="GET",
-            url=urllib.parse.urljoin(f"{self._client_wrapper.get_environment().default}/", "v1/deployments"),
-            params=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        "limit": limit,
-                        "offset": offset,
-                        "ordering": ordering,
-                        "status": status,
-                        **(
-                            request_options.get("additional_query_parameters", {})
-                            if request_options is not None
-                            else {}
-                        ),
-                    }
-                )
-            ),
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            params={"limit": limit, "offset": offset, "ordering": ordering, "status": status},
+            request_options=request_options,
         )
-        if 200 <= _response.status_code < 300:
-            return pydantic_v1.parse_obj_as(PaginatedSlimDeploymentReadList, _response.json())  # type: ignore
         try:
+            if 200 <= _response.status_code < 300:
+                return pydantic_v1.parse_obj_as(PaginatedSlimDeploymentReadList, _response.json())  # type: ignore
             _response_json = _response.json()
         except JSONDecodeError:
             raise ApiError(status_code=_response.status_code, body=_response.text)
@@ -431,47 +394,49 @@ class AsyncDeploymentsClient:
     async def retrieve(self, id: str, *, request_options: typing.Optional[RequestOptions] = None) -> DeploymentRead:
         """
-        Used to retrieve a deployment given its ID or name.
+        Used to retrieve a Prompt Deployment given its ID or name.
+        Parameters
+        ----------
+        id : str
+            Either the Deployment's ID or its unique name
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
+        Returns
+        -------
+        DeploymentRead
-        Parameters:
-            - id: str. Either the Deployment's ID or its unique name
+        Examples
+        --------
+        import asyncio
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
         from vellum.client import AsyncVellum
         client = AsyncVellum(
             api_key="YOUR_API_KEY",
         )
-        await client.deployments.retrieve(
-            id="id",
-        )
+        async def main() -> None:
+            await client.deployments.retrieve(
+                id="id",
+            )
+        asyncio.run(main())
         """
         _response = await self._client_wrapper.httpx_client.request(
+            f"v1/deployments/{jsonable_encoder(id)}",
+            base_url=self._client_wrapper.get_environment().default,
             method="GET",
-            url=urllib.parse.urljoin(
-                f"{self._client_wrapper.get_environment().default}/", f"v1/deployments/{jsonable_encoder(id)}"
-            ),
-            params=jsonable_encoder(
-                request_options.get("additional_query_parameters") if request_options is not None else None
-            ),
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            request_options=request_options,
         )
-        if 200 <= _response.status_code < 300:
-            return pydantic_v1.parse_obj_as(DeploymentRead, _response.json())  # type: ignore
         try:
+            if 200 <= _response.status_code < 300:
+                return pydantic_v1.parse_obj_as(DeploymentRead, _response.json())  # type: ignore
             _response_json = _response.json()
         except JSONDecodeError:
             raise ApiError(status_code=_response.status_code, body=_response.text)
@@ -483,49 +448,51 @@ class AsyncDeploymentsClient:
         """
         Retrieve a Deployment Release Tag by tag name, associated with a specified Deployment.
-        Parameters:
-            - id: str. A UUID string identifying this deployment.
+        Parameters
+        ----------
+        id : str
+            A UUID string identifying this deployment.
+        name : str
+            The name of the Release Tag associated with this Deployment that you'd like to retrieve.
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
+        Returns
+        -------
+        DeploymentReleaseTagRead
-            - name: str. The name of the Release Tag associated with this Deployment that you'd like to retrieve.
+        Examples
+        --------
+        import asyncio
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
         from vellum.client import AsyncVellum
         client = AsyncVellum(
             api_key="YOUR_API_KEY",
         )
-        await client.deployments.retrieve_deployment_release_tag(
-            id="id",
-            name="name",
-        )
+        async def main() -> None:
+            await client.deployments.retrieve_deployment_release_tag(
+                id="id",
+                name="name",
+            )
+        asyncio.run(main())
         """
         _response = await self._client_wrapper.httpx_client.request(
+            f"v1/deployments/{jsonable_encoder(id)}/release-tags/{jsonable_encoder(name)}",
+            base_url=self._client_wrapper.get_environment().default,
             method="GET",
-            url=urllib.parse.urljoin(
-                f"{self._client_wrapper.get_environment().default}/",
-                f"v1/deployments/{jsonable_encoder(id)}/release-tags/{jsonable_encoder(name)}",
-            ),
-            params=jsonable_encoder(
-                request_options.get("additional_query_parameters") if request_options is not None else None
-            ),
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            request_options=request_options,
         )
-        if 200 <= _response.status_code < 300:
-            return pydantic_v1.parse_obj_as(DeploymentReleaseTagRead, _response.json())  # type: ignore
         try:
+            if 200 <= _response.status_code < 300:
+                return pydantic_v1.parse_obj_as(DeploymentReleaseTagRead, _response.json())  # type: ignore
             _response_json = _response.json()
         except JSONDecodeError:
             raise ApiError(status_code=_response.status_code, body=_response.text)
@@ -542,60 +509,56 @@ class AsyncDeploymentsClient:
         """
         Updates an existing Release Tag associated with the specified Deployment.
-        Parameters:
-            - id: str. A UUID string identifying this deployment.
+        Parameters
+        ----------
+        id : str
+            A UUID string identifying this deployment.
+        name : str
+            The name of the Release Tag associated with this Deployment that you'd like to update.
+        history_item_id : typing.Optional[str]
+            The ID of the Deployment History Item to tag
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
-            - name: str. The name of the Release Tag associated with this Deployment that you'd like to update.
+        Returns
+        -------
+        DeploymentReleaseTagRead
-            - history_item_id: typing.Optional[str]. The ID of the Deployment History Item to tag
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
+        Examples
+        --------
+        import asyncio
         from vellum.client import AsyncVellum
         client = AsyncVellum(
             api_key="YOUR_API_KEY",
         )
-        await client.deployments.update_deployment_release_tag(
-            id="id",
-            name="name",
-        )
+        async def main() -> None:
+            await client.deployments.update_deployment_release_tag(
+                id="id",
+                name="name",
+            )
+        asyncio.run(main())
         """
-        _request: typing.Dict[str, typing.Any] = {}
-        if history_item_id is not OMIT:
-            _request["history_item_id"] = history_item_id
         _response = await self._client_wrapper.httpx_client.request(
+            f"v1/deployments/{jsonable_encoder(id)}/release-tags/{jsonable_encoder(name)}",
+            base_url=self._client_wrapper.get_environment().default,
             method="PATCH",
-            url=urllib.parse.urljoin(
-                f"{self._client_wrapper.get_environment().default}/",
-                f"v1/deployments/{jsonable_encoder(id)}/release-tags/{jsonable_encoder(name)}",
-            ),
-            params=jsonable_encoder(
-                request_options.get("additional_query_parameters") if request_options is not None else None
-            ),
-            json=jsonable_encoder(_request)
-            if request_options is None or request_options.get("additional_body_parameters") is None
-            else {
-                **jsonable_encoder(_request),
-                **(jsonable_encoder(remove_none_from_dict(request_options.get("additional_body_parameters", {})))),
-            },
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            json={"history_item_id": history_item_id},
+            request_options=request_options,
+            omit=OMIT,
         )
-        if 200 <= _response.status_code < 300:
-            return pydantic_v1.parse_obj_as(DeploymentReleaseTagRead, _response.json())  # type: ignore
         try:
+            if 200 <= _response.status_code < 300:
+                return pydantic_v1.parse_obj_as(DeploymentReleaseTagRead, _response.json())  # type: ignore
             _response_json = _response.json()
         except JSONDecodeError:
             raise ApiError(status_code=_response.status_code, body=_response.text)
@@ -604,84 +567,93 @@ class AsyncDeploymentsClient:
     async def retrieve_provider_payload(
         self,
         *,
+        inputs: typing.Sequence[PromptDeploymentInputRequest],
         deployment_id: typing.Optional[str] = OMIT,
         deployment_name: typing.Optional[str] = OMIT,
-        inputs: typing.Sequence[PromptDeploymentInputRequest],
         release_tag: typing.Optional[str] = OMIT,
         expand_meta: typing.Optional[CompilePromptDeploymentExpandMetaRequest] = OMIT,
         request_options: typing.Optional[RequestOptions] = None,
     ) -> DeploymentProviderPayloadResponse:
         """
-        Parameters:
-            - deployment_id: typing.Optional[str]. The ID of the deployment. Must provide either this or deployment_name.
+        Given a set of input variable values, compile the exact payload that Vellum would send to the configured model provider
+        for execution if the execute-prompt endpoint had been invoked. Note that this endpoint does not actually execute the
+        prompt or make an API call to the model provider.
+        This endpoint is useful if you don't want to proxy LLM provider requests through Vellum and prefer to send them directly
+        to the provider yourself. Note that no guarantees are made on the format of this API's response schema, other than
+        that it will be a valid payload for the configured model provider. It's not recommended that you try to parse or
+        derive meaning from the response body and instead, should simply pass it directly to the model provider as is.
+        We encourage you to seek advise from Vellum Support before integrating with this API for production use.
+        Parameters
+        ----------
+        inputs : typing.Sequence[PromptDeploymentInputRequest]
+            The list of inputs defined in the Prompt's deployment with their corresponding values.
+        deployment_id : typing.Optional[str]
+            The ID of the deployment. Must provide either this or deployment_name.
-            - deployment_name: typing.Optional[str]. The name of the deployment. Must provide either this or deployment_id.
+        deployment_name : typing.Optional[str]
+            The name of the deployment. Must provide either this or deployment_id.
-            - inputs: typing.Sequence[PromptDeploymentInputRequest]. The list of inputs defined in the Prompt's deployment with their corresponding values.
+        release_tag : typing.Optional[str]
+            Optionally specify a release tag if you want to pin to a specific release of the Workflow Deployment
-            - release_tag: typing.Optional[str]. Optionally specify a release tag if you want to pin to a specific release of the Workflow Deployment
+        expand_meta : typing.Optional[CompilePromptDeploymentExpandMetaRequest]
-            - expand_meta: typing.Optional[CompilePromptDeploymentExpandMetaRequest].
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
+        Returns
+        -------
+        DeploymentProviderPayloadResponse
+        Examples
+        --------
+        import asyncio
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
         from vellum.client import AsyncVellum
         client = AsyncVellum(
             api_key="YOUR_API_KEY",
         )
-        await client.deployments.retrieve_provider_payload(
-            inputs=[],
-        )
+        async def main() -> None:
+            await client.deployments.retrieve_provider_payload(
+                inputs=[],
+            )
+        asyncio.run(main())
         """
-        _request: typing.Dict[str, typing.Any] = {"inputs": inputs}
-        if deployment_id is not OMIT:
-            _request["deployment_id"] = deployment_id
-        if deployment_name is not OMIT:
-            _request["deployment_name"] = deployment_name
-        if release_tag is not OMIT:
-            _request["release_tag"] = release_tag
-        if expand_meta is not OMIT:
-            _request["expand_meta"] = expand_meta
         _response = await self._client_wrapper.httpx_client.request(
+            "v1/deployments/provider-payload",
+            base_url=self._client_wrapper.get_environment().default,
             method="POST",
-            url=urllib.parse.urljoin(
-                f"{self._client_wrapper.get_environment().default}/", "v1/deployments/provider-payload"
-            ),
-            params=jsonable_encoder(
-                request_options.get("additional_query_parameters") if request_options is not None else None
-            ),
-            json=jsonable_encoder(_request)
-            if request_options is None or request_options.get("additional_body_parameters") is None
-            else {
-                **jsonable_encoder(_request),
-                **(jsonable_encoder(remove_none_from_dict(request_options.get("additional_body_parameters", {})))),
+            json={
+                "deployment_id": deployment_id,
+                "deployment_name": deployment_name,
+                "inputs": inputs,
+                "release_tag": release_tag,
+                "expand_meta": expand_meta,
             },
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            request_options=request_options,
+            omit=OMIT,
         )
-        if 200 <= _response.status_code < 300:
-            return pydantic_v1.parse_obj_as(DeploymentProviderPayloadResponse, _response.json())  # type: ignore
-        if _response.status_code == 400:
-            raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 403:
-            raise ForbiddenError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 404:
-            raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 500:
-            raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
         try:
+            if 200 <= _response.status_code < 300:
+                return pydantic_v1.parse_obj_as(DeploymentProviderPayloadResponse, _response.json())  # type: ignore
+            if _response.status_code == 400:
+                raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 403:
+                raise ForbiddenError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 404:
+                raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 500:
+                raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
             _response_json = _response.json()
         except JSONDecodeError:
             raise ApiError(status_code=_response.status_code, body=_response.text)

vellum-ai 0.7.3__py3-none-any.whl → 0.7.5__py3-none-any.whl

vellum-ai 0.7.3py3-none-any.whl → 0.7.5py3-none-any.whl