PyPI - vellum-ai - Versions diffs - 0.7.3__py3-none-any.whl → 0.7.5__py3-none-any.whl - Mend

vellum-ai 0.7.3__py3-none-any.whl → 0.7.5__py3-none-any.whl

Files changed (483)

vellum/__init__.py +142 -94
vellum/client.py +1051 -1097
vellum/core/__init__.py +4 -1
vellum/core/client_wrapper.py +7 -3
vellum/core/http_client.py +365 -20
vellum/core/jsonable_encoder.py +3 -0
vellum/core/pydantic_utilities.py +16 -0
vellum/core/query_encoder.py +33 -0
vellum/core/remove_none_from_dict.py +2 -2
vellum/core/request_options.py +2 -2
vellum/resources/__init__.py +2 -0
vellum/resources/deployments/client.py +349 -377
vellum/resources/document_indexes/client.py +542 -610
vellum/resources/documents/client.py +327 -399
vellum/resources/folder_entities/client.py +56 -72
vellum/{types/map_enum.py → resources/ml_models/__init__.py} +0 -3
vellum/resources/ml_models/client.py +837 -0
vellum/resources/sandboxes/client.py +204 -242
vellum/resources/test_suite_runs/client.py +183 -213
vellum/resources/test_suites/client.py +307 -311
vellum/resources/workflow_deployments/client.py +230 -268
vellum/resources/workflow_sandboxes/client.py +82 -96
vellum/terraform/_jsii/vellum-ai_vellum@0.0.0.jsii.tgz +0 -0
vellum/terraform/data_vellum_document_index/__init__.py +10 -10
vellum/terraform/document_index/__init__.py +17 -17
vellum/terraform/provider/__init__.py +57 -12
vellum/terraform/versions.json +1 -1
vellum/types/__init__.py +148 -96
vellum/types/api_node_result.py +7 -3
vellum/types/api_node_result_data.py +7 -3
vellum/types/array_chat_message_content.py +7 -3
vellum/types/array_chat_message_content_item.py +53 -12
vellum/types/array_chat_message_content_item_request.py +53 -12
vellum/types/array_chat_message_content_request.py +7 -3
vellum/types/array_parameter_config.py +50 -0
vellum/types/array_parameter_config_request.py +50 -0
vellum/types/array_variable_value_item.py +102 -24
vellum/types/array_vellum_value_item.py +102 -24
vellum/types/array_vellum_value_item_request.py +102 -24
vellum/types/basic_vectorizer_intfloat_multilingual_e_5_large.py +7 -3
vellum/types/basic_vectorizer_intfloat_multilingual_e_5_large_request.py +7 -3
vellum/types/basic_vectorizer_sentence_transformers_multi_qa_mpnet_base_cos_v_1.py +7 -3
vellum/types/basic_vectorizer_sentence_transformers_multi_qa_mpnet_base_cos_v_1_request.py +7 -3
vellum/types/basic_vectorizer_sentence_transformers_multi_qa_mpnet_base_dot_v_1.py +7 -3
vellum/types/basic_vectorizer_sentence_transformers_multi_qa_mpnet_base_dot_v_1_request.py +7 -3
vellum/types/boolean_parameter_config.py +35 -0
vellum/types/boolean_parameter_config_request.py +35 -0
vellum/types/chat_history_input_request.py +7 -3
vellum/types/chat_message.py +7 -3
vellum/types/chat_message_content.py +70 -16
vellum/types/chat_message_content_request.py +70 -16
vellum/types/chat_message_request.py +7 -3
vellum/types/code_execution_node_array_result.py +7 -3
vellum/types/code_execution_node_chat_history_result.py +7 -3
vellum/types/code_execution_node_error_result.py +7 -3
vellum/types/code_execution_node_function_call_result.py +7 -3
vellum/types/code_execution_node_json_result.py +7 -3
vellum/types/code_execution_node_number_result.py +7 -3
vellum/types/code_execution_node_result.py +7 -3
vellum/types/code_execution_node_result_data.py +7 -3
vellum/types/code_execution_node_result_output.py +144 -32
vellum/types/code_execution_node_search_results_result.py +7 -3
vellum/types/code_execution_node_string_result.py +7 -3
vellum/types/compile_prompt_deployment_expand_meta_request.py +7 -3
vellum/types/compile_prompt_meta.py +7 -3
vellum/types/conditional_node_result.py +7 -3
vellum/types/conditional_node_result_data.py +7 -3
vellum/types/const_parameter_config.py +35 -0
vellum/types/const_parameter_config_request.py +35 -0
vellum/types/create_test_suite_test_case_request.py +7 -3
vellum/types/deployment_provider_payload_response.py +7 -3
vellum/types/deployment_read.py +12 -3
vellum/types/deployment_release_tag_deployment_history_item.py +7 -3
vellum/types/deployment_release_tag_read.py +7 -3
vellum/types/document_document_to_document_index.py +7 -3
vellum/types/document_index_chunking.py +54 -12
vellum/types/document_index_chunking_request.py +54 -12
vellum/types/document_index_indexing_config.py +7 -3
vellum/types/document_index_indexing_config_request.py +7 -3
vellum/types/document_index_read.py +7 -3
vellum/types/document_read.py +7 -3
vellum/types/enriched_normalized_completion.py +7 -3
vellum/types/error_variable_value.py +7 -3
vellum/types/error_vellum_value.py +7 -3
vellum/types/error_vellum_value_request.py +7 -3
vellum/types/execute_prompt_event.py +82 -16
vellum/types/execute_prompt_response.py +44 -8
vellum/types/execute_workflow_response.py +7 -3
vellum/types/execute_workflow_workflow_result_event.py +41 -8
vellum/types/execution_array_vellum_value.py +7 -3
vellum/types/execution_chat_history_vellum_value.py +7 -3
vellum/types/execution_error_vellum_value.py +7 -3
vellum/types/execution_function_call_vellum_value.py +7 -3
vellum/types/execution_json_vellum_value.py +7 -3
vellum/types/execution_number_vellum_value.py +7 -3
vellum/types/execution_search_results_vellum_value.py +7 -3
vellum/types/execution_string_vellum_value.py +7 -3
vellum/types/execution_vellum_value.py +152 -32
vellum/types/external_test_case_execution.py +7 -3
vellum/types/external_test_case_execution_request.py +7 -3
vellum/types/fulfilled_execute_prompt_event.py +7 -3
vellum/types/fulfilled_execute_prompt_response.py +7 -3
vellum/types/fulfilled_execute_workflow_workflow_result_event.py +7 -3
vellum/types/fulfilled_prompt_execution_meta.py +7 -3
vellum/types/fulfilled_workflow_node_result_event.py +7 -3
vellum/types/function_call.py +7 -3
vellum/types/function_call_chat_message_content.py +7 -3
vellum/types/function_call_chat_message_content_request.py +7 -3
vellum/types/function_call_chat_message_content_value.py +7 -3
vellum/types/function_call_chat_message_content_value_request.py +7 -3
vellum/types/function_call_request.py +7 -3
vellum/types/function_call_variable_value.py +7 -3
vellum/types/function_call_vellum_value.py +7 -3
vellum/types/function_call_vellum_value_request.py +7 -3
vellum/types/generate_options_request.py +7 -3
vellum/types/generate_request.py +7 -3
vellum/types/generate_result.py +7 -3
vellum/types/generate_result_data.py +7 -3
vellum/types/generate_result_error.py +7 -3
vellum/types/generate_stream_response.py +7 -3
vellum/types/generate_stream_result.py +7 -3
vellum/types/generate_stream_result_data.py +7 -3
vellum/types/hkunlp_instructor_xl_vectorizer.py +7 -3
vellum/types/hkunlp_instructor_xl_vectorizer_request.py +7 -3
vellum/types/hosted_by_enum.py +26 -0
vellum/types/hugging_face_tokenizer_config.py +34 -0
vellum/types/hugging_face_tokenizer_config_request.py +34 -0
vellum/types/image_chat_message_content.py +7 -3
vellum/types/image_chat_message_content_request.py +7 -3
vellum/types/image_variable_value.py +7 -3
vellum/types/image_vellum_value.py +7 -3
vellum/types/image_vellum_value_request.py +7 -3
vellum/types/indexing_config_vectorizer.py +117 -36
vellum/types/indexing_config_vectorizer_request.py +117 -36
vellum/types/initiated_execute_prompt_event.py +7 -3
vellum/types/initiated_prompt_execution_meta.py +7 -3
vellum/types/initiated_workflow_node_result_event.py +7 -3
vellum/types/instructor_vectorizer_config.py +7 -3
vellum/types/instructor_vectorizer_config_request.py +7 -3
vellum/types/integer_parameter_config.py +39 -0
vellum/types/integer_parameter_config_request.py +39 -0
vellum/types/json_input_request.py +7 -3
vellum/types/json_variable_value.py +7 -3
vellum/types/json_vellum_value.py +7 -3
vellum/types/json_vellum_value_request.py +7 -3
vellum/types/map_node_result.py +7 -3
vellum/types/map_node_result_data.py +7 -3
vellum/types/merge_node_result.py +7 -3
vellum/types/merge_node_result_data.py +7 -3
vellum/types/metadata_filter_config_request.py +7 -3
vellum/types/metadata_filter_rule_request.py +7 -3
vellum/types/metric_node_result.py +7 -3
vellum/types/{execute_workflow_stream_error_response.py → ml_model_build_config.py} +9 -8
vellum/types/{execute_prompt_api_error_response.py → ml_model_build_config_request.py} +9 -8
vellum/types/ml_model_developer.py +27 -0
vellum/types/ml_model_developer_enum_value_label.py +31 -0
vellum/types/ml_model_display_config_labelled.py +33 -0
vellum/types/ml_model_display_config_request.py +33 -0
vellum/types/ml_model_display_tag.py +7 -0
vellum/types/ml_model_display_tag_enum_value_label.py +31 -0
vellum/types/ml_model_exec_config.py +40 -0
vellum/types/ml_model_exec_config_request.py +40 -0
vellum/types/ml_model_family.py +29 -0
vellum/types/ml_model_family_enum_value_label.py +31 -0
vellum/types/ml_model_feature.py +18 -0
vellum/types/ml_model_parameter_config.py +42 -0
vellum/types/ml_model_parameter_config_request.py +42 -0
vellum/types/ml_model_read.py +108 -0
vellum/types/ml_model_request_authorization_config.py +30 -0
vellum/types/ml_model_request_authorization_config_request.py +30 -0
vellum/types/ml_model_request_authorization_config_type_enum.py +5 -0
vellum/types/ml_model_request_config.py +32 -0
vellum/types/ml_model_request_config_request.py +32 -0
vellum/types/ml_model_response_config.py +31 -0
vellum/types/ml_model_response_config_request.py +31 -0
vellum/types/ml_model_tokenizer_config.py +59 -0
vellum/types/ml_model_tokenizer_config_request.py +61 -0
vellum/types/ml_model_usage.py +7 -3
vellum/types/named_scenario_input_chat_history_variable_value_request.py +7 -3
vellum/types/named_scenario_input_request.py +38 -8
vellum/types/named_scenario_input_string_variable_value_request.py +7 -3
vellum/types/named_test_case_array_variable_value.py +7 -3
vellum/types/named_test_case_array_variable_value_request.py +7 -3
vellum/types/named_test_case_chat_history_variable_value.py +7 -3
vellum/types/named_test_case_chat_history_variable_value_request.py +7 -3
vellum/types/named_test_case_error_variable_value.py +7 -3
vellum/types/named_test_case_error_variable_value_request.py +7 -3
vellum/types/named_test_case_function_call_variable_value.py +7 -3
vellum/types/named_test_case_function_call_variable_value_request.py +7 -3
vellum/types/named_test_case_json_variable_value.py +7 -3
vellum/types/named_test_case_json_variable_value_request.py +7 -3
vellum/types/named_test_case_number_variable_value.py +7 -3
vellum/types/named_test_case_number_variable_value_request.py +7 -3
vellum/types/named_test_case_search_results_variable_value.py +7 -3
vellum/types/named_test_case_search_results_variable_value_request.py +7 -3
vellum/types/named_test_case_string_variable_value.py +7 -3
vellum/types/named_test_case_string_variable_value_request.py +7 -3
vellum/types/named_test_case_variable_value.py +144 -32
vellum/types/named_test_case_variable_value_request.py +144 -32
vellum/types/node_input_compiled_array_value.py +7 -3
vellum/types/node_input_compiled_chat_history_value.py +7 -3
vellum/types/node_input_compiled_error_value.py +7 -3
vellum/types/node_input_compiled_function_call.py +7 -3
vellum/types/node_input_compiled_json_value.py +7 -3
vellum/types/node_input_compiled_number_value.py +7 -3
vellum/types/node_input_compiled_search_results_value.py +7 -3
vellum/types/node_input_compiled_string_value.py +7 -3
vellum/types/node_input_variable_compiled_value.py +152 -32
vellum/types/node_output_compiled_array_value.py +7 -3
vellum/types/node_output_compiled_chat_history_value.py +7 -3
vellum/types/node_output_compiled_error_value.py +7 -3
vellum/types/node_output_compiled_function_call_value.py +7 -3
vellum/types/node_output_compiled_json_value.py +7 -3
vellum/types/node_output_compiled_number_value.py +7 -3
vellum/types/node_output_compiled_search_results_value.py +7 -3
vellum/types/node_output_compiled_string_value.py +7 -3
vellum/types/node_output_compiled_value.py +153 -32
vellum/types/normalized_log_probs.py +7 -3
vellum/types/normalized_token_log_probs.py +7 -3
vellum/types/number_parameter_config.py +40 -0
vellum/types/number_parameter_config_request.py +40 -0
vellum/types/number_variable_value.py +7 -3
vellum/types/number_vellum_value.py +7 -3
vellum/types/number_vellum_value_request.py +7 -3
vellum/types/object_parameter_config.py +49 -0
vellum/types/object_parameter_config_request.py +49 -0
vellum/types/one_of_parameter_config.py +44 -0
vellum/types/one_of_parameter_config_request.py +44 -0
vellum/types/open_ai_vectorizer_config.py +7 -3
vellum/types/open_ai_vectorizer_config_request.py +7 -3
vellum/types/open_ai_vectorizer_text_embedding_3_large.py +7 -3
vellum/types/open_ai_vectorizer_text_embedding_3_large_request.py +7 -3
vellum/types/open_ai_vectorizer_text_embedding_3_small.py +7 -3
vellum/types/open_ai_vectorizer_text_embedding_3_small_request.py +7 -3
vellum/types/open_ai_vectorizer_text_embedding_ada_002.py +7 -3
vellum/types/open_ai_vectorizer_text_embedding_ada_002_request.py +7 -3
vellum/types/paginated_document_index_read_list.py +7 -3
vellum/types/paginated_ml_model_read_list.py +33 -0
vellum/types/paginated_slim_deployment_read_list.py +7 -3
vellum/types/paginated_slim_document_list.py +7 -3
vellum/types/paginated_slim_workflow_deployment_list.py +7 -3
vellum/types/paginated_test_suite_run_execution_list.py +7 -3
vellum/types/paginated_test_suite_test_case_list.py +7 -3
vellum/types/parameter_config.py +251 -0
vellum/types/parameter_config_request.py +251 -0
vellum/types/pdf_search_result_meta_source.py +7 -3
vellum/types/pdf_search_result_meta_source_request.py +7 -3
vellum/types/prompt_deployment_expand_meta_request_request.py +7 -3
vellum/types/prompt_deployment_input_request.py +55 -12
vellum/types/prompt_execution_meta.py +7 -3
vellum/types/prompt_node_execution_meta.py +7 -3
vellum/types/prompt_node_result.py +7 -3
vellum/types/prompt_node_result_data.py +7 -3
vellum/types/prompt_output.py +69 -16
vellum/types/raw_prompt_execution_overrides_request.py +7 -3
vellum/types/reducto_chunker_config.py +7 -3
vellum/types/reducto_chunker_config_request.py +7 -3
vellum/types/reducto_chunking.py +7 -3
vellum/types/reducto_chunking_request.py +7 -3
vellum/types/rejected_execute_prompt_event.py +7 -3
vellum/types/rejected_execute_prompt_response.py +7 -3
vellum/types/rejected_execute_workflow_workflow_result_event.py +7 -3
vellum/types/rejected_prompt_execution_meta.py +7 -3
vellum/types/rejected_workflow_node_result_event.py +7 -3
vellum/types/replace_test_suite_test_case_request.py +7 -3
vellum/types/sandbox_scenario.py +7 -3
vellum/types/scenario_input.py +38 -8
vellum/types/scenario_input_chat_history_variable_value.py +7 -3
vellum/types/scenario_input_string_variable_value.py +7 -3
vellum/types/search_filters_request.py +7 -3
vellum/types/search_node_result.py +7 -3
vellum/types/search_node_result_data.py +7 -3
vellum/types/search_request_options_request.py +7 -3
vellum/types/search_response.py +7 -3
vellum/types/search_result.py +7 -3
vellum/types/search_result_document.py +7 -3
vellum/types/search_result_document_request.py +7 -3
vellum/types/search_result_merging_request.py +7 -3
vellum/types/search_result_meta.py +7 -3
vellum/types/search_result_meta_request.py +7 -3
vellum/types/search_result_meta_source.py +21 -5
vellum/types/search_result_meta_source_request.py +21 -5
vellum/types/search_result_request.py +7 -3
vellum/types/search_weights_request.py +7 -3
vellum/types/sentence_chunker_config.py +7 -3
vellum/types/sentence_chunker_config_request.py +7 -3
vellum/types/sentence_chunking.py +7 -3
vellum/types/sentence_chunking_request.py +7 -3
vellum/types/slim_deployment_read.py +11 -3
vellum/types/slim_document.py +7 -3
vellum/types/slim_workflow_deployment.py +12 -3
vellum/types/streaming_execute_prompt_event.py +7 -3
vellum/types/streaming_prompt_execution_meta.py +7 -3
vellum/types/streaming_workflow_node_result_event.py +7 -3
vellum/types/string_chat_message_content.py +7 -3
vellum/types/string_chat_message_content_request.py +7 -3
vellum/types/string_input_request.py +7 -3
vellum/types/string_parameter_config.py +39 -0
vellum/types/string_parameter_config_request.py +39 -0
vellum/types/string_variable_value.py +7 -3
vellum/types/string_vellum_value.py +7 -3
vellum/types/string_vellum_value_request.py +7 -3
vellum/types/submit_completion_actual_request.py +7 -3
vellum/types/submit_workflow_execution_actual_request.py +67 -12
vellum/types/subworkflow_node_result.py +7 -3
vellum/types/subworkflow_node_result_data.py +7 -3
vellum/types/templating_node_array_result.py +7 -3
vellum/types/templating_node_chat_history_result.py +7 -3
vellum/types/templating_node_error_result.py +7 -3
vellum/types/templating_node_function_call_result.py +7 -3
vellum/types/templating_node_json_result.py +7 -3
vellum/types/templating_node_number_result.py +7 -3
vellum/types/templating_node_result.py +7 -3
vellum/types/templating_node_result_data.py +7 -3
vellum/types/templating_node_result_output.py +144 -32
vellum/types/templating_node_search_results_result.py +7 -3
vellum/types/templating_node_string_result.py +7 -3
vellum/types/terminal_node_array_result.py +7 -3
vellum/types/terminal_node_chat_history_result.py +7 -3
vellum/types/terminal_node_error_result.py +7 -3
vellum/types/terminal_node_function_call_result.py +7 -3
vellum/types/terminal_node_json_result.py +7 -3
vellum/types/terminal_node_number_result.py +7 -3
vellum/types/terminal_node_result.py +7 -3
vellum/types/terminal_node_result_data.py +7 -3
vellum/types/terminal_node_result_output.py +152 -32
vellum/types/terminal_node_search_results_result.py +7 -3
vellum/types/terminal_node_string_result.py +7 -3
vellum/types/test_case_array_variable_value.py +7 -3
vellum/types/test_case_chat_history_variable_value.py +7 -3
vellum/types/test_case_error_variable_value.py +7 -3
vellum/types/test_case_function_call_variable_value.py +7 -3
vellum/types/test_case_json_variable_value.py +8 -4
vellum/types/test_case_number_variable_value.py +7 -3
vellum/types/test_case_search_results_variable_value.py +7 -3
vellum/types/test_case_string_variable_value.py +7 -3
vellum/types/test_case_variable_value.py +152 -32
vellum/types/test_suite_run_deployment_release_tag_exec_config.py +7 -3
vellum/types/test_suite_run_deployment_release_tag_exec_config_data.py +7 -3
vellum/types/test_suite_run_deployment_release_tag_exec_config_data_request.py +7 -3
vellum/types/test_suite_run_deployment_release_tag_exec_config_request.py +7 -3
vellum/types/test_suite_run_exec_config.py +57 -12
vellum/types/test_suite_run_exec_config_request.py +61 -12
vellum/types/test_suite_run_execution.py +7 -3
vellum/types/test_suite_run_execution_array_output.py +7 -3
vellum/types/test_suite_run_execution_chat_history_output.py +7 -3
vellum/types/test_suite_run_execution_error_output.py +7 -3
vellum/types/test_suite_run_execution_function_call_output.py +7 -3
vellum/types/test_suite_run_execution_json_output.py +7 -3
vellum/types/test_suite_run_execution_metric_definition.py +7 -3
vellum/types/test_suite_run_execution_metric_result.py +7 -3
vellum/types/test_suite_run_execution_number_output.py +7 -3
vellum/types/test_suite_run_execution_output.py +152 -32
vellum/types/test_suite_run_execution_search_results_output.py +7 -3
vellum/types/test_suite_run_execution_string_output.py +7 -3
vellum/types/test_suite_run_external_exec_config.py +7 -3
vellum/types/test_suite_run_external_exec_config_data.py +7 -3
vellum/types/test_suite_run_external_exec_config_data_request.py +7 -3
vellum/types/test_suite_run_external_exec_config_request.py +7 -3
vellum/types/test_suite_run_metric_error_output.py +7 -3
vellum/types/test_suite_run_metric_number_output.py +7 -3
vellum/types/test_suite_run_metric_output.py +55 -12
vellum/types/test_suite_run_metric_string_output.py +7 -3
vellum/types/test_suite_run_read.py +7 -3
vellum/types/test_suite_run_test_suite.py +7 -3
vellum/types/test_suite_run_workflow_release_tag_exec_config.py +7 -3
vellum/types/test_suite_run_workflow_release_tag_exec_config_data.py +7 -3
vellum/types/test_suite_run_workflow_release_tag_exec_config_data_request.py +7 -3
vellum/types/test_suite_run_workflow_release_tag_exec_config_request.py +7 -3
vellum/types/test_suite_test_case.py +7 -3
vellum/types/test_suite_test_case_bulk_operation_request.py +75 -16
vellum/types/test_suite_test_case_bulk_result.py +74 -16
vellum/types/test_suite_test_case_create_bulk_operation_request.py +7 -3
vellum/types/test_suite_test_case_created_bulk_result.py +7 -3
vellum/types/test_suite_test_case_created_bulk_result_data.py +7 -3
vellum/types/test_suite_test_case_delete_bulk_operation_data_request.py +7 -3
vellum/types/test_suite_test_case_delete_bulk_operation_request.py +7 -3
vellum/types/test_suite_test_case_deleted_bulk_result.py +7 -3
vellum/types/test_suite_test_case_deleted_bulk_result_data.py +7 -3
vellum/types/test_suite_test_case_rejected_bulk_result.py +7 -3
vellum/types/test_suite_test_case_replace_bulk_operation_request.py +7 -3
vellum/types/test_suite_test_case_replaced_bulk_result.py +7 -3
vellum/types/test_suite_test_case_replaced_bulk_result_data.py +7 -3
vellum/types/test_suite_test_case_upsert_bulk_operation_request.py +7 -3
vellum/types/{execute_workflow_error_response.py → tik_token_tokenizer_config.py} +11 -6
vellum/types/{generate_error_response.py → tik_token_tokenizer_config_request.py} +11 -6
vellum/types/token_overlapping_window_chunker_config.py +7 -3
vellum/types/token_overlapping_window_chunker_config_request.py +7 -3
vellum/types/token_overlapping_window_chunking.py +7 -3
vellum/types/token_overlapping_window_chunking_request.py +7 -3
vellum/types/upload_document_response.py +7 -3
vellum/types/upsert_test_suite_test_case_request.py +7 -3
vellum/types/vellum_error.py +7 -3
vellum/types/vellum_error_request.py +7 -3
vellum/types/vellum_image.py +7 -3
vellum/types/vellum_image_request.py +7 -3
vellum/types/vellum_variable.py +7 -3
vellum/types/visibility_enum.py +5 -0
vellum/types/workflow_deployment_read.py +12 -3
vellum/types/workflow_event_error.py +7 -3
vellum/types/workflow_execution_actual_chat_history_request.py +7 -3
vellum/types/workflow_execution_actual_json_request.py +7 -3
vellum/types/workflow_execution_actual_string_request.py +7 -3
vellum/types/workflow_execution_node_result_event.py +7 -3
vellum/types/workflow_execution_workflow_result_event.py +7 -3
vellum/types/workflow_expand_meta_request.py +7 -3
vellum/types/workflow_node_result_data.py +189 -45
vellum/types/workflow_node_result_event.py +101 -20
vellum/types/workflow_output.py +171 -36
vellum/types/workflow_output_array.py +7 -3
vellum/types/workflow_output_chat_history.py +7 -3
vellum/types/workflow_output_error.py +7 -3
vellum/types/workflow_output_function_call.py +7 -3
vellum/types/workflow_output_image.py +7 -3
vellum/types/workflow_output_json.py +7 -3
vellum/types/workflow_output_number.py +7 -3
vellum/types/workflow_output_search_results.py +7 -3
vellum/types/workflow_output_string.py +7 -3
vellum/types/workflow_release_tag_read.py +7 -3
vellum/types/workflow_release_tag_workflow_deployment_history_item.py +7 -3
vellum/types/workflow_request_chat_history_input_request.py +7 -3
vellum/types/workflow_request_input_request.py +72 -16
vellum/types/workflow_request_json_input_request.py +7 -3
vellum/types/workflow_request_number_input_request.py +7 -3
vellum/types/workflow_request_string_input_request.py +7 -3
vellum/types/workflow_result_event.py +7 -3
vellum/types/workflow_result_event_output_data.py +178 -33
vellum/types/workflow_result_event_output_data_array.py +7 -3
vellum/types/workflow_result_event_output_data_chat_history.py +7 -3
vellum/types/workflow_result_event_output_data_error.py +7 -3
vellum/types/workflow_result_event_output_data_function_call.py +7 -3
vellum/types/workflow_result_event_output_data_json.py +7 -3
vellum/types/workflow_result_event_output_data_number.py +7 -3
vellum/types/workflow_result_event_output_data_search_results.py +7 -3
vellum/types/workflow_result_event_output_data_string.py +7 -3
vellum/types/workflow_stream_event.py +43 -8
{vellum_ai-0.7.3.dist-info → vellum_ai-0.7.5.dist-info}/METADATA +13 -1
vellum_ai-0.7.5.dist-info/RECORD +502 -0
vellum/types/array_enum.py +0 -5
vellum/types/chat_history_enum.py +0 -5
vellum/types/create_enum.py +0 -5
vellum/types/created_enum.py +0 -5
vellum/types/delete_enum.py +0 -5
vellum/types/deleted_enum.py +0 -5
vellum/types/error_enum.py +0 -5
vellum/types/function_call_enum.py +0 -5
vellum/types/hkunlp_instructor_xl_enum.py +0 -5
vellum/types/image_enum.py +0 -5
vellum/types/initiated_enum.py +0 -5
vellum/types/intfloat_multilingual_e_5_large_enum.py +0 -5
vellum/types/json_enum.py +0 -5
vellum/types/merge_enum.py +0 -5
vellum/types/metric_enum.py +0 -5
vellum/types/number_enum.py +0 -5
vellum/types/pdf_enum.py +0 -5
vellum/types/reducto_chunker_enum.py +0 -5
vellum/types/rejected_enum.py +0 -5
vellum/types/replace_enum.py +0 -5
vellum/types/replaced_enum.py +0 -5
vellum/types/search_error_response.py +0 -28
vellum/types/search_results_enum.py +0 -5
vellum/types/sentence_chunker_enum.py +0 -5
vellum/types/sentence_transformers_multi_qa_mpnet_base_cos_v_1_enum.py +0 -5
vellum/types/sentence_transformers_multi_qa_mpnet_base_dot_v_1_enum.py +0 -5
vellum/types/streaming_enum.py +0 -5
vellum/types/string_enum.py +0 -5
vellum/types/submit_completion_actuals_error_response.py +0 -25
vellum/types/subworkflow_enum.py +0 -5
vellum/types/test_suite_run_deployment_release_tag_exec_config_type_enum.py +0 -5
vellum/types/test_suite_run_external_exec_config_type_enum.py +0 -5
vellum/types/test_suite_run_metric_error_output_type_enum.py +0 -5
vellum/types/test_suite_run_metric_number_output_type_enum.py +0 -5
vellum/types/test_suite_run_metric_string_output_type_enum.py +0 -5
vellum/types/test_suite_run_workflow_release_tag_exec_config_type_enum.py +0 -5
vellum/types/text_embedding_3_large_enum.py +0 -5
vellum/types/text_embedding_3_small_enum.py +0 -5
vellum/types/text_embedding_ada_002_enum.py +0 -5
vellum/types/token_overlapping_window_chunker_enum.py +0 -5
vellum/types/upload_document_error_response.py +0 -25
vellum/types/upsert_enum.py +0 -5
vellum_ai-0.7.3.dist-info/RECORD +0 -496
{vellum_ai-0.7.3.dist-info → vellum_ai-0.7.5.dist-info}/LICENSE +0 -0
{vellum_ai-0.7.3.dist-info → vellum_ai-0.7.5.dist-info}/WHEEL +0 -0

vellum/client.py CHANGED Viewed

@@ -2,16 +2,13 @@
 import json
 import typing
-import urllib.parse
 from json.decoder import JSONDecodeError
 import httpx
 from .core.api_error import ApiError
 from .core.client_wrapper import AsyncClientWrapper, SyncClientWrapper
-from .core.jsonable_encoder import jsonable_encoder
 from .core.pydantic_utilities import pydantic_v1
-from .core.remove_none_from_dict import remove_none_from_dict
 from .core.request_options import RequestOptions
 from .environment import VellumEnvironment
 from .errors.bad_request_error import BadRequestError
@@ -22,6 +19,7 @@ from .resources.deployments.client import AsyncDeploymentsClient, DeploymentsCli
 from .resources.document_indexes.client import AsyncDocumentIndexesClient, DocumentIndexesClient
 from .resources.documents.client import AsyncDocumentsClient, DocumentsClient
 from .resources.folder_entities.client import AsyncFolderEntitiesClient, FolderEntitiesClient
+from .resources.ml_models.client import AsyncMlModelsClient, MlModelsClient
 from .resources.sandboxes.client import AsyncSandboxesClient, SandboxesClient
 from .resources.test_suite_runs.client import AsyncTestSuiteRunsClient, TestSuiteRunsClient
 from .resources.test_suites.client import AsyncTestSuitesClient, TestSuitesClient
@@ -52,21 +50,31 @@ OMIT = typing.cast(typing.Any, ...)
 class Vellum:
     """
-    Use this class to access the different functions within the SDK. You can instantiate any number of clients with different configuration that will propogate to these functions.
+    Use this class to access the different functions within the SDK. You can instantiate any number of clients with different configuration that will propagate to these functions.
-    Parameters:
-        - environment: VellumEnvironment. The environment to use for requests from the client. from .environment import VellumEnvironment
+    Parameters
+    ----------
+    environment : VellumEnvironment
+        The environment to use for requests from the client. from .environment import VellumEnvironment
-                                          Defaults to VellumEnvironment.PRODUCTION
-        - api_key: str.
-        - timeout: typing.Optional[float]. The timeout to be used, in seconds, for requests by default the timeout is 60 seconds, unless a custom httpx client is used, in which case a default is not set.
+        Defaults to VellumEnvironment.PRODUCTION
-        - follow_redirects: typing.Optional[bool]. Whether the default httpx client follows redirects or not, this is irrelevant if a custom httpx client is passed in.
-        - httpx_client: typing.Optional[httpx.Client]. The httpx client to use for making requests, a preconfigured client is used by default, however this is useful should you want to pass in any custom httpx configuration.
-    ---
+    api_key : str
+    timeout : typing.Optional[float]
+        The timeout to be used, in seconds, for requests. By default there is no timeout set, unless a custom httpx client is used, in which case this default is not enforced.
+    follow_redirects : typing.Optional[bool]
+        Whether the default httpx client follows redirects or not, this is irrelevant if a custom httpx client is passed in.
+    httpx_client : typing.Optional[httpx.Client]
+        The httpx client to use for making requests, a preconfigured client is used by default, however this is useful should you want to pass in any custom httpx configuration.
+    Examples
+    --------
     from vellum.client import Vellum
     client = Vellum(
@@ -81,7 +89,7 @@ class Vellum:
         api_key: str,
         timeout: typing.Optional[float] = None,
         follow_redirects: typing.Optional[bool] = True,
-        httpx_client: typing.Optional[httpx.Client] = None,
+        httpx_client: typing.Optional[httpx.Client] = None
     ):
         _defaulted_timeout = timeout if timeout is not None else None if httpx_client is None else None
         self._client_wrapper = SyncClientWrapper(
@@ -98,6 +106,7 @@ class Vellum:
         self.document_indexes = DocumentIndexesClient(client_wrapper=self._client_wrapper)
         self.documents = DocumentsClient(client_wrapper=self._client_wrapper)
         self.folder_entities = FolderEntitiesClient(client_wrapper=self._client_wrapper)
+        self.ml_models = MlModelsClient(client_wrapper=self._client_wrapper)
         self.sandboxes = SandboxesClient(client_wrapper=self._client_wrapper)
         self.test_suite_runs = TestSuiteRunsClient(client_wrapper=self._client_wrapper)
         self.test_suites = TestSuitesClient(client_wrapper=self._client_wrapper)
@@ -116,32 +125,50 @@ class Vellum:
         raw_overrides: typing.Optional[RawPromptExecutionOverridesRequest] = OMIT,
         expand_raw: typing.Optional[typing.Sequence[str]] = OMIT,
         metadata: typing.Optional[typing.Dict[str, typing.Any]] = OMIT,
-        request_options: typing.Optional[RequestOptions] = None,
+        request_options: typing.Optional[RequestOptions] = None
     ) -> ExecutePromptResponse:
         """
         Executes a deployed Prompt and returns the result.
-        Parameters:
-            - inputs: typing.Sequence[PromptDeploymentInputRequest]. A list consisting of the Prompt Deployment's input variables and their values.
+        Parameters
+        ----------
+        inputs : typing.Sequence[PromptDeploymentInputRequest]
+            A list consisting of the Prompt Deployment's input variables and their values.
+        prompt_deployment_id : typing.Optional[str]
+            The ID of the Prompt Deployment. Must provide either this or prompt_deployment_name.
+        prompt_deployment_name : typing.Optional[str]
+            The unique name of the Prompt Deployment. Must provide either this or prompt_deployment_id.
+        release_tag : typing.Optional[str]
+            Optionally specify a release tag if you want to pin to a specific release of the Prompt Deployment
-            - prompt_deployment_id: typing.Optional[str]. The ID of the Prompt Deployment. Must provide either this or prompt_deployment_name.
+        external_id : typing.Optional[str]
+            Optionally include a unique identifier for tracking purposes. Must be unique within a given Prompt Deployment.
-            - prompt_deployment_name: typing.Optional[str]. The unique name of the Prompt Deployment. Must provide either this or prompt_deployment_id.
+        expand_meta : typing.Optional[PromptDeploymentExpandMetaRequestRequest]
+            An optionally specified configuration used to opt in to including additional metadata about this prompt execution in the API response. Corresponding values will be returned under the `meta` key of the API response.
-            - release_tag: typing.Optional[str]. Optionally specify a release tag if you want to pin to a specific release of the Prompt Deployment
+        raw_overrides : typing.Optional[RawPromptExecutionOverridesRequest]
+            Overrides for the raw API request sent to the model host. Combined with `expand_raw`, it can be used to access new features from models.
-            - external_id: typing.Optional[str]. Optionally include a unique identifier for tracking purposes. Must be unique within a given Prompt Deployment.
+        expand_raw : typing.Optional[typing.Sequence[str]]
+            A list of keys whose values you'd like to directly return from the JSON response of the model provider. Useful if you need lower-level info returned by model providers that Vellum would otherwise omit. Corresponding key/value pairs will be returned under the `raw` key of the API response.
-            - expand_meta: typing.Optional[PromptDeploymentExpandMetaRequestRequest]. An optionally specified configuration used to opt in to including additional metadata about this prompt execution in the API response. Corresponding values will be returned under the `meta` key of the API response.
+        metadata : typing.Optional[typing.Dict[str, typing.Any]]
+            Arbitrary JSON metadata associated with this request. Can be used to capture additional monitoring data such as user id, session id, etc. for future analysis.
-            - raw_overrides: typing.Optional[RawPromptExecutionOverridesRequest]. Overrides for the raw API request sent to the model host. Combined with `expand_raw`, it can be used to access new features from models.
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
-            - expand_raw: typing.Optional[typing.Sequence[str]]. A list of keys whose values you'd like to directly return from the JSON response of the model provider. Useful if you need lower-level info returned by model providers that Vellum would otherwise omit. Corresponding key/value pairs will be returned under the `raw` key of the API response.
+        Returns
+        -------
+        ExecutePromptResponse
-            - metadata: typing.Optional[typing.Dict[str, typing.Any]]. Arbitrary JSON metadata associated with this request. Can be used to capture additional monitoring data such as user id, session id, etc. for future analysis.
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
+        Examples
+        --------
         from vellum import (
             PromptDeploymentExpandMetaRequestRequest,
             PromptDeploymentInputRequest_String,
@@ -180,60 +207,35 @@ class Vellum:
             metadata={"string": {"key": "value"}},
         )
         """
-        _request: typing.Dict[str, typing.Any] = {"inputs": inputs}
-        if prompt_deployment_id is not OMIT:
-            _request["prompt_deployment_id"] = prompt_deployment_id
-        if prompt_deployment_name is not OMIT:
-            _request["prompt_deployment_name"] = prompt_deployment_name
-        if release_tag is not OMIT:
-            _request["release_tag"] = release_tag
-        if external_id is not OMIT:
-            _request["external_id"] = external_id
-        if expand_meta is not OMIT:
-            _request["expand_meta"] = expand_meta
-        if raw_overrides is not OMIT:
-            _request["raw_overrides"] = raw_overrides
-        if expand_raw is not OMIT:
-            _request["expand_raw"] = expand_raw
-        if metadata is not OMIT:
-            _request["metadata"] = metadata
         _response = self._client_wrapper.httpx_client.request(
+            "v1/execute-prompt",
+            base_url=self._client_wrapper.get_environment().predict,
             method="POST",
-            url=urllib.parse.urljoin(f"{self._client_wrapper.get_environment().predict}/", "v1/execute-prompt"),
-            params=jsonable_encoder(
-                request_options.get("additional_query_parameters") if request_options is not None else None
-            ),
-            json=jsonable_encoder(_request)
-            if request_options is None or request_options.get("additional_body_parameters") is None
-            else {
-                **jsonable_encoder(_request),
-                **(jsonable_encoder(remove_none_from_dict(request_options.get("additional_body_parameters", {})))),
+            json={
+                "inputs": inputs,
+                "prompt_deployment_id": prompt_deployment_id,
+                "prompt_deployment_name": prompt_deployment_name,
+                "release_tag": release_tag,
+                "external_id": external_id,
+                "expand_meta": expand_meta,
+                "raw_overrides": raw_overrides,
+                "expand_raw": expand_raw,
+                "metadata": metadata,
             },
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            request_options=request_options,
+            omit=OMIT,
         )
-        if 200 <= _response.status_code < 300:
-            return pydantic_v1.parse_obj_as(ExecutePromptResponse, _response.json())  # type: ignore
-        if _response.status_code == 400:
-            raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 403:
-            raise ForbiddenError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 404:
-            raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 500:
-            raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
         try:
+            if 200 <= _response.status_code < 300:
+                return pydantic_v1.parse_obj_as(ExecutePromptResponse, _response.json())  # type: ignore
+            if _response.status_code == 400:
+                raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 403:
+                raise ForbiddenError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 404:
+                raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 500:
+                raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
             _response_json = _response.json()
         except JSONDecodeError:
             raise ApiError(status_code=_response.status_code, body=_response.text)
@@ -251,32 +253,50 @@ class Vellum:
         raw_overrides: typing.Optional[RawPromptExecutionOverridesRequest] = OMIT,
         expand_raw: typing.Optional[typing.Sequence[str]] = OMIT,
         metadata: typing.Optional[typing.Dict[str, typing.Any]] = OMIT,
-        request_options: typing.Optional[RequestOptions] = None,
+        request_options: typing.Optional[RequestOptions] = None
     ) -> typing.Iterator[ExecutePromptEvent]:
         """
         Executes a deployed Prompt and streams back the results.
-        Parameters:
-            - inputs: typing.Sequence[PromptDeploymentInputRequest]. A list consisting of the Prompt Deployment's input variables and their values.
+        Parameters
+        ----------
+        inputs : typing.Sequence[PromptDeploymentInputRequest]
+            A list consisting of the Prompt Deployment's input variables and their values.
+        prompt_deployment_id : typing.Optional[str]
+            The ID of the Prompt Deployment. Must provide either this or prompt_deployment_name.
+        prompt_deployment_name : typing.Optional[str]
+            The unique name of the Prompt Deployment. Must provide either this or prompt_deployment_id.
-            - prompt_deployment_id: typing.Optional[str]. The ID of the Prompt Deployment. Must provide either this or prompt_deployment_name.
+        release_tag : typing.Optional[str]
+            Optionally specify a release tag if you want to pin to a specific release of the Prompt Deployment
-            - prompt_deployment_name: typing.Optional[str]. The unique name of the Prompt Deployment. Must provide either this or prompt_deployment_id.
+        external_id : typing.Optional[str]
+            Optionally include a unique identifier for tracking purposes. Must be unique within a given Prompt Deployment.
-            - release_tag: typing.Optional[str]. Optionally specify a release tag if you want to pin to a specific release of the Prompt Deployment
+        expand_meta : typing.Optional[PromptDeploymentExpandMetaRequestRequest]
+            An optionally specified configuration used to opt in to including additional metadata about this prompt execution in the API response. Corresponding values will be returned under the `meta` key of the API response.
-            - external_id: typing.Optional[str]. Optionally include a unique identifier for tracking purposes. Must be unique within a given Prompt Deployment.
+        raw_overrides : typing.Optional[RawPromptExecutionOverridesRequest]
+            Overrides for the raw API request sent to the model host. Combined with `expand_raw`, it can be used to access new features from models.
-            - expand_meta: typing.Optional[PromptDeploymentExpandMetaRequestRequest]. An optionally specified configuration used to opt in to including additional metadata about this prompt execution in the API response. Corresponding values will be returned under the `meta` key of the API response.
+        expand_raw : typing.Optional[typing.Sequence[str]]
+            A list of keys whose values you'd like to directly return from the JSON response of the model provider. Useful if you need lower-level info returned by model providers that Vellum would otherwise omit. Corresponding key/value pairs will be returned under the `raw` key of the API response.
-            - raw_overrides: typing.Optional[RawPromptExecutionOverridesRequest]. Overrides for the raw API request sent to the model host. Combined with `expand_raw`, it can be used to access new features from models.
+        metadata : typing.Optional[typing.Dict[str, typing.Any]]
+            Arbitrary JSON metadata associated with this request. Can be used to capture additional monitoring data such as user id, session id, etc. for future analysis.
-            - expand_raw: typing.Optional[typing.Sequence[str]]. A list of keys whose values you'd like to directly return from the JSON response of the model provider. Useful if you need lower-level info returned by model providers that Vellum would otherwise omit. Corresponding key/value pairs will be returned under the `raw` key of the API response.
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
-            - metadata: typing.Optional[typing.Dict[str, typing.Any]]. Arbitrary JSON metadata associated with this request. Can be used to capture additional monitoring data such as user id, session id, etc. for future analysis.
+        Yields
+        ------
+        typing.Iterator[ExecutePromptEvent]
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
+        Examples
+        --------
         from vellum import (
             PromptDeploymentExpandMetaRequestRequest,
             PromptDeploymentInputRequest_String,
@@ -287,7 +307,7 @@ class Vellum:
         client = Vellum(
             api_key="YOUR_API_KEY",
         )
-        client.execute_prompt_stream(
+        response = client.execute_prompt_stream(
             inputs=[
                 PromptDeploymentInputRequest_String(
                     name="string",
@@ -314,66 +334,46 @@ class Vellum:
             expand_raw=["string"],
             metadata={"string": {"key": "value"}},
         )
+        for chunk in response:
+            yield chunk
         """
-        _request: typing.Dict[str, typing.Any] = {"inputs": inputs}
-        if prompt_deployment_id is not OMIT:
-            _request["prompt_deployment_id"] = prompt_deployment_id
-        if prompt_deployment_name is not OMIT:
-            _request["prompt_deployment_name"] = prompt_deployment_name
-        if release_tag is not OMIT:
-            _request["release_tag"] = release_tag
-        if external_id is not OMIT:
-            _request["external_id"] = external_id
-        if expand_meta is not OMIT:
-            _request["expand_meta"] = expand_meta
-        if raw_overrides is not OMIT:
-            _request["raw_overrides"] = raw_overrides
-        if expand_raw is not OMIT:
-            _request["expand_raw"] = expand_raw
-        if metadata is not OMIT:
-            _request["metadata"] = metadata
         with self._client_wrapper.httpx_client.stream(
+            "v1/execute-prompt-stream",
+            base_url=self._client_wrapper.get_environment().predict,
             method="POST",
-            url=urllib.parse.urljoin(f"{self._client_wrapper.get_environment().predict}/", "v1/execute-prompt-stream"),
-            params=jsonable_encoder(
-                request_options.get("additional_query_parameters") if request_options is not None else None
-            ),
-            json=jsonable_encoder(_request)
-            if request_options is None or request_options.get("additional_body_parameters") is None
-            else {
-                **jsonable_encoder(_request),
-                **(jsonable_encoder(remove_none_from_dict(request_options.get("additional_body_parameters", {})))),
+            json={
+                "inputs": inputs,
+                "prompt_deployment_id": prompt_deployment_id,
+                "prompt_deployment_name": prompt_deployment_name,
+                "release_tag": release_tag,
+                "external_id": external_id,
+                "expand_meta": expand_meta,
+                "raw_overrides": raw_overrides,
+                "expand_raw": expand_raw,
+                "metadata": metadata,
             },
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            request_options=request_options,
+            omit=OMIT,
         ) as _response:
-            if 200 <= _response.status_code < 300:
-                for _text in _response.iter_lines():
-                    if len(_text) == 0:
-                        continue
-                    yield pydantic_v1.parse_obj_as(ExecutePromptEvent, json.loads(_text))  # type: ignore
-                return
-            _response.read()
-            if _response.status_code == 400:
-                raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-            if _response.status_code == 403:
-                raise ForbiddenError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-            if _response.status_code == 404:
-                raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-            if _response.status_code == 500:
-                raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
             try:
+                if 200 <= _response.status_code < 300:
+                    for _text in _response.iter_lines():
+                        try:
+                            if len(_text) == 0:
+                                continue
+                            yield pydantic_v1.parse_obj_as(ExecutePromptEvent, json.loads(_text))  # type: ignore
+                        except:
+                            pass
+                    return
+                _response.read()
+                if _response.status_code == 400:
+                    raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+                if _response.status_code == 403:
+                    raise ForbiddenError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+                if _response.status_code == 404:
+                    raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+                if _response.status_code == 500:
+                    raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
                 _response_json = _response.json()
             except JSONDecodeError:
                 raise ApiError(status_code=_response.status_code, body=_response.text)
@@ -388,26 +388,41 @@ class Vellum:
         workflow_deployment_name: typing.Optional[str] = OMIT,
         release_tag: typing.Optional[str] = OMIT,
         external_id: typing.Optional[str] = OMIT,
-        request_options: typing.Optional[RequestOptions] = None,
+        request_options: typing.Optional[RequestOptions] = None
     ) -> ExecuteWorkflowResponse:
         """
         Executes a deployed Workflow and returns its outputs.
-        Parameters:
-            - inputs: typing.Sequence[WorkflowRequestInputRequest]. The list of inputs defined in the Workflow's Deployment with their corresponding values.
+        Parameters
+        ----------
+        inputs : typing.Sequence[WorkflowRequestInputRequest]
+            The list of inputs defined in the Workflow's Deployment with their corresponding values.
+        expand_meta : typing.Optional[WorkflowExpandMetaRequest]
+            An optionally specified configuration used to opt in to including additional metadata about this workflow execution in the API response. Corresponding values will be returned under the `execution_meta` key within NODE events in the response stream.
+        workflow_deployment_id : typing.Optional[str]
+            The ID of the Workflow Deployment. Must provide either this or workflow_deployment_name.
+        workflow_deployment_name : typing.Optional[str]
+            The name of the Workflow Deployment. Must provide either this or workflow_deployment_id.
-            - expand_meta: typing.Optional[WorkflowExpandMetaRequest]. An optionally specified configuration used to opt in to including additional metadata about this workflow execution in the API response. Corresponding values will be returned under the `execution_meta` key within NODE events in the response stream.
+        release_tag : typing.Optional[str]
+            Optionally specify a release tag if you want to pin to a specific release of the Workflow Deployment
-            - workflow_deployment_id: typing.Optional[str]. The ID of the Workflow Deployment. Must provide either this or workflow_deployment_name.
+        external_id : typing.Optional[str]
+            Optionally include a unique identifier for tracking purposes. Must be unique for a given workflow deployment.
-            - workflow_deployment_name: typing.Optional[str]. The name of the Workflow Deployment. Must provide either this or workflow_deployment_id.
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
-            - release_tag: typing.Optional[str]. Optionally specify a release tag if you want to pin to a specific release of the Workflow Deployment
+        Returns
+        -------
+        ExecuteWorkflowResponse
-            - external_id: typing.Optional[str]. Optionally include a unique identifier for tracking purposes. Must be unique for a given workflow deployment.
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
+        Examples
+        --------
         from vellum import WorkflowExpandMetaRequest, WorkflowRequestInputRequest_String
         from vellum.client import Vellum
@@ -430,52 +445,30 @@ class Vellum:
             external_id="string",
         )
         """
-        _request: typing.Dict[str, typing.Any] = {"inputs": inputs}
-        if expand_meta is not OMIT:
-            _request["expand_meta"] = expand_meta
-        if workflow_deployment_id is not OMIT:
-            _request["workflow_deployment_id"] = workflow_deployment_id
-        if workflow_deployment_name is not OMIT:
-            _request["workflow_deployment_name"] = workflow_deployment_name
-        if release_tag is not OMIT:
-            _request["release_tag"] = release_tag
-        if external_id is not OMIT:
-            _request["external_id"] = external_id
         _response = self._client_wrapper.httpx_client.request(
+            "v1/execute-workflow",
+            base_url=self._client_wrapper.get_environment().predict,
             method="POST",
-            url=urllib.parse.urljoin(f"{self._client_wrapper.get_environment().predict}/", "v1/execute-workflow"),
-            params=jsonable_encoder(
-                request_options.get("additional_query_parameters") if request_options is not None else None
-            ),
-            json=jsonable_encoder(_request)
-            if request_options is None or request_options.get("additional_body_parameters") is None
-            else {
-                **jsonable_encoder(_request),
-                **(jsonable_encoder(remove_none_from_dict(request_options.get("additional_body_parameters", {})))),
+            json={
+                "inputs": inputs,
+                "expand_meta": expand_meta,
+                "workflow_deployment_id": workflow_deployment_id,
+                "workflow_deployment_name": workflow_deployment_name,
+                "release_tag": release_tag,
+                "external_id": external_id,
             },
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            request_options=request_options,
+            omit=OMIT,
         )
-        if 200 <= _response.status_code < 300:
-            return pydantic_v1.parse_obj_as(ExecuteWorkflowResponse, _response.json())  # type: ignore
-        if _response.status_code == 400:
-            raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 404:
-            raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 500:
-            raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
         try:
+            if 200 <= _response.status_code < 300:
+                return pydantic_v1.parse_obj_as(ExecuteWorkflowResponse, _response.json())  # type: ignore
+            if _response.status_code == 400:
+                raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 404:
+                raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 500:
+                raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
             _response_json = _response.json()
         except JSONDecodeError:
             raise ApiError(status_code=_response.status_code, body=_response.text)
@@ -491,35 +484,51 @@ class Vellum:
         release_tag: typing.Optional[str] = OMIT,
         external_id: typing.Optional[str] = OMIT,
         event_types: typing.Optional[typing.Sequence[WorkflowExecutionEventType]] = OMIT,
-        request_options: typing.Optional[RequestOptions] = None,
+        request_options: typing.Optional[RequestOptions] = None
     ) -> typing.Iterator[WorkflowStreamEvent]:
         """
         Executes a deployed Workflow and streams back its results.
-        Parameters:
-            - inputs: typing.Sequence[WorkflowRequestInputRequest]. The list of inputs defined in the Workflow's Deployment with their corresponding values.
+        Parameters
+        ----------
+        inputs : typing.Sequence[WorkflowRequestInputRequest]
+            The list of inputs defined in the Workflow's Deployment with their corresponding values.
-            - expand_meta: typing.Optional[WorkflowExpandMetaRequest]. An optionally specified configuration used to opt in to including additional metadata about this workflow execution in the API response. Corresponding values will be returned under the `execution_meta` key within NODE events in the response stream.
+        expand_meta : typing.Optional[WorkflowExpandMetaRequest]
+            An optionally specified configuration used to opt in to including additional metadata about this workflow execution in the API response. Corresponding values will be returned under the `execution_meta` key within NODE events in the response stream.
-            - workflow_deployment_id: typing.Optional[str]. The ID of the Workflow Deployment. Must provide either this or workflow_deployment_name.
+        workflow_deployment_id : typing.Optional[str]
+            The ID of the Workflow Deployment. Must provide either this or workflow_deployment_name.
-            - workflow_deployment_name: typing.Optional[str]. The name of the Workflow Deployment. Must provide either this or workflow_deployment_id.
+        workflow_deployment_name : typing.Optional[str]
+            The name of the Workflow Deployment. Must provide either this or workflow_deployment_id.
-            - release_tag: typing.Optional[str]. Optionally specify a release tag if you want to pin to a specific release of the Workflow Deployment
+        release_tag : typing.Optional[str]
+            Optionally specify a release tag if you want to pin to a specific release of the Workflow Deployment
-            - external_id: typing.Optional[str]. Optionally include a unique identifier for tracking purposes. Must be unique for a given workflow deployment.
+        external_id : typing.Optional[str]
+            Optionally include a unique identifier for tracking purposes. Must be unique for a given workflow deployment.
-            - event_types: typing.Optional[typing.Sequence[WorkflowExecutionEventType]]. Optionally specify which events you want to receive. Defaults to only WORKFLOW events. Note that the schema of non-WORKFLOW events is unstable and should be used with caution.
+        event_types : typing.Optional[typing.Sequence[WorkflowExecutionEventType]]
+            Optionally specify which events you want to receive. Defaults to only WORKFLOW events. Note that the schema of non-WORKFLOW events is unstable and should be used with caution.
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
+        Yields
+        ------
+        typing.Iterator[WorkflowStreamEvent]
+        Examples
+        --------
         from vellum import WorkflowExpandMetaRequest, WorkflowRequestInputRequest_String
         from vellum.client import Vellum
         client = Vellum(
             api_key="YOUR_API_KEY",
         )
-        client.execute_workflow_stream(
+        response = client.execute_workflow_stream(
             inputs=[
                 WorkflowRequestInputRequest_String(
                     name="string",
@@ -535,62 +544,42 @@ class Vellum:
             external_id="string",
             event_types=["NODE"],
         )
+        for chunk in response:
+            yield chunk
         """
-        _request: typing.Dict[str, typing.Any] = {"inputs": inputs}
-        if expand_meta is not OMIT:
-            _request["expand_meta"] = expand_meta
-        if workflow_deployment_id is not OMIT:
-            _request["workflow_deployment_id"] = workflow_deployment_id
-        if workflow_deployment_name is not OMIT:
-            _request["workflow_deployment_name"] = workflow_deployment_name
-        if release_tag is not OMIT:
-            _request["release_tag"] = release_tag
-        if external_id is not OMIT:
-            _request["external_id"] = external_id
-        if event_types is not OMIT:
-            _request["event_types"] = event_types
         with self._client_wrapper.httpx_client.stream(
+            "v1/execute-workflow-stream",
+            base_url=self._client_wrapper.get_environment().predict,
             method="POST",
-            url=urllib.parse.urljoin(
-                f"{self._client_wrapper.get_environment().predict}/", "v1/execute-workflow-stream"
-            ),
-            params=jsonable_encoder(
-                request_options.get("additional_query_parameters") if request_options is not None else None
-            ),
-            json=jsonable_encoder(_request)
-            if request_options is None or request_options.get("additional_body_parameters") is None
-            else {
-                **jsonable_encoder(_request),
-                **(jsonable_encoder(remove_none_from_dict(request_options.get("additional_body_parameters", {})))),
+            json={
+                "inputs": inputs,
+                "expand_meta": expand_meta,
+                "workflow_deployment_id": workflow_deployment_id,
+                "workflow_deployment_name": workflow_deployment_name,
+                "release_tag": release_tag,
+                "external_id": external_id,
+                "event_types": event_types,
             },
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            request_options=request_options,
+            omit=OMIT,
         ) as _response:
-            if 200 <= _response.status_code < 300:
-                for _text in _response.iter_lines():
-                    if len(_text) == 0:
-                        continue
-                    yield pydantic_v1.parse_obj_as(WorkflowStreamEvent, json.loads(_text))  # type: ignore
-                return
-            _response.read()
-            if _response.status_code == 400:
-                raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-            if _response.status_code == 404:
-                raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-            if _response.status_code == 500:
-                raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
             try:
+                if 200 <= _response.status_code < 300:
+                    for _text in _response.iter_lines():
+                        try:
+                            if len(_text) == 0:
+                                continue
+                            yield pydantic_v1.parse_obj_as(WorkflowStreamEvent, json.loads(_text))  # type: ignore
+                        except:
+                            pass
+                    return
+                _response.read()
+                if _response.status_code == 400:
+                    raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+                if _response.status_code == 404:
+                    raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+                if _response.status_code == 500:
+                    raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
                 _response_json = _response.json()
             except JSONDecodeError:
                 raise ApiError(status_code=_response.status_code, body=_response.text)
@@ -599,11 +588,11 @@ class Vellum:
     def generate(
         self,
         *,
+        requests: typing.Sequence[GenerateRequest],
         deployment_id: typing.Optional[str] = OMIT,
         deployment_name: typing.Optional[str] = OMIT,
-        requests: typing.Sequence[GenerateRequest],
         options: typing.Optional[GenerateOptionsRequest] = OMIT,
-        request_options: typing.Optional[RequestOptions] = None,
+        request_options: typing.Optional[RequestOptions] = None
     ) -> GenerateResponse:
         """
         Generate a completion using a previously defined deployment.
@@ -611,17 +600,30 @@ class Vellum:
         Important: This endpoint is DEPRECATED and has been superseded by
         [execute-prompt](/api-reference/api-reference/execute-prompt).
-        Parameters:
-            - deployment_id: typing.Optional[str]. The ID of the deployment. Must provide either this or deployment_name.
+        Parameters
+        ----------
+        requests : typing.Sequence[GenerateRequest]
+            The generation request to make. Bulk requests are no longer supported, this field must be an array of length 1.
+        deployment_id : typing.Optional[str]
+            The ID of the deployment. Must provide either this or deployment_name.
+        deployment_name : typing.Optional[str]
+            The name of the deployment. Must provide either this or deployment_id.
+        options : typing.Optional[GenerateOptionsRequest]
+            Additional configuration that can be used to control what's included in the response.
-            - deployment_name: typing.Optional[str]. The name of the deployment. Must provide either this or deployment_id.
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
-            - requests: typing.Sequence[GenerateRequest]. The generation request to make. Bulk requests are no longer supported, this field must be an array of length 1.
+        Returns
+        -------
+        GenerateResponse
-            - options: typing.Optional[GenerateOptionsRequest]. Additional configuration that can be used to control what's included in the response.
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
+        Examples
+        --------
         from vellum import GenerateRequest
         from vellum.client import Vellum
@@ -631,55 +633,35 @@ class Vellum:
         client.generate(
             requests=[
                 GenerateRequest(
-                    input_values={},
+                    input_values={"key": "value"},
                 )
             ],
         )
         """
-        _request: typing.Dict[str, typing.Any] = {"requests": requests}
-        if deployment_id is not OMIT:
-            _request["deployment_id"] = deployment_id
-        if deployment_name is not OMIT:
-            _request["deployment_name"] = deployment_name
-        if options is not OMIT:
-            _request["options"] = options
         _response = self._client_wrapper.httpx_client.request(
+            "v1/generate",
+            base_url=self._client_wrapper.get_environment().predict,
             method="POST",
-            url=urllib.parse.urljoin(f"{self._client_wrapper.get_environment().predict}/", "v1/generate"),
-            params=jsonable_encoder(
-                request_options.get("additional_query_parameters") if request_options is not None else None
-            ),
-            json=jsonable_encoder(_request)
-            if request_options is None or request_options.get("additional_body_parameters") is None
-            else {
-                **jsonable_encoder(_request),
-                **(jsonable_encoder(remove_none_from_dict(request_options.get("additional_body_parameters", {})))),
+            json={
+                "deployment_id": deployment_id,
+                "deployment_name": deployment_name,
+                "requests": requests,
+                "options": options,
             },
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            request_options=request_options,
+            omit=OMIT,
         )
-        if 200 <= _response.status_code < 300:
-            return pydantic_v1.parse_obj_as(GenerateResponse, _response.json())  # type: ignore
-        if _response.status_code == 400:
-            raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 403:
-            raise ForbiddenError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 404:
-            raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 500:
-            raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
         try:
+            if 200 <= _response.status_code < 300:
+                return pydantic_v1.parse_obj_as(GenerateResponse, _response.json())  # type: ignore
+            if _response.status_code == 400:
+                raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 403:
+                raise ForbiddenError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 404:
+                raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 500:
+                raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
             _response_json = _response.json()
         except JSONDecodeError:
             raise ApiError(status_code=_response.status_code, body=_response.text)
@@ -688,11 +670,11 @@ class Vellum:
     def generate_stream(
         self,
         *,
+        requests: typing.Sequence[GenerateRequest],
         deployment_id: typing.Optional[str] = OMIT,
         deployment_name: typing.Optional[str] = OMIT,
-        requests: typing.Sequence[GenerateRequest],
         options: typing.Optional[GenerateOptionsRequest] = OMIT,
-        request_options: typing.Optional[RequestOptions] = None,
+        request_options: typing.Optional[RequestOptions] = None
     ) -> typing.Iterator[GenerateStreamResponse]:
         """
         Generate a stream of completions using a previously defined deployment.
@@ -700,17 +682,30 @@ class Vellum:
         Important: This endpoint is DEPRECATED and has been superseded by
         [execute-prompt-stream](/api-reference/api-reference/execute-prompt-stream).
-        Parameters:
-            - deployment_id: typing.Optional[str]. The ID of the deployment. Must provide either this or deployment_name.
+        Parameters
+        ----------
+        requests : typing.Sequence[GenerateRequest]
+            The generation request to make. Bulk requests are no longer supported, this field must be an array of length 1.
+        deployment_id : typing.Optional[str]
+            The ID of the deployment. Must provide either this or deployment_name.
+        deployment_name : typing.Optional[str]
+            The name of the deployment. Must provide either this or deployment_id.
+        options : typing.Optional[GenerateOptionsRequest]
+            Additional configuration that can be used to control what's included in the response.
-            - deployment_name: typing.Optional[str]. The name of the deployment. Must provide either this or deployment_id.
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
-            - requests: typing.Sequence[GenerateRequest]. The generation request to make. Bulk requests are no longer supported, this field must be an array of length 1.
+        Yields
+        ------
+        typing.Iterator[GenerateStreamResponse]
-            - options: typing.Optional[GenerateOptionsRequest]. Additional configuration that can be used to control what's included in the response.
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
+        Examples
+        --------
         from vellum import (
             ChatMessageContentRequest_String,
             ChatMessageRequest,
@@ -722,7 +717,7 @@ class Vellum:
         client = Vellum(
             api_key="YOUR_API_KEY",
         )
-        client.generate_stream(
+        response = client.generate_stream(
             deployment_id="string",
             deployment_name="string",
             requests=[
@@ -743,56 +738,41 @@ class Vellum:
                 logprobs="ALL",
             ),
         )
+        for chunk in response:
+            yield chunk
         """
-        _request: typing.Dict[str, typing.Any] = {"requests": requests}
-        if deployment_id is not OMIT:
-            _request["deployment_id"] = deployment_id
-        if deployment_name is not OMIT:
-            _request["deployment_name"] = deployment_name
-        if options is not OMIT:
-            _request["options"] = options
         with self._client_wrapper.httpx_client.stream(
+            "v1/generate-stream",
+            base_url=self._client_wrapper.get_environment().predict,
             method="POST",
-            url=urllib.parse.urljoin(f"{self._client_wrapper.get_environment().predict}/", "v1/generate-stream"),
-            params=jsonable_encoder(
-                request_options.get("additional_query_parameters") if request_options is not None else None
-            ),
-            json=jsonable_encoder(_request)
-            if request_options is None or request_options.get("additional_body_parameters") is None
-            else {
-                **jsonable_encoder(_request),
-                **(jsonable_encoder(remove_none_from_dict(request_options.get("additional_body_parameters", {})))),
+            json={
+                "deployment_id": deployment_id,
+                "deployment_name": deployment_name,
+                "requests": requests,
+                "options": options,
             },
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            request_options=request_options,
+            omit=OMIT,
         ) as _response:
-            if 200 <= _response.status_code < 300:
-                for _text in _response.iter_lines():
-                    if len(_text) == 0:
-                        continue
-                    yield pydantic_v1.parse_obj_as(GenerateStreamResponse, json.loads(_text))  # type: ignore
-                return
-            _response.read()
-            if _response.status_code == 400:
-                raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-            if _response.status_code == 403:
-                raise ForbiddenError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-            if _response.status_code == 404:
-                raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-            if _response.status_code == 500:
-                raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
             try:
+                if 200 <= _response.status_code < 300:
+                    for _text in _response.iter_lines():
+                        try:
+                            if len(_text) == 0:
+                                continue
+                            yield pydantic_v1.parse_obj_as(GenerateStreamResponse, json.loads(_text))  # type: ignore
+                        except:
+                            pass
+                    return
+                _response.read()
+                if _response.status_code == 400:
+                    raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+                if _response.status_code == 403:
+                    raise ForbiddenError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+                if _response.status_code == 404:
+                    raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+                if _response.status_code == 500:
+                    raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
                 _response_json = _response.json()
             except JSONDecodeError:
                 raise ApiError(status_code=_response.status_code, body=_response.text)
@@ -801,26 +781,39 @@ class Vellum:
     def search(
         self,
         *,
+        query: str,
         index_id: typing.Optional[str] = OMIT,
         index_name: typing.Optional[str] = OMIT,
-        query: str,
         options: typing.Optional[SearchRequestOptionsRequest] = OMIT,
-        request_options: typing.Optional[RequestOptions] = None,
+        request_options: typing.Optional[RequestOptions] = None
     ) -> SearchResponse:
         """
         Perform a search against a document index.
-        Parameters:
-            - index_id: typing.Optional[str]. The ID of the index to search against. Must provide either this or index_name.
+        Parameters
+        ----------
+        query : str
+            The query to search for.
+        index_id : typing.Optional[str]
+            The ID of the index to search against. Must provide either this or index_name.
-            - index_name: typing.Optional[str]. The name of the index to search against. Must provide either this or index_id.
+        index_name : typing.Optional[str]
+            The name of the index to search against. Must provide either this or index_id.
-            - query: str. The query to search for.
+        options : typing.Optional[SearchRequestOptionsRequest]
+            Configuration options for the search.
-            - options: typing.Optional[SearchRequestOptionsRequest]. Configuration options for the search.
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
+        Returns
+        -------
+        SearchResponse
+        Examples
+        --------
         from vellum.client import Vellum
         client = Vellum(
@@ -830,48 +823,23 @@ class Vellum:
             query="query",
         )
         """
-        _request: typing.Dict[str, typing.Any] = {"query": query}
-        if index_id is not OMIT:
-            _request["index_id"] = index_id
-        if index_name is not OMIT:
-            _request["index_name"] = index_name
-        if options is not OMIT:
-            _request["options"] = options
         _response = self._client_wrapper.httpx_client.request(
+            "v1/search",
+            base_url=self._client_wrapper.get_environment().predict,
             method="POST",
-            url=urllib.parse.urljoin(f"{self._client_wrapper.get_environment().predict}/", "v1/search"),
-            params=jsonable_encoder(
-                request_options.get("additional_query_parameters") if request_options is not None else None
-            ),
-            json=jsonable_encoder(_request)
-            if request_options is None or request_options.get("additional_body_parameters") is None
-            else {
-                **jsonable_encoder(_request),
-                **(jsonable_encoder(remove_none_from_dict(request_options.get("additional_body_parameters", {})))),
-            },
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            json={"index_id": index_id, "index_name": index_name, "query": query, "options": options},
+            request_options=request_options,
+            omit=OMIT,
         )
-        if 200 <= _response.status_code < 300:
-            return pydantic_v1.parse_obj_as(SearchResponse, _response.json())  # type: ignore
-        if _response.status_code == 400:
-            raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 404:
-            raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 500:
-            raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
         try:
+            if 200 <= _response.status_code < 300:
+                return pydantic_v1.parse_obj_as(SearchResponse, _response.json())  # type: ignore
+            if _response.status_code == 400:
+                raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 404:
+                raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 500:
+                raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
             _response_json = _response.json()
         except JSONDecodeError:
             raise ApiError(status_code=_response.status_code, body=_response.text)
@@ -880,23 +848,34 @@ class Vellum:
     def submit_completion_actuals(
         self,
         *,
+        actuals: typing.Sequence[SubmitCompletionActualRequest],
         deployment_id: typing.Optional[str] = OMIT,
         deployment_name: typing.Optional[str] = OMIT,
-        actuals: typing.Sequence[SubmitCompletionActualRequest],
-        request_options: typing.Optional[RequestOptions] = None,
+        request_options: typing.Optional[RequestOptions] = None
     ) -> None:
         """
         Used to submit feedback regarding the quality of previously generated completions.
-        Parameters:
-            - deployment_id: typing.Optional[str]. The ID of the deployment. Must provide either this or deployment_name.
+        Parameters
+        ----------
+        actuals : typing.Sequence[SubmitCompletionActualRequest]
+            Feedback regarding the quality of previously generated completions
+        deployment_id : typing.Optional[str]
+            The ID of the deployment. Must provide either this or deployment_name.
+        deployment_name : typing.Optional[str]
+            The name of the deployment. Must provide either this or deployment_id.
-            - deployment_name: typing.Optional[str]. The name of the deployment. Must provide either this or deployment_id.
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
-            - actuals: typing.Sequence[SubmitCompletionActualRequest]. Feedback regarding the quality of previously generated completions
+        Returns
+        -------
+        None
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
+        Examples
+        --------
         from vellum import SubmitCompletionActualRequest
         from vellum.client import Vellum
@@ -907,48 +886,23 @@ class Vellum:
             actuals=[SubmitCompletionActualRequest()],
         )
         """
-        _request: typing.Dict[str, typing.Any] = {"actuals": actuals}
-        if deployment_id is not OMIT:
-            _request["deployment_id"] = deployment_id
-        if deployment_name is not OMIT:
-            _request["deployment_name"] = deployment_name
         _response = self._client_wrapper.httpx_client.request(
+            "v1/submit-completion-actuals",
+            base_url=self._client_wrapper.get_environment().predict,
             method="POST",
-            url=urllib.parse.urljoin(
-                f"{self._client_wrapper.get_environment().predict}/", "v1/submit-completion-actuals"
-            ),
-            params=jsonable_encoder(
-                request_options.get("additional_query_parameters") if request_options is not None else None
-            ),
-            json=jsonable_encoder(_request)
-            if request_options is None or request_options.get("additional_body_parameters") is None
-            else {
-                **jsonable_encoder(_request),
-                **(jsonable_encoder(remove_none_from_dict(request_options.get("additional_body_parameters", {})))),
-            },
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            json={"deployment_id": deployment_id, "deployment_name": deployment_name, "actuals": actuals},
+            request_options=request_options,
+            omit=OMIT,
         )
-        if 200 <= _response.status_code < 300:
-            return
-        if _response.status_code == 400:
-            raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 404:
-            raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 500:
-            raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
         try:
+            if 200 <= _response.status_code < 300:
+                return
+            if _response.status_code == 400:
+                raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 404:
+                raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 500:
+                raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
             _response_json = _response.json()
         except JSONDecodeError:
             raise ApiError(status_code=_response.status_code, body=_response.text)
@@ -960,22 +914,33 @@ class Vellum:
         actuals: typing.Sequence[SubmitWorkflowExecutionActualRequest],
         execution_id: typing.Optional[str] = OMIT,
         external_id: typing.Optional[str] = OMIT,
-        request_options: typing.Optional[RequestOptions] = None,
+        request_options: typing.Optional[RequestOptions] = None
     ) -> None:
         """
             Used to submit feedback regarding the quality of previous workflow execution and its outputs.
             **Note:** Uses a base url of `https://predict.vellum.ai`.
-        Parameters:
-            - actuals: typing.Sequence[SubmitWorkflowExecutionActualRequest]. Feedback regarding the quality of an output on a previously executed workflow.
+        Parameters
+        ----------
+        actuals : typing.Sequence[SubmitWorkflowExecutionActualRequest]
+            Feedback regarding the quality of an output on a previously executed workflow.
-            - execution_id: typing.Optional[str]. The Vellum-generated ID of a previously executed workflow. Must provide either this or external_id.
+        execution_id : typing.Optional[str]
+            The Vellum-generated ID of a previously executed workflow. Must provide either this or external_id.
-            - external_id: typing.Optional[str]. The external ID that was originally provided by when executing the workflow, if applicable, that you'd now like to submit actuals for. Must provide either this or execution_id.
+        external_id : typing.Optional[str]
+            The external ID that was originally provided by when executing the workflow, if applicable, that you'd now like to submit actuals for. Must provide either this or execution_id.
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
+        Returns
+        -------
+        None
+        Examples
+        --------
         from vellum.client import Vellum
         client = Vellum(
@@ -985,42 +950,17 @@ class Vellum:
             actuals=[],
         )
         """
-        _request: typing.Dict[str, typing.Any] = {"actuals": actuals}
-        if execution_id is not OMIT:
-            _request["execution_id"] = execution_id
-        if external_id is not OMIT:
-            _request["external_id"] = external_id
         _response = self._client_wrapper.httpx_client.request(
+            "v1/submit-workflow-execution-actuals",
+            base_url=self._client_wrapper.get_environment().predict,
             method="POST",
-            url=urllib.parse.urljoin(
-                f"{self._client_wrapper.get_environment().predict}/", "v1/submit-workflow-execution-actuals"
-            ),
-            params=jsonable_encoder(
-                request_options.get("additional_query_parameters") if request_options is not None else None
-            ),
-            json=jsonable_encoder(_request)
-            if request_options is None or request_options.get("additional_body_parameters") is None
-            else {
-                **jsonable_encoder(_request),
-                **(jsonable_encoder(remove_none_from_dict(request_options.get("additional_body_parameters", {})))),
-            },
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            json={"actuals": actuals, "execution_id": execution_id, "external_id": external_id},
+            request_options=request_options,
+            omit=OMIT,
         )
-        if 200 <= _response.status_code < 300:
-            return
         try:
+            if 200 <= _response.status_code < 300:
+                return
             _response_json = _response.json()
         except JSONDecodeError:
             raise ApiError(status_code=_response.status_code, body=_response.text)
@@ -1029,21 +969,31 @@ class Vellum:
 class AsyncVellum:
     """
-    Use this class to access the different functions within the SDK. You can instantiate any number of clients with different configuration that will propogate to these functions.
+    Use this class to access the different functions within the SDK. You can instantiate any number of clients with different configuration that will propagate to these functions.
+    Parameters
+    ----------
+    environment : VellumEnvironment
+        The environment to use for requests from the client. Import it with `from .environment import VellumEnvironment`.
-    Parameters:
-        - environment: VellumEnvironment. The environment to use for requests from the client. from .environment import VellumEnvironment
-                                          Defaults to VellumEnvironment.PRODUCTION
-        - api_key: str.
+        Defaults to VellumEnvironment.PRODUCTION
-        - timeout: typing.Optional[float]. The timeout to be used, in seconds, for requests by default the timeout is 60 seconds, unless a custom httpx client is used, in which case a default is not set.
-        - follow_redirects: typing.Optional[bool]. Whether the default httpx client follows redirects or not, this is irrelevant if a custom httpx client is passed in.
-        - httpx_client: typing.Optional[httpx.AsyncClient]. The httpx client to use for making requests, a preconfigured client is used by default, however this is useful should you want to pass in any custom httpx configuration.
-    ---
+    api_key : str
+    timeout : typing.Optional[float]
+        The timeout to be used, in seconds, for requests. By default there is no timeout set, unless a custom httpx client is used, in which case this default is not enforced.
+    follow_redirects : typing.Optional[bool]
+        Whether the default httpx client follows redirects or not. This is irrelevant if a custom httpx client is passed in.
+    httpx_client : typing.Optional[httpx.AsyncClient]
+        The httpx client to use for making requests. A preconfigured client is used by default; pass your own client if you need custom httpx configuration.
+    Examples
+    --------
     from vellum.client import AsyncVellum
     client = AsyncVellum(
@@ -1058,7 +1008,7 @@ class AsyncVellum:
         api_key: str,
         timeout: typing.Optional[float] = None,
         follow_redirects: typing.Optional[bool] = True,
-        httpx_client: typing.Optional[httpx.AsyncClient] = None,
+        httpx_client: typing.Optional[httpx.AsyncClient] = None
     ):
         _defaulted_timeout = timeout if timeout is not None else None if httpx_client is None else None
         self._client_wrapper = AsyncClientWrapper(
@@ -1075,6 +1025,7 @@ class AsyncVellum:
         self.document_indexes = AsyncDocumentIndexesClient(client_wrapper=self._client_wrapper)
         self.documents = AsyncDocumentsClient(client_wrapper=self._client_wrapper)
         self.folder_entities = AsyncFolderEntitiesClient(client_wrapper=self._client_wrapper)
+        self.ml_models = AsyncMlModelsClient(client_wrapper=self._client_wrapper)
         self.sandboxes = AsyncSandboxesClient(client_wrapper=self._client_wrapper)
         self.test_suite_runs = AsyncTestSuiteRunsClient(client_wrapper=self._client_wrapper)
         self.test_suites = AsyncTestSuitesClient(client_wrapper=self._client_wrapper)
@@ -1093,32 +1044,52 @@ class AsyncVellum:
         raw_overrides: typing.Optional[RawPromptExecutionOverridesRequest] = OMIT,
         expand_raw: typing.Optional[typing.Sequence[str]] = OMIT,
         metadata: typing.Optional[typing.Dict[str, typing.Any]] = OMIT,
-        request_options: typing.Optional[RequestOptions] = None,
+        request_options: typing.Optional[RequestOptions] = None
     ) -> ExecutePromptResponse:
         """
         Executes a deployed Prompt and returns the result.
-        Parameters:
-            - inputs: typing.Sequence[PromptDeploymentInputRequest]. A list consisting of the Prompt Deployment's input variables and their values.
+        Parameters
+        ----------
+        inputs : typing.Sequence[PromptDeploymentInputRequest]
+            A list consisting of the Prompt Deployment's input variables and their values.
+        prompt_deployment_id : typing.Optional[str]
+            The ID of the Prompt Deployment. Must provide either this or prompt_deployment_name.
+        prompt_deployment_name : typing.Optional[str]
+            The unique name of the Prompt Deployment. Must provide either this or prompt_deployment_id.
+        release_tag : typing.Optional[str]
+            Optionally specify a release tag if you want to pin to a specific release of the Prompt Deployment.
+        external_id : typing.Optional[str]
+            Optionally include a unique identifier for tracking purposes. Must be unique within a given Prompt Deployment.
-            - prompt_deployment_id: typing.Optional[str]. The ID of the Prompt Deployment. Must provide either this or prompt_deployment_name.
+        expand_meta : typing.Optional[PromptDeploymentExpandMetaRequestRequest]
+            An optionally specified configuration used to opt in to including additional metadata about this prompt execution in the API response. Corresponding values will be returned under the `meta` key of the API response.
-            - prompt_deployment_name: typing.Optional[str]. The unique name of the Prompt Deployment. Must provide either this or prompt_deployment_id.
+        raw_overrides : typing.Optional[RawPromptExecutionOverridesRequest]
+            Overrides for the raw API request sent to the model host. Combined with `expand_raw`, it can be used to access new features from models.
-            - release_tag: typing.Optional[str]. Optionally specify a release tag if you want to pin to a specific release of the Prompt Deployment
+        expand_raw : typing.Optional[typing.Sequence[str]]
+            A list of keys whose values you'd like to directly return from the JSON response of the model provider. Useful if you need lower-level info returned by model providers that Vellum would otherwise omit. Corresponding key/value pairs will be returned under the `raw` key of the API response.
-            - external_id: typing.Optional[str]. Optionally include a unique identifier for tracking purposes. Must be unique within a given Prompt Deployment.
+        metadata : typing.Optional[typing.Dict[str, typing.Any]]
+            Arbitrary JSON metadata associated with this request. Can be used to capture additional monitoring data such as user id, session id, etc. for future analysis.
-            - expand_meta: typing.Optional[PromptDeploymentExpandMetaRequestRequest]. An optionally specified configuration used to opt in to including additional metadata about this prompt execution in the API response. Corresponding values will be returned under the `meta` key of the API response.
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
-            - raw_overrides: typing.Optional[RawPromptExecutionOverridesRequest]. Overrides for the raw API request sent to the model host. Combined with `expand_raw`, it can be used to access new features from models.
+        Returns
+        -------
+        ExecutePromptResponse
-            - expand_raw: typing.Optional[typing.Sequence[str]]. A list of keys whose values you'd like to directly return from the JSON response of the model provider. Useful if you need lower-level info returned by model providers that Vellum would otherwise omit. Corresponding key/value pairs will be returned under the `raw` key of the API response.
-            - metadata: typing.Optional[typing.Dict[str, typing.Any]]. Arbitrary JSON metadata associated with this request. Can be used to capture additional monitoring data such as user id, session id, etc. for future analysis.
+        Examples
+        --------
+        import asyncio
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
         from vellum import (
             PromptDeploymentExpandMetaRequestRequest,
             PromptDeploymentInputRequest_String,
@@ -1129,88 +1100,69 @@ class AsyncVellum:
         client = AsyncVellum(
             api_key="YOUR_API_KEY",
         )
-        await client.execute_prompt(
-            inputs=[
-                PromptDeploymentInputRequest_String(
-                    name="string",
-                    value="string",
-                )
-            ],
-            prompt_deployment_id="string",
-            prompt_deployment_name="string",
-            release_tag="string",
-            external_id="string",
-            expand_meta=PromptDeploymentExpandMetaRequestRequest(
-                model_name=True,
-                usage=True,
-                finish_reason=True,
-                latency=True,
-                deployment_release_tag=True,
-                prompt_version_id=True,
-            ),
-            raw_overrides=RawPromptExecutionOverridesRequest(
-                body={"string": {"key": "value"}},
-                headers={"string": {"key": "value"}},
-                url="string",
-            ),
-            expand_raw=["string"],
-            metadata={"string": {"key": "value"}},
-        )
+        async def main() -> None:
+            await client.execute_prompt(
+                inputs=[
+                    PromptDeploymentInputRequest_String(
+                        name="string",
+                        value="string",
+                    )
+                ],
+                prompt_deployment_id="string",
+                prompt_deployment_name="string",
+                release_tag="string",
+                external_id="string",
+                expand_meta=PromptDeploymentExpandMetaRequestRequest(
+                    model_name=True,
+                    usage=True,
+                    finish_reason=True,
+                    latency=True,
+                    deployment_release_tag=True,
+                    prompt_version_id=True,
+                ),
+                raw_overrides=RawPromptExecutionOverridesRequest(
+                    body={"string": {"key": "value"}},
+                    headers={"string": {"key": "value"}},
+                    url="string",
+                ),
+                expand_raw=["string"],
+                metadata={"string": {"key": "value"}},
+            )
+        asyncio.run(main())
         """
-        _request: typing.Dict[str, typing.Any] = {"inputs": inputs}
-        if prompt_deployment_id is not OMIT:
-            _request["prompt_deployment_id"] = prompt_deployment_id
-        if prompt_deployment_name is not OMIT:
-            _request["prompt_deployment_name"] = prompt_deployment_name
-        if release_tag is not OMIT:
-            _request["release_tag"] = release_tag
-        if external_id is not OMIT:
-            _request["external_id"] = external_id
-        if expand_meta is not OMIT:
-            _request["expand_meta"] = expand_meta
-        if raw_overrides is not OMIT:
-            _request["raw_overrides"] = raw_overrides
-        if expand_raw is not OMIT:
-            _request["expand_raw"] = expand_raw
-        if metadata is not OMIT:
-            _request["metadata"] = metadata
         _response = await self._client_wrapper.httpx_client.request(
+            "v1/execute-prompt",
+            base_url=self._client_wrapper.get_environment().predict,
             method="POST",
-            url=urllib.parse.urljoin(f"{self._client_wrapper.get_environment().predict}/", "v1/execute-prompt"),
-            params=jsonable_encoder(
-                request_options.get("additional_query_parameters") if request_options is not None else None
-            ),
-            json=jsonable_encoder(_request)
-            if request_options is None or request_options.get("additional_body_parameters") is None
-            else {
-                **jsonable_encoder(_request),
-                **(jsonable_encoder(remove_none_from_dict(request_options.get("additional_body_parameters", {})))),
+            json={
+                "inputs": inputs,
+                "prompt_deployment_id": prompt_deployment_id,
+                "prompt_deployment_name": prompt_deployment_name,
+                "release_tag": release_tag,
+                "external_id": external_id,
+                "expand_meta": expand_meta,
+                "raw_overrides": raw_overrides,
+                "expand_raw": expand_raw,
+                "metadata": metadata,
             },
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            request_options=request_options,
+            omit=OMIT,
         )
-        if 200 <= _response.status_code < 300:
-            return pydantic_v1.parse_obj_as(ExecutePromptResponse, _response.json())  # type: ignore
-        if _response.status_code == 400:
-            raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 403:
-            raise ForbiddenError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 404:
-            raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 500:
-            raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
         try:
+            if 200 <= _response.status_code < 300:
+                return pydantic_v1.parse_obj_as(ExecutePromptResponse, _response.json())  # type: ignore
+            if _response.status_code == 400:
+                raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 403:
+                raise ForbiddenError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 404:
+                raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 500:
+                raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
             _response_json = _response.json()
         except JSONDecodeError:
             raise ApiError(status_code=_response.status_code, body=_response.text)
@@ -1228,32 +1180,52 @@ class AsyncVellum:
         raw_overrides: typing.Optional[RawPromptExecutionOverridesRequest] = OMIT,
         expand_raw: typing.Optional[typing.Sequence[str]] = OMIT,
         metadata: typing.Optional[typing.Dict[str, typing.Any]] = OMIT,
-        request_options: typing.Optional[RequestOptions] = None,
+        request_options: typing.Optional[RequestOptions] = None
     ) -> typing.AsyncIterator[ExecutePromptEvent]:
         """
         Executes a deployed Prompt and streams back the results.
-        Parameters:
-            - inputs: typing.Sequence[PromptDeploymentInputRequest]. A list consisting of the Prompt Deployment's input variables and their values.
+        Parameters
+        ----------
+        inputs : typing.Sequence[PromptDeploymentInputRequest]
+            A list consisting of the Prompt Deployment's input variables and their values.
-            - prompt_deployment_id: typing.Optional[str]. The ID of the Prompt Deployment. Must provide either this or prompt_deployment_name.
+        prompt_deployment_id : typing.Optional[str]
+            The ID of the Prompt Deployment. Must provide either this or prompt_deployment_name.
-            - prompt_deployment_name: typing.Optional[str]. The unique name of the Prompt Deployment. Must provide either this or prompt_deployment_id.
+        prompt_deployment_name : typing.Optional[str]
+            The unique name of the Prompt Deployment. Must provide either this or prompt_deployment_id.
-            - release_tag: typing.Optional[str]. Optionally specify a release tag if you want to pin to a specific release of the Prompt Deployment
+        release_tag : typing.Optional[str]
+            Optionally specify a release tag if you want to pin to a specific release of the Prompt Deployment.
-            - external_id: typing.Optional[str]. Optionally include a unique identifier for tracking purposes. Must be unique within a given Prompt Deployment.
+        external_id : typing.Optional[str]
+            Optionally include a unique identifier for tracking purposes. Must be unique within a given Prompt Deployment.
-            - expand_meta: typing.Optional[PromptDeploymentExpandMetaRequestRequest]. An optionally specified configuration used to opt in to including additional metadata about this prompt execution in the API response. Corresponding values will be returned under the `meta` key of the API response.
+        expand_meta : typing.Optional[PromptDeploymentExpandMetaRequestRequest]
+            An optionally specified configuration used to opt in to including additional metadata about this prompt execution in the API response. Corresponding values will be returned under the `meta` key of the API response.
-            - raw_overrides: typing.Optional[RawPromptExecutionOverridesRequest]. Overrides for the raw API request sent to the model host. Combined with `expand_raw`, it can be used to access new features from models.
+        raw_overrides : typing.Optional[RawPromptExecutionOverridesRequest]
+            Overrides for the raw API request sent to the model host. Combined with `expand_raw`, it can be used to access new features from models.
-            - expand_raw: typing.Optional[typing.Sequence[str]]. A list of keys whose values you'd like to directly return from the JSON response of the model provider. Useful if you need lower-level info returned by model providers that Vellum would otherwise omit. Corresponding key/value pairs will be returned under the `raw` key of the API response.
+        expand_raw : typing.Optional[typing.Sequence[str]]
+            A list of keys whose values you'd like to directly return from the JSON response of the model provider. Useful if you need lower-level info returned by model providers that Vellum would otherwise omit. Corresponding key/value pairs will be returned under the `raw` key of the API response.
-            - metadata: typing.Optional[typing.Dict[str, typing.Any]]. Arbitrary JSON metadata associated with this request. Can be used to capture additional monitoring data such as user id, session id, etc. for future analysis.
+        metadata : typing.Optional[typing.Dict[str, typing.Any]]
+            Arbitrary JSON metadata associated with this request. Can be used to capture additional monitoring data such as user id, session id, etc. for future analysis.
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
+        Yields
+        ------
+        typing.AsyncIterator[ExecutePromptEvent]
+        Examples
+        --------
+        import asyncio
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
         from vellum import (
             PromptDeploymentExpandMetaRequestRequest,
             PromptDeploymentInputRequest_String,
@@ -1264,93 +1236,79 @@ class AsyncVellum:
         client = AsyncVellum(
             api_key="YOUR_API_KEY",
         )
-        await client.execute_prompt_stream(
-            inputs=[
-                PromptDeploymentInputRequest_String(
-                    name="string",
-                    value="string",
-                )
-            ],
-            prompt_deployment_id="string",
-            prompt_deployment_name="string",
-            release_tag="string",
-            external_id="string",
-            expand_meta=PromptDeploymentExpandMetaRequestRequest(
-                model_name=True,
-                usage=True,
-                finish_reason=True,
-                latency=True,
-                deployment_release_tag=True,
-                prompt_version_id=True,
-            ),
-            raw_overrides=RawPromptExecutionOverridesRequest(
-                body={"string": {"key": "value"}},
-                headers={"string": {"key": "value"}},
-                url="string",
-            ),
-            expand_raw=["string"],
-            metadata={"string": {"key": "value"}},
-        )
+        async def main() -> None:
+            response = client.execute_prompt_stream(
+                inputs=[
+                    PromptDeploymentInputRequest_String(
+                        name="string",
+                        value="string",
+                    )
+                ],
+                prompt_deployment_id="string",
+                prompt_deployment_name="string",
+                release_tag="string",
+                external_id="string",
+                expand_meta=PromptDeploymentExpandMetaRequestRequest(
+                    model_name=True,
+                    usage=True,
+                    finish_reason=True,
+                    latency=True,
+                    deployment_release_tag=True,
+                    prompt_version_id=True,
+                ),
+                raw_overrides=RawPromptExecutionOverridesRequest(
+                    body={"string": {"key": "value"}},
+                    headers={"string": {"key": "value"}},
+                    url="string",
+                ),
+                expand_raw=["string"],
+                metadata={"string": {"key": "value"}},
+            )
+            async for chunk in response:
+                print(chunk)
+        asyncio.run(main())
         """
-        _request: typing.Dict[str, typing.Any] = {"inputs": inputs}
-        if prompt_deployment_id is not OMIT:
-            _request["prompt_deployment_id"] = prompt_deployment_id
-        if prompt_deployment_name is not OMIT:
-            _request["prompt_deployment_name"] = prompt_deployment_name
-        if release_tag is not OMIT:
-            _request["release_tag"] = release_tag
-        if external_id is not OMIT:
-            _request["external_id"] = external_id
-        if expand_meta is not OMIT:
-            _request["expand_meta"] = expand_meta
-        if raw_overrides is not OMIT:
-            _request["raw_overrides"] = raw_overrides
-        if expand_raw is not OMIT:
-            _request["expand_raw"] = expand_raw
-        if metadata is not OMIT:
-            _request["metadata"] = metadata
         async with self._client_wrapper.httpx_client.stream(
+            "v1/execute-prompt-stream",
+            base_url=self._client_wrapper.get_environment().predict,
             method="POST",
-            url=urllib.parse.urljoin(f"{self._client_wrapper.get_environment().predict}/", "v1/execute-prompt-stream"),
-            params=jsonable_encoder(
-                request_options.get("additional_query_parameters") if request_options is not None else None
-            ),
-            json=jsonable_encoder(_request)
-            if request_options is None or request_options.get("additional_body_parameters") is None
-            else {
-                **jsonable_encoder(_request),
-                **(jsonable_encoder(remove_none_from_dict(request_options.get("additional_body_parameters", {})))),
+            json={
+                "inputs": inputs,
+                "prompt_deployment_id": prompt_deployment_id,
+                "prompt_deployment_name": prompt_deployment_name,
+                "release_tag": release_tag,
+                "external_id": external_id,
+                "expand_meta": expand_meta,
+                "raw_overrides": raw_overrides,
+                "expand_raw": expand_raw,
+                "metadata": metadata,
             },
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            request_options=request_options,
+            omit=OMIT,
         ) as _response:
-            if 200 <= _response.status_code < 300:
-                async for _text in _response.aiter_lines():
-                    if len(_text) == 0:
-                        continue
-                    yield pydantic_v1.parse_obj_as(ExecutePromptEvent, json.loads(_text))  # type: ignore
-                return
-            await _response.aread()
-            if _response.status_code == 400:
-                raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-            if _response.status_code == 403:
-                raise ForbiddenError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-            if _response.status_code == 404:
-                raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-            if _response.status_code == 500:
-                raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
             try:
+                if 200 <= _response.status_code < 300:
+                    async for _text in _response.aiter_lines():
+                        try:
+                            if len(_text) == 0:
+                                continue
+                            yield pydantic_v1.parse_obj_as(ExecutePromptEvent, json.loads(_text))  # type: ignore
+                        except:
+                            pass
+                    return
+                await _response.aread()
+                if _response.status_code == 400:
+                    raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+                if _response.status_code == 403:
+                    raise ForbiddenError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+                if _response.status_code == 404:
+                    raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+                if _response.status_code == 500:
+                    raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
                 _response_json = _response.json()
             except JSONDecodeError:
                 raise ApiError(status_code=_response.status_code, body=_response.text)
@@ -1365,94 +1323,95 @@ class AsyncVellum:
         workflow_deployment_name: typing.Optional[str] = OMIT,
         release_tag: typing.Optional[str] = OMIT,
         external_id: typing.Optional[str] = OMIT,
-        request_options: typing.Optional[RequestOptions] = None,
+        request_options: typing.Optional[RequestOptions] = None
     ) -> ExecuteWorkflowResponse:
         """
         Executes a deployed Workflow and returns its outputs.
-        Parameters:
-            - inputs: typing.Sequence[WorkflowRequestInputRequest]. The list of inputs defined in the Workflow's Deployment with their corresponding values.
+        Parameters
+        ----------
+        inputs : typing.Sequence[WorkflowRequestInputRequest]
+            The list of inputs defined in the Workflow's Deployment with their corresponding values.
+        expand_meta : typing.Optional[WorkflowExpandMetaRequest]
+            An optionally specified configuration used to opt in to including additional metadata about this workflow execution in the API response. Corresponding values will be returned under the `execution_meta` key within NODE events in the response stream.
+        workflow_deployment_id : typing.Optional[str]
+            The ID of the Workflow Deployment. Must provide either this or workflow_deployment_name.
-            - expand_meta: typing.Optional[WorkflowExpandMetaRequest]. An optionally specified configuration used to opt in to including additional metadata about this workflow execution in the API response. Corresponding values will be returned under the `execution_meta` key within NODE events in the response stream.
+        workflow_deployment_name : typing.Optional[str]
+            The name of the Workflow Deployment. Must provide either this or workflow_deployment_id.
-            - workflow_deployment_id: typing.Optional[str]. The ID of the Workflow Deployment. Must provide either this or workflow_deployment_name.
+        release_tag : typing.Optional[str]
+            Optionally specify a release tag if you want to pin to a specific release of the Workflow Deployment
-            - workflow_deployment_name: typing.Optional[str]. The name of the Workflow Deployment. Must provide either this or workflow_deployment_id.
+        external_id : typing.Optional[str]
+            Optionally include a unique identifier for tracking purposes. Must be unique for a given workflow deployment.
-            - release_tag: typing.Optional[str]. Optionally specify a release tag if you want to pin to a specific release of the Workflow Deployment
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
-            - external_id: typing.Optional[str]. Optionally include a unique identifier for tracking purposes. Must be unique for a given workflow deployment.
+        Returns
+        -------
+        ExecuteWorkflowResponse
+        Examples
+        --------
+        import asyncio
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
         from vellum import WorkflowExpandMetaRequest, WorkflowRequestInputRequest_String
         from vellum.client import AsyncVellum
         client = AsyncVellum(
             api_key="YOUR_API_KEY",
         )
-        await client.execute_workflow(
-            inputs=[
-                WorkflowRequestInputRequest_String(
-                    name="string",
-                    value="string",
-                )
-            ],
-            expand_meta=WorkflowExpandMetaRequest(
-                usage=True,
-            ),
-            workflow_deployment_id="string",
-            workflow_deployment_name="string",
-            release_tag="string",
-            external_id="string",
-        )
+        async def main() -> None:
+            await client.execute_workflow(
+                inputs=[
+                    WorkflowRequestInputRequest_String(
+                        name="string",
+                        value="string",
+                    )
+                ],
+                expand_meta=WorkflowExpandMetaRequest(
+                    usage=True,
+                ),
+                workflow_deployment_id="string",
+                workflow_deployment_name="string",
+                release_tag="string",
+                external_id="string",
+            )
+        asyncio.run(main())
         """
-        _request: typing.Dict[str, typing.Any] = {"inputs": inputs}
-        if expand_meta is not OMIT:
-            _request["expand_meta"] = expand_meta
-        if workflow_deployment_id is not OMIT:
-            _request["workflow_deployment_id"] = workflow_deployment_id
-        if workflow_deployment_name is not OMIT:
-            _request["workflow_deployment_name"] = workflow_deployment_name
-        if release_tag is not OMIT:
-            _request["release_tag"] = release_tag
-        if external_id is not OMIT:
-            _request["external_id"] = external_id
         _response = await self._client_wrapper.httpx_client.request(
+            "v1/execute-workflow",
+            base_url=self._client_wrapper.get_environment().predict,
             method="POST",
-            url=urllib.parse.urljoin(f"{self._client_wrapper.get_environment().predict}/", "v1/execute-workflow"),
-            params=jsonable_encoder(
-                request_options.get("additional_query_parameters") if request_options is not None else None
-            ),
-            json=jsonable_encoder(_request)
-            if request_options is None or request_options.get("additional_body_parameters") is None
-            else {
-                **jsonable_encoder(_request),
-                **(jsonable_encoder(remove_none_from_dict(request_options.get("additional_body_parameters", {})))),
+            json={
+                "inputs": inputs,
+                "expand_meta": expand_meta,
+                "workflow_deployment_id": workflow_deployment_id,
+                "workflow_deployment_name": workflow_deployment_name,
+                "release_tag": release_tag,
+                "external_id": external_id,
             },
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            request_options=request_options,
+            omit=OMIT,
         )
-        if 200 <= _response.status_code < 300:
-            return pydantic_v1.parse_obj_as(ExecuteWorkflowResponse, _response.json())  # type: ignore
-        if _response.status_code == 400:
-            raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 404:
-            raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 500:
-            raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
         try:
+            if 200 <= _response.status_code < 300:
+                return pydantic_v1.parse_obj_as(ExecuteWorkflowResponse, _response.json())  # type: ignore
+            if _response.status_code == 400:
+                raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 404:
+                raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 500:
+                raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
             _response_json = _response.json()
         except JSONDecodeError:
             raise ApiError(status_code=_response.status_code, body=_response.text)
@@ -1468,106 +1427,110 @@ class AsyncVellum:
         release_tag: typing.Optional[str] = OMIT,
         external_id: typing.Optional[str] = OMIT,
         event_types: typing.Optional[typing.Sequence[WorkflowExecutionEventType]] = OMIT,
-        request_options: typing.Optional[RequestOptions] = None,
+        request_options: typing.Optional[RequestOptions] = None
     ) -> typing.AsyncIterator[WorkflowStreamEvent]:
         """
         Executes a deployed Workflow and streams back its results.
-        Parameters:
-            - inputs: typing.Sequence[WorkflowRequestInputRequest]. The list of inputs defined in the Workflow's Deployment with their corresponding values.
+        Parameters
+        ----------
+        inputs : typing.Sequence[WorkflowRequestInputRequest]
+            The list of inputs defined in the Workflow's Deployment with their corresponding values.
+        expand_meta : typing.Optional[WorkflowExpandMetaRequest]
+            An optionally specified configuration used to opt in to including additional metadata about this workflow execution in the API response. Corresponding values will be returned under the `execution_meta` key within NODE events in the response stream.
+        workflow_deployment_id : typing.Optional[str]
+            The ID of the Workflow Deployment. Must provide either this or workflow_deployment_name.
-            - expand_meta: typing.Optional[WorkflowExpandMetaRequest]. An optionally specified configuration used to opt in to including additional metadata about this workflow execution in the API response. Corresponding values will be returned under the `execution_meta` key within NODE events in the response stream.
+        workflow_deployment_name : typing.Optional[str]
+            The name of the Workflow Deployment. Must provide either this or workflow_deployment_id.
-            - workflow_deployment_id: typing.Optional[str]. The ID of the Workflow Deployment. Must provide either this or workflow_deployment_name.
+        release_tag : typing.Optional[str]
+            Optionally specify a release tag if you want to pin to a specific release of the Workflow Deployment
-            - workflow_deployment_name: typing.Optional[str]. The name of the Workflow Deployment. Must provide either this or workflow_deployment_id.
+        external_id : typing.Optional[str]
+            Optionally include a unique identifier for tracking purposes. Must be unique for a given workflow deployment.
-            - release_tag: typing.Optional[str]. Optionally specify a release tag if you want to pin to a specific release of the Workflow Deployment
+        event_types : typing.Optional[typing.Sequence[WorkflowExecutionEventType]]
+            Optionally specify which events you want to receive. Defaults to only WORKFLOW events. Note that the schema of non-WORKFLOW events is unstable and should be used with caution.
-            - external_id: typing.Optional[str]. Optionally include a unique identifier for tracking purposes. Must be unique for a given workflow deployment.
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
-            - event_types: typing.Optional[typing.Sequence[WorkflowExecutionEventType]]. Optionally specify which events you want to receive. Defaults to only WORKFLOW events. Note that the schema of non-WORKFLOW events is unstable and should be used with caution.
+        Yields
+        ------
+        typing.AsyncIterator[WorkflowStreamEvent]
+        Examples
+        --------
+        import asyncio
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
         from vellum import WorkflowExpandMetaRequest, WorkflowRequestInputRequest_String
         from vellum.client import AsyncVellum
         client = AsyncVellum(
             api_key="YOUR_API_KEY",
         )
-        await client.execute_workflow_stream(
-            inputs=[
-                WorkflowRequestInputRequest_String(
-                    name="string",
-                    value="string",
-                )
-            ],
-            expand_meta=WorkflowExpandMetaRequest(
-                usage=True,
-            ),
-            workflow_deployment_id="string",
-            workflow_deployment_name="string",
-            release_tag="string",
-            external_id="string",
-            event_types=["NODE"],
-        )
+        async def main() -> None:
+            response = client.execute_workflow_stream(
+                inputs=[
+                    WorkflowRequestInputRequest_String(
+                        name="string",
+                        value="string",
+                    )
+                ],
+                expand_meta=WorkflowExpandMetaRequest(
+                    usage=True,
+                ),
+                workflow_deployment_id="string",
+                workflow_deployment_name="string",
+                release_tag="string",
+                external_id="string",
+                event_types=["NODE"],
+            )
+            async for chunk in response:
+                print(chunk)
+        asyncio.run(main())
         """
-        _request: typing.Dict[str, typing.Any] = {"inputs": inputs}
-        if expand_meta is not OMIT:
-            _request["expand_meta"] = expand_meta
-        if workflow_deployment_id is not OMIT:
-            _request["workflow_deployment_id"] = workflow_deployment_id
-        if workflow_deployment_name is not OMIT:
-            _request["workflow_deployment_name"] = workflow_deployment_name
-        if release_tag is not OMIT:
-            _request["release_tag"] = release_tag
-        if external_id is not OMIT:
-            _request["external_id"] = external_id
-        if event_types is not OMIT:
-            _request["event_types"] = event_types
         async with self._client_wrapper.httpx_client.stream(
+            "v1/execute-workflow-stream",
+            base_url=self._client_wrapper.get_environment().predict,
             method="POST",
-            url=urllib.parse.urljoin(
-                f"{self._client_wrapper.get_environment().predict}/", "v1/execute-workflow-stream"
-            ),
-            params=jsonable_encoder(
-                request_options.get("additional_query_parameters") if request_options is not None else None
-            ),
-            json=jsonable_encoder(_request)
-            if request_options is None or request_options.get("additional_body_parameters") is None
-            else {
-                **jsonable_encoder(_request),
-                **(jsonable_encoder(remove_none_from_dict(request_options.get("additional_body_parameters", {})))),
+            json={
+                "inputs": inputs,
+                "expand_meta": expand_meta,
+                "workflow_deployment_id": workflow_deployment_id,
+                "workflow_deployment_name": workflow_deployment_name,
+                "release_tag": release_tag,
+                "external_id": external_id,
+                "event_types": event_types,
             },
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            request_options=request_options,
+            omit=OMIT,
         ) as _response:
-            if 200 <= _response.status_code < 300:
-                async for _text in _response.aiter_lines():
-                    if len(_text) == 0:
-                        continue
-                    yield pydantic_v1.parse_obj_as(WorkflowStreamEvent, json.loads(_text))  # type: ignore
-                return
-            await _response.aread()
-            if _response.status_code == 400:
-                raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-            if _response.status_code == 404:
-                raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-            if _response.status_code == 500:
-                raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
             try:
+                if 200 <= _response.status_code < 300:
+                    async for _text in _response.aiter_lines():
+                        try:
+                            if len(_text) == 0:
+                                continue
+                            yield pydantic_v1.parse_obj_as(WorkflowStreamEvent, json.loads(_text))  # type: ignore
+                        except:
+                            pass
+                    return
+                await _response.aread()
+                if _response.status_code == 400:
+                    raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+                if _response.status_code == 404:
+                    raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+                if _response.status_code == 500:
+                    raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
                 _response_json = _response.json()
             except JSONDecodeError:
                 raise ApiError(status_code=_response.status_code, body=_response.text)
@@ -1576,11 +1539,11 @@ class AsyncVellum:
     async def generate(
         self,
         *,
+        requests: typing.Sequence[GenerateRequest],
         deployment_id: typing.Optional[str] = OMIT,
         deployment_name: typing.Optional[str] = OMIT,
-        requests: typing.Sequence[GenerateRequest],
         options: typing.Optional[GenerateOptionsRequest] = OMIT,
-        request_options: typing.Optional[RequestOptions] = None,
+        request_options: typing.Optional[RequestOptions] = None
     ) -> GenerateResponse:
         """
         Generate a completion using a previously defined deployment.
@@ -1588,75 +1551,76 @@ class AsyncVellum:
         Important: This endpoint is DEPRECATED and has been superseded by
         [execute-prompt](/api-reference/api-reference/execute-prompt).
-        Parameters:
-            - deployment_id: typing.Optional[str]. The ID of the deployment. Must provide either this or deployment_name.
+        Parameters
+        ----------
+        requests : typing.Sequence[GenerateRequest]
+            The generation request to make. Bulk requests are no longer supported, this field must be an array of length 1.
+        deployment_id : typing.Optional[str]
+            The ID of the deployment. Must provide either this or deployment_name.
+        deployment_name : typing.Optional[str]
+            The name of the deployment. Must provide either this or deployment_id.
+        options : typing.Optional[GenerateOptionsRequest]
+            Additional configuration that can be used to control what's included in the response.
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
-            - deployment_name: typing.Optional[str]. The name of the deployment. Must provide either this or deployment_id.
+        Returns
+        -------
+        GenerateResponse
-            - requests: typing.Sequence[GenerateRequest]. The generation request to make. Bulk requests are no longer supported, this field must be an array of length 1.
-            - options: typing.Optional[GenerateOptionsRequest]. Additional configuration that can be used to control what's included in the response.
+        Examples
+        --------
+        import asyncio
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
         from vellum import GenerateRequest
         from vellum.client import AsyncVellum
         client = AsyncVellum(
             api_key="YOUR_API_KEY",
         )
-        await client.generate(
-            requests=[
-                GenerateRequest(
-                    input_values={},
-                )
-            ],
-        )
+        async def main() -> None:
+            await client.generate(
+                requests=[
+                    GenerateRequest(
+                        input_values={"key": "value"},
+                    )
+                ],
+            )
+        asyncio.run(main())
         """
-        _request: typing.Dict[str, typing.Any] = {"requests": requests}
-        if deployment_id is not OMIT:
-            _request["deployment_id"] = deployment_id
-        if deployment_name is not OMIT:
-            _request["deployment_name"] = deployment_name
-        if options is not OMIT:
-            _request["options"] = options
         _response = await self._client_wrapper.httpx_client.request(
+            "v1/generate",
+            base_url=self._client_wrapper.get_environment().predict,
             method="POST",
-            url=urllib.parse.urljoin(f"{self._client_wrapper.get_environment().predict}/", "v1/generate"),
-            params=jsonable_encoder(
-                request_options.get("additional_query_parameters") if request_options is not None else None
-            ),
-            json=jsonable_encoder(_request)
-            if request_options is None or request_options.get("additional_body_parameters") is None
-            else {
-                **jsonable_encoder(_request),
-                **(jsonable_encoder(remove_none_from_dict(request_options.get("additional_body_parameters", {})))),
+            json={
+                "deployment_id": deployment_id,
+                "deployment_name": deployment_name,
+                "requests": requests,
+                "options": options,
             },
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            request_options=request_options,
+            omit=OMIT,
         )
-        if 200 <= _response.status_code < 300:
-            return pydantic_v1.parse_obj_as(GenerateResponse, _response.json())  # type: ignore
-        if _response.status_code == 400:
-            raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 403:
-            raise ForbiddenError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 404:
-            raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 500:
-            raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
         try:
+            if 200 <= _response.status_code < 300:
+                return pydantic_v1.parse_obj_as(GenerateResponse, _response.json())  # type: ignore
+            if _response.status_code == 400:
+                raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 403:
+                raise ForbiddenError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 404:
+                raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 500:
+                raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
             _response_json = _response.json()
         except JSONDecodeError:
             raise ApiError(status_code=_response.status_code, body=_response.text)
@@ -1665,11 +1629,11 @@ class AsyncVellum:
     async def generate_stream(
         self,
         *,
+        requests: typing.Sequence[GenerateRequest],
         deployment_id: typing.Optional[str] = OMIT,
         deployment_name: typing.Optional[str] = OMIT,
-        requests: typing.Sequence[GenerateRequest],
         options: typing.Optional[GenerateOptionsRequest] = OMIT,
-        request_options: typing.Optional[RequestOptions] = None,
+        request_options: typing.Optional[RequestOptions] = None
     ) -> typing.AsyncIterator[GenerateStreamResponse]:
         """
         Generate a stream of completions using a previously defined deployment.
@@ -1677,17 +1641,32 @@ class AsyncVellum:
         Important: This endpoint is DEPRECATED and has been superseded by
         [execute-prompt-stream](/api-reference/api-reference/execute-prompt-stream).
-        Parameters:
-            - deployment_id: typing.Optional[str]. The ID of the deployment. Must provide either this or deployment_name.
+        Parameters
+        ----------
+        requests : typing.Sequence[GenerateRequest]
+            The generation request to make. Bulk requests are no longer supported, this field must be an array of length 1.
+        deployment_id : typing.Optional[str]
+            The ID of the deployment. Must provide either this or deployment_name.
+        deployment_name : typing.Optional[str]
+            The name of the deployment. Must provide either this or deployment_id.
+        options : typing.Optional[GenerateOptionsRequest]
+            Additional configuration that can be used to control what's included in the response.
-            - deployment_name: typing.Optional[str]. The name of the deployment. Must provide either this or deployment_id.
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
-            - requests: typing.Sequence[GenerateRequest]. The generation request to make. Bulk requests are no longer supported, this field must be an array of length 1.
+        Yields
+        ------
+        typing.AsyncIterator[GenerateStreamResponse]
-            - options: typing.Optional[GenerateOptionsRequest]. Additional configuration that can be used to control what's included in the response.
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
+        Examples
+        --------
+        import asyncio
         from vellum import (
             ChatMessageContentRequest_String,
             ChatMessageRequest,
@@ -1699,77 +1678,68 @@ class AsyncVellum:
         client = AsyncVellum(
             api_key="YOUR_API_KEY",
         )
-        await client.generate_stream(
-            deployment_id="string",
-            deployment_name="string",
-            requests=[
-                GenerateRequest(
-                    input_values={"string": {"key": "value"}},
-                    chat_history=[
-                        ChatMessageRequest(
-                            text="string",
-                            role="SYSTEM",
-                            content=ChatMessageContentRequest_String(),
-                            source="string",
-                        )
-                    ],
-                    external_ids=["string"],
-                )
-            ],
-            options=GenerateOptionsRequest(
-                logprobs="ALL",
-            ),
-        )
+        async def main() -> None:
+            response = client.generate_stream(
+                deployment_id="string",
+                deployment_name="string",
+                requests=[
+                    GenerateRequest(
+                        input_values={"string": {"key": "value"}},
+                        chat_history=[
+                            ChatMessageRequest(
+                                text="string",
+                                role="SYSTEM",
+                                content=ChatMessageContentRequest_String(),
+                                source="string",
+                            )
+                        ],
+                        external_ids=["string"],
+                    )
+                ],
+                options=GenerateOptionsRequest(
+                    logprobs="ALL",
+                ),
+            )
+            async for chunk in response:
+                print(chunk)
+        asyncio.run(main())
         """
-        _request: typing.Dict[str, typing.Any] = {"requests": requests}
-        if deployment_id is not OMIT:
-            _request["deployment_id"] = deployment_id
-        if deployment_name is not OMIT:
-            _request["deployment_name"] = deployment_name
-        if options is not OMIT:
-            _request["options"] = options
         async with self._client_wrapper.httpx_client.stream(
+            "v1/generate-stream",
+            base_url=self._client_wrapper.get_environment().predict,
             method="POST",
-            url=urllib.parse.urljoin(f"{self._client_wrapper.get_environment().predict}/", "v1/generate-stream"),
-            params=jsonable_encoder(
-                request_options.get("additional_query_parameters") if request_options is not None else None
-            ),
-            json=jsonable_encoder(_request)
-            if request_options is None or request_options.get("additional_body_parameters") is None
-            else {
-                **jsonable_encoder(_request),
-                **(jsonable_encoder(remove_none_from_dict(request_options.get("additional_body_parameters", {})))),
+            json={
+                "deployment_id": deployment_id,
+                "deployment_name": deployment_name,
+                "requests": requests,
+                "options": options,
             },
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            request_options=request_options,
+            omit=OMIT,
         ) as _response:
-            if 200 <= _response.status_code < 300:
-                async for _text in _response.aiter_lines():
-                    if len(_text) == 0:
-                        continue
-                    yield pydantic_v1.parse_obj_as(GenerateStreamResponse, json.loads(_text))  # type: ignore
-                return
-            await _response.aread()
-            if _response.status_code == 400:
-                raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-            if _response.status_code == 403:
-                raise ForbiddenError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-            if _response.status_code == 404:
-                raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-            if _response.status_code == 500:
-                raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
             try:
+                if 200 <= _response.status_code < 300:
+                    async for _text in _response.aiter_lines():
+                        try:
+                            if len(_text) == 0:
+                                continue
+                            yield pydantic_v1.parse_obj_as(GenerateStreamResponse, json.loads(_text))  # type: ignore
+                        except:
+                            pass
+                    return
+                await _response.aread()
+                if _response.status_code == 400:
+                    raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+                if _response.status_code == 403:
+                    raise ForbiddenError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+                if _response.status_code == 404:
+                    raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+                if _response.status_code == 500:
+                    raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
                 _response_json = _response.json()
             except JSONDecodeError:
                 raise ApiError(status_code=_response.status_code, body=_response.text)
@@ -1778,77 +1748,73 @@ class AsyncVellum:
     async def search(
         self,
         *,
+        query: str,
         index_id: typing.Optional[str] = OMIT,
         index_name: typing.Optional[str] = OMIT,
-        query: str,
         options: typing.Optional[SearchRequestOptionsRequest] = OMIT,
-        request_options: typing.Optional[RequestOptions] = None,
+        request_options: typing.Optional[RequestOptions] = None
     ) -> SearchResponse:
         """
         Perform a search against a document index.
-        Parameters:
-            - index_id: typing.Optional[str]. The ID of the index to search against. Must provide either this or index_name.
+        Parameters
+        ----------
+        query : str
+            The query to search for.
+        index_id : typing.Optional[str]
+            The ID of the index to search against. Must provide either this or index_name.
+        index_name : typing.Optional[str]
+            The name of the index to search against. Must provide either this or index_id.
-            - index_name: typing.Optional[str]. The name of the index to search against. Must provide either this or index_id.
+        options : typing.Optional[SearchRequestOptionsRequest]
+            Configuration options for the search.
-            - query: str. The query to search for.
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
-            - options: typing.Optional[SearchRequestOptionsRequest]. Configuration options for the search.
+        Returns
+        -------
+        SearchResponse
+        Examples
+        --------
+        import asyncio
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
         from vellum.client import AsyncVellum
         client = AsyncVellum(
             api_key="YOUR_API_KEY",
         )
-        await client.search(
-            query="query",
-        )
+        async def main() -> None:
+            await client.search(
+                query="query",
+            )
+        asyncio.run(main())
         """
-        _request: typing.Dict[str, typing.Any] = {"query": query}
-        if index_id is not OMIT:
-            _request["index_id"] = index_id
-        if index_name is not OMIT:
-            _request["index_name"] = index_name
-        if options is not OMIT:
-            _request["options"] = options
         _response = await self._client_wrapper.httpx_client.request(
+            "v1/search",
+            base_url=self._client_wrapper.get_environment().predict,
             method="POST",
-            url=urllib.parse.urljoin(f"{self._client_wrapper.get_environment().predict}/", "v1/search"),
-            params=jsonable_encoder(
-                request_options.get("additional_query_parameters") if request_options is not None else None
-            ),
-            json=jsonable_encoder(_request)
-            if request_options is None or request_options.get("additional_body_parameters") is None
-            else {
-                **jsonable_encoder(_request),
-                **(jsonable_encoder(remove_none_from_dict(request_options.get("additional_body_parameters", {})))),
-            },
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            json={"index_id": index_id, "index_name": index_name, "query": query, "options": options},
+            request_options=request_options,
+            omit=OMIT,
         )
-        if 200 <= _response.status_code < 300:
-            return pydantic_v1.parse_obj_as(SearchResponse, _response.json())  # type: ignore
-        if _response.status_code == 400:
-            raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 404:
-            raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 500:
-            raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
         try:
+            if 200 <= _response.status_code < 300:
+                return pydantic_v1.parse_obj_as(SearchResponse, _response.json())  # type: ignore
+            if _response.status_code == 400:
+                raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 404:
+                raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 500:
+                raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
             _response_json = _response.json()
         except JSONDecodeError:
             raise ApiError(status_code=_response.status_code, body=_response.text)
@@ -1857,75 +1823,69 @@ class AsyncVellum:
     async def submit_completion_actuals(
         self,
         *,
+        actuals: typing.Sequence[SubmitCompletionActualRequest],
         deployment_id: typing.Optional[str] = OMIT,
         deployment_name: typing.Optional[str] = OMIT,
-        actuals: typing.Sequence[SubmitCompletionActualRequest],
-        request_options: typing.Optional[RequestOptions] = None,
+        request_options: typing.Optional[RequestOptions] = None
     ) -> None:
         """
         Used to submit feedback regarding the quality of previously generated completions.
-        Parameters:
-            - deployment_id: typing.Optional[str]. The ID of the deployment. Must provide either this or deployment_name.
+        Parameters
+        ----------
+        actuals : typing.Sequence[SubmitCompletionActualRequest]
+            Feedback regarding the quality of previously generated completions
+        deployment_id : typing.Optional[str]
+            The ID of the deployment. Must provide either this or deployment_name.
+        deployment_name : typing.Optional[str]
+            The name of the deployment. Must provide either this or deployment_id.
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
-            - deployment_name: typing.Optional[str]. The name of the deployment. Must provide either this or deployment_id.
+        Returns
+        -------
+        None
-            - actuals: typing.Sequence[SubmitCompletionActualRequest]. Feedback regarding the quality of previously generated completions
+        Examples
+        --------
+        import asyncio
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
         from vellum import SubmitCompletionActualRequest
         from vellum.client import AsyncVellum
         client = AsyncVellum(
             api_key="YOUR_API_KEY",
         )
-        await client.submit_completion_actuals(
-            actuals=[SubmitCompletionActualRequest()],
-        )
+        async def main() -> None:
+            await client.submit_completion_actuals(
+                actuals=[SubmitCompletionActualRequest()],
+            )
+        asyncio.run(main())
         """
-        _request: typing.Dict[str, typing.Any] = {"actuals": actuals}
-        if deployment_id is not OMIT:
-            _request["deployment_id"] = deployment_id
-        if deployment_name is not OMIT:
-            _request["deployment_name"] = deployment_name
         _response = await self._client_wrapper.httpx_client.request(
+            "v1/submit-completion-actuals",
+            base_url=self._client_wrapper.get_environment().predict,
             method="POST",
-            url=urllib.parse.urljoin(
-                f"{self._client_wrapper.get_environment().predict}/", "v1/submit-completion-actuals"
-            ),
-            params=jsonable_encoder(
-                request_options.get("additional_query_parameters") if request_options is not None else None
-            ),
-            json=jsonable_encoder(_request)
-            if request_options is None or request_options.get("additional_body_parameters") is None
-            else {
-                **jsonable_encoder(_request),
-                **(jsonable_encoder(remove_none_from_dict(request_options.get("additional_body_parameters", {})))),
-            },
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            json={"deployment_id": deployment_id, "deployment_name": deployment_name, "actuals": actuals},
+            request_options=request_options,
+            omit=OMIT,
         )
-        if 200 <= _response.status_code < 300:
-            return
-        if _response.status_code == 400:
-            raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 404:
-            raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
-        if _response.status_code == 500:
-            raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
         try:
+            if 200 <= _response.status_code < 300:
+                return
+            if _response.status_code == 400:
+                raise BadRequestError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 404:
+                raise NotFoundError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
+            if _response.status_code == 500:
+                raise InternalServerError(pydantic_v1.parse_obj_as(typing.Any, _response.json()))  # type: ignore
             _response_json = _response.json()
         except JSONDecodeError:
             raise ApiError(status_code=_response.status_code, body=_response.text)
@@ -1937,67 +1897,61 @@ class AsyncVellum:
         actuals: typing.Sequence[SubmitWorkflowExecutionActualRequest],
         execution_id: typing.Optional[str] = OMIT,
         external_id: typing.Optional[str] = OMIT,
-        request_options: typing.Optional[RequestOptions] = None,
+        request_options: typing.Optional[RequestOptions] = None
     ) -> None:
         """
             Used to submit feedback regarding the quality of previous workflow execution and its outputs.
             **Note:** Uses a base url of `https://predict.vellum.ai`.
-        Parameters:
-            - actuals: typing.Sequence[SubmitWorkflowExecutionActualRequest]. Feedback regarding the quality of an output on a previously executed workflow.
+        Parameters
+        ----------
+        actuals : typing.Sequence[SubmitWorkflowExecutionActualRequest]
+            Feedback regarding the quality of an output on a previously executed workflow.
+        execution_id : typing.Optional[str]
+            The Vellum-generated ID of a previously executed workflow. Must provide either this or external_id.
+        external_id : typing.Optional[str]
+            The external ID that was originally provided by when executing the workflow, if applicable, that you'd now like to submit actuals for. Must provide either this or execution_id.
+        request_options : typing.Optional[RequestOptions]
+            Request-specific configuration.
-            - execution_id: typing.Optional[str]. The Vellum-generated ID of a previously executed workflow. Must provide either this or external_id.
+        Returns
+        -------
+        None
-            - external_id: typing.Optional[str]. The external ID that was originally provided by when executing the workflow, if applicable, that you'd now like to submit actuals for. Must provide either this or execution_id.
+        Examples
+        --------
+        import asyncio
-            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
-        ---
         from vellum.client import AsyncVellum
         client = AsyncVellum(
             api_key="YOUR_API_KEY",
         )
-        await client.submit_workflow_execution_actuals(
-            actuals=[],
-        )
+        async def main() -> None:
+            await client.submit_workflow_execution_actuals(
+                actuals=[],
+            )
+        asyncio.run(main())
         """
-        _request: typing.Dict[str, typing.Any] = {"actuals": actuals}
-        if execution_id is not OMIT:
-            _request["execution_id"] = execution_id
-        if external_id is not OMIT:
-            _request["external_id"] = external_id
         _response = await self._client_wrapper.httpx_client.request(
+            "v1/submit-workflow-execution-actuals",
+            base_url=self._client_wrapper.get_environment().predict,
             method="POST",
-            url=urllib.parse.urljoin(
-                f"{self._client_wrapper.get_environment().predict}/", "v1/submit-workflow-execution-actuals"
-            ),
-            params=jsonable_encoder(
-                request_options.get("additional_query_parameters") if request_options is not None else None
-            ),
-            json=jsonable_encoder(_request)
-            if request_options is None or request_options.get("additional_body_parameters") is None
-            else {
-                **jsonable_encoder(_request),
-                **(jsonable_encoder(remove_none_from_dict(request_options.get("additional_body_parameters", {})))),
-            },
-            headers=jsonable_encoder(
-                remove_none_from_dict(
-                    {
-                        **self._client_wrapper.get_headers(),
-                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
-                    }
-                )
-            ),
-            timeout=request_options.get("timeout_in_seconds")
-            if request_options is not None and request_options.get("timeout_in_seconds") is not None
-            else self._client_wrapper.get_timeout(),
-            retries=0,
-            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
+            json={"actuals": actuals, "execution_id": execution_id, "external_id": external_id},
+            request_options=request_options,
+            omit=OMIT,
         )
-        if 200 <= _response.status_code < 300:
-            return
         try:
+            if 200 <= _response.status_code < 300:
+                return
             _response_json = _response.json()
         except JSONDecodeError:
             raise ApiError(status_code=_response.status_code, body=_response.text)

vellum-ai 0.7.3__py3-none-any.whl → 0.7.5__py3-none-any.whl

vellum-ai 0.7.3__py3-none-any.whl → 0.7.5__py3-none-any.whl